|  | /* | 
|  | * Copyright (c) 2021, Alliance for Open Media. All rights reserved. | 
|  | * | 
|  | * This source code is subject to the terms of the BSD 2 Clause License and | 
|  | * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License | 
|  | * was not distributed with this source code in the LICENSE file, you can | 
|  | * obtain it at www.aomedia.org/license/software. If the Alliance for Open | 
|  | * Media Patent License 1.0 was not distributed with this source code in the | 
|  | * PATENTS file, you can obtain it at www.aomedia.org/license/patent. | 
|  | */ | 
|  |  | 
|  | #include <memory> | 
|  | #include <new> | 
|  | #include <tuple> | 
|  |  | 
|  | #include "aom/aom_integer.h" | 
|  | #include "aom_ports/aom_timer.h" | 
|  | #include "av1/encoder/ml.h" | 
|  | #include "config/aom_config.h" | 
|  | #include "config/aom_dsp_rtcd.h" | 
|  | #include "config/av1_rtcd.h" | 
|  | #include "gtest/gtest.h" | 
|  | #include "test/acm_random.h" | 
|  | #include "test/register_state_check.h" | 
|  | #include "test/util.h" | 
|  |  | 
|  | namespace { | 
|  | using FastSoftmaxFn = void (*)(const float *const input, float *output); | 
|  | using FastSoftmaxTestParams = std::tuple<const FastSoftmaxFn, int>; | 
|  |  | 
|  | // Error thresholds for functional equivalence | 
|  | constexpr float kRelEpsilon = 5e-2f; | 
|  | constexpr float kAbsEpsilon = 5e-3f; | 
|  |  | 
|  | class FastSoftmaxTest : public ::testing::TestWithParam<FastSoftmaxTestParams> { | 
|  | public: | 
|  | FastSoftmaxTest() : target_fn_(GET_PARAM(0)), num_classes_(GET_PARAM(1)) {} | 
|  | void SetUp() override { | 
|  | ref_buf_.reset(new (std::nothrow) float[num_classes_]()); | 
|  | ASSERT_NE(ref_buf_, nullptr); | 
|  | dst_buf_.reset(new (std::nothrow) float[num_classes_]()); | 
|  | ASSERT_NE(dst_buf_, nullptr); | 
|  | input_.reset(new (std::nothrow) float[num_classes_]()); | 
|  | ASSERT_NE(input_, nullptr); | 
|  | } | 
|  | void RunSoftmaxTest(); | 
|  | void RunSoftmaxSpeedTest(const int run_times); | 
|  | void FillInputBuf(); | 
|  |  | 
|  | private: | 
|  | const FastSoftmaxFn target_fn_; | 
|  | const int num_classes_; | 
|  | std::unique_ptr<float[]> ref_buf_, dst_buf_, input_; | 
|  | libaom_test::ACMRandom rng_; | 
|  | }; | 
|  |  | 
|  | void FastSoftmaxTest::FillInputBuf() { | 
|  | for (int idx = 0; idx < num_classes_; idx++) { | 
|  | input_[idx] = ((float)rng_.Rand31() - (1 << 30)) / (1u << 30); | 
|  | } | 
|  | } | 
|  |  | 
|  | void FastSoftmaxTest::RunSoftmaxTest() { | 
|  | av1_nn_softmax(input_.get(), ref_buf_.get(), num_classes_); | 
|  | target_fn_(input_.get(), dst_buf_.get()); | 
|  |  | 
|  | for (int idx = 0; idx < num_classes_; idx++) { | 
|  | if (ref_buf_[idx] < kAbsEpsilon) { | 
|  | ASSERT_LE(dst_buf_[idx], kAbsEpsilon) | 
|  | << "Reference output was near-zero, test output was not" << std::endl; | 
|  | } else { | 
|  | const float error = dst_buf_[idx] - ref_buf_[idx]; | 
|  | const float relative_error = fabsf(error / ref_buf_[idx]); | 
|  | ASSERT_LE(relative_error, kRelEpsilon) | 
|  | << "Excessive relative error between reference and test output" | 
|  | << std::endl; | 
|  | ASSERT_LE(error, kAbsEpsilon) | 
|  | << "Excessive absolute error between reference and test output" | 
|  | << std::endl; | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | void FastSoftmaxTest::RunSoftmaxSpeedTest(const int run_times) { | 
|  | aom_usec_timer timer; | 
|  | aom_usec_timer_start(&timer); | 
|  | for (int idx = 0; idx < run_times; idx++) { | 
|  | target_fn_(input_.get(), dst_buf_.get()); | 
|  | } | 
|  | aom_usec_timer_mark(&timer); | 
|  | const int64_t time = aom_usec_timer_elapsed(&timer); | 
|  | std::cout << "Test with " << num_classes_ << " classes took " << time | 
|  | << " us." << std::endl; | 
|  | } | 
|  |  | 
|  | TEST_P(FastSoftmaxTest, RandomValues) { | 
|  | FillInputBuf(); | 
|  | RunSoftmaxTest(); | 
|  | } | 
|  |  | 
|  | TEST_P(FastSoftmaxTest, DISABLED_Speed) { | 
|  | constexpr int kNumTimes = 1000000; | 
|  | RunSoftmaxSpeedTest(kNumTimes); | 
|  | } | 
|  |  | 
|  | void AnchorSoftmax16Fn(const float *input, float *output) { | 
|  | av1_nn_softmax(input, output, 16); | 
|  | } | 
|  |  | 
|  | const FastSoftmaxTestParams kArrayParams_c[] = { | 
|  | FastSoftmaxTestParams(AnchorSoftmax16Fn, 16), | 
|  | FastSoftmaxTestParams(av1_nn_fast_softmax_16_c, 16) | 
|  | }; | 
|  | INSTANTIATE_TEST_SUITE_P(C, FastSoftmaxTest, | 
|  | ::testing::ValuesIn(kArrayParams_c)); | 
|  |  | 
|  | #if HAVE_SSE3 && !CONFIG_EXCLUDE_SIMD_MISMATCH | 
|  | INSTANTIATE_TEST_SUITE_P( | 
|  | SSE3, FastSoftmaxTest, | 
|  | ::testing::Values(FastSoftmaxTestParams(av1_nn_fast_softmax_16_sse3, 16))); | 
|  | #endif | 
|  | }  // namespace |