| /* | 
 |  * Copyright (c) 2016, Alliance for Open Media. All rights reserved. | 
 |  * | 
 |  * This source code is subject to the terms of the BSD 2 Clause License and | 
 |  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License | 
 |  * was not distributed with this source code in the LICENSE file, you can | 
 |  * obtain it at www.aomedia.org/license/software. If the Alliance for Open | 
 |  * Media Patent License 1.0 was not distributed with this source code in the | 
 |  * PATENTS file, you can obtain it at www.aomedia.org/license/patent. | 
 |  */ | 
 |  | 
#include <memory>
#include <new>
#include <tuple>

#include "gtest/gtest.h"

#include "config/av1_rtcd.h"

#include "test/acm_random.h"
#include "test/register_state_check.h"
#include "test/util.h"
#include "av1/common/enums.h"
 |  | 
 | namespace { | 
 |  | 
 | using libaom_test::ACMRandom; | 
 | using std::tuple; | 
 |  | 
 | using Predictor = void (*)(uint8_t *dst, ptrdiff_t stride, TX_SIZE tx_size, | 
 |                            const uint8_t *above, const uint8_t *left, int mode); | 
 |  | 
 | // Note: | 
 | //  Test parameter list: | 
 | //  Reference predictor, optimized predictor, prediction mode, tx size | 
 | // | 
 | using PredFuncMode = tuple<Predictor, Predictor, int>; | 
 | using PredParams = tuple<PredFuncMode, TX_SIZE>; | 
 |  | 
 | const int MaxTxSize = 32; | 
 |  | 
 | const int MaxTestNum = 100; | 
 |  | 
 | class AV1FilterIntraPredTest : public ::testing::TestWithParam<PredParams> { | 
 |  public: | 
 |   ~AV1FilterIntraPredTest() override = default; | 
 |   void SetUp() override { | 
 |     PredFuncMode funcMode = GET_PARAM(0); | 
 |     predFuncRef_ = std::get<0>(funcMode); | 
 |     predFunc_ = std::get<1>(funcMode); | 
 |     mode_ = std::get<2>(funcMode); | 
 |     txSize_ = GET_PARAM(1); | 
 |  | 
 |     alloc_ = new uint8_t[2 * MaxTxSize + 1]; | 
 |     predRef_ = new uint8_t[MaxTxSize * MaxTxSize]; | 
 |     pred_ = new uint8_t[MaxTxSize * MaxTxSize]; | 
 |     ASSERT_NE(alloc_, nullptr); | 
 |     ASSERT_NE(predRef_, nullptr); | 
 |     ASSERT_NE(pred_, nullptr); | 
 |   } | 
 |  | 
 |   void TearDown() override { | 
 |     delete[] alloc_; | 
 |     delete[] predRef_; | 
 |     delete[] pred_; | 
 |   } | 
 |  | 
 |  protected: | 
 |   void RunTest() const { | 
 |     int tstIndex = 0; | 
 |     int stride = tx_size_wide[txSize_]; | 
 |     uint8_t *left = alloc_; | 
 |     uint8_t *above = alloc_ + MaxTxSize; | 
 |     while (tstIndex < MaxTestNum) { | 
 |       PrepareBuffer(); | 
 |       predFuncRef_(predRef_, stride, txSize_, &above[1], left, mode_); | 
 |       API_REGISTER_STATE_CHECK( | 
 |           predFunc_(pred_, stride, txSize_, &above[1], left, mode_)); | 
 |       DiffPred(tstIndex); | 
 |       tstIndex += 1; | 
 |     } | 
 |   } | 
 |   void RunSpeedTest() const { | 
 |     int stride = tx_size_wide[txSize_]; | 
 |     uint8_t *left = alloc_; | 
 |     uint8_t *above = alloc_ + MaxTxSize; | 
 |     const int numIter = 5000; | 
 |  | 
 |     PrepareBuffer(); | 
 |     aom_usec_timer ref_timer; | 
 |     aom_usec_timer_start(&ref_timer); | 
 |     for (int i = 0; i < numIter; i++) { | 
 |       predFuncRef_(predRef_, stride, txSize_, &above[1], left, mode_); | 
 |     } | 
 |     aom_usec_timer_mark(&ref_timer); | 
 |  | 
 |     aom_usec_timer timer; | 
 |     aom_usec_timer_start(&timer); | 
 |     for (int i = 0; i < numIter; i++) { | 
 |       predFunc_(pred_, stride, txSize_, &above[1], left, mode_); | 
 |     } | 
 |     aom_usec_timer_mark(&timer); | 
 |  | 
 |     const int ref_sum_time = | 
 |         static_cast<int>(aom_usec_timer_elapsed(&ref_timer)); | 
 |     const int sum_time = static_cast<int>(aom_usec_timer_elapsed(&timer)); | 
 |  | 
 |     printf("c_time = %d \t simd_time = %d \t Gain = %4.2f \t mode =  %d \n", | 
 |            ref_sum_time, sum_time, | 
 |            (static_cast<float>(ref_sum_time) / static_cast<float>(sum_time)), | 
 |            static_cast<int>(mode_)); | 
 |  | 
 |     DiffPred(0); | 
 |   } | 
 |  | 
 |  private: | 
 |   void PrepareBuffer() const { | 
 |     ACMRandom rnd(ACMRandom::DeterministicSeed()); | 
 |     int i = 0; | 
 |     while (i < (2 * MaxTxSize + 1)) { | 
 |       alloc_[i] = rnd.Rand8(); | 
 |       i++; | 
 |     } | 
 |   } | 
 |  | 
 |   void DiffPred(int testNum) const { | 
 |     int i = 0; | 
 |     while (i < tx_size_wide[txSize_] * tx_size_high[txSize_]) { | 
 |       EXPECT_EQ(predRef_[i], pred_[i]) << "Error at position: " << i << " " | 
 |                                        << "Tx size: " << tx_size_wide[txSize_] | 
 |                                        << "x" << tx_size_high[txSize_] << " " | 
 |                                        << "Test number: " << testNum; | 
 |       i++; | 
 |     } | 
 |   } | 
 |  | 
 |   Predictor predFunc_; | 
 |   Predictor predFuncRef_; | 
 |   int mode_; | 
 |   TX_SIZE txSize_; | 
 |   uint8_t *alloc_; | 
 |   uint8_t *pred_; | 
 |   uint8_t *predRef_; | 
 | }; | 
 |  | 
 | TEST_P(AV1FilterIntraPredTest, BitExactCheck) { RunTest(); } | 
 |  | 
 | TEST_P(AV1FilterIntraPredTest, DISABLED_Speed) { RunSpeedTest(); } | 
 |  | 
 | using ::testing::make_tuple; | 
 | #if HAVE_SSE4_1 | 
 | const PredFuncMode kPredFuncMdArray[] = { | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_sse4_1, | 
 |              FILTER_DC_PRED), | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_sse4_1, | 
 |              FILTER_V_PRED), | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_sse4_1, | 
 |              FILTER_H_PRED), | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_sse4_1, | 
 |              FILTER_D157_PRED), | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_sse4_1, | 
 |              FILTER_PAETH_PRED), | 
 | }; | 
 |  | 
 | const TX_SIZE kTxSize[] = { TX_4X4,  TX_8X8,  TX_16X16, TX_32X32, TX_4X8, | 
 |                             TX_8X4,  TX_8X16, TX_16X8,  TX_16X32, TX_32X16, | 
 |                             TX_4X16, TX_16X4, TX_8X32,  TX_32X8 }; | 
 |  | 
 | INSTANTIATE_TEST_SUITE_P( | 
 |     SSE4_1, AV1FilterIntraPredTest, | 
 |     ::testing::Combine(::testing::ValuesIn(kPredFuncMdArray), | 
 |                        ::testing::ValuesIn(kTxSize))); | 
 | #endif  // HAVE_SSE4_1 | 
 |  | 
 | #if HAVE_NEON | 
 | const PredFuncMode kPredFuncMdArrayNEON[] = { | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_neon, | 
 |              FILTER_DC_PRED), | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_neon, | 
 |              FILTER_V_PRED), | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_neon, | 
 |              FILTER_H_PRED), | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_neon, | 
 |              FILTER_D157_PRED), | 
 |   make_tuple(&av1_filter_intra_predictor_c, &av1_filter_intra_predictor_neon, | 
 |              FILTER_PAETH_PRED), | 
 | }; | 
 |  | 
 | const TX_SIZE kTxSizeNEON[] = { TX_4X4,  TX_8X8,  TX_16X16, TX_32X32, TX_4X8, | 
 |                                 TX_8X4,  TX_8X16, TX_16X8,  TX_16X32, TX_32X16, | 
 |                                 TX_4X16, TX_16X4, TX_8X32,  TX_32X8 }; | 
 |  | 
 | INSTANTIATE_TEST_SUITE_P( | 
 |     NEON, AV1FilterIntraPredTest, | 
 |     ::testing::Combine(::testing::ValuesIn(kPredFuncMdArrayNEON), | 
 |                        ::testing::ValuesIn(kTxSizeNEON))); | 
 | #endif  // HAVE_NEON | 
 |  | 
 | }  // namespace |