| /* | 
 |  * Copyright (c) 2025, Alliance for Open Media. All rights reserved | 
 |  * | 
 |  * This source code is subject to the terms of the BSD 3-Clause Clear License | 
 |  * and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear | 
 |  * License was not distributed with this source code in the LICENSE file, you | 
 |  * can obtain it at aomedia.org/license/software-license/bsd-3-c-c/.  If the | 
 |  * Alliance for Open Media Patent License 1.0 was not distributed with this | 
 |  * source code in the PATENTS file, you can obtain it at | 
 |  * aomedia.org/license/patent-license/. | 
 |  */ | 
 |  | 
 | #include "config/av1_rtcd.h" | 
 |  | 
 | #include "test/acm_random.h" | 
 | #include "test/util.h" | 
 |  | 
 | namespace { | 
 | typedef void (*make_bawp_func)(uint16_t *dst, int dst_stride, int16_t alpha, | 
 |                                int32_t beta, int shift, int bw, int bh, int bd); | 
 | #if HAVE_AVX2 | 
 | const BLOCK_SIZE kValidBlockSize[] = { | 
 |   BLOCK_4X4,     BLOCK_4X8,     BLOCK_8X4,     BLOCK_8X8,     BLOCK_8X16, | 
 |   BLOCK_16X8,    BLOCK_16X16,   BLOCK_16X32,   BLOCK_32X16,   BLOCK_32X32, | 
 |   BLOCK_32X64,   BLOCK_64X32,   BLOCK_64X64,   BLOCK_64X128,  BLOCK_128X64, | 
 |   BLOCK_128X128, BLOCK_128X256, BLOCK_256X128, BLOCK_256X256, BLOCK_4X16, | 
 |   BLOCK_16X4,    BLOCK_8X32,    BLOCK_32X8,    BLOCK_16X64,   BLOCK_64X16, | 
 |   BLOCK_4X32,    BLOCK_32X4,    BLOCK_8X64,    BLOCK_64X8,    BLOCK_4X64, | 
 |   BLOCK_64X4, | 
 | }; | 
 | #endif  // HAVE_AVX2 | 
 |  | 
 | typedef std::tuple<make_bawp_func, BLOCK_SIZE> BAWPParam; | 
 |  | 
 | class BAWPTest : public ::testing::TestWithParam<BAWPParam> { | 
 |  public: | 
 |   ~BAWPTest(); | 
 |   void SetUp(); | 
 |  | 
 |   void TearDown(); | 
 |  | 
 |  protected: | 
 |   void RunCheckOutput(make_bawp_func test_impl, BLOCK_SIZE bsize); | 
 |   void RunSpeedTest(make_bawp_func test_impl, BLOCK_SIZE bsize); | 
 |   bool CheckResult(int width, int height) { | 
 |     for (int y = 0; y < height; ++y) { | 
 |       for (int x = 0; x < width; ++x) { | 
 |         const int idx = y * width + x; | 
 |         if (pred1_[idx] != pred2_[idx]) { | 
 |           printf("%dx%d mismatch @%d(%d,%d) ", width, height, idx, x, y); | 
 |           printf("%d != %d ", pred1_[idx], pred2_[idx]); | 
 |           return false; | 
 |         } | 
 |       } | 
 |     } | 
 |     return true; | 
 |   } | 
 |  | 
 |   libaom_test::ACMRandom rnd_; | 
 |   uint16_t *pred1_; | 
 |   uint16_t *pred2_; | 
 | }; | 
 | GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BAWPTest); | 
 |  | 
 | BAWPTest::~BAWPTest() {} | 
 |  | 
 | void BAWPTest::SetUp() { | 
 |   rnd_.Reset(libaom_test::ACMRandom::DeterministicSeed()); | 
 |  | 
 |   pred1_ = (uint16_t *)aom_memalign( | 
 |       16, MAX_SB_SIZE * MAX_SB_SIZE * sizeof(uint16_t)); | 
 |   ASSERT_NE(pred1_, nullptr); | 
 |   pred2_ = (uint16_t *)aom_memalign( | 
 |       16, MAX_SB_SIZE * MAX_SB_SIZE * sizeof(uint16_t)); | 
 |   ASSERT_NE(pred2_, nullptr); | 
 |   for (int i = 0; i < (MAX_SB_SIZE * MAX_SB_SIZE); ++i) { | 
 |     pred1_[i] = rnd_.Rand16(); | 
 |     pred2_[i] = pred1_[i]; | 
 |   } | 
 | } | 
 |  | 
 | void BAWPTest::TearDown() { | 
 |   aom_free(pred1_); | 
 |   aom_free(pred2_); | 
 | } | 
 |  | 
 | void BAWPTest::RunCheckOutput(make_bawp_func test_impl, BLOCK_SIZE bsize) { | 
 |   const int w = block_size_wide[bsize]; | 
 |   const int h = block_size_high[bsize]; | 
 |   const int16_t alpha = 320; | 
 |   const int32_t beta = -42036; | 
 |   const int shift = 8; | 
 |   int bd[3] = { 8, 10, 12 }; | 
 |   for (int i = 0; i < 3; ++i) { | 
 |     av1_make_bawp_block_c(pred1_, MAX_SB_SIZE, alpha, beta, shift, w, h, bd[i]); | 
 |     test_impl(pred2_, MAX_SB_SIZE, alpha, beta, shift, w, h, bd[i]); | 
 |  | 
 |     ASSERT_EQ(CheckResult(w, h), true); | 
 |   } | 
 | } | 
 |  | 
 | void BAWPTest::RunSpeedTest(make_bawp_func test_impl, BLOCK_SIZE bsize) { | 
 |   const int w = block_size_wide[bsize]; | 
 |   const int h = block_size_high[bsize]; | 
 |   const int num_loops = 1000000000 / (w + h); | 
 |   const int16_t alpha = 320; | 
 |   const int32_t beta = -42036; | 
 |   const int shift = 8; | 
 |   int bd = 8; | 
 |  | 
 |   make_bawp_func functions[2] = { av1_make_bawp_block_c, test_impl }; | 
 |   double elapsed_time[2] = { 0.0 }; | 
 |   for (int i = 0; i < 2; ++i) { | 
 |     aom_usec_timer timer; | 
 |     aom_usec_timer_start(&timer); | 
 |     make_bawp_func func = functions[i]; | 
 |     for (int j = 0; j < num_loops; ++j) { | 
 |       func(pred1_, MAX_SB_SIZE, alpha, beta, shift, w, h, bd); | 
 |     } | 
 |     aom_usec_timer_mark(&timer); | 
 |     const double time = static_cast<double>(aom_usec_timer_elapsed(&timer)); | 
 |     elapsed_time[i] = 1000.0 * time; | 
 |   } | 
 |   printf("BAWP %3dx%-3d: c_time=%7.2fs, simd_time=%7.2fs, scaling=%3.2f\n", w, | 
 |          h, elapsed_time[0], elapsed_time[1], | 
 |          elapsed_time[0] / elapsed_time[1]); | 
 | } | 
 |  | 
 | TEST_P(BAWPTest, CheckOutput) { RunCheckOutput(GET_PARAM(0), GET_PARAM(1)); } | 
 |  | 
 | TEST_P(BAWPTest, DISABLED_Speed) { RunSpeedTest(GET_PARAM(0), GET_PARAM(1)); } | 
 |  | 
 | #if HAVE_AVX2 | 
 | INSTANTIATE_TEST_SUITE_P( | 
 |     AVX2, BAWPTest, | 
 |     ::testing::Combine(::testing::Values(&av1_make_bawp_block_avx2), | 
 |                        ::testing::ValuesIn(kValidBlockSize))); | 
 | #endif  // HAVE_AVX2 | 
 | }  // namespace |