|  | /* | 
|  | * Copyright (c) 2025, Alliance for Open Media. All rights reserved | 
|  | * | 
|  | * This source code is subject to the terms of the BSD 3-Clause Clear License | 
|  | * and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear | 
|  | * License was not distributed with this source code in the LICENSE file, you | 
|  | * can obtain it at aomedia.org/license/software-license/bsd-3-c-c/.  If the | 
|  | * Alliance for Open Media Patent License 1.0 was not distributed with this | 
|  | * source code in the PATENTS file, you can obtain it at | 
|  | * aomedia.org/license/patent-license/. | 
|  | */ | 
|  |  | 
|  | #include "config/av1_rtcd.h" | 
|  |  | 
|  | #include "test/acm_random.h" | 
|  | #include "test/util.h" | 
|  |  | 
|  | #if CONFIG_BAWP | 
|  | namespace { | 
|  | typedef void (*make_bawp_func)(uint16_t *dst, int dst_stride, int16_t alpha, | 
|  | int32_t beta, int shift, int bw, int bh, int bd); | 
|  | #if HAVE_AVX2 | 
|  | const BLOCK_SIZE kValidBlockSize[] = { | 
|  | BLOCK_4X4,     BLOCK_4X8,     BLOCK_8X4,     BLOCK_8X8, | 
|  | BLOCK_8X16,    BLOCK_16X8,    BLOCK_16X16,   BLOCK_16X32, | 
|  | BLOCK_32X16,   BLOCK_32X32,   BLOCK_32X64,   BLOCK_64X32, | 
|  | BLOCK_64X64,   BLOCK_64X128,  BLOCK_128X64,  BLOCK_128X128, | 
|  | #if CONFIG_EXT_RECUR_PARTITIONS | 
|  | BLOCK_128X256, BLOCK_256X128, BLOCK_256X256, | 
|  | #endif  // CONFIG_EXT_RECUR_PARTITIONS | 
|  | BLOCK_4X16,    BLOCK_16X4,    BLOCK_8X32,    BLOCK_32X8, | 
|  | BLOCK_16X64,   BLOCK_64X16, | 
|  | #if CONFIG_EXT_RECUR_PARTITIONS | 
|  | BLOCK_4X32,    BLOCK_32X4,    BLOCK_8X64,    BLOCK_64X8, | 
|  | BLOCK_4X64,    BLOCK_64X4, | 
|  | #endif  // CONFIG_EXT_RECUR_PARTITIONS | 
|  | }; | 
|  | #endif  // HAVE_AVX2 | 
|  |  | 
|  | typedef std::tuple<make_bawp_func, BLOCK_SIZE> BAWPParam; | 
|  |  | 
|  | class BAWPTest : public ::testing::TestWithParam<BAWPParam> { | 
|  | public: | 
|  | ~BAWPTest(); | 
|  | void SetUp(); | 
|  |  | 
|  | void TearDown(); | 
|  |  | 
|  | protected: | 
|  | void RunCheckOutput(make_bawp_func test_impl, BLOCK_SIZE bsize); | 
|  | void RunSpeedTest(make_bawp_func test_impl, BLOCK_SIZE bsize); | 
|  | bool CheckResult(int width, int height) { | 
|  | for (int y = 0; y < height; ++y) { | 
|  | for (int x = 0; x < width; ++x) { | 
|  | const int idx = y * width + x; | 
|  | if (pred1_[idx] != pred2_[idx]) { | 
|  | printf("%dx%d mismatch @%d(%d,%d) ", width, height, idx, x, y); | 
|  | printf("%d != %d ", pred1_[idx], pred2_[idx]); | 
|  | return false; | 
|  | } | 
|  | } | 
|  | } | 
|  | return true; | 
|  | } | 
|  |  | 
|  | libaom_test::ACMRandom rnd_; | 
|  | uint16_t *pred1_; | 
|  | uint16_t *pred2_; | 
|  | }; | 
|  | GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BAWPTest); | 
|  |  | 
|  | BAWPTest::~BAWPTest() {} | 
|  |  | 
|  | void BAWPTest::SetUp() { | 
|  | rnd_.Reset(libaom_test::ACMRandom::DeterministicSeed()); | 
|  |  | 
|  | pred1_ = (uint16_t *)aom_memalign( | 
|  | 16, MAX_SB_SIZE * MAX_SB_SIZE * sizeof(uint16_t)); | 
|  | ASSERT_NE(pred1_, nullptr); | 
|  | pred2_ = (uint16_t *)aom_memalign( | 
|  | 16, MAX_SB_SIZE * MAX_SB_SIZE * sizeof(uint16_t)); | 
|  | ASSERT_NE(pred2_, nullptr); | 
|  | for (int i = 0; i < (MAX_SB_SIZE * MAX_SB_SIZE); ++i) { | 
|  | pred1_[i] = rnd_.Rand16(); | 
|  | pred2_[i] = pred1_[i]; | 
|  | } | 
|  | } | 
|  |  | 
|  | void BAWPTest::TearDown() { | 
|  | aom_free(pred1_); | 
|  | aom_free(pred2_); | 
|  | } | 
|  |  | 
|  | void BAWPTest::RunCheckOutput(make_bawp_func test_impl, BLOCK_SIZE bsize) { | 
|  | const int w = block_size_wide[bsize]; | 
|  | const int h = block_size_high[bsize]; | 
|  | const int16_t alpha = 320; | 
|  | const int32_t beta = -42036; | 
|  | const int shift = 8; | 
|  | int bd[3] = { 8, 10, 12 }; | 
|  | for (int i = 0; i < 3; ++i) { | 
|  | av1_make_bawp_block_c(pred1_, MAX_SB_SIZE, alpha, beta, shift, w, h, bd[i]); | 
|  | test_impl(pred2_, MAX_SB_SIZE, alpha, beta, shift, w, h, bd[i]); | 
|  |  | 
|  | ASSERT_EQ(CheckResult(w, h), true); | 
|  | } | 
|  | } | 
|  |  | 
|  | void BAWPTest::RunSpeedTest(make_bawp_func test_impl, BLOCK_SIZE bsize) { | 
|  | const int w = block_size_wide[bsize]; | 
|  | const int h = block_size_high[bsize]; | 
|  | const int num_loops = 1000000000 / (w + h); | 
|  | const int16_t alpha = 320; | 
|  | const int32_t beta = -42036; | 
|  | const int shift = 8; | 
|  | int bd = 8; | 
|  |  | 
|  | make_bawp_func functions[2] = { av1_make_bawp_block_c, test_impl }; | 
|  | double elapsed_time[2] = { 0.0 }; | 
|  | for (int i = 0; i < 2; ++i) { | 
|  | aom_usec_timer timer; | 
|  | aom_usec_timer_start(&timer); | 
|  | make_bawp_func func = functions[i]; | 
|  | for (int j = 0; j < num_loops; ++j) { | 
|  | func(pred1_, MAX_SB_SIZE, alpha, beta, shift, w, h, bd); | 
|  | } | 
|  | aom_usec_timer_mark(&timer); | 
|  | const double time = static_cast<double>(aom_usec_timer_elapsed(&timer)); | 
|  | elapsed_time[i] = 1000.0 * time; | 
|  | } | 
|  | printf("BAWP %3dx%-3d: c_time=%7.2fs, simd_time=%7.2fs, scaling=%3.2f\n", w, | 
|  | h, elapsed_time[0], elapsed_time[1], | 
|  | elapsed_time[0] / elapsed_time[1]); | 
|  | } | 
|  |  | 
|  | TEST_P(BAWPTest, CheckOutput) { RunCheckOutput(GET_PARAM(0), GET_PARAM(1)); } | 
|  |  | 
|  | TEST_P(BAWPTest, DISABLED_Speed) { RunSpeedTest(GET_PARAM(0), GET_PARAM(1)); } | 
|  |  | 
|  | #if HAVE_AVX2 | 
|  | INSTANTIATE_TEST_SUITE_P( | 
|  | AVX2, BAWPTest, | 
|  | ::testing::Combine(::testing::Values(&av1_make_bawp_block_avx2), | 
|  | ::testing::ValuesIn(kValidBlockSize))); | 
|  | #endif  // HAVE_AVX2 | 
|  | }  // namespace | 
|  | #endif  // CONFIG_BAWP |