| /* | 
 |  * Copyright (c) 2021, Alliance for Open Media. All rights reserved | 
 |  * | 
 |  * This source code is subject to the terms of the BSD 3-Clause Clear License | 
 |  * and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear | 
 |  * License was not distributed with this source code in the LICENSE file, you | 
 |  * can obtain it at aomedia.org/license/software-license/bsd-3-c-c/.  If the | 
 |  * Alliance for Open Media Patent License 1.0 was not distributed with this | 
 |  * source code in the PATENTS file, you can obtain it at | 
 |  * aomedia.org/license/patent-license/. | 
 |  */ | 
 |  | 
 | #include <stdint.h> | 
 | #include <stdio.h> | 
 | #include <string.h> | 
 | #include <tuple> | 
 |  | 
 | #include "config/aom_config.h" | 
 | #include "config/av1_rtcd.h" | 
 |  | 
 | #include "aom_ports/mem.h" | 
 | #include "av1/common/scan.h" | 
 | #include "av1/common/txb_common.h" | 
 | #include "test/acm_random.h" | 
 | #include "test/clear_system_state.h" | 
 | #include "test/register_state_check.h" | 
 | #include "test/util.h" | 
 | #include "third_party/googletest/src/googletest/include/gtest/gtest.h" | 
 |  | 
 | namespace { | 
 | using libaom_test::ACMRandom; | 
 |  | 
 | typedef void (*buildcompdiffwtdmaskd16_func)( | 
 |     uint8_t *mask, DIFFWTD_MASK_TYPE mask_type, const CONV_BUF_TYPE *src0, | 
 |     int src0_stride, const CONV_BUF_TYPE *src1, int src1_stride, int h, int w, | 
 |     ConvolveParams *conv_params, int bd); | 
 |  | 
 | typedef std::tuple<int, buildcompdiffwtdmaskd16_func, BLOCK_SIZE> | 
 |     BuildCompDiffwtdMaskD16Param; | 
 |  | 
 | #if HAVE_SSE4_1 || HAVE_NEON | 
 | ::testing::internal::ParamGenerator<BuildCompDiffwtdMaskD16Param> BuildParams( | 
 |     buildcompdiffwtdmaskd16_func filter) { | 
 |   return ::testing::Combine(::testing::Range(8, 13, 2), | 
 |                             ::testing::Values(filter), | 
 |                             ::testing::Range(BLOCK_4X4, BLOCK_SIZES_ALL)); | 
 | } | 
 | #endif | 
 | class BuildCompDiffwtdMaskD16Test | 
 |     : public ::testing::TestWithParam<BuildCompDiffwtdMaskD16Param> { | 
 |  public: | 
 |   ~BuildCompDiffwtdMaskD16Test() {} | 
 |   virtual void TearDown() { libaom_test::ClearSystemState(); } | 
 |   void SetUp() { rnd_.Reset(ACMRandom::DeterministicSeed()); } | 
 |  | 
 |  protected: | 
 |   void RunCheckOutput(buildcompdiffwtdmaskd16_func test_impl); | 
 |   void RunSpeedTest(buildcompdiffwtdmaskd16_func test_impl, | 
 |                     DIFFWTD_MASK_TYPE mask_type); | 
 |   libaom_test::ACMRandom rnd_; | 
 | };  // class BuildCompDiffwtdMaskD16Test | 
 | GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BuildCompDiffwtdMaskD16Test); | 
 |  | 
 | void BuildCompDiffwtdMaskD16Test::RunCheckOutput( | 
 |     buildcompdiffwtdmaskd16_func test_impl) { | 
 |   const int block_idx = GET_PARAM(2); | 
 |   const int bd = GET_PARAM(0); | 
 |   const int width = block_size_wide[block_idx]; | 
 |   const int height = block_size_high[block_idx]; | 
 |   DECLARE_ALIGNED(16, uint8_t, mask_ref[2 * MAX_SB_SQUARE]); | 
 |   DECLARE_ALIGNED(16, uint8_t, mask_test[2 * MAX_SB_SQUARE]); | 
 |   DECLARE_ALIGNED(32, uint16_t, src0[MAX_SB_SQUARE]); | 
 |   DECLARE_ALIGNED(32, uint16_t, src1[MAX_SB_SQUARE]); | 
 |  | 
 |   ConvolveParams conv_params = get_conv_params_no_round(0, 0, NULL, 0, 1, bd); | 
 |  | 
 |   int in_precision = | 
 |       bd + 2 * FILTER_BITS - conv_params.round_0 - conv_params.round_1 + 2; | 
 |  | 
 |   for (int i = 0; i < MAX_SB_SQUARE; i++) { | 
 |     src0[i] = rnd_.Rand16() & ((1 << in_precision) - 1); | 
 |     src1[i] = rnd_.Rand16() & ((1 << in_precision) - 1); | 
 |   } | 
 |  | 
 |   for (int mask_type = 0; mask_type < DIFFWTD_MASK_TYPES; mask_type++) { | 
 |     av1_build_compound_diffwtd_mask_d16_c( | 
 |         mask_ref, (DIFFWTD_MASK_TYPE)mask_type, src0, width, src1, width, | 
 |         height, width, &conv_params, bd); | 
 |  | 
 |     test_impl(mask_test, (DIFFWTD_MASK_TYPE)mask_type, src0, width, src1, width, | 
 |               height, width, &conv_params, bd); | 
 |  | 
 |     for (int r = 0; r < height; ++r) { | 
 |       for (int c = 0; c < width; ++c) { | 
 |         ASSERT_EQ(mask_ref[c + r * width], mask_test[c + r * width]) | 
 |             << "Mismatch at unit tests for BuildCompDiffwtdMaskD16Test\n" | 
 |             << " Pixel mismatch at index " | 
 |             << "[" << r << "," << c << "] " | 
 |             << " @ " << width << "x" << height << " inv " << mask_type; | 
 |       } | 
 |     } | 
 |   } | 
 | } | 
 |  | 
 | void BuildCompDiffwtdMaskD16Test::RunSpeedTest( | 
 |     buildcompdiffwtdmaskd16_func test_impl, DIFFWTD_MASK_TYPE mask_type) { | 
 |   const int block_idx = GET_PARAM(2); | 
 |   const int bd = GET_PARAM(0); | 
 |   const int width = block_size_wide[block_idx]; | 
 |   const int height = block_size_high[block_idx]; | 
 |   DECLARE_ALIGNED(16, uint8_t, mask[MAX_SB_SQUARE]); | 
 |   DECLARE_ALIGNED(32, uint16_t, src0[MAX_SB_SQUARE]); | 
 |   DECLARE_ALIGNED(32, uint16_t, src1[MAX_SB_SQUARE]); | 
 |  | 
 |   ConvolveParams conv_params = get_conv_params_no_round(0, 0, NULL, 0, 1, bd); | 
 |  | 
 |   int in_precision = | 
 |       bd + 2 * FILTER_BITS - conv_params.round_0 - conv_params.round_1 + 2; | 
 |  | 
 |   for (int i = 0; i < MAX_SB_SQUARE; i++) { | 
 |     src0[i] = rnd_.Rand16() & ((1 << in_precision) - 1); | 
 |     src1[i] = rnd_.Rand16() & ((1 << in_precision) - 1); | 
 |   } | 
 |  | 
 |   const int num_loops = 10000000 / (width + height); | 
 |   aom_usec_timer timer; | 
 |   aom_usec_timer_start(&timer); | 
 |  | 
 |   for (int i = 0; i < num_loops; ++i) | 
 |     av1_build_compound_diffwtd_mask_d16_c(mask, mask_type, src0, width, src1, | 
 |                                           width, height, width, &conv_params, | 
 |                                           bd); | 
 |  | 
 |   aom_usec_timer_mark(&timer); | 
 |   const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer)); | 
 |  | 
 |   aom_usec_timer timer1; | 
 |   aom_usec_timer_start(&timer1); | 
 |  | 
 |   for (int i = 0; i < num_loops; ++i) | 
 |     test_impl(mask, mask_type, src0, width, src1, width, height, width, | 
 |               &conv_params, bd); | 
 |  | 
 |   aom_usec_timer_mark(&timer1); | 
 |   const int elapsed_time1 = static_cast<int>(aom_usec_timer_elapsed(&timer1)); | 
 |   printf("av1_build_compound_diffwtd_mask_d16  %3dx%-3d: %7.2f \n", width, | 
 |          height, elapsed_time / double(elapsed_time1)); | 
 | } | 
 | TEST_P(BuildCompDiffwtdMaskD16Test, CheckOutput) { | 
 |   RunCheckOutput(GET_PARAM(1)); | 
 | } | 
 |  | 
 | TEST_P(BuildCompDiffwtdMaskD16Test, DISABLED_Speed) { | 
 |   RunSpeedTest(GET_PARAM(1), DIFFWTD_38); | 
 |   RunSpeedTest(GET_PARAM(1), DIFFWTD_38_INV); | 
 | } | 
 |  | 
 | #if HAVE_SSE4_1 | 
 | INSTANTIATE_TEST_SUITE_P( | 
 |     SSE4_1, BuildCompDiffwtdMaskD16Test, | 
 |     BuildParams(av1_build_compound_diffwtd_mask_d16_sse4_1)); | 
 | #endif | 
 |  | 
 | #if HAVE_AVX2 | 
 | INSTANTIATE_TEST_SUITE_P(AVX2, BuildCompDiffwtdMaskD16Test, | 
 |                          BuildParams(av1_build_compound_diffwtd_mask_d16_avx2)); | 
 | #endif | 
 |  | 
 | #if HAVE_NEON | 
 | INSTANTIATE_TEST_SUITE_P(NEON, BuildCompDiffwtdMaskD16Test, | 
 |                          BuildParams(av1_build_compound_diffwtd_mask_d16_neon)); | 
 | #endif | 
 |  | 
 | }  // namespace |