|  | /* | 
|  | * Copyright (c) 2017, Alliance for Open Media. All rights reserved | 
|  | * | 
|  | * This source code is subject to the terms of the BSD 2 Clause License and | 
|  | * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License | 
|  | * was not distributed with this source code in the LICENSE file, you can | 
|  | * obtain it at www.aomedia.org/license/software. If the Alliance for Open | 
|  | * Media Patent License 1.0 was not distributed with this source code in the | 
|  | * PATENTS file, you can obtain it at www.aomedia.org/license/patent. | 
|  | */ | 
|  |  | 
|  | #include <stdint.h> | 
|  | #include <stdio.h> | 
|  | #include <string.h> | 
|  | #include <tuple> | 
|  |  | 
|  | #include "third_party/googletest/src/googletest/include/gtest/gtest.h" | 
|  |  | 
|  | #include "config/aom_config.h" | 
|  | #include "config/av1_rtcd.h" | 
|  |  | 
|  | #include "aom_ports/aom_timer.h" | 
|  | #include "aom_ports/mem.h" | 
|  | #include "av1/common/av1_common_int.h" | 
|  | #include "av1/common/idct.h" | 
|  | #include "av1/common/scan.h" | 
|  | #include "av1/common/txb_common.h" | 
|  | #include "test/acm_random.h" | 
|  | #include "test/clear_system_state.h" | 
|  | #include "test/register_state_check.h" | 
|  | #include "test/util.h" | 
|  |  | 
|  | namespace { | 
|  | using libaom_test::ACMRandom; | 
|  |  | 
|  | typedef void (*GetNzMapContextsFunc)(const uint8_t *const levels, | 
|  | const int16_t *const scan, | 
|  | const uint16_t eob, const TX_SIZE tx_size, | 
|  | const TX_CLASS tx_class, | 
|  | int8_t *const coeff_contexts); | 
|  |  | 
|  | class EncodeTxbTest : public ::testing::TestWithParam<GetNzMapContextsFunc> { | 
|  | public: | 
|  | EncodeTxbTest() : get_nz_map_contexts_func_(GetParam()) {} | 
|  |  | 
|  | virtual ~EncodeTxbTest() {} | 
|  |  | 
|  | virtual void SetUp() { | 
|  | coeff_contexts_ref_ = reinterpret_cast<int8_t *>( | 
|  | aom_memalign(16, sizeof(*coeff_contexts_ref_) * MAX_TX_SQUARE)); | 
|  | ASSERT_TRUE(coeff_contexts_ref_ != NULL); | 
|  | coeff_contexts_ = reinterpret_cast<int8_t *>( | 
|  | aom_memalign(16, sizeof(*coeff_contexts_) * MAX_TX_SQUARE)); | 
|  | ASSERT_TRUE(coeff_contexts_ != NULL); | 
|  | } | 
|  |  | 
|  | virtual void TearDown() { | 
|  | aom_free(coeff_contexts_ref_); | 
|  | aom_free(coeff_contexts_); | 
|  | libaom_test::ClearSystemState(); | 
|  | } | 
|  |  | 
|  | void GetNzMapContextsRun() { | 
|  | const int kNumTests = 10; | 
|  | int result = 0; | 
|  |  | 
|  | for (int is_inter = 0; is_inter < 2; ++is_inter) { | 
|  | for (int tx_type = DCT_DCT; tx_type < TX_TYPES; ++tx_type) { | 
|  | const TX_CLASS tx_class = tx_type_to_class[tx_type]; | 
|  | for (int tx_size = TX_4X4; tx_size < TX_SIZES_ALL; ++tx_size) { | 
|  | const int bwl = get_txb_bwl((TX_SIZE)tx_size); | 
|  | const int width = get_txb_wide((TX_SIZE)tx_size); | 
|  | const int height = get_txb_high((TX_SIZE)tx_size); | 
|  | const int real_width = tx_size_wide[tx_size]; | 
|  | const int real_height = tx_size_high[tx_size]; | 
|  | const int16_t *const scan = av1_scan_orders[tx_size][tx_type].scan; | 
|  |  | 
|  | levels_ = set_levels(levels_buf_, width); | 
|  | for (int i = 0; i < kNumTests && !result; ++i) { | 
|  | for (int eob = 1; eob <= width * height && !result; ++eob) { | 
|  | InitDataWithEob(scan, bwl, eob); | 
|  |  | 
|  | av1_get_nz_map_contexts_c(levels_, scan, eob, (TX_SIZE)tx_size, | 
|  | tx_class, coeff_contexts_ref_); | 
|  | get_nz_map_contexts_func_(levels_, scan, eob, (TX_SIZE)tx_size, | 
|  | tx_class, coeff_contexts_); | 
|  |  | 
|  | result = Compare(scan, eob); | 
|  |  | 
|  | EXPECT_EQ(result, 0) | 
|  | << " tx_class " << tx_class << " width " << real_width | 
|  | << " height " << real_height << " eob " << eob; | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | void SpeedTestGetNzMapContextsRun() { | 
|  | const int kNumTests = 2000000000; | 
|  | aom_usec_timer timer; | 
|  | aom_usec_timer timer_ref; | 
|  |  | 
|  | printf("Note: Only test the largest possible eob case!\n"); | 
|  | for (int tx_size = TX_4X4; tx_size < TX_SIZES_ALL; ++tx_size) { | 
|  | const int bwl = get_txb_bwl((TX_SIZE)tx_size); | 
|  | const int width = get_txb_wide((TX_SIZE)tx_size); | 
|  | const int height = get_txb_high((TX_SIZE)tx_size); | 
|  | const int real_width = tx_size_wide[tx_size]; | 
|  | const int real_height = tx_size_high[tx_size]; | 
|  | const TX_TYPE tx_type = DCT_DCT; | 
|  | const TX_CLASS tx_class = tx_type_to_class[tx_type]; | 
|  | const int16_t *const scan = av1_scan_orders[tx_size][tx_type].scan; | 
|  | const int eob = width * height; | 
|  | const int numTests = kNumTests / (width * height); | 
|  |  | 
|  | levels_ = set_levels(levels_buf_, width); | 
|  | InitDataWithEob(scan, bwl, eob); | 
|  |  | 
|  | aom_usec_timer_start(&timer_ref); | 
|  | for (int i = 0; i < numTests; ++i) { | 
|  | av1_get_nz_map_contexts_c(levels_, scan, eob, (TX_SIZE)tx_size, | 
|  | tx_class, coeff_contexts_ref_); | 
|  | } | 
|  | aom_usec_timer_mark(&timer_ref); | 
|  |  | 
|  | levels_ = set_levels(levels_buf_, width); | 
|  | InitDataWithEob(scan, bwl, eob); | 
|  |  | 
|  | aom_usec_timer_start(&timer); | 
|  | for (int i = 0; i < numTests; ++i) { | 
|  | get_nz_map_contexts_func_(levels_, scan, eob, (TX_SIZE)tx_size, | 
|  | tx_class, coeff_contexts_); | 
|  | } | 
|  | aom_usec_timer_mark(&timer); | 
|  |  | 
|  | const int elapsed_time_ref = | 
|  | static_cast<int>(aom_usec_timer_elapsed(&timer_ref)); | 
|  | const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer)); | 
|  |  | 
|  | printf("get_nz_map_contexts_%2dx%2d: %7.1f ms ref %7.1f ms gain %4.2f\n", | 
|  | real_width, real_height, elapsed_time / 1000.0, | 
|  | elapsed_time_ref / 1000.0, | 
|  | (elapsed_time_ref * 1.0) / (elapsed_time * 1.0)); | 
|  | } | 
|  | } | 
|  |  | 
|  | private: | 
|  | void InitDataWithEob(const int16_t *const scan, const int bwl, | 
|  | const int eob) { | 
|  | memset(levels_buf_, 0, sizeof(levels_buf_)); | 
|  | memset(coeff_contexts_, 0, sizeof(*coeff_contexts_) * MAX_TX_SQUARE); | 
|  |  | 
|  | for (int c = 0; c < eob; ++c) { | 
|  | levels_[get_padded_idx(scan[c], bwl)] = | 
|  | static_cast<uint8_t>(clamp(rnd_.Rand8(), 0, INT8_MAX)); | 
|  | coeff_contexts_[scan[c]] = static_cast<int8_t>(rnd_.Rand16() >> 1); | 
|  | } | 
|  |  | 
|  | memcpy(coeff_contexts_ref_, coeff_contexts_, | 
|  | sizeof(*coeff_contexts_) * MAX_TX_SQUARE); | 
|  | } | 
|  |  | 
|  | bool Compare(const int16_t *const scan, const int eob) const { | 
|  | bool result = false; | 
|  | if (memcmp(coeff_contexts_, coeff_contexts_ref_, | 
|  | sizeof(*coeff_contexts_ref_) * MAX_TX_SQUARE)) { | 
|  | for (int i = 0; i < eob; i++) { | 
|  | const int pos = scan[i]; | 
|  | if (coeff_contexts_ref_[pos] != coeff_contexts_[pos]) { | 
|  | printf("coeff_contexts_[%d] diff:%6d (ref),%6d (opt)\n", pos, | 
|  | coeff_contexts_ref_[pos], coeff_contexts_[pos]); | 
|  | result = true; | 
|  | break; | 
|  | } | 
|  | } | 
|  | } | 
|  | return result; | 
|  | } | 
|  |  | 
|  | GetNzMapContextsFunc get_nz_map_contexts_func_; | 
|  | ACMRandom rnd_; | 
|  | uint8_t levels_buf_[TX_PAD_2D]; | 
|  | uint8_t *levels_; | 
|  | int8_t *coeff_contexts_ref_; | 
|  | int8_t *coeff_contexts_; | 
|  | }; | 
|  | GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(EncodeTxbTest); | 
|  |  | 
|  | TEST_P(EncodeTxbTest, GetNzMapContexts) { GetNzMapContextsRun(); } | 
|  |  | 
|  | TEST_P(EncodeTxbTest, DISABLED_SpeedTestGetNzMapContexts) { | 
|  | SpeedTestGetNzMapContextsRun(); | 
|  | } | 
|  |  | 
|  | #if HAVE_SSE2 | 
|  | INSTANTIATE_TEST_SUITE_P(SSE2, EncodeTxbTest, | 
|  | ::testing::Values(av1_get_nz_map_contexts_sse2)); | 
|  | #endif | 
|  |  | 
|  | #if HAVE_NEON | 
|  | INSTANTIATE_TEST_SUITE_P(NEON, EncodeTxbTest, | 
|  | ::testing::Values(av1_get_nz_map_contexts_neon)); | 
|  | #endif | 
|  |  | 
|  | typedef void (*av1_txb_init_levels_func)(const tran_low_t *const coeff, | 
|  | const int width, const int height, | 
|  | uint8_t *const levels); | 
|  |  | 
|  | typedef std::tuple<av1_txb_init_levels_func, int> TxbInitLevelParam; | 
|  |  | 
|  | class EncodeTxbInitLevelTest | 
|  | : public ::testing::TestWithParam<TxbInitLevelParam> { | 
|  | public: | 
|  | virtual ~EncodeTxbInitLevelTest() {} | 
|  | virtual void TearDown() { libaom_test::ClearSystemState(); } | 
|  | void RunTest(av1_txb_init_levels_func test_func, int tx_size, int is_speed); | 
|  | }; | 
|  | GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(EncodeTxbInitLevelTest); | 
|  |  | 
|  | void EncodeTxbInitLevelTest::RunTest(av1_txb_init_levels_func test_func, | 
|  | int tx_size, int is_speed) { | 
|  | const int width = get_txb_wide((TX_SIZE)tx_size); | 
|  | const int height = get_txb_high((TX_SIZE)tx_size); | 
|  | tran_low_t coeff[MAX_TX_SQUARE]; | 
|  |  | 
|  | uint8_t levels_buf[2][TX_PAD_2D]; | 
|  | uint8_t *const levels0 = set_levels(levels_buf[0], width); | 
|  | uint8_t *const levels1 = set_levels(levels_buf[1], width); | 
|  |  | 
|  | ACMRandom rnd(ACMRandom::DeterministicSeed()); | 
|  | for (int i = 0; i < width * height; i++) { | 
|  | coeff[i] = rnd.Rand15Signed() + rnd.Rand15Signed(); | 
|  | } | 
|  | for (int i = 0; i < TX_PAD_2D; i++) { | 
|  | levels_buf[0][i] = rnd.Rand8(); | 
|  | levels_buf[1][i] = rnd.Rand8(); | 
|  | } | 
|  | const int run_times = is_speed ? (width * height) * 10000 : 1; | 
|  | aom_usec_timer timer; | 
|  | aom_usec_timer_start(&timer); | 
|  | for (int i = 0; i < run_times; ++i) { | 
|  | av1_txb_init_levels_c(coeff, width, height, levels0); | 
|  | } | 
|  | const double t1 = get_time_mark(&timer); | 
|  | aom_usec_timer_start(&timer); | 
|  | for (int i = 0; i < run_times; ++i) { | 
|  | test_func(coeff, width, height, levels1); | 
|  | } | 
|  | const double t2 = get_time_mark(&timer); | 
|  | if (is_speed) { | 
|  | printf("init %3dx%-3d:%7.2f/%7.2fns", width, height, t1, t2); | 
|  | printf("(%3.2f)\n", t1 / t2); | 
|  | } | 
|  | const int stride = width + TX_PAD_HOR; | 
|  | for (int r = 0; r < height + TX_PAD_VER; ++r) { | 
|  | for (int c = 0; c < stride; ++c) { | 
|  | ASSERT_EQ(levels_buf[0][c + r * stride], levels_buf[1][c + r * stride]) | 
|  | << "[" << r << "," << c << "] " << run_times << width << "x" | 
|  | << height; | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | TEST_P(EncodeTxbInitLevelTest, match) { | 
|  | RunTest(GET_PARAM(0), GET_PARAM(1), 0); | 
|  | } | 
|  |  | 
|  | TEST_P(EncodeTxbInitLevelTest, DISABLED_Speed) { | 
|  | RunTest(GET_PARAM(0), GET_PARAM(1), 1); | 
|  | } | 
|  |  | 
|  | #if HAVE_SSE4_1 | 
|  | INSTANTIATE_TEST_SUITE_P( | 
|  | SSE4_1, EncodeTxbInitLevelTest, | 
|  | ::testing::Combine(::testing::Values(&av1_txb_init_levels_sse4_1), | 
|  | ::testing::Range(0, static_cast<int>(TX_SIZES_ALL), 1))); | 
|  | #endif | 
|  | #if HAVE_AVX2 | 
|  | INSTANTIATE_TEST_SUITE_P( | 
|  | AVX2, EncodeTxbInitLevelTest, | 
|  | ::testing::Combine(::testing::Values(&av1_txb_init_levels_avx2), | 
|  | ::testing::Range(0, static_cast<int>(TX_SIZES_ALL), 1))); | 
|  | #endif | 
|  | #if HAVE_NEON | 
|  | INSTANTIATE_TEST_SUITE_P( | 
|  | NEON, EncodeTxbInitLevelTest, | 
|  | ::testing::Combine(::testing::Values(&av1_txb_init_levels_neon), | 
|  | ::testing::Range(0, static_cast<int>(TX_SIZES_ALL), 1))); | 
|  | #endif | 
|  | }  // namespace |