| /* |
| * Copyright (c) 2016, Alliance for Open Media. All rights reserved |
| * |
| * This source code is subject to the terms of the BSD 2 Clause License and |
| * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
| * was not distributed with this source code in the LICENSE file, you can |
| * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
| * Media Patent License 1.0 was not distributed with this source code in the |
| * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
| */ |
| |
| #include "third_party/googletest/src/include/gtest/gtest.h" |
| |
| #include "./av1_rtcd.h" |
| #include "test/acm_random.h" |
| #include "test/clear_system_state.h" |
| #include "test/register_state_check.h" |
| #include "test/util.h" |
| |
| namespace { |
| |
| using std::tr1::tuple; |
| using libaom_test::ACMRandom; |
| |
| typedef void (*ConvInit)(); |
| typedef void (*conv_filter_t)(const uint8_t *, int, uint8_t *, int, int, int, |
| const InterpFilterParams, const int, int, |
| ConvolveParams *); |
| #if CONFIG_AOM_HIGHBITDEPTH |
| typedef void (*hbd_conv_filter_t)(const uint16_t *, int, uint16_t *, int, int, |
| int, const InterpFilterParams, const int, int, |
| int, int); |
| #endif |
| |
| // Test parameter list: |
| // <convolve_horiz_func, convolve_vert_func, |
| // <width, height>, filter_params, subpel_x_q4, avg> |
| typedef tuple<int, int> BlockDimension; |
| typedef tuple<ConvInit, conv_filter_t, conv_filter_t, BlockDimension, |
| InterpFilter, int, int> |
| ConvParams; |
| #if CONFIG_AOM_HIGHBITDEPTH |
| // Test parameter list: |
| // <convolve_horiz_func, convolve_vert_func, |
| // <width, height>, filter_params, subpel_x_q4, avg, bit_dpeth> |
| typedef tuple<hbd_conv_filter_t, hbd_conv_filter_t, BlockDimension, |
| InterpFilter, int, int, int> |
| HbdConvParams; |
| #endif |
| |
| // Note: |
| // src_ and src_ref_ have special boundary requirement |
| // dst_ and dst_ref_ don't |
| const size_t maxWidth = 256; |
| const size_t maxHeight = 256; |
| const size_t maxBlockSize = maxWidth * maxHeight; |
| const int horizOffset = 32; |
| const int vertiOffset = 32; |
| const int stride = 128; |
| const int x_step_q4 = 16; |
| |
| class AV1ConvolveOptimzTest : public ::testing::TestWithParam<ConvParams> { |
| public: |
| virtual ~AV1ConvolveOptimzTest() {} |
| virtual void SetUp() { |
| ConvInit conv_init = GET_PARAM(0); |
| conv_init(); |
| conv_horiz_ = GET_PARAM(1); |
| conv_vert_ = GET_PARAM(2); |
| BlockDimension block = GET_PARAM(3); |
| width_ = std::tr1::get<0>(block); |
| height_ = std::tr1::get<1>(block); |
| filter_ = GET_PARAM(4); |
| subpel_ = GET_PARAM(5); |
| int ref = GET_PARAM(6); |
| const int plane = 0; |
| conv_params_ = get_conv_params(ref, plane); |
| |
| alloc_ = new uint8_t[maxBlockSize * 4]; |
| src_ = alloc_ + (vertiOffset * maxWidth); |
| src_ += horizOffset; |
| src_ref_ = src_ + maxBlockSize; |
| |
| dst_ = alloc_ + 2 * maxBlockSize; |
| dst_ref_ = alloc_ + 3 * maxBlockSize; |
| } |
| |
| virtual void TearDown() { |
| delete[] alloc_; |
| libaom_test::ClearSystemState(); |
| } |
| |
| protected: |
| void RunHorizFilterBitExactCheck(); |
| void RunVertFilterBitExactCheck(); |
| |
| private: |
| void PrepFilterBuffer(); |
| void DiffFilterBuffer(); |
| conv_filter_t conv_horiz_; |
| conv_filter_t conv_vert_; |
| uint8_t *alloc_; |
| uint8_t *src_; |
| uint8_t *dst_; |
| uint8_t *src_ref_; |
| uint8_t *dst_ref_; |
| int width_; |
| int height_; |
| int filter_; |
| int subpel_; |
| ConvolveParams conv_params_; |
| }; |
| |
| void AV1ConvolveOptimzTest::PrepFilterBuffer() { |
| int r, c; |
| ACMRandom rnd(ACMRandom::DeterministicSeed()); |
| |
| memset(alloc_, 0, 4 * maxBlockSize * sizeof(alloc_[0])); |
| |
| uint8_t *src_ptr = src_; |
| uint8_t *dst_ptr = dst_; |
| uint8_t *src_ref_ptr = src_ref_; |
| uint8_t *dst_ref_ptr = dst_ref_; |
| |
| for (r = 0; r < height_; ++r) { |
| for (c = 0; c < width_; ++c) { |
| src_ptr[c] = rnd.Rand8(); |
| src_ref_ptr[c] = src_ptr[c]; |
| dst_ptr[c] = rnd.Rand8(); |
| dst_ref_ptr[c] = dst_ptr[c]; |
| } |
| src_ptr += stride; |
| src_ref_ptr += stride; |
| dst_ptr += stride; |
| dst_ref_ptr += stride; |
| } |
| } |
| |
| void AV1ConvolveOptimzTest::DiffFilterBuffer() { |
| int r, c; |
| const uint8_t *dst_ptr = dst_; |
| const uint8_t *dst_ref_ptr = dst_ref_; |
| for (r = 0; r < height_; ++r) { |
| for (c = 0; c < width_; ++c) { |
| EXPECT_EQ((uint8_t)dst_ref_ptr[c], (uint8_t)dst_ptr[c]) |
| << "Error at row: " << r << " col: " << c << " " |
| << "w = " << width_ << " " |
| << "h = " << height_ << " " |
| << "filter group index = " << filter_ << " " |
| << "filter index = " << subpel_; |
| } |
| dst_ptr += stride; |
| dst_ref_ptr += stride; |
| } |
| } |
| |
| void AV1ConvolveOptimzTest::RunHorizFilterBitExactCheck() { |
| PrepFilterBuffer(); |
| |
| InterpFilterParams filter_params = av1_get_interp_filter_params(filter_); |
| |
| av1_convolve_horiz_c(src_ref_, stride, dst_ref_, stride, width_, height_, |
| filter_params, subpel_, x_step_q4, &conv_params_); |
| |
| conv_horiz_(src_, stride, dst_, stride, width_, height_, filter_params, |
| subpel_, x_step_q4, &conv_params_); |
| |
| DiffFilterBuffer(); |
| |
| // Note: |
| // Here we need calculate a height which is different from the specified one |
| // and test again. |
| int intermediate_height = |
| (((height_ - 1) * 16 + subpel_) >> SUBPEL_BITS) + filter_params.taps; |
| PrepFilterBuffer(); |
| |
| av1_convolve_horiz_c(src_ref_, stride, dst_ref_, stride, width_, |
| intermediate_height, filter_params, subpel_, x_step_q4, |
| &conv_params_); |
| |
| conv_horiz_(src_, stride, dst_, stride, width_, intermediate_height, |
| filter_params, subpel_, x_step_q4, &conv_params_); |
| |
| DiffFilterBuffer(); |
| } |
| |
| void AV1ConvolveOptimzTest::RunVertFilterBitExactCheck() { |
| PrepFilterBuffer(); |
| |
| InterpFilterParams filter_params = av1_get_interp_filter_params(filter_); |
| |
| av1_convolve_vert_c(src_ref_, stride, dst_ref_, stride, width_, height_, |
| filter_params, subpel_, x_step_q4, &conv_params_); |
| |
| conv_vert_(src_, stride, dst_, stride, width_, height_, filter_params, |
| subpel_, x_step_q4, &conv_params_); |
| |
| DiffFilterBuffer(); |
| } |
| |
| TEST_P(AV1ConvolveOptimzTest, HorizBitExactCheck) { |
| RunHorizFilterBitExactCheck(); |
| } |
| TEST_P(AV1ConvolveOptimzTest, VerticalBitExactCheck) { |
| RunVertFilterBitExactCheck(); |
| } |
| |
| using std::tr1::make_tuple; |
| |
| #if (HAVE_SSSE3 || HAVE_SSE4_1) && CONFIG_DUAL_FILTER |
| const BlockDimension kBlockDim[] = { |
| make_tuple(2, 2), make_tuple(2, 4), make_tuple(4, 4), |
| make_tuple(4, 8), make_tuple(8, 4), make_tuple(8, 8), |
| make_tuple(8, 16), make_tuple(16, 8), make_tuple(16, 16), |
| make_tuple(16, 32), make_tuple(32, 16), make_tuple(32, 32), |
| make_tuple(32, 64), make_tuple(64, 32), make_tuple(64, 64), |
| make_tuple(64, 128), make_tuple(128, 64), make_tuple(128, 128), |
| }; |
| |
| // 10/12-tap filters |
| const InterpFilter kFilter[] = { 6, 4, 2 }; |
| |
| const int kSubpelQ4[] = { 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 }; |
| |
| const int kAvg[] = { 0, 1 }; |
| #endif |
| |
| #if HAVE_SSSE3 && CONFIG_DUAL_FILTER |
| INSTANTIATE_TEST_CASE_P( |
| SSSE3, AV1ConvolveOptimzTest, |
| ::testing::Combine(::testing::Values(av1_convolve_init_ssse3), |
| ::testing::Values(av1_convolve_horiz_ssse3), |
| ::testing::Values(av1_convolve_vert_ssse3), |
| ::testing::ValuesIn(kBlockDim), |
| ::testing::ValuesIn(kFilter), |
| ::testing::ValuesIn(kSubpelQ4), |
| ::testing::ValuesIn(kAvg))); |
| #endif // HAVE_SSSE3 && CONFIG_DUAL_FILTER |
| |
| #if CONFIG_AOM_HIGHBITDEPTH |
| typedef ::testing::TestWithParam<HbdConvParams> TestWithHbdConvParams; |
| class AV1HbdConvolveOptimzTest : public TestWithHbdConvParams { |
| public: |
| virtual ~AV1HbdConvolveOptimzTest() {} |
| virtual void SetUp() { |
| conv_horiz_ = GET_PARAM(0); |
| conv_vert_ = GET_PARAM(1); |
| BlockDimension block = GET_PARAM(2); |
| width_ = std::tr1::get<0>(block); |
| height_ = std::tr1::get<1>(block); |
| filter_ = GET_PARAM(3); |
| subpel_ = GET_PARAM(4); |
| avg_ = GET_PARAM(5); |
| bit_depth_ = GET_PARAM(6); |
| |
| alloc_ = new uint16_t[maxBlockSize * 4]; |
| src_ = alloc_ + (vertiOffset * maxWidth); |
| src_ += horizOffset; |
| src_ref_ = src_ + maxBlockSize; |
| |
| dst_ = alloc_ + 2 * maxBlockSize; |
| dst_ref_ = alloc_ + 3 * maxBlockSize; |
| } |
| |
| virtual void TearDown() { |
| delete[] alloc_; |
| libaom_test::ClearSystemState(); |
| } |
| |
| protected: |
| void RunHorizFilterBitExactCheck(); |
| void RunVertFilterBitExactCheck(); |
| |
| private: |
| void PrepFilterBuffer(); |
| void DiffFilterBuffer(); |
| hbd_conv_filter_t conv_horiz_; |
| hbd_conv_filter_t conv_vert_; |
| uint16_t *alloc_; |
| uint16_t *src_; |
| uint16_t *dst_; |
| uint16_t *src_ref_; |
| uint16_t *dst_ref_; |
| int width_; |
| int height_; |
| int filter_; |
| int subpel_; |
| int avg_; |
| int bit_depth_; |
| }; |
| |
| void AV1HbdConvolveOptimzTest::PrepFilterBuffer() { |
| int r, c; |
| ACMRandom rnd(ACMRandom::DeterministicSeed()); |
| |
| memset(alloc_, 0, 4 * maxBlockSize * sizeof(alloc_[0])); |
| |
| uint16_t *src_ptr = src_; |
| uint16_t *dst_ptr = dst_; |
| uint16_t *dst_ref_ptr = dst_ref_; |
| uint16_t hbd_mask = (1 << bit_depth_) - 1; |
| |
| for (r = 0; r < height_; ++r) { |
| for (c = 0; c < width_; ++c) { |
| src_ptr[c] = rnd.Rand16() & hbd_mask; |
| dst_ptr[c] = rnd.Rand16() & hbd_mask; |
| dst_ref_ptr[c] = dst_ptr[c]; |
| } |
| src_ptr += stride; |
| dst_ptr += stride; |
| dst_ref_ptr += stride; |
| } |
| } |
| |
| void AV1HbdConvolveOptimzTest::DiffFilterBuffer() { |
| int r, c; |
| const uint16_t *dst_ptr = dst_; |
| const uint16_t *dst_ref_ptr = dst_ref_; |
| for (r = 0; r < height_; ++r) { |
| for (c = 0; c < width_; ++c) { |
| EXPECT_EQ((uint16_t)dst_ref_ptr[c], (uint16_t)dst_ptr[c]) |
| << "Error at row: " << r << " col: " << c << " " |
| << "w = " << width_ << " " |
| << "h = " << height_ << " " |
| << "filter group index = " << filter_ << " " |
| << "filter index = " << subpel_ << " " |
| << "bit depth = " << bit_depth_; |
| } |
| dst_ptr += stride; |
| dst_ref_ptr += stride; |
| } |
| } |
| |
| void AV1HbdConvolveOptimzTest::RunHorizFilterBitExactCheck() { |
| PrepFilterBuffer(); |
| |
| InterpFilterParams filter_params = av1_get_interp_filter_params(filter_); |
| |
| av1_highbd_convolve_horiz_c(src_, stride, dst_ref_, stride, width_, height_, |
| filter_params, subpel_, x_step_q4, avg_, |
| bit_depth_); |
| |
| conv_horiz_(src_, stride, dst_, stride, width_, height_, filter_params, |
| subpel_, x_step_q4, avg_, bit_depth_); |
| |
| DiffFilterBuffer(); |
| |
| // Note: |
| // Here we need calculate a height which is different from the specified one |
| // and test again. |
| int intermediate_height = |
| (((height_ - 1) * 16 + subpel_) >> SUBPEL_BITS) + filter_params.taps; |
| PrepFilterBuffer(); |
| |
| av1_highbd_convolve_horiz_c(src_, stride, dst_ref_, stride, width_, |
| intermediate_height, filter_params, subpel_, |
| x_step_q4, avg_, bit_depth_); |
| |
| conv_horiz_(src_, stride, dst_, stride, width_, intermediate_height, |
| filter_params, subpel_, x_step_q4, avg_, bit_depth_); |
| |
| DiffFilterBuffer(); |
| } |
| |
| void AV1HbdConvolveOptimzTest::RunVertFilterBitExactCheck() { |
| PrepFilterBuffer(); |
| |
| InterpFilterParams filter_params = av1_get_interp_filter_params(filter_); |
| |
| av1_highbd_convolve_vert_c(src_, stride, dst_ref_, stride, width_, height_, |
| filter_params, subpel_, x_step_q4, avg_, |
| bit_depth_); |
| |
| conv_vert_(src_, stride, dst_, stride, width_, height_, filter_params, |
| subpel_, x_step_q4, avg_, bit_depth_); |
| |
| DiffFilterBuffer(); |
| } |
| |
| TEST_P(AV1HbdConvolveOptimzTest, HorizBitExactCheck) { |
| RunHorizFilterBitExactCheck(); |
| } |
| TEST_P(AV1HbdConvolveOptimzTest, VertBitExactCheck) { |
| RunVertFilterBitExactCheck(); |
| } |
| |
| #if HAVE_SSE4_1 && CONFIG_DUAL_FILTER |
| |
| const int kBitdepth[] = { 10, 12 }; |
| |
| INSTANTIATE_TEST_CASE_P( |
| SSE4_1, AV1HbdConvolveOptimzTest, |
| ::testing::Combine(::testing::Values(av1_highbd_convolve_horiz_sse4_1), |
| ::testing::Values(av1_highbd_convolve_vert_sse4_1), |
| ::testing::ValuesIn(kBlockDim), |
| ::testing::ValuesIn(kFilter), |
| ::testing::ValuesIn(kSubpelQ4), |
| ::testing::ValuesIn(kAvg), |
| ::testing::ValuesIn(kBitdepth))); |
| #endif // HAVE_SSE4_1 && CONFIG_DUAL_FILTER |
| #endif // CONFIG_AOM_HIGHBITDEPTH |
| } // namespace |