Adds masked variance and sad functions for wedge
Adds the masked variance and SAD functions needed for the
wedge prediction modes to come.
Change-Id: I25b231bbc345e6a494316abb0a7d5cd5586a3a54
diff --git a/test/masked_sad_test.cc b/test/masked_sad_test.cc
new file mode 100644
index 0000000..c09104c
--- /dev/null
+++ b/test/masked_sad_test.cc
@@ -0,0 +1,209 @@
+/*
+ * Copyright (c) 2015 The WebM project authors. All Rights Reserved.
+ *
+ * Use of this source code is governed by a BSD-style license
+ * that can be found in the LICENSE file in the root of the source
+ * tree. An additional intellectual property rights grant can be found
+ * in the file PATENTS. All contributing project authors may
+ * be found in the AUTHORS file in the root of the source tree.
+ */
+
+#include <math.h>
+#include <stdlib.h>
+#include <string.h>
+
+#include "third_party/googletest/src/include/gtest/gtest.h"
+#include "test/acm_random.h"
+#include "test/clear_system_state.h"
+#include "test/register_state_check.h"
+#include "test/util.h"
+
+#include "./vpx_config.h"
+#include "./vpx_dsp_rtcd.h"
+#include "vpx/vpx_integer.h"
+
+using libvpx_test::ACMRandom;
+
+namespace {
+const int number_of_iterations = 500;  // random trials per OperationCheck
+
+typedef unsigned int (*MaskedSADFunc)(const uint8_t *a, int a_stride,
+ const uint8_t *b, int b_stride,
+ const uint8_t *m, int m_stride);  // tests pass the mask as m
+typedef std::tr1::tuple<MaskedSADFunc, MaskedSADFunc> MaskedSADParam;
+
+class MaskedSADTest : public ::testing::TestWithParam<MaskedSADParam> {
+ public:
+ virtual ~MaskedSADTest() {}
+ virtual void SetUp() {
+ maskedSAD_op_ = GET_PARAM(0);  // first tuple entry: function being checked
+ ref_maskedSAD_op_ = GET_PARAM(1);  // second tuple entry: reference function
+ }
+
+ virtual void TearDown() { libvpx_test::ClearSystemState(); }
+
+ protected:
+ MaskedSADFunc maskedSAD_op_;  // result is compared against the reference
+ MaskedSADFunc ref_maskedSAD_op_;
+};
+
+// Compares both kernels on random 4096-byte buffers (stride 64) per trial.
+TEST_P(MaskedSADTest, OperationCheck) {
+  unsigned int ref_ret, ret;
+  ACMRandom rnd(ACMRandom::DeterministicSeed());
+  DECLARE_ALIGNED(16, uint8_t, src_ptr[4096]);
+  DECLARE_ALIGNED(16, uint8_t, ref_ptr[4096]);
+  DECLARE_ALIGNED(16, uint8_t, msk_ptr[4096]);
+  int err_count = 0;
+  int first_failure = -1;  // index of the first mismatching trial, if any
+  int src_stride = 64;
+  int ref_stride = 64;
+  int msk_stride = 64;
+  for (int i = 0; i < number_of_iterations; ++i) {
+    for (int j = 0; j < 4096; j++) {
+      src_ptr[j] = rnd.Rand8();
+      ref_ptr[j] = rnd.Rand8();
+      // Mask is either 64 or a random 6-bit value, so it never exceeds 64.
+      msk_ptr[j] = ((rnd.Rand8()&0x7f) > 64) ? rnd.Rand8()&0x3f : 64;
+      ASSERT_LE(msk_ptr[j], 64);  // gtest check, also active with NDEBUG
+    }
+
+    ref_ret = ref_maskedSAD_op_(src_ptr, src_stride, ref_ptr, ref_stride,
+                                msk_ptr, msk_stride);
+    ASM_REGISTER_STATE_CHECK(ret = maskedSAD_op_(
+        src_ptr, src_stride, ref_ptr, ref_stride, msk_ptr, msk_stride));
+    if (ret != ref_ret) {
+      err_count++;
+      if (first_failure == -1) first_failure = i;
+    }
+  }
+  EXPECT_EQ(0, err_count)
+      << "Error: Masked SAD Test, C output doesn't match SSSE3 output. "
+      << "First failed at test case " << first_failure;
+}
+
+#if CONFIG_VP9_HIGHBITDEPTH
+typedef unsigned int (*HighbdMaskedSADFunc)(const uint8_t *a, int a_stride,
+ const uint8_t *b, int b_stride,
+ const uint8_t *m, int m_stride);  // tests pass the mask as m
+typedef std::tr1::tuple<HighbdMaskedSADFunc, HighbdMaskedSADFunc>
+ HighbdMaskedSADParam;
+
+class HighbdMaskedSADTest : public ::testing::
+ TestWithParam<HighbdMaskedSADParam> {
+ public:
+ virtual ~HighbdMaskedSADTest() {}
+ virtual void SetUp() {
+ maskedSAD_op_ = GET_PARAM(0);  // first tuple entry: function being checked
+ ref_maskedSAD_op_ = GET_PARAM(1);  // second tuple entry: reference function
+ }
+
+ virtual void TearDown() { libvpx_test::ClearSystemState(); }
+
+ protected:
+ HighbdMaskedSADFunc maskedSAD_op_;  // result is compared against the reference
+ HighbdMaskedSADFunc ref_maskedSAD_op_;
+};
+
+TEST_P(HighbdMaskedSADTest, OperationCheck) {
+ unsigned int ref_ret, ret;
+ ACMRandom rnd(ACMRandom::DeterministicSeed());
+ DECLARE_ALIGNED(16, uint16_t, src_ptr[4096]);
+ DECLARE_ALIGNED(16, uint16_t, ref_ptr[4096]);
+ DECLARE_ALIGNED(16, uint8_t, msk_ptr[4096]);
+ uint8_t* src8_ptr = CONVERT_TO_BYTEPTR(src_ptr);  // kernels take uint8_t*
+ uint8_t* ref8_ptr = CONVERT_TO_BYTEPTR(ref_ptr);
+ int err_count = 0;
+ int first_failure = -1;  // index of the first mismatching trial, if any
+ int src_stride = 64;
+ int ref_stride = 64;
+ int msk_stride = 64;
+ for (int i = 0; i < number_of_iterations; ++i) {
+ for (int j = 0; j < 4096; j++) {
+ src_ptr[j] = rnd.Rand16()&0xfff;  // keep only the low 12 bits
+ ref_ptr[j] = rnd.Rand16()&0xfff;
+ msk_ptr[j] = ((rnd.Rand8()&0x7f) > 64) ? rnd.Rand8()&0x3f : 64;  // 0..64
+ }
+
+ ref_ret = ref_maskedSAD_op_(src8_ptr, src_stride, ref8_ptr, ref_stride,
+ msk_ptr, msk_stride);
+ ASM_REGISTER_STATE_CHECK(ret = maskedSAD_op_(src8_ptr, src_stride,
+ ref8_ptr, ref_stride,
+ msk_ptr, msk_stride));
+ if (ret != ref_ret) {  // tally mismatches; reported once after the loop
+ err_count++;
+ if (first_failure == -1)
+ first_failure = i;
+ }
+ }
+ EXPECT_EQ(0, err_count)
+ << "Error: High BD Masked SAD Test, C output doesn't match SSSE3 output. "
+ << "First failed at test case " << first_failure;
+}
+#endif // CONFIG_VP9_HIGHBITDEPTH
+
+using std::tr1::make_tuple;
+
+#if HAVE_SSSE3
+INSTANTIATE_TEST_CASE_P(
+ SSSE3_C_COMPARE, MaskedSADTest,  // each tuple: (_ssse3 function, _c function)
+ ::testing::Values(
+ make_tuple(&vpx_masked_sad64x64_ssse3,
+ &vpx_masked_sad64x64_c),
+ make_tuple(&vpx_masked_sad64x32_ssse3,
+ &vpx_masked_sad64x32_c),
+ make_tuple(&vpx_masked_sad32x64_ssse3,
+ &vpx_masked_sad32x64_c),
+ make_tuple(&vpx_masked_sad32x32_ssse3,
+ &vpx_masked_sad32x32_c),
+ make_tuple(&vpx_masked_sad32x16_ssse3,
+ &vpx_masked_sad32x16_c),
+ make_tuple(&vpx_masked_sad16x32_ssse3,
+ &vpx_masked_sad16x32_c),
+ make_tuple(&vpx_masked_sad16x16_ssse3,
+ &vpx_masked_sad16x16_c),
+ make_tuple(&vpx_masked_sad16x8_ssse3,
+ &vpx_masked_sad16x8_c),
+ make_tuple(&vpx_masked_sad8x16_ssse3,
+ &vpx_masked_sad8x16_c),
+ make_tuple(&vpx_masked_sad8x8_ssse3,
+ &vpx_masked_sad8x8_c),
+ make_tuple(&vpx_masked_sad8x4_ssse3,
+ &vpx_masked_sad8x4_c),
+ make_tuple(&vpx_masked_sad4x8_ssse3,
+ &vpx_masked_sad4x8_c),
+ make_tuple(&vpx_masked_sad4x4_ssse3,
+ &vpx_masked_sad4x4_c)));
+#if CONFIG_VP9_HIGHBITDEPTH
+INSTANTIATE_TEST_CASE_P(
+ SSSE3_C_COMPARE, HighbdMaskedSADTest,  // each tuple: (_ssse3 fn, _c fn)
+ ::testing::Values(  // NOTE(review): vp9_ prefix here vs vpx_ in the 8-bit list; confirm
+ make_tuple(&vp9_highbd_masked_sad64x64_ssse3,
+ &vp9_highbd_masked_sad64x64_c),
+ make_tuple(&vp9_highbd_masked_sad64x32_ssse3,
+ &vp9_highbd_masked_sad64x32_c),
+ make_tuple(&vp9_highbd_masked_sad32x64_ssse3,
+ &vp9_highbd_masked_sad32x64_c),
+ make_tuple(&vp9_highbd_masked_sad32x32_ssse3,
+ &vp9_highbd_masked_sad32x32_c),
+ make_tuple(&vp9_highbd_masked_sad32x16_ssse3,
+ &vp9_highbd_masked_sad32x16_c),
+ make_tuple(&vp9_highbd_masked_sad16x32_ssse3,
+ &vp9_highbd_masked_sad16x32_c),
+ make_tuple(&vp9_highbd_masked_sad16x16_ssse3,
+ &vp9_highbd_masked_sad16x16_c),
+ make_tuple(&vp9_highbd_masked_sad16x8_ssse3,
+ &vp9_highbd_masked_sad16x8_c),
+ make_tuple(&vp9_highbd_masked_sad8x16_ssse3,
+ &vp9_highbd_masked_sad8x16_c),
+ make_tuple(&vp9_highbd_masked_sad8x8_ssse3,
+ &vp9_highbd_masked_sad8x8_c),
+ make_tuple(&vp9_highbd_masked_sad8x4_ssse3,
+ &vp9_highbd_masked_sad8x4_c),
+ make_tuple(&vp9_highbd_masked_sad4x8_ssse3,
+ &vp9_highbd_masked_sad4x8_c),
+ make_tuple(&vp9_highbd_masked_sad4x4_ssse3,
+ &vp9_highbd_masked_sad4x4_c)));
+#endif // CONFIG_VP9_HIGHBITDEPTH
+#endif // HAVE_SSSE3
+} // namespace