test/variance_test.cc - aom - Git at Google

 /*
  * Copyright (c) 2016, Alliance for Open Media. All rights reserved
  *
  * This source code is subject to the terms of the BSD 2 Clause License and
  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
  * was not distributed with this source code in the LICENSE file, you can
  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
  * Media Patent License 1.0 was not distributed with this source code in the
  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */

 #include <cstdlib>
 #include <new>

 #include "third_party/googletest/src/include/gtest/gtest.h"

 #include "./aom_config.h"
 #include "./aom_dsp_rtcd.h"
 #include "test/acm_random.h"
 #include "test/clear_system_state.h"
 #include "test/register_state_check.h"
 #include "aom/aom_codec.h"
 #include "aom/aom_integer.h"
 #include "aom_mem/aom_mem.h"
 #include "aom_ports/mem.h"

 namespace {

 // Block variance kernel: two 8-bit-typed sample pointers with their strides.
 // The tests in this file compare both the returned value and the value
 // written through |sse| against variance_ref().
 typedef unsigned int (*VarianceMxNFunc)(const uint8_t *a, int a_stride,
                                         const uint8_t *b, int b_stride,
                                         unsigned int *sse);
 // Sub-pixel variance kernel: like VarianceMxNFunc, with an additional
 // (xoffset, yoffset) pair applied to |a|. The tests pass offsets in [0, 7].
 typedef unsigned int (*SubpixVarMxNFunc)(const uint8_t *a, int a_stride,
                                          int xoffset, int yoffset,
                                          const uint8_t *b, int b_stride,
                                          unsigned int *sse);
 // Sub-pixel variance kernel that additionally takes a |second_pred| block;
 // the reference model averages it with the interpolated prediction.
 typedef unsigned int (*SubpixAvgVarMxNFunc)(const uint8_t *a, int a_stride,
                                             int xoffset, int yoffset,
                                             const uint8_t *b, int b_stride,
                                             uint32_t *sse,
                                             const uint8_t *second_pred);
 // Kernel whose return value the tests compare directly against the reference
 // sum of squared errors (no |sse| out-parameter).
 typedef unsigned int (*Get4x4SseFunc)(const uint8_t *a, int a_stride,
                                       const uint8_t *b, int b_stride);
 // Sum-of-squares kernel; the tests always hand it a 256-element buffer.
 typedef unsigned int (*SumOfSquaresFunction)(const int16_t *src);

 using ::std::tr1::get;
 using ::std::tr1::make_tuple;
 using ::std::tr1::tuple;
 using libaom_test::ACMRandom;

 // Scales high bit depth accumulators back to the 8-bit range, rounding to
 // nearest before the shift:
 //   *sse is shifted right by 2 * (bit_depth - 8),
 //   *se  is shifted right by (bit_depth - 8).
 // Only AOM_BITS_12 and AOM_BITS_10 are adjusted; every other depth
 // (including AOM_BITS_8) leaves both values untouched.
 static void RoundHighBitDepth(int bit_depth, int64_t *se, uint64_t *sse) {
   if (bit_depth == AOM_BITS_12) {
     *sse = (*sse + 128) >> 8;
     *se = (*se + 8) >> 4;
   } else if (bit_depth == AOM_BITS_10) {
     *sse = (*sse + 8) >> 4;
     *se = (*se + 2) >> 2;
   }
 }

 // Reference sum of squares over the 256 consecutive int16_t values starting
 // at |src|. Each square is formed in int and accumulated into an unsigned
 // total.
 static unsigned int mb_ss_ref(const int16_t *src) {
   unsigned int total = 0;
   const int16_t *const end = src + 256;
   for (const int16_t *p = src; p != end; ++p) {
     const int value = *p;
     total += value * value;
   }
   return total;
 }

 // Reference variance of a (1 << l2w) x (1 << l2h) block.
 //
 // Each row of |src| / |ref| starts at width * row * <stride coefficient>, so a
 // coefficient of 1 means densely packed rows and 0 means every row aliases
 // the first one. The sum of squared differences (after high bit depth
 // rounding) is stored in |*sse_ptr|; the return value is that sum minus
 // (sum of differences)^2 / (number of samples).
 //
 // When |use_high_bit_depth_| is set the pointers are reinterpreted through
 // CONVERT_TO_SHORTPTR; that path only exists if CONFIG_AOM_HIGHBITDEPTH is
 // enabled, otherwise no samples are accumulated.
 static uint32_t variance_ref(const uint8_t *src, const uint8_t *ref, int l2w,
                              int l2h, int src_stride_coeff,
                              int ref_stride_coeff, uint32_t *sse_ptr,
                              bool use_high_bit_depth_,
                              aom_bit_depth_t bit_depth) {
   const int width = 1 << l2w;
   const int height = 1 << l2h;
   int64_t sum = 0;
   uint64_t sum_sq = 0;
   for (int row = 0; row < height; ++row) {
     // Offsets of the first sample of this row in each buffer.
     const int src_row = width * row * src_stride_coeff;
     const int ref_row = width * row * ref_stride_coeff;
     for (int col = 0; col < width; ++col) {
       if (!use_high_bit_depth_) {
         const int delta = ref[ref_row + col] - src[src_row + col];
         sum += delta;
         sum_sq += delta * delta;
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         const int delta = CONVERT_TO_SHORTPTR(ref)[ref_row + col] -
                           CONVERT_TO_SHORTPTR(src)[src_row + col];
         sum += delta;
         sum_sq += delta * delta;
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
     }
   }
   RoundHighBitDepth(bit_depth, &sum, &sum_sq);
   *sse_ptr = static_cast<uint32_t>(sum_sq);
   const int64_t mean_term = (sum * sum) >> (l2w + l2h);
   return static_cast<uint32_t>(sum_sq - mean_term);
 }

 /* Reference sub-pixel variance of a (1 << l2w) x (1 << l2h) block.
  *
  * Unlike the codec, which looks the bilinear factors up in a table, this
  * model computes them directly. To do so it doubles xoff and yoff, so the
  * interpolation below works in sixteenths (note the "+ 8 >> 4" rounding);
  * only every other sixteenth step is therefore ever exercised.
  *
  * |ref| is read with a row pitch of width + 1 and needs one extra row, since
  * each output sample blends a 2x2 neighbourhood. |src| is densely packed.
  * The (rounded) sum of squared differences is written to |*sse_ptr|.
  */
 static uint32_t subpel_variance_ref(const uint8_t *ref, const uint8_t *src,
                                     int l2w, int l2h, int xoff, int yoff,
                                     uint32_t *sse_ptr, bool use_high_bit_depth_,
                                     aom_bit_depth_t bit_depth) {
   const int width = 1 << l2w;
   const int height = 1 << l2h;
   const int ref_pitch = width + 1;
   // Doubled offsets act as the bilinear weights out of 16.
   const int wx = xoff << 1;
   const int wy = yoff << 1;
   int64_t sum = 0;
   uint64_t sum_sq = 0;

   for (int row = 0; row < height; ++row) {
     const int top = ref_pitch * row;
     const int bottom = ref_pitch * (row + 1);
     const int src_row = width * row;
     for (int col = 0; col < width; ++col) {
       if (!use_high_bit_depth_) {
         const int tl = ref[top + col];
         const int tr = ref[top + col + 1];
         const int bl = ref[bottom + col];
         const int br = ref[bottom + col + 1];
         // Horizontal blend of each row, then vertical blend of the results.
         const int upper = tl + (((tr - tl) * wx + 8) >> 4);
         const int lower = bl + (((br - bl) * wx + 8) >> 4);
         const int pred = upper + (((lower - upper) * wy + 8) >> 4);
         const int delta = pred - src[src_row + col];
         sum += delta;
         sum_sq += delta * delta;
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         uint16_t *ref16 = CONVERT_TO_SHORTPTR(ref);
         uint16_t *src16 = CONVERT_TO_SHORTPTR(src);
         const int tl = ref16[top + col];
         const int tr = ref16[top + col + 1];
         const int bl = ref16[bottom + col];
         const int br = ref16[bottom + col + 1];
         const int upper = tl + (((tr - tl) * wx + 8) >> 4);
         const int lower = bl + (((br - bl) * wx + 8) >> 4);
         const int pred = upper + (((lower - upper) * wy + 8) >> 4);
         const int delta = pred - src16[src_row + col];
         sum += delta;
         sum_sq += delta * delta;
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
     }
   }
   RoundHighBitDepth(bit_depth, &sum, &sum_sq);
   *sse_ptr = static_cast<uint32_t>(sum_sq);
   const int64_t mean_term = (sum * sum) >> (l2w + l2h);
   return static_cast<uint32_t>(sum_sq - mean_term);
 }

 // Value-parameterized fixture for sum-of-squares kernels; the test parameter
 // is the function under test.
 class SumOfSquaresTest : public ::testing::TestWithParam<SumOfSquaresFunction> {
  public:
   // Captures the function pointer supplied as the test parameter.
   SumOfSquaresTest() : func_(GetParam()) {}

   virtual ~SumOfSquaresTest() { libaom_test::ClearSystemState(); }

  protected:
   // Checks the kernel on buffers filled with a single constant value.
   void ConstTest();
   // Checks the kernel against mb_ss_ref() on random buffers.
   void RefTest();

   SumOfSquaresFunction func_;  // function under test
   ACMRandom rnd_;              // random source used by RefTest()
 };

 // For every constant v in [0, 255], a 256-element buffer filled with v must
 // yield a sum of squares of exactly 256 * v * v.
 void SumOfSquaresTest::ConstTest() {
   int16_t mem[256];
   int16_t *const mem_end = mem + 256;
   for (int v = 0; v < 256; ++v) {
     for (int16_t *p = mem; p != mem_end; ++p) {
       *p = static_cast<int16_t>(v);
     }
     unsigned int res;
     ASM_REGISTER_STATE_CHECK(res = func_(mem));
     EXPECT_EQ(256u * (v * v), res);
   }
 }

 // Runs 100 rounds: fills a 256-element buffer with the difference of two
 // Rand8() draws per entry and checks the function under test against
 // mb_ss_ref() on the same data.
 void SumOfSquaresTest::RefTest() {
   int16_t mem[256];
   for (int i = 0; i < 100; ++i) {
     for (int j = 0; j < 256; ++j) {
       // Signed sample; presumably within [-255, 255] if Rand8() yields an
       // 8-bit value -- confirm against ACMRandom.
       mem[j] = rnd_.Rand8() - rnd_.Rand8();
     }

     const unsigned int expected = mb_ss_ref(mem);
     unsigned int res;
     ASM_REGISTER_STATE_CHECK(res = func_(mem));
     EXPECT_EQ(expected, res);
   }
 }

 // Fixture for block variance kernels.
 //
 // Parameter tuple: (log2 width, log2 height, function under test, bit depth).
 // A bit depth of 0 selects the plain 8-bit path; any non-zero value is used
 // as the aom_bit_depth_t and switches the fixture to 16-bit sample buffers
 // that are passed around as uint8_t* via CONVERT_TO_BYTEPTR.
 template <typename VarianceFunctionType>
 class VarianceTest : public ::testing::TestWithParam<
                          tuple<int, int, VarianceFunctionType, int> > {
  public:
   // Unpacks the parameters, reseeds the random source and allocates the two
   // sample buffers (each twice the block size).
   virtual void SetUp() {
     const tuple<int, int, VarianceFunctionType, int> &params = this->GetParam();
     log2width_ = get<0>(params);
     width_ = 1 << log2width_;
     log2height_ = get<1>(params);
     height_ = 1 << log2height_;
     variance_ = get<2>(params);
     if (get<3>(params)) {
       bit_depth_ = static_cast<aom_bit_depth_t>(get<3>(params));
       use_high_bit_depth_ = true;
     } else {
       bit_depth_ = AOM_BITS_8;
       use_high_bit_depth_ = false;
     }
     // All-ones mask covering the low bit_depth_ bits of a sample.
     mask_ = (1 << bit_depth_) - 1;

     rnd_.Reset(ACMRandom::DeterministicSeed());
     block_size_ = width_ * height_;
     if (!use_high_bit_depth_) {
       // src_ comes from aom_memalign (16-byte aligned); ref_ from new[].
       src_ = reinterpret_cast<uint8_t *>(aom_memalign(16, block_size_ * 2));
       ref_ = new uint8_t[block_size_ * 2];
 #if CONFIG_AOM_HIGHBITDEPTH
     } else {
       src_ = CONVERT_TO_BYTEPTR(reinterpret_cast<uint16_t *>(
           aom_memalign(16, block_size_ * 2 * sizeof(uint16_t))));
       ref_ = CONVERT_TO_BYTEPTR(new uint16_t[block_size_ * 2]);
 #endif  // CONFIG_AOM_HIGHBITDEPTH
     }
     ASSERT_TRUE(src_ != NULL);
     ASSERT_TRUE(ref_ != NULL);
   }

   // Releases each buffer with the deallocator matching its allocation in
   // SetUp(), converting back to the 16-bit pointer first where needed.
   virtual void TearDown() {
     if (!use_high_bit_depth_) {
       aom_free(src_);
       delete[] ref_;
 #if CONFIG_AOM_HIGHBITDEPTH
     } else {
       aom_free(CONVERT_TO_SHORTPTR(src_));
       delete[] CONVERT_TO_SHORTPTR(ref_);
 #endif  // CONFIG_AOM_HIGHBITDEPTH
     }
     libaom_test::ClearSystemState();
   }

  protected:
   void ZeroTest();
   void RefTest();
   void RefStrideTest();
   void OneQuarterTest();

   ACMRandom rnd_;
   uint8_t *src_;  // aligned source block (possibly a disguised uint16_t*)
   uint8_t *ref_;  // reference block (possibly a disguised uint16_t*)
   int width_, log2width_;
   int height_, log2height_;
   aom_bit_depth_t bit_depth_;
   int mask_;  // (1 << bit_depth_) - 1
   bool use_high_bit_depth_;
   int block_size_;  // width_ * height_, in samples
   VarianceFunctionType variance_;  // function under test
 };

 // Fills src with one constant and ref with another, for every pair of values
 // in [0, 255] x [0, 255] (scaled up to the bit depth on the high bit depth
 // path). The difference is then the same at every sample, so the variance
 // must be zero.
 template <typename VarianceFunctionType>
 void VarianceTest<VarianceFunctionType>::ZeroTest() {
   for (int i = 0; i <= 255; ++i) {
     if (!use_high_bit_depth_) {
       memset(src_, i, block_size_);
 #if CONFIG_AOM_HIGHBITDEPTH
     } else {
       aom_memset16(CONVERT_TO_SHORTPTR(src_), i << (bit_depth_ - 8),
                    block_size_);
 #endif  // CONFIG_AOM_HIGHBITDEPTH
     }
     for (int j = 0; j <= 255; ++j) {
       if (!use_high_bit_depth_) {
         memset(ref_, j, block_size_);
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         aom_memset16(CONVERT_TO_SHORTPTR(ref_), j << (bit_depth_ - 8),
                      block_size_);
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
       // sse is required by the kernel signature but not checked here.
       unsigned int sse;
       unsigned int var;
       ASM_REGISTER_STATE_CHECK(var =
                                    variance_(src_, width_, ref_, width_, &sse));
       EXPECT_EQ(0u, var) << "src values: " << i << " ref values: " << j;
     }
   }
 }

 // Compares the function under test against variance_ref() on ten blocks of
 // random samples. Both buffers are densely packed (stride == block width),
 // and both the returned variance and the reported sse must match.
 template <typename VarianceFunctionType>
 void VarianceTest<VarianceFunctionType>::RefTest() {
   for (int i = 0; i < 10; ++i) {
     for (int j = 0; j < block_size_; j++) {
       if (!use_high_bit_depth_) {
         src_[j] = rnd_.Rand8();
         ref_[j] = rnd_.Rand8();
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         // Bitwise AND keeps the low bit_depth_ bits of the random value. A
         // logical && would collapse every sample to 0 or 1 and leave the
         // high bit depth kernels almost untested.
         CONVERT_TO_SHORTPTR(src_)[j] = rnd_.Rand16() & mask_;
         CONVERT_TO_SHORTPTR(ref_)[j] = rnd_.Rand16() & mask_;
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
     }
     unsigned int sse1, sse2;
     unsigned int var1;
     const int stride_coeff = 1;  // rows are contiguous in both buffers
     ASM_REGISTER_STATE_CHECK(var1 =
                                  variance_(src_, width_, ref_, width_, &sse1));
     const unsigned int var2 =
         variance_ref(src_, ref_, log2width_, log2height_, stride_coeff,
                      stride_coeff, &sse2, use_high_bit_depth_, bit_depth_);
     EXPECT_EQ(sse1, sse2);
     EXPECT_EQ(var1, var2);
   }
 }

 // Like RefTest(), but also exercises a stride of zero. Across the ten rounds
 // each buffer's stride coefficient alternates between 0 and 1 (ref on bit 0
 // of the round number, src on bit 1). A coefficient of 0 makes every row
 // alias the first one.
 template <typename VarianceFunctionType>
 void VarianceTest<VarianceFunctionType>::RefStrideTest() {
   for (int i = 0; i < 10; ++i) {
     int ref_stride_coeff = i % 2;
     int src_stride_coeff = (i >> 1) % 2;
     for (int j = 0; j < block_size_; j++) {
       // Map the linear sample index onto (row, column) using the stride
       // actually handed to the kernel below.
       int ref_ind = (j / width_) * ref_stride_coeff * width_ + j % width_;
       int src_ind = (j / width_) * src_stride_coeff * width_ + j % width_;
       if (!use_high_bit_depth_) {
         src_[src_ind] = rnd_.Rand8();
         ref_[ref_ind] = rnd_.Rand8();
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         // Bitwise AND keeps the low bit_depth_ bits of the random value. A
         // logical && would collapse every sample to 0 or 1.
         CONVERT_TO_SHORTPTR(src_)[src_ind] = rnd_.Rand16() & mask_;
         CONVERT_TO_SHORTPTR(ref_)[ref_ind] = rnd_.Rand16() & mask_;
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
     }
     unsigned int sse1, sse2;
     unsigned int var1;

     ASM_REGISTER_STATE_CHECK(var1 = variance_(src_, width_ * src_stride_coeff,
                                               ref_, width_ * ref_stride_coeff,
                                               &sse1));
     const unsigned int var2 =
         variance_ref(src_, ref_, log2width_, log2height_, src_stride_coeff,
                      ref_stride_coeff, &sse2, use_high_bit_depth_, bit_depth_);
     EXPECT_EQ(sse1, sse2);
     EXPECT_EQ(var1, var2);
   }
 }

 // src is all 255 (scaled to the bit depth); ref is 255 in its first half and
 // 0 in its second half. With N = block_size_ the differences are 0 for N/2
 // samples and 255 in magnitude for the other N/2, so
 //   sse = N/2 * 255^2,  se^2 / N = N/4 * 255^2,
 // and the expected variance is N * 255^2 / 4.
 template <typename VarianceFunctionType>
 void VarianceTest<VarianceFunctionType>::OneQuarterTest() {
   const int half = block_size_ / 2;
   if (!use_high_bit_depth_) {
     memset(src_, 255, block_size_);
     memset(ref_, 255, half);
     memset(ref_ + half, 0, half);
 #if CONFIG_AOM_HIGHBITDEPTH
   } else {
     aom_memset16(CONVERT_TO_SHORTPTR(src_), 255 << (bit_depth_ - 8),
                  block_size_);
     aom_memset16(CONVERT_TO_SHORTPTR(ref_), 255 << (bit_depth_ - 8), half);
     aom_memset16(CONVERT_TO_SHORTPTR(ref_) + half, 0, half);
 #endif  // CONFIG_AOM_HIGHBITDEPTH
   }
   // sse is required by the kernel signature but not checked here.
   unsigned int sse;
   unsigned int var;
   ASM_REGISTER_STATE_CHECK(var = variance_(src_, width_, ref_, width_, &sse));
   const unsigned int expected = block_size_ * 255 * 255 / 4;
   EXPECT_EQ(expected, var);
 }

 // Fixture for MSE / SSE kernels operating on 8-bit blocks.
 //
 // Parameter tuple: (log2 width, log2 height, function under test).
 template <typename MseFunctionType>
 class MseTest
     : public ::testing::TestWithParam<tuple<int, int, MseFunctionType> > {
  public:
   // Unpacks the parameters, reseeds the random source and allocates one
   // block-sized buffer each for src and ref.
   virtual void SetUp() {
     const tuple<int, int, MseFunctionType> &params = this->GetParam();
     log2width_ = get<0>(params);
     width_ = 1 << log2width_;
     log2height_ = get<1>(params);
     height_ = 1 << log2height_;
     mse_ = get<2>(params);

     // Reseed explicitly, as the other fixtures in this file do. Writing
     // rnd(seed) instead invokes the object's call operator and does not
     // reset the generator.
     rnd.Reset(ACMRandom::DeterministicSeed());
     block_size_ = width_ * height_;
     // src_ comes from aom_memalign (16-byte aligned); ref_ from new[].
     src_ = reinterpret_cast<uint8_t *>(aom_memalign(16, block_size_));
     ref_ = new uint8_t[block_size_];
     ASSERT_TRUE(src_ != NULL);
     ASSERT_TRUE(ref_ != NULL);
   }

   // Releases each buffer with the deallocator matching its allocation.
   virtual void TearDown() {
     aom_free(src_);
     delete[] ref_;
     libaom_test::ClearSystemState();
   }

  protected:
   // *_mse variants read the result through the sse out-parameter; *_sse
   // variants use the function's return value.
   void RefTest_mse();
   void RefTest_sse();
   void MaxTest_mse();
   void MaxTest_sse();

   ACMRandom rnd;
   uint8_t *src_;
   uint8_t *ref_;
   int width_, log2width_;
   int height_, log2height_;
   int block_size_;  // width_ * height_, in samples
   MseFunctionType mse_;  // function under test
 };

 // Ten rounds of random 8-bit data: the sse reported by the function under
 // test through its out-parameter must equal the one from variance_ref().
 template <typename MseFunctionType>
 void MseTest<MseFunctionType>::RefTest_mse() {
   const int stride_coeff = 1;  // rows are contiguous in both buffers
   for (int round = 0; round < 10; ++round) {
     for (int idx = 0; idx < block_size_; ++idx) {
       src_[idx] = rnd.Rand8();
       ref_[idx] = rnd.Rand8();
     }
     unsigned int sse1;
     unsigned int sse2;
     ASM_REGISTER_STATE_CHECK(mse_(src_, width_, ref_, width_, &sse1));
     variance_ref(src_, ref_, log2width_, log2height_, stride_coeff,
                  stride_coeff, &sse2, false, AOM_BITS_8);
     EXPECT_EQ(sse1, sse2);
   }
 }

 // Ten rounds of random 8-bit data: the value returned by the function under
 // test must equal the sse computed by variance_ref().
 template <typename MseFunctionType>
 void MseTest<MseFunctionType>::RefTest_sse() {
   const int stride_coeff = 1;  // rows are contiguous in both buffers
   for (int round = 0; round < 10; ++round) {
     for (int idx = 0; idx < block_size_; ++idx) {
       src_[idx] = rnd.Rand8();
       ref_[idx] = rnd.Rand8();
     }
     unsigned int var1;
     unsigned int sse2;
     ASM_REGISTER_STATE_CHECK(var1 = mse_(src_, width_, ref_, width_));
     variance_ref(src_, ref_, log2width_, log2height_, stride_coeff,
                  stride_coeff, &sse2, false, AOM_BITS_8);
     EXPECT_EQ(var1, sse2);
   }
 }

 // Worst case for 8-bit input: every src sample is 255 and every ref sample is
 // 0, so the reported sse must be block_size_ * 255 * 255.
 template <typename MseFunctionType>
 void MseTest<MseFunctionType>::MaxTest_mse() {
   const unsigned int expected = block_size_ * 255 * 255;
   memset(ref_, 0, block_size_);
   memset(src_, 255, block_size_);
   unsigned int sse;
   ASM_REGISTER_STATE_CHECK(mse_(src_, width_, ref_, width_, &sse));
   EXPECT_EQ(expected, sse);
 }

 // Worst case for 8-bit input: every src sample is 255 and every ref sample is
 // 0, so the returned value must be block_size_ * 255 * 255.
 template <typename MseFunctionType>
 void MseTest<MseFunctionType>::MaxTest_sse() {
   const unsigned int expected = block_size_ * 255 * 255;
   memset(ref_, 0, block_size_);
   memset(src_, 255, block_size_);
   unsigned int var;
   ASM_REGISTER_STATE_CHECK(var = mse_(src_, width_, ref_, width_));
   EXPECT_EQ(expected, var);
 }

 // Reference sub-pixel "average" variance of a (1 << l2w) x (1 << l2h) block.
 //
 // The prediction is interpolated bilinearly from |ref| (row pitch width + 1,
 // offsets doubled so the weights are in sixteenths), then averaged with
 // |second_pred| using round-to-nearest before being compared with |src|.
 // |src| and |second_pred| are densely packed. The (rounded) sum of squared
 // differences is written to |*sse_ptr|.
 static uint32_t subpel_avg_variance_ref(const uint8_t *ref, const uint8_t *src,
                                         const uint8_t *second_pred, int l2w,
                                         int l2h, int xoff, int yoff,
                                         uint32_t *sse_ptr,
                                         bool use_high_bit_depth,
                                         aom_bit_depth_t bit_depth) {
   const int width = 1 << l2w;
   const int height = 1 << l2h;
   const int ref_pitch = width + 1;
   // Doubled offsets act as the bilinear weights out of 16.
   const int wx = xoff << 1;
   const int wy = yoff << 1;
   int64_t sum = 0;
   uint64_t sum_sq = 0;

   for (int row = 0; row < height; ++row) {
     const int top = ref_pitch * row;
     const int bottom = ref_pitch * (row + 1);
     const int packed_row = width * row;
     for (int col = 0; col < width; ++col) {
       if (!use_high_bit_depth) {
         const int tl = ref[top + col];
         const int tr = ref[top + col + 1];
         const int bl = ref[bottom + col];
         const int br = ref[bottom + col + 1];
         // Horizontal blend of each row, then vertical blend of the results.
         const int upper = tl + (((tr - tl) * wx + 8) >> 4);
         const int lower = bl + (((br - bl) * wx + 8) >> 4);
         const int pred = upper + (((lower - upper) * wy + 8) >> 4);
         const int averaged = (pred + second_pred[packed_row + col] + 1) >> 1;
         const int delta = averaged - src[packed_row + col];
         sum += delta;
         sum_sq += delta * delta;
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         uint16_t *ref16 = CONVERT_TO_SHORTPTR(ref);
         uint16_t *src16 = CONVERT_TO_SHORTPTR(src);
         uint16_t *sec16 = CONVERT_TO_SHORTPTR(second_pred);
         const int tl = ref16[top + col];
         const int tr = ref16[top + col + 1];
         const int bl = ref16[bottom + col];
         const int br = ref16[bottom + col + 1];
         const int upper = tl + (((tr - tl) * wx + 8) >> 4);
         const int lower = bl + (((br - bl) * wx + 8) >> 4);
         const int pred = upper + (((lower - upper) * wy + 8) >> 4);
         const int averaged = (pred + sec16[packed_row + col] + 1) >> 1;
         const int delta = averaged - src16[packed_row + col];
         sum += delta;
         sum_sq += delta * delta;
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
     }
   }
   RoundHighBitDepth(bit_depth, &sum, &sum_sq);
   *sse_ptr = static_cast<uint32_t>(sum_sq);
   const int64_t mean_term = (sum * sum) >> (l2w + l2h);
   return static_cast<uint32_t>(sum_sq - mean_term);
 }

 // Fixture for sub-pixel variance kernels (with or without a second
 // predictor).
 //
 // Parameter tuple: (log2 width, log2 height, function under test, bit depth).
 // A bit depth of 0 selects the plain 8-bit path; any non-zero value is used
 // as the aom_bit_depth_t and switches the fixture to 16-bit sample buffers
 // that are passed around as uint8_t* via CONVERT_TO_BYTEPTR.
 template <typename SubpelVarianceFunctionType>
 class SubpelVarianceTest
     : public ::testing::TestWithParam<
           tuple<int, int, SubpelVarianceFunctionType, int> > {
  public:
   // Unpacks the parameters, reseeds the random source and allocates the
   // src, second-predictor and reference buffers.
   virtual void SetUp() {
     const tuple<int, int, SubpelVarianceFunctionType, int> &params =
         this->GetParam();
     log2width_ = get<0>(params);
     width_ = 1 << log2width_;
     log2height_ = get<1>(params);
     height_ = 1 << log2height_;
     subpel_variance_ = get<2>(params);
     if (get<3>(params)) {
       // Named cast, matching VarianceTest::SetUp().
       bit_depth_ = static_cast<aom_bit_depth_t>(get<3>(params));
       use_high_bit_depth_ = true;
     } else {
       bit_depth_ = AOM_BITS_8;
       use_high_bit_depth_ = false;
     }
     // All-ones mask covering the low bit_depth_ bits of a sample.
     mask_ = (1 << bit_depth_) - 1;

     rnd_.Reset(ACMRandom::DeterministicSeed());
     block_size_ = width_ * height_;
     // ref_ holds (width_ + 1) * (height_ + 1) samples, i.e.
     // block_size_ + width_ + height_ + 1: the tests pass it with a stride of
     // width_ + 1 and the reference model reads one extra row and column.
     if (!use_high_bit_depth_) {
       src_ = reinterpret_cast<uint8_t *>(aom_memalign(16, block_size_));
       sec_ = reinterpret_cast<uint8_t *>(aom_memalign(16, block_size_));
       ref_ = new uint8_t[block_size_ + width_ + height_ + 1];
 #if CONFIG_AOM_HIGHBITDEPTH
     } else {
       src_ = CONVERT_TO_BYTEPTR(reinterpret_cast<uint16_t *>(
           aom_memalign(16, block_size_ * sizeof(uint16_t))));
       sec_ = CONVERT_TO_BYTEPTR(reinterpret_cast<uint16_t *>(
           aom_memalign(16, block_size_ * sizeof(uint16_t))));
       ref_ =
           CONVERT_TO_BYTEPTR(new uint16_t[block_size_ + width_ + height_ + 1]);
 #endif  // CONFIG_AOM_HIGHBITDEPTH
     }
     ASSERT_TRUE(src_ != NULL);
     ASSERT_TRUE(sec_ != NULL);
     ASSERT_TRUE(ref_ != NULL);
   }

   // Releases each buffer with the deallocator matching its allocation in
   // SetUp(), converting back to the 16-bit pointer first where needed.
   virtual void TearDown() {
     if (!use_high_bit_depth_) {
       aom_free(src_);
       delete[] ref_;
       aom_free(sec_);
 #if CONFIG_AOM_HIGHBITDEPTH
     } else {
       aom_free(CONVERT_TO_SHORTPTR(src_));
       delete[] CONVERT_TO_SHORTPTR(ref_);
       aom_free(CONVERT_TO_SHORTPTR(sec_));
 #endif  // CONFIG_AOM_HIGHBITDEPTH
     }
     libaom_test::ClearSystemState();
   }

  protected:
   void RefTest();
   void ExtremeRefTest();

   ACMRandom rnd_;
   uint8_t *src_;  // aligned source block
   uint8_t *ref_;  // reference block with one extra row and column
   uint8_t *sec_;  // aligned second predictor (used by the avg variant)
   bool use_high_bit_depth_;
   aom_bit_depth_t bit_depth_;
   int width_, log2width_;
   int height_, log2height_;
   int block_size_, mask_;
   SubpelVarianceFunctionType subpel_variance_;  // function under test
 };

 // For every (x, y) offset pair in [0, 7] x [0, 7], fills src and ref with
 // fresh random samples and checks the function under test against
 // subpel_variance_ref(). ref is passed with a stride of width_ + 1.
 template <typename SubpelVarianceFunctionType>
 void SubpelVarianceTest<SubpelVarianceFunctionType>::RefTest() {
   for (int x = 0; x < 8; ++x) {
     for (int y = 0; y < 8; ++y) {
       if (!use_high_bit_depth_) {
         for (int j = 0; j < block_size_; j++) {
           src_[j] = rnd_.Rand8();
         }
         // ref_ covers the block plus one extra row and column.
         for (int j = 0; j < block_size_ + width_ + height_ + 1; j++) {
           ref_[j] = rnd_.Rand8();
         }
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         // Mask random 16-bit values down to bit_depth_ bits.
         for (int j = 0; j < block_size_; j++) {
           CONVERT_TO_SHORTPTR(src_)[j] = rnd_.Rand16() & mask_;
         }
         for (int j = 0; j < block_size_ + width_ + height_ + 1; j++) {
           CONVERT_TO_SHORTPTR(ref_)[j] = rnd_.Rand16() & mask_;
         }
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
       unsigned int sse1, sse2;
       unsigned int var1;
       ASM_REGISTER_STATE_CHECK(
           var1 = subpel_variance_(ref_, width_ + 1, x, y, src_, width_, &sse1));
       const unsigned int var2 =
           subpel_variance_ref(ref_, src_, log2width_, log2height_, x, y, &sse2,
                               use_high_bit_depth_, bit_depth_);
       EXPECT_EQ(sse1, sse2) << "at position " << x << ", " << y;
       EXPECT_EQ(var1, var2) << "at position " << x << ", " << y;
     }
   }
 }

 // Checks the function under test against subpel_variance_ref() on saturated
 // inputs, for every (x, y) offset pair in [0, 7] x [0, 7].
 template <typename SubpelVarianceFunctionType>
 void SubpelVarianceTest<SubpelVarianceFunctionType>::ExtremeRefTest() {
   // Compare against reference.
   // 8-bit path:
   //   Src: first half of the values 0, second half 255.
   //   Ref: first half 255, the remainder (including the extra row/column) 0.
   // High bit depth path (note the mirrored pattern):
   //   Src: first half mask_, second half 0.
   //   Ref: first half 0, the remainder (including the extra row/column)
   //        mask_.
   for (int x = 0; x < 8; ++x) {
     for (int y = 0; y < 8; ++y) {
       const int half = block_size_ / 2;
       if (!use_high_bit_depth_) {
         memset(src_, 0, half);
         memset(src_ + half, 255, half);
         memset(ref_, 255, half);
         memset(ref_ + half, 0, half + width_ + height_ + 1);
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         aom_memset16(CONVERT_TO_SHORTPTR(src_), mask_, half);
         aom_memset16(CONVERT_TO_SHORTPTR(src_) + half, 0, half);
         aom_memset16(CONVERT_TO_SHORTPTR(ref_), 0, half);
         aom_memset16(CONVERT_TO_SHORTPTR(ref_) + half, mask_,
                      half + width_ + height_ + 1);
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
       unsigned int sse1, sse2;
       unsigned int var1;
       ASM_REGISTER_STATE_CHECK(
           var1 = subpel_variance_(ref_, width_ + 1, x, y, src_, width_, &sse1));
       const unsigned int var2 =
           subpel_variance_ref(ref_, src_, log2width_, log2height_, x, y, &sse2,
                               use_high_bit_depth_, bit_depth_);
       EXPECT_EQ(sse1, sse2) << "for xoffset " << x << " and yoffset " << y;
       EXPECT_EQ(var1, var2) << "for xoffset " << x << " and yoffset " << y;
     }
   }
 }

 // Specialization for the averaging kernels: in addition to src and ref, the
 // second predictor sec_ is filled with random samples and passed to both the
 // function under test and subpel_avg_variance_ref().
 template <>
 void SubpelVarianceTest<SubpixAvgVarMxNFunc>::RefTest() {
   for (int x = 0; x < 8; ++x) {
     for (int y = 0; y < 8; ++y) {
       if (!use_high_bit_depth_) {
         for (int j = 0; j < block_size_; j++) {
           src_[j] = rnd_.Rand8();
           sec_[j] = rnd_.Rand8();
         }
         // ref_ covers the block plus one extra row and column.
         for (int j = 0; j < block_size_ + width_ + height_ + 1; j++) {
           ref_[j] = rnd_.Rand8();
         }
 #if CONFIG_AOM_HIGHBITDEPTH
       } else {
         // Mask random 16-bit values down to bit_depth_ bits.
         for (int j = 0; j < block_size_; j++) {
           CONVERT_TO_SHORTPTR(src_)[j] = rnd_.Rand16() & mask_;
           CONVERT_TO_SHORTPTR(sec_)[j] = rnd_.Rand16() & mask_;
         }
         for (int j = 0; j < block_size_ + width_ + height_ + 1; j++) {
           CONVERT_TO_SHORTPTR(ref_)[j] = rnd_.Rand16() & mask_;
         }
 #endif  // CONFIG_AOM_HIGHBITDEPTH
       }
       unsigned int sse1, sse2;
       unsigned int var1;
       ASM_REGISTER_STATE_CHECK(var1 =
                                    subpel_variance_(ref_, width_ + 1, x, y,
                                                     src_, width_, &sse1, sec_));
       const unsigned int var2 =
           subpel_avg_variance_ref(ref_, src_, sec_, log2width_, log2height_, x,
                                   y, &sse2, use_high_bit_depth_, bit_depth_);
       EXPECT_EQ(sse1, sse2) << "at position " << x << ", " << y;
       EXPECT_EQ(var1, var2) << "at position " << x << ", " << y;
     }
   }
 }

 // Concrete fixture names for each kernel signature.
 typedef MseTest<Get4x4SseFunc> AvxSseTest;
 typedef MseTest<VarianceMxNFunc> AvxMseTest;
 typedef VarianceTest<VarianceMxNFunc> AvxVarianceTest;
 typedef SubpelVarianceTest<SubpixVarMxNFunc> AvxSubpelVarianceTest;
 typedef SubpelVarianceTest<SubpixAvgVarMxNFunc> AvxSubpelAvgVarianceTest;

 // Each parameterized test simply forwards to the matching fixture method.
 TEST_P(AvxSseTest, Ref_sse) { RefTest_sse(); }
 TEST_P(AvxSseTest, Max_sse) { MaxTest_sse(); }
 TEST_P(AvxMseTest, Ref_mse) { RefTest_mse(); }
 TEST_P(AvxMseTest, Max_mse) { MaxTest_mse(); }
 TEST_P(AvxVarianceTest, Zero) { ZeroTest(); }
 TEST_P(AvxVarianceTest, Ref) { RefTest(); }
 TEST_P(AvxVarianceTest, RefStride) { RefStrideTest(); }
 TEST_P(AvxVarianceTest, OneQuarter) { OneQuarterTest(); }
 TEST_P(SumOfSquaresTest, Const) { ConstTest(); }
 TEST_P(SumOfSquaresTest, Ref) { RefTest(); }
 TEST_P(AvxSubpelVarianceTest, Ref) { RefTest(); }
 TEST_P(AvxSubpelVarianceTest, ExtremeRef) { ExtremeRefTest(); }
 TEST_P(AvxSubpelAvgVarianceTest, Ref) { RefTest(); }

 // Instantiations for the plain C implementations.
 INSTANTIATE_TEST_CASE_P(C, SumOfSquaresTest,
                         ::testing::Values(aom_get_mb_ss_c));

 // Tuple layout for the MseTest fixtures:
 // (log2 width, log2 height, function under test).
 INSTANTIATE_TEST_CASE_P(C, AvxSseTest,
                         ::testing::Values(make_tuple(2, 2,
                                                      &aom_get4x4sse_cs_c)));

 INSTANTIATE_TEST_CASE_P(C, AvxMseTest,
                         ::testing::Values(make_tuple(4, 4, &aom_mse16x16_c),
                                           make_tuple(4, 3, &aom_mse16x8_c),
                                           make_tuple(3, 4, &aom_mse8x16_c),
                                           make_tuple(3, 3, &aom_mse8x8_c)));

 // Tuple layout for the variance fixtures below:
 // (log2 width, log2 height, function under test, bit depth), where a bit
 // depth of 0 selects the fixtures' 8-bit path.
 INSTANTIATE_TEST_CASE_P(
     C, AvxVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_variance64x64_c, 0),
                       make_tuple(6, 5, &aom_variance64x32_c, 0),
                       make_tuple(5, 6, &aom_variance32x64_c, 0),
                       make_tuple(5, 5, &aom_variance32x32_c, 0),
                       make_tuple(5, 4, &aom_variance32x16_c, 0),
                       make_tuple(4, 5, &aom_variance16x32_c, 0),
                       make_tuple(4, 4, &aom_variance16x16_c, 0),
                       make_tuple(4, 3, &aom_variance16x8_c, 0),
                       make_tuple(3, 4, &aom_variance8x16_c, 0),
                       make_tuple(3, 3, &aom_variance8x8_c, 0),
                       make_tuple(3, 2, &aom_variance8x4_c, 0),
                       make_tuple(2, 3, &aom_variance4x8_c, 0),
                       make_tuple(2, 2, &aom_variance4x4_c, 0)));

 INSTANTIATE_TEST_CASE_P(
     C, AvxSubpelVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_sub_pixel_variance64x64_c, 0),
                       make_tuple(6, 5, &aom_sub_pixel_variance64x32_c, 0),
                       make_tuple(5, 6, &aom_sub_pixel_variance32x64_c, 0),
                       make_tuple(5, 5, &aom_sub_pixel_variance32x32_c, 0),
                       make_tuple(5, 4, &aom_sub_pixel_variance32x16_c, 0),
                       make_tuple(4, 5, &aom_sub_pixel_variance16x32_c, 0),
                       make_tuple(4, 4, &aom_sub_pixel_variance16x16_c, 0),
                       make_tuple(4, 3, &aom_sub_pixel_variance16x8_c, 0),
                       make_tuple(3, 4, &aom_sub_pixel_variance8x16_c, 0),
                       make_tuple(3, 3, &aom_sub_pixel_variance8x8_c, 0),
                       make_tuple(3, 2, &aom_sub_pixel_variance8x4_c, 0),
                       make_tuple(2, 3, &aom_sub_pixel_variance4x8_c, 0),
                       make_tuple(2, 2, &aom_sub_pixel_variance4x4_c, 0)));

 INSTANTIATE_TEST_CASE_P(
     C, AvxSubpelAvgVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_sub_pixel_avg_variance64x64_c, 0),
                       make_tuple(6, 5, &aom_sub_pixel_avg_variance64x32_c, 0),
                       make_tuple(5, 6, &aom_sub_pixel_avg_variance32x64_c, 0),
                       make_tuple(5, 5, &aom_sub_pixel_avg_variance32x32_c, 0),
                       make_tuple(5, 4, &aom_sub_pixel_avg_variance32x16_c, 0),
                       make_tuple(4, 5, &aom_sub_pixel_avg_variance16x32_c, 0),
                       make_tuple(4, 4, &aom_sub_pixel_avg_variance16x16_c, 0),
                       make_tuple(4, 3, &aom_sub_pixel_avg_variance16x8_c, 0),
                       make_tuple(3, 4, &aom_sub_pixel_avg_variance8x16_c, 0),
                       make_tuple(3, 3, &aom_sub_pixel_avg_variance8x8_c, 0),
                       make_tuple(3, 2, &aom_sub_pixel_avg_variance8x4_c, 0),
                       make_tuple(2, 3, &aom_sub_pixel_avg_variance4x8_c, 0),
                       make_tuple(2, 2, &aom_sub_pixel_avg_variance4x4_c, 0)));

 #if CONFIG_AOM_HIGHBITDEPTH
 // Fixture names for the high bit depth kernels. They reuse the same fixture
 // templates as the 8-bit tests; the bit depth comes from the test parameter.
 typedef MseTest<VarianceMxNFunc> AvxHBDMseTest;
 typedef VarianceTest<VarianceMxNFunc> AvxHBDVarianceTest;
 typedef SubpelVarianceTest<SubpixVarMxNFunc> AvxHBDSubpelVarianceTest;
 typedef SubpelVarianceTest<SubpixAvgVarMxNFunc> AvxHBDSubpelAvgVarianceTest;

 // Each parameterized test simply forwards to the matching fixture method.
 // NOTE(review): the only AvxHBDMseTest instantiation visible below is
 // commented out, so the two AvxHBDMseTest tests appear to have no
 // parameters to run with -- confirm against the rest of the file.
 TEST_P(AvxHBDMseTest, Ref_mse) { RefTest_mse(); }
 TEST_P(AvxHBDMseTest, Max_mse) { MaxTest_mse(); }
 TEST_P(AvxHBDVarianceTest, Zero) { ZeroTest(); }
 TEST_P(AvxHBDVarianceTest, Ref) { RefTest(); }
 TEST_P(AvxHBDVarianceTest, RefStride) { RefStrideTest(); }
 TEST_P(AvxHBDVarianceTest, OneQuarter) { OneQuarterTest(); }
 TEST_P(AvxHBDSubpelVarianceTest, Ref) { RefTest(); }
 TEST_P(AvxHBDSubpelVarianceTest, ExtremeRef) { ExtremeRefTest(); }
 TEST_P(AvxHBDSubpelAvgVarianceTest, Ref) { RefTest(); }

 /* TODO(debargha): This test does not support the highbd version
 INSTANTIATE_TEST_CASE_P(
     C, AvxHBDMseTest,
     ::testing::Values(make_tuple(4, 4, &aom_highbd_12_mse16x16_c),
                       make_tuple(4, 4, &aom_highbd_12_mse16x8_c),
                       make_tuple(4, 4, &aom_highbd_12_mse8x16_c),
                       make_tuple(4, 4, &aom_highbd_12_mse8x8_c),
                       make_tuple(4, 4, &aom_highbd_10_mse16x16_c),
                       make_tuple(4, 4, &aom_highbd_10_mse16x8_c),
                       make_tuple(4, 4, &aom_highbd_10_mse8x16_c),
                       make_tuple(4, 4, &aom_highbd_10_mse8x8_c),
                       make_tuple(4, 4, &aom_highbd_8_mse16x16_c),
                       make_tuple(4, 4, &aom_highbd_8_mse16x8_c),
                       make_tuple(4, 4, &aom_highbd_8_mse8x16_c),
                       make_tuple(4, 4, &aom_highbd_8_mse8x8_c)));
 */

 // Registers the `_c` high-bitdepth variance functions with AvxHBDVarianceTest
 // under the "C" prefix: 12-, 10- and 8-bit variants, each for block sizes
 // 64x64 down to 4x4. In every tuple the first two values equal log2 of the
 // width and height in the function name, and the last value equals the bit
 // depth in the function name. How the fixture consumes these values is
 // defined outside this section.
 INSTANTIATE_TEST_CASE_P(
     C, AvxHBDVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_highbd_12_variance64x64_c, 12),
                       make_tuple(6, 5, &aom_highbd_12_variance64x32_c, 12),
                       make_tuple(5, 6, &aom_highbd_12_variance32x64_c, 12),
                       make_tuple(5, 5, &aom_highbd_12_variance32x32_c, 12),
                       make_tuple(5, 4, &aom_highbd_12_variance32x16_c, 12),
                       make_tuple(4, 5, &aom_highbd_12_variance16x32_c, 12),
                       make_tuple(4, 4, &aom_highbd_12_variance16x16_c, 12),
                       make_tuple(4, 3, &aom_highbd_12_variance16x8_c, 12),
                       make_tuple(3, 4, &aom_highbd_12_variance8x16_c, 12),
                       make_tuple(3, 3, &aom_highbd_12_variance8x8_c, 12),
                       make_tuple(3, 2, &aom_highbd_12_variance8x4_c, 12),
                       make_tuple(2, 3, &aom_highbd_12_variance4x8_c, 12),
                       make_tuple(2, 2, &aom_highbd_12_variance4x4_c, 12),
                       make_tuple(6, 6, &aom_highbd_10_variance64x64_c, 10),
                       make_tuple(6, 5, &aom_highbd_10_variance64x32_c, 10),
                       make_tuple(5, 6, &aom_highbd_10_variance32x64_c, 10),
                       make_tuple(5, 5, &aom_highbd_10_variance32x32_c, 10),
                       make_tuple(5, 4, &aom_highbd_10_variance32x16_c, 10),
                       make_tuple(4, 5, &aom_highbd_10_variance16x32_c, 10),
                       make_tuple(4, 4, &aom_highbd_10_variance16x16_c, 10),
                       make_tuple(4, 3, &aom_highbd_10_variance16x8_c, 10),
                       make_tuple(3, 4, &aom_highbd_10_variance8x16_c, 10),
                       make_tuple(3, 3, &aom_highbd_10_variance8x8_c, 10),
                       make_tuple(3, 2, &aom_highbd_10_variance8x4_c, 10),
                       make_tuple(2, 3, &aom_highbd_10_variance4x8_c, 10),
                       make_tuple(2, 2, &aom_highbd_10_variance4x4_c, 10),
                       make_tuple(6, 6, &aom_highbd_8_variance64x64_c, 8),
                       make_tuple(6, 5, &aom_highbd_8_variance64x32_c, 8),
                       make_tuple(5, 6, &aom_highbd_8_variance32x64_c, 8),
                       make_tuple(5, 5, &aom_highbd_8_variance32x32_c, 8),
                       make_tuple(5, 4, &aom_highbd_8_variance32x16_c, 8),
                       make_tuple(4, 5, &aom_highbd_8_variance16x32_c, 8),
                       make_tuple(4, 4, &aom_highbd_8_variance16x16_c, 8),
                       make_tuple(4, 3, &aom_highbd_8_variance16x8_c, 8),
                       make_tuple(3, 4, &aom_highbd_8_variance8x16_c, 8),
                       make_tuple(3, 3, &aom_highbd_8_variance8x8_c, 8),
                       make_tuple(3, 2, &aom_highbd_8_variance8x4_c, 8),
                       make_tuple(2, 3, &aom_highbd_8_variance4x8_c, 8),
                       make_tuple(2, 2, &aom_highbd_8_variance4x4_c, 8)));

 // Registers the `_c` high-bitdepth sub-pixel variance functions with
 // AvxHBDSubpelVarianceTest under the "C" prefix: 8-, 10- and 12-bit variants,
 // each for block sizes 64x64 down to 4x4. Tuple layout matches the function
 // names: (log2 width, log2 height, function, bit depth).
 INSTANTIATE_TEST_CASE_P(
     C, AvxHBDSubpelVarianceTest,
     ::testing::Values(
         make_tuple(6, 6, &aom_highbd_8_sub_pixel_variance64x64_c, 8),
         make_tuple(6, 5, &aom_highbd_8_sub_pixel_variance64x32_c, 8),
         make_tuple(5, 6, &aom_highbd_8_sub_pixel_variance32x64_c, 8),
         make_tuple(5, 5, &aom_highbd_8_sub_pixel_variance32x32_c, 8),
         make_tuple(5, 4, &aom_highbd_8_sub_pixel_variance32x16_c, 8),
         make_tuple(4, 5, &aom_highbd_8_sub_pixel_variance16x32_c, 8),
         make_tuple(4, 4, &aom_highbd_8_sub_pixel_variance16x16_c, 8),
         make_tuple(4, 3, &aom_highbd_8_sub_pixel_variance16x8_c, 8),
         make_tuple(3, 4, &aom_highbd_8_sub_pixel_variance8x16_c, 8),
         make_tuple(3, 3, &aom_highbd_8_sub_pixel_variance8x8_c, 8),
         make_tuple(3, 2, &aom_highbd_8_sub_pixel_variance8x4_c, 8),
         make_tuple(2, 3, &aom_highbd_8_sub_pixel_variance4x8_c, 8),
         make_tuple(2, 2, &aom_highbd_8_sub_pixel_variance4x4_c, 8),
         make_tuple(6, 6, &aom_highbd_10_sub_pixel_variance64x64_c, 10),
         make_tuple(6, 5, &aom_highbd_10_sub_pixel_variance64x32_c, 10),
         make_tuple(5, 6, &aom_highbd_10_sub_pixel_variance32x64_c, 10),
         make_tuple(5, 5, &aom_highbd_10_sub_pixel_variance32x32_c, 10),
         make_tuple(5, 4, &aom_highbd_10_sub_pixel_variance32x16_c, 10),
         make_tuple(4, 5, &aom_highbd_10_sub_pixel_variance16x32_c, 10),
         make_tuple(4, 4, &aom_highbd_10_sub_pixel_variance16x16_c, 10),
         make_tuple(4, 3, &aom_highbd_10_sub_pixel_variance16x8_c, 10),
         make_tuple(3, 4, &aom_highbd_10_sub_pixel_variance8x16_c, 10),
         make_tuple(3, 3, &aom_highbd_10_sub_pixel_variance8x8_c, 10),
         make_tuple(3, 2, &aom_highbd_10_sub_pixel_variance8x4_c, 10),
         make_tuple(2, 3, &aom_highbd_10_sub_pixel_variance4x8_c, 10),
         make_tuple(2, 2, &aom_highbd_10_sub_pixel_variance4x4_c, 10),
         make_tuple(6, 6, &aom_highbd_12_sub_pixel_variance64x64_c, 12),
         make_tuple(6, 5, &aom_highbd_12_sub_pixel_variance64x32_c, 12),
         make_tuple(5, 6, &aom_highbd_12_sub_pixel_variance32x64_c, 12),
         make_tuple(5, 5, &aom_highbd_12_sub_pixel_variance32x32_c, 12),
         make_tuple(5, 4, &aom_highbd_12_sub_pixel_variance32x16_c, 12),
         make_tuple(4, 5, &aom_highbd_12_sub_pixel_variance16x32_c, 12),
         make_tuple(4, 4, &aom_highbd_12_sub_pixel_variance16x16_c, 12),
         make_tuple(4, 3, &aom_highbd_12_sub_pixel_variance16x8_c, 12),
         make_tuple(3, 4, &aom_highbd_12_sub_pixel_variance8x16_c, 12),
         make_tuple(3, 3, &aom_highbd_12_sub_pixel_variance8x8_c, 12),
         make_tuple(3, 2, &aom_highbd_12_sub_pixel_variance8x4_c, 12),
         make_tuple(2, 3, &aom_highbd_12_sub_pixel_variance4x8_c, 12),
         make_tuple(2, 2, &aom_highbd_12_sub_pixel_variance4x4_c, 12)));

 // Registers the `_c` high-bitdepth sub-pixel averaging variance functions
 // with AvxHBDSubpelAvgVarianceTest under the "C" prefix: 8-, 10- and 12-bit
 // variants, each for block sizes 64x64 down to 4x4. Tuple layout matches the
 // function names: (log2 width, log2 height, function, bit depth).
 INSTANTIATE_TEST_CASE_P(
     C, AvxHBDSubpelAvgVarianceTest,
     ::testing::Values(
         make_tuple(6, 6, &aom_highbd_8_sub_pixel_avg_variance64x64_c, 8),
         make_tuple(6, 5, &aom_highbd_8_sub_pixel_avg_variance64x32_c, 8),
         make_tuple(5, 6, &aom_highbd_8_sub_pixel_avg_variance32x64_c, 8),
         make_tuple(5, 5, &aom_highbd_8_sub_pixel_avg_variance32x32_c, 8),
         make_tuple(5, 4, &aom_highbd_8_sub_pixel_avg_variance32x16_c, 8),
         make_tuple(4, 5, &aom_highbd_8_sub_pixel_avg_variance16x32_c, 8),
         make_tuple(4, 4, &aom_highbd_8_sub_pixel_avg_variance16x16_c, 8),
         make_tuple(4, 3, &aom_highbd_8_sub_pixel_avg_variance16x8_c, 8),
         make_tuple(3, 4, &aom_highbd_8_sub_pixel_avg_variance8x16_c, 8),
         make_tuple(3, 3, &aom_highbd_8_sub_pixel_avg_variance8x8_c, 8),
         make_tuple(3, 2, &aom_highbd_8_sub_pixel_avg_variance8x4_c, 8),
         make_tuple(2, 3, &aom_highbd_8_sub_pixel_avg_variance4x8_c, 8),
         make_tuple(2, 2, &aom_highbd_8_sub_pixel_avg_variance4x4_c, 8),
         make_tuple(6, 6, &aom_highbd_10_sub_pixel_avg_variance64x64_c, 10),
         make_tuple(6, 5, &aom_highbd_10_sub_pixel_avg_variance64x32_c, 10),
         make_tuple(5, 6, &aom_highbd_10_sub_pixel_avg_variance32x64_c, 10),
         make_tuple(5, 5, &aom_highbd_10_sub_pixel_avg_variance32x32_c, 10),
         make_tuple(5, 4, &aom_highbd_10_sub_pixel_avg_variance32x16_c, 10),
         make_tuple(4, 5, &aom_highbd_10_sub_pixel_avg_variance16x32_c, 10),
         make_tuple(4, 4, &aom_highbd_10_sub_pixel_avg_variance16x16_c, 10),
         make_tuple(4, 3, &aom_highbd_10_sub_pixel_avg_variance16x8_c, 10),
         make_tuple(3, 4, &aom_highbd_10_sub_pixel_avg_variance8x16_c, 10),
         make_tuple(3, 3, &aom_highbd_10_sub_pixel_avg_variance8x8_c, 10),
         make_tuple(3, 2, &aom_highbd_10_sub_pixel_avg_variance8x4_c, 10),
         make_tuple(2, 3, &aom_highbd_10_sub_pixel_avg_variance4x8_c, 10),
         make_tuple(2, 2, &aom_highbd_10_sub_pixel_avg_variance4x4_c, 10),
         make_tuple(6, 6, &aom_highbd_12_sub_pixel_avg_variance64x64_c, 12),
         make_tuple(6, 5, &aom_highbd_12_sub_pixel_avg_variance64x32_c, 12),
         make_tuple(5, 6, &aom_highbd_12_sub_pixel_avg_variance32x64_c, 12),
         make_tuple(5, 5, &aom_highbd_12_sub_pixel_avg_variance32x32_c, 12),
         make_tuple(5, 4, &aom_highbd_12_sub_pixel_avg_variance32x16_c, 12),
         make_tuple(4, 5, &aom_highbd_12_sub_pixel_avg_variance16x32_c, 12),
         make_tuple(4, 4, &aom_highbd_12_sub_pixel_avg_variance16x16_c, 12),
         make_tuple(4, 3, &aom_highbd_12_sub_pixel_avg_variance16x8_c, 12),
         make_tuple(3, 4, &aom_highbd_12_sub_pixel_avg_variance8x16_c, 12),
         make_tuple(3, 3, &aom_highbd_12_sub_pixel_avg_variance8x8_c, 12),
         make_tuple(3, 2, &aom_highbd_12_sub_pixel_avg_variance8x4_c, 12),
         make_tuple(2, 3, &aom_highbd_12_sub_pixel_avg_variance4x8_c, 12),
         make_tuple(2, 2, &aom_highbd_12_sub_pixel_avg_variance4x4_c, 12)));
 #endif  // CONFIG_AOM_HIGHBITDEPTH

 #if HAVE_SSE2
 // Registers aom_get_mb_ss_sse2 as the single parameter of SumOfSquaresTest
 // under the "SSE2" prefix.
 INSTANTIATE_TEST_CASE_P(SSE2, SumOfSquaresTest,
                         ::testing::Values(aom_get_mb_ss_sse2));

 // Registers the SSE2 MSE functions (16x16, 16x8, 8x16, 8x8) with AvxMseTest.
 // Each tuple is (log2 width, log2 height, function), matching the block size
 // in the function name.
 INSTANTIATE_TEST_CASE_P(SSE2, AvxMseTest,
                         ::testing::Values(make_tuple(4, 4, &aom_mse16x16_sse2),
                                           make_tuple(4, 3, &aom_mse16x8_sse2),
                                           make_tuple(3, 4, &aom_mse8x16_sse2),
                                           make_tuple(3, 3, &aom_mse8x8_sse2)));

 // Registers the SSE2 variance functions (64x64 down to 4x4) with
 // AvxVarianceTest. The first two tuple values equal log2 of the width and
 // height in the function name. The trailing 0 sits where the high-bitdepth
 // instantiations pass a bit depth; presumably it marks the non-high-bitdepth
 // path (confirm against the fixture).
 INSTANTIATE_TEST_CASE_P(
     SSE2, AvxVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_variance64x64_sse2, 0),
                       make_tuple(6, 5, &aom_variance64x32_sse2, 0),
                       make_tuple(5, 6, &aom_variance32x64_sse2, 0),
                       make_tuple(5, 5, &aom_variance32x32_sse2, 0),
                       make_tuple(5, 4, &aom_variance32x16_sse2, 0),
                       make_tuple(4, 5, &aom_variance16x32_sse2, 0),
                       make_tuple(4, 4, &aom_variance16x16_sse2, 0),
                       make_tuple(4, 3, &aom_variance16x8_sse2, 0),
                       make_tuple(3, 4, &aom_variance8x16_sse2, 0),
                       make_tuple(3, 3, &aom_variance8x8_sse2, 0),
                       make_tuple(3, 2, &aom_variance8x4_sse2, 0),
                       make_tuple(2, 3, &aom_variance4x8_sse2, 0),
                       make_tuple(2, 2, &aom_variance4x4_sse2, 0)));

 #if CONFIG_USE_X86INC
 // Registers the sub-pixel variance functions (64x64 down to 4x4) with
 // AvxSubpelVarianceTest under the "SSE2" prefix. Tuples are
 // (log2 width, log2 height, function, 0).
 // Note: the 4x8 and 4x4 entries reference symbols with the `_sse` suffix,
 // not `_sse2`.
 INSTANTIATE_TEST_CASE_P(
     SSE2, AvxSubpelVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_sub_pixel_variance64x64_sse2, 0),
                       make_tuple(6, 5, &aom_sub_pixel_variance64x32_sse2, 0),
                       make_tuple(5, 6, &aom_sub_pixel_variance32x64_sse2, 0),
                       make_tuple(5, 5, &aom_sub_pixel_variance32x32_sse2, 0),
                       make_tuple(5, 4, &aom_sub_pixel_variance32x16_sse2, 0),
                       make_tuple(4, 5, &aom_sub_pixel_variance16x32_sse2, 0),
                       make_tuple(4, 4, &aom_sub_pixel_variance16x16_sse2, 0),
                       make_tuple(4, 3, &aom_sub_pixel_variance16x8_sse2, 0),
                       make_tuple(3, 4, &aom_sub_pixel_variance8x16_sse2, 0),
                       make_tuple(3, 3, &aom_sub_pixel_variance8x8_sse2, 0),
                       make_tuple(3, 2, &aom_sub_pixel_variance8x4_sse2, 0),
                       make_tuple(2, 3, &aom_sub_pixel_variance4x8_sse, 0),
                       make_tuple(2, 2, &aom_sub_pixel_variance4x4_sse, 0)));

 // Registers the sub-pixel averaging variance functions (64x64 down to 4x4)
 // with AvxSubpelAvgVarianceTest under the "SSE2" prefix. Tuples are
 // (log2 width, log2 height, function, 0).
 // Note: the 4x8 and 4x4 entries reference symbols with the `_sse` suffix,
 // not `_sse2`.
 INSTANTIATE_TEST_CASE_P(
     SSE2, AvxSubpelAvgVarianceTest,
     ::testing::Values(
         make_tuple(6, 6, &aom_sub_pixel_avg_variance64x64_sse2, 0),
         make_tuple(6, 5, &aom_sub_pixel_avg_variance64x32_sse2, 0),
         make_tuple(5, 6, &aom_sub_pixel_avg_variance32x64_sse2, 0),
         make_tuple(5, 5, &aom_sub_pixel_avg_variance32x32_sse2, 0),
         make_tuple(5, 4, &aom_sub_pixel_avg_variance32x16_sse2, 0),
         make_tuple(4, 5, &aom_sub_pixel_avg_variance16x32_sse2, 0),
         make_tuple(4, 4, &aom_sub_pixel_avg_variance16x16_sse2, 0),
         make_tuple(4, 3, &aom_sub_pixel_avg_variance16x8_sse2, 0),
         make_tuple(3, 4, &aom_sub_pixel_avg_variance8x16_sse2, 0),
         make_tuple(3, 3, &aom_sub_pixel_avg_variance8x8_sse2, 0),
         make_tuple(3, 2, &aom_sub_pixel_avg_variance8x4_sse2, 0),
         make_tuple(2, 3, &aom_sub_pixel_avg_variance4x8_sse, 0),
         make_tuple(2, 2, &aom_sub_pixel_avg_variance4x4_sse, 0)));
 #endif  // CONFIG_USE_X86INC

 #if CONFIG_AOM_HIGHBITDEPTH
 /* TODO(debargha): This test does not support the highbd version
 INSTANTIATE_TEST_CASE_P(
     SSE2, AvxHBDMseTest,
     ::testing::Values(make_tuple(4, 4, &aom_highbd_12_mse16x16_sse2),
                       make_tuple(4, 3, &aom_highbd_12_mse16x8_sse2),
                       make_tuple(3, 4, &aom_highbd_12_mse8x16_sse2),
                       make_tuple(3, 3, &aom_highbd_12_mse8x8_sse2),
                       make_tuple(4, 4, &aom_highbd_10_mse16x16_sse2),
                       make_tuple(4, 3, &aom_highbd_10_mse16x8_sse2),
                       make_tuple(3, 4, &aom_highbd_10_mse8x16_sse2),
                       make_tuple(3, 3, &aom_highbd_10_mse8x8_sse2),
                       make_tuple(4, 4, &aom_highbd_8_mse16x16_sse2),
                       make_tuple(4, 3, &aom_highbd_8_mse16x8_sse2),
                       make_tuple(3, 4, &aom_highbd_8_mse8x16_sse2),
                       make_tuple(3, 3, &aom_highbd_8_mse8x8_sse2)));
 */

 // Registers the SSE2 high-bitdepth variance functions with
 // AvxHBDVarianceTest: 12-, 10- and 8-bit variants, each for block sizes
 // 64x64 down to 8x8. Unlike the C instantiation, no 8x4, 4x8 or 4x4 entries
 // are listed here. Tuples are (log2 width, log2 height, function, bit depth).
 INSTANTIATE_TEST_CASE_P(
     SSE2, AvxHBDVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_highbd_12_variance64x64_sse2, 12),
                       make_tuple(6, 5, &aom_highbd_12_variance64x32_sse2, 12),
                       make_tuple(5, 6, &aom_highbd_12_variance32x64_sse2, 12),
                       make_tuple(5, 5, &aom_highbd_12_variance32x32_sse2, 12),
                       make_tuple(5, 4, &aom_highbd_12_variance32x16_sse2, 12),
                       make_tuple(4, 5, &aom_highbd_12_variance16x32_sse2, 12),
                       make_tuple(4, 4, &aom_highbd_12_variance16x16_sse2, 12),
                       make_tuple(4, 3, &aom_highbd_12_variance16x8_sse2, 12),
                       make_tuple(3, 4, &aom_highbd_12_variance8x16_sse2, 12),
                       make_tuple(3, 3, &aom_highbd_12_variance8x8_sse2, 12),
                       make_tuple(6, 6, &aom_highbd_10_variance64x64_sse2, 10),
                       make_tuple(6, 5, &aom_highbd_10_variance64x32_sse2, 10),
                       make_tuple(5, 6, &aom_highbd_10_variance32x64_sse2, 10),
                       make_tuple(5, 5, &aom_highbd_10_variance32x32_sse2, 10),
                       make_tuple(5, 4, &aom_highbd_10_variance32x16_sse2, 10),
                       make_tuple(4, 5, &aom_highbd_10_variance16x32_sse2, 10),
                       make_tuple(4, 4, &aom_highbd_10_variance16x16_sse2, 10),
                       make_tuple(4, 3, &aom_highbd_10_variance16x8_sse2, 10),
                       make_tuple(3, 4, &aom_highbd_10_variance8x16_sse2, 10),
                       make_tuple(3, 3, &aom_highbd_10_variance8x8_sse2, 10),
                       make_tuple(6, 6, &aom_highbd_8_variance64x64_sse2, 8),
                       make_tuple(6, 5, &aom_highbd_8_variance64x32_sse2, 8),
                       make_tuple(5, 6, &aom_highbd_8_variance32x64_sse2, 8),
                       make_tuple(5, 5, &aom_highbd_8_variance32x32_sse2, 8),
                       make_tuple(5, 4, &aom_highbd_8_variance32x16_sse2, 8),
                       make_tuple(4, 5, &aom_highbd_8_variance16x32_sse2, 8),
                       make_tuple(4, 4, &aom_highbd_8_variance16x16_sse2, 8),
                       make_tuple(4, 3, &aom_highbd_8_variance16x8_sse2, 8),
                       make_tuple(3, 4, &aom_highbd_8_variance8x16_sse2, 8),
                       make_tuple(3, 3, &aom_highbd_8_variance8x8_sse2, 8)));

 #if CONFIG_USE_X86INC
 // Registers the SSE2 high-bitdepth sub-pixel variance functions with
 // AvxHBDSubpelVarianceTest: 12-, 10- and 8-bit variants, each for block
 // sizes 64x64 down to 8x4. No 4x8 or 4x4 entries are listed here. Tuples are
 // (log2 width, log2 height, function, bit depth).
 INSTANTIATE_TEST_CASE_P(
     SSE2, AvxHBDSubpelVarianceTest,
     ::testing::Values(
         make_tuple(6, 6, &aom_highbd_12_sub_pixel_variance64x64_sse2, 12),
         make_tuple(6, 5, &aom_highbd_12_sub_pixel_variance64x32_sse2, 12),
         make_tuple(5, 6, &aom_highbd_12_sub_pixel_variance32x64_sse2, 12),
         make_tuple(5, 5, &aom_highbd_12_sub_pixel_variance32x32_sse2, 12),
         make_tuple(5, 4, &aom_highbd_12_sub_pixel_variance32x16_sse2, 12),
         make_tuple(4, 5, &aom_highbd_12_sub_pixel_variance16x32_sse2, 12),
         make_tuple(4, 4, &aom_highbd_12_sub_pixel_variance16x16_sse2, 12),
         make_tuple(4, 3, &aom_highbd_12_sub_pixel_variance16x8_sse2, 12),
         make_tuple(3, 4, &aom_highbd_12_sub_pixel_variance8x16_sse2, 12),
         make_tuple(3, 3, &aom_highbd_12_sub_pixel_variance8x8_sse2, 12),
         make_tuple(3, 2, &aom_highbd_12_sub_pixel_variance8x4_sse2, 12),
         make_tuple(6, 6, &aom_highbd_10_sub_pixel_variance64x64_sse2, 10),
         make_tuple(6, 5, &aom_highbd_10_sub_pixel_variance64x32_sse2, 10),
         make_tuple(5, 6, &aom_highbd_10_sub_pixel_variance32x64_sse2, 10),
         make_tuple(5, 5, &aom_highbd_10_sub_pixel_variance32x32_sse2, 10),
         make_tuple(5, 4, &aom_highbd_10_sub_pixel_variance32x16_sse2, 10),
         make_tuple(4, 5, &aom_highbd_10_sub_pixel_variance16x32_sse2, 10),
         make_tuple(4, 4, &aom_highbd_10_sub_pixel_variance16x16_sse2, 10),
         make_tuple(4, 3, &aom_highbd_10_sub_pixel_variance16x8_sse2, 10),
         make_tuple(3, 4, &aom_highbd_10_sub_pixel_variance8x16_sse2, 10),
         make_tuple(3, 3, &aom_highbd_10_sub_pixel_variance8x8_sse2, 10),
         make_tuple(3, 2, &aom_highbd_10_sub_pixel_variance8x4_sse2, 10),
         make_tuple(6, 6, &aom_highbd_8_sub_pixel_variance64x64_sse2, 8),
         make_tuple(6, 5, &aom_highbd_8_sub_pixel_variance64x32_sse2, 8),
         make_tuple(5, 6, &aom_highbd_8_sub_pixel_variance32x64_sse2, 8),
         make_tuple(5, 5, &aom_highbd_8_sub_pixel_variance32x32_sse2, 8),
         make_tuple(5, 4, &aom_highbd_8_sub_pixel_variance32x16_sse2, 8),
         make_tuple(4, 5, &aom_highbd_8_sub_pixel_variance16x32_sse2, 8),
         make_tuple(4, 4, &aom_highbd_8_sub_pixel_variance16x16_sse2, 8),
         make_tuple(4, 3, &aom_highbd_8_sub_pixel_variance16x8_sse2, 8),
         make_tuple(3, 4, &aom_highbd_8_sub_pixel_variance8x16_sse2, 8),
         make_tuple(3, 3, &aom_highbd_8_sub_pixel_variance8x8_sse2, 8),
         make_tuple(3, 2, &aom_highbd_8_sub_pixel_variance8x4_sse2, 8)));

 // Registers the SSE2 high-bitdepth sub-pixel averaging variance functions
 // with AvxHBDSubpelAvgVarianceTest: 12-, 10- and 8-bit variants, each for
 // block sizes 64x64 down to 8x4. No 4x8 or 4x4 entries are listed here.
 // Tuples are (log2 width, log2 height, function, bit depth).
 INSTANTIATE_TEST_CASE_P(
     SSE2, AvxHBDSubpelAvgVarianceTest,
     ::testing::Values(
         make_tuple(6, 6, &aom_highbd_12_sub_pixel_avg_variance64x64_sse2, 12),
         make_tuple(6, 5, &aom_highbd_12_sub_pixel_avg_variance64x32_sse2, 12),
         make_tuple(5, 6, &aom_highbd_12_sub_pixel_avg_variance32x64_sse2, 12),
         make_tuple(5, 5, &aom_highbd_12_sub_pixel_avg_variance32x32_sse2, 12),
         make_tuple(5, 4, &aom_highbd_12_sub_pixel_avg_variance32x16_sse2, 12),
         make_tuple(4, 5, &aom_highbd_12_sub_pixel_avg_variance16x32_sse2, 12),
         make_tuple(4, 4, &aom_highbd_12_sub_pixel_avg_variance16x16_sse2, 12),
         make_tuple(4, 3, &aom_highbd_12_sub_pixel_avg_variance16x8_sse2, 12),
         make_tuple(3, 4, &aom_highbd_12_sub_pixel_avg_variance8x16_sse2, 12),
         make_tuple(3, 3, &aom_highbd_12_sub_pixel_avg_variance8x8_sse2, 12),
         make_tuple(3, 2, &aom_highbd_12_sub_pixel_avg_variance8x4_sse2, 12),
         make_tuple(6, 6, &aom_highbd_10_sub_pixel_avg_variance64x64_sse2, 10),
         make_tuple(6, 5, &aom_highbd_10_sub_pixel_avg_variance64x32_sse2, 10),
         make_tuple(5, 6, &aom_highbd_10_sub_pixel_avg_variance32x64_sse2, 10),
         make_tuple(5, 5, &aom_highbd_10_sub_pixel_avg_variance32x32_sse2, 10),
         make_tuple(5, 4, &aom_highbd_10_sub_pixel_avg_variance32x16_sse2, 10),
         make_tuple(4, 5, &aom_highbd_10_sub_pixel_avg_variance16x32_sse2, 10),
         make_tuple(4, 4, &aom_highbd_10_sub_pixel_avg_variance16x16_sse2, 10),
         make_tuple(4, 3, &aom_highbd_10_sub_pixel_avg_variance16x8_sse2, 10),
         make_tuple(3, 4, &aom_highbd_10_sub_pixel_avg_variance8x16_sse2, 10),
         make_tuple(3, 3, &aom_highbd_10_sub_pixel_avg_variance8x8_sse2, 10),
         make_tuple(3, 2, &aom_highbd_10_sub_pixel_avg_variance8x4_sse2, 10),
         make_tuple(6, 6, &aom_highbd_8_sub_pixel_avg_variance64x64_sse2, 8),
         make_tuple(6, 5, &aom_highbd_8_sub_pixel_avg_variance64x32_sse2, 8),
         make_tuple(5, 6, &aom_highbd_8_sub_pixel_avg_variance32x64_sse2, 8),
         make_tuple(5, 5, &aom_highbd_8_sub_pixel_avg_variance32x32_sse2, 8),
         make_tuple(5, 4, &aom_highbd_8_sub_pixel_avg_variance32x16_sse2, 8),
         make_tuple(4, 5, &aom_highbd_8_sub_pixel_avg_variance16x32_sse2, 8),
         make_tuple(4, 4, &aom_highbd_8_sub_pixel_avg_variance16x16_sse2, 8),
         make_tuple(4, 3, &aom_highbd_8_sub_pixel_avg_variance16x8_sse2, 8),
         make_tuple(3, 4, &aom_highbd_8_sub_pixel_avg_variance8x16_sse2, 8),
         make_tuple(3, 3, &aom_highbd_8_sub_pixel_avg_variance8x8_sse2, 8),
         make_tuple(3, 2, &aom_highbd_8_sub_pixel_avg_variance8x4_sse2, 8)));
 #endif  // CONFIG_USE_X86INC
 #endif  // CONFIG_AOM_HIGHBITDEPTH
 #endif  // HAVE_SSE2

 #if HAVE_SSSE3
 #if CONFIG_USE_X86INC
 // Registers the SSSE3 sub-pixel variance functions (64x64 down to 4x4) with
 // AvxSubpelVarianceTest. Tuples are (log2 width, log2 height, function, 0).
 INSTANTIATE_TEST_CASE_P(
     SSSE3, AvxSubpelVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_sub_pixel_variance64x64_ssse3, 0),
                       make_tuple(6, 5, &aom_sub_pixel_variance64x32_ssse3, 0),
                       make_tuple(5, 6, &aom_sub_pixel_variance32x64_ssse3, 0),
                       make_tuple(5, 5, &aom_sub_pixel_variance32x32_ssse3, 0),
                       make_tuple(5, 4, &aom_sub_pixel_variance32x16_ssse3, 0),
                       make_tuple(4, 5, &aom_sub_pixel_variance16x32_ssse3, 0),
                       make_tuple(4, 4, &aom_sub_pixel_variance16x16_ssse3, 0),
                       make_tuple(4, 3, &aom_sub_pixel_variance16x8_ssse3, 0),
                       make_tuple(3, 4, &aom_sub_pixel_variance8x16_ssse3, 0),
                       make_tuple(3, 3, &aom_sub_pixel_variance8x8_ssse3, 0),
                       make_tuple(3, 2, &aom_sub_pixel_variance8x4_ssse3, 0),
                       make_tuple(2, 3, &aom_sub_pixel_variance4x8_ssse3, 0),
                       make_tuple(2, 2, &aom_sub_pixel_variance4x4_ssse3, 0)));

 // Registers the SSSE3 sub-pixel averaging variance functions (64x64 down to
 // 4x4) with AvxSubpelAvgVarianceTest. Tuples are
 // (log2 width, log2 height, function, 0).
 INSTANTIATE_TEST_CASE_P(
     SSSE3, AvxSubpelAvgVarianceTest,
     ::testing::Values(
         make_tuple(6, 6, &aom_sub_pixel_avg_variance64x64_ssse3, 0),
         make_tuple(6, 5, &aom_sub_pixel_avg_variance64x32_ssse3, 0),
         make_tuple(5, 6, &aom_sub_pixel_avg_variance32x64_ssse3, 0),
         make_tuple(5, 5, &aom_sub_pixel_avg_variance32x32_ssse3, 0),
         make_tuple(5, 4, &aom_sub_pixel_avg_variance32x16_ssse3, 0),
         make_tuple(4, 5, &aom_sub_pixel_avg_variance16x32_ssse3, 0),
         make_tuple(4, 4, &aom_sub_pixel_avg_variance16x16_ssse3, 0),
         make_tuple(4, 3, &aom_sub_pixel_avg_variance16x8_ssse3, 0),
         make_tuple(3, 4, &aom_sub_pixel_avg_variance8x16_ssse3, 0),
         make_tuple(3, 3, &aom_sub_pixel_avg_variance8x8_ssse3, 0),
         make_tuple(3, 2, &aom_sub_pixel_avg_variance8x4_ssse3, 0),
         make_tuple(2, 3, &aom_sub_pixel_avg_variance4x8_ssse3, 0),
         make_tuple(2, 2, &aom_sub_pixel_avg_variance4x4_ssse3, 0)));
 #endif  // CONFIG_USE_X86INC
 #endif  // HAVE_SSSE3

 #if HAVE_AVX2
 // Registers the AVX2 MSE function with AvxMseTest; only the 16x16 size is
 // listed. The tuple is (log2 width, log2 height, function).
 INSTANTIATE_TEST_CASE_P(AVX2, AvxMseTest,
                         ::testing::Values(make_tuple(4, 4,
                                                      &aom_mse16x16_avx2)));

 // Registers the AVX2 variance functions with AvxVarianceTest. Only 64x64,
 // 64x32, 32x32, 32x16 and 16x16 are listed. Tuples are
 // (log2 width, log2 height, function, 0).
 INSTANTIATE_TEST_CASE_P(
     AVX2, AvxVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_variance64x64_avx2, 0),
                       make_tuple(6, 5, &aom_variance64x32_avx2, 0),
                       make_tuple(5, 5, &aom_variance32x32_avx2, 0),
                       make_tuple(5, 4, &aom_variance32x16_avx2, 0),
                       make_tuple(4, 4, &aom_variance16x16_avx2, 0)));

 // Registers the AVX2 sub-pixel variance functions with
 // AvxSubpelVarianceTest. Only 64x64 and 32x32 are listed.
 INSTANTIATE_TEST_CASE_P(
     AVX2, AvxSubpelVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_sub_pixel_variance64x64_avx2, 0),
                       make_tuple(5, 5, &aom_sub_pixel_variance32x32_avx2, 0)));

 // Registers the AVX2 sub-pixel averaging variance functions with
 // AvxSubpelAvgVarianceTest. Only 64x64 and 32x32 are listed.
 INSTANTIATE_TEST_CASE_P(
     AVX2, AvxSubpelAvgVarianceTest,
     ::testing::Values(
         make_tuple(6, 6, &aom_sub_pixel_avg_variance64x64_avx2, 0),
         make_tuple(5, 5, &aom_sub_pixel_avg_variance32x32_avx2, 0)));
 #endif  // HAVE_AVX2

 #if HAVE_MEDIA
 // Registers the `_media` MSE function with AvxMseTest; only the 16x16 size
 // is listed. The tuple is (log2 width, log2 height, function).
 INSTANTIATE_TEST_CASE_P(MEDIA, AvxMseTest,
                         ::testing::Values(make_tuple(4, 4,
                                                      &aom_mse16x16_media)));

 // Registers the `_media` variance functions with AvxVarianceTest. Only
 // 16x16 and 8x8 are listed.
 INSTANTIATE_TEST_CASE_P(
     MEDIA, AvxVarianceTest,
     ::testing::Values(make_tuple(4, 4, &aom_variance16x16_media, 0),
                       make_tuple(3, 3, &aom_variance8x8_media, 0)));

 // Registers the `_media` sub-pixel variance functions with
 // AvxSubpelVarianceTest. Only 16x16 and 8x8 are listed.
 INSTANTIATE_TEST_CASE_P(
     MEDIA, AvxSubpelVarianceTest,
     ::testing::Values(make_tuple(4, 4, &aom_sub_pixel_variance16x16_media, 0),
                       make_tuple(3, 3, &aom_sub_pixel_variance8x8_media, 0)));
 #endif  // HAVE_MEDIA

 #if HAVE_NEON
 // Registers aom_get4x4sse_cs_neon with AvxSseTest. The leading (2, 2)
 // matches log2 of the 4x4 size in the function name.
 INSTANTIATE_TEST_CASE_P(NEON, AvxSseTest,
                         ::testing::Values(make_tuple(2, 2,
                                                      &aom_get4x4sse_cs_neon)));

 // Registers the NEON MSE function with AvxMseTest; only the 16x16 size is
 // listed. The tuple is (log2 width, log2 height, function).
 INSTANTIATE_TEST_CASE_P(NEON, AvxMseTest,
                         ::testing::Values(make_tuple(4, 4,
                                                      &aom_mse16x16_neon)));

 // Registers the NEON variance functions with AvxVarianceTest. Listed sizes
 // are 64x64, 64x32, 32x64, 32x32, 16x16, 16x8, 8x16 and 8x8; there are no
 // 32x16, 16x32 or 4-wide/4-tall entries. Tuples are
 // (log2 width, log2 height, function, 0).
 INSTANTIATE_TEST_CASE_P(
     NEON, AvxVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_variance64x64_neon, 0),
                       make_tuple(6, 5, &aom_variance64x32_neon, 0),
                       make_tuple(5, 6, &aom_variance32x64_neon, 0),
                       make_tuple(5, 5, &aom_variance32x32_neon, 0),
                       make_tuple(4, 4, &aom_variance16x16_neon, 0),
                       make_tuple(4, 3, &aom_variance16x8_neon, 0),
                       make_tuple(3, 4, &aom_variance8x16_neon, 0),
                       make_tuple(3, 3, &aom_variance8x8_neon, 0)));

 // Registers the NEON sub-pixel variance functions with
 // AvxSubpelVarianceTest. Only the square sizes 64x64, 32x32, 16x16 and 8x8
 // are listed.
 INSTANTIATE_TEST_CASE_P(
     NEON, AvxSubpelVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_sub_pixel_variance64x64_neon, 0),
                       make_tuple(5, 5, &aom_sub_pixel_variance32x32_neon, 0),
                       make_tuple(4, 4, &aom_sub_pixel_variance16x16_neon, 0),
                       make_tuple(3, 3, &aom_sub_pixel_variance8x8_neon, 0)));
 #endif  // HAVE_NEON

 #if HAVE_MSA
 // Registers aom_get_mb_ss_msa as the single parameter of SumOfSquaresTest
 // under the "MSA" prefix.
 INSTANTIATE_TEST_CASE_P(MSA, SumOfSquaresTest,
                         ::testing::Values(aom_get_mb_ss_msa));

 // Registers aom_get4x4sse_cs_msa with AvxSseTest. The leading (2, 2) matches
 // log2 of the 4x4 size in the function name.
 INSTANTIATE_TEST_CASE_P(MSA, AvxSseTest,
                         ::testing::Values(make_tuple(2, 2,
                                                      &aom_get4x4sse_cs_msa)));

 // Registers the MSA MSE functions (16x16, 16x8, 8x16, 8x8) with AvxMseTest.
 // Each tuple is (log2 width, log2 height, function), matching the block size
 // in the function name.
 INSTANTIATE_TEST_CASE_P(MSA, AvxMseTest,
                         ::testing::Values(make_tuple(4, 4, &aom_mse16x16_msa),
                                           make_tuple(4, 3, &aom_mse16x8_msa),
                                           make_tuple(3, 4, &aom_mse8x16_msa),
                                           make_tuple(3, 3, &aom_mse8x8_msa)));

 // Registers the MSA variance functions (64x64 down to 4x4) with
 // AvxVarianceTest. Tuples are (log2 width, log2 height, function, 0).
 INSTANTIATE_TEST_CASE_P(
     MSA, AvxVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_variance64x64_msa, 0),
                       make_tuple(6, 5, &aom_variance64x32_msa, 0),
                       make_tuple(5, 6, &aom_variance32x64_msa, 0),
                       make_tuple(5, 5, &aom_variance32x32_msa, 0),
                       make_tuple(5, 4, &aom_variance32x16_msa, 0),
                       make_tuple(4, 5, &aom_variance16x32_msa, 0),
                       make_tuple(4, 4, &aom_variance16x16_msa, 0),
                       make_tuple(4, 3, &aom_variance16x8_msa, 0),
                       make_tuple(3, 4, &aom_variance8x16_msa, 0),
                       make_tuple(3, 3, &aom_variance8x8_msa, 0),
                       make_tuple(3, 2, &aom_variance8x4_msa, 0),
                       make_tuple(2, 3, &aom_variance4x8_msa, 0),
                       make_tuple(2, 2, &aom_variance4x4_msa, 0)));

 // Registers the MSA sub-pixel variance functions with AvxSubpelVarianceTest.
 // Unlike the other instantiations in this file, the entries are listed in
 // ascending size order, from 4x4 up to 64x64. Tuples are
 // (log2 width, log2 height, function, 0).
 INSTANTIATE_TEST_CASE_P(
     MSA, AvxSubpelVarianceTest,
     ::testing::Values(make_tuple(2, 2, &aom_sub_pixel_variance4x4_msa, 0),
                       make_tuple(2, 3, &aom_sub_pixel_variance4x8_msa, 0),
                       make_tuple(3, 2, &aom_sub_pixel_variance8x4_msa, 0),
                       make_tuple(3, 3, &aom_sub_pixel_variance8x8_msa, 0),
                       make_tuple(3, 4, &aom_sub_pixel_variance8x16_msa, 0),
                       make_tuple(4, 3, &aom_sub_pixel_variance16x8_msa, 0),
                       make_tuple(4, 4, &aom_sub_pixel_variance16x16_msa, 0),
                       make_tuple(4, 5, &aom_sub_pixel_variance16x32_msa, 0),
                       make_tuple(5, 4, &aom_sub_pixel_variance32x16_msa, 0),
                       make_tuple(5, 5, &aom_sub_pixel_variance32x32_msa, 0),
                       make_tuple(5, 6, &aom_sub_pixel_variance32x64_msa, 0),
                       make_tuple(6, 5, &aom_sub_pixel_variance64x32_msa, 0),
                       make_tuple(6, 6, &aom_sub_pixel_variance64x64_msa, 0)));

 // Registers the MSA sub-pixel averaging variance functions (64x64 down to
 // 4x4) with AvxSubpelAvgVarianceTest. Tuples are
 // (log2 width, log2 height, function, 0).
 INSTANTIATE_TEST_CASE_P(
     MSA, AvxSubpelAvgVarianceTest,
     ::testing::Values(make_tuple(6, 6, &aom_sub_pixel_avg_variance64x64_msa, 0),
                       make_tuple(6, 5, &aom_sub_pixel_avg_variance64x32_msa, 0),
                       make_tuple(5, 6, &aom_sub_pixel_avg_variance32x64_msa, 0),
                       make_tuple(5, 5, &aom_sub_pixel_avg_variance32x32_msa, 0),
                       make_tuple(5, 4, &aom_sub_pixel_avg_variance32x16_msa, 0),
                       make_tuple(4, 5, &aom_sub_pixel_avg_variance16x32_msa, 0),
                       make_tuple(4, 4, &aom_sub_pixel_avg_variance16x16_msa, 0),
                       make_tuple(4, 3, &aom_sub_pixel_avg_variance16x8_msa, 0),
                       make_tuple(3, 4, &aom_sub_pixel_avg_variance8x16_msa, 0),
                       make_tuple(3, 3, &aom_sub_pixel_avg_variance8x8_msa, 0),
                       make_tuple(3, 2, &aom_sub_pixel_avg_variance8x4_msa, 0),
                       make_tuple(2, 3, &aom_sub_pixel_avg_variance4x8_msa, 0),
                       make_tuple(2, 2, &aom_sub_pixel_avg_variance4x4_msa, 0)));
 #endif  // HAVE_MSA
 }  // namespace