blob: edf46821695004d2a227cf8169b3177801e92635 [file] [log] [blame]
Daniel Kang26641c72012-06-28 16:26:31 -07001/*
2 * Copyright (c) 2012 The WebM project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
11#include <math.h>
12#include <stdlib.h>
13#include <string.h>
14
15#include "third_party/googletest/src/include/gtest/gtest.h"
Jingning Han097d59c2015-07-29 14:51:36 -070016
17#include "./vp9_rtcd.h"
18#include "./vpx_dsp_rtcd.h"
Jingning Han4bd17112013-09-16 16:01:50 -070019#include "test/acm_random.h"
Yaowu Xue494df12013-09-03 13:50:17 -070020#include "test/clear_system_state.h"
21#include "test/register_state_check.h"
Jingning Han4bd17112013-09-16 16:01:50 -070022#include "test/util.h"
James Zern002ad402014-01-18 13:03:31 -080023#include "vp9/common/vp9_entropy.h"
Scott LaVarnwayb9626462015-05-22 11:19:51 -070024#include "vp9/common/vp9_scan.h"
Deb Mukherjee10783d42014-09-02 16:34:09 -070025#include "vpx/vpx_codec.h"
James Zern002ad402014-01-18 13:03:31 -080026#include "vpx/vpx_integer.h"
Johann1d7ccd52015-05-11 19:09:22 -070027#include "vpx_ports/mem.h"
James Zern002ad402014-01-18 13:03:31 -080028
James Zernc47d8682015-05-14 19:38:34 -070029using libvpx_test::ACMRandom;
30
31namespace {
32
Deb Mukherjee10783d42014-09-02 16:34:09 -070033const int kNumCoeffs = 64;
34const double kPi = 3.141592653589793238462643383279502884;
James Zernc47d8682015-05-14 19:38:34 -070035
36const int kSignBiasMaxDiff255 = 1500;
37const int kSignBiasMaxDiff15 = 10000;
38
39typedef void (*FdctFunc)(const int16_t *in, tran_low_t *out, int stride);
40typedef void (*IdctFunc)(const tran_low_t *in, uint8_t *out, int stride);
41typedef void (*FhtFunc)(const int16_t *in, tran_low_t *out, int stride,
42 int tx_type);
43typedef void (*IhtFunc)(const tran_low_t *in, uint8_t *out, int stride,
44 int tx_type);
45
46typedef std::tr1::tuple<FdctFunc, IdctFunc, int, vpx_bit_depth_t> Dct8x8Param;
47typedef std::tr1::tuple<FhtFunc, IhtFunc, int, vpx_bit_depth_t> Ht8x8Param;
48typedef std::tr1::tuple<IdctFunc, IdctFunc, int, vpx_bit_depth_t> Idct8x8Param;
49
James Zerncffef112016-02-11 18:27:00 -080050void reference_8x8_dct_1d(const double in[8], double out[8]) {
Deb Mukherjee10783d42014-09-02 16:34:09 -070051 const double kInvSqrt2 = 0.707106781186547524400844362104;
52 for (int k = 0; k < 8; k++) {
53 out[k] = 0.0;
54 for (int n = 0; n < 8; n++)
55 out[k] += in[n] * cos(kPi * (2 * n + 1) * k / 16.0);
56 if (k == 0)
57 out[k] = out[k] * kInvSqrt2;
58 }
59}
60
61void reference_8x8_dct_2d(const int16_t input[kNumCoeffs],
62 double output[kNumCoeffs]) {
63 // First transform columns
64 for (int i = 0; i < 8; ++i) {
65 double temp_in[8], temp_out[8];
66 for (int j = 0; j < 8; ++j)
67 temp_in[j] = input[j*8 + i];
James Zerncffef112016-02-11 18:27:00 -080068 reference_8x8_dct_1d(temp_in, temp_out);
Deb Mukherjee10783d42014-09-02 16:34:09 -070069 for (int j = 0; j < 8; ++j)
70 output[j * 8 + i] = temp_out[j];
71 }
72 // Then transform rows
73 for (int i = 0; i < 8; ++i) {
74 double temp_in[8], temp_out[8];
75 for (int j = 0; j < 8; ++j)
76 temp_in[j] = output[j + i*8];
James Zerncffef112016-02-11 18:27:00 -080077 reference_8x8_dct_1d(temp_in, temp_out);
Deb Mukherjee10783d42014-09-02 16:34:09 -070078 // Scale by some magic number
79 for (int j = 0; j < 8; ++j)
80 output[j + i * 8] = temp_out[j] * 2;
81 }
Daniel Kang26641c72012-06-28 16:26:31 -070082}
Daniel Kang26641c72012-06-28 16:26:31 -070083
Joshua Litt51490e52013-11-18 17:07:55 -080084
James Zerncffef112016-02-11 18:27:00 -080085void fdct8x8_ref(const int16_t *in, tran_low_t *out, int stride,
86 int /*tx_type*/) {
Jingning Han4b5109c2015-07-28 15:57:40 -070087 vpx_fdct8x8_c(in, out, stride);
Jingning Hanab362622013-06-21 11:45:47 -070088}
Jingning Han4bd17112013-09-16 16:01:50 -070089
Deb Mukherjee10783d42014-09-02 16:34:09 -070090void fht8x8_ref(const int16_t *in, tran_low_t *out, int stride, int tx_type) {
Dmitry Kovalev005fc692014-02-06 11:54:15 -080091 vp9_fht8x8_c(in, out, stride, tx_type);
Jingning Hanab362622013-06-21 11:45:47 -070092}
Daniel Kang26641c72012-06-28 16:26:31 -070093
Deb Mukherjee10783d42014-09-02 16:34:09 -070094#if CONFIG_VP9_HIGHBITDEPTH
95void idct8x8_10(const tran_low_t *in, uint8_t *out, int stride) {
Jingning Han08a453b2015-08-03 14:51:10 -070096 vpx_highbd_idct8x8_64_add_c(in, out, stride, 10);
Deb Mukherjee10783d42014-09-02 16:34:09 -070097}
98
99void idct8x8_12(const tran_low_t *in, uint8_t *out, int stride) {
Jingning Han08a453b2015-08-03 14:51:10 -0700100 vpx_highbd_idct8x8_64_add_c(in, out, stride, 12);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700101}
102
103void iht8x8_10(const tran_low_t *in, uint8_t *out, int stride, int tx_type) {
Deb Mukherjee1929c9b2014-10-08 12:43:22 -0700104 vp9_highbd_iht8x8_64_add_c(in, out, stride, tx_type, 10);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700105}
106
107void iht8x8_12(const tran_low_t *in, uint8_t *out, int stride, int tx_type) {
Deb Mukherjee1929c9b2014-10-08 12:43:22 -0700108 vp9_highbd_iht8x8_64_add_c(in, out, stride, tx_type, 12);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700109}
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100110
James Zernf74e04c2016-02-03 23:04:42 -0800111#if HAVE_SSE2
112
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100113void idct8x8_10_add_10_c(const tran_low_t *in, uint8_t *out, int stride) {
Jingning Han08a453b2015-08-03 14:51:10 -0700114 vpx_highbd_idct8x8_10_add_c(in, out, stride, 10);
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100115}
116
117void idct8x8_10_add_12_c(const tran_low_t *in, uint8_t *out, int stride) {
Jingning Han08a453b2015-08-03 14:51:10 -0700118 vpx_highbd_idct8x8_10_add_c(in, out, stride, 12);
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100119}
120
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100121void idct8x8_10_add_10_sse2(const tran_low_t *in, uint8_t *out, int stride) {
Jingning Han08a453b2015-08-03 14:51:10 -0700122 vpx_highbd_idct8x8_10_add_sse2(in, out, stride, 10);
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100123}
124
125void idct8x8_10_add_12_sse2(const tran_low_t *in, uint8_t *out, int stride) {
Jingning Han08a453b2015-08-03 14:51:10 -0700126 vpx_highbd_idct8x8_10_add_sse2(in, out, stride, 12);
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100127}
128
129void idct8x8_64_add_10_sse2(const tran_low_t *in, uint8_t *out, int stride) {
Jingning Han08a453b2015-08-03 14:51:10 -0700130 vpx_highbd_idct8x8_64_add_sse2(in, out, stride, 10);
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100131}
132
133void idct8x8_64_add_12_sse2(const tran_low_t *in, uint8_t *out, int stride) {
Jingning Han08a453b2015-08-03 14:51:10 -0700134 vpx_highbd_idct8x8_64_add_sse2(in, out, stride, 12);
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100135}
136#endif // HAVE_SSE2
137#endif // CONFIG_VP9_HIGHBITDEPTH
Deb Mukherjee10783d42014-09-02 16:34:09 -0700138
Jingning Han4bd17112013-09-16 16:01:50 -0700139class FwdTrans8x8TestBase {
Jingning Hanab362622013-06-21 11:45:47 -0700140 public:
Jingning Han4bd17112013-09-16 16:01:50 -0700141 virtual ~FwdTrans8x8TestBase() {}
Jingning Hanab362622013-06-21 11:45:47 -0700142
143 protected:
Deb Mukherjee10783d42014-09-02 16:34:09 -0700144 virtual void RunFwdTxfm(int16_t *in, tran_low_t *out, int stride) = 0;
145 virtual void RunInvTxfm(tran_low_t *out, uint8_t *dst, int stride) = 0;
Jingning Hanab362622013-06-21 11:45:47 -0700146
Jingning Han4bd17112013-09-16 16:01:50 -0700147 void RunSignBiasCheck() {
148 ACMRandom rnd(ACMRandom::DeterministicSeed());
James Zernfd3658b2015-05-02 13:24:16 -0700149 DECLARE_ALIGNED(16, int16_t, test_input_block[64]);
150 DECLARE_ALIGNED(16, tran_low_t, test_output_block[64]);
Jingning Han4bd17112013-09-16 16:01:50 -0700151 int count_sign_block[64][2];
152 const int count_test_block = 100000;
Jingning Hanab362622013-06-21 11:45:47 -0700153
Jingning Han4bd17112013-09-16 16:01:50 -0700154 memset(count_sign_block, 0, sizeof(count_sign_block));
Daniel Kang26641c72012-06-28 16:26:31 -0700155
Jingning Han4bd17112013-09-16 16:01:50 -0700156 for (int i = 0; i < count_test_block; ++i) {
157 // Initialize a test block with input range [-255, 255].
158 for (int j = 0; j < 64; ++j)
Deb Mukherjee10783d42014-09-02 16:34:09 -0700159 test_input_block[j] = ((rnd.Rand16() >> (16 - bit_depth_)) & mask_) -
160 ((rnd.Rand16() >> (16 - bit_depth_)) & mask_);
James Zern29e1b1a2014-07-09 21:02:02 -0700161 ASM_REGISTER_STATE_CHECK(
Jingning Han4bd17112013-09-16 16:01:50 -0700162 RunFwdTxfm(test_input_block, test_output_block, pitch_));
Daniel Kang26641c72012-06-28 16:26:31 -0700163
Jingning Han4bd17112013-09-16 16:01:50 -0700164 for (int j = 0; j < 64; ++j) {
165 if (test_output_block[j] < 0)
166 ++count_sign_block[j][0];
167 else if (test_output_block[j] > 0)
168 ++count_sign_block[j][1];
169 }
170 }
Daniel Kang26641c72012-06-28 16:26:31 -0700171
172 for (int j = 0; j < 64; ++j) {
Jingning Han4bd17112013-09-16 16:01:50 -0700173 const int diff = abs(count_sign_block[j][0] - count_sign_block[j][1]);
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800174 const int max_diff = kSignBiasMaxDiff255;
Deb Mukherjee10783d42014-09-02 16:34:09 -0700175 EXPECT_LT(diff, max_diff << (bit_depth_ - 8))
Jingning Han4bd17112013-09-16 16:01:50 -0700176 << "Error: 8x8 FDCT/FHT has a sign bias > "
177 << 1. * max_diff / count_test_block * 100 << "%"
178 << " for input range [-255, 255] at index " << j
179 << " count0: " << count_sign_block[j][0]
180 << " count1: " << count_sign_block[j][1]
181 << " diff: " << diff;
182 }
183
184 memset(count_sign_block, 0, sizeof(count_sign_block));
185
186 for (int i = 0; i < count_test_block; ++i) {
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100187 // Initialize a test block with input range [-mask_ / 16, mask_ / 16].
Jingning Han4bd17112013-09-16 16:01:50 -0700188 for (int j = 0; j < 64; ++j)
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100189 test_input_block[j] = ((rnd.Rand16() & mask_) >> 4) -
190 ((rnd.Rand16() & mask_) >> 4);
James Zern29e1b1a2014-07-09 21:02:02 -0700191 ASM_REGISTER_STATE_CHECK(
Jingning Han4bd17112013-09-16 16:01:50 -0700192 RunFwdTxfm(test_input_block, test_output_block, pitch_));
193
194 for (int j = 0; j < 64; ++j) {
195 if (test_output_block[j] < 0)
196 ++count_sign_block[j][0];
197 else if (test_output_block[j] > 0)
198 ++count_sign_block[j][1];
199 }
200 }
201
202 for (int j = 0; j < 64; ++j) {
203 const int diff = abs(count_sign_block[j][0] - count_sign_block[j][1]);
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800204 const int max_diff = kSignBiasMaxDiff15;
Deb Mukherjee10783d42014-09-02 16:34:09 -0700205 EXPECT_LT(diff, max_diff << (bit_depth_ - 8))
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800206 << "Error: 8x8 FDCT/FHT has a sign bias > "
Jingning Han4bd17112013-09-16 16:01:50 -0700207 << 1. * max_diff / count_test_block * 100 << "%"
208 << " for input range [-15, 15] at index " << j
209 << " count0: " << count_sign_block[j][0]
210 << " count1: " << count_sign_block[j][1]
211 << " diff: " << diff;
Daniel Kang26641c72012-06-28 16:26:31 -0700212 }
213 }
214
Jingning Han4bd17112013-09-16 16:01:50 -0700215 void RunRoundTripErrorCheck() {
216 ACMRandom rnd(ACMRandom::DeterministicSeed());
217 int max_error = 0;
218 int total_error = 0;
219 const int count_test_block = 100000;
James Zernfd3658b2015-05-02 13:24:16 -0700220 DECLARE_ALIGNED(16, int16_t, test_input_block[64]);
221 DECLARE_ALIGNED(16, tran_low_t, test_temp_block[64]);
222 DECLARE_ALIGNED(16, uint8_t, dst[64]);
223 DECLARE_ALIGNED(16, uint8_t, src[64]);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700224#if CONFIG_VP9_HIGHBITDEPTH
James Zernfd3658b2015-05-02 13:24:16 -0700225 DECLARE_ALIGNED(16, uint16_t, dst16[64]);
226 DECLARE_ALIGNED(16, uint16_t, src16[64]);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700227#endif
Daniel Kang26641c72012-06-28 16:26:31 -0700228
Jingning Han4bd17112013-09-16 16:01:50 -0700229 for (int i = 0; i < count_test_block; ++i) {
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100230 // Initialize a test block with input range [-mask_, mask_].
Jingning Han4bd17112013-09-16 16:01:50 -0700231 for (int j = 0; j < 64; ++j) {
Deb Mukherjee10783d42014-09-02 16:34:09 -0700232 if (bit_depth_ == VPX_BITS_8) {
233 src[j] = rnd.Rand8();
234 dst[j] = rnd.Rand8();
235 test_input_block[j] = src[j] - dst[j];
236#if CONFIG_VP9_HIGHBITDEPTH
237 } else {
238 src16[j] = rnd.Rand16() & mask_;
239 dst16[j] = rnd.Rand16() & mask_;
240 test_input_block[j] = src16[j] - dst16[j];
241#endif
242 }
Jingning Han4bd17112013-09-16 16:01:50 -0700243 }
Daniel Kang26641c72012-06-28 16:26:31 -0700244
James Zern29e1b1a2014-07-09 21:02:02 -0700245 ASM_REGISTER_STATE_CHECK(
Jingning Han4bd17112013-09-16 16:01:50 -0700246 RunFwdTxfm(test_input_block, test_temp_block, pitch_));
247 for (int j = 0; j < 64; ++j) {
248 if (test_temp_block[j] > 0) {
249 test_temp_block[j] += 2;
250 test_temp_block[j] /= 4;
251 test_temp_block[j] *= 4;
252 } else {
253 test_temp_block[j] -= 2;
254 test_temp_block[j] /= 4;
255 test_temp_block[j] *= 4;
256 }
257 }
Deb Mukherjee10783d42014-09-02 16:34:09 -0700258 if (bit_depth_ == VPX_BITS_8) {
259 ASM_REGISTER_STATE_CHECK(
260 RunInvTxfm(test_temp_block, dst, pitch_));
261#if CONFIG_VP9_HIGHBITDEPTH
262 } else {
263 ASM_REGISTER_STATE_CHECK(
264 RunInvTxfm(test_temp_block, CONVERT_TO_BYTEPTR(dst16), pitch_));
265#endif
266 }
Daniel Kang26641c72012-06-28 16:26:31 -0700267
Jingning Han4bd17112013-09-16 16:01:50 -0700268 for (int j = 0; j < 64; ++j) {
Deb Mukherjee10783d42014-09-02 16:34:09 -0700269#if CONFIG_VP9_HIGHBITDEPTH
270 const int diff =
271 bit_depth_ == VPX_BITS_8 ? dst[j] - src[j] : dst16[j] - src16[j];
272#else
Jingning Han4bd17112013-09-16 16:01:50 -0700273 const int diff = dst[j] - src[j];
Deb Mukherjee10783d42014-09-02 16:34:09 -0700274#endif
Jingning Han4bd17112013-09-16 16:01:50 -0700275 const int error = diff * diff;
276 if (max_error < error)
277 max_error = error;
278 total_error += error;
279 }
Daniel Kang26641c72012-06-28 16:26:31 -0700280 }
281
Deb Mukherjee10783d42014-09-02 16:34:09 -0700282 EXPECT_GE(1 << 2 * (bit_depth_ - 8), max_error)
Jingning Han4bd17112013-09-16 16:01:50 -0700283 << "Error: 8x8 FDCT/IDCT or FHT/IHT has an individual"
284 << " roundtrip error > 1";
Daniel Kang26641c72012-06-28 16:26:31 -0700285
Deb Mukherjee10783d42014-09-02 16:34:09 -0700286 EXPECT_GE((count_test_block << 2 * (bit_depth_ - 8))/5, total_error)
Jingning Han4bd17112013-09-16 16:01:50 -0700287 << "Error: 8x8 FDCT/IDCT or FHT/IHT has average roundtrip "
288 << "error > 1/5 per block";
Daniel Kang26641c72012-06-28 16:26:31 -0700289 }
Jingning Han4bd17112013-09-16 16:01:50 -0700290
291 void RunExtremalCheck() {
292 ACMRandom rnd(ACMRandom::DeterministicSeed());
293 int max_error = 0;
294 int total_error = 0;
Jingning Han5c2696c2014-06-02 16:40:01 -0700295 int total_coeff_error = 0;
Jingning Han4bd17112013-09-16 16:01:50 -0700296 const int count_test_block = 100000;
James Zernfd3658b2015-05-02 13:24:16 -0700297 DECLARE_ALIGNED(16, int16_t, test_input_block[64]);
298 DECLARE_ALIGNED(16, tran_low_t, test_temp_block[64]);
299 DECLARE_ALIGNED(16, tran_low_t, ref_temp_block[64]);
300 DECLARE_ALIGNED(16, uint8_t, dst[64]);
301 DECLARE_ALIGNED(16, uint8_t, src[64]);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700302#if CONFIG_VP9_HIGHBITDEPTH
James Zernfd3658b2015-05-02 13:24:16 -0700303 DECLARE_ALIGNED(16, uint16_t, dst16[64]);
304 DECLARE_ALIGNED(16, uint16_t, src16[64]);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700305#endif
Jingning Han4bd17112013-09-16 16:01:50 -0700306
307 for (int i = 0; i < count_test_block; ++i) {
Deb Mukherjee10783d42014-09-02 16:34:09 -0700308 // Initialize a test block with input range [-mask_, mask_].
Jingning Han4bd17112013-09-16 16:01:50 -0700309 for (int j = 0; j < 64; ++j) {
Deb Mukherjee10783d42014-09-02 16:34:09 -0700310 if (bit_depth_ == VPX_BITS_8) {
311 if (i == 0) {
312 src[j] = 255;
313 dst[j] = 0;
314 } else if (i == 1) {
315 src[j] = 0;
316 dst[j] = 255;
317 } else {
318 src[j] = rnd.Rand8() % 2 ? 255 : 0;
319 dst[j] = rnd.Rand8() % 2 ? 255 : 0;
320 }
321 test_input_block[j] = src[j] - dst[j];
322#if CONFIG_VP9_HIGHBITDEPTH
Jingning Han0343e302014-06-03 16:45:22 -0700323 } else {
Deb Mukherjee10783d42014-09-02 16:34:09 -0700324 if (i == 0) {
325 src16[j] = mask_;
326 dst16[j] = 0;
327 } else if (i == 1) {
328 src16[j] = 0;
329 dst16[j] = mask_;
330 } else {
331 src16[j] = rnd.Rand8() % 2 ? mask_ : 0;
332 dst16[j] = rnd.Rand8() % 2 ? mask_ : 0;
333 }
334 test_input_block[j] = src16[j] - dst16[j];
335#endif
Jingning Han5c2696c2014-06-02 16:40:01 -0700336 }
Jingning Han4bd17112013-09-16 16:01:50 -0700337 }
338
James Zern29e1b1a2014-07-09 21:02:02 -0700339 ASM_REGISTER_STATE_CHECK(
Jingning Han4bd17112013-09-16 16:01:50 -0700340 RunFwdTxfm(test_input_block, test_temp_block, pitch_));
James Zern29e1b1a2014-07-09 21:02:02 -0700341 ASM_REGISTER_STATE_CHECK(
Jingning Han5c2696c2014-06-02 16:40:01 -0700342 fwd_txfm_ref(test_input_block, ref_temp_block, pitch_, tx_type_));
Deb Mukherjee10783d42014-09-02 16:34:09 -0700343 if (bit_depth_ == VPX_BITS_8) {
344 ASM_REGISTER_STATE_CHECK(
345 RunInvTxfm(test_temp_block, dst, pitch_));
346#if CONFIG_VP9_HIGHBITDEPTH
347 } else {
348 ASM_REGISTER_STATE_CHECK(
349 RunInvTxfm(test_temp_block, CONVERT_TO_BYTEPTR(dst16), pitch_));
350#endif
351 }
Jingning Han4bd17112013-09-16 16:01:50 -0700352
353 for (int j = 0; j < 64; ++j) {
Deb Mukherjee10783d42014-09-02 16:34:09 -0700354#if CONFIG_VP9_HIGHBITDEPTH
355 const int diff =
356 bit_depth_ == VPX_BITS_8 ? dst[j] - src[j] : dst16[j] - src16[j];
357#else
Jingning Han4bd17112013-09-16 16:01:50 -0700358 const int diff = dst[j] - src[j];
Deb Mukherjee10783d42014-09-02 16:34:09 -0700359#endif
Jingning Han4bd17112013-09-16 16:01:50 -0700360 const int error = diff * diff;
361 if (max_error < error)
362 max_error = error;
363 total_error += error;
Jingning Han5c2696c2014-06-02 16:40:01 -0700364
365 const int coeff_diff = test_temp_block[j] - ref_temp_block[j];
366 total_coeff_error += abs(coeff_diff);
Jingning Han4bd17112013-09-16 16:01:50 -0700367 }
368
Deb Mukherjee10783d42014-09-02 16:34:09 -0700369 EXPECT_GE(1 << 2 * (bit_depth_ - 8), max_error)
Jingning Han4bd17112013-09-16 16:01:50 -0700370 << "Error: Extremal 8x8 FDCT/IDCT or FHT/IHT has"
371 << "an individual roundtrip error > 1";
372
Deb Mukherjee10783d42014-09-02 16:34:09 -0700373 EXPECT_GE((count_test_block << 2 * (bit_depth_ - 8))/5, total_error)
Jingning Han4bd17112013-09-16 16:01:50 -0700374 << "Error: Extremal 8x8 FDCT/IDCT or FHT/IHT has average"
375 << " roundtrip error > 1/5 per block";
Jingning Han5c2696c2014-06-02 16:40:01 -0700376
377 EXPECT_EQ(0, total_coeff_error)
378 << "Error: Extremal 8x8 FDCT/FHT has"
379 << "overflow issues in the intermediate steps > 1";
Jingning Han4bd17112013-09-16 16:01:50 -0700380 }
381 }
382
Deb Mukherjee10783d42014-09-02 16:34:09 -0700383 void RunInvAccuracyCheck() {
384 ACMRandom rnd(ACMRandom::DeterministicSeed());
385 const int count_test_block = 1000;
James Zernfd3658b2015-05-02 13:24:16 -0700386 DECLARE_ALIGNED(16, int16_t, in[kNumCoeffs]);
387 DECLARE_ALIGNED(16, tran_low_t, coeff[kNumCoeffs]);
388 DECLARE_ALIGNED(16, uint8_t, dst[kNumCoeffs]);
389 DECLARE_ALIGNED(16, uint8_t, src[kNumCoeffs]);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700390#if CONFIG_VP9_HIGHBITDEPTH
James Zernfd3658b2015-05-02 13:24:16 -0700391 DECLARE_ALIGNED(16, uint16_t, src16[kNumCoeffs]);
392 DECLARE_ALIGNED(16, uint16_t, dst16[kNumCoeffs]);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700393#endif
394
395 for (int i = 0; i < count_test_block; ++i) {
396 double out_r[kNumCoeffs];
397
398 // Initialize a test block with input range [-255, 255].
399 for (int j = 0; j < kNumCoeffs; ++j) {
400 if (bit_depth_ == VPX_BITS_8) {
401 src[j] = rnd.Rand8() % 2 ? 255 : 0;
402 dst[j] = src[j] > 0 ? 0 : 255;
403 in[j] = src[j] - dst[j];
404#if CONFIG_VP9_HIGHBITDEPTH
405 } else {
406 src16[j] = rnd.Rand8() % 2 ? mask_ : 0;
407 dst16[j] = src16[j] > 0 ? 0 : mask_;
408 in[j] = src16[j] - dst16[j];
409#endif
410 }
411 }
412
413 reference_8x8_dct_2d(in, out_r);
414 for (int j = 0; j < kNumCoeffs; ++j)
Deb Mukherjee41e6ec42014-09-13 04:11:50 -0700415 coeff[j] = static_cast<tran_low_t>(round(out_r[j]));
Deb Mukherjee10783d42014-09-02 16:34:09 -0700416
417 if (bit_depth_ == VPX_BITS_8) {
418 ASM_REGISTER_STATE_CHECK(RunInvTxfm(coeff, dst, pitch_));
419#if CONFIG_VP9_HIGHBITDEPTH
420 } else {
421 ASM_REGISTER_STATE_CHECK(RunInvTxfm(coeff, CONVERT_TO_BYTEPTR(dst16),
422 pitch_));
423#endif
424 }
425
426 for (int j = 0; j < kNumCoeffs; ++j) {
427#if CONFIG_VP9_HIGHBITDEPTH
428 const uint32_t diff =
429 bit_depth_ == VPX_BITS_8 ? dst[j] - src[j] : dst16[j] - src16[j];
430#else
431 const uint32_t diff = dst[j] - src[j];
432#endif
433 const uint32_t error = diff * diff;
434 EXPECT_GE(1u << 2 * (bit_depth_ - 8), error)
435 << "Error: 8x8 IDCT has error " << error
436 << " at index " << j;
437 }
438 }
439 }
440
441 void RunFwdAccuracyCheck() {
442 ACMRandom rnd(ACMRandom::DeterministicSeed());
443 const int count_test_block = 1000;
James Zernfd3658b2015-05-02 13:24:16 -0700444 DECLARE_ALIGNED(16, int16_t, in[kNumCoeffs]);
445 DECLARE_ALIGNED(16, tran_low_t, coeff_r[kNumCoeffs]);
446 DECLARE_ALIGNED(16, tran_low_t, coeff[kNumCoeffs]);
Deb Mukherjee10783d42014-09-02 16:34:09 -0700447
448 for (int i = 0; i < count_test_block; ++i) {
449 double out_r[kNumCoeffs];
450
451 // Initialize a test block with input range [-mask_, mask_].
452 for (int j = 0; j < kNumCoeffs; ++j)
453 in[j] = rnd.Rand8() % 2 == 0 ? mask_ : -mask_;
454
455 RunFwdTxfm(in, coeff, pitch_);
456 reference_8x8_dct_2d(in, out_r);
457 for (int j = 0; j < kNumCoeffs; ++j)
Deb Mukherjee41e6ec42014-09-13 04:11:50 -0700458 coeff_r[j] = static_cast<tran_low_t>(round(out_r[j]));
Deb Mukherjee10783d42014-09-02 16:34:09 -0700459
460 for (int j = 0; j < kNumCoeffs; ++j) {
461 const uint32_t diff = coeff[j] - coeff_r[j];
462 const uint32_t error = diff * diff;
463 EXPECT_GE(9u << 2 * (bit_depth_ - 8), error)
464 << "Error: 8x8 DCT has error " << error
465 << " at index " << j;
466 }
467 }
468 }
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100469
470void CompareInvReference(IdctFunc ref_txfm, int thresh) {
471 ACMRandom rnd(ACMRandom::DeterministicSeed());
472 const int count_test_block = 10000;
473 const int eob = 12;
James Zernfd3658b2015-05-02 13:24:16 -0700474 DECLARE_ALIGNED(16, tran_low_t, coeff[kNumCoeffs]);
475 DECLARE_ALIGNED(16, uint8_t, dst[kNumCoeffs]);
476 DECLARE_ALIGNED(16, uint8_t, ref[kNumCoeffs]);
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100477#if CONFIG_VP9_HIGHBITDEPTH
James Zernfd3658b2015-05-02 13:24:16 -0700478 DECLARE_ALIGNED(16, uint16_t, dst16[kNumCoeffs]);
479 DECLARE_ALIGNED(16, uint16_t, ref16[kNumCoeffs]);
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100480#endif
481 const int16_t *scan = vp9_default_scan_orders[TX_8X8].scan;
482
483 for (int i = 0; i < count_test_block; ++i) {
484 for (int j = 0; j < kNumCoeffs; ++j) {
485 if (j < eob) {
486 // Random values less than the threshold, either positive or negative
487 coeff[scan[j]] = rnd(thresh) * (1-2*(i%2));
488 } else {
489 coeff[scan[j]] = 0;
490 }
491 if (bit_depth_ == VPX_BITS_8) {
492 dst[j] = 0;
493 ref[j] = 0;
494#if CONFIG_VP9_HIGHBITDEPTH
495 } else {
496 dst16[j] = 0;
497 ref16[j] = 0;
498#endif
499 }
500 }
501 if (bit_depth_ == VPX_BITS_8) {
502 ref_txfm(coeff, ref, pitch_);
503 ASM_REGISTER_STATE_CHECK(RunInvTxfm(coeff, dst, pitch_));
504#if CONFIG_VP9_HIGHBITDEPTH
505 } else {
506 ref_txfm(coeff, CONVERT_TO_BYTEPTR(ref16), pitch_);
507 ASM_REGISTER_STATE_CHECK(RunInvTxfm(coeff, CONVERT_TO_BYTEPTR(dst16),
508 pitch_));
509#endif
510 }
511
512 for (int j = 0; j < kNumCoeffs; ++j) {
513#if CONFIG_VP9_HIGHBITDEPTH
514 const uint32_t diff =
515 bit_depth_ == VPX_BITS_8 ? dst[j] - ref[j] : dst16[j] - ref16[j];
516#else
517 const uint32_t diff = dst[j] - ref[j];
518#endif
519 const uint32_t error = diff * diff;
520 EXPECT_EQ(0u, error)
521 << "Error: 8x8 IDCT has error " << error
522 << " at index " << j;
523 }
524 }
525 }
Jingning Han4bd17112013-09-16 16:01:50 -0700526 int pitch_;
527 int tx_type_;
James Zern54697d32014-07-16 18:56:22 -0700528 FhtFunc fwd_txfm_ref;
Deb Mukherjee10783d42014-09-02 16:34:09 -0700529 vpx_bit_depth_t bit_depth_;
530 int mask_;
Jingning Han4bd17112013-09-16 16:01:50 -0700531};
532
Joshua Litt51490e52013-11-18 17:07:55 -0800533class FwdTrans8x8DCT
534 : public FwdTrans8x8TestBase,
James Zern54697d32014-07-16 18:56:22 -0700535 public ::testing::TestWithParam<Dct8x8Param> {
Jingning Han4bd17112013-09-16 16:01:50 -0700536 public:
537 virtual ~FwdTrans8x8DCT() {}
538
539 virtual void SetUp() {
540 fwd_txfm_ = GET_PARAM(0);
541 inv_txfm_ = GET_PARAM(1);
542 tx_type_ = GET_PARAM(2);
Dmitry Kovaleve5fa44c2013-10-18 12:20:26 -0700543 pitch_ = 8;
Jingning Han4bd17112013-09-16 16:01:50 -0700544 fwd_txfm_ref = fdct8x8_ref;
Deb Mukherjee10783d42014-09-02 16:34:09 -0700545 bit_depth_ = GET_PARAM(3);
546 mask_ = (1 << bit_depth_) - 1;
Jingning Han4bd17112013-09-16 16:01:50 -0700547 }
548
549 virtual void TearDown() { libvpx_test::ClearSystemState(); }
550
551 protected:
Deb Mukherjee10783d42014-09-02 16:34:09 -0700552 void RunFwdTxfm(int16_t *in, tran_low_t *out, int stride) {
Jingning Han4bd17112013-09-16 16:01:50 -0700553 fwd_txfm_(in, out, stride);
554 }
Deb Mukherjee10783d42014-09-02 16:34:09 -0700555 void RunInvTxfm(tran_low_t *out, uint8_t *dst, int stride) {
Dmitry Kovaleve5fa44c2013-10-18 12:20:26 -0700556 inv_txfm_(out, dst, stride);
Jingning Han4bd17112013-09-16 16:01:50 -0700557 }
558
James Zern54697d32014-07-16 18:56:22 -0700559 FdctFunc fwd_txfm_;
560 IdctFunc inv_txfm_;
Jingning Han4bd17112013-09-16 16:01:50 -0700561};
562
563TEST_P(FwdTrans8x8DCT, SignBiasCheck) {
564 RunSignBiasCheck();
Jingning Hanab362622013-06-21 11:45:47 -0700565}
Daniel Kang26641c72012-06-28 16:26:31 -0700566
Jingning Han4bd17112013-09-16 16:01:50 -0700567TEST_P(FwdTrans8x8DCT, RoundTripErrorCheck) {
568 RunRoundTripErrorCheck();
569}
570
571TEST_P(FwdTrans8x8DCT, ExtremalCheck) {
572 RunExtremalCheck();
573}
574
Deb Mukherjee10783d42014-09-02 16:34:09 -0700575TEST_P(FwdTrans8x8DCT, FwdAccuracyCheck) {
576 RunFwdAccuracyCheck();
577}
578
579TEST_P(FwdTrans8x8DCT, InvAccuracyCheck) {
580 RunInvAccuracyCheck();
581}
582
Joshua Litt51490e52013-11-18 17:07:55 -0800583class FwdTrans8x8HT
584 : public FwdTrans8x8TestBase,
James Zern54697d32014-07-16 18:56:22 -0700585 public ::testing::TestWithParam<Ht8x8Param> {
Jingning Han4bd17112013-09-16 16:01:50 -0700586 public:
587 virtual ~FwdTrans8x8HT() {}
588
589 virtual void SetUp() {
590 fwd_txfm_ = GET_PARAM(0);
591 inv_txfm_ = GET_PARAM(1);
592 tx_type_ = GET_PARAM(2);
593 pitch_ = 8;
594 fwd_txfm_ref = fht8x8_ref;
Deb Mukherjee10783d42014-09-02 16:34:09 -0700595 bit_depth_ = GET_PARAM(3);
596 mask_ = (1 << bit_depth_) - 1;
Jingning Han4bd17112013-09-16 16:01:50 -0700597 }
598
599 virtual void TearDown() { libvpx_test::ClearSystemState(); }
600
601 protected:
Deb Mukherjee10783d42014-09-02 16:34:09 -0700602 void RunFwdTxfm(int16_t *in, tran_low_t *out, int stride) {
Jingning Han4bd17112013-09-16 16:01:50 -0700603 fwd_txfm_(in, out, stride, tx_type_);
604 }
Deb Mukherjee10783d42014-09-02 16:34:09 -0700605 void RunInvTxfm(tran_low_t *out, uint8_t *dst, int stride) {
Jingning Han4bd17112013-09-16 16:01:50 -0700606 inv_txfm_(out, dst, stride, tx_type_);
607 }
608
James Zern54697d32014-07-16 18:56:22 -0700609 FhtFunc fwd_txfm_;
610 IhtFunc inv_txfm_;
Jingning Han4bd17112013-09-16 16:01:50 -0700611};
612
613TEST_P(FwdTrans8x8HT, SignBiasCheck) {
614 RunSignBiasCheck();
615}
616
617TEST_P(FwdTrans8x8HT, RoundTripErrorCheck) {
618 RunRoundTripErrorCheck();
619}
620
621TEST_P(FwdTrans8x8HT, ExtremalCheck) {
622 RunExtremalCheck();
623}
624
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100625class InvTrans8x8DCT
626 : public FwdTrans8x8TestBase,
627 public ::testing::TestWithParam<Idct8x8Param> {
628 public:
629 virtual ~InvTrans8x8DCT() {}
630
631 virtual void SetUp() {
632 ref_txfm_ = GET_PARAM(0);
633 inv_txfm_ = GET_PARAM(1);
634 thresh_ = GET_PARAM(2);
635 pitch_ = 8;
636 bit_depth_ = GET_PARAM(3);
637 mask_ = (1 << bit_depth_) - 1;
638 }
639
640 virtual void TearDown() { libvpx_test::ClearSystemState(); }
641
642 protected:
643 void RunInvTxfm(tran_low_t *out, uint8_t *dst, int stride) {
644 inv_txfm_(out, dst, stride);
645 }
James Zerncffef112016-02-11 18:27:00 -0800646 void RunFwdTxfm(int16_t * /*out*/, tran_low_t * /*dst*/, int /*stride*/) {}
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100647
648 IdctFunc ref_txfm_;
649 IdctFunc inv_txfm_;
650 int thresh_;
651};
652
653TEST_P(InvTrans8x8DCT, CompareReference) {
654 CompareInvReference(ref_txfm_, thresh_);
655}
656
Jingning Han4bd17112013-09-16 16:01:50 -0700657using std::tr1::make_tuple;
658
Deb Mukherjee10783d42014-09-02 16:34:09 -0700659#if CONFIG_VP9_HIGHBITDEPTH
Jingning Han4bd17112013-09-16 16:01:50 -0700660INSTANTIATE_TEST_CASE_P(
661 C, FwdTrans8x8DCT,
662 ::testing::Values(
Jingning Han08a453b2015-08-03 14:51:10 -0700663 make_tuple(&vpx_fdct8x8_c, &vpx_idct8x8_64_add_c, 0, VPX_BITS_8),
Jingning Han4b5109c2015-07-28 15:57:40 -0700664 make_tuple(&vpx_highbd_fdct8x8_c, &idct8x8_10, 0, VPX_BITS_10),
665 make_tuple(&vpx_highbd_fdct8x8_c, &idct8x8_12, 0, VPX_BITS_12)));
Deb Mukherjee10783d42014-09-02 16:34:09 -0700666#else
667INSTANTIATE_TEST_CASE_P(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800668 C, FwdTrans8x8DCT,
Deb Mukherjee10783d42014-09-02 16:34:09 -0700669 ::testing::Values(
Jingning Han08a453b2015-08-03 14:51:10 -0700670 make_tuple(&vpx_fdct8x8_c, &vpx_idct8x8_64_add_c, 0, VPX_BITS_8)));
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100671#endif // CONFIG_VP9_HIGHBITDEPTH
Deb Mukherjee10783d42014-09-02 16:34:09 -0700672
673#if CONFIG_VP9_HIGHBITDEPTH
Jingning Han4bd17112013-09-16 16:01:50 -0700674INSTANTIATE_TEST_CASE_P(
675 C, FwdTrans8x8HT,
676 ::testing::Values(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800677 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_c, 0, VPX_BITS_8),
Deb Mukherjee1929c9b2014-10-08 12:43:22 -0700678 make_tuple(&vp9_highbd_fht8x8_c, &iht8x8_10, 0, VPX_BITS_10),
679 make_tuple(&vp9_highbd_fht8x8_c, &iht8x8_10, 1, VPX_BITS_10),
680 make_tuple(&vp9_highbd_fht8x8_c, &iht8x8_10, 2, VPX_BITS_10),
681 make_tuple(&vp9_highbd_fht8x8_c, &iht8x8_10, 3, VPX_BITS_10),
682 make_tuple(&vp9_highbd_fht8x8_c, &iht8x8_12, 0, VPX_BITS_12),
683 make_tuple(&vp9_highbd_fht8x8_c, &iht8x8_12, 1, VPX_BITS_12),
684 make_tuple(&vp9_highbd_fht8x8_c, &iht8x8_12, 2, VPX_BITS_12),
685 make_tuple(&vp9_highbd_fht8x8_c, &iht8x8_12, 3, VPX_BITS_12),
Deb Mukherjee10783d42014-09-02 16:34:09 -0700686 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_c, 1, VPX_BITS_8),
687 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_c, 2, VPX_BITS_8),
688 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_c, 3, VPX_BITS_8)));
689#else
James Zern615230b2014-12-01 15:10:00 -0800690INSTANTIATE_TEST_CASE_P(
Deb Mukherjee10783d42014-09-02 16:34:09 -0700691 C, FwdTrans8x8HT,
692 ::testing::Values(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800693 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_c, 0, VPX_BITS_8),
Deb Mukherjee10783d42014-09-02 16:34:09 -0700694 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_c, 1, VPX_BITS_8),
695 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_c, 2, VPX_BITS_8),
696 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_c, 3, VPX_BITS_8)));
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100697#endif // CONFIG_VP9_HIGHBITDEPTH
Jingning Han4bd17112013-09-16 16:01:50 -0700698
Deb Mukherjeed50716f2014-10-02 15:43:27 -0700699#if HAVE_NEON_ASM && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
James Zernc3331102014-02-25 23:11:49 -0800700INSTANTIATE_TEST_CASE_P(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800701 NEON, FwdTrans8x8DCT,
James Zernc3331102014-02-25 23:11:49 -0800702 ::testing::Values(
Jingning Han08a453b2015-08-03 14:51:10 -0700703 make_tuple(&vpx_fdct8x8_neon, &vpx_idct8x8_64_add_neon, 0,
Deb Mukherjee10783d42014-09-02 16:34:09 -0700704 VPX_BITS_8)));
James Yu4f856cd2014-01-29 01:31:07 +0800705#endif // HAVE_NEON_ASM && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
706
707#if HAVE_NEON && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
James Zernc3331102014-02-25 23:11:49 -0800708INSTANTIATE_TEST_CASE_P(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800709 NEON, FwdTrans8x8HT,
James Zernc3331102014-02-25 23:11:49 -0800710 ::testing::Values(
Deb Mukherjee10783d42014-09-02 16:34:09 -0700711 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_neon, 0, VPX_BITS_8),
712 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_neon, 1, VPX_BITS_8),
713 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_neon, 2, VPX_BITS_8),
714 make_tuple(&vp9_fht8x8_c, &vp9_iht8x8_64_add_neon, 3, VPX_BITS_8)));
James Yu4f856cd2014-01-29 01:31:07 +0800715#endif // HAVE_NEON && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
James Zernc3331102014-02-25 23:11:49 -0800716
Deb Mukherjeed50716f2014-10-02 15:43:27 -0700717#if HAVE_SSE2 && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
Jingning Han4bd17112013-09-16 16:01:50 -0700718INSTANTIATE_TEST_CASE_P(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800719 SSE2, FwdTrans8x8DCT,
Jingning Han4bd17112013-09-16 16:01:50 -0700720 ::testing::Values(
Jingning Han08a453b2015-08-03 14:51:10 -0700721 make_tuple(&vpx_fdct8x8_sse2, &vpx_idct8x8_64_add_sse2, 0,
Deb Mukherjee10783d42014-09-02 16:34:09 -0700722 VPX_BITS_8)));
Jingning Han4bd17112013-09-16 16:01:50 -0700723INSTANTIATE_TEST_CASE_P(
724 SSE2, FwdTrans8x8HT,
725 ::testing::Values(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800726 make_tuple(&vp9_fht8x8_sse2, &vp9_iht8x8_64_add_sse2, 0, VPX_BITS_8),
Deb Mukherjee10783d42014-09-02 16:34:09 -0700727 make_tuple(&vp9_fht8x8_sse2, &vp9_iht8x8_64_add_sse2, 1, VPX_BITS_8),
728 make_tuple(&vp9_fht8x8_sse2, &vp9_iht8x8_64_add_sse2, 2, VPX_BITS_8),
729 make_tuple(&vp9_fht8x8_sse2, &vp9_iht8x8_64_add_sse2, 3, VPX_BITS_8)));
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100730#endif // HAVE_SSE2 && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
731
732#if HAVE_SSE2 && CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
733INSTANTIATE_TEST_CASE_P(
734 SSE2, FwdTrans8x8DCT,
735 ::testing::Values(
Jingning Han08a453b2015-08-03 14:51:10 -0700736 make_tuple(&vpx_fdct8x8_sse2, &vpx_idct8x8_64_add_c, 0, VPX_BITS_8),
Jingning Han4b5109c2015-07-28 15:57:40 -0700737 make_tuple(&vpx_highbd_fdct8x8_c,
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100738 &idct8x8_64_add_10_sse2, 12, VPX_BITS_10),
Jingning Han4b5109c2015-07-28 15:57:40 -0700739 make_tuple(&vpx_highbd_fdct8x8_sse2,
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100740 &idct8x8_64_add_10_sse2, 12, VPX_BITS_10),
Jingning Han4b5109c2015-07-28 15:57:40 -0700741 make_tuple(&vpx_highbd_fdct8x8_c,
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100742 &idct8x8_64_add_12_sse2, 12, VPX_BITS_12),
Jingning Han4b5109c2015-07-28 15:57:40 -0700743 make_tuple(&vpx_highbd_fdct8x8_sse2,
James Zern615230b2014-12-01 15:10:00 -0800744 &idct8x8_64_add_12_sse2, 12, VPX_BITS_12)));
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100745
James Zern615230b2014-12-01 15:10:00 -0800746INSTANTIATE_TEST_CASE_P(
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100747 SSE2, FwdTrans8x8HT,
748 ::testing::Values(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800749 make_tuple(&vp9_fht8x8_sse2, &vp9_iht8x8_64_add_c, 0, VPX_BITS_8),
Peter de Rivaz7e40a552014-10-24 08:48:02 +0100750 make_tuple(&vp9_fht8x8_sse2, &vp9_iht8x8_64_add_c, 1, VPX_BITS_8),
751 make_tuple(&vp9_fht8x8_sse2, &vp9_iht8x8_64_add_c, 2, VPX_BITS_8),
752 make_tuple(&vp9_fht8x8_sse2, &vp9_iht8x8_64_add_c, 3, VPX_BITS_8)));
753
754// Optimizations take effect at a threshold of 6201, so we use a value close to
755// that to test both branches.
756INSTANTIATE_TEST_CASE_P(
757 SSE2, InvTrans8x8DCT,
758 ::testing::Values(
759 make_tuple(&idct8x8_10_add_10_c,
760 &idct8x8_10_add_10_sse2, 6225, VPX_BITS_10),
761 make_tuple(&idct8x8_10,
762 &idct8x8_64_add_10_sse2, 6225, VPX_BITS_10),
763 make_tuple(&idct8x8_10_add_12_c,
764 &idct8x8_10_add_12_sse2, 6225, VPX_BITS_12),
765 make_tuple(&idct8x8_12,
766 &idct8x8_64_add_12_sse2, 6225, VPX_BITS_12)));
767#endif // HAVE_SSE2 && CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
Jingning Hanb466ad52014-05-08 09:56:38 -0700768
Johannff8505a2015-06-29 16:44:30 -0700769#if HAVE_SSSE3 && CONFIG_USE_X86INC && ARCH_X86_64 && \
770 !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
Jingning Hanb466ad52014-05-08 09:56:38 -0700771INSTANTIATE_TEST_CASE_P(
Deb Mukherjee1fe643c2014-12-04 16:46:06 -0800772 SSSE3, FwdTrans8x8DCT,
Jingning Hanb466ad52014-05-08 09:56:38 -0700773 ::testing::Values(
Jingning Han08a453b2015-08-03 14:51:10 -0700774 make_tuple(&vpx_fdct8x8_ssse3, &vpx_idct8x8_64_add_ssse3, 0,
Deb Mukherjee10783d42014-09-02 16:34:09 -0700775 VPX_BITS_8)));
Jingning Hanb466ad52014-05-08 09:56:38 -0700776#endif
Parag Salasakar7c5f00f2015-05-08 12:23:27 +0530777
Jingning Han9aaf5232015-07-22 11:53:21 -0700778#if HAVE_MSA && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
Parag Salasakar7c5f00f2015-05-08 12:23:27 +0530779INSTANTIATE_TEST_CASE_P(
780 MSA, FwdTrans8x8DCT,
781 ::testing::Values(
Jingning Han08a453b2015-08-03 14:51:10 -0700782 make_tuple(&vpx_fdct8x8_msa, &vpx_idct8x8_64_add_msa, 0, VPX_BITS_8)));
Parag Salasakar7c5f00f2015-05-08 12:23:27 +0530783INSTANTIATE_TEST_CASE_P(
784 MSA, FwdTrans8x8HT,
785 ::testing::Values(
Parag Salasakar7ca84882015-06-18 12:03:30 +0530786 make_tuple(&vp9_fht8x8_msa, &vp9_iht8x8_64_add_msa, 0, VPX_BITS_8),
787 make_tuple(&vp9_fht8x8_msa, &vp9_iht8x8_64_add_msa, 1, VPX_BITS_8),
788 make_tuple(&vp9_fht8x8_msa, &vp9_iht8x8_64_add_msa, 2, VPX_BITS_8),
789 make_tuple(&vp9_fht8x8_msa, &vp9_iht8x8_64_add_msa, 3, VPX_BITS_8)));
Parag Salasakar7c5f00f2015-05-08 12:23:27 +0530790#endif // HAVE_MSA && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
Daniel Kang26641c72012-06-28 16:26:31 -0700791} // namespace