Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2012 The WebM project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
| 11 | #include <math.h> |
| 12 | #include <stdlib.h> |
| 13 | #include <string.h> |
| 14 | |
| 15 | #include "third_party/googletest/src/include/gtest/gtest.h" |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 16 | #include "test/acm_random.h" |
| 17 | #include "test/clear_system_state.h" |
| 18 | #include "test/register_state_check.h" |
| 19 | #include "test/util.h" |
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 20 | |
Yaowu Xu | afffa3d | 2013-09-05 08:45:56 -0700 | [diff] [blame] | 21 | #include "./vp9_rtcd.h" |
James Zern | 002ad40 | 2014-01-18 13:03:31 -0800 | [diff] [blame] | 22 | #include "vp9/common/vp9_entropy.h" |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 23 | #include "vpx/vpx_codec.h" |
James Zern | 002ad40 | 2014-01-18 13:03:31 -0800 | [diff] [blame] | 24 | #include "vpx/vpx_integer.h" |
| 25 | |
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 26 | using libvpx_test::ACMRandom; |
| 27 | |
| 28 | namespace { |
| 29 | |
#ifdef _MSC_VER
// Local round() used only when building with MSVC (presumably because the
// targeted MSVC runtimes lack round() -- confirm before removing).
// Halfway cases are rounded away from zero and the result is truncated to int.
static int round(double x) {
  const double nearest = (x < 0) ? ceil(x - 0.5) : floor(x + 0.5);
  return static_cast<int>(nearest);
}
#endif
| 38 | |
// Number of coefficients in one 16x16 block.
const int kNumCoeffs = 256;
const double PI = 3.1415926535898;

// Double-precision reference 16x16 inverse DCT, evaluated directly from the
// cosine-sum definition.
//
//   input  - 256 coefficients; element [i * 16 + j] is weighted by
//            cos(PI * i * (k + 0.5) / 16) * cos(PI * j * (l + 0.5) / 16).
//   output - 256 results; element [k * 16 + l] receives the weighted sum
//            divided by 256, with an extra sqrt(2) factor for every non-zero
//            frequency index.
//
// The cosine factors depend only on (frequency, position), so they are
// tabulated once instead of being re-evaluated inside the four nested loops.
// The per-term multiplication order is unchanged, so results are identical
// to evaluating cos() in place.
void reference2_16x16_idct_2d(double *input, double *output) {
  double basis[16][16];  // basis[f][p] = cos(PI * f * (p + 0.5) / 16)
  for (int f = 0; f < 16; ++f) {
    for (int p = 0; p < 16; ++p) {
      basis[f][p] = cos(PI * f * (p + 0.5) / 16.0);
    }
  }
  const double kSqrt2 = sqrt(2.0);

  for (int l = 0; l < 16; ++l) {
    for (int k = 0; k < 16; ++k) {
      double s = 0;
      for (int i = 0; i < 16; ++i) {
        for (int j = 0; j < 16; ++j) {
          double x = basis[j][l] * basis[i][k] * input[i * 16 + j] / 256;
          if (i != 0)
            x *= kSqrt2;
          if (j != 0)
            x *= kSqrt2;
          s += x;
        }
      }
      output[k * 16 + l] = s;
    }
  }
}
| 62 | |
Yaowu Xu | 0b17ea6 | 2012-08-07 13:55:49 -0700 | [diff] [blame] | 63 | |
// Rotation constants for the butterfly below; Ck is numerically
// cos(k * pi / 32).
const double C1 = 0.995184726672197;
const double C2 = 0.98078528040323;
const double C3 = 0.956940335732209;
const double C4 = 0.923879532511287;
const double C5 = 0.881921264348355;
const double C6 = 0.831469612302545;
const double C7 = 0.773010453362737;
const double C8 = 0.707106781186548;
const double C9 = 0.634393284163646;
const double C10 = 0.555570233019602;
const double C11 = 0.471396736825998;
const double C12 = 0.38268343236509;
const double C13 = 0.290284677254462;
const double C14 = 0.195090322016128;
const double C15 = 0.098017140329561;

// 16-point one-dimensional forward transform in double precision, computed
// as a four-stage butterfly network.
//
//   input  - 16 samples.
//   output - receives 16 results; it also serves as scratch space between
//            stages, so every entry is overwritten.
void butterfly_16x16_dct_1d(double input[16], double output[16]) {
  double step[16];

  // Stage 1: fold the input about its centre. Sums land in step[0..7],
  // differences in step[8..15] (mirrored order).
  for (int i = 0; i < 8; ++i) {
    const double head = input[i];
    const double tail = input[15 - i];
    step[i] = head + tail;
    step[15 - i] = head - tail;
  }

  // Stage 2: fold the sums again, and rotate the differences pairwise.
  for (int i = 0; i < 4; ++i) {
    output[i] = step[i] + step[7 - i];
    output[7 - i] = step[i] - step[7 - i];
  }

  output[8] = step[8] * C7 + step[15] * C9;
  output[9] = step[9] * C11 - step[14] * C5;
  output[10] = step[10] * C3 + step[13] * C13;
  output[11] = step[11] * C15 - step[12] * C1;
  output[12] = step[12] * C15 + step[11] * C1;
  output[13] = step[13] * C3 - step[10] * C13;
  output[14] = step[14] * C11 + step[9] * C5;
  output[15] = step[15] * C7 - step[8] * C9;

  // Stage 3.
  step[0] = output[0] + output[3];
  step[1] = output[1] + output[2];
  step[2] = output[1] - output[2];
  step[3] = output[0] - output[3];

  step[4] = output[4] * C14 + output[7] * C2;
  step[5] = output[5] * C10 + output[6] * C6;
  step[6] = output[6] * C10 - output[5] * C6;
  step[7] = output[7] * C14 - output[4] * C2;

  step[8] = output[8] + output[11];
  step[9] = output[9] + output[10];
  step[10] = output[9] - output[10];
  step[11] = output[8] - output[11];

  step[12] = output[12] + output[15];
  step[13] = output[13] + output[14];
  step[14] = output[13] - output[14];
  step[15] = output[12] - output[15];

  // Stage 4: final combinations, written to their destination slots.
  output[0] = step[0] + step[1];
  output[8] = step[0] - step[1];

  const double rot4 = step[2] * C12 + step[3] * C4;
  output[4] = 2 * (rot4 * C8);

  const double rot12 = step[3] * C12 - step[2] * C4;
  output[12] = 2 * (rot12 * C8);

  output[2] = 2 * ((step[4] + step[5]) * C8);
  output[14] = 2 * ((step[7] - step[6]) * C8);

  const double diff45 = step[4] - step[5];
  const double sum67 = step[6] + step[7];
  output[6] = diff45 + sum67;
  output[10] = diff45 - sum67;

  const double sum_8_14 = step[8] + step[14];
  const double sum_9_15 = step[9] + step[15];

  const double rot3 = sum_8_14 * C12 - sum_9_15 * C4;
  output[3] = 2 * (rot3 * C8);

  const double rot13 = sum_9_15 * C12 + sum_8_14 * C4;
  output[13] = 2 * (rot13 * C8);

  output[9] = 2 * ((step[10] + step[11]) * C8);

  const double diff_10_11 = step[10] - step[11];
  const double sum_12_13 = step[12] + step[13];
  const double diff_12_13 = step[12] - step[13];
  const double diff_8_14 = step[8] - step[14];
  const double diff_9_15 = step[9] - step[15];

  output[15] = diff_10_11 + sum_12_13;
  output[1] = -(diff_10_11 - sum_12_13);

  output[7] = 2 * (diff_12_13 * C8);

  const double rot11 = diff_8_14 * C12 - diff_9_15 * C4;
  output[11] = -2 * (rot11 * C8);

  const double rot5 = diff_9_15 * C12 + diff_8_14 * C4;
  output[5] = 2 * (rot5 * C8);
}
| 235 | |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 236 | void reference_16x16_dct_2d(int16_t input[256], double output[256]) { |
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 237 | // First transform columns |
| 238 | for (int i = 0; i < 16; ++i) { |
| 239 | double temp_in[16], temp_out[16]; |
| 240 | for (int j = 0; j < 16; ++j) |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 241 | temp_in[j] = input[j * 16 + i]; |
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 242 | butterfly_16x16_dct_1d(temp_in, temp_out); |
| 243 | for (int j = 0; j < 16; ++j) |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 244 | output[j * 16 + i] = temp_out[j]; |
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 245 | } |
| 246 | // Then transform rows |
| 247 | for (int i = 0; i < 16; ++i) { |
| 248 | double temp_in[16], temp_out[16]; |
| 249 | for (int j = 0; j < 16; ++j) |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 250 | temp_in[j] = output[j + i * 16]; |
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 251 | butterfly_16x16_dct_1d(temp_in, temp_out); |
| 252 | // Scale by some magic number |
| 253 | for (int j = 0; j < 16; ++j) |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 254 | output[j + i * 16] = temp_out[j]/2; |
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 255 | } |
| 256 | } |
| 257 | |
// Function-pointer shapes for the transforms exercised in this file.
// FdctFunc/IdctFunc take no transform type; FhtFunc/IhtFunc carry an extra
// tx_type argument. The *_ref wrappers in this file all use the Fht/Iht
// shapes.
typedef void (*FdctFunc)(const int16_t *in, tran_low_t *out, int stride);
typedef void (*IdctFunc)(const tran_low_t *in, uint8_t *out, int stride);
typedef void (*FhtFunc)(const int16_t *in, tran_low_t *out, int stride,
                        int tx_type);
typedef void (*IhtFunc)(const tran_low_t *in, uint8_t *out, int stride,
                        int tx_type);

// Test parameter tuples: (forward function, inverse function, int, bit depth).
// NOTE(review): the int is presumably the tx_type handed to the reference
// transforms -- confirm against the fixtures that unpack these tuples.
typedef std::tr1::tuple<FdctFunc, IdctFunc, int, vpx_bit_depth_t> Dct16x16Param;
typedef std::tr1::tuple<FhtFunc, IhtFunc, int, vpx_bit_depth_t> Ht16x16Param;
Joshua Litt | 51490e5 | 2013-11-18 17:07:55 -0800 | [diff] [blame] | 267 | |
// Adapter with the FhtFunc signature around vp9_fdct16x16_c. The transform
// type is ignored; its name is commented out so the parameter is not
// reported as unused.
void fdct16x16_ref(const int16_t *in, tran_low_t *out, int stride,
                   int /*tx_type*/) {
  vp9_fdct16x16_c(in, out, stride);
}
| 272 | |
// Adapter with the IhtFunc signature around vp9_idct16x16_256_add_c. The
// transform type is ignored; its name is commented out so the parameter is
// not reported as unused.
void idct16x16_ref(const tran_low_t *in, uint8_t *dest, int stride,
                   int /*tx_type*/) {
  vp9_idct16x16_256_add_c(in, dest, stride);
}
| 277 | |
// Reference forward hybrid transform: forwards every argument, including
// tx_type, to vp9_fht16x16_c.
void fht16x16_ref(const int16_t *in, tran_low_t *out, int stride,
                  int tx_type) {
  vp9_fht16x16_c(in, out, stride, tx_type);
}
| 282 | |
// Reference inverse hybrid transform: forwards every argument, including
// tx_type, to vp9_iht16x16_256_add_c.
void iht16x16_ref(const tran_low_t *in, uint8_t *dest, int stride,
                  int tx_type) {
  vp9_iht16x16_256_add_c(in, dest, stride, tx_type);
}
| 287 | |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 288 | #if CONFIG_VP9_HIGHBITDEPTH |
// IdctFunc-shaped wrapper that calls vp9_high_idct16x16_256_add_c with its
// last argument fixed to 10 (the bit depth, judging by the _10 suffix).
void idct16x16_10(const tran_low_t *in, uint8_t *out, int stride) {
  vp9_high_idct16x16_256_add_c(in, out, stride, 10);
}
| 292 | |
// IdctFunc-shaped wrapper that calls vp9_high_idct16x16_256_add_c with its
// last argument fixed to 12 (the bit depth, judging by the _12 suffix).
void idct16x16_12(const tran_low_t *in, uint8_t *out, int stride) {
  vp9_high_idct16x16_256_add_c(in, out, stride, 12);
}
| 296 | |
| 297 | void idct16x16_10_ref(const tran_low_t *in, uint8_t *out, int stride, |
| 298 | int tx_type) { |
| 299 | idct16x16_10(in, out, stride); |
| 300 | } |
| 301 | |
| 302 | void idct16x16_12_ref(const tran_low_t *in, uint8_t *out, int stride, |
| 303 | int tx_type) { |
| 304 | idct16x16_12(in, out, stride); |
| 305 | } |
| 306 | |
// IhtFunc-shaped wrapper that calls vp9_high_iht16x16_256_add_c with its
// last argument fixed to 10 (the bit depth, judging by the _10 suffix).
void iht16x16_10(const tran_low_t *in, uint8_t *out, int stride, int tx_type) {
  vp9_high_iht16x16_256_add_c(in, out, stride, tx_type, 10);
}
| 310 | |
// IhtFunc-shaped wrapper that calls vp9_high_iht16x16_256_add_c with its
// last argument fixed to 12 (the bit depth, judging by the _12 suffix).
void iht16x16_12(const tran_low_t *in, uint8_t *out, int stride, int tx_type) {
  vp9_high_iht16x16_256_add_c(in, out, stride, tx_type, 12);
}
| 314 | #endif |
| 315 | |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 316 | class Trans16x16TestBase { |
Jingning Han | cf768b2 | 2013-07-09 16:16:49 -0700 | [diff] [blame] | 317 | public: |
// Virtual so that objects of derived classes can be destroyed through a
// Trans16x16TestBase pointer.
virtual ~Trans16x16TestBase() {}
Jingning Han | cf768b2 | 2013-07-09 16:16:49 -0700 | [diff] [blame] | 319 | |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 320 | protected: |
// Forward transform under test, supplied by the derived class. The checks in
// this class pass kNumCoeffs input samples in |in|, a kNumCoeffs-element
// coefficient buffer in |out|, and pitch_ as |stride|.
virtual void RunFwdTxfm(int16_t *in, tran_low_t *out, int stride) = 0;
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 322 | |
// Inverse transform under test, supplied by the derived class. The checks in
// this class pass coefficients in |out| and a pixel buffer in |dst| (a
// uint16_t buffer wrapped with CONVERT_TO_BYTEPTR when bit_depth_ is not
// VPX_BITS_8), with pitch_ as |stride|.
virtual void RunInvTxfm(tran_low_t *out, uint8_t *dst, int stride) = 0;
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 324 | |
| 325 | void RunAccuracyCheck() { |
| 326 | ACMRandom rnd(ACMRandom::DeterministicSeed()); |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 327 | uint32_t max_error = 0; |
| 328 | int64_t total_error = 0; |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 329 | const int count_test_block = 10000; |
| 330 | for (int i = 0; i < count_test_block; ++i) { |
| 331 | DECLARE_ALIGNED_ARRAY(16, int16_t, test_input_block, kNumCoeffs); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 332 | DECLARE_ALIGNED_ARRAY(16, tran_low_t, test_temp_block, kNumCoeffs); |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 333 | DECLARE_ALIGNED_ARRAY(16, uint8_t, dst, kNumCoeffs); |
| 334 | DECLARE_ALIGNED_ARRAY(16, uint8_t, src, kNumCoeffs); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 335 | #if CONFIG_VP9_HIGHBITDEPTH |
| 336 | DECLARE_ALIGNED_ARRAY(16, uint16_t, dst16, kNumCoeffs); |
| 337 | DECLARE_ALIGNED_ARRAY(16, uint16_t, src16, kNumCoeffs); |
| 338 | #endif |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 339 | |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 340 | // Initialize a test block with input range [-mask_, mask_]. |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 341 | for (int j = 0; j < kNumCoeffs; ++j) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 342 | if (bit_depth_ == VPX_BITS_8) { |
| 343 | src[j] = rnd.Rand8(); |
| 344 | dst[j] = rnd.Rand8(); |
| 345 | test_input_block[j] = src[j] - dst[j]; |
| 346 | #if CONFIG_VP9_HIGHBITDEPTH |
| 347 | } else { |
| 348 | src16[j] = rnd.Rand16() & mask_; |
| 349 | dst16[j] = rnd.Rand16() & mask_; |
| 350 | test_input_block[j] = src16[j] - dst16[j]; |
| 351 | #endif |
| 352 | } |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 353 | } |
| 354 | |
James Zern | 29e1b1a | 2014-07-09 21:02:02 -0700 | [diff] [blame] | 355 | ASM_REGISTER_STATE_CHECK(RunFwdTxfm(test_input_block, |
| 356 | test_temp_block, pitch_)); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 357 | if (bit_depth_ == VPX_BITS_8) { |
| 358 | ASM_REGISTER_STATE_CHECK( |
| 359 | RunInvTxfm(test_temp_block, dst, pitch_)); |
| 360 | #if CONFIG_VP9_HIGHBITDEPTH |
| 361 | } else { |
| 362 | ASM_REGISTER_STATE_CHECK( |
| 363 | RunInvTxfm(test_temp_block, CONVERT_TO_BYTEPTR(dst16), pitch_)); |
| 364 | #endif |
| 365 | } |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 366 | |
| 367 | for (int j = 0; j < kNumCoeffs; ++j) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 368 | #if CONFIG_VP9_HIGHBITDEPTH |
| 369 | const uint32_t diff = |
| 370 | bit_depth_ == VPX_BITS_8 ? dst[j] - src[j] : dst16[j] - src16[j]; |
| 371 | #else |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 372 | const uint32_t diff = dst[j] - src[j]; |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 373 | #endif |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 374 | const uint32_t error = diff * diff; |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 375 | if (max_error < error) |
| 376 | max_error = error; |
| 377 | total_error += error; |
| 378 | } |
| 379 | } |
| 380 | |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 381 | EXPECT_GE(1u << 2 * (bit_depth_ - 8), max_error) |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 382 | << "Error: 16x16 FHT/IHT has an individual round trip error > 1"; |
| 383 | |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 384 | EXPECT_GE(count_test_block << 2 * (bit_depth_ - 8), total_error) |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 385 | << "Error: 16x16 FHT/IHT has average round trip error > 1 per block"; |
| 386 | } |
| 387 | |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 388 | void RunCoeffCheck() { |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 389 | ACMRandom rnd(ACMRandom::DeterministicSeed()); |
| 390 | const int count_test_block = 1000; |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 391 | DECLARE_ALIGNED_ARRAY(16, int16_t, input_block, kNumCoeffs); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 392 | DECLARE_ALIGNED_ARRAY(16, tran_low_t, output_ref_block, kNumCoeffs); |
| 393 | DECLARE_ALIGNED_ARRAY(16, tran_low_t, output_block, kNumCoeffs); |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 394 | |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 395 | for (int i = 0; i < count_test_block; ++i) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 396 | // Initialize a test block with input range [-mask_, mask_]. |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 397 | for (int j = 0; j < kNumCoeffs; ++j) |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 398 | input_block[j] = (rnd.Rand16() & mask_) - (rnd.Rand16() & mask_); |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 399 | |
| 400 | fwd_txfm_ref(input_block, output_ref_block, pitch_, tx_type_); |
James Zern | 29e1b1a | 2014-07-09 21:02:02 -0700 | [diff] [blame] | 401 | ASM_REGISTER_STATE_CHECK(RunFwdTxfm(input_block, output_block, pitch_)); |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 402 | |
| 403 | // The minimum quant value is 4. |
| 404 | for (int j = 0; j < kNumCoeffs; ++j) |
| 405 | EXPECT_EQ(output_block[j], output_ref_block[j]); |
| 406 | } |
| 407 | } |
| 408 | |
| 409 | void RunMemCheck() { |
| 410 | ACMRandom rnd(ACMRandom::DeterministicSeed()); |
| 411 | const int count_test_block = 1000; |
| 412 | DECLARE_ALIGNED_ARRAY(16, int16_t, input_block, kNumCoeffs); |
| 413 | DECLARE_ALIGNED_ARRAY(16, int16_t, input_extreme_block, kNumCoeffs); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 414 | DECLARE_ALIGNED_ARRAY(16, tran_low_t, output_ref_block, kNumCoeffs); |
| 415 | DECLARE_ALIGNED_ARRAY(16, tran_low_t, output_block, kNumCoeffs); |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 416 | |
| 417 | for (int i = 0; i < count_test_block; ++i) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 418 | // Initialize a test block with input range [-mask_, mask_]. |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 419 | for (int j = 0; j < kNumCoeffs; ++j) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 420 | input_block[j] = (rnd.Rand16() & mask_) - (rnd.Rand16() & mask_); |
| 421 | input_extreme_block[j] = rnd.Rand8() % 2 ? mask_ : -mask_; |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 422 | } |
Jingning Han | 5c2696c | 2014-06-02 16:40:01 -0700 | [diff] [blame] | 423 | if (i == 0) { |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 424 | for (int j = 0; j < kNumCoeffs; ++j) |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 425 | input_extreme_block[j] = mask_; |
Jingning Han | 5c2696c | 2014-06-02 16:40:01 -0700 | [diff] [blame] | 426 | } else if (i == 1) { |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 427 | for (int j = 0; j < kNumCoeffs; ++j) |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 428 | input_extreme_block[j] = -mask_; |
Jingning Han | 5c2696c | 2014-06-02 16:40:01 -0700 | [diff] [blame] | 429 | } |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 430 | |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 431 | fwd_txfm_ref(input_extreme_block, output_ref_block, pitch_, tx_type_); |
James Zern | 29e1b1a | 2014-07-09 21:02:02 -0700 | [diff] [blame] | 432 | ASM_REGISTER_STATE_CHECK(RunFwdTxfm(input_extreme_block, |
| 433 | output_block, pitch_)); |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 434 | |
| 435 | // The minimum quant value is 4. |
| 436 | for (int j = 0; j < kNumCoeffs; ++j) { |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 437 | EXPECT_EQ(output_block[j], output_ref_block[j]); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 438 | EXPECT_GE(4 * DCT_MAX_VALUE << (bit_depth_ - 8), abs(output_block[j])) |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 439 | << "Error: 16x16 FDCT has coefficient larger than 4*DCT_MAX_VALUE"; |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 440 | } |
Jingning Han | cf768b2 | 2013-07-09 16:16:49 -0700 | [diff] [blame] | 441 | } |
| 442 | } |
| 443 | |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 444 | void RunQuantCheck(int dc_thred, int ac_thred) { |
| 445 | ACMRandom rnd(ACMRandom::DeterministicSeed()); |
Jingning Han | 12344f2 | 2014-10-06 10:18:17 -0700 | [diff] [blame^] | 446 | const int count_test_block = 100000; |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 447 | DECLARE_ALIGNED_ARRAY(16, int16_t, input_block, kNumCoeffs); |
| 448 | DECLARE_ALIGNED_ARRAY(16, int16_t, input_extreme_block, kNumCoeffs); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 449 | DECLARE_ALIGNED_ARRAY(16, tran_low_t, output_ref_block, kNumCoeffs); |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 450 | |
| 451 | DECLARE_ALIGNED_ARRAY(16, uint8_t, dst, kNumCoeffs); |
| 452 | DECLARE_ALIGNED_ARRAY(16, uint8_t, ref, kNumCoeffs); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 453 | #if CONFIG_VP9_HIGHBITDEPTH |
| 454 | DECLARE_ALIGNED_ARRAY(16, uint16_t, dst16, kNumCoeffs); |
| 455 | DECLARE_ALIGNED_ARRAY(16, uint16_t, ref16, kNumCoeffs); |
| 456 | #endif |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 457 | |
| 458 | for (int i = 0; i < count_test_block; ++i) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 459 | // Initialize a test block with input range [-mask_, mask_]. |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 460 | for (int j = 0; j < kNumCoeffs; ++j) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 461 | if (bit_depth_ == VPX_BITS_8) |
| 462 | input_block[j] = rnd.Rand8() - rnd.Rand8(); |
| 463 | else |
| 464 | input_block[j] = (rnd.Rand16() & mask_) - (rnd.Rand16() & mask_); |
| 465 | input_extreme_block[j] = rnd.Rand8() % 2 ? mask_ : -mask_; |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 466 | } |
| 467 | if (i == 0) |
| 468 | for (int j = 0; j < kNumCoeffs; ++j) |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 469 | input_extreme_block[j] = mask_; |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 470 | if (i == 1) |
| 471 | for (int j = 0; j < kNumCoeffs; ++j) |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 472 | input_extreme_block[j] = -mask_; |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 473 | |
| 474 | fwd_txfm_ref(input_extreme_block, output_ref_block, pitch_, tx_type_); |
| 475 | |
| 476 | // clear reconstructed pixel buffers |
| 477 | vpx_memset(dst, 0, kNumCoeffs * sizeof(uint8_t)); |
| 478 | vpx_memset(ref, 0, kNumCoeffs * sizeof(uint8_t)); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 479 | #if CONFIG_VP9_HIGHBITDEPTH |
| 480 | vpx_memset(dst16, 0, kNumCoeffs * sizeof(uint16_t)); |
| 481 | vpx_memset(ref16, 0, kNumCoeffs * sizeof(uint16_t)); |
| 482 | #endif |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 483 | |
| 484 | // quantization with maximum allowed step sizes |
| 485 | output_ref_block[0] = (output_ref_block[0] / dc_thred) * dc_thred; |
| 486 | for (int j = 1; j < kNumCoeffs; ++j) |
| 487 | output_ref_block[j] = (output_ref_block[j] / ac_thred) * ac_thred; |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 488 | if (bit_depth_ == VPX_BITS_8) { |
| 489 | inv_txfm_ref(output_ref_block, ref, pitch_, tx_type_); |
| 490 | ASM_REGISTER_STATE_CHECK(RunInvTxfm(output_ref_block, dst, pitch_)); |
| 491 | #if CONFIG_VP9_HIGHBITDEPTH |
| 492 | } else { |
| 493 | inv_txfm_ref(output_ref_block, CONVERT_TO_BYTEPTR(ref16), pitch_, |
| 494 | tx_type_); |
| 495 | ASM_REGISTER_STATE_CHECK(RunInvTxfm(output_ref_block, |
| 496 | CONVERT_TO_BYTEPTR(dst16), pitch_)); |
| 497 | #endif |
| 498 | } |
| 499 | if (bit_depth_ == VPX_BITS_8) { |
| 500 | for (int j = 0; j < kNumCoeffs; ++j) |
| 501 | EXPECT_EQ(ref[j], dst[j]); |
| 502 | #if CONFIG_VP9_HIGHBITDEPTH |
| 503 | } else { |
| 504 | for (int j = 0; j < kNumCoeffs; ++j) |
| 505 | EXPECT_EQ(ref16[j], dst16[j]); |
| 506 | #endif |
| 507 | } |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 508 | } |
| 509 | } |
| 510 | |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 511 | void RunInvAccuracyCheck() { |
| 512 | ACMRandom rnd(ACMRandom::DeterministicSeed()); |
| 513 | const int count_test_block = 1000; |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 514 | DECLARE_ALIGNED_ARRAY(16, int16_t, in, kNumCoeffs); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 515 | DECLARE_ALIGNED_ARRAY(16, tran_low_t, coeff, kNumCoeffs); |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 516 | DECLARE_ALIGNED_ARRAY(16, uint8_t, dst, kNumCoeffs); |
| 517 | DECLARE_ALIGNED_ARRAY(16, uint8_t, src, kNumCoeffs); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 518 | #if CONFIG_VP9_HIGHBITDEPTH |
| 519 | DECLARE_ALIGNED_ARRAY(16, uint16_t, dst16, kNumCoeffs); |
| 520 | DECLARE_ALIGNED_ARRAY(16, uint16_t, src16, kNumCoeffs); |
| 521 | #endif |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 522 | |
| 523 | for (int i = 0; i < count_test_block; ++i) { |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 524 | double out_r[kNumCoeffs]; |
| 525 | |
| 526 | // Initialize a test block with input range [-255, 255]. |
| 527 | for (int j = 0; j < kNumCoeffs; ++j) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 528 | if (bit_depth_ == VPX_BITS_8) { |
| 529 | src[j] = rnd.Rand8(); |
| 530 | dst[j] = rnd.Rand8(); |
| 531 | in[j] = src[j] - dst[j]; |
| 532 | #if CONFIG_VP9_HIGHBITDEPTH |
| 533 | } else { |
| 534 | src16[j] = rnd.Rand16() & mask_; |
| 535 | dst16[j] = rnd.Rand16() & mask_; |
| 536 | in[j] = src16[j] - dst16[j]; |
| 537 | #endif |
| 538 | } |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 539 | } |
| 540 | |
| 541 | reference_16x16_dct_2d(in, out_r); |
| 542 | for (int j = 0; j < kNumCoeffs; ++j) |
| 543 | coeff[j] = round(out_r[j]); |
| 544 | |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 545 | if (bit_depth_ == VPX_BITS_8) { |
| 546 | ASM_REGISTER_STATE_CHECK(RunInvTxfm(coeff, dst, 16)); |
| 547 | #if CONFIG_VP9_HIGHBITDEPTH |
| 548 | } else { |
| 549 | ASM_REGISTER_STATE_CHECK(RunInvTxfm(coeff, CONVERT_TO_BYTEPTR(dst16), |
| 550 | 16)); |
| 551 | #endif |
| 552 | } |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 553 | |
| 554 | for (int j = 0; j < kNumCoeffs; ++j) { |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 555 | #if CONFIG_VP9_HIGHBITDEPTH |
| 556 | const uint32_t diff = |
| 557 | bit_depth_ == VPX_BITS_8 ? dst[j] - src[j] : dst16[j] - src16[j]; |
| 558 | #else |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 559 | const uint32_t diff = dst[j] - src[j]; |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 560 | #endif |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 561 | const uint32_t error = diff * diff; |
| 562 | EXPECT_GE(1u, error) |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 563 | << "Error: 16x16 IDCT has error " << error |
| 564 | << " at index " << j; |
| 565 | } |
| 566 | } |
Jingning Han | cf768b2 | 2013-07-09 16:16:49 -0700 | [diff] [blame] | 567 | } |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 568 | int pitch_; |
| 569 | int tx_type_; |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 570 | vpx_bit_depth_t bit_depth_; |
| 571 | int mask_; |
James Zern | 44f8484 | 2014-07-16 18:53:33 -0700 | [diff] [blame] | 572 | FhtFunc fwd_txfm_ref; |
| 573 | IhtFunc inv_txfm_ref; |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 574 | }; |
| 575 | |
Joshua Litt | 51490e5 | 2013-11-18 17:07:55 -0800 | [diff] [blame] | 576 | class Trans16x16DCT |
| 577 | : public Trans16x16TestBase, |
James Zern | 44f8484 | 2014-07-16 18:53:33 -0700 | [diff] [blame] | 578 | public ::testing::TestWithParam<Dct16x16Param> { |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 579 | public: |
| 580 | virtual ~Trans16x16DCT() {} |
| 581 | |
| 582 | virtual void SetUp() { |
| 583 | fwd_txfm_ = GET_PARAM(0); |
| 584 | inv_txfm_ = GET_PARAM(1); |
| 585 | tx_type_ = GET_PARAM(2); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 586 | bit_depth_ = GET_PARAM(3); |
Dmitry Kovalev | 1aa7fd5 | 2013-10-18 11:49:33 -0700 | [diff] [blame] | 587 | pitch_ = 16; |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 588 | fwd_txfm_ref = fdct16x16_ref; |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 589 | inv_txfm_ref = idct16x16_ref; |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 590 | mask_ = (1 << bit_depth_) - 1; |
| 591 | #if CONFIG_VP9_HIGHBITDEPTH |
| 592 | switch (bit_depth_) { |
| 593 | case 10: |
| 594 | inv_txfm_ref = idct16x16_10_ref; |
| 595 | break; |
| 596 | case 12: |
| 597 | inv_txfm_ref = idct16x16_12_ref; |
| 598 | break; |
| 599 | default: |
| 600 | inv_txfm_ref = idct16x16_ref; |
| 601 | break; |
| 602 | } |
| 603 | #else |
| 604 | inv_txfm_ref = idct16x16_ref; |
| 605 | #endif |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 606 | } |
| 607 | virtual void TearDown() { libvpx_test::ClearSystemState(); } |
| 608 | |
| 609 | protected: |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 610 | void RunFwdTxfm(int16_t *in, tran_low_t *out, int stride) { |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 611 | fwd_txfm_(in, out, stride); |
| 612 | } |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 613 | void RunInvTxfm(tran_low_t *out, uint8_t *dst, int stride) { |
Dmitry Kovalev | 1aa7fd5 | 2013-10-18 11:49:33 -0700 | [diff] [blame] | 614 | inv_txfm_(out, dst, stride); |
Jingning Han | cf768b2 | 2013-07-09 16:16:49 -0700 | [diff] [blame] | 615 | } |
| 616 | |
James Zern | 44f8484 | 2014-07-16 18:53:33 -0700 | [diff] [blame] | 617 | FdctFunc fwd_txfm_; |
| 618 | IdctFunc inv_txfm_; |
Jingning Han | cf768b2 | 2013-07-09 16:16:49 -0700 | [diff] [blame] | 619 | }; |
| 620 | |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 621 | TEST_P(Trans16x16DCT, AccuracyCheck) { |
| 622 | RunAccuracyCheck(); |
Jingning Han | cf768b2 | 2013-07-09 16:16:49 -0700 | [diff] [blame] | 623 | } |
| 624 | |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 625 | TEST_P(Trans16x16DCT, CoeffCheck) { |
| 626 | RunCoeffCheck(); |
| 627 | } |
| 628 | |
| 629 | TEST_P(Trans16x16DCT, MemCheck) { |
| 630 | RunMemCheck(); |
Jingning Han | cf768b2 | 2013-07-09 16:16:49 -0700 | [diff] [blame] | 631 | } |
| 632 | |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 633 | TEST_P(Trans16x16DCT, QuantCheck) { |
| 634 | // Use maximally allowed quantization step sizes for DC and AC |
| 635 | // coefficients respectively. |
| 636 | RunQuantCheck(1336, 1828); |
| 637 | } |
| 638 | |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 639 | TEST_P(Trans16x16DCT, InvAccuracyCheck) { |
| 640 | RunInvAccuracyCheck(); |
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 641 | } |
Scott LaVarnway | a272ff2 | 2013-05-15 13:16:02 -0400 | [diff] [blame] | 642 | |
Joshua Litt | 51490e5 | 2013-11-18 17:07:55 -0800 | [diff] [blame] | 643 | class Trans16x16HT |
| 644 | : public Trans16x16TestBase, |
James Zern | 44f8484 | 2014-07-16 18:53:33 -0700 | [diff] [blame] | 645 | public ::testing::TestWithParam<Ht16x16Param> { |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 646 | public: |
| 647 | virtual ~Trans16x16HT() {} |
| 648 | |
| 649 | virtual void SetUp() { |
| 650 | fwd_txfm_ = GET_PARAM(0); |
| 651 | inv_txfm_ = GET_PARAM(1); |
| 652 | tx_type_ = GET_PARAM(2); |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 653 | bit_depth_ = GET_PARAM(3); |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 654 | pitch_ = 16; |
| 655 | fwd_txfm_ref = fht16x16_ref; |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 656 | inv_txfm_ref = iht16x16_ref; |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 657 | mask_ = (1 << bit_depth_) - 1; |
| 658 | #if CONFIG_VP9_HIGHBITDEPTH |
| 659 | switch (bit_depth_) { |
| 660 | case VPX_BITS_10: |
| 661 | inv_txfm_ref = iht16x16_10; |
| 662 | break; |
| 663 | case VPX_BITS_12: |
| 664 | inv_txfm_ref = iht16x16_12; |
| 665 | break; |
| 666 | default: |
| 667 | inv_txfm_ref = iht16x16_ref; |
| 668 | break; |
| 669 | } |
| 670 | #else |
| 671 | inv_txfm_ref = iht16x16_ref; |
| 672 | #endif |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 673 | } |
| 674 | virtual void TearDown() { libvpx_test::ClearSystemState(); } |
| 675 | |
| 676 | protected: |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 677 | void RunFwdTxfm(int16_t *in, tran_low_t *out, int stride) { |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 678 | fwd_txfm_(in, out, stride, tx_type_); |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 679 | } |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 680 | void RunInvTxfm(tran_low_t *out, uint8_t *dst, int stride) { |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 681 | inv_txfm_(out, dst, stride, tx_type_); |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 682 | } |
| 683 | |
James Zern | 44f8484 | 2014-07-16 18:53:33 -0700 | [diff] [blame] | 684 | FhtFunc fwd_txfm_; |
| 685 | IhtFunc inv_txfm_; |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 686 | }; |
| 687 | |
| 688 | TEST_P(Trans16x16HT, AccuracyCheck) { |
| 689 | RunAccuracyCheck(); |
| 690 | } |
| 691 | |
Jingning Han | 37705a3 | 2013-09-09 17:07:55 -0700 | [diff] [blame] | 692 | TEST_P(Trans16x16HT, CoeffCheck) { |
| 693 | RunCoeffCheck(); |
| 694 | } |
| 695 | |
| 696 | TEST_P(Trans16x16HT, MemCheck) { |
| 697 | RunMemCheck(); |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 698 | } |
| 699 | |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 700 | TEST_P(Trans16x16HT, QuantCheck) { |
| 701 | // The encoder skips any non-DC intra prediction modes, |
| 702 | // when the quantization step size goes beyond 988. |
Jingning Han | 12344f2 | 2014-10-06 10:18:17 -0700 | [diff] [blame^] | 703 | RunQuantCheck(429, 729); |
Jingning Han | 49b4a27 | 2014-05-29 12:50:54 -0700 | [diff] [blame] | 704 | } |
| 705 | |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 706 | using std::tr1::make_tuple; |
| 707 | |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 708 | #if CONFIG_VP9_HIGHBITDEPTH |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 709 | INSTANTIATE_TEST_CASE_P( |
| 710 | C, Trans16x16DCT, |
| 711 | ::testing::Values( |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 712 | make_tuple(&vp9_high_fdct16x16_c, &idct16x16_10, 0, VPX_BITS_10), |
| 713 | make_tuple(&vp9_high_fdct16x16_c, &idct16x16_12, 0, VPX_BITS_12), |
| 714 | make_tuple(&vp9_fdct16x16_c, &vp9_idct16x16_256_add_c, 0, VPX_BITS_8))); |
| 715 | #else |
| 716 | INSTANTIATE_TEST_CASE_P( |
| 717 | C, Trans16x16DCT, |
| 718 | ::testing::Values( |
| 719 | make_tuple(&vp9_fdct16x16_c, &vp9_idct16x16_256_add_c, 0, VPX_BITS_8))); |
| 720 | #endif |
| 721 | |
| 722 | #if CONFIG_VP9_HIGHBITDEPTH |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 723 | INSTANTIATE_TEST_CASE_P( |
| 724 | C, Trans16x16HT, |
| 725 | ::testing::Values( |
Deb Mukherjee | 10783d4 | 2014-09-02 16:34:09 -0700 | [diff] [blame] | 726 | make_tuple(&vp9_high_fht16x16_c, &iht16x16_10, 0, VPX_BITS_10), |
| 727 | make_tuple(&vp9_high_fht16x16_c, &iht16x16_10, 1, VPX_BITS_10), |
| 728 | make_tuple(&vp9_high_fht16x16_c, &iht16x16_10, 2, VPX_BITS_10), |
| 729 | make_tuple(&vp9_high_fht16x16_c, &iht16x16_10, 3, VPX_BITS_10), |
| 730 | make_tuple(&vp9_high_fht16x16_c, &iht16x16_12, 0, VPX_BITS_12), |
| 731 | make_tuple(&vp9_high_fht16x16_c, &iht16x16_12, 1, VPX_BITS_12), |
| 732 | make_tuple(&vp9_high_fht16x16_c, &iht16x16_12, 2, VPX_BITS_12), |
| 733 | make_tuple(&vp9_high_fht16x16_c, &iht16x16_12, 3, VPX_BITS_12), |
| 734 | make_tuple(&vp9_fht16x16_c, &vp9_iht16x16_256_add_c, 0, VPX_BITS_8), |
| 735 | make_tuple(&vp9_fht16x16_c, &vp9_iht16x16_256_add_c, 1, VPX_BITS_8), |
| 736 | make_tuple(&vp9_fht16x16_c, &vp9_iht16x16_256_add_c, 2, VPX_BITS_8), |
| 737 | make_tuple(&vp9_fht16x16_c, &vp9_iht16x16_256_add_c, 3, VPX_BITS_8))); |
| 738 | #else |
| 739 | INSTANTIATE_TEST_CASE_P( |
| 740 | C, Trans16x16HT, |
| 741 | ::testing::Values( |
| 742 | make_tuple(&vp9_fht16x16_c, &vp9_iht16x16_256_add_c, 0, VPX_BITS_8), |
| 743 | make_tuple(&vp9_fht16x16_c, &vp9_iht16x16_256_add_c, 1, VPX_BITS_8), |
| 744 | make_tuple(&vp9_fht16x16_c, &vp9_iht16x16_256_add_c, 2, VPX_BITS_8), |
| 745 | make_tuple(&vp9_fht16x16_c, &vp9_iht16x16_256_add_c, 3, VPX_BITS_8))); |
| 746 | #endif |
Jingning Han | 8f92a7e | 2013-09-05 12:44:03 -0700 | [diff] [blame] | 747 | |
// NEON instantiation of the DCT fixture: pairs the C forward transform with
// the NEON inverse transform. Compiled only when HAVE_NEON_ASM is set and
// both CONFIG_VP9_HIGHBITDEPTH and CONFIG_EMULATE_HARDWARE are off.
#if HAVE_NEON_ASM && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
INSTANTIATE_TEST_CASE_P(
    NEON, Trans16x16DCT,
    ::testing::Values(
        make_tuple(&vp9_fdct16x16_c, &vp9_idct16x16_256_add_neon, 0,
                   VPX_BITS_8)));
#endif
| 755 | |
// SSE2 instantiations of both fixtures (8-bit only). Compiled only when
// HAVE_SSE2 is set and both CONFIG_VP9_HIGHBITDEPTH and
// CONFIG_EMULATE_HARDWARE are off.
#if HAVE_SSE2 && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
INSTANTIATE_TEST_CASE_P(
    SSE2, Trans16x16DCT,
    ::testing::Values(
        make_tuple(&vp9_fdct16x16_sse2, &vp9_idct16x16_256_add_sse2, 0,
                   VPX_BITS_8)));

// Hybrid transform: one entry per transform type 0 through 3.
INSTANTIATE_TEST_CASE_P(
    SSE2, Trans16x16HT,
    ::testing::Values(
        make_tuple(&vp9_fht16x16_sse2, &vp9_iht16x16_256_add_sse2, 0,
                   VPX_BITS_8),
        make_tuple(&vp9_fht16x16_sse2, &vp9_iht16x16_256_add_sse2, 1,
                   VPX_BITS_8),
        make_tuple(&vp9_fht16x16_sse2, &vp9_iht16x16_256_add_sse2, 2,
                   VPX_BITS_8),
        make_tuple(&vp9_fht16x16_sse2, &vp9_iht16x16_256_add_sse2, 3,
                   VPX_BITS_8)));
#endif
Jingning Han | e4a758b | 2014-05-22 11:31:43 -0700 | [diff] [blame] | 774 | |
// SSSE3 instantiation of the DCT fixture: pairs the C forward transform with
// the SSSE3 inverse transform. Compiled only when HAVE_SSSE3 is set and both
// CONFIG_VP9_HIGHBITDEPTH and CONFIG_EMULATE_HARDWARE are off.
#if HAVE_SSSE3 && !CONFIG_VP9_HIGHBITDEPTH && !CONFIG_EMULATE_HARDWARE
INSTANTIATE_TEST_CASE_P(
    SSSE3, Trans16x16DCT,
    ::testing::Values(
        make_tuple(&vp9_fdct16x16_c, &vp9_idct16x16_256_add_ssse3, 0,
                   VPX_BITS_8)));
#endif
Daniel Kang | fed8a18 | 2012-08-02 17:03:14 -0700 | [diff] [blame] | 782 | } // namespace |