blob: aeaaea2d1f3618ffe9ff5be02fa0e7674500a0ad [file] [log] [blame]
David Barker8295c7c2017-06-02 15:21:43 +01001/*
2 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
12#include "test/av1_convolve_2d_test_util.h"
13
Scott LaVarnway8b909182017-12-28 11:39:41 -080014#include "aom_ports/aom_timer.h"
Cheng Chen03c75492017-11-02 16:38:14 -070015#include "av1/common/common_data.h"
Scott LaVarnway8b909182017-12-28 11:39:41 -080016#include "av1/common/convolve.h"
David Barker8295c7c2017-06-02 15:21:43 +010017
James Zern95612802018-03-30 11:37:54 -070018using ::testing::make_tuple;
19using ::testing::tuple;
David Barker8295c7c2017-06-02 15:21:43 +010020
21namespace libaom_test {
22
Linfeng Zhanga3e9c502018-01-09 10:04:20 -080023const int kMaxSize = 128 + 32; // padding
David Barker8295c7c2017-06-02 15:21:43 +010024namespace AV1Convolve2D {
25
26::testing::internal::ParamGenerator<Convolve2DParam> BuildParams(
sarahparker3c38cce2018-03-15 14:12:49 -070027 convolve_2d_func filter, int has_subx, int has_suby) {
28 return ::testing::Combine(::testing::Values(filter),
29 ::testing::Values(has_subx),
30 ::testing::Values(has_suby),
31 ::testing::Range(BLOCK_4X4, BLOCK_SIZES_ALL));
David Barker8295c7c2017-06-02 15:21:43 +010032}
33
Linfeng Zhang5f0485b2018-01-09 10:21:57 -080034AV1Convolve2DSrTest::~AV1Convolve2DSrTest() {}
35void AV1Convolve2DSrTest::SetUp() {
36 rnd_.Reset(ACMRandom::DeterministicSeed());
37}
38
39void AV1Convolve2DSrTest::TearDown() { libaom_test::ClearSystemState(); }
40
41void AV1Convolve2DSrTest::RunCheckOutput(convolve_2d_func test_impl) {
42 const int w = kMaxSize, h = kMaxSize;
43 const int has_subx = GET_PARAM(1);
44 const int has_suby = GET_PARAM(2);
sarahparker3c38cce2018-03-15 14:12:49 -070045 const int block_idx = GET_PARAM(3);
Linfeng Zhang5f0485b2018-01-09 10:21:57 -080046 int hfilter, vfilter, subx, suby;
47 uint8_t input[kMaxSize * kMaxSize];
48 DECLARE_ALIGNED(32, uint8_t, output[MAX_SB_SQUARE]);
49 DECLARE_ALIGNED(32, uint8_t, output2[MAX_SB_SQUARE]);
50
Linfeng Zhang5f0485b2018-01-09 10:21:57 -080051 for (int i = 0; i < h; ++i)
52 for (int j = 0; j < w; ++j) input[i * w + j] = rnd_.Rand8();
53 for (int i = 0; i < MAX_SB_SQUARE; ++i)
54 output[i] = output2[i] = rnd_.Rand31();
55
Sarah Parker30d4e532018-03-14 17:53:39 -070056 // Make sure that sizes 2xN and Nx2 are also tested for chroma.
57 const int num_sizes =
58 (block_size_wide[block_idx] == 4 || block_size_high[block_idx] == 4) ? 2
59 : 1;
60 for (int shift = 0; shift < num_sizes; ++shift) { // luma and chroma
61 const int out_w = block_size_wide[block_idx] >> shift;
62 const int out_h = block_size_high[block_idx] >> shift;
63 for (hfilter = EIGHTTAP_REGULAR; hfilter < INTERP_FILTERS_ALL; ++hfilter) {
64 for (vfilter = EIGHTTAP_REGULAR; vfilter < INTERP_FILTERS_ALL;
65 ++vfilter) {
Peng Bin3a0c2ed2018-07-19 16:24:00 +080066 const InterpFilterParams *filter_params_x =
Urvang Joshia99a2632018-04-20 17:41:27 -040067 av1_get_interp_filter_params_with_block_size((InterpFilter)hfilter,
68 out_w);
Peng Bin3a0c2ed2018-07-19 16:24:00 +080069 const InterpFilterParams *filter_params_y =
Urvang Joshia99a2632018-04-20 17:41:27 -040070 av1_get_interp_filter_params_with_block_size((InterpFilter)vfilter,
71 out_h);
Sarah Parker30d4e532018-03-14 17:53:39 -070072 for (int do_average = 0; do_average < 1; ++do_average) {
73 ConvolveParams conv_params1 =
Peng Binf7b11f52018-08-09 17:29:39 +080074 get_conv_params_no_round(do_average, 0, NULL, 0, 0, 8);
Sarah Parker30d4e532018-03-14 17:53:39 -070075 ConvolveParams conv_params2 =
Peng Binf7b11f52018-08-09 17:29:39 +080076 get_conv_params_no_round(do_average, 0, NULL, 0, 0, 8);
Linfeng Zhang5f0485b2018-01-09 10:21:57 -080077
Sarah Parker30d4e532018-03-14 17:53:39 -070078 const int subx_range = has_subx ? 16 : 1;
79 const int suby_range = has_suby ? 16 : 1;
80 for (subx = 0; subx < subx_range; ++subx) {
81 for (suby = 0; suby < suby_range; ++suby) {
82 // Choose random locations within the source block
83 const int offset_r = 3 + rnd_.PseudoUniform(h - out_h - 7);
84 const int offset_c = 3 + rnd_.PseudoUniform(w - out_w - 7);
85 av1_convolve_2d_sr_c(input + offset_r * w + offset_c, w, output,
Peng Bin3a0c2ed2018-07-19 16:24:00 +080086 MAX_SB_SIZE, out_w, out_h, filter_params_x,
87 filter_params_y, subx, suby, &conv_params1);
Sarah Parker30d4e532018-03-14 17:53:39 -070088 test_impl(input + offset_r * w + offset_c, w, output2,
Peng Bin3a0c2ed2018-07-19 16:24:00 +080089 MAX_SB_SIZE, out_w, out_h, filter_params_x,
90 filter_params_y, subx, suby, &conv_params2);
Linfeng Zhang5f0485b2018-01-09 10:21:57 -080091
Sarah Parker30d4e532018-03-14 17:53:39 -070092 if (memcmp(output, output2, sizeof(output))) {
93 for (int i = 0; i < MAX_SB_SIZE; ++i) {
94 for (int j = 0; j < MAX_SB_SIZE; ++j) {
95 int idx = i * MAX_SB_SIZE + j;
96 ASSERT_EQ(output[idx], output2[idx])
97 << out_w << "x" << out_h << " Pixel mismatch at index "
98 << idx << " = (" << i << ", " << j
99 << "), sub pixel offset = (" << suby << ", " << subx
100 << ")";
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800101 }
102 }
103 }
104 }
105 }
106 }
107 }
108 }
109 }
110}
111
112void AV1Convolve2DSrTest::RunSpeedTest(convolve_2d_func test_impl) {
113 const int w = kMaxSize, h = kMaxSize;
114 const int has_subx = GET_PARAM(1);
115 const int has_suby = GET_PARAM(2);
sarahparker3c38cce2018-03-15 14:12:49 -0700116 const int block_idx = GET_PARAM(3);
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800117
118 uint8_t input[kMaxSize * kMaxSize];
119 DECLARE_ALIGNED(32, uint8_t, output[MAX_SB_SQUARE]);
120
121 for (int i = 0; i < h; ++i)
122 for (int j = 0; j < w; ++j) input[i * w + j] = rnd_.Rand8();
123
124 int hfilter = EIGHTTAP_REGULAR, vfilter = EIGHTTAP_REGULAR;
125 int subx = 0, suby = 0;
126
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800127 const int do_average = 0;
128 ConvolveParams conv_params2 =
Peng Binf7b11f52018-08-09 17:29:39 +0800129 get_conv_params_no_round(do_average, 0, NULL, 0, 0, 8);
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800130
Sarah Parker30d4e532018-03-14 17:53:39 -0700131 // Make sure that sizes 2xN and Nx2 are also tested for chroma.
132 const int num_sizes =
133 (block_size_wide[block_idx] == 4 || block_size_high[block_idx] == 4) ? 2
134 : 1;
135 for (int shift = 0; shift < num_sizes; ++shift) { // luma and chroma
136 const int out_w = block_size_wide[block_idx] >> shift;
137 const int out_h = block_size_high[block_idx] >> shift;
138 const int num_loops = 1000000000 / (out_w + out_h);
Urvang Joshia99a2632018-04-20 17:41:27 -0400139
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800140 const InterpFilterParams *filter_params_x =
Urvang Joshia99a2632018-04-20 17:41:27 -0400141 av1_get_interp_filter_params_with_block_size((InterpFilter)hfilter,
142 out_w);
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800143 const InterpFilterParams *filter_params_y =
Urvang Joshia99a2632018-04-20 17:41:27 -0400144 av1_get_interp_filter_params_with_block_size((InterpFilter)vfilter,
145 out_h);
146
Sarah Parker30d4e532018-03-14 17:53:39 -0700147 aom_usec_timer timer;
148 aom_usec_timer_start(&timer);
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800149
Sarah Parker30d4e532018-03-14 17:53:39 -0700150 for (int i = 0; i < num_loops; ++i)
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800151 test_impl(input, w, output, MAX_SB_SIZE, out_w, out_h, filter_params_x,
152 filter_params_y, subx, suby, &conv_params2);
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800153
Sarah Parker30d4e532018-03-14 17:53:39 -0700154 aom_usec_timer_mark(&timer);
155 const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer));
sarahparker3c38cce2018-03-15 14:12:49 -0700156 printf("%d,%d convolve %3dx%-3d: %7.2f us\n", has_subx, has_suby, out_w,
Sarah Parker30d4e532018-03-14 17:53:39 -0700157 out_h, 1000.0 * elapsed_time / num_loops);
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800158 }
159}
160
Cheng Chen56d8b952017-11-03 18:55:55 -0700161AV1JntConvolve2DTest::~AV1JntConvolve2DTest() {}
162void AV1JntConvolve2DTest::SetUp() {
163 rnd_.Reset(ACMRandom::DeterministicSeed());
164}
165
166void AV1JntConvolve2DTest::TearDown() { libaom_test::ClearSystemState(); }
167
168void AV1JntConvolve2DTest::RunCheckOutput(convolve_2d_func test_impl) {
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800169 const int w = kMaxSize, h = kMaxSize;
170 const int has_subx = GET_PARAM(1);
171 const int has_suby = GET_PARAM(2);
sarahparker3c38cce2018-03-15 14:12:49 -0700172 const int block_idx = GET_PARAM(3);
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800173 int hfilter, vfilter, subx, suby;
174 uint8_t input[kMaxSize * kMaxSize];
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530175 DECLARE_ALIGNED(32, CONV_BUF_TYPE, output1[MAX_SB_SQUARE]);
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800176 DECLARE_ALIGNED(32, CONV_BUF_TYPE, output2[MAX_SB_SQUARE]);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530177 DECLARE_ALIGNED(16, uint8_t, output8_1[MAX_SB_SQUARE]);
178 DECLARE_ALIGNED(16, uint8_t, output8_2[MAX_SB_SQUARE]);
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800179
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800180 for (int i = 0; i < h; ++i)
181 for (int j = 0; j < w; ++j) input[i * w + j] = rnd_.Rand8();
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530182 for (int i = 0; i < MAX_SB_SQUARE; ++i) {
183 output1[i] = output2[i] = rnd_.Rand16();
184 output8_1[i] = output8_2[i] = rnd_.Rand8();
185 }
Cheng Chen03c75492017-11-02 16:38:14 -0700186
Sarah Parker30d4e532018-03-14 17:53:39 -0700187 const int out_w = block_size_wide[block_idx];
188 const int out_h = block_size_high[block_idx];
189 for (hfilter = EIGHTTAP_REGULAR; hfilter < INTERP_FILTERS_ALL; ++hfilter) {
190 for (vfilter = EIGHTTAP_REGULAR; vfilter < INTERP_FILTERS_ALL; ++vfilter) {
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800191 const InterpFilterParams *filter_params_x =
Urvang Joshia99a2632018-04-20 17:41:27 -0400192 av1_get_interp_filter_params_with_block_size((InterpFilter)hfilter,
193 out_w);
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800194 const InterpFilterParams *filter_params_y =
Urvang Joshia99a2632018-04-20 17:41:27 -0400195 av1_get_interp_filter_params_with_block_size((InterpFilter)vfilter,
196 out_h);
Sarah Parker30d4e532018-03-14 17:53:39 -0700197 for (int do_average = 0; do_average <= 1; ++do_average) {
Peng Binf7b11f52018-08-09 17:29:39 +0800198 ConvolveParams conv_params1 =
199 get_conv_params_no_round(do_average, 0, output1, MAX_SB_SIZE, 1, 8);
200 ConvolveParams conv_params2 =
201 get_conv_params_no_round(do_average, 0, output2, MAX_SB_SIZE, 1, 8);
Cheng Chen03c75492017-11-02 16:38:14 -0700202
Sarah Parker30d4e532018-03-14 17:53:39 -0700203 // Test special case where jnt_comp_avg is not used
Debargha Mukherjee7ac3eb12018-12-12 10:26:50 -0800204 conv_params1.use_dist_wtd_comp_avg = 0;
205 conv_params2.use_dist_wtd_comp_avg = 0;
Cheng Chen03c75492017-11-02 16:38:14 -0700206
Sarah Parker30d4e532018-03-14 17:53:39 -0700207 const int subx_range = has_subx ? 16 : 1;
208 const int suby_range = has_suby ? 16 : 1;
209 for (subx = 0; subx < subx_range; ++subx) {
210 for (suby = 0; suby < suby_range; ++suby) {
211 // Choose random locations within the source block
212 const int offset_r = 3 + rnd_.PseudoUniform(h - out_h - 7);
213 const int offset_c = 3 + rnd_.PseudoUniform(w - out_w - 7);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530214 av1_jnt_convolve_2d_c(input + offset_r * w + offset_c, w, output8_1,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800215 MAX_SB_SIZE, out_w, out_h, filter_params_x,
216 filter_params_y, subx, suby, &conv_params1);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530217 test_impl(input + offset_r * w + offset_c, w, output8_2,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800218 MAX_SB_SIZE, out_w, out_h, filter_params_x,
219 filter_params_y, subx, suby, &conv_params2);
Cheng Chen03c75492017-11-02 16:38:14 -0700220
Sarah Parker30d4e532018-03-14 17:53:39 -0700221 for (int i = 0; i < out_h; ++i) {
222 for (int j = 0; j < out_w; ++j) {
223 int idx = i * MAX_SB_SIZE + j;
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530224 ASSERT_EQ(output1[idx], output2[idx])
Sarah Parker30d4e532018-03-14 17:53:39 -0700225 << "Mismatch at unit tests for av1_jnt_convolve_2d\n"
226 << out_w << "x" << out_h << " Pixel mismatch at index "
227 << idx << " = (" << i << ", " << j
228 << "), sub pixel offset = (" << suby << ", " << subx << ")";
Cheng Chen03c75492017-11-02 16:38:14 -0700229 }
230 }
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530231
232 if (memcmp(output8_1, output8_2, sizeof(output8_1))) {
233 for (int i = 0; i < MAX_SB_SIZE; ++i) {
234 for (int j = 0; j < MAX_SB_SIZE; ++j) {
235 int idx = i * MAX_SB_SIZE + j;
236 ASSERT_EQ(output8_1[idx], output8_2[idx])
237 << out_w << "x" << out_h << " Pixel mismatch at index "
238 << idx << " = (" << i << ", " << j
239 << "), sub pixel offset = (" << suby << ", " << subx
240 << ")";
241 }
242 }
243 }
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800244 }
Sarah Parker30d4e532018-03-14 17:53:39 -0700245 }
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800246
Sarah Parker30d4e532018-03-14 17:53:39 -0700247 // Test different combination of fwd and bck offset weights
248 for (int k = 0; k < 2; ++k) {
249 for (int l = 0; l < 4; ++l) {
Debargha Mukherjee7ac3eb12018-12-12 10:26:50 -0800250 conv_params1.use_dist_wtd_comp_avg = 1;
251 conv_params2.use_dist_wtd_comp_avg = 1;
Sarah Parker30d4e532018-03-14 17:53:39 -0700252 conv_params1.fwd_offset = quant_dist_lookup_table[k][l][0];
253 conv_params1.bck_offset = quant_dist_lookup_table[k][l][1];
254 conv_params2.fwd_offset = quant_dist_lookup_table[k][l][0];
255 conv_params2.bck_offset = quant_dist_lookup_table[k][l][1];
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800256
Sarah Parker30d4e532018-03-14 17:53:39 -0700257 for (subx = 0; subx < subx_range; ++subx) {
258 for (suby = 0; suby < suby_range; ++suby) {
259 // Choose random locations within the source block
260 const int offset_r = 3 + rnd_.PseudoUniform(h - out_h - 7);
261 const int offset_c = 3 + rnd_.PseudoUniform(w - out_w - 7);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530262 av1_jnt_convolve_2d_c(input + offset_r * w + offset_c, w,
263 output8_1, MAX_SB_SIZE, out_w, out_h,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800264 filter_params_x, filter_params_y, subx,
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530265 suby, &conv_params1);
266 test_impl(input + offset_r * w + offset_c, w, output8_2,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800267 MAX_SB_SIZE, out_w, out_h, filter_params_x,
268 filter_params_y, subx, suby, &conv_params2);
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800269
Sarah Parker30d4e532018-03-14 17:53:39 -0700270 for (int i = 0; i < out_h; ++i) {
271 for (int j = 0; j < out_w; ++j) {
272 int idx = i * MAX_SB_SIZE + j;
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530273 ASSERT_EQ(output1[idx], output2[idx])
Sarah Parker30d4e532018-03-14 17:53:39 -0700274 << "Mismatch at unit tests for "
275 "av1_jnt_convolve_2d\n"
276 << out_w << "x" << out_h << " Pixel mismatch at index "
277 << idx << " = (" << i << ", " << j
278 << "), sub pixel offset = (" << suby << ", " << subx
279 << ")";
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800280 }
281 }
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530282 if (memcmp(output8_1, output8_2, sizeof(output8_1))) {
283 for (int i = 0; i < MAX_SB_SIZE; ++i) {
284 for (int j = 0; j < MAX_SB_SIZE; ++j) {
285 int idx = i * MAX_SB_SIZE + j;
286 ASSERT_EQ(output8_1[idx], output8_2[idx])
287 << out_w << "x" << out_h
288 << " Pixel mismatch at index " << idx << " = (" << i
289 << ", " << j << "), sub pixel offset = (" << suby
290 << ", " << subx << ")";
291 }
292 }
293 }
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800294 }
295 }
296 }
Cheng Chen03c75492017-11-02 16:38:14 -0700297 }
298 }
299 }
300 }
Cheng Chen03c75492017-11-02 16:38:14 -0700301}
Sanampudi Venkata Rao90134d32018-05-19 16:19:20 +0530302
303void AV1JntConvolve2DTest::RunSpeedTest(convolve_2d_func test_impl) {
304 const int w = kMaxSize, h = kMaxSize;
305 const int has_subx = GET_PARAM(1);
306 const int has_suby = GET_PARAM(2);
307 const int block_idx = GET_PARAM(3);
308
309 int subx = 0, suby = 0;
310 uint8_t input[kMaxSize * kMaxSize];
311 DECLARE_ALIGNED(32, CONV_BUF_TYPE, output[MAX_SB_SQUARE]);
312 DECLARE_ALIGNED(16, uint8_t, output8[MAX_SB_SQUARE]);
313 int hfilter = EIGHTTAP_REGULAR, vfilter = EIGHTTAP_REGULAR;
314 for (int i = 0; i < h; ++i)
315 for (int j = 0; j < w; ++j) input[i * w + j] = rnd_.Rand8();
316 for (int i = 0; i < MAX_SB_SQUARE; ++i) {
317 output[i] = rnd_.Rand16();
318 output8[i] = rnd_.Rand8();
319 }
320
321 const int out_w = block_size_wide[block_idx];
322 const int out_h = block_size_high[block_idx];
323 const int num_loops = 1000000000 / (out_w + out_h);
324 const int do_average = 0;
325
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800326 const InterpFilterParams *filter_params_x =
Sanampudi Venkata Rao90134d32018-05-19 16:19:20 +0530327 av1_get_interp_filter_params_with_block_size((InterpFilter)hfilter,
328 out_w);
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800329 const InterpFilterParams *filter_params_y =
Sanampudi Venkata Rao90134d32018-05-19 16:19:20 +0530330 av1_get_interp_filter_params_with_block_size((InterpFilter)vfilter,
331 out_h);
332
333 ConvolveParams conv_params =
Peng Binf7b11f52018-08-09 17:29:39 +0800334 get_conv_params_no_round(do_average, 0, output, MAX_SB_SIZE, 1, 8);
Sanampudi Venkata Rao90134d32018-05-19 16:19:20 +0530335
Debargha Mukherjee7ac3eb12018-12-12 10:26:50 -0800336 conv_params.use_dist_wtd_comp_avg = 0;
Sanampudi Venkata Rao90134d32018-05-19 16:19:20 +0530337
338 // Choose random locations within the source block
339 const int offset_r = 3 + rnd_.PseudoUniform(h - out_h - 7);
340 const int offset_c = 3 + rnd_.PseudoUniform(w - out_w - 7);
341
342 aom_usec_timer timer;
343 aom_usec_timer_start(&timer);
344
345 for (int i = 0; i < num_loops; ++i)
346 test_impl(input + offset_r * w + offset_c, w, output8, MAX_SB_SIZE, out_w,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800347 out_h, filter_params_x, filter_params_y, subx, suby,
Sanampudi Venkata Rao90134d32018-05-19 16:19:20 +0530348 &conv_params);
349
350 aom_usec_timer_mark(&timer);
351 const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer));
352 printf("%d,%d convolve %3dx%-3d: %7.2f us\n", has_subx, has_suby, out_w,
353 out_h, 1000.0 * elapsed_time / num_loops);
354}
David Barker8295c7c2017-06-02 15:21:43 +0100355} // namespace AV1Convolve2D
356
David Barker8295c7c2017-06-02 15:21:43 +0100357namespace AV1HighbdConvolve2D {
David Barker8295c7c2017-06-02 15:21:43 +0100358::testing::internal::ParamGenerator<HighbdConvolve2DParam> BuildParams(
sarahparker3c38cce2018-03-15 14:12:49 -0700359 highbd_convolve_2d_func filter, int has_subx, int has_suby) {
360 return ::testing::Combine(
Ravi Chaudharybc2bd032018-04-12 13:48:54 +0530361 ::testing::Range(8, 13, 2), ::testing::Values(filter),
sarahparker3c38cce2018-03-15 14:12:49 -0700362 ::testing::Values(has_subx), ::testing::Values(has_suby),
363 ::testing::Range(BLOCK_4X4, BLOCK_SIZES_ALL));
David Barker8295c7c2017-06-02 15:21:43 +0100364}
365
Cherma Rajan A09d45302018-02-22 17:25:15 +0530366AV1HighbdConvolve2DSrTest::~AV1HighbdConvolve2DSrTest() {}
367void AV1HighbdConvolve2DSrTest::SetUp() {
368 rnd_.Reset(ACMRandom::DeterministicSeed());
369}
370
371void AV1HighbdConvolve2DSrTest::TearDown() { libaom_test::ClearSystemState(); }
372
Ravi Chaudharybe4dd102018-03-07 09:19:17 +0530373void AV1HighbdConvolve2DSrTest::RunSpeedTest(
374 highbd_convolve_2d_func test_impl) {
375 const int w = kMaxSize, h = kMaxSize;
376 const int bd = GET_PARAM(0);
Ravi Chaudhary79363c82018-03-08 18:46:41 +0530377 const int has_subx = GET_PARAM(2);
378 const int has_suby = GET_PARAM(3);
sarahparker3c38cce2018-03-15 14:12:49 -0700379 const int block_idx = GET_PARAM(4);
Ravi Chaudharybe4dd102018-03-07 09:19:17 +0530380 int hfilter, vfilter, subx, suby;
381 uint16_t input[kMaxSize * kMaxSize];
382 DECLARE_ALIGNED(32, uint16_t, output[MAX_SB_SQUARE]);
Ravi Chaudharybe4dd102018-03-07 09:19:17 +0530383
384 for (int i = 0; i < h; ++i)
385 for (int j = 0; j < w; ++j)
386 input[i * w + j] = rnd_.Rand16() & ((1 << bd) - 1);
Ravi Chaudharybe4dd102018-03-07 09:19:17 +0530387
388 hfilter = EIGHTTAP_REGULAR;
389 vfilter = EIGHTTAP_REGULAR;
390 int do_average = 0;
391
Ravi Chaudhary79363c82018-03-08 18:46:41 +0530392 const int offset_r = 3;
393 const int offset_c = 3;
394 subx = 0;
395 suby = 0;
396
Ravi Chaudhary79363c82018-03-08 18:46:41 +0530397 ConvolveParams conv_params =
Peng Binf7b11f52018-08-09 17:29:39 +0800398 get_conv_params_no_round(do_average, 0, NULL, 0, 0, bd);
Ravi Chaudhary79363c82018-03-08 18:46:41 +0530399
Sarah Parker30d4e532018-03-14 17:53:39 -0700400 // Make sure that sizes 2xN and Nx2 are also tested for chroma.
401 const int num_sizes =
402 (block_size_wide[block_idx] == 4 || block_size_high[block_idx] == 4) ? 2
403 : 1;
Ravi Chaudharybe4dd102018-03-07 09:19:17 +0530404
Sarah Parker30d4e532018-03-14 17:53:39 -0700405 for (int shift = 0; shift < num_sizes; ++shift) { // luma and chroma
406 const int out_w = block_size_wide[block_idx] >> shift;
407 const int out_h = block_size_high[block_idx] >> shift;
408 const int num_loops = 1000000000 / (out_w + out_h);
Ravi Chaudharybe4dd102018-03-07 09:19:17 +0530409
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800410 const InterpFilterParams *filter_params_x =
Urvang Joshia99a2632018-04-20 17:41:27 -0400411 av1_get_interp_filter_params_with_block_size((InterpFilter)hfilter,
412 out_w);
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800413 const InterpFilterParams *filter_params_y =
Urvang Joshia99a2632018-04-20 17:41:27 -0400414 av1_get_interp_filter_params_with_block_size((InterpFilter)vfilter,
415 out_h);
416
Sarah Parker30d4e532018-03-14 17:53:39 -0700417 aom_usec_timer timer;
418 aom_usec_timer_start(&timer);
419 for (int i = 0; i < num_loops; ++i)
420 test_impl(input + offset_r * w + offset_c, w, output, MAX_SB_SIZE, out_w,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800421 out_h, filter_params_x, filter_params_y, subx, suby,
Sarah Parker30d4e532018-03-14 17:53:39 -0700422 &conv_params, bd);
Ravi Chaudharybe4dd102018-03-07 09:19:17 +0530423
Sarah Parker30d4e532018-03-14 17:53:39 -0700424 aom_usec_timer_mark(&timer);
425 const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer));
sarahparker3c38cce2018-03-15 14:12:49 -0700426 printf("%d,%d convolve %3dx%-3d: %7.2f us\n", has_subx, has_suby, out_w,
Sarah Parker30d4e532018-03-14 17:53:39 -0700427 out_h, 1000.0 * elapsed_time / num_loops);
Ravi Chaudharybe4dd102018-03-07 09:19:17 +0530428 }
429}
430
Cherma Rajan A09d45302018-02-22 17:25:15 +0530431void AV1HighbdConvolve2DSrTest::RunCheckOutput(
432 highbd_convolve_2d_func test_impl) {
433 const int w = kMaxSize, h = kMaxSize;
434 const int bd = GET_PARAM(0);
435 const int has_subx = GET_PARAM(2);
436 const int has_suby = GET_PARAM(3);
sarahparker3c38cce2018-03-15 14:12:49 -0700437 const int block_idx = GET_PARAM(4);
Cherma Rajan A09d45302018-02-22 17:25:15 +0530438 int hfilter, vfilter, subx, suby;
439 uint16_t input[kMaxSize * kMaxSize];
440 DECLARE_ALIGNED(32, uint16_t, output[MAX_SB_SQUARE]);
441 DECLARE_ALIGNED(32, uint16_t, output2[MAX_SB_SQUARE]);
Cherma Rajan A09d45302018-02-22 17:25:15 +0530442
443 for (int i = 0; i < h; ++i)
444 for (int j = 0; j < w; ++j)
445 input[i * w + j] = rnd_.Rand16() & ((1 << bd) - 1);
446 for (int i = 0; i < MAX_SB_SQUARE; ++i)
447 output[i] = output2[i] = rnd_.Rand31();
448
Sarah Parker30d4e532018-03-14 17:53:39 -0700449 // Make sure that sizes 2xN and Nx2 are also tested for chroma.
450 const int num_sizes =
451 (block_size_wide[block_idx] == 4 || block_size_high[block_idx] == 4) ? 2
452 : 1;
453 for (int shift = 0; shift < num_sizes; ++shift) { // luma and chroma
454 const int out_w = block_size_wide[block_idx] >> shift;
455 const int out_h = block_size_high[block_idx] >> shift;
456 for (hfilter = EIGHTTAP_REGULAR; hfilter < INTERP_FILTERS_ALL; ++hfilter) {
457 for (vfilter = EIGHTTAP_REGULAR; vfilter < INTERP_FILTERS_ALL;
458 ++vfilter) {
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800459 const InterpFilterParams *filter_params_x =
Urvang Joshia99a2632018-04-20 17:41:27 -0400460 av1_get_interp_filter_params_with_block_size((InterpFilter)hfilter,
461 out_w);
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800462 const InterpFilterParams *filter_params_y =
Urvang Joshia99a2632018-04-20 17:41:27 -0400463 av1_get_interp_filter_params_with_block_size((InterpFilter)vfilter,
464 out_h);
Sarah Parker30d4e532018-03-14 17:53:39 -0700465 for (int do_average = 0; do_average < 1; ++do_average) {
466 ConvolveParams conv_params1 =
Peng Binf7b11f52018-08-09 17:29:39 +0800467 get_conv_params_no_round(do_average, 0, NULL, 0, 0, bd);
Sarah Parker30d4e532018-03-14 17:53:39 -0700468 ConvolveParams conv_params2 =
Peng Binf7b11f52018-08-09 17:29:39 +0800469 get_conv_params_no_round(do_average, 0, NULL, 0, 0, bd);
Cherma Rajan A09d45302018-02-22 17:25:15 +0530470
Sarah Parker30d4e532018-03-14 17:53:39 -0700471 const int subx_range = has_subx ? 16 : 1;
472 const int suby_range = has_suby ? 16 : 1;
473 for (subx = 0; subx < subx_range; ++subx) {
474 for (suby = 0; suby < suby_range; ++suby) {
475 // Choose random locations within the source block
476 const int offset_r = 3 + rnd_.PseudoUniform(h - out_h - 7);
477 const int offset_c = 3 + rnd_.PseudoUniform(w - out_w - 7);
478 av1_highbd_convolve_2d_sr_c(input + offset_r * w + offset_c, w,
479 output, MAX_SB_SIZE, out_w, out_h,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800480 filter_params_x, filter_params_y,
Sarah Parker30d4e532018-03-14 17:53:39 -0700481 subx, suby, &conv_params1, bd);
482 test_impl(input + offset_r * w + offset_c, w, output2,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800483 MAX_SB_SIZE, out_w, out_h, filter_params_x,
484 filter_params_y, subx, suby, &conv_params2, bd);
Cherma Rajan A09d45302018-02-22 17:25:15 +0530485
Sarah Parker30d4e532018-03-14 17:53:39 -0700486 if (memcmp(output, output2, sizeof(output))) {
487 for (int i = 0; i < MAX_SB_SIZE; ++i) {
488 for (int j = 0; j < MAX_SB_SIZE; ++j) {
489 int idx = i * MAX_SB_SIZE + j;
490 ASSERT_EQ(output[idx], output2[idx])
491 << out_w << "x" << out_h << " Pixel mismatch at index "
492 << idx << " = (" << i << ", " << j
493 << "), sub pixel offset = (" << suby << ", " << subx
494 << ")";
Cherma Rajan A09d45302018-02-22 17:25:15 +0530495 }
496 }
497 }
498 }
499 }
500 }
501 }
502 }
503 }
504}
505
Cheng Chen56d8b952017-11-03 18:55:55 -0700506AV1HighbdJntConvolve2DTest::~AV1HighbdJntConvolve2DTest() {}
507void AV1HighbdJntConvolve2DTest::SetUp() {
508 rnd_.Reset(ACMRandom::DeterministicSeed());
509}
510
511void AV1HighbdJntConvolve2DTest::TearDown() { libaom_test::ClearSystemState(); }
512
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530513void AV1HighbdJntConvolve2DTest::RunSpeedTest(
514 highbd_convolve_2d_func test_impl) {
515 const int w = kMaxSize, h = kMaxSize;
516 const int bd = GET_PARAM(0);
sarahparker3c38cce2018-03-15 14:12:49 -0700517 const int block_idx = GET_PARAM(4);
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530518 int hfilter, vfilter, subx, suby;
519 uint16_t input[kMaxSize * kMaxSize];
520 DECLARE_ALIGNED(32, CONV_BUF_TYPE, output[MAX_SB_SQUARE]);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530521 DECLARE_ALIGNED(32, uint16_t, output16[MAX_SB_SQUARE]);
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530522
523 for (int i = 0; i < h; ++i)
524 for (int j = 0; j < w; ++j)
525 input[i * w + j] = rnd_.Rand16() & ((1 << bd) - 1);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530526 for (int i = 0; i < MAX_SB_SQUARE; ++i) output[i] = rnd_.Rand16();
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530527 hfilter = EIGHTTAP_REGULAR;
528 vfilter = EIGHTTAP_REGULAR;
529 int do_average = 0;
Sarah Parker30d4e532018-03-14 17:53:39 -0700530 const int out_w = block_size_wide[block_idx];
531 const int out_h = block_size_high[block_idx];
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530532
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800533 const InterpFilterParams *filter_params_x =
Urvang Joshia99a2632018-04-20 17:41:27 -0400534 av1_get_interp_filter_params_with_block_size((InterpFilter)hfilter,
535 out_w);
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800536 const InterpFilterParams *filter_params_y =
Urvang Joshia99a2632018-04-20 17:41:27 -0400537 av1_get_interp_filter_params_with_block_size((InterpFilter)vfilter,
538 out_h);
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530539
Sarah Parker30d4e532018-03-14 17:53:39 -0700540 ConvolveParams conv_params =
Peng Binf7b11f52018-08-09 17:29:39 +0800541 get_conv_params_no_round(do_average, 0, output, MAX_SB_SIZE, 1, bd);
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530542
Sarah Parker30d4e532018-03-14 17:53:39 -0700543 // Test special case where jnt_comp_avg is not used
Debargha Mukherjee7ac3eb12018-12-12 10:26:50 -0800544 conv_params.use_dist_wtd_comp_avg = 0;
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530545
Sarah Parker30d4e532018-03-14 17:53:39 -0700546 subx = 0;
547 suby = 0;
548 // Choose random locations within the source block
549 const int offset_r = 3;
550 const int offset_c = 3;
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530551
Sarah Parker30d4e532018-03-14 17:53:39 -0700552 const int num_loops = 1000000000 / (out_w + out_h);
553 aom_usec_timer timer;
554 aom_usec_timer_start(&timer);
555 for (int i = 0; i < num_loops; ++i)
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530556 test_impl(input + offset_r * w + offset_c, w, output16, MAX_SB_SIZE, out_w,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800557 out_h, filter_params_x, filter_params_y, subx, suby, &conv_params,
558 bd);
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530559
Sarah Parker30d4e532018-03-14 17:53:39 -0700560 aom_usec_timer_mark(&timer);
561 const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer));
sarahparker3c38cce2018-03-15 14:12:49 -0700562 printf("convolve %3dx%-3d: %7.2f us\n", out_w, out_h,
Sarah Parker30d4e532018-03-14 17:53:39 -0700563 1000.0 * elapsed_time / num_loops);
Ravi Chaudharybb6a7692018-03-02 15:30:05 +0530564}
565
Cheng Chen56d8b952017-11-03 18:55:55 -0700566void AV1HighbdJntConvolve2DTest::RunCheckOutput(
567 highbd_convolve_2d_func test_impl) {
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800568 const int w = kMaxSize, h = kMaxSize;
569 const int bd = GET_PARAM(0);
Cherma Rajan Acb4622d2018-02-23 16:17:08 +0530570 const int has_subx = GET_PARAM(2);
571 const int has_suby = GET_PARAM(3);
sarahparker3c38cce2018-03-15 14:12:49 -0700572 const int block_idx = GET_PARAM(4);
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800573 int hfilter, vfilter, subx, suby;
574 uint16_t input[kMaxSize * kMaxSize];
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530575 DECLARE_ALIGNED(32, CONV_BUF_TYPE, output1[MAX_SB_SQUARE]);
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800576 DECLARE_ALIGNED(32, CONV_BUF_TYPE, output2[MAX_SB_SQUARE]);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530577 DECLARE_ALIGNED(32, uint16_t, output16_1[MAX_SB_SQUARE]);
578 DECLARE_ALIGNED(32, uint16_t, output16_2[MAX_SB_SQUARE]);
Cheng Chen56d8b952017-11-03 18:55:55 -0700579
Linfeng Zhang5f0485b2018-01-09 10:21:57 -0800580 for (int i = 0; i < h; ++i)
581 for (int j = 0; j < w; ++j)
582 input[i * w + j] = rnd_.Rand16() & ((1 << bd) - 1);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530583 for (int i = 0; i < MAX_SB_SQUARE; ++i) {
584 output1[i] = output2[i] = rnd_.Rand16();
585 output16_1[i] = output16_2[i] = rnd_.Rand16();
586 }
Cheng Chen56d8b952017-11-03 18:55:55 -0700587
Sarah Parker30d4e532018-03-14 17:53:39 -0700588 const int out_w = block_size_wide[block_idx];
589 const int out_h = block_size_high[block_idx];
590 for (hfilter = EIGHTTAP_REGULAR; hfilter < INTERP_FILTERS_ALL; ++hfilter) {
591 for (vfilter = EIGHTTAP_REGULAR; vfilter < INTERP_FILTERS_ALL; ++vfilter) {
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800592 const InterpFilterParams *filter_params_x =
Urvang Joshia99a2632018-04-20 17:41:27 -0400593 av1_get_interp_filter_params_with_block_size((InterpFilter)hfilter,
594 out_w);
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800595 const InterpFilterParams *filter_params_y =
Urvang Joshia99a2632018-04-20 17:41:27 -0400596 av1_get_interp_filter_params_with_block_size((InterpFilter)vfilter,
597 out_h);
Sarah Parker30d4e532018-03-14 17:53:39 -0700598 for (int do_average = 0; do_average <= 1; ++do_average) {
599 ConvolveParams conv_params1 = get_conv_params_no_round(
Peng Binf7b11f52018-08-09 17:29:39 +0800600 do_average, 0, output1, MAX_SB_SIZE, 1, bd);
Sarah Parker30d4e532018-03-14 17:53:39 -0700601 ConvolveParams conv_params2 = get_conv_params_no_round(
Peng Binf7b11f52018-08-09 17:29:39 +0800602 do_average, 0, output2, MAX_SB_SIZE, 1, bd);
Cheng Chen56d8b952017-11-03 18:55:55 -0700603
Sarah Parker30d4e532018-03-14 17:53:39 -0700604 // Test special case where jnt_comp_avg is not used
Debargha Mukherjee7ac3eb12018-12-12 10:26:50 -0800605 conv_params1.use_dist_wtd_comp_avg = 0;
606 conv_params2.use_dist_wtd_comp_avg = 0;
Cheng Chen56d8b952017-11-03 18:55:55 -0700607
Sarah Parker30d4e532018-03-14 17:53:39 -0700608 const int subx_range = has_subx ? 16 : 1;
609 const int suby_range = has_suby ? 16 : 1;
610 for (subx = 0; subx < subx_range; ++subx) {
611 for (suby = 0; suby < suby_range; ++suby) {
612 // Choose random locations within the source block
613 const int offset_r = 3 + rnd_.PseudoUniform(h - out_h - 7);
614 const int offset_c = 3 + rnd_.PseudoUniform(w - out_w - 7);
615 av1_highbd_jnt_convolve_2d_c(input + offset_r * w + offset_c, w,
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530616 output16_1, MAX_SB_SIZE, out_w, out_h,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800617 filter_params_x, filter_params_y, subx,
618 suby, &conv_params1, bd);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530619 test_impl(input + offset_r * w + offset_c, w, output16_2,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800620 MAX_SB_SIZE, out_w, out_h, filter_params_x,
621 filter_params_y, subx, suby, &conv_params2, bd);
Cheng Chen56d8b952017-11-03 18:55:55 -0700622
Sarah Parker30d4e532018-03-14 17:53:39 -0700623 for (int i = 0; i < out_h; ++i) {
624 for (int j = 0; j < out_w; ++j) {
625 int idx = i * MAX_SB_SIZE + j;
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530626 ASSERT_EQ(output1[idx], output2[idx])
Sarah Parker30d4e532018-03-14 17:53:39 -0700627 << out_w << "x" << out_h << " Pixel mismatch at index "
628 << idx << " = (" << i << ", " << j
629 << "), sub pixel offset = (" << suby << ", " << subx << ")";
Cheng Chen56d8b952017-11-03 18:55:55 -0700630 }
631 }
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530632
633 if (memcmp(output16_1, output16_2, sizeof(output16_1))) {
634 for (int i = 0; i < MAX_SB_SIZE; ++i) {
635 for (int j = 0; j < MAX_SB_SIZE; ++j) {
636 int idx = i * MAX_SB_SIZE + j;
637 ASSERT_EQ(output16_1[idx], output16_2[idx])
638 << out_w << "x" << out_h << " Pixel mismatch at index "
639 << idx << " = (" << i << ", " << j
640 << "), sub pixel offset = (" << suby << ", " << subx
641 << ")";
642 }
643 }
644 }
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800645 }
Sarah Parker30d4e532018-03-14 17:53:39 -0700646 }
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800647
Sarah Parker30d4e532018-03-14 17:53:39 -0700648 // Test different combination of fwd and bck offset weights
649 for (int k = 0; k < 2; ++k) {
650 for (int l = 0; l < 4; ++l) {
Debargha Mukherjee7ac3eb12018-12-12 10:26:50 -0800651 conv_params1.use_dist_wtd_comp_avg = 1;
652 conv_params2.use_dist_wtd_comp_avg = 1;
Sarah Parker30d4e532018-03-14 17:53:39 -0700653 conv_params1.fwd_offset = quant_dist_lookup_table[k][l][0];
654 conv_params1.bck_offset = quant_dist_lookup_table[k][l][1];
655 conv_params2.fwd_offset = quant_dist_lookup_table[k][l][0];
656 conv_params2.bck_offset = quant_dist_lookup_table[k][l][1];
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800657
Sarah Parker30d4e532018-03-14 17:53:39 -0700658 const int subx_range = has_subx ? 16 : 1;
659 const int suby_range = has_suby ? 16 : 1;
660 for (subx = 0; subx < subx_range; ++subx) {
661 for (suby = 0; suby < suby_range; ++suby) {
662 // Choose random locations within the source block
663 const int offset_r = 3 + rnd_.PseudoUniform(h - out_h - 7);
664 const int offset_c = 3 + rnd_.PseudoUniform(w - out_w - 7);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530665 av1_highbd_jnt_convolve_2d_c(
666 input + offset_r * w + offset_c, w, output16_1, MAX_SB_SIZE,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800667 out_w, out_h, filter_params_x, filter_params_y, subx, suby,
668 &conv_params1, bd);
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530669 test_impl(input + offset_r * w + offset_c, w, output16_2,
Peng Bin3a0c2ed2018-07-19 16:24:00 +0800670 MAX_SB_SIZE, out_w, out_h, filter_params_x,
671 filter_params_y, subx, suby, &conv_params2, bd);
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800672
Sarah Parker30d4e532018-03-14 17:53:39 -0700673 for (int i = 0; i < out_h; ++i) {
674 for (int j = 0; j < out_w; ++j) {
675 int idx = i * MAX_SB_SIZE + j;
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530676 ASSERT_EQ(output1[idx], output2[idx])
Sarah Parker30d4e532018-03-14 17:53:39 -0700677 << out_w << "x" << out_h << " Pixel mismatch at index "
678 << idx << " = (" << i << ", " << j
679 << "), sub pixel offset = (" << suby << ", " << subx
680 << ")";
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800681 }
682 }
Cherma Rajan Aa7be3682018-03-20 10:00:51 +0530683
684 if (memcmp(output16_1, output16_2, sizeof(output16_1))) {
685 for (int i = 0; i < MAX_SB_SIZE; ++i) {
686 for (int j = 0; j < MAX_SB_SIZE; ++j) {
687 int idx = i * MAX_SB_SIZE + j;
688 ASSERT_EQ(output16_1[idx], output16_2[idx])
689 << out_w << "x" << out_h
690 << " Pixel mismatch at index " << idx << " = (" << i
691 << ", " << j << "), sub pixel offset = (" << suby
692 << ", " << subx << ")";
693 }
694 }
695 }
Linfeng Zhanga3e9c502018-01-09 10:04:20 -0800696 }
697 }
698 }
Cheng Chen56d8b952017-11-03 18:55:55 -0700699 }
700 }
701 }
702 }
Cheng Chen56d8b952017-11-03 18:55:55 -0700703}
David Barker8295c7c2017-06-02 15:21:43 +0100704} // namespace AV1HighbdConvolve2D
David Barker8295c7c2017-06-02 15:21:43 +0100705} // namespace libaom_test