blob: 58845f19b4e23c6ec7e35937df85ce4f435f332b [file] [log] [blame]
Yaowu Xuc27fc142016-08-22 16:08:15 -07001/*
Yaowu Xubde4ac82016-11-28 15:26:06 -08002 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
Yaowu Xuc27fc142016-08-22 16:08:15 -07003 *
Yaowu Xubde4ac82016-11-28 15:26:06 -08004 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
Yaowu Xuc27fc142016-08-22 16:08:15 -070010 */
11
Yaowu Xuf883b422016-08-30 14:01:10 -070012#include "./av1_rtcd.h"
Sarah Parker31c66502017-05-19 16:51:07 -070013#include "aom_dsp/inv_txfm.h"
Yaowu Xuc27fc142016-08-22 16:08:15 -070014#include "av1/common/enums.h"
Yaowu Xuf883b422016-08-30 14:01:10 -070015#include "av1/common/av1_txfm.h"
16#include "av1/common/av1_inv_txfm1d.h"
Sarah Parkereec47e62017-05-15 20:49:22 -070017#include "av1/common/av1_inv_txfm1d_cfg.h"
Yaowu Xuc27fc142016-08-22 16:08:15 -070018
19static INLINE TxfmFunc inv_txfm_type_to_func(TXFM_TYPE txfm_type) {
20 switch (txfm_type) {
Yaowu Xuf883b422016-08-30 14:01:10 -070021 case TXFM_TYPE_DCT4: return av1_idct4_new;
22 case TXFM_TYPE_DCT8: return av1_idct8_new;
23 case TXFM_TYPE_DCT16: return av1_idct16_new;
24 case TXFM_TYPE_DCT32: return av1_idct32_new;
25 case TXFM_TYPE_ADST4: return av1_iadst4_new;
26 case TXFM_TYPE_ADST8: return av1_iadst8_new;
27 case TXFM_TYPE_ADST16: return av1_iadst16_new;
28 case TXFM_TYPE_ADST32: return av1_iadst32_new;
Sarah Parker3eed4172017-05-15 20:49:22 -070029#if CONFIG_EXT_TX
30 case TXFM_TYPE_IDENTITY4: return av1_iidentity4_c;
31 case TXFM_TYPE_IDENTITY8: return av1_iidentity8_c;
32 case TXFM_TYPE_IDENTITY16: return av1_iidentity16_c;
33 case TXFM_TYPE_IDENTITY32: return av1_iidentity32_c;
34#endif // CONFIG_EXT_TX
Yaowu Xuc27fc142016-08-22 16:08:15 -070035 default: assert(0); return NULL;
36 }
37}
38
Sarah Parkereec47e62017-05-15 20:49:22 -070039static const TXFM_1D_CFG *inv_txfm_col_cfg_ls[TX_TYPES_1D][TX_SIZES] = {
40 // DCT
Frank Galligan0b73f3e2017-05-03 22:43:22 +000041 {
Timothy B. Terriberryfe67ed62017-04-26 16:53:47 -070042#if CONFIG_CHROMA_2X2
Frank Galligan0b73f3e2017-05-03 22:43:22 +000043 NULL,
44#endif
Sarah Parkereec47e62017-05-15 20:49:22 -070045 &inv_txfm_1d_col_cfg_dct_4, &inv_txfm_1d_col_cfg_dct_8,
46 &inv_txfm_1d_col_cfg_dct_16, &inv_txfm_1d_col_cfg_dct_32 },
47 // ADST
Frank Galligan0b73f3e2017-05-03 22:43:22 +000048 {
Timothy B. Terriberryfe67ed62017-04-26 16:53:47 -070049#if CONFIG_CHROMA_2X2
Frank Galligan0b73f3e2017-05-03 22:43:22 +000050 NULL,
51#endif
Sarah Parkereec47e62017-05-15 20:49:22 -070052 &inv_txfm_1d_col_cfg_adst_4, &inv_txfm_1d_col_cfg_adst_8,
53 &inv_txfm_1d_col_cfg_adst_16, &inv_txfm_1d_col_cfg_adst_32 },
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020054#if CONFIG_EXT_TX
Sarah Parkereec47e62017-05-15 20:49:22 -070055 // FLIPADST
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020056 {
Timothy B. Terriberryfe67ed62017-04-26 16:53:47 -070057#if CONFIG_CHROMA_2X2
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020058 NULL,
Frank Galligan0b73f3e2017-05-03 22:43:22 +000059#endif
Sarah Parkereec47e62017-05-15 20:49:22 -070060 &inv_txfm_1d_col_cfg_adst_4, &inv_txfm_1d_col_cfg_adst_8,
61 &inv_txfm_1d_col_cfg_adst_16, &inv_txfm_1d_col_cfg_adst_32 },
Sarah Parker3eed4172017-05-15 20:49:22 -070062 // IDENTITY
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020063 {
Timothy B. Terriberryfe67ed62017-04-26 16:53:47 -070064#if CONFIG_CHROMA_2X2
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020065 NULL,
66#endif
Sarah Parker3eed4172017-05-15 20:49:22 -070067 &inv_txfm_1d_cfg_identity_4, &inv_txfm_1d_cfg_identity_8,
68 &inv_txfm_1d_cfg_identity_16, &inv_txfm_1d_cfg_identity_32 },
Sarah Parkereec47e62017-05-15 20:49:22 -070069#endif // CONFIG_EXT_TX
70};
71
72static const TXFM_1D_CFG *inv_txfm_row_cfg_ls[TX_TYPES_1D][TX_SIZES] = {
73 // DCT
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020074 {
Timothy B. Terriberryfe67ed62017-04-26 16:53:47 -070075#if CONFIG_CHROMA_2X2
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020076 NULL,
77#endif
Sarah Parkereec47e62017-05-15 20:49:22 -070078 &inv_txfm_1d_row_cfg_dct_4, &inv_txfm_1d_row_cfg_dct_8,
79 &inv_txfm_1d_row_cfg_dct_16, &inv_txfm_1d_row_cfg_dct_32 },
80 // ADST
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020081 {
Timothy B. Terriberryfe67ed62017-04-26 16:53:47 -070082#if CONFIG_CHROMA_2X2
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020083 NULL,
84#endif
Sarah Parkereec47e62017-05-15 20:49:22 -070085 &inv_txfm_1d_row_cfg_adst_4, &inv_txfm_1d_row_cfg_adst_8,
86 &inv_txfm_1d_row_cfg_adst_16, &inv_txfm_1d_row_cfg_adst_32 },
87#if CONFIG_EXT_TX
88 // FLIPADST
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020089 {
Timothy B. Terriberryfe67ed62017-04-26 16:53:47 -070090#if CONFIG_CHROMA_2X2
Fred BARBIERb72ab8f2017-05-08 20:01:07 +020091 NULL,
92#endif
Sarah Parkereec47e62017-05-15 20:49:22 -070093 &inv_txfm_1d_row_cfg_adst_4, &inv_txfm_1d_row_cfg_adst_8,
94 &inv_txfm_1d_row_cfg_adst_16, &inv_txfm_1d_row_cfg_adst_32 },
Sarah Parker3eed4172017-05-15 20:49:22 -070095 // IDENTITY
Sarah Parkereec47e62017-05-15 20:49:22 -070096 {
Timothy B. Terriberryfe67ed62017-04-26 16:53:47 -070097#if CONFIG_CHROMA_2X2
Sarah Parkereec47e62017-05-15 20:49:22 -070098 NULL,
99#endif
Sarah Parker3eed4172017-05-15 20:49:22 -0700100 &inv_txfm_1d_cfg_identity_4, &inv_txfm_1d_cfg_identity_8,
101 &inv_txfm_1d_cfg_identity_16, &inv_txfm_1d_cfg_identity_32 },
Fred BARBIERb72ab8f2017-05-08 20:01:07 +0200102#endif // CONFIG_EXT_TX
103};
Yaowu Xuc27fc142016-08-22 16:08:15 -0700104
Yaowu Xuf883b422016-08-30 14:01:10 -0700105TXFM_2D_FLIP_CFG av1_get_inv_txfm_cfg(int tx_type, int tx_size) {
Yaowu Xuc27fc142016-08-22 16:08:15 -0700106 TXFM_2D_FLIP_CFG cfg;
107 set_flip_cfg(tx_type, &cfg);
Sarah Parker30dfa882017-06-12 14:02:33 -0700108 const int tx_type_col = vtx_tab[tx_type];
109 const int tx_type_row = htx_tab[tx_type];
110 const int tx_size_col = txsize_vert_map[tx_size];
111 const int tx_size_row = txsize_horz_map[tx_size];
Sarah Parker31c66502017-05-19 16:51:07 -0700112 cfg.col_cfg = inv_txfm_col_cfg_ls[tx_type_col][tx_size_col];
113 cfg.row_cfg = inv_txfm_row_cfg_ls[tx_type_row][tx_size_row];
Yaowu Xuc27fc142016-08-22 16:08:15 -0700114 return cfg;
115}
116
Yaowu Xuf883b422016-08-30 14:01:10 -0700117TXFM_2D_FLIP_CFG av1_get_inv_txfm_64x64_cfg(int tx_type) {
Sarah Parkereec47e62017-05-15 20:49:22 -0700118 TXFM_2D_FLIP_CFG cfg = { 0, 0, NULL, NULL };
Yaowu Xuc27fc142016-08-22 16:08:15 -0700119 switch (tx_type) {
120 case DCT_DCT:
Sarah Parkereec47e62017-05-15 20:49:22 -0700121 cfg.col_cfg = &inv_txfm_1d_col_cfg_dct_64;
122 cfg.row_cfg = &inv_txfm_1d_row_cfg_dct_64;
Yaowu Xuc27fc142016-08-22 16:08:15 -0700123 set_flip_cfg(tx_type, &cfg);
124 break;
125 default: assert(0);
126 }
127 return cfg;
128}
129
Jonathan Matthews284f9d02017-06-08 15:49:08 +0100130static INLINE void inv_txfm2d_add_c(const int32_t *input, uint16_t *output,
Yaowu Xuc27fc142016-08-22 16:08:15 -0700131 int stride, TXFM_2D_FLIP_CFG *cfg,
Jonathan Matthews284f9d02017-06-08 15:49:08 +0100132 int32_t *txfm_buf, int bd) {
Sarah Parker31c66502017-05-19 16:51:07 -0700133 // Note when assigning txfm_size_col, we use the txfm_size from the
134 // row configuration and vice versa. This is intentionally done to
135 // accurately perform rectangular transforms. When the transform is
136 // rectangular, the number of columns will be the same as the
137 // txfm_size stored in the row cfg struct. It will make no difference
138 // for square transforms.
139 const int txfm_size_col = cfg->row_cfg->txfm_size;
140 const int txfm_size_row = cfg->col_cfg->txfm_size;
141 // Take the shift from the larger dimension in the rectangular case.
Sarah Parker30dfa882017-06-12 14:02:33 -0700142 const int8_t *shift = (txfm_size_col > txfm_size_row) ? cfg->row_cfg->shift
143 : cfg->col_cfg->shift;
Sarah Parkereec47e62017-05-15 20:49:22 -0700144 const int8_t *stage_range_col = cfg->col_cfg->stage_range;
145 const int8_t *stage_range_row = cfg->row_cfg->stage_range;
146 const int8_t *cos_bit_col = cfg->col_cfg->cos_bit;
147 const int8_t *cos_bit_row = cfg->row_cfg->cos_bit;
148 const TxfmFunc txfm_func_col = inv_txfm_type_to_func(cfg->col_cfg->txfm_type);
149 const TxfmFunc txfm_func_row = inv_txfm_type_to_func(cfg->row_cfg->txfm_type);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700150
Sarah Parker31c66502017-05-19 16:51:07 -0700151 // txfm_buf's length is txfm_size_row * txfm_size_col + 2 * txfm_size_row
Yaowu Xuc27fc142016-08-22 16:08:15 -0700152 // it is used for intermediate data buffering
153 int32_t *temp_in = txfm_buf;
Sarah Parker31c66502017-05-19 16:51:07 -0700154 int32_t *temp_out = temp_in + txfm_size_row;
155 int32_t *buf = temp_out + txfm_size_row;
Yaowu Xuc27fc142016-08-22 16:08:15 -0700156 int32_t *buf_ptr = buf;
157 int c, r;
158
159 // Rows
Sarah Parker31c66502017-05-19 16:51:07 -0700160 for (r = 0; r < txfm_size_row; ++r) {
Yaowu Xuc27fc142016-08-22 16:08:15 -0700161 txfm_func_row(input, buf_ptr, cos_bit_row, stage_range_row);
Sarah Parker31c66502017-05-19 16:51:07 -0700162 round_shift_array(buf_ptr, txfm_size_col, -shift[0]);
163 // Multiply everything by Sqrt2 if the transform is rectangular
164 if (txfm_size_row != txfm_size_col) {
165 for (c = 0; c < txfm_size_col; ++c)
166 buf_ptr[c] = (int32_t)dct_const_round_shift(buf_ptr[c] * Sqrt2);
167 }
168 input += txfm_size_col;
169 buf_ptr += txfm_size_col;
Yaowu Xuc27fc142016-08-22 16:08:15 -0700170 }
171
172 // Columns
Sarah Parker31c66502017-05-19 16:51:07 -0700173 for (c = 0; c < txfm_size_col; ++c) {
Yaowu Xuc27fc142016-08-22 16:08:15 -0700174 if (cfg->lr_flip == 0) {
Sarah Parker31c66502017-05-19 16:51:07 -0700175 for (r = 0; r < txfm_size_row; ++r)
176 temp_in[r] = buf[r * txfm_size_col + c];
Yaowu Xuc27fc142016-08-22 16:08:15 -0700177 } else {
178 // flip left right
Sarah Parker31c66502017-05-19 16:51:07 -0700179 for (r = 0; r < txfm_size_row; ++r)
180 temp_in[r] = buf[r * txfm_size_col + (txfm_size_col - c - 1)];
Yaowu Xuc27fc142016-08-22 16:08:15 -0700181 }
182 txfm_func_col(temp_in, temp_out, cos_bit_col, stage_range_col);
Sarah Parker31c66502017-05-19 16:51:07 -0700183 round_shift_array(temp_out, txfm_size_row, -shift[1]);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700184 if (cfg->ud_flip == 0) {
Jonathan Matthews284f9d02017-06-08 15:49:08 +0100185 for (r = 0; r < txfm_size_row; ++r) {
186 output[r * stride + c] =
187 highbd_clip_pixel_add(output[r * stride + c], temp_out[r], bd);
188 }
Yaowu Xuc27fc142016-08-22 16:08:15 -0700189 } else {
190 // flip upside down
Jonathan Matthews284f9d02017-06-08 15:49:08 +0100191 for (r = 0; r < txfm_size_row; ++r) {
192 output[r * stride + c] = highbd_clip_pixel_add(
193 output[r * stride + c], temp_out[txfm_size_row - r - 1], bd);
194 }
Yaowu Xuc27fc142016-08-22 16:08:15 -0700195 }
196 }
197}
198
Frederic Barbierc53753f2017-04-25 11:05:01 +0200199static INLINE void inv_txfm2d_add_facade(const int32_t *input, uint16_t *output,
200 int stride, int32_t *txfm_buf,
201 int tx_type, int tx_size, int bd) {
Frederic Barbierc53753f2017-04-25 11:05:01 +0200202 TXFM_2D_FLIP_CFG cfg = av1_get_inv_txfm_cfg(tx_type, tx_size);
Jonathan Matthews284f9d02017-06-08 15:49:08 +0100203 inv_txfm2d_add_c(input, output, stride, &cfg, txfm_buf, bd);
Sarah Parker31c66502017-05-19 16:51:07 -0700204}
205
206void av1_inv_txfm2d_add_4x8_c(const int32_t *input, uint16_t *output,
207 int stride, int tx_type, int bd) {
208 int txfm_buf[4 * 8 + 8 + 8];
209 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_4X8, bd);
210}
211
212void av1_inv_txfm2d_add_8x4_c(const int32_t *input, uint16_t *output,
213 int stride, int tx_type, int bd) {
214 int txfm_buf[8 * 4 + 4 + 4];
215 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_8X4, bd);
216}
217
218void av1_inv_txfm2d_add_8x16_c(const int32_t *input, uint16_t *output,
219 int stride, int tx_type, int bd) {
220 int txfm_buf[8 * 16 + 16 + 16];
221 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_8X16, bd);
222}
223
224void av1_inv_txfm2d_add_16x8_c(const int32_t *input, uint16_t *output,
225 int stride, int tx_type, int bd) {
226 int txfm_buf[16 * 8 + 8 + 8];
227 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_16X8, bd);
228}
229
230void av1_inv_txfm2d_add_16x32_c(const int32_t *input, uint16_t *output,
231 int stride, int tx_type, int bd) {
232 int txfm_buf[16 * 32 + 32 + 32];
233 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_16X32, bd);
234}
235
236void av1_inv_txfm2d_add_32x16_c(const int32_t *input, uint16_t *output,
237 int stride, int tx_type, int bd) {
238 int txfm_buf[32 * 16 + 16 + 16];
239 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_32X16, bd);
Frederic Barbierc53753f2017-04-25 11:05:01 +0200240}
241
242void av1_inv_txfm2d_add_4x4_c(const int32_t *input, uint16_t *output,
243 int stride, int tx_type, int bd) {
244 int txfm_buf[4 * 4 + 4 + 4];
245 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_4X4, bd);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700246}
247
Yaowu Xuf883b422016-08-30 14:01:10 -0700248void av1_inv_txfm2d_add_8x8_c(const int32_t *input, uint16_t *output,
249 int stride, int tx_type, int bd) {
Yaowu Xuc27fc142016-08-22 16:08:15 -0700250 int txfm_buf[8 * 8 + 8 + 8];
Frederic Barbierc53753f2017-04-25 11:05:01 +0200251 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_8X8, bd);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700252}
253
Yaowu Xuf883b422016-08-30 14:01:10 -0700254void av1_inv_txfm2d_add_16x16_c(const int32_t *input, uint16_t *output,
255 int stride, int tx_type, int bd) {
Yaowu Xuc27fc142016-08-22 16:08:15 -0700256 int txfm_buf[16 * 16 + 16 + 16];
Frederic Barbierc53753f2017-04-25 11:05:01 +0200257 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_16X16, bd);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700258}
259
Yaowu Xuf883b422016-08-30 14:01:10 -0700260void av1_inv_txfm2d_add_32x32_c(const int32_t *input, uint16_t *output,
261 int stride, int tx_type, int bd) {
Yaowu Xuc27fc142016-08-22 16:08:15 -0700262 int txfm_buf[32 * 32 + 32 + 32];
Frederic Barbierc53753f2017-04-25 11:05:01 +0200263 inv_txfm2d_add_facade(input, output, stride, txfm_buf, tx_type, TX_32X32, bd);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700264}
265
Yaowu Xuf883b422016-08-30 14:01:10 -0700266void av1_inv_txfm2d_add_64x64_c(const int32_t *input, uint16_t *output,
267 int stride, int tx_type, int bd) {
Yaowu Xuc27fc142016-08-22 16:08:15 -0700268 int txfm_buf[64 * 64 + 64 + 64];
Yaowu Xuf883b422016-08-30 14:01:10 -0700269 TXFM_2D_FLIP_CFG cfg = av1_get_inv_txfm_64x64_cfg(tx_type);
Jonathan Matthews284f9d02017-06-08 15:49:08 +0100270 inv_txfm2d_add_c(input, output, stride, &cfg, txfm_buf, bd);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700271}