Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2017, Alliance for Open Media. All rights reserved |
| 3 | * |
| 4 | * This source code is subject to the terms of the BSD 2 Clause License and |
| 5 | * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
| 6 | * was not distributed with this source code in the LICENSE file, you can |
| 7 | * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
| 8 | * Media Patent License 1.0 was not distributed with this source code in the |
| 9 | * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
| 10 | */ |
| 11 | |
Linfeng Zhang | ae7b2f3 | 2017-11-08 15:46:57 -0800 | [diff] [blame] | 12 | #include "aom_ports/mem.h" |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 13 | #include "av1/common/scan.h" |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 14 | #include "av1/common/blockd.h" |
Angie Chiang | e50f3ec | 2017-04-10 15:50:33 -0700 | [diff] [blame] | 15 | #include "av1/common/idct.h" |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 16 | #include "av1/common/pred_common.h" |
Angie Chiang | 1628fcc | 2017-04-13 16:30:30 -0700 | [diff] [blame] | 17 | #include "av1/encoder/bitstream.h" |
| 18 | #include "av1/encoder/encodeframe.h" |
Angie Chiang | 47c7218 | 2017-02-27 14:30:38 -0800 | [diff] [blame] | 19 | #include "av1/encoder/cost.h" |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 20 | #include "av1/encoder/encodetxb.h" |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 21 | #include "av1/encoder/hash.h" |
Angie Chiang | 808d859 | 2017-04-06 18:36:55 -0700 | [diff] [blame] | 22 | #include "av1/encoder/rdopt.h" |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 23 | #include "av1/encoder/tokenize.h" |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 24 | |
Angie Chiang | 47e0707 | 2017-05-30 17:27:01 -0700 | [diff] [blame] | 25 | #define TEST_OPTIMIZE_TXB 0 |
| 26 | |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 27 | static int hbt_hash_needs_init = 1; |
| 28 | static CRC_CALCULATOR crc_calculator; |
| 29 | static CRC_CALCULATOR crc_calculator2; |
| 30 | static const int HBT_HASH_EOB = 16; // also the length in opt_qcoeff |
| 31 | |
| 32 | typedef struct OptTxbQcoeff { |
| 33 | uint32_t hbt_hash_match; |
| 34 | double hits; |
| 35 | tran_low_t opt_qcoeff[16]; |
| 36 | } OptTxbQcoeff; |
| 37 | |
| 38 | OptTxbQcoeff hbt_hash_table[65536][16]; |
| 39 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 40 | typedef struct LevelDownStats { |
| 41 | int update; |
| 42 | tran_low_t low_qc; |
| 43 | tran_low_t low_dqc; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 44 | int64_t dist0; |
| 45 | int rate; |
| 46 | int rate_low; |
| 47 | int64_t dist; |
| 48 | int64_t dist_low; |
| 49 | int64_t rd; |
| 50 | int64_t rd_low; |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 51 | int64_t nz_rd; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 52 | int64_t rd_diff; |
| 53 | int cost_diff; |
| 54 | int64_t dist_diff; |
| 55 | int new_eob; |
| 56 | } LevelDownStats; |
| 57 | |
Angie Chiang | f0fbf9d | 2017-03-15 15:01:22 -0700 | [diff] [blame] | 58 | void av1_alloc_txb_buf(AV1_COMP *cpi) { |
Angie Chiang | c484abe | 2017-03-20 15:43:11 -0700 | [diff] [blame] | 59 | #if 0 |
Angie Chiang | f0fbf9d | 2017-03-15 15:01:22 -0700 | [diff] [blame] | 60 | AV1_COMMON *cm = &cpi->common; |
| 61 | int mi_block_size = 1 << MI_SIZE_LOG2; |
| 62 | // TODO(angiebird): Make sure cm->subsampling_x/y is set correctly, and then |
| 63 | // use precise buffer size according to cm->subsampling_x/y |
| 64 | int pixel_stride = mi_block_size * cm->mi_cols; |
| 65 | int pixel_height = mi_block_size * cm->mi_rows; |
| 66 | int i; |
| 67 | for (i = 0; i < MAX_MB_PLANE; ++i) { |
| 68 | CHECK_MEM_ERROR( |
| 69 | cm, cpi->tcoeff_buf[i], |
| 70 | aom_malloc(sizeof(*cpi->tcoeff_buf[i]) * pixel_stride * pixel_height)); |
| 71 | } |
Angie Chiang | c484abe | 2017-03-20 15:43:11 -0700 | [diff] [blame] | 72 | #else |
Jingning Han | f5a4d3b | 2017-08-27 23:01:19 -0700 | [diff] [blame] | 73 | AV1_COMMON *cm = &cpi->common; |
Dominic Symes | 917d6c0 | 2017-10-11 18:00:52 +0200 | [diff] [blame] | 74 | int size = ((cm->mi_rows >> cm->mib_size_log2) + 1) * |
| 75 | ((cm->mi_cols >> cm->mib_size_log2) + 1); |
Jingning Han | f5a4d3b | 2017-08-27 23:01:19 -0700 | [diff] [blame] | 76 | |
Angie Chiang | 9367e3e | 2017-10-02 16:28:11 -0700 | [diff] [blame] | 77 | av1_free_txb_buf(cpi); |
Jingning Han | f5a4d3b | 2017-08-27 23:01:19 -0700 | [diff] [blame] | 78 | // TODO(jingning): This should be further reduced. |
| 79 | CHECK_MEM_ERROR(cm, cpi->coeff_buffer_base, |
| 80 | aom_malloc(sizeof(*cpi->coeff_buffer_base) * size)); |
Angie Chiang | c484abe | 2017-03-20 15:43:11 -0700 | [diff] [blame] | 81 | #endif |
Angie Chiang | f0fbf9d | 2017-03-15 15:01:22 -0700 | [diff] [blame] | 82 | } |
| 83 | |
| 84 | void av1_free_txb_buf(AV1_COMP *cpi) { |
Angie Chiang | c484abe | 2017-03-20 15:43:11 -0700 | [diff] [blame] | 85 | #if 0 |
Angie Chiang | f0fbf9d | 2017-03-15 15:01:22 -0700 | [diff] [blame] | 86 | int i; |
| 87 | for (i = 0; i < MAX_MB_PLANE; ++i) { |
| 88 | aom_free(cpi->tcoeff_buf[i]); |
| 89 | } |
Angie Chiang | c484abe | 2017-03-20 15:43:11 -0700 | [diff] [blame] | 90 | #else |
Jingning Han | f5a4d3b | 2017-08-27 23:01:19 -0700 | [diff] [blame] | 91 | aom_free(cpi->coeff_buffer_base); |
Angie Chiang | c484abe | 2017-03-20 15:43:11 -0700 | [diff] [blame] | 92 | #endif |
Angie Chiang | f0fbf9d | 2017-03-15 15:01:22 -0700 | [diff] [blame] | 93 | } |
| 94 | |
Jingning Han | f5a4d3b | 2017-08-27 23:01:19 -0700 | [diff] [blame] | 95 | void av1_set_coeff_buffer(const AV1_COMP *const cpi, MACROBLOCK *const x, |
| 96 | int mi_row, int mi_col) { |
Dominic Symes | 917d6c0 | 2017-10-11 18:00:52 +0200 | [diff] [blame] | 97 | int mib_size_log2 = cpi->common.mib_size_log2; |
| 98 | int stride = (cpi->common.mi_cols >> mib_size_log2) + 1; |
| 99 | int offset = (mi_row >> mib_size_log2) * stride + (mi_col >> mib_size_log2); |
Jingning Han | f5a4d3b | 2017-08-27 23:01:19 -0700 | [diff] [blame] | 100 | CB_COEFF_BUFFER *coeff_buf = &cpi->coeff_buffer_base[offset]; |
| 101 | const int txb_offset = x->cb_offset / (TX_SIZE_W_MIN * TX_SIZE_H_MIN); |
| 102 | for (int plane = 0; plane < MAX_MB_PLANE; ++plane) { |
| 103 | x->mbmi_ext->tcoeff[plane] = coeff_buf->tcoeff[plane] + x->cb_offset; |
| 104 | x->mbmi_ext->eobs[plane] = coeff_buf->eobs[plane] + txb_offset; |
| 105 | x->mbmi_ext->txb_skip_ctx[plane] = |
| 106 | coeff_buf->txb_skip_ctx[plane] + txb_offset; |
| 107 | x->mbmi_ext->dc_sign_ctx[plane] = |
| 108 | coeff_buf->dc_sign_ctx[plane] + txb_offset; |
| 109 | } |
| 110 | } |
| 111 | |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 112 | static void write_golomb(aom_writer *w, int level) { |
| 113 | int x = level + 1; |
| 114 | int i = x; |
| 115 | int length = 0; |
| 116 | |
| 117 | while (i) { |
| 118 | i >>= 1; |
| 119 | ++length; |
| 120 | } |
| 121 | assert(length > 0); |
| 122 | |
| 123 | for (i = 0; i < length - 1; ++i) aom_write_bit(w, 0); |
| 124 | |
| 125 | for (i = length - 1; i >= 0; --i) aom_write_bit(w, (x >> i) & 0x01); |
| 126 | } |
| 127 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 128 | static INLINE tran_low_t get_lower_coeff(tran_low_t qc) { |
| 129 | if (qc == 0) { |
| 130 | return 0; |
| 131 | } |
| 132 | return qc > 0 ? qc - 1 : qc + 1; |
| 133 | } |
| 134 | |
Sarah Parker | 3d75209 | 2017-12-20 15:37:55 -0800 | [diff] [blame] | 135 | static INLINE tran_low_t qcoeff_to_dqcoeff(tran_low_t qc, |
| 136 | #if CONFIG_NEW_QUANT |
| 137 | const tran_low_t *nq_dq, |
| 138 | #endif // CONFIG_NEW_QUANT |
| 139 | int dqv, int shift) { |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 140 | int sgn = qc < 0 ? -1 : 1; |
Sarah Parker | 3d75209 | 2017-12-20 15:37:55 -0800 | [diff] [blame] | 141 | #if CONFIG_NEW_QUANT |
Sarah Parker | 8a086e0 | 2018-01-10 14:56:42 -0800 | [diff] [blame] | 142 | int dqcoeff = av1_dequant_coeff_nuq(abs(qc), dqv, nq_dq, shift); |
| 143 | return sgn * dqcoeff; |
Sarah Parker | 3d75209 | 2017-12-20 15:37:55 -0800 | [diff] [blame] | 144 | #endif // CONFIG_NEW_QUANT |
| 145 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 146 | return sgn * ((abs(qc) * dqv) >> shift); |
| 147 | } |
| 148 | |
| 149 | static INLINE int64_t get_coeff_dist(tran_low_t tcoeff, tran_low_t dqcoeff, |
| 150 | int shift) { |
Monty Montgomery | 4a05a58 | 2017-11-01 21:21:07 -0400 | [diff] [blame] | 151 | #if CONFIG_DAALA_TX |
| 152 | int depth_shift = (TX_COEFF_DEPTH - 11) * 2; |
| 153 | int depth_round = depth_shift > 1 ? (1 << (depth_shift - 1)) : 0; |
| 154 | const int64_t diff = tcoeff - dqcoeff; |
Monty | bca9e9e | 2017-12-14 06:23:29 -0600 | [diff] [blame] | 155 | const int64_t error = (diff * diff + depth_round) >> depth_shift; |
Monty Montgomery | 4a05a58 | 2017-11-01 21:21:07 -0400 | [diff] [blame] | 156 | (void)shift; |
| 157 | #else |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 158 | const int64_t diff = (tcoeff - dqcoeff) * (1 << shift); |
| 159 | const int64_t error = diff * diff; |
Monty Montgomery | 4a05a58 | 2017-11-01 21:21:07 -0400 | [diff] [blame] | 160 | #endif |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 161 | return error; |
| 162 | } |
| 163 | |
Jingning Han | 35deaa7 | 2017-10-26 15:36:30 -0700 | [diff] [blame] | 164 | void av1_update_eob_context(int eob, int seg_eob, TX_SIZE tx_size, |
| 165 | TX_TYPE tx_type, PLANE_TYPE plane, |
Yunqing Wang | 0e141b5 | 2017-11-02 15:08:58 -0700 | [diff] [blame] | 166 | FRAME_CONTEXT *ec_ctx, FRAME_COUNTS *counts, |
| 167 | uint8_t allow_update_cdf) { |
Linfeng Zhang | 0c72b2f | 2017-12-04 10:59:28 -0800 | [diff] [blame] | 168 | int eob_extra, dummy; |
| 169 | const int eob_pt = get_eob_pos_token(eob, &eob_extra); |
| 170 | const int max_eob_pt = get_eob_pos_token(seg_eob, &dummy); |
Debargha Mukherjee | b3eda2f | 2017-11-28 16:00:20 -0800 | [diff] [blame] | 171 | TX_SIZE txs_ctx = get_txsize_entropy_ctx(tx_size); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 172 | |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 173 | (void)max_eob_pt; |
| 174 | const int eob_multi_size = txsize_log2_minus4[tx_size]; |
| 175 | const int eob_multi_ctx = (tx_type_to_class[tx_type] == TX_CLASS_2D) ? 0 : 1; |
| 176 | |
| 177 | switch (eob_multi_size) { |
| 178 | case 0: |
| 179 | ++counts->eob_multi16[plane][eob_multi_ctx][eob_pt - 1]; |
| 180 | if (allow_update_cdf) |
| 181 | update_cdf(ec_ctx->eob_flag_cdf16[plane][eob_multi_ctx], eob_pt - 1, 5); |
| 182 | break; |
| 183 | case 1: |
| 184 | ++counts->eob_multi32[plane][eob_multi_ctx][eob_pt - 1]; |
| 185 | if (allow_update_cdf) |
| 186 | update_cdf(ec_ctx->eob_flag_cdf32[plane][eob_multi_ctx], eob_pt - 1, 6); |
| 187 | break; |
| 188 | case 2: |
| 189 | ++counts->eob_multi64[plane][eob_multi_ctx][eob_pt - 1]; |
| 190 | if (allow_update_cdf) |
| 191 | update_cdf(ec_ctx->eob_flag_cdf64[plane][eob_multi_ctx], eob_pt - 1, 7); |
| 192 | break; |
| 193 | case 3: |
| 194 | ++counts->eob_multi128[plane][eob_multi_ctx][eob_pt - 1]; |
| 195 | if (allow_update_cdf) |
| 196 | update_cdf(ec_ctx->eob_flag_cdf128[plane][eob_multi_ctx], eob_pt - 1, |
| 197 | 8); |
| 198 | break; |
| 199 | case 4: |
| 200 | ++counts->eob_multi256[plane][eob_multi_ctx][eob_pt - 1]; |
| 201 | if (allow_update_cdf) |
| 202 | update_cdf(ec_ctx->eob_flag_cdf256[plane][eob_multi_ctx], eob_pt - 1, |
| 203 | 9); |
| 204 | break; |
| 205 | case 5: |
| 206 | ++counts->eob_multi512[plane][eob_multi_ctx][eob_pt - 1]; |
| 207 | if (allow_update_cdf) |
| 208 | update_cdf(ec_ctx->eob_flag_cdf512[plane][eob_multi_ctx], eob_pt - 1, |
| 209 | 10); |
| 210 | break; |
| 211 | case 6: |
| 212 | default: |
| 213 | ++counts->eob_multi1024[plane][eob_multi_ctx][eob_pt - 1]; |
| 214 | if (allow_update_cdf) |
| 215 | update_cdf(ec_ctx->eob_flag_cdf1024[plane][eob_multi_ctx], eob_pt - 1, |
| 216 | 11); |
| 217 | break; |
| 218 | } |
Jingning Han | 00803a7 | 2017-10-25 16:04:34 -0700 | [diff] [blame] | 219 | |
Angie Chiang | 7ab884e | 2017-10-18 15:57:12 -0700 | [diff] [blame] | 220 | if (k_eob_offset_bits[eob_pt] > 0) { |
| 221 | int eob_shift = k_eob_offset_bits[eob_pt] - 1; |
| 222 | int bit = (eob_extra & (1 << eob_shift)) ? 1 : 0; |
Jingning Han | 35deaa7 | 2017-10-26 15:36:30 -0700 | [diff] [blame] | 223 | counts->eob_extra[txs_ctx][plane][eob_pt][bit]++; |
Yunqing Wang | 0e141b5 | 2017-11-02 15:08:58 -0700 | [diff] [blame] | 224 | if (allow_update_cdf) |
| 225 | update_cdf(ec_ctx->eob_extra_cdf[txs_ctx][plane][eob_pt], bit, 2); |
Angie Chiang | 7ab884e | 2017-10-18 15:57:12 -0700 | [diff] [blame] | 226 | } |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 227 | } |
| 228 | |
| 229 | static int get_eob_cost(int eob, int seg_eob, |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 230 | const LV_MAP_EOB_COST *txb_eob_costs, |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 231 | const LV_MAP_COEFF_COST *txb_costs, TX_TYPE tx_type) { |
Linfeng Zhang | 0c72b2f | 2017-12-04 10:59:28 -0800 | [diff] [blame] | 232 | int eob_extra, dummy; |
| 233 | const int eob_pt = get_eob_pos_token(eob, &eob_extra); |
| 234 | const int max_eob_pt = get_eob_pos_token(seg_eob, &dummy); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 235 | int eob_cost = 0; |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 236 | (void)max_eob_pt; |
| 237 | const int eob_multi_ctx = (tx_type_to_class[tx_type] == TX_CLASS_2D) ? 0 : 1; |
| 238 | eob_cost = txb_eob_costs->eob_cost[eob_multi_ctx][eob_pt - 1]; |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 239 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 240 | if (k_eob_offset_bits[eob_pt] > 0) { |
Angie Chiang | 7ab884e | 2017-10-18 15:57:12 -0700 | [diff] [blame] | 241 | int eob_shift = k_eob_offset_bits[eob_pt] - 1; |
| 242 | int bit = (eob_extra & (1 << eob_shift)) ? 1 : 0; |
| 243 | eob_cost += txb_costs->eob_extra_cost[eob_pt][bit]; |
| 244 | for (int i = 1; i < k_eob_offset_bits[eob_pt]; i++) { |
| 245 | eob_shift = k_eob_offset_bits[eob_pt] - 1 - i; |
| 246 | bit = (eob_extra & (1 << eob_shift)) ? 1 : 0; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 247 | eob_cost += av1_cost_bit(128, bit); |
| 248 | } |
| 249 | } |
| 250 | return eob_cost; |
| 251 | } |
| 252 | |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 253 | static int get_coeff_cost(const tran_low_t qc, const int scan_idx, |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 254 | const int is_eob, const TxbInfo *const txb_info, |
Linfeng Zhang | 5f1b8ce | 2017-12-11 15:53:10 -0800 | [diff] [blame] | 255 | const LV_MAP_COEFF_COST *const txb_costs, |
| 256 | const int coeff_ctx); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 257 | |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 258 | static void get_dist_cost_stats(LevelDownStats *const stats, const int scan_idx, |
Ola Hugosson | 1389210 | 2017-11-06 08:01:44 +0100 | [diff] [blame] | 259 | const int is_eob, |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 260 | const LV_MAP_COEFF_COST *const txb_costs, |
Cheng Chen | 37d8873 | 2018-01-09 14:02:41 -0800 | [diff] [blame] | 261 | const TxbInfo *const txb_info, |
| 262 | int has_nz_tail) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 263 | const int16_t *const scan = txb_info->scan_order->scan; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 264 | const int coeff_idx = scan[scan_idx]; |
| 265 | const tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 266 | const uint8_t *const levels = txb_info->levels; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 267 | stats->new_eob = -1; |
| 268 | stats->update = 0; |
Debargha Mukherjee | e2f6b16 | 2018-01-04 17:23:05 -0800 | [diff] [blame] | 269 | stats->rd_low = 0; |
| 270 | stats->rd = 0; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 271 | // TODO(mfo): explore if there's a better way to prevent compiler init |
| 272 | // warnings |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 273 | stats->nz_rd = 0; |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 274 | stats->dist_low = 0; |
| 275 | stats->rate_low = 0; |
| 276 | stats->low_qc = 0; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 277 | |
| 278 | const tran_low_t tqc = txb_info->tcoeff[coeff_idx]; |
| 279 | const int dqv = txb_info->dequant[coeff_idx != 0]; |
Sarah Parker | 3d75209 | 2017-12-20 15:37:55 -0800 | [diff] [blame] | 280 | #if CONFIG_NEW_QUANT |
| 281 | const tran_low_t *nq_dequant_val = txb_info->nq_dequant_vals[coeff_idx != 0]; |
| 282 | #endif // CONFIG_NEW_QUANT |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 283 | |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 284 | const int coeff_ctx = |
| 285 | get_nz_map_ctx(levels, coeff_idx, txb_info->bwl, txb_info->height, |
| 286 | scan_idx, is_eob, txb_info->tx_size, txb_info->tx_type); |
| 287 | const int qc_cost = |
| 288 | get_coeff_cost(qc, scan_idx, is_eob, txb_info, txb_costs, coeff_ctx); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 289 | if (qc == 0) { |
Cheng Chen | 7964120 | 2018-01-04 18:52:52 -0800 | [diff] [blame] | 290 | stats->dist = 0; |
| 291 | stats->rate = qc_cost; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 292 | return; |
Cheng Chen | 7964120 | 2018-01-04 18:52:52 -0800 | [diff] [blame] | 293 | } else { |
| 294 | const tran_low_t dqc = qcoeff_to_dqcoeff(qc, |
| 295 | #if CONFIG_NEW_QUANT |
| 296 | nq_dequant_val, |
| 297 | #endif // CONFIG_NEW_QUANT |
| 298 | dqv, txb_info->shift); |
| 299 | const int64_t dqc_dist = get_coeff_dist(tqc, dqc, txb_info->shift); |
| 300 | |
| 301 | // distortion difference when coefficient is quantized to 0 |
| 302 | const tran_low_t dqc0 = qcoeff_to_dqcoeff(0, |
| 303 | #if CONFIG_NEW_QUANT |
| 304 | nq_dequant_val, |
| 305 | #endif // CONFIG_NEW_QUANT |
| 306 | dqv, txb_info->shift); |
| 307 | |
| 308 | stats->dist0 = get_coeff_dist(tqc, dqc0, txb_info->shift); |
| 309 | stats->dist = dqc_dist - stats->dist0; |
| 310 | stats->rate = qc_cost; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 311 | } |
Cheng Chen | 7964120 | 2018-01-04 18:52:52 -0800 | [diff] [blame] | 312 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 313 | stats->rd = RDCOST(txb_info->rdmult, stats->rate, stats->dist); |
| 314 | |
| 315 | stats->low_qc = get_lower_coeff(qc); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 316 | |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 317 | if (is_eob && stats->low_qc == 0) { |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 318 | stats->rd_low = stats->rd; // disable selection of low_qc in this case. |
Ola Hugosson | 1389210 | 2017-11-06 08:01:44 +0100 | [diff] [blame] | 319 | } else { |
Cheng Chen | 37d8873 | 2018-01-09 14:02:41 -0800 | [diff] [blame] | 320 | if (stats->low_qc == 0) { |
| 321 | stats->dist_low = 0; |
| 322 | } else { |
| 323 | stats->low_dqc = qcoeff_to_dqcoeff(stats->low_qc, |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 324 | #if CONFIG_NEW_QUANT |
Cheng Chen | 37d8873 | 2018-01-09 14:02:41 -0800 | [diff] [blame] | 325 | nq_dequant_val, |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 326 | #endif // CONFIG_NEW_QUANT |
Cheng Chen | 37d8873 | 2018-01-09 14:02:41 -0800 | [diff] [blame] | 327 | dqv, txb_info->shift); |
| 328 | const int64_t low_dqc_dist = |
| 329 | get_coeff_dist(tqc, stats->low_dqc, txb_info->shift); |
| 330 | stats->dist_low = low_dqc_dist - stats->dist0; |
| 331 | } |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 332 | const int low_qc_cost = get_coeff_cost(stats->low_qc, scan_idx, is_eob, |
Yaowu Xu | 0154f2b | 2018-01-04 09:01:17 -0800 | [diff] [blame] | 333 | txb_info, txb_costs, coeff_ctx); |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 334 | stats->rate_low = low_qc_cost; |
| 335 | stats->rd_low = RDCOST(txb_info->rdmult, stats->rate_low, stats->dist_low); |
Ola Hugosson | 1389210 | 2017-11-06 08:01:44 +0100 | [diff] [blame] | 336 | } |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 337 | if ((has_nz_tail < 2) && ((scan_idx == txb_info->eob - 1) || !is_eob)) { |
Cheng Chen | 37d8873 | 2018-01-09 14:02:41 -0800 | [diff] [blame] | 338 | (void)levels; |
| 339 | const int coeff_ctx_temp = |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 340 | get_nz_map_ctx(levels, coeff_idx, txb_info->bwl, txb_info->height, |
| 341 | scan_idx, 1, txb_info->tx_size, txb_info->tx_type); |
Cheng Chen | 37d8873 | 2018-01-09 14:02:41 -0800 | [diff] [blame] | 342 | const int qc_eob_cost = |
| 343 | get_coeff_cost(qc, scan_idx, 1, txb_info, txb_costs, coeff_ctx_temp); |
| 344 | int64_t rd_eob = RDCOST(txb_info->rdmult, qc_eob_cost, stats->dist); |
| 345 | if (stats->low_qc != 0) { |
| 346 | const int low_qc_eob_cost = get_coeff_cost( |
| 347 | stats->low_qc, scan_idx, 1, txb_info, txb_costs, coeff_ctx_temp); |
| 348 | int64_t rd_eob_low = |
| 349 | RDCOST(txb_info->rdmult, low_qc_eob_cost, stats->dist_low); |
| 350 | rd_eob = (rd_eob > rd_eob_low) ? rd_eob_low : rd_eob; |
| 351 | } |
| 352 | |
| 353 | stats->nz_rd = AOMMIN(stats->rd_low, stats->rd) - rd_eob; |
Cheng Chen | 37d8873 | 2018-01-09 14:02:41 -0800 | [diff] [blame] | 354 | } |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 355 | } |
| 356 | |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 357 | static INLINE void update_qcoeff(const int coeff_idx, const tran_low_t qc, |
| 358 | const TxbInfo *const txb_info) { |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 359 | txb_info->qcoeff[coeff_idx] = qc; |
Linfeng Zhang | d564737 | 2017-12-05 17:06:07 -0800 | [diff] [blame] | 360 | txb_info->levels[get_padded_idx(coeff_idx, txb_info->bwl)] = |
Jingning Han | 5cb408e | 2017-11-17 14:43:39 -0800 | [diff] [blame] | 361 | (uint8_t)clamp(abs(qc), 0, INT8_MAX); |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 362 | } |
| 363 | |
| 364 | static INLINE void update_coeff(const int coeff_idx, const tran_low_t qc, |
| 365 | const TxbInfo *const txb_info) { |
| 366 | update_qcoeff(coeff_idx, qc, txb_info); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 367 | const int dqv = txb_info->dequant[coeff_idx != 0]; |
Sarah Parker | 3d75209 | 2017-12-20 15:37:55 -0800 | [diff] [blame] | 368 | #if CONFIG_NEW_QUANT |
| 369 | const tran_low_t *nq_dequant_val = txb_info->nq_dequant_vals[coeff_idx != 0]; |
| 370 | #endif // CONFIG_NEW_QUANT |
| 371 | txb_info->dqcoeff[coeff_idx] = qcoeff_to_dqcoeff(qc, |
| 372 | #if CONFIG_NEW_QUANT |
| 373 | nq_dequant_val, |
| 374 | #endif // CONFIG_NEW_QUANT |
| 375 | dqv, txb_info->shift); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 376 | } |
| 377 | |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 378 | static INLINE void av1_txb_init_levels(const tran_low_t *const coeff, |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 379 | const int width, const int height, |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 380 | uint8_t *const levels) { |
| 381 | const int stride = width + TX_PAD_HOR; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 382 | uint8_t *ls = levels; |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 383 | |
| 384 | memset(levels - TX_PAD_TOP * stride, 0, |
| 385 | sizeof(*levels) * TX_PAD_TOP * stride); |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 386 | memset(levels + stride * height, 0, |
| 387 | sizeof(*levels) * (TX_PAD_BOTTOM * stride + TX_PAD_END)); |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 388 | |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 389 | for (int i = 0; i < height; i++) { |
| 390 | for (int j = 0; j < width; j++) { |
Jingning Han | 5cb408e | 2017-11-17 14:43:39 -0800 | [diff] [blame] | 391 | *ls++ = (uint8_t)clamp(abs(coeff[i * width + j]), 0, INT8_MAX); |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 392 | } |
| 393 | for (int j = 0; j < TX_PAD_HOR; j++) { |
| 394 | *ls++ = 0; |
| 395 | } |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 396 | } |
| 397 | } |
| 398 | |
Linfeng Zhang | 0ba23e8 | 2017-12-20 16:27:28 -0800 | [diff] [blame] | 399 | void av1_get_nz_map_contexts_c(const uint8_t *const levels, |
| 400 | const int16_t *const scan, const uint16_t eob, |
| 401 | const TX_SIZE tx_size, const TX_TYPE tx_type, |
| 402 | int8_t *const coeff_contexts) { |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 403 | const int bwl = get_txb_bwl(tx_size); |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 404 | const int height = get_txb_high(tx_size); |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 405 | for (int i = 0; i < eob; ++i) { |
| 406 | const int pos = scan[i]; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 407 | coeff_contexts[pos] = get_nz_map_ctx(levels, pos, bwl, height, i, |
| 408 | i == eob - 1, tx_size, tx_type); |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 409 | } |
| 410 | } |
| 411 | |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 412 | void av1_write_coeffs_txb(const AV1_COMMON *const cm, MACROBLOCKD *xd, |
Luc Trudeau | 2eb9b84 | 2017-12-13 11:19:16 -0500 | [diff] [blame] | 413 | aom_writer *w, int blk_row, int blk_col, int plane, |
| 414 | TX_SIZE tx_size, const tran_low_t *tcoeff, |
Jingning Han | 7eab9ff | 2017-07-06 10:12:54 -0700 | [diff] [blame] | 415 | uint16_t eob, TXB_CTX *txb_ctx) { |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 416 | MB_MODE_INFO *mbmi = &xd->mi[0]->mbmi; |
Angie Chiang | cea11f2 | 2017-02-24 12:30:40 -0800 | [diff] [blame] | 417 | const PLANE_TYPE plane_type = get_plane_type(plane); |
Debargha Mukherjee | b3eda2f | 2017-11-28 16:00:20 -0800 | [diff] [blame] | 418 | const TX_SIZE txs_ctx = get_txsize_entropy_ctx(tx_size); |
Jingning Han | 19b5c8f | 2017-07-06 15:10:12 -0700 | [diff] [blame] | 419 | const TX_TYPE tx_type = |
Luc Trudeau | 2eb9b84 | 2017-12-13 11:19:16 -0500 | [diff] [blame] | 420 | av1_get_tx_type(plane_type, xd, blk_row, blk_col, tx_size); |
Angie Chiang | bd99b38 | 2017-06-20 15:11:16 -0700 | [diff] [blame] | 421 | const SCAN_ORDER *const scan_order = get_scan(cm, tx_size, tx_type, mbmi); |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 422 | const int16_t *const scan = scan_order->scan; |
Urvang Joshi | 8089315 | 2017-10-27 11:51:14 -0700 | [diff] [blame] | 423 | const int seg_eob = av1_get_max_eob(tx_size); |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 424 | int c; |
Angie Chiang | a9ba58e | 2017-12-01 19:22:43 -0800 | [diff] [blame] | 425 | const int bwl = get_txb_bwl(tx_size); |
| 426 | const int width = get_txb_wide(tx_size); |
| 427 | const int height = get_txb_high(tx_size); |
Linfeng Zhang | 848f7bc | 2017-10-31 15:26:07 -0700 | [diff] [blame] | 428 | int update_eob = -1; |
Jingning Han | 41c7f44 | 2017-09-05 14:54:00 -0700 | [diff] [blame] | 429 | FRAME_CONTEXT *ec_ctx = xd->tile_ctx; |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 430 | uint8_t levels_buf[TX_PAD_2D]; |
| 431 | uint8_t *const levels = set_levels(levels_buf, width); |
Linfeng Zhang | ae7b2f3 | 2017-11-08 15:46:57 -0800 | [diff] [blame] | 432 | DECLARE_ALIGNED(16, uint8_t, level_counts[MAX_TX_SQUARE]); |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 433 | DECLARE_ALIGNED(16, int8_t, coeff_contexts[MAX_TX_SQUARE]); |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 434 | |
Jingning Han | 94cea4a | 2017-09-30 14:13:23 -0700 | [diff] [blame] | 435 | aom_write_bin(w, eob == 0, |
| 436 | ec_ctx->txb_skip_cdf[txs_ctx][txb_ctx->txb_skip_ctx], 2); |
Angie Chiang | 5f0cb5e | 2017-12-11 16:07:50 -0800 | [diff] [blame] | 437 | #if CONFIG_TXK_SEL |
Angie Chiang | a3f7d2e | 2017-12-07 19:51:14 -0800 | [diff] [blame] | 438 | if (plane == 0 && eob == 0) { |
| 439 | assert(tx_type == DCT_DCT); |
| 440 | } |
Angie Chiang | 5f0cb5e | 2017-12-11 16:07:50 -0800 | [diff] [blame] | 441 | #endif |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 442 | if (eob == 0) return; |
Linfeng Zhang | ce065ca | 2017-10-17 16:49:30 -0700 | [diff] [blame] | 443 | |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 444 | av1_txb_init_levels(tcoeff, width, height, levels); |
Linfeng Zhang | ce065ca | 2017-10-17 16:49:30 -0700 | [diff] [blame] | 445 | |
Angie Chiang | cd9b03f | 2017-04-16 13:37:13 -0700 | [diff] [blame] | 446 | #if CONFIG_TXK_SEL |
Debargha Mukherjee | 3ebb0d0 | 2017-12-14 05:05:18 -0800 | [diff] [blame] | 447 | av1_write_tx_type(cm, xd, blk_row, blk_col, plane, tx_size, w); |
Angie Chiang | cd9b03f | 2017-04-16 13:37:13 -0700 | [diff] [blame] | 448 | #endif |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 449 | |
Linfeng Zhang | 0c72b2f | 2017-12-04 10:59:28 -0800 | [diff] [blame] | 450 | int eob_extra, dummy; |
| 451 | const int eob_pt = get_eob_pos_token(eob, &eob_extra); |
| 452 | const int max_eob_pt = get_eob_pos_token(seg_eob, &dummy); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 453 | |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 454 | (void)max_eob_pt; |
| 455 | const int eob_multi_size = txsize_log2_minus4[tx_size]; |
| 456 | const int eob_multi_ctx = (tx_type_to_class[tx_type] == TX_CLASS_2D) ? 0 : 1; |
| 457 | switch (eob_multi_size) { |
| 458 | case 0: |
| 459 | aom_write_symbol(w, eob_pt - 1, |
| 460 | ec_ctx->eob_flag_cdf16[plane_type][eob_multi_ctx], 5); |
| 461 | break; |
| 462 | case 1: |
| 463 | aom_write_symbol(w, eob_pt - 1, |
| 464 | ec_ctx->eob_flag_cdf32[plane_type][eob_multi_ctx], 6); |
| 465 | break; |
| 466 | case 2: |
| 467 | aom_write_symbol(w, eob_pt - 1, |
| 468 | ec_ctx->eob_flag_cdf64[plane_type][eob_multi_ctx], 7); |
| 469 | break; |
| 470 | case 3: |
| 471 | aom_write_symbol(w, eob_pt - 1, |
| 472 | ec_ctx->eob_flag_cdf128[plane_type][eob_multi_ctx], 8); |
| 473 | break; |
| 474 | case 4: |
| 475 | aom_write_symbol(w, eob_pt - 1, |
| 476 | ec_ctx->eob_flag_cdf256[plane_type][eob_multi_ctx], 9); |
| 477 | break; |
| 478 | case 5: |
| 479 | aom_write_symbol(w, eob_pt - 1, |
| 480 | ec_ctx->eob_flag_cdf512[plane_type][eob_multi_ctx], 10); |
| 481 | break; |
| 482 | default: |
| 483 | aom_write_symbol(w, eob_pt - 1, |
| 484 | ec_ctx->eob_flag_cdf1024[plane_type][eob_multi_ctx], 11); |
| 485 | break; |
| 486 | } |
| 487 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 488 | if (k_eob_offset_bits[eob_pt] > 0) { |
Angie Chiang | 7ab884e | 2017-10-18 15:57:12 -0700 | [diff] [blame] | 489 | int eob_shift = k_eob_offset_bits[eob_pt] - 1; |
| 490 | int bit = (eob_extra & (1 << eob_shift)) ? 1 : 0; |
| 491 | aom_write_bin(w, bit, ec_ctx->eob_extra_cdf[txs_ctx][plane_type][eob_pt], |
| 492 | 2); |
| 493 | for (int i = 1; i < k_eob_offset_bits[eob_pt]; i++) { |
| 494 | eob_shift = k_eob_offset_bits[eob_pt] - 1 - i; |
| 495 | bit = (eob_extra & (1 << eob_shift)) ? 1 : 0; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 496 | aom_write_bit(w, bit); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 497 | } |
| 498 | } |
Dake He | 03a3292 | 2017-10-31 08:06:45 -0700 | [diff] [blame] | 499 | |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 500 | av1_get_nz_map_contexts(levels, scan, eob, tx_size, tx_type, coeff_contexts); |
| 501 | |
| 502 | for (c = eob - 1; c >= 0; --c) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 503 | const int pos = scan[c]; |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 504 | const int coeff_ctx = coeff_contexts[pos]; |
| 505 | const tran_low_t v = tcoeff[pos]; |
Dake He | 03a3292 | 2017-10-31 08:06:45 -0700 | [diff] [blame] | 506 | |
Dake He | 3fe369c | 2017-11-16 17:56:44 -0800 | [diff] [blame] | 507 | if (c == eob - 1) { |
| 508 | aom_write_symbol( |
| 509 | w, AOMMIN(abs(v), 3) - 1, |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 510 | ec_ctx->coeff_base_eob_cdf[txs_ctx][plane_type][coeff_ctx], 3); |
Dake He | 3fe369c | 2017-11-16 17:56:44 -0800 | [diff] [blame] | 511 | } else { |
| 512 | aom_write_symbol(w, AOMMIN(abs(v), 3), |
| 513 | ec_ctx->coeff_base_cdf[txs_ctx][plane_type][coeff_ctx], |
| 514 | 4); |
| 515 | } |
Dake He | 03a3292 | 2017-10-31 08:06:45 -0700 | [diff] [blame] | 516 | } |
| 517 | update_eob = eob - 1; |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 518 | |
Dake He | 43edb76 | 2017-10-26 10:29:46 -0700 | [diff] [blame] | 519 | // Loop to code all signs in the transform block, |
| 520 | // starting with the sign of DC (if applicable) |
| 521 | for (c = 0; c < eob; ++c) { |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 522 | const tran_low_t v = tcoeff[scan[c]]; |
| 523 | const tran_low_t level = abs(v); |
| 524 | const int sign = (v < 0) ? 1 : 0; |
Dake He | 43edb76 | 2017-10-26 10:29:46 -0700 | [diff] [blame] | 525 | if (level == 0) continue; |
| 526 | |
| 527 | if (c == 0) { |
Dake He | 43edb76 | 2017-10-26 10:29:46 -0700 | [diff] [blame] | 528 | aom_write_bin(w, sign, |
| 529 | ec_ctx->dc_sign_cdf[plane_type][txb_ctx->dc_sign_ctx], 2); |
Dake He | 43edb76 | 2017-10-26 10:29:46 -0700 | [diff] [blame] | 530 | } else { |
| 531 | aom_write_bit(w, sign); |
| 532 | } |
| 533 | } |
| 534 | |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 535 | if (update_eob >= 0) { |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 536 | for (c = update_eob; c >= 0; --c) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 537 | const int pos = scan[c]; |
| 538 | const tran_low_t level = abs(tcoeff[pos]); |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 539 | int idx; |
| 540 | int ctx; |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 541 | |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 542 | if (level <= NUM_BASE_LEVELS) continue; |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 543 | |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 544 | // level is above 1. |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 545 | const int base_range = level - 1 - NUM_BASE_LEVELS; |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 546 | #if USE_CAUSAL_BR_CTX |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 547 | ctx = get_br_ctx(levels, pos, bwl, level_counts[pos], tx_type); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 548 | |
| 549 | #else |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 550 | ctx = get_br_ctx(levels, pos, bwl, level_counts[pos]); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 551 | #endif |
Ola Hugosson | e72a209 | 2017-11-12 09:11:53 +0100 | [diff] [blame] | 552 | for (idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 553 | const int k = AOMMIN(base_range - idx, BR_CDF_SIZE - 1); |
Dake He | e2d8f18 | 2017-12-14 13:28:00 -0800 | [diff] [blame] | 554 | aom_write_symbol(w, k, |
| 555 | #if 0 |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 556 | ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_16X16)][plane_type][ctx], |
Dake He | e2d8f18 | 2017-12-14 13:28:00 -0800 | [diff] [blame] | 557 | #else |
| 558 | ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)] |
| 559 | [plane_type][ctx], |
| 560 | #endif |
| 561 | BR_CDF_SIZE); |
Ola Hugosson | e72a209 | 2017-11-12 09:11:53 +0100 | [diff] [blame] | 562 | if (k < BR_CDF_SIZE - 1) break; |
| 563 | } |
| 564 | if (base_range < COEFF_BASE_RANGE) continue; |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 565 | // use 0-th order Golomb code to handle the residual level. |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 566 | write_golomb(w, |
| 567 | abs(tcoeff[pos]) - COEFF_BASE_RANGE - 1 - NUM_BASE_LEVELS); |
Jingning Han | 87b01b5 | 2017-08-31 12:07:20 -0700 | [diff] [blame] | 568 | } |
Angie Chiang | 80b8226 | 2017-02-24 11:39:47 -0800 | [diff] [blame] | 569 | } |
| 570 | } |
Angie Chiang | 47c7218 | 2017-02-27 14:30:38 -0800 | [diff] [blame] | 571 | |
Angie Chiang | 140b333 | 2017-12-12 17:29:25 -0800 | [diff] [blame] | 572 | typedef struct encode_txb_args { |
| 573 | const AV1_COMMON *cm; |
| 574 | MACROBLOCK *x; |
| 575 | aom_writer *w; |
| 576 | } ENCODE_TXB_ARGS; |
| 577 | |
Jingning Han | 4b48cd1 | 2018-01-11 15:56:42 -0800 | [diff] [blame^] | 578 | static void av1_write_coeffs_txb_wrap(const AV1_COMMON *cm, MACROBLOCK *x, |
| 579 | aom_writer *w, int plane, int block, |
| 580 | int blk_row, int blk_col, |
| 581 | TX_SIZE tx_size) { |
Angie Chiang | c8af611 | 2017-03-16 16:11:22 -0700 | [diff] [blame] | 582 | MACROBLOCKD *xd = &x->e_mbd; |
Angie Chiang | 140b333 | 2017-12-12 17:29:25 -0800 | [diff] [blame] | 583 | tran_low_t *tcoeff = BLOCK_OFFSET(x->mbmi_ext->tcoeff[plane], block); |
| 584 | uint16_t eob = x->mbmi_ext->eobs[plane][block]; |
| 585 | TXB_CTX txb_ctx = { x->mbmi_ext->txb_skip_ctx[plane][block], |
| 586 | x->mbmi_ext->dc_sign_ctx[plane][block] }; |
Luc Trudeau | 2eb9b84 | 2017-12-13 11:19:16 -0500 | [diff] [blame] | 587 | av1_write_coeffs_txb(cm, xd, w, blk_row, blk_col, plane, tx_size, tcoeff, eob, |
| 588 | &txb_ctx); |
Angie Chiang | 140b333 | 2017-12-12 17:29:25 -0800 | [diff] [blame] | 589 | } |
| 590 | |
Jingning Han | 4b48cd1 | 2018-01-11 15:56:42 -0800 | [diff] [blame^] | 591 | void av1_write_coeffs_mb(const AV1_COMMON *const cm, MACROBLOCK *x, int mi_row, |
| 592 | int mi_col, aom_writer *w, int plane, |
| 593 | BLOCK_SIZE bsize) { |
Angie Chiang | 140b333 | 2017-12-12 17:29:25 -0800 | [diff] [blame] | 594 | MACROBLOCKD *xd = &x->e_mbd; |
Jingning Han | 4b48cd1 | 2018-01-11 15:56:42 -0800 | [diff] [blame^] | 595 | const struct macroblockd_plane *const pd = &xd->plane[plane]; |
| 596 | const TX_SIZE tx_size = av1_get_tx_size(plane, xd); |
| 597 | const int stepr = tx_size_high_unit[tx_size]; |
| 598 | const int stepc = tx_size_wide_unit[tx_size]; |
| 599 | const BLOCK_SIZE plane_bsize = get_plane_block_size(bsize, pd); |
| 600 | int row, col; |
| 601 | const int max_blocks_wide = max_block_wide(xd, plane_bsize, plane); |
| 602 | const int max_blocks_high = max_block_high(xd, plane_bsize, plane); |
| 603 | |
| 604 | if (!is_chroma_reference(mi_row, mi_col, bsize, pd->subsampling_x, |
| 605 | pd->subsampling_y)) |
| 606 | return; |
| 607 | |
| 608 | int blk_row, blk_col; |
| 609 | int block = 0; |
| 610 | const int step = stepr * stepc; |
| 611 | const BLOCK_SIZE max_unit_bsize = get_plane_block_size(BLOCK_64X64, pd); |
| 612 | int mu_blocks_wide = block_size_wide[max_unit_bsize] >> tx_size_wide_log2[0]; |
| 613 | int mu_blocks_high = block_size_high[max_unit_bsize] >> tx_size_high_log2[0]; |
| 614 | mu_blocks_wide = AOMMIN(max_blocks_wide, mu_blocks_wide); |
| 615 | mu_blocks_high = AOMMIN(max_blocks_high, mu_blocks_high); |
| 616 | |
| 617 | for (row = 0; row < max_blocks_high; row += mu_blocks_high) { |
| 618 | const int unit_height = AOMMIN(mu_blocks_high + row, max_blocks_high); |
| 619 | for (col = 0; col < max_blocks_wide; col += mu_blocks_wide) { |
| 620 | const int unit_width = AOMMIN(mu_blocks_wide + col, max_blocks_wide); |
| 621 | |
| 622 | for (blk_row = row; blk_row < unit_height; blk_row += stepr) { |
| 623 | for (blk_col = col; blk_col < unit_width; blk_col += stepc) { |
| 624 | av1_write_coeffs_txb_wrap(cm, x, w, plane, block, blk_row, blk_col, |
| 625 | tx_size); |
| 626 | block += step; |
| 627 | } |
| 628 | } |
| 629 | } |
| 630 | } |
Angie Chiang | c8af611 | 2017-03-16 16:11:22 -0700 | [diff] [blame] | 631 | } |
| 632 | |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 633 | static INLINE int get_br_cost(tran_low_t abs_qc, int ctx, |
Angie Chiang | 26d3e45 | 2017-09-29 17:40:02 -0700 | [diff] [blame] | 634 | const int *coeff_lps) { |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 635 | const tran_low_t min_level = 1 + NUM_BASE_LEVELS; |
| 636 | const tran_low_t max_level = 1 + NUM_BASE_LEVELS + COEFF_BASE_RANGE; |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 637 | (void)ctx; |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 638 | if (abs_qc >= min_level) { |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 639 | if (abs_qc >= max_level) |
Jingning Han | 772dee3 | 2017-09-15 08:53:18 -0700 | [diff] [blame] | 640 | return coeff_lps[COEFF_BASE_RANGE]; // COEFF_BASE_RANGE * cost0; |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 641 | else |
Jingning Han | 772dee3 | 2017-09-15 08:53:18 -0700 | [diff] [blame] | 642 | return coeff_lps[(abs_qc - min_level)]; // * cost0 + cost1; |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 643 | } else { |
| 644 | return 0; |
| 645 | } |
| 646 | } |
| 647 | |
Linfeng Zhang | c02b411 | 2017-12-21 13:11:36 -0800 | [diff] [blame] | 648 | // Note: don't call this function when eob is 0. |
| 649 | int av1_cost_coeffs_txb(const AV1_COMMON *const cm, const MACROBLOCK *x, |
| 650 | const int plane, const int blk_row, const int blk_col, |
| 651 | const int block, const TX_SIZE tx_size, |
| 652 | const TXB_CTX *const txb_ctx) { |
| 653 | const MACROBLOCKD *const xd = &x->e_mbd; |
| 654 | const TX_SIZE txs_ctx = get_txsize_entropy_ctx(tx_size); |
Angie Chiang | 47c7218 | 2017-02-27 14:30:38 -0800 | [diff] [blame] | 655 | const PLANE_TYPE plane_type = get_plane_type(plane); |
Jingning Han | 19b5c8f | 2017-07-06 15:10:12 -0700 | [diff] [blame] | 656 | const TX_TYPE tx_type = |
Luc Trudeau | 2eb9b84 | 2017-12-13 11:19:16 -0500 | [diff] [blame] | 657 | av1_get_tx_type(plane_type, xd, blk_row, blk_col, tx_size); |
Linfeng Zhang | c02b411 | 2017-12-21 13:11:36 -0800 | [diff] [blame] | 658 | const MB_MODE_INFO *const mbmi = &xd->mi[0]->mbmi; |
Angie Chiang | 47c7218 | 2017-02-27 14:30:38 -0800 | [diff] [blame] | 659 | const struct macroblock_plane *p = &x->plane[plane]; |
| 660 | const int eob = p->eobs[block]; |
| 661 | const tran_low_t *const qcoeff = BLOCK_OFFSET(p->qcoeff, block); |
| 662 | int c, cost; |
Linfeng Zhang | c02b411 | 2017-12-21 13:11:36 -0800 | [diff] [blame] | 663 | const int txb_skip_ctx = txb_ctx->txb_skip_ctx; |
Angie Chiang | a9ba58e | 2017-12-01 19:22:43 -0800 | [diff] [blame] | 664 | const int bwl = get_txb_bwl(tx_size); |
| 665 | const int width = get_txb_wide(tx_size); |
| 666 | const int height = get_txb_high(tx_size); |
Angie Chiang | bd99b38 | 2017-06-20 15:11:16 -0700 | [diff] [blame] | 667 | const SCAN_ORDER *const scan_order = get_scan(cm, tx_size, tx_type, mbmi); |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 668 | const int16_t *const scan = scan_order->scan; |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 669 | uint8_t levels_buf[TX_PAD_2D]; |
| 670 | uint8_t *const levels = set_levels(levels_buf, width); |
Linfeng Zhang | ae7b2f3 | 2017-11-08 15:46:57 -0800 | [diff] [blame] | 671 | DECLARE_ALIGNED(16, uint8_t, level_counts[MAX_TX_SQUARE]); |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 672 | DECLARE_ALIGNED(16, int8_t, coeff_contexts[MAX_TX_SQUARE]); |
Linfeng Zhang | c02b411 | 2017-12-21 13:11:36 -0800 | [diff] [blame] | 673 | const LV_MAP_COEFF_COST *const coeff_costs = |
| 674 | &x->coeff_costs[txs_ctx][plane_type]; |
Angie Chiang | 47c7218 | 2017-02-27 14:30:38 -0800 | [diff] [blame] | 675 | |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 676 | const int eob_multi_size = txsize_log2_minus4[tx_size]; |
| 677 | const LV_MAP_EOB_COST *const eob_costs = |
| 678 | &x->eob_costs[eob_multi_size][plane_type]; |
Dake He | 5641635 | 2017-12-26 15:43:34 -0800 | [diff] [blame] | 679 | // eob must be greater than 0 here. |
| 680 | assert(eob > 0); |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 681 | cost = coeff_costs->txb_skip_cost[txb_skip_ctx][0]; |
Angie Chiang | 47c7218 | 2017-02-27 14:30:38 -0800 | [diff] [blame] | 682 | |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 683 | av1_txb_init_levels(qcoeff, width, height, levels); |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 684 | |
Angie Chiang | cd9b03f | 2017-04-16 13:37:13 -0700 | [diff] [blame] | 685 | #if CONFIG_TXK_SEL |
Yue Chen | b23d00a | 2017-07-28 17:01:21 -0700 | [diff] [blame] | 686 | cost += av1_tx_type_cost(cm, x, xd, mbmi->sb_type, plane, tx_size, tx_type); |
Angie Chiang | cd9b03f | 2017-04-16 13:37:13 -0700 | [diff] [blame] | 687 | #endif |
Angie Chiang | 0591787 | 2017-04-15 12:28:56 -0700 | [diff] [blame] | 688 | |
Urvang Joshi | 8089315 | 2017-10-27 11:51:14 -0700 | [diff] [blame] | 689 | const int seg_eob = av1_get_max_eob(tx_size); |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 690 | int eob_cost = get_eob_cost(eob, seg_eob, eob_costs, coeff_costs, tx_type); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 691 | cost += eob_cost; |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 692 | |
| 693 | av1_get_nz_map_contexts(levels, scan, eob, tx_size, tx_type, coeff_contexts); |
| 694 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 695 | for (c = eob - 1; c >= 0; --c) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 696 | const int pos = scan[c]; |
| 697 | const tran_low_t v = qcoeff[pos]; |
| 698 | const int is_nz = (v != 0); |
| 699 | const int level = abs(v); |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 700 | const int coeff_ctx = coeff_contexts[pos]; |
Dake He | 3fe369c | 2017-11-16 17:56:44 -0800 | [diff] [blame] | 701 | if (c == eob - 1) { |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 702 | cost += coeff_costs->base_eob_cost[coeff_ctx][AOMMIN(level, 3) - 1]; |
Dake He | 3fe369c | 2017-11-16 17:56:44 -0800 | [diff] [blame] | 703 | } else { |
| 704 | cost += coeff_costs->base_cost[coeff_ctx][AOMMIN(level, 3)]; |
| 705 | } |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 706 | |
| 707 | if (is_nz) { |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 708 | int sign = (v < 0) ? 1 : 0; |
| 709 | |
| 710 | // sign bit cost |
| 711 | if (c == 0) { |
| 712 | int dc_sign_ctx = txb_ctx->dc_sign_ctx; |
| 713 | cost += coeff_costs->dc_sign_cost[dc_sign_ctx][sign]; |
| 714 | } else { |
| 715 | cost += av1_cost_bit(128, sign); |
| 716 | } |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 717 | if (level > NUM_BASE_LEVELS) { |
| 718 | int ctx; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 719 | #if USE_CAUSAL_BR_CTX |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 720 | ctx = get_br_ctx(levels, pos, bwl, level_counts[pos], tx_type); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 721 | #else |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 722 | ctx = get_br_ctx(levels, pos, bwl, level_counts[pos]); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 723 | #endif |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 724 | const int base_range = level - 1 - NUM_BASE_LEVELS; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 725 | if (base_range < COEFF_BASE_RANGE) { |
| 726 | cost += coeff_costs->lps_cost[ctx][base_range]; |
| 727 | } else { |
| 728 | cost += coeff_costs->lps_cost[ctx][COEFF_BASE_RANGE]; |
| 729 | } |
| 730 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 731 | if (level >= 1 + NUM_BASE_LEVELS + COEFF_BASE_RANGE) { |
| 732 | // residual cost |
| 733 | int r = level - COEFF_BASE_RANGE - NUM_BASE_LEVELS; |
| 734 | int ri = r; |
| 735 | int length = 0; |
| 736 | |
| 737 | while (ri) { |
| 738 | ri >>= 1; |
| 739 | ++length; |
| 740 | } |
| 741 | |
| 742 | for (ri = 0; ri < length - 1; ++ri) cost += av1_cost_bit(128, 0); |
| 743 | |
| 744 | for (ri = length - 1; ri >= 0; --ri) |
| 745 | cost += av1_cost_bit(128, (r >> ri) & 0x01); |
| 746 | } |
| 747 | } |
| 748 | } |
| 749 | } |
Angie Chiang | 47c7218 | 2017-02-27 14:30:38 -0800 | [diff] [blame] | 750 | return cost; |
| 751 | } |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 752 | |
Angie Chiang | 2affb3b | 2017-05-30 15:23:51 -0700 | [diff] [blame] | 753 | static INLINE int has_base(tran_low_t qc, int base_idx) { |
| 754 | const int level = base_idx + 1; |
| 755 | return abs(qc) >= level; |
| 756 | } |
| 757 | |
Angie Chiang | 2affb3b | 2017-05-30 15:23:51 -0700 | [diff] [blame] | 758 | static INLINE int has_br(tran_low_t qc) { |
| 759 | return abs(qc) >= 1 + NUM_BASE_LEVELS; |
| 760 | } |
| 761 | |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 762 | static INLINE int get_sign_bit_cost(tran_low_t qc, int coeff_idx, |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 763 | const int (*dc_sign_cost)[2], |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 764 | int dc_sign_ctx) { |
| 765 | const int sign = (qc < 0) ? 1 : 0; |
| 766 | // sign bit cost |
| 767 | if (coeff_idx == 0) { |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 768 | return dc_sign_cost[dc_sign_ctx][sign]; |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 769 | } else { |
| 770 | return av1_cost_bit(128, sign); |
| 771 | } |
| 772 | } |
| 773 | static INLINE int get_golomb_cost(int abs_qc) { |
| 774 | if (abs_qc >= 1 + NUM_BASE_LEVELS + COEFF_BASE_RANGE) { |
| 775 | // residual cost |
| 776 | int r = abs_qc - COEFF_BASE_RANGE - NUM_BASE_LEVELS; |
| 777 | int ri = r; |
| 778 | int length = 0; |
| 779 | |
| 780 | while (ri) { |
| 781 | ri >>= 1; |
| 782 | ++length; |
| 783 | } |
| 784 | |
| 785 | return av1_cost_literal(2 * length - 1); |
| 786 | } else { |
| 787 | return 0; |
| 788 | } |
| 789 | } |
| 790 | |
Angie Chiang | 2affb3b | 2017-05-30 15:23:51 -0700 | [diff] [blame] | 791 | void gen_txb_cache(TxbCache *txb_cache, TxbInfo *txb_info) { |
Angie Chiang | 481c01f | 2017-08-15 16:24:30 -0700 | [diff] [blame] | 792 | // gen_nz_count_arr |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 793 | const int16_t *const scan = txb_info->scan_order->scan; |
Angie Chiang | 481c01f | 2017-08-15 16:24:30 -0700 | [diff] [blame] | 794 | const int bwl = txb_info->bwl; |
| 795 | const int height = txb_info->height; |
Linfeng Zhang | 72e0b3f | 2017-10-18 13:32:12 -0700 | [diff] [blame] | 796 | const tran_low_t *const qcoeff = txb_info->qcoeff; |
Linfeng Zhang | b6957c2 | 2017-10-25 13:17:28 -0700 | [diff] [blame] | 797 | const uint8_t *const levels = txb_info->levels; |
Angie Chiang | def1125 | 2017-08-18 14:37:32 -0700 | [diff] [blame] | 798 | const BASE_CTX_TABLE *base_ctx_table = |
| 799 | txb_info->coeff_ctx_table->base_ctx_table; |
Angie Chiang | 481c01f | 2017-08-15 16:24:30 -0700 | [diff] [blame] | 800 | for (int c = 0; c < txb_info->eob; ++c) { |
| 801 | const int coeff_idx = scan[c]; // raster order |
| 802 | const int row = coeff_idx >> bwl; |
| 803 | const int col = coeff_idx - (row << bwl); |
Jingning Han | 3422ac1 | 2017-10-25 20:37:53 -0700 | [diff] [blame] | 804 | |
Linfeng Zhang | f91f3ca | 2017-12-05 11:22:41 -0800 | [diff] [blame] | 805 | txb_cache->nz_count_arr[coeff_idx] = |
Linfeng Zhang | d564737 | 2017-12-05 17:06:07 -0800 | [diff] [blame] | 806 | get_nz_count(levels + get_padded_idx(coeff_idx, bwl), bwl, |
Linfeng Zhang | f91f3ca | 2017-12-05 11:22:41 -0800 | [diff] [blame] | 807 | tx_type_to_class[txb_info->tx_type]); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 808 | |
Yaowu Xu | 102ef81 | 2017-12-12 11:31:03 -0800 | [diff] [blame] | 809 | txb_cache->nz_ctx_arr[coeff_idx] = |
| 810 | get_nz_map_ctx_from_stats(0, coeff_idx, bwl, txb_info->tx_size, |
| 811 | tx_type_to_class[txb_info->tx_type]); |
Angie Chiang | 481c01f | 2017-08-15 16:24:30 -0700 | [diff] [blame] | 812 | |
| 813 | // gen_base_count_mag_arr |
| 814 | if (!has_base(qcoeff[coeff_idx], 0)) continue; |
| 815 | int *base_mag = txb_cache->base_mag_arr[coeff_idx]; |
Angie Chiang | 9cde59f | 2017-08-16 15:24:55 -0700 | [diff] [blame] | 816 | int count[NUM_BASE_LEVELS]; |
| 817 | get_base_count_mag(base_mag, count, qcoeff, bwl, height, row, col); |
Angie Chiang | 481c01f | 2017-08-15 16:24:30 -0700 | [diff] [blame] | 818 | |
| 819 | for (int i = 0; i < NUM_BASE_LEVELS; ++i) { |
Angie Chiang | 9cde59f | 2017-08-16 15:24:55 -0700 | [diff] [blame] | 820 | if (!has_base(qcoeff[coeff_idx], i)) break; |
| 821 | txb_cache->base_count_arr[i][coeff_idx] = count[i]; |
Angie Chiang | 481c01f | 2017-08-15 16:24:30 -0700 | [diff] [blame] | 822 | const int level = i + 1; |
Angie Chiang | 9cde59f | 2017-08-16 15:24:55 -0700 | [diff] [blame] | 823 | txb_cache->base_ctx_arr[i][coeff_idx] = |
Angie Chiang | def1125 | 2017-08-18 14:37:32 -0700 | [diff] [blame] | 824 | base_ctx_table[row != 0][col != 0][base_mag[0] > level][count[i]]; |
Angie Chiang | 481c01f | 2017-08-15 16:24:30 -0700 | [diff] [blame] | 825 | } |
| 826 | |
| 827 | // gen_br_count_mag_arr |
| 828 | if (!has_br(qcoeff[coeff_idx])) continue; |
| 829 | int *br_count = txb_cache->br_count_arr + coeff_idx; |
| 830 | int *br_mag = txb_cache->br_mag_arr[coeff_idx]; |
Angie Chiang | ea8183b | 2017-08-17 14:36:35 -0700 | [diff] [blame] | 831 | *br_count = get_br_count_mag(br_mag, qcoeff, bwl, height, row, col, |
| 832 | NUM_BASE_LEVELS); |
Angie Chiang | 481c01f | 2017-08-15 16:24:30 -0700 | [diff] [blame] | 833 | txb_cache->br_ctx_arr[coeff_idx] = |
| 834 | get_br_ctx_from_count_mag(row, col, *br_count, br_mag[0]); |
| 835 | } |
Angie Chiang | 2affb3b | 2017-05-30 15:23:51 -0700 | [diff] [blame] | 836 | } |
| 837 | |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 838 | static INLINE const int *get_level_prob(int level, int coeff_idx, |
| 839 | const TxbCache *txb_cache, |
| 840 | const LV_MAP_COEFF_COST *txb_costs) { |
Ola Hugosson | 1389210 | 2017-11-06 08:01:44 +0100 | [diff] [blame] | 841 | if (level < 1 + NUM_BASE_LEVELS) { |
| 842 | const int ctx = txb_cache->nz_ctx_arr[coeff_idx]; |
| 843 | return &txb_costs->base_cost[ctx][level]; |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 844 | } else if (level >= 1 + NUM_BASE_LEVELS && |
| 845 | level < 1 + NUM_BASE_LEVELS + COEFF_BASE_RANGE) { |
Angie Chiang | 1ae0ebf | 2017-08-15 15:16:47 -0700 | [diff] [blame] | 846 | const int ctx = txb_cache->br_ctx_arr[coeff_idx]; |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 847 | return txb_costs->lps_cost[ctx]; |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 848 | } else if (level >= 1 + NUM_BASE_LEVELS + COEFF_BASE_RANGE) { |
Ola Hugosson | 1389210 | 2017-11-06 08:01:44 +0100 | [diff] [blame] | 849 | // printf("get_level_prob does not support golomb\n"); |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 850 | assert(0); |
| 851 | return 0; |
| 852 | } else { |
| 853 | assert(0); |
| 854 | return 0; |
| 855 | } |
| 856 | } |
| 857 | |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 858 | static INLINE void update_mag_arr(int *mag_arr, int abs_qc) { |
| 859 | if (mag_arr[0] == abs_qc) { |
| 860 | mag_arr[1] -= 1; |
| 861 | assert(mag_arr[1] >= 0); |
| 862 | } |
| 863 | } |
| 864 | |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 865 | static INLINE int get_mag_from_mag_arr(const int *mag_arr) { |
| 866 | int mag; |
| 867 | if (mag_arr[1] > 0) { |
| 868 | mag = mag_arr[0]; |
| 869 | } else if (mag_arr[0] > 0) { |
| 870 | mag = mag_arr[0] - 1; |
| 871 | } else { |
| 872 | // no neighbor |
| 873 | assert(mag_arr[0] == 0 && mag_arr[1] == 0); |
| 874 | mag = 0; |
| 875 | } |
| 876 | return mag; |
| 877 | } |
| 878 | |
| 879 | static int neighbor_level_down_update(int *new_count, int *new_mag, int count, |
| 880 | const int *mag, int coeff_idx, |
| 881 | tran_low_t abs_nb_coeff, int nb_coeff_idx, |
| 882 | int level, const TxbInfo *txb_info) { |
| 883 | *new_count = count; |
| 884 | *new_mag = get_mag_from_mag_arr(mag); |
| 885 | |
| 886 | int update = 0; |
| 887 | // check if br_count changes |
| 888 | if (abs_nb_coeff == level) { |
| 889 | update = 1; |
| 890 | *new_count -= 1; |
| 891 | assert(*new_count >= 0); |
| 892 | } |
| 893 | const int row = coeff_idx >> txb_info->bwl; |
| 894 | const int col = coeff_idx - (row << txb_info->bwl); |
| 895 | const int nb_row = nb_coeff_idx >> txb_info->bwl; |
| 896 | const int nb_col = nb_coeff_idx - (nb_row << txb_info->bwl); |
| 897 | |
| 898 | // check if mag changes |
| 899 | if (nb_row >= row && nb_col >= col) { |
| 900 | if (abs_nb_coeff == mag[0]) { |
| 901 | assert(mag[1] > 0); |
| 902 | if (mag[1] == 1) { |
| 903 | // the nb is the only qc with max mag |
| 904 | *new_mag -= 1; |
| 905 | assert(*new_mag >= 0); |
| 906 | update = 1; |
| 907 | } |
| 908 | } |
| 909 | } |
| 910 | return update; |
| 911 | } |
| 912 | |
| 913 | static int try_neighbor_level_down_br(int coeff_idx, int nb_coeff_idx, |
| 914 | const TxbCache *txb_cache, |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 915 | const LV_MAP_COEFF_COST *txb_costs, |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 916 | const TxbInfo *txb_info) { |
| 917 | const tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
| 918 | const tran_low_t abs_qc = abs(qc); |
| 919 | const int level = NUM_BASE_LEVELS + 1; |
| 920 | if (abs_qc < level) return 0; |
| 921 | |
| 922 | const tran_low_t nb_coeff = txb_info->qcoeff[nb_coeff_idx]; |
| 923 | const tran_low_t abs_nb_coeff = abs(nb_coeff); |
| 924 | const int count = txb_cache->br_count_arr[coeff_idx]; |
| 925 | const int *mag = txb_cache->br_mag_arr[coeff_idx]; |
| 926 | int new_count; |
| 927 | int new_mag; |
| 928 | const int update = |
| 929 | neighbor_level_down_update(&new_count, &new_mag, count, mag, coeff_idx, |
| 930 | abs_nb_coeff, nb_coeff_idx, level, txb_info); |
| 931 | if (update) { |
| 932 | const int row = coeff_idx >> txb_info->bwl; |
| 933 | const int col = coeff_idx - (row << txb_info->bwl); |
Angie Chiang | 1ae0ebf | 2017-08-15 15:16:47 -0700 | [diff] [blame] | 934 | const int ctx = txb_cache->br_ctx_arr[coeff_idx]; |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 935 | const int org_cost = get_br_cost(abs_qc, ctx, txb_costs->lps_cost[ctx]); |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 936 | |
| 937 | const int new_ctx = get_br_ctx_from_count_mag(row, col, new_count, new_mag); |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 938 | const int new_cost = |
| 939 | get_br_cost(abs_qc, new_ctx, txb_costs->lps_cost[new_ctx]); |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 940 | const int cost_diff = -org_cost + new_cost; |
| 941 | return cost_diff; |
| 942 | } else { |
| 943 | return 0; |
| 944 | } |
| 945 | } |
| 946 | |
| 947 | static int try_neighbor_level_down_base(int coeff_idx, int nb_coeff_idx, |
| 948 | const TxbCache *txb_cache, |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 949 | const LV_MAP_COEFF_COST *txb_costs, |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 950 | const TxbInfo *txb_info) { |
Ola Hugosson | 1389210 | 2017-11-06 08:01:44 +0100 | [diff] [blame] | 951 | // TODO(olah): not implemented yet |
| 952 | (void)coeff_idx; |
| 953 | (void)nb_coeff_idx; |
| 954 | (void)txb_cache; |
| 955 | (void)txb_costs; |
| 956 | (void)txb_info; |
| 957 | return 0; |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 958 | } |
| 959 | |
| 960 | static int try_neighbor_level_down_nz(int coeff_idx, int nb_coeff_idx, |
| 961 | const TxbCache *txb_cache, |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 962 | const LV_MAP_COEFF_COST *txb_costs, |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 963 | TxbInfo *txb_info) { |
| 964 | // assume eob doesn't change |
| 965 | const tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
| 966 | const tran_low_t abs_qc = abs(qc); |
| 967 | const tran_low_t nb_coeff = txb_info->qcoeff[nb_coeff_idx]; |
| 968 | const tran_low_t abs_nb_coeff = abs(nb_coeff); |
| 969 | if (abs_nb_coeff != 1) return 0; |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 970 | const int16_t *const iscan = txb_info->scan_order->iscan; |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 971 | const int scan_idx = iscan[coeff_idx]; |
| 972 | if (scan_idx == txb_info->seg_eob) return 0; |
| 973 | const int nb_scan_idx = iscan[nb_coeff_idx]; |
| 974 | if (nb_scan_idx < scan_idx) { |
| 975 | const int count = txb_cache->nz_count_arr[coeff_idx]; |
Linfeng Zhang | 8ac4557 | 2017-11-29 11:39:51 -0800 | [diff] [blame] | 976 | (void)count; |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 977 | assert(count > 0); |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 978 | update_qcoeff(nb_coeff_idx, get_lower_coeff(nb_coeff), txb_info); |
Linfeng Zhang | 8ac4557 | 2017-11-29 11:39:51 -0800 | [diff] [blame] | 979 | const int new_ctx = get_nz_map_ctx_from_stats( |
Yaowu Xu | 102ef81 | 2017-12-12 11:31:03 -0800 | [diff] [blame] | 980 | 0, coeff_idx, txb_info->bwl, txb_info->tx_size, |
| 981 | tx_type_to_class[txb_info->tx_type]); |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 982 | update_qcoeff(nb_coeff_idx, nb_coeff, txb_info); |
Angie Chiang | 1ae0ebf | 2017-08-15 15:16:47 -0700 | [diff] [blame] | 983 | const int ctx = txb_cache->nz_ctx_arr[coeff_idx]; |
Ola Hugosson | 1389210 | 2017-11-06 08:01:44 +0100 | [diff] [blame] | 984 | const int org_cost = txb_costs->base_cost[ctx][AOMMIN(abs_qc, 3)]; |
| 985 | const int new_cost = txb_costs->base_cost[new_ctx][AOMMIN(abs_qc, 3)]; |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 986 | const int cost_diff = new_cost - org_cost; |
| 987 | return cost_diff; |
| 988 | } else { |
| 989 | return 0; |
| 990 | } |
| 991 | } |
| 992 | |
| 993 | static int try_self_level_down(tran_low_t *low_coeff, int coeff_idx, |
| 994 | const TxbCache *txb_cache, |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 995 | const LV_MAP_COEFF_COST *txb_costs, |
| 996 | TxbInfo *txb_info) { |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 997 | const tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
| 998 | if (qc == 0) { |
| 999 | *low_coeff = 0; |
| 1000 | return 0; |
| 1001 | } |
| 1002 | const tran_low_t abs_qc = abs(qc); |
| 1003 | *low_coeff = get_lower_coeff(qc); |
| 1004 | int cost_diff; |
| 1005 | if (*low_coeff == 0) { |
| 1006 | const int scan_idx = txb_info->scan_order->iscan[coeff_idx]; |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1007 | const int *level_cost = |
| 1008 | get_level_prob(abs_qc, coeff_idx, txb_cache, txb_costs); |
| 1009 | const int *low_level_cost = |
| 1010 | get_level_prob(abs(*low_coeff), coeff_idx, txb_cache, txb_costs); |
Jingning Han | 3422ac1 | 2017-10-25 20:37:53 -0700 | [diff] [blame] | 1011 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1012 | if (scan_idx < txb_info->eob - 1) { |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 1013 | // When level-0, we code the binary of abs_qc > level |
| 1014 | // but when level-k k > 0 we code the binary of abs_qc == level |
| 1015 | // That's why wee need this special treatment for level-0 map |
| 1016 | // TODO(angiebird): make leve-0 consistent to other levels |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1017 | cost_diff = -level_cost[1] + low_level_cost[0] - low_level_cost[1]; |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 1018 | } else { |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1019 | cost_diff = -level_cost[1]; |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 1020 | } |
| 1021 | |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 1022 | const int sign_cost = get_sign_bit_cost( |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1023 | qc, coeff_idx, txb_costs->dc_sign_cost, txb_info->txb_ctx->dc_sign_ctx); |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 1024 | cost_diff -= sign_cost; |
Jingning Han | 772dee3 | 2017-09-15 08:53:18 -0700 | [diff] [blame] | 1025 | } else if (abs_qc <= NUM_BASE_LEVELS) { |
| 1026 | const int *level_cost = |
| 1027 | get_level_prob(abs_qc, coeff_idx, txb_cache, txb_costs); |
| 1028 | const int *low_level_cost = |
| 1029 | get_level_prob(abs(*low_coeff), coeff_idx, txb_cache, txb_costs); |
| 1030 | cost_diff = -level_cost[1] + low_level_cost[1] - low_level_cost[0]; |
| 1031 | } else if (abs_qc == NUM_BASE_LEVELS + 1) { |
| 1032 | const int *level_cost = |
| 1033 | get_level_prob(abs_qc, coeff_idx, txb_cache, txb_costs); |
| 1034 | const int *low_level_cost = |
| 1035 | get_level_prob(abs(*low_coeff), coeff_idx, txb_cache, txb_costs); |
| 1036 | cost_diff = -level_cost[0] + low_level_cost[1] - low_level_cost[0]; |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 1037 | } else if (abs_qc < 1 + NUM_BASE_LEVELS + COEFF_BASE_RANGE) { |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1038 | const int *level_cost = |
| 1039 | get_level_prob(abs_qc, coeff_idx, txb_cache, txb_costs); |
| 1040 | const int *low_level_cost = |
| 1041 | get_level_prob(abs(*low_coeff), coeff_idx, txb_cache, txb_costs); |
| 1042 | |
Jingning Han | 772dee3 | 2017-09-15 08:53:18 -0700 | [diff] [blame] | 1043 | cost_diff = -level_cost[abs_qc - 1 - NUM_BASE_LEVELS] + |
| 1044 | low_level_cost[abs(*low_coeff) - 1 - NUM_BASE_LEVELS]; |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 1045 | } else if (abs_qc == 1 + NUM_BASE_LEVELS + COEFF_BASE_RANGE) { |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1046 | const int *low_level_cost = |
| 1047 | get_level_prob(abs(*low_coeff), coeff_idx, txb_cache, txb_costs); |
Jingning Han | 772dee3 | 2017-09-15 08:53:18 -0700 | [diff] [blame] | 1048 | cost_diff = -get_golomb_cost(abs_qc) - low_level_cost[COEFF_BASE_RANGE] + |
| 1049 | low_level_cost[COEFF_BASE_RANGE - 1]; |
Angie Chiang | 7afbba4 | 2017-05-30 15:59:15 -0700 | [diff] [blame] | 1050 | } else { |
| 1051 | assert(abs_qc > 1 + NUM_BASE_LEVELS + COEFF_BASE_RANGE); |
| 1052 | const tran_low_t abs_low_coeff = abs(*low_coeff); |
| 1053 | cost_diff = -get_golomb_cost(abs_qc) + get_golomb_cost(abs_low_coeff); |
| 1054 | } |
| 1055 | return cost_diff; |
| 1056 | } |
| 1057 | |
// Side length of the square per-neighbor cost map filled by try_level_down().
#define COST_MAP_SIZE 5
// Row/column index of the map's center cell, which holds the cost change of
// the coefficient being lowered itself.
#define COST_MAP_OFFSET (COST_MAP_SIZE / 2)
| 1060 | |
| 1061 | static INLINE int check_nz_neighbor(tran_low_t qc) { return abs(qc) == 1; } |
| 1062 | |
| 1063 | static INLINE int check_base_neighbor(tran_low_t qc) { |
| 1064 | return abs(qc) <= 1 + NUM_BASE_LEVELS; |
| 1065 | } |
| 1066 | |
| 1067 | static INLINE int check_br_neighbor(tran_low_t qc) { |
| 1068 | return abs(qc) > BR_MAG_OFFSET; |
| 1069 | } |
| 1070 | |
// Set to 1 to let try_level_down() honor its fast_mode argument and use the
// reduced neighbor tables below.
#define FAST_OPTIMIZE_TXB 1

#if FAST_OPTIMIZE_TXB
// Each entry is { row offset, column offset }; a neighbor is located at
// (row - offset[0], col - offset[1]).

// Fast-mode neighbor set used for the non-zero map check.
#define ALNB_REF_OFFSET_NUM 2
static const int alnb_ref_offset[ALNB_REF_OFFSET_NUM][2] = {
  { -1, 0 },
  { 0, -1 },
};

// Fast-mode neighbor set used for the base-level and base-range checks.
#define NB_REF_OFFSET_NUM 4
static const int nb_ref_offset[NB_REF_OFFSET_NUM][2] = {
  { -1, 0 },
  { 0, -1 },
  { 1, 0 },
  { 0, 1 },
};
#endif  // FAST_OPTIMIZE_TXB
| 1083 | |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1084 | // TODO(angiebird): add static to this function once it's called |
| 1085 | int try_level_down(int coeff_idx, const TxbCache *txb_cache, |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1086 | const LV_MAP_COEFF_COST *txb_costs, TxbInfo *txb_info, |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1087 | int (*cost_map)[COST_MAP_SIZE], int fast_mode) { |
| 1088 | #if !FAST_OPTIMIZE_TXB |
| 1089 | (void)fast_mode; |
| 1090 | #endif |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1091 | if (cost_map) { |
| 1092 | for (int i = 0; i < COST_MAP_SIZE; ++i) av1_zero(cost_map[i]); |
| 1093 | } |
| 1094 | |
| 1095 | tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
| 1096 | tran_low_t low_coeff; |
| 1097 | if (qc == 0) return 0; |
| 1098 | int accu_cost_diff = 0; |
| 1099 | |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1100 | const int16_t *const iscan = txb_info->scan_order->iscan; |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1101 | const int eob = txb_info->eob; |
| 1102 | const int scan_idx = iscan[coeff_idx]; |
| 1103 | if (scan_idx < eob) { |
| 1104 | const int cost_diff = try_self_level_down(&low_coeff, coeff_idx, txb_cache, |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1105 | txb_costs, txb_info); |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1106 | if (cost_map) |
| 1107 | cost_map[0 + COST_MAP_OFFSET][0 + COST_MAP_OFFSET] = cost_diff; |
| 1108 | accu_cost_diff += cost_diff; |
| 1109 | } |
| 1110 | |
| 1111 | const int row = coeff_idx >> txb_info->bwl; |
| 1112 | const int col = coeff_idx - (row << txb_info->bwl); |
| 1113 | if (check_nz_neighbor(qc)) { |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1114 | #if FAST_OPTIMIZE_TXB |
Linfeng Zhang | 4afda45 | 2017-10-24 10:34:04 -0700 | [diff] [blame] | 1115 | const int(*ref_offset)[2]; |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1116 | int ref_num; |
| 1117 | if (fast_mode) { |
| 1118 | ref_offset = alnb_ref_offset; |
| 1119 | ref_num = ALNB_REF_OFFSET_NUM; |
| 1120 | } else { |
| 1121 | ref_offset = sig_ref_offset; |
| 1122 | ref_num = SIG_REF_OFFSET_NUM; |
| 1123 | } |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1124 | #else |
Linfeng Zhang | 4afda45 | 2017-10-24 10:34:04 -0700 | [diff] [blame] | 1125 | const int(*ref_offset)[2] = sig_ref_offset; |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1126 | const int ref_num = SIG_REF_OFFSET_NUM; |
| 1127 | #endif |
| 1128 | for (int i = 0; i < ref_num; ++i) { |
| 1129 | const int nb_row = row - ref_offset[i][0]; |
| 1130 | const int nb_col = col - ref_offset[i][1]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1131 | const int nb_coeff_idx = nb_row * txb_info->width + nb_col; |
Jingning Han | 4cbb363 | 2017-06-13 12:50:33 -0700 | [diff] [blame] | 1132 | |
Angie Chiang | 0c89dca | 2017-08-17 16:36:18 -0700 | [diff] [blame] | 1133 | if (nb_row < 0 || nb_col < 0 || nb_row >= txb_info->height || |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1134 | nb_col >= txb_info->width) |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1135 | continue; |
| 1136 | |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1137 | const int nb_scan_idx = iscan[nb_coeff_idx]; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1138 | if (nb_scan_idx < eob) { |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1139 | const int cost_diff = try_neighbor_level_down_nz( |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1140 | nb_coeff_idx, coeff_idx, txb_cache, txb_costs, txb_info); |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1141 | if (cost_map) |
| 1142 | cost_map[nb_row - row + COST_MAP_OFFSET] |
| 1143 | [nb_col - col + COST_MAP_OFFSET] += cost_diff; |
| 1144 | accu_cost_diff += cost_diff; |
| 1145 | } |
| 1146 | } |
| 1147 | } |
| 1148 | |
| 1149 | if (check_base_neighbor(qc)) { |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1150 | #if FAST_OPTIMIZE_TXB |
Linfeng Zhang | 4afda45 | 2017-10-24 10:34:04 -0700 | [diff] [blame] | 1151 | const int(*ref_offset)[2]; |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1152 | int ref_num; |
| 1153 | if (fast_mode) { |
| 1154 | ref_offset = nb_ref_offset; |
| 1155 | ref_num = NB_REF_OFFSET_NUM; |
| 1156 | } else { |
| 1157 | ref_offset = base_ref_offset; |
| 1158 | ref_num = BASE_CONTEXT_POSITION_NUM; |
| 1159 | } |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1160 | #else |
Linfeng Zhang | ce065ca | 2017-10-17 16:49:30 -0700 | [diff] [blame] | 1161 | const int(*ref_offset)[2] = base_ref_offset; |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1162 | int ref_num = BASE_CONTEXT_POSITION_NUM; |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1163 | #endif |
| 1164 | for (int i = 0; i < ref_num; ++i) { |
| 1165 | const int nb_row = row - ref_offset[i][0]; |
| 1166 | const int nb_col = col - ref_offset[i][1]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1167 | const int nb_coeff_idx = nb_row * txb_info->width + nb_col; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1168 | |
Angie Chiang | 0c89dca | 2017-08-17 16:36:18 -0700 | [diff] [blame] | 1169 | if (nb_row < 0 || nb_col < 0 || nb_row >= txb_info->height || |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1170 | nb_col >= txb_info->width) |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1171 | continue; |
| 1172 | |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1173 | const int nb_scan_idx = iscan[nb_coeff_idx]; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1174 | if (nb_scan_idx < eob) { |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1175 | const int cost_diff = try_neighbor_level_down_base( |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1176 | nb_coeff_idx, coeff_idx, txb_cache, txb_costs, txb_info); |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1177 | if (cost_map) |
| 1178 | cost_map[nb_row - row + COST_MAP_OFFSET] |
| 1179 | [nb_col - col + COST_MAP_OFFSET] += cost_diff; |
| 1180 | accu_cost_diff += cost_diff; |
| 1181 | } |
| 1182 | } |
| 1183 | } |
| 1184 | |
| 1185 | if (check_br_neighbor(qc)) { |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1186 | #if FAST_OPTIMIZE_TXB |
Linfeng Zhang | 4afda45 | 2017-10-24 10:34:04 -0700 | [diff] [blame] | 1187 | const int(*ref_offset)[2]; |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1188 | int ref_num; |
| 1189 | if (fast_mode) { |
| 1190 | ref_offset = nb_ref_offset; |
| 1191 | ref_num = NB_REF_OFFSET_NUM; |
| 1192 | } else { |
| 1193 | ref_offset = br_ref_offset; |
| 1194 | ref_num = BR_CONTEXT_POSITION_NUM; |
| 1195 | } |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1196 | #else |
Linfeng Zhang | ce065ca | 2017-10-17 16:49:30 -0700 | [diff] [blame] | 1197 | const int(*ref_offset)[2] = br_ref_offset; |
Angie Chiang | e80957f | 2017-09-05 10:48:00 -0700 | [diff] [blame] | 1198 | const int ref_num = BR_CONTEXT_POSITION_NUM; |
| 1199 | #endif |
| 1200 | for (int i = 0; i < ref_num; ++i) { |
| 1201 | const int nb_row = row - ref_offset[i][0]; |
| 1202 | const int nb_col = col - ref_offset[i][1]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1203 | const int nb_coeff_idx = nb_row * txb_info->width + nb_col; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1204 | |
Angie Chiang | 0c89dca | 2017-08-17 16:36:18 -0700 | [diff] [blame] | 1205 | if (nb_row < 0 || nb_col < 0 || nb_row >= txb_info->height || |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1206 | nb_col >= txb_info->width) |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1207 | continue; |
| 1208 | |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1209 | const int nb_scan_idx = iscan[nb_coeff_idx]; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1210 | if (nb_scan_idx < eob) { |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1211 | const int cost_diff = try_neighbor_level_down_br( |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1212 | nb_coeff_idx, coeff_idx, txb_cache, txb_costs, txb_info); |
Angie Chiang | a530ef4 | 2017-05-30 16:32:36 -0700 | [diff] [blame] | 1213 | if (cost_map) |
| 1214 | cost_map[nb_row - row + COST_MAP_OFFSET] |
| 1215 | [nb_col - col + COST_MAP_OFFSET] += cost_diff; |
| 1216 | accu_cost_diff += cost_diff; |
| 1217 | } |
| 1218 | } |
| 1219 | } |
| 1220 | |
| 1221 | return accu_cost_diff; |
| 1222 | } |
| 1223 | |
Angie Chiang | c77799b | 2017-05-30 17:08:17 -0700 | [diff] [blame] | 1224 | static INLINE void set_eob(TxbInfo *txb_info, int eob) { |
| 1225 | txb_info->eob = eob; |
Urvang Joshi | 8089315 | 2017-10-27 11:51:14 -0700 | [diff] [blame] | 1226 | txb_info->seg_eob = av1_get_max_eob(txb_info->tx_size); |
Angie Chiang | c77799b | 2017-05-30 17:08:17 -0700 | [diff] [blame] | 1227 | } |
| 1228 | |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1229 | // TODO(angiebird): add static to this function it's called |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1230 | void update_level_down(const int coeff_idx, TxbCache *const txb_cache, |
| 1231 | TxbInfo *const txb_info) { |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1232 | const tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
| 1233 | const int abs_qc = abs(qc); |
| 1234 | if (qc == 0) return; |
| 1235 | const tran_low_t low_coeff = get_lower_coeff(qc); |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1236 | update_coeff(coeff_idx, low_coeff, txb_info); |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1237 | |
| 1238 | const int row = coeff_idx >> txb_info->bwl; |
| 1239 | const int col = coeff_idx - (row << txb_info->bwl); |
| 1240 | const int eob = txb_info->eob; |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1241 | const int16_t *const iscan = txb_info->scan_order->iscan; |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1242 | for (int i = 0; i < SIG_REF_OFFSET_NUM; ++i) { |
| 1243 | const int nb_row = row - sig_ref_offset[i][0]; |
| 1244 | const int nb_col = col - sig_ref_offset[i][1]; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1245 | |
| 1246 | if (!(nb_row >= 0 && nb_col >= 0 && nb_row < txb_info->height && |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1247 | nb_col < txb_info->width)) |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1248 | continue; |
| 1249 | |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1250 | const int nb_coeff_idx = nb_row * txb_info->width + nb_col; |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1251 | const int nb_scan_idx = iscan[nb_coeff_idx]; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1252 | if (nb_scan_idx < eob) { |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1253 | const int scan_idx = iscan[coeff_idx]; |
| 1254 | if (scan_idx < nb_scan_idx) { |
| 1255 | const int level = 1; |
| 1256 | if (abs_qc == level) { |
| 1257 | txb_cache->nz_count_arr[nb_coeff_idx] -= 1; |
| 1258 | assert(txb_cache->nz_count_arr[nb_coeff_idx] >= 0); |
| 1259 | } |
Yaowu Xu | 102ef81 | 2017-12-12 11:31:03 -0800 | [diff] [blame] | 1260 | txb_cache->nz_ctx_arr[nb_coeff_idx] = get_nz_map_ctx_from_stats( |
| 1261 | 0, nb_coeff_idx, txb_info->bwl, txb_info->tx_size, |
| 1262 | tx_type_to_class[txb_info->tx_type]); |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1263 | } |
| 1264 | } |
| 1265 | } |
| 1266 | |
Angie Chiang | def1125 | 2017-08-18 14:37:32 -0700 | [diff] [blame] | 1267 | const BASE_CTX_TABLE *base_ctx_table = |
| 1268 | txb_info->coeff_ctx_table->base_ctx_table; |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1269 | for (int i = 0; i < BASE_CONTEXT_POSITION_NUM; ++i) { |
| 1270 | const int nb_row = row - base_ref_offset[i][0]; |
| 1271 | const int nb_col = col - base_ref_offset[i][1]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1272 | const int nb_coeff_idx = nb_row * txb_info->width + nb_col; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1273 | |
| 1274 | if (!(nb_row >= 0 && nb_col >= 0 && nb_row < txb_info->height && |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1275 | nb_col < txb_info->width)) |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1276 | continue; |
| 1277 | |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1278 | const tran_low_t nb_coeff = txb_info->qcoeff[nb_coeff_idx]; |
| 1279 | if (!has_base(nb_coeff, 0)) continue; |
| 1280 | const int nb_scan_idx = iscan[nb_coeff_idx]; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1281 | if (nb_scan_idx < eob) { |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1282 | if (row >= nb_row && col >= nb_col) |
| 1283 | update_mag_arr(txb_cache->base_mag_arr[nb_coeff_idx], abs_qc); |
| 1284 | const int mag = |
| 1285 | get_mag_from_mag_arr(txb_cache->base_mag_arr[nb_coeff_idx]); |
| 1286 | for (int base_idx = 0; base_idx < NUM_BASE_LEVELS; ++base_idx) { |
| 1287 | if (!has_base(nb_coeff, base_idx)) continue; |
| 1288 | const int level = base_idx + 1; |
| 1289 | if (abs_qc == level) { |
| 1290 | txb_cache->base_count_arr[base_idx][nb_coeff_idx] -= 1; |
| 1291 | assert(txb_cache->base_count_arr[base_idx][nb_coeff_idx] >= 0); |
| 1292 | } |
| 1293 | const int count = txb_cache->base_count_arr[base_idx][nb_coeff_idx]; |
Angie Chiang | 1ae0ebf | 2017-08-15 15:16:47 -0700 | [diff] [blame] | 1294 | txb_cache->base_ctx_arr[base_idx][nb_coeff_idx] = |
Angie Chiang | def1125 | 2017-08-18 14:37:32 -0700 | [diff] [blame] | 1295 | base_ctx_table[nb_row != 0][nb_col != 0][mag > level][count]; |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1296 | } |
| 1297 | } |
| 1298 | } |
| 1299 | |
| 1300 | for (int i = 0; i < BR_CONTEXT_POSITION_NUM; ++i) { |
| 1301 | const int nb_row = row - br_ref_offset[i][0]; |
| 1302 | const int nb_col = col - br_ref_offset[i][1]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1303 | const int nb_coeff_idx = nb_row * txb_info->width + nb_col; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1304 | |
| 1305 | if (!(nb_row >= 0 && nb_col >= 0 && nb_row < txb_info->height && |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1306 | nb_col < txb_info->width)) |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1307 | continue; |
| 1308 | |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1309 | const int nb_scan_idx = iscan[nb_coeff_idx]; |
| 1310 | const tran_low_t nb_coeff = txb_info->qcoeff[nb_coeff_idx]; |
| 1311 | if (!has_br(nb_coeff)) continue; |
Jingning Han | 3455e76 | 2017-06-13 21:15:44 -0700 | [diff] [blame] | 1312 | if (nb_scan_idx < eob) { |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1313 | const int level = 1 + NUM_BASE_LEVELS; |
| 1314 | if (abs_qc == level) { |
| 1315 | txb_cache->br_count_arr[nb_coeff_idx] -= 1; |
| 1316 | assert(txb_cache->br_count_arr[nb_coeff_idx] >= 0); |
| 1317 | } |
| 1318 | if (row >= nb_row && col >= nb_col) |
| 1319 | update_mag_arr(txb_cache->br_mag_arr[nb_coeff_idx], abs_qc); |
| 1320 | const int count = txb_cache->br_count_arr[nb_coeff_idx]; |
| 1321 | const int mag = get_mag_from_mag_arr(txb_cache->br_mag_arr[nb_coeff_idx]); |
Angie Chiang | 1ae0ebf | 2017-08-15 15:16:47 -0700 | [diff] [blame] | 1322 | txb_cache->br_ctx_arr[nb_coeff_idx] = |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1323 | get_br_ctx_from_count_mag(nb_row, nb_col, count, mag); |
Angie Chiang | d19969e | 2017-05-30 18:02:33 -0700 | [diff] [blame] | 1324 | } |
| 1325 | } |
| 1326 | } |
| 1327 | |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1328 | static int get_coeff_cost(const tran_low_t qc, const int scan_idx, |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1329 | const int is_eob, const TxbInfo *const txb_info, |
Linfeng Zhang | 5f1b8ce | 2017-12-11 15:53:10 -0800 | [diff] [blame] | 1330 | const LV_MAP_COEFF_COST *const txb_costs, |
| 1331 | const int coeff_ctx) { |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1332 | const TXB_CTX *txb_ctx = txb_info->txb_ctx; |
| 1333 | const int is_nz = (qc != 0); |
| 1334 | const tran_low_t abs_qc = abs(qc); |
| 1335 | int cost = 0; |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1336 | const int16_t *const scan = txb_info->scan_order->scan; |
| 1337 | const int pos = scan[scan_idx]; |
Dake He | 03a3292 | 2017-10-31 08:06:45 -0700 | [diff] [blame] | 1338 | |
Dake He | 3fe369c | 2017-11-16 17:56:44 -0800 | [diff] [blame] | 1339 | if (is_eob) { |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 1340 | cost += txb_costs->base_eob_cost[coeff_ctx][AOMMIN(abs_qc, 3) - 1]; |
Dake He | 3fe369c | 2017-11-16 17:56:44 -0800 | [diff] [blame] | 1341 | } else { |
| 1342 | cost += txb_costs->base_cost[coeff_ctx][AOMMIN(abs_qc, 3)]; |
| 1343 | } |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1344 | if (is_nz) { |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1345 | cost += get_sign_bit_cost(qc, scan_idx, txb_costs->dc_sign_cost, |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1346 | txb_ctx->dc_sign_ctx); |
| 1347 | |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1348 | if (abs_qc > NUM_BASE_LEVELS) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1349 | const int row = pos >> txb_info->bwl; |
| 1350 | const int col = pos - (row << txb_info->bwl); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 1351 | |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1352 | #if USE_CAUSAL_BR_CTX |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 1353 | (void)col; |
| 1354 | const int count = 0; |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1355 | const int ctx = get_br_ctx(txb_info->levels, pos, txb_info->bwl, count, |
| 1356 | txb_info->tx_type); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 1357 | #else |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 1358 | const int count = get_level_count( |
| 1359 | txb_info->levels, (1 << txb_info->bwl) + TX_PAD_HOR, row, col, |
| 1360 | NUM_BASE_LEVELS, br_ref_offset, BR_CONTEXT_POSITION_NUM); |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1361 | const int ctx = get_br_ctx(txb_info->levels, pos, txb_info->bwl, count); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 1362 | #endif |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1363 | cost += get_br_cost(abs_qc, ctx, txb_costs->lps_cost[ctx]); |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1364 | cost += get_golomb_cost(abs_qc); |
| 1365 | } |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1366 | } |
| 1367 | return cost; |
| 1368 | } |
| 1369 | |
Angie Chiang | 47e0707 | 2017-05-30 17:27:01 -0700 | [diff] [blame] | 1370 | #if TEST_OPTIMIZE_TXB |
// Neighborhood scanned by the reference implementation try_level_down_ref().
// Each entry is { row offset, column offset }; a neighbor is located at
// (row - offset[0], col - offset[1]). The first entry is the coefficient
// itself.
#define ALL_REF_OFFSET_NUM 17
static const int all_ref_offset[ALL_REF_OFFSET_NUM][2] = {
  { 0, 0 },
  { -2, -1 }, { -2, 0 },  { -2, 1 },
  { -1, -2 }, { -1, -1 }, { -1, 0 }, { -1, 1 },
  { 0, -2 },  { 0, -1 },
  { 1, -2 },  { 1, -1 },  { 1, 0 },
  { 2, 0 },
  { 0, 1 },   { 0, 2 },
  { 1, 1 },
};
| 1377 | |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1378 | static int try_level_down_ref(int coeff_idx, const LV_MAP_COEFF_COST *txb_costs, |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1379 | TxbInfo *txb_info, |
| 1380 | int (*cost_map)[COST_MAP_SIZE]) { |
| 1381 | if (cost_map) { |
| 1382 | for (int i = 0; i < COST_MAP_SIZE; ++i) av1_zero(cost_map[i]); |
| 1383 | } |
| 1384 | tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
| 1385 | if (qc == 0) return 0; |
| 1386 | int row = coeff_idx >> txb_info->bwl; |
| 1387 | int col = coeff_idx - (row << txb_info->bwl); |
| 1388 | int org_cost = 0; |
| 1389 | for (int i = 0; i < ALL_REF_OFFSET_NUM; ++i) { |
| 1390 | int nb_row = row - all_ref_offset[i][0]; |
| 1391 | int nb_col = col - all_ref_offset[i][1]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1392 | int nb_coeff_idx = nb_row * txb_info->width + nb_col; |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1393 | int nb_scan_idx = txb_info->scan_order->iscan[nb_coeff_idx]; |
| 1394 | if (nb_scan_idx < txb_info->eob && nb_row >= 0 && nb_col >= 0 && |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1395 | nb_row < txb_info->height && nb_col < txb_info->width) { |
Linfeng Zhang | 960e700 | 2017-12-11 13:46:40 -0800 | [diff] [blame] | 1396 | const tran_low_t nb_coeff = txb_info->qcoeff[nb_coeff_idx]; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1397 | const int coeff_ctx = get_nz_map_ctx( |
| 1398 | txb_info->levels, nb_coeff_idx, txb_info->bwl, txb_info->height, |
| 1399 | nb_scan_idx, is_eob, txb_info->tx_size, txb_info->tx_type); |
| 1400 | const int cost = get_coeff_cost(nb_coeff, nb_scan_idx, is_eob, txb_info, |
| 1401 | txb_costs, coeff_ctx); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1402 | if (cost_map) |
| 1403 | cost_map[nb_row - row + COST_MAP_OFFSET] |
| 1404 | [nb_col - col + COST_MAP_OFFSET] -= cost; |
| 1405 | org_cost += cost; |
| 1406 | } |
| 1407 | } |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1408 | update_qcoeff(coeff_idx, get_lower_coeff(qc), txb_info); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1409 | int new_cost = 0; |
| 1410 | for (int i = 0; i < ALL_REF_OFFSET_NUM; ++i) { |
| 1411 | int nb_row = row - all_ref_offset[i][0]; |
| 1412 | int nb_col = col - all_ref_offset[i][1]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1413 | int nb_coeff_idx = nb_row * txb_info->width + nb_col; |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1414 | int nb_scan_idx = txb_info->scan_order->iscan[nb_coeff_idx]; |
| 1415 | if (nb_scan_idx < txb_info->eob && nb_row >= 0 && nb_col >= 0 && |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1416 | nb_row < txb_info->height && nb_col < txb_info->width) { |
Linfeng Zhang | 960e700 | 2017-12-11 13:46:40 -0800 | [diff] [blame] | 1417 | const tran_low_t nb_coeff = txb_info->qcoeff[nb_coeff_idx]; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1418 | const int coeff_ctx = get_nz_map_ctx( |
| 1419 | txb_info->levels, nb_coeff_idx, txb_info->bwl, txb_info->height, |
| 1420 | nb_scan_idx, is_eob, txb_info->tx_size, txb_info->tx_type); |
| 1421 | const int cost = get_coeff_cost(nb_coeff, nb_scan_idx, is_eob, txb_info, |
| 1422 | txb_costs, coeff_ctx); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1423 | if (cost_map) |
| 1424 | cost_map[nb_row - row + COST_MAP_OFFSET] |
| 1425 | [nb_col - col + COST_MAP_OFFSET] += cost; |
| 1426 | new_cost += cost; |
| 1427 | } |
| 1428 | } |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1429 | update_qcoeff(coeff_idx, qc, txb_info); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1430 | return new_cost - org_cost; |
| 1431 | } |
| 1432 | |
| 1433 | static void test_level_down(int coeff_idx, const TxbCache *txb_cache, |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1434 | const LV_MAP_COEFF_COST *txb_costs, |
| 1435 | TxbInfo *txb_info) { |
Angie Chiang | 47e0707 | 2017-05-30 17:27:01 -0700 | [diff] [blame] | 1436 | int cost_map[COST_MAP_SIZE][COST_MAP_SIZE]; |
| 1437 | int ref_cost_map[COST_MAP_SIZE][COST_MAP_SIZE]; |
| 1438 | const int cost_diff = |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1439 | try_level_down(coeff_idx, txb_cache, txb_costs, txb_info, cost_map, 0); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1440 | const int cost_diff_ref = |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1441 | try_level_down_ref(coeff_idx, txb_costs, txb_info, ref_cost_map); |
Angie Chiang | 47e0707 | 2017-05-30 17:27:01 -0700 | [diff] [blame] | 1442 | if (cost_diff != cost_diff_ref) { |
| 1443 | printf("qc %d cost_diff %d cost_diff_ref %d\n", txb_info->qcoeff[coeff_idx], |
| 1444 | cost_diff, cost_diff_ref); |
| 1445 | for (int r = 0; r < COST_MAP_SIZE; ++r) { |
| 1446 | for (int c = 0; c < COST_MAP_SIZE; ++c) { |
| 1447 | printf("%d:%d ", cost_map[r][c], ref_cost_map[r][c]); |
| 1448 | } |
| 1449 | printf("\n"); |
| 1450 | } |
| 1451 | } |
| 1452 | } |
| 1453 | #endif |
| 1454 | |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1455 | // TODO(angiebird): make this static once it's called |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1456 | int get_txb_cost(TxbInfo *txb_info, const LV_MAP_COEFF_COST *txb_costs) { |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1457 | int cost = 0; |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1458 | const int txb_skip_ctx = txb_info->txb_ctx->txb_skip_ctx; |
| 1459 | const int16_t *const scan = txb_info->scan_order->scan; |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1460 | if (txb_info->eob == 0) { |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1461 | cost = txb_costs->txb_skip_cost[txb_skip_ctx][1]; |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1462 | return cost; |
| 1463 | } |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1464 | cost = txb_costs->txb_skip_cost[txb_skip_ctx][0]; |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1465 | for (int c = 0; c < txb_info->eob; ++c) { |
Linfeng Zhang | 5f1b8ce | 2017-12-11 15:53:10 -0800 | [diff] [blame] | 1466 | const int pos = scan[c]; |
| 1467 | const tran_low_t qc = txb_info->qcoeff[pos]; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1468 | const int coeff_ctx = get_nz_map_ctx( |
| 1469 | txb_info->levels, pos, txb_info->bwl, txb_info->height, c, |
| 1470 | c == txb_info->eob - 1, txb_info->tx_size, txb_info->tx_type); |
| 1471 | const int coeff_cost = get_coeff_cost(qc, c, c == txb_info->eob - 1, |
Linfeng Zhang | 5f1b8ce | 2017-12-11 15:53:10 -0800 | [diff] [blame] | 1472 | txb_info, txb_costs, coeff_ctx); |
Angie Chiang | 488f921 | 2017-05-30 12:46:26 -0700 | [diff] [blame] | 1473 | cost += coeff_cost; |
| 1474 | } |
| 1475 | return cost; |
| 1476 | } |
| 1477 | |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1478 | #if TEST_OPTIMIZE_TXB |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1479 | void test_try_change_eob(TxbInfo *txb_info, const LV_MAP_COEFF_COST *txb_costs, |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1480 | TxbCache *txb_cache) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1481 | const int eob = txb_info->eob; |
| 1482 | const int16_t *const scan = txb_info->scan_order->scan; |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1483 | if (eob > 0) { |
| 1484 | int last_si = eob - 1; |
| 1485 | int last_ci = scan[last_si]; |
| 1486 | int last_coeff = txb_info->qcoeff[last_ci]; |
| 1487 | if (abs(last_coeff) == 1) { |
| 1488 | int new_eob; |
| 1489 | int cost_diff = |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1490 | try_change_eob(&new_eob, last_ci, txb_cache, txb_costs, txb_info, 0); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1491 | int org_eob = txb_info->eob; |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1492 | int cost = get_txb_cost(txb_info, txb_costs); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1493 | |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1494 | update_qcoeff(last_ci, get_lower_coeff(last_coeff), txb_info); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1495 | set_eob(txb_info, new_eob); |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1496 | int new_cost = get_txb_cost(txb_info, txb_costs); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1497 | set_eob(txb_info, org_eob); |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1498 | update_qcoeff(last_ci, last_coeff, txb_info); |
Angie Chiang | 5e012fe | 2017-05-30 18:47:39 -0700 | [diff] [blame] | 1499 | |
| 1500 | int ref_cost_diff = -cost + new_cost; |
| 1501 | if (cost_diff != ref_cost_diff) |
| 1502 | printf("org_eob %d new_eob %d cost_diff %d ref_cost_diff %d\n", org_eob, |
| 1503 | new_eob, cost_diff, ref_cost_diff); |
| 1504 | } |
| 1505 | } |
| 1506 | } |
| 1507 | #endif |
| 1508 | |
Jingning Han | 3422ac1 | 2017-10-25 20:37:53 -0700 | [diff] [blame] | 1509 | #if 1 |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1510 | static int optimize_txb(TxbInfo *txb_info, const LV_MAP_COEFF_COST *txb_costs, |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 1511 | const LV_MAP_EOB_COST *txb_eob_costs, |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1512 | TxbCache *txb_cache, int dry_run, int fast_mode) { |
| 1513 | (void)fast_mode; |
| 1514 | (void)txb_cache; |
| 1515 | int update = 0; |
Dake He | 5988177 | 2017-11-24 07:00:02 -0800 | [diff] [blame] | 1516 | // return update; // TODO(DKHE): training only. |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1517 | if (txb_info->eob == 0) return update; |
Urvang Joshi | 8089315 | 2017-10-27 11:51:14 -0700 | [diff] [blame] | 1518 | const int max_eob = av1_get_max_eob(txb_info->tx_size); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1519 | |
| 1520 | #if TEST_OPTIMIZE_TXB |
| 1521 | int64_t sse; |
| 1522 | int64_t org_dist = |
| 1523 | av1_block_error_c(txb_info->tcoeff, txb_info->dqcoeff, max_eob, &sse) * |
| 1524 | (1 << (2 * txb_info->shift)); |
| 1525 | int org_cost = get_txb_cost(txb_info, txb_probs); |
| 1526 | #endif |
| 1527 | |
| 1528 | tran_low_t *org_qcoeff = txb_info->qcoeff; |
| 1529 | tran_low_t *org_dqcoeff = txb_info->dqcoeff; |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1530 | uint8_t *const org_levels = txb_info->levels; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1531 | |
| 1532 | tran_low_t tmp_qcoeff[MAX_TX_SQUARE]; |
| 1533 | tran_low_t tmp_dqcoeff[MAX_TX_SQUARE]; |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 1534 | uint8_t tmp_levels_buf[TX_PAD_2D]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1535 | uint8_t *const tmp_levels = set_levels(tmp_levels_buf, txb_info->width); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1536 | const int org_eob = txb_info->eob; |
| 1537 | if (dry_run) { |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1538 | const int stride = txb_info->width + TX_PAD_HOR; |
| 1539 | const int levels_size = |
| 1540 | |
| 1541 | (stride * (txb_info->height + TX_PAD_VER) + TX_PAD_END); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1542 | memcpy(tmp_qcoeff, org_qcoeff, sizeof(org_qcoeff[0]) * max_eob); |
| 1543 | memcpy(tmp_dqcoeff, org_dqcoeff, sizeof(org_dqcoeff[0]) * max_eob); |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 1544 | memcpy(tmp_levels, org_levels - TX_PAD_TOP * stride, |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1545 | sizeof(org_levels[0]) * levels_size); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1546 | txb_info->qcoeff = tmp_qcoeff; |
| 1547 | txb_info->dqcoeff = tmp_dqcoeff; |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1548 | txb_info->levels = tmp_levels; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1549 | } |
| 1550 | |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1551 | const int16_t *const scan = txb_info->scan_order->scan; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1552 | |
| 1553 | // forward optimize the nz_map` |
| 1554 | const int init_eob = txb_info->eob; |
| 1555 | const int seg_eob = txb_info->seg_eob; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1556 | const int eob_cost = get_eob_cost(init_eob, seg_eob, txb_eob_costs, txb_costs, |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 1557 | txb_info->tx_type); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1558 | |
| 1559 | // backward optimize the level-k map |
| 1560 | int64_t accu_rate = eob_cost; |
| 1561 | int64_t accu_dist = 0; |
| 1562 | int64_t prev_eob_rd_cost = INT64_MAX; |
| 1563 | int64_t cur_eob_rd_cost = 0; |
Jingning Han | 8be58fa | 2017-12-18 09:46:13 -0800 | [diff] [blame] | 1564 | int8_t has_nz_tail = 0; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1565 | |
| 1566 | for (int si = init_eob - 1; si >= 0; --si) { |
| 1567 | const int coeff_idx = scan[si]; |
| 1568 | tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
| 1569 | |
| 1570 | LevelDownStats stats; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1571 | get_dist_cost_stats(&stats, si, si == init_eob - 1, txb_costs, txb_info, |
| 1572 | has_nz_tail); |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1573 | |
| 1574 | if (qc == 0) { |
| 1575 | accu_rate += stats.rate; |
| 1576 | } else { |
Jingning Han | 8be58fa | 2017-12-18 09:46:13 -0800 | [diff] [blame] | 1577 | if (has_nz_tail < 2) { |
| 1578 | // check if it is better to make this the last significant coefficient |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1579 | int cur_eob_rate = get_eob_cost(si + 1, seg_eob, txb_eob_costs, |
| 1580 | txb_costs, txb_info->tx_type); |
Jingning Han | 8be58fa | 2017-12-18 09:46:13 -0800 | [diff] [blame] | 1581 | cur_eob_rd_cost = RDCOST(txb_info->rdmult, cur_eob_rate, 0); |
| 1582 | prev_eob_rd_cost = |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 1583 | RDCOST(txb_info->rdmult, accu_rate, accu_dist) + stats.nz_rd; |
Jingning Han | 8be58fa | 2017-12-18 09:46:13 -0800 | [diff] [blame] | 1584 | if (cur_eob_rd_cost <= prev_eob_rd_cost) { |
| 1585 | update = 1; |
| 1586 | for (int j = si + 1; j < txb_info->eob; j++) { |
| 1587 | const int coeff_pos_j = scan[j]; |
| 1588 | update_coeff(coeff_pos_j, 0, txb_info); |
| 1589 | } |
| 1590 | txb_info->eob = si + 1; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1591 | |
Jingning Han | 8be58fa | 2017-12-18 09:46:13 -0800 | [diff] [blame] | 1592 | // rerun cost calculation due to change of eob |
| 1593 | accu_rate = cur_eob_rate; |
| 1594 | accu_dist = 0; |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1595 | get_dist_cost_stats(&stats, si, 1, txb_costs, txb_info, has_nz_tail); |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 1596 | if ((stats.rd_low < stats.rd) && (stats.low_qc != 0)) { |
| 1597 | update = 1; |
| 1598 | update_coeff(coeff_idx, stats.low_qc, txb_info); |
| 1599 | accu_rate += stats.rate_low; |
| 1600 | accu_dist += stats.dist_low; |
| 1601 | } else { |
| 1602 | accu_rate += stats.rate; |
| 1603 | accu_dist += stats.dist; |
| 1604 | } |
Jingning Han | 8be58fa | 2017-12-18 09:46:13 -0800 | [diff] [blame] | 1605 | continue; |
| 1606 | } |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1607 | } |
| 1608 | |
| 1609 | int bUpdCoeff = 0; |
| 1610 | if (stats.rd_low < stats.rd) { |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 1611 | if ((si < txb_info->eob - 1)) { |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1612 | bUpdCoeff = 1; |
| 1613 | update = 1; |
| 1614 | } |
Jingning Han | 8be58fa | 2017-12-18 09:46:13 -0800 | [diff] [blame] | 1615 | } else { |
| 1616 | ++has_nz_tail; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1617 | } |
| 1618 | |
| 1619 | if (bUpdCoeff) { |
| 1620 | update_coeff(coeff_idx, stats.low_qc, txb_info); |
| 1621 | accu_rate += stats.rate_low; |
| 1622 | accu_dist += stats.dist_low; |
| 1623 | } else { |
| 1624 | accu_rate += stats.rate; |
| 1625 | accu_dist += stats.dist; |
| 1626 | } |
| 1627 | } |
| 1628 | } // for (si) |
Jingning Han | a7a6f4e | 2017-12-13 14:44:08 -0800 | [diff] [blame] | 1629 | |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1630 | int non_zero_blk_rate = |
| 1631 | txb_costs->txb_skip_cost[txb_info->txb_ctx->txb_skip_ctx][0]; |
| 1632 | prev_eob_rd_cost = |
| 1633 | RDCOST(txb_info->rdmult, accu_rate + non_zero_blk_rate, accu_dist); |
| 1634 | |
| 1635 | int zero_blk_rate = |
| 1636 | txb_costs->txb_skip_cost[txb_info->txb_ctx->txb_skip_ctx][1]; |
| 1637 | int64_t zero_blk_rd_cost = RDCOST(txb_info->rdmult, zero_blk_rate, 0); |
| 1638 | if (zero_blk_rd_cost <= prev_eob_rd_cost) { |
| 1639 | update = 1; |
| 1640 | for (int j = 0; j < txb_info->eob; j++) { |
| 1641 | const int coeff_pos_j = scan[j]; |
| 1642 | update_coeff(coeff_pos_j, 0, txb_info); |
| 1643 | } |
| 1644 | txb_info->eob = 0; |
| 1645 | } |
| 1646 | |
| 1647 | #if TEST_OPTIMIZE_TXB |
| 1648 | int cost_diff = 0; |
| 1649 | int64_t dist_diff = 0; |
| 1650 | int64_t rd_diff = 0; |
| 1651 | int64_t new_dist = |
| 1652 | av1_block_error_c(txb_info->tcoeff, txb_info->dqcoeff, max_eob, &sse) * |
| 1653 | (1 << (2 * txb_info->shift)); |
| 1654 | int new_cost = get_txb_cost(txb_info, txb_probs); |
| 1655 | int64_t ref_dist_diff = new_dist - org_dist; |
| 1656 | int ref_cost_diff = new_cost - org_cost; |
| 1657 | if (cost_diff != ref_cost_diff || dist_diff != ref_dist_diff) |
| 1658 | printf( |
| 1659 | "overall rd_diff %ld\ncost_diff %d ref_cost_diff%d\ndist_diff %ld " |
| 1660 | "ref_dist_diff %ld\neob %d new_eob %d\n\n", |
| 1661 | rd_diff, cost_diff, ref_cost_diff, dist_diff, ref_dist_diff, org_eob, |
| 1662 | txb_info->eob); |
| 1663 | #endif |
| 1664 | if (dry_run) { |
| 1665 | txb_info->qcoeff = org_qcoeff; |
| 1666 | txb_info->dqcoeff = org_dqcoeff; |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1667 | txb_info->levels = org_levels; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1668 | set_eob(txb_info, org_eob); |
| 1669 | } |
| 1670 | return update; |
| 1671 | } |
| 1672 | |
| 1673 | #else |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 1674 | static int optimize_txb(TxbInfo *txb_info, const LV_MAP_COEFF_COST *txb_costs, |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1675 | TxbCache *txb_cache, int dry_run, int fast_mode) { |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1676 | int update = 0; |
| 1677 | if (txb_info->eob == 0) return update; |
| 1678 | int cost_diff = 0; |
| 1679 | int64_t dist_diff = 0; |
| 1680 | int64_t rd_diff = 0; |
Urvang Joshi | 8089315 | 2017-10-27 11:51:14 -0700 | [diff] [blame] | 1681 | const int max_eob = av1_get_max_eob(txb_info->tx_size); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1682 | |
| 1683 | #if TEST_OPTIMIZE_TXB |
| 1684 | int64_t sse; |
| 1685 | int64_t org_dist = |
| 1686 | av1_block_error_c(txb_info->tcoeff, txb_info->dqcoeff, max_eob, &sse) * |
| 1687 | (1 << (2 * txb_info->shift)); |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1688 | int org_cost = get_txb_cost(txb_info, txb_costs); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1689 | #endif |
| 1690 | |
| 1691 | tran_low_t *org_qcoeff = txb_info->qcoeff; |
| 1692 | tran_low_t *org_dqcoeff = txb_info->dqcoeff; |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1693 | uint8_t *const org_levels = txb_info->levels; |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1694 | |
| 1695 | tran_low_t tmp_qcoeff[MAX_TX_SQUARE]; |
| 1696 | tran_low_t tmp_dqcoeff[MAX_TX_SQUARE]; |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 1697 | uint8_t tmp_levels_buf[TX_PAD_2D]; |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1698 | uint8_t *const tmp_levels = set_levels(tmp_levels_buf, txb_info->width); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1699 | const int org_eob = txb_info->eob; |
| 1700 | if (dry_run) { |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1701 | const int stride = txb_info->width + TX_PAD_HOR; |
| 1702 | const int levels_size = |
| 1703 | |
| 1704 | (stride * (txb_info->height + TX_PAD_VER) + TX_PAD_END); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1705 | memcpy(tmp_qcoeff, org_qcoeff, sizeof(org_qcoeff[0]) * max_eob); |
| 1706 | memcpy(tmp_dqcoeff, org_dqcoeff, sizeof(org_dqcoeff[0]) * max_eob); |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 1707 | memcpy(tmp_levels, org_levels - TX_PAD_TOP * stride, |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 1708 | sizeof(org_levels[0]) * levels_size); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1709 | txb_info->qcoeff = tmp_qcoeff; |
| 1710 | txb_info->dqcoeff = tmp_dqcoeff; |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1711 | txb_info->levels = tmp_levels; |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1712 | } |
| 1713 | |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 1714 | const int16_t *const scan = txb_info->scan_order->scan; |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1715 | |
| 1716 | // forward optimize the nz_map |
| 1717 | const int cur_eob = txb_info->eob; |
| 1718 | for (int si = 0; si < cur_eob; ++si) { |
| 1719 | const int coeff_idx = scan[si]; |
| 1720 | tran_low_t qc = txb_info->qcoeff[coeff_idx]; |
| 1721 | if (abs(qc) == 1) { |
| 1722 | LevelDownStats stats; |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1723 | try_level_down_facade(&stats, si, txb_cache, txb_costs, txb_info, |
| 1724 | fast_mode); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1725 | if (stats.update) { |
| 1726 | update = 1; |
| 1727 | cost_diff += stats.cost_diff; |
| 1728 | dist_diff += stats.dist_diff; |
| 1729 | rd_diff += stats.rd_diff; |
| 1730 | update_level_down(coeff_idx, txb_cache, txb_info); |
| 1731 | set_eob(txb_info, stats.new_eob); |
| 1732 | } |
| 1733 | } |
| 1734 | } |
| 1735 | |
| 1736 | // backward optimize the level-k map |
Angie Chiang | 530b304 | 2017-08-17 15:08:58 -0700 | [diff] [blame] | 1737 | int eob_fix = 0; |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1738 | for (int si = txb_info->eob - 1; si >= 0; --si) { |
Angie Chiang | 530b304 | 2017-08-17 15:08:58 -0700 | [diff] [blame] | 1739 | const int coeff_idx = scan[si]; |
| 1740 | if (eob_fix == 1 && txb_info->qcoeff[coeff_idx] == 1) { |
| 1741 | // when eob is fixed, there is not need to optimize again when |
| 1742 | // abs(qc) == 1 |
| 1743 | continue; |
| 1744 | } |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1745 | LevelDownStats stats; |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1746 | try_level_down_facade(&stats, si, txb_cache, txb_costs, txb_info, |
| 1747 | fast_mode); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1748 | if (stats.update) { |
| 1749 | #if TEST_OPTIMIZE_TXB |
| 1750 | // printf("si %d low_qc %d cost_diff %d dist_diff %ld rd_diff %ld eob %d new_eob |
| 1751 | // %d\n", si, stats.low_qc, stats.cost_diff, stats.dist_diff, stats.rd_diff, |
| 1752 | // txb_info->eob, stats.new_eob); |
| 1753 | #endif |
| 1754 | update = 1; |
| 1755 | cost_diff += stats.cost_diff; |
| 1756 | dist_diff += stats.dist_diff; |
| 1757 | rd_diff += stats.rd_diff; |
| 1758 | update_level_down(coeff_idx, txb_cache, txb_info); |
| 1759 | set_eob(txb_info, stats.new_eob); |
| 1760 | } |
Angie Chiang | 530b304 | 2017-08-17 15:08:58 -0700 | [diff] [blame] | 1761 | if (eob_fix == 0 && txb_info->qcoeff[coeff_idx] != 0) eob_fix = 1; |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1762 | if (si > txb_info->eob) si = txb_info->eob; |
| 1763 | } |
| 1764 | #if TEST_OPTIMIZE_TXB |
| 1765 | int64_t new_dist = |
| 1766 | av1_block_error_c(txb_info->tcoeff, txb_info->dqcoeff, max_eob, &sse) * |
| 1767 | (1 << (2 * txb_info->shift)); |
Angie Chiang | 0b2795c | 2017-09-29 16:00:08 -0700 | [diff] [blame] | 1768 | int new_cost = get_txb_cost(txb_info, txb_costs); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1769 | int64_t ref_dist_diff = new_dist - org_dist; |
| 1770 | int ref_cost_diff = new_cost - org_cost; |
| 1771 | if (cost_diff != ref_cost_diff || dist_diff != ref_dist_diff) |
| 1772 | printf( |
| 1773 | "overall rd_diff %ld\ncost_diff %d ref_cost_diff%d\ndist_diff %ld " |
| 1774 | "ref_dist_diff %ld\neob %d new_eob %d\n\n", |
| 1775 | rd_diff, cost_diff, ref_cost_diff, dist_diff, ref_dist_diff, org_eob, |
| 1776 | txb_info->eob); |
| 1777 | #endif |
| 1778 | if (dry_run) { |
| 1779 | txb_info->qcoeff = org_qcoeff; |
| 1780 | txb_info->dqcoeff = org_dqcoeff; |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 1781 | txb_info->levels = org_levels; |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1782 | set_eob(txb_info, org_eob); |
| 1783 | } |
| 1784 | return update; |
| 1785 | } |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 1786 | #endif |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1787 | |
| 1788 | // These numbers are empirically obtained. |
| 1789 | static const int plane_rd_mult[REF_TYPES][PLANE_TYPES] = { |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1790 | { 17, 13 }, { 16, 10 }, |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1791 | }; |
| 1792 | |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1793 | void hbt_hash_init() { |
| 1794 | av1_crc_calculator_init(&crc_calculator, 16, 0x5D6DCB); // ctx 16 bit hash |
| 1795 | av1_crc_calculator_init(&crc_calculator2, 16, 0x5D6DCB); // qc 16 bit hash |
| 1796 | memset(hbt_hash_table, 0, sizeof(hbt_hash_table[0][0]) * 65536 * 16); |
| 1797 | hbt_hash_needs_init = 0; |
| 1798 | } |
| 1799 | |
| 1800 | int hbt_hash_miss(int found_index, uint16_t hbt_hash_index, |
| 1801 | uint32_t hbt_hash_match, TxbInfo *txb_info, |
| 1802 | const LV_MAP_COEFF_COST *txb_costs, |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1803 | const LV_MAP_EOB_COST *txb_eob_costs, |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1804 | const struct macroblock_plane *p, int block, int fast_mode) { |
| 1805 | const int16_t *scan = txb_info->scan_order->scan; |
| 1806 | |
| 1807 | av1_txb_init_levels(txb_info->qcoeff, txb_info->width, txb_info->height, |
| 1808 | txb_info->levels); |
| 1809 | // The hash_based_trellis speed feature requires lv_map_multi, so always true. |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1810 | const int update = |
| 1811 | optimize_txb(txb_info, txb_costs, txb_eob_costs, NULL, 0, fast_mode); |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1812 | |
| 1813 | if (update) { |
| 1814 | // Overwrite old lowest entry |
| 1815 | hbt_hash_table[hbt_hash_index][found_index].hbt_hash_match = hbt_hash_match; |
| 1816 | hbt_hash_table[hbt_hash_index][found_index].hits = 1.0; |
| 1817 | for (int i = 0; i < txb_info->eob; i++) { |
| 1818 | hbt_hash_table[hbt_hash_index][found_index].opt_qcoeff[i] = |
| 1819 | txb_info->qcoeff[scan[i]]; |
| 1820 | } |
| 1821 | for (int i = txb_info->eob; i < HBT_HASH_EOB; i++) { |
| 1822 | hbt_hash_table[hbt_hash_index][found_index].opt_qcoeff[i] = 0; |
| 1823 | } |
| 1824 | |
| 1825 | p->eobs[block] = txb_info->eob; |
| 1826 | p->txb_entropy_ctx[block] = av1_get_txb_entropy_context( |
| 1827 | txb_info->qcoeff, txb_info->scan_order, txb_info->eob); |
| 1828 | } |
| 1829 | return txb_info->eob; |
| 1830 | } |
| 1831 | |
| 1832 | int hbt_hash_hit(uint16_t hbt_hash_index, int found_index, TxbInfo *txb_info, |
| 1833 | const struct macroblock_plane *p, int block) { |
| 1834 | const int16_t *scan = txb_info->scan_order->scan; |
| 1835 | int new_eob = 0; |
| 1836 | int update = 0; |
| 1837 | |
| 1838 | for (int i = 0; i < txb_info->eob; i++) { |
| 1839 | if (txb_info->qcoeff[scan[i]] != |
| 1840 | hbt_hash_table[hbt_hash_index][found_index].opt_qcoeff[i]) { |
| 1841 | txb_info->qcoeff[scan[i]] = |
| 1842 | hbt_hash_table[hbt_hash_index][found_index].opt_qcoeff[i]; |
| 1843 | update = 1; |
| 1844 | update_coeff(scan[i], txb_info->qcoeff[scan[i]], txb_info); |
| 1845 | } |
| 1846 | |
| 1847 | if (txb_info->qcoeff[scan[i]]) new_eob = i + 1; |
| 1848 | } |
| 1849 | |
| 1850 | if (update) { |
| 1851 | txb_info->eob = new_eob; |
| 1852 | p->eobs[block] = txb_info->eob; |
| 1853 | p->txb_entropy_ctx[block] = av1_get_txb_entropy_context( |
| 1854 | txb_info->qcoeff, txb_info->scan_order, txb_info->eob); |
| 1855 | } |
| 1856 | return txb_info->eob; |
| 1857 | } |
| 1858 | |
| 1859 | int search_hbt_hash_match(uint16_t hbt_hash_index, uint32_t hbt_hash_match, |
| 1860 | TxbInfo *txb_info, const LV_MAP_COEFF_COST *txb_costs, |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1861 | const LV_MAP_EOB_COST *txb_eob_costs, |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1862 | const struct macroblock_plane *p, int block, |
| 1863 | int fast_mode) { |
| 1864 | // Decay all hits |
| 1865 | double lowest_hits = 1.0; |
| 1866 | int lowest_index = 0; |
| 1867 | |
| 1868 | for (int i = 0; i < 16; i++) { |
| 1869 | hbt_hash_table[hbt_hash_index][i].hits *= 31.0; |
| 1870 | hbt_hash_table[hbt_hash_index][i].hits /= 32.0; |
| 1871 | |
| 1872 | if (hbt_hash_table[hbt_hash_index][i].hits < lowest_hits) { |
| 1873 | lowest_hits = hbt_hash_table[hbt_hash_index][i].hits; |
| 1874 | lowest_index = i; |
| 1875 | } |
| 1876 | } |
| 1877 | |
| 1878 | // Search soft hash vector for qcoeff match |
| 1879 | int found_index = -1; |
| 1880 | for (int i = 0; i < 16; i++) { // OptTxbQcoeff array has fixed size of 16. |
| 1881 | if (hbt_hash_table[hbt_hash_index][i].hbt_hash_match == hbt_hash_match) { |
| 1882 | found_index = i; |
| 1883 | hbt_hash_table[hbt_hash_index][i].hits += 1.0; |
| 1884 | break; // Found a match and it's at found_index |
| 1885 | } |
| 1886 | } |
| 1887 | |
| 1888 | if (found_index == -1) { // Add new OptTxbQcoeff into array. |
| 1889 | return hbt_hash_miss(lowest_index, hbt_hash_index, hbt_hash_match, txb_info, |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1890 | txb_costs, txb_eob_costs, p, block, fast_mode); |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1891 | } else { // Retrieve data from array. |
| 1892 | return hbt_hash_hit(hbt_hash_index, found_index, txb_info, p, block); |
| 1893 | } |
| 1894 | } |
| 1895 | |
| 1896 | int hash_based_trellis_mode(TxbInfo *txb_info, |
| 1897 | const LV_MAP_COEFF_COST *txb_costs, |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1898 | const LV_MAP_EOB_COST *txb_eob_costs, |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1899 | const struct macroblock_plane *p, int block, |
| 1900 | int fast_mode, TXB_CTX *txb_ctx) { |
| 1901 | // Initialize hash table if needed. |
| 1902 | if (hbt_hash_needs_init) { |
| 1903 | hbt_hash_init(); |
| 1904 | } |
| 1905 | |
| 1906 | //// Hash creation |
| 1907 | // TODO(mfo): use exact length once input finalized |
| 1908 | uint8_t txb_hash_data[256]; |
| 1909 | const int16_t *scan = txb_info->scan_order->scan; |
| 1910 | uint8_t chunk = 0; |
| 1911 | |
| 1912 | uint16_t ctx_hash = 0; |
| 1913 | uint32_t qc_hash = 0; |
| 1914 | |
| 1915 | int hash_data_index = 0; |
| 1916 | for (int i = 0; i < txb_info->eob; i++) { |
| 1917 | // Data softening: data from -3 -> 3 is left alone, |
| 1918 | // while 'large' data is put into buckets of 16s |
| 1919 | // Consider bucketing less than 16 down to 4 instead of 0 |
| 1920 | // if(txb_info->qcoeff[scan[i]] < 4 && txb_info->qcoeff[scan[i]] > -4) |
| 1921 | chunk = (txb_info->qcoeff[scan[i]]) & 0xff; |
| 1922 | /*else if(txb_info->qcoeff[scan[i]] < 16 && txb_info->qcoeff[scan[i]] > -16) |
| 1923 | chunk = (txb_info->qcoeff[scan[i]]) & 0xfc; // |
| 1924 | else |
| 1925 | chunk = (txb_info->qcoeff[scan[i]]) & 0xf0; // greater than 16*/ |
| 1926 | txb_hash_data[hash_data_index++] = chunk; |
| 1927 | |
| 1928 | chunk = ((txb_info->qcoeff[scan[i]]) & 0xff00) >> 8; |
| 1929 | txb_hash_data[hash_data_index++] = chunk; |
| 1930 | } |
| 1931 | assert(hash_data_index <= 256); |
| 1932 | // 16 bit |
| 1933 | qc_hash = av1_get_crc_value(&crc_calculator2, txb_hash_data, hash_data_index); |
| 1934 | |
| 1935 | hash_data_index = 0; |
| 1936 | // tcoeff |
| 1937 | for (int i = 0; i < txb_info->eob; i++) { |
| 1938 | chunk = (txb_info->tcoeff[scan[i]] - txb_info->dqcoeff[scan[i]]) & 0xff; |
| 1939 | txb_hash_data[hash_data_index++] = chunk; |
| 1940 | } |
| 1941 | // txb_ctx |
| 1942 | chunk = txb_ctx->txb_skip_ctx & 0xff; |
| 1943 | txb_hash_data[hash_data_index++] = chunk; |
| 1944 | chunk = txb_ctx->dc_sign_ctx & 0xff; |
| 1945 | txb_hash_data[hash_data_index++] = chunk; |
| 1946 | // dequant |
| 1947 | chunk = txb_info->dequant[0] & 0xff; |
| 1948 | txb_hash_data[hash_data_index++] = chunk; |
| 1949 | chunk = (txb_info->dequant[0] & 0xff00) >> 8; |
| 1950 | txb_hash_data[hash_data_index++] = chunk; |
| 1951 | chunk = txb_info->dequant[1] & 0xff; |
| 1952 | txb_hash_data[hash_data_index++] = chunk; |
| 1953 | chunk = (txb_info->dequant[1] & 0xff00) >> 8; |
| 1954 | txb_hash_data[hash_data_index++] = chunk; |
| 1955 | // txb_skip_cost |
| 1956 | /*for (int i = 0; i < 2; i++) { |
| 1957 | for (int j = 0; j < TXB_SKIP_CONTEXTS; j++) { |
| 1958 | chunk = (txb_costs->txb_skip_cost[j][i] & 0xff00) >> 8; |
| 1959 | txb_hash_data[hash_data_index++] = chunk; |
| 1960 | } |
| 1961 | } |
| 1962 | // base_eob_cost |
| 1963 | for (int i = 1; i < 3; i++) { // i = 0 are softened away |
| 1964 | for (int j = 0; j < SIG_COEF_CONTEXTS_EOB; j++) { |
| 1965 | chunk = (txb_costs->base_eob_cost[j][i] & 0xff00) >> 8; |
| 1966 | txb_hash_data[hash_data_index++] = chunk; |
| 1967 | } |
| 1968 | }*/ |
| 1969 | assert(hash_data_index <= 256); |
| 1970 | // Gives 16 bit hash for ctx |
| 1971 | ctx_hash = av1_get_crc_value(&crc_calculator, txb_hash_data, hash_data_index); |
| 1972 | |
| 1973 | uint16_t hbt_hash_index = ctx_hash; // 16 bit ctx_hash: index to table |
| 1974 | uint32_t hbt_hash_match = qc_hash; // 16 bit qc_hash: matched in array |
| 1975 | //// End hash creation |
| 1976 | |
| 1977 | return search_hbt_hash_match(hbt_hash_index, hbt_hash_match, txb_info, |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 1978 | txb_costs, txb_eob_costs, p, block, fast_mode); |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1979 | } |
| 1980 | |
| 1981 | int av1_optimize_txb(const AV1_COMP *const cpi, MACROBLOCK *x, int plane, |
Jingning Han | 7eab9ff | 2017-07-06 10:12:54 -0700 | [diff] [blame] | 1982 | int blk_row, int blk_col, int block, TX_SIZE tx_size, |
Angie Chiang | 25645b7 | 2017-09-24 14:28:49 -0700 | [diff] [blame] | 1983 | TXB_CTX *txb_ctx, int fast_mode) { |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 1984 | const AV1_COMMON *cm = &cpi->common; |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1985 | MACROBLOCKD *const xd = &x->e_mbd; |
| 1986 | const PLANE_TYPE plane_type = get_plane_type(plane); |
Debargha Mukherjee | b3eda2f | 2017-11-28 16:00:20 -0800 | [diff] [blame] | 1987 | const TX_SIZE txs_ctx = get_txsize_entropy_ctx(tx_size); |
Jingning Han | 19b5c8f | 2017-07-06 15:10:12 -0700 | [diff] [blame] | 1988 | const TX_TYPE tx_type = |
Luc Trudeau | 2eb9b84 | 2017-12-13 11:19:16 -0500 | [diff] [blame] | 1989 | av1_get_tx_type(plane_type, xd, blk_row, blk_col, tx_size); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 1990 | const MB_MODE_INFO *mbmi = &xd->mi[0]->mbmi; |
| 1991 | const struct macroblock_plane *p = &x->plane[plane]; |
| 1992 | struct macroblockd_plane *pd = &xd->plane[plane]; |
| 1993 | const int eob = p->eobs[block]; |
| 1994 | tran_low_t *qcoeff = BLOCK_OFFSET(p->qcoeff, block); |
| 1995 | tran_low_t *dqcoeff = BLOCK_OFFSET(pd->dqcoeff, block); |
| 1996 | const tran_low_t *tcoeff = BLOCK_OFFSET(p->coeff, block); |
Monty Montgomery | 125c0fc | 2017-10-26 00:44:35 -0400 | [diff] [blame] | 1997 | const int16_t *dequant = p->dequant_QTX; |
Urvang Joshi | 8089315 | 2017-10-27 11:51:14 -0700 | [diff] [blame] | 1998 | const int seg_eob = av1_get_max_eob(tx_size); |
Angie Chiang | a9ba58e | 2017-12-01 19:22:43 -0800 | [diff] [blame] | 1999 | const int bwl = get_txb_bwl(tx_size); |
| 2000 | const int width = get_txb_wide(tx_size); |
| 2001 | const int height = get_txb_high(tx_size); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 2002 | const int is_inter = is_inter_block(mbmi); |
Angie Chiang | bd99b38 | 2017-06-20 15:11:16 -0700 | [diff] [blame] | 2003 | const SCAN_ORDER *const scan_order = get_scan(cm, tx_size, tx_type, mbmi); |
Jingning Han | dfd7232 | 2017-08-09 14:04:12 -0700 | [diff] [blame] | 2004 | const LV_MAP_COEFF_COST txb_costs = x->coeff_costs[txs_ctx][plane_type]; |
Sarah Parker | 3d75209 | 2017-12-20 15:37:55 -0800 | [diff] [blame] | 2005 | #if CONFIG_NEW_QUANT |
Debargha Mukherjee | e15b8ad | 2017-12-26 07:10:40 -0800 | [diff] [blame] | 2006 | int dq = get_dq_profile(cm->dq_type, x->qindex, is_inter, plane_type); |
Sarah Parker | 3d75209 | 2017-12-20 15:37:55 -0800 | [diff] [blame] | 2007 | const dequant_val_type_nuq *dequant_val = p->dequant_val_nuq_QTX[dq]; |
| 2008 | #endif // CONFIG_NEW_QUANT |
Dake He | 0db7d0e | 2017-12-21 15:23:20 -0800 | [diff] [blame] | 2009 | const int eob_multi_size = txsize_log2_minus4[tx_size]; |
| 2010 | const LV_MAP_EOB_COST txb_eob_costs = |
| 2011 | x->eob_costs[eob_multi_size][plane_type]; |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 2012 | |
Monty | bca9e9e | 2017-12-14 06:23:29 -0600 | [diff] [blame] | 2013 | #if CONFIG_DAALA_TX |
| 2014 | const int shift = 0; |
| 2015 | #else |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 2016 | const int shift = av1_get_tx_scale(tx_size); |
Monty | bca9e9e | 2017-12-14 06:23:29 -0600 | [diff] [blame] | 2017 | #endif |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 2018 | const int64_t rdmult = |
Jingning Han | b433f4c | 2017-11-17 15:43:59 -0800 | [diff] [blame] | 2019 | ((x->rdmult * plane_rd_mult[is_inter][plane_type] << (2 * (xd->bd - 8))) + |
| 2020 | 2) >> |
| 2021 | 2; |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 2022 | uint8_t levels_buf[TX_PAD_2D]; |
| 2023 | uint8_t *const levels = set_levels(levels_buf, width); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 2024 | |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 2025 | assert(width == (1 << bwl)); |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 2026 | TxbInfo txb_info = { |
Sarah Parker | 3d75209 | 2017-12-20 15:37:55 -0800 | [diff] [blame] | 2027 | qcoeff, |
| 2028 | levels, |
| 2029 | dqcoeff, |
| 2030 | tcoeff, |
| 2031 | dequant, |
| 2032 | #if CONFIG_NEW_QUANT |
| 2033 | dequant_val, |
| 2034 | #endif // CONFIG_NEW_QUANT |
| 2035 | shift, |
| 2036 | tx_size, |
| 2037 | txs_ctx, |
| 2038 | tx_type, |
| 2039 | bwl, |
| 2040 | width, |
| 2041 | height, |
| 2042 | eob, |
| 2043 | seg_eob, |
| 2044 | scan_order, |
| 2045 | txb_ctx, |
| 2046 | rdmult, |
| 2047 | &cm->coeff_ctx_table |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 2048 | }; |
| 2049 | |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 2050 | // Hash based trellis (hbt) speed feature: avoid expensive optimize_txb calls |
| 2051 | // by storing the optimized coefficients in a hash table. |
| 2052 | // Currently disabled in speedfeatures.c |
| 2053 | if (eob <= HBT_HASH_EOB && eob > 0 && cpi->sf.use_hash_based_trellis) { |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 2054 | return hash_based_trellis_mode(&txb_info, &txb_costs, &txb_eob_costs, p, |
| 2055 | block, fast_mode, txb_ctx); |
Michelle Findlay-Olynyk | fbab062 | 2017-12-13 14:10:56 -0800 | [diff] [blame] | 2056 | } |
| 2057 | |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 2058 | av1_txb_init_levels(qcoeff, width, height, levels); |
Urvang Joshi | 70006e4 | 2017-06-14 16:08:55 -0700 | [diff] [blame] | 2059 | |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 2060 | const int update = |
| 2061 | optimize_txb(&txb_info, &txb_costs, &txb_eob_costs, NULL, 0, fast_mode); |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 2062 | |
Jingning Han | d7e9911 | 2017-12-13 09:47:45 -0800 | [diff] [blame] | 2063 | if (update) { |
| 2064 | p->eobs[block] = txb_info.eob; |
| 2065 | p->txb_entropy_ctx[block] = |
| 2066 | av1_get_txb_entropy_context(qcoeff, scan_order, txb_info.eob); |
| 2067 | } |
Angie Chiang | 07c57f3 | 2017-05-30 18:18:33 -0700 | [diff] [blame] | 2068 | return txb_info.eob; |
| 2069 | } |
Jingning Han | d7e9911 | 2017-12-13 09:47:45 -0800 | [diff] [blame] | 2070 | |
Angie Chiang | 74e2307 | 2017-03-24 14:54:23 -0700 | [diff] [blame] | 2071 | int av1_get_txb_entropy_context(const tran_low_t *qcoeff, |
| 2072 | const SCAN_ORDER *scan_order, int eob) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2073 | const int16_t *const scan = scan_order->scan; |
Angie Chiang | 74e2307 | 2017-03-24 14:54:23 -0700 | [diff] [blame] | 2074 | int cul_level = 0; |
| 2075 | int c; |
Jingning Han | 339cf93 | 2017-09-18 10:17:02 -0700 | [diff] [blame] | 2076 | |
| 2077 | if (eob == 0) return 0; |
Angie Chiang | 74e2307 | 2017-03-24 14:54:23 -0700 | [diff] [blame] | 2078 | for (c = 0; c < eob; ++c) { |
| 2079 | cul_level += abs(qcoeff[scan[c]]); |
| 2080 | } |
| 2081 | |
| 2082 | cul_level = AOMMIN(COEFF_CONTEXT_MASK, cul_level); |
| 2083 | set_dc_sign(&cul_level, qcoeff[0]); |
| 2084 | |
| 2085 | return cul_level; |
| 2086 | } |
| 2087 | |
Jingning Han | 4fe5f67 | 2017-05-19 15:46:07 -0700 | [diff] [blame] | 2088 | void av1_update_txb_context_b(int plane, int block, int blk_row, int blk_col, |
| 2089 | BLOCK_SIZE plane_bsize, TX_SIZE tx_size, |
| 2090 | void *arg) { |
Jingning Han | 6171ae7 | 2017-05-18 20:15:06 -0700 | [diff] [blame] | 2091 | struct tokenize_b_args *const args = arg; |
Angie Chiang | 36d616b | 2017-03-22 13:58:36 -0700 | [diff] [blame] | 2092 | const AV1_COMP *cpi = args->cpi; |
| 2093 | const AV1_COMMON *cm = &cpi->common; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2094 | ThreadData *const td = args->td; |
| 2095 | MACROBLOCK *const x = &td->mb; |
| 2096 | MACROBLOCKD *const xd = &x->e_mbd; |
Angie Chiang | 36d616b | 2017-03-22 13:58:36 -0700 | [diff] [blame] | 2097 | MB_MODE_INFO *mbmi = &xd->mi[0]->mbmi; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2098 | struct macroblock_plane *p = &x->plane[plane]; |
| 2099 | struct macroblockd_plane *pd = &xd->plane[plane]; |
Angie Chiang | 36d616b | 2017-03-22 13:58:36 -0700 | [diff] [blame] | 2100 | const uint16_t eob = p->eobs[block]; |
| 2101 | const tran_low_t *qcoeff = BLOCK_OFFSET(p->qcoeff, block); |
| 2102 | const PLANE_TYPE plane_type = pd->plane_type; |
Jingning Han | 19b5c8f | 2017-07-06 15:10:12 -0700 | [diff] [blame] | 2103 | const TX_TYPE tx_type = |
Luc Trudeau | 2eb9b84 | 2017-12-13 11:19:16 -0500 | [diff] [blame] | 2104 | av1_get_tx_type(plane_type, xd, blk_row, blk_col, tx_size); |
Angie Chiang | bd99b38 | 2017-06-20 15:11:16 -0700 | [diff] [blame] | 2105 | const SCAN_ORDER *const scan_order = get_scan(cm, tx_size, tx_type, mbmi); |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2106 | (void)plane_bsize; |
Angie Chiang | 36d616b | 2017-03-22 13:58:36 -0700 | [diff] [blame] | 2107 | |
Angie Chiang | 74e2307 | 2017-03-24 14:54:23 -0700 | [diff] [blame] | 2108 | int cul_level = av1_get_txb_entropy_context(qcoeff, scan_order, eob); |
Angie Chiang | 36d616b | 2017-03-22 13:58:36 -0700 | [diff] [blame] | 2109 | av1_set_contexts(xd, pd, plane, tx_size, cul_level, blk_col, blk_row); |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2110 | } |
| 2111 | |
Jingning Han | 4fe5f67 | 2017-05-19 15:46:07 -0700 | [diff] [blame] | 2112 | void av1_update_and_record_txb_context(int plane, int block, int blk_row, |
| 2113 | int blk_col, BLOCK_SIZE plane_bsize, |
| 2114 | TX_SIZE tx_size, void *arg) { |
Jingning Han | 6171ae7 | 2017-05-18 20:15:06 -0700 | [diff] [blame] | 2115 | struct tokenize_b_args *const args = arg; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2116 | const AV1_COMP *cpi = args->cpi; |
| 2117 | const AV1_COMMON *cm = &cpi->common; |
| 2118 | ThreadData *const td = args->td; |
| 2119 | MACROBLOCK *const x = &td->mb; |
| 2120 | MACROBLOCKD *const xd = &x->e_mbd; |
| 2121 | struct macroblock_plane *p = &x->plane[plane]; |
| 2122 | struct macroblockd_plane *pd = &xd->plane[plane]; |
| 2123 | MB_MODE_INFO *mbmi = &xd->mi[0]->mbmi; |
Linfeng Zhang | 848f7bc | 2017-10-31 15:26:07 -0700 | [diff] [blame] | 2124 | int eob = p->eobs[block], update_eob = -1; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2125 | const PLANE_TYPE plane_type = pd->plane_type; |
| 2126 | const tran_low_t *qcoeff = BLOCK_OFFSET(p->qcoeff, block); |
| 2127 | tran_low_t *tcoeff = BLOCK_OFFSET(x->mbmi_ext->tcoeff[plane], block); |
| 2128 | const int segment_id = mbmi->segment_id; |
Jingning Han | 19b5c8f | 2017-07-06 15:10:12 -0700 | [diff] [blame] | 2129 | const TX_TYPE tx_type = |
Luc Trudeau | 2eb9b84 | 2017-12-13 11:19:16 -0500 | [diff] [blame] | 2130 | av1_get_tx_type(plane_type, xd, blk_row, blk_col, tx_size); |
Angie Chiang | bd99b38 | 2017-06-20 15:11:16 -0700 | [diff] [blame] | 2131 | const SCAN_ORDER *const scan_order = get_scan(cm, tx_size, tx_type, mbmi); |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2132 | const int16_t *const scan = scan_order->scan; |
hui su | c0cf71d | 2017-07-20 16:38:50 -0700 | [diff] [blame] | 2133 | const int seg_eob = av1_get_tx_eob(&cpi->common.seg, segment_id, tx_size); |
Linfeng Zhang | 1015a34 | 2017-10-24 16:20:41 -0700 | [diff] [blame] | 2134 | int c; |
Angie Chiang | 8590156 | 2017-03-17 12:03:27 -0700 | [diff] [blame] | 2135 | TXB_CTX txb_ctx; |
| 2136 | get_txb_ctx(plane_bsize, tx_size, plane, pd->above_context + blk_col, |
| 2137 | pd->left_context + blk_row, &txb_ctx); |
Angie Chiang | a9ba58e | 2017-12-01 19:22:43 -0800 | [diff] [blame] | 2138 | const int bwl = get_txb_bwl(tx_size); |
| 2139 | const int width = get_txb_wide(tx_size); |
| 2140 | const int height = get_txb_high(tx_size); |
Linfeng Zhang | 679d81e | 2017-10-31 15:27:42 -0700 | [diff] [blame] | 2141 | uint8_t levels_buf[TX_PAD_2D]; |
| 2142 | uint8_t *const levels = set_levels(levels_buf, width); |
Linfeng Zhang | ae7b2f3 | 2017-11-08 15:46:57 -0800 | [diff] [blame] | 2143 | DECLARE_ALIGNED(16, uint8_t, level_counts[MAX_TX_SQUARE]); |
Yunqing Wang | 0e141b5 | 2017-11-02 15:08:58 -0700 | [diff] [blame] | 2144 | const uint8_t allow_update_cdf = args->allow_update_cdf; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2145 | |
Debargha Mukherjee | b3eda2f | 2017-11-28 16:00:20 -0800 | [diff] [blame] | 2146 | TX_SIZE txsize_ctx = get_txsize_entropy_ctx(tx_size); |
Jingning Han | 8f66160 | 2017-08-19 08:16:50 -0700 | [diff] [blame] | 2147 | FRAME_CONTEXT *ec_ctx = xd->tile_ctx; |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 2148 | DECLARE_ALIGNED(16, int8_t, coeff_contexts[MAX_TX_SQUARE]); |
Jingning Han | 48be0e1 | 2017-06-13 12:12:01 -0700 | [diff] [blame] | 2149 | |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2150 | memcpy(tcoeff, qcoeff, sizeof(*tcoeff) * seg_eob); |
| 2151 | |
Jingning Han | 48be0e1 | 2017-06-13 12:12:01 -0700 | [diff] [blame] | 2152 | ++td->counts->txb_skip[txsize_ctx][txb_ctx.txb_skip_ctx][eob == 0]; |
Yunqing Wang | 0e141b5 | 2017-11-02 15:08:58 -0700 | [diff] [blame] | 2153 | if (allow_update_cdf) |
| 2154 | update_bin(ec_ctx->txb_skip_cdf[txsize_ctx][txb_ctx.txb_skip_ctx], eob == 0, |
| 2155 | 2); |
Angie Chiang | 8590156 | 2017-03-17 12:03:27 -0700 | [diff] [blame] | 2156 | x->mbmi_ext->txb_skip_ctx[plane][block] = txb_ctx.txb_skip_ctx; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2157 | |
| 2158 | x->mbmi_ext->eobs[plane][block] = eob; |
| 2159 | |
| 2160 | if (eob == 0) { |
| 2161 | av1_set_contexts(xd, pd, plane, tx_size, 0, blk_col, blk_row); |
| 2162 | return; |
| 2163 | } |
| 2164 | |
Linfeng Zhang | 1122d7d | 2017-10-31 15:30:28 -0700 | [diff] [blame] | 2165 | av1_txb_init_levels(tcoeff, width, height, levels); |
Linfeng Zhang | ce065ca | 2017-10-17 16:49:30 -0700 | [diff] [blame] | 2166 | |
Angie Chiang | cd9b03f | 2017-04-16 13:37:13 -0700 | [diff] [blame] | 2167 | #if CONFIG_TXK_SEL |
Luc Trudeau | 2eb9b84 | 2017-12-13 11:19:16 -0500 | [diff] [blame] | 2168 | av1_update_tx_type_count(cm, xd, blk_row, blk_col, plane, mbmi->sb_type, |
Debargha Mukherjee | 3ebb0d0 | 2017-12-14 05:05:18 -0800 | [diff] [blame] | 2169 | tx_size, td->counts, allow_update_cdf); |
Angie Chiang | cd9b03f | 2017-04-16 13:37:13 -0700 | [diff] [blame] | 2170 | #endif |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2171 | |
Jingning Han | 35deaa7 | 2017-10-26 15:36:30 -0700 | [diff] [blame] | 2172 | av1_update_eob_context(eob, seg_eob, tx_size, tx_type, plane_type, ec_ctx, |
Yunqing Wang | 0e141b5 | 2017-11-02 15:08:58 -0700 | [diff] [blame] | 2173 | td->counts, allow_update_cdf); |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 2174 | |
| 2175 | av1_get_nz_map_contexts(levels, scan, eob, tx_size, tx_type, coeff_contexts); |
| 2176 | |
Dake He | 03a3292 | 2017-10-31 08:06:45 -0700 | [diff] [blame] | 2177 | update_eob = eob - 1; |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 2178 | for (c = eob - 1; c >= 0; --c) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2179 | const int pos = scan[c]; |
Linfeng Zhang | d67c13f | 2017-12-11 11:49:12 -0800 | [diff] [blame] | 2180 | const int coeff_ctx = coeff_contexts[pos]; |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2181 | const tran_low_t v = qcoeff[pos]; |
| 2182 | const int is_nz = (v != 0); |
Dake He | 03a3292 | 2017-10-31 08:06:45 -0700 | [diff] [blame] | 2183 | |
Ola Hugosson | 1389210 | 2017-11-06 08:01:44 +0100 | [diff] [blame] | 2184 | (void)is_nz; |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 2185 | if (allow_update_cdf) { |
| 2186 | if (c == eob - 1) { |
| 2187 | assert(coeff_ctx < 4); |
| 2188 | update_cdf( |
| 2189 | ec_ctx->coeff_base_eob_cdf[txsize_ctx][plane_type][coeff_ctx], |
| 2190 | AOMMIN(abs(v), 3) - 1, 3); |
| 2191 | } else { |
| 2192 | update_cdf(ec_ctx->coeff_base_cdf[txsize_ctx][plane_type][coeff_ctx], |
| 2193 | AOMMIN(abs(v), 3), 4); |
| 2194 | } |
Dake He | 3fe369c | 2017-11-16 17:56:44 -0800 | [diff] [blame] | 2195 | } |
Dake He | 5988177 | 2017-11-24 07:00:02 -0800 | [diff] [blame] | 2196 | { |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 2197 | if (c == eob - 1) { |
| 2198 | assert(coeff_ctx < 4); |
| 2199 | ++td->counts->coeff_base_eob_multi[txsize_ctx][plane_type][coeff_ctx] |
| 2200 | [AOMMIN(abs(v), 3) - 1]; |
| 2201 | } else { |
| 2202 | ++td->counts->coeff_base_multi[txsize_ctx][plane_type][coeff_ctx] |
| 2203 | [AOMMIN(abs(v), 3)]; |
Dake He | 5988177 | 2017-11-24 07:00:02 -0800 | [diff] [blame] | 2204 | } |
| 2205 | } |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 2206 | } |
Dake He | a47cd6c | 2017-10-13 18:09:58 -0700 | [diff] [blame] | 2207 | |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2208 | // Update the context needed to code the DC sign (if applicable) |
| 2209 | const int sign = (tcoeff[0] < 0) ? 1 : 0; |
| 2210 | if (tcoeff[0] != 0) { |
Dake He | 43edb76 | 2017-10-26 10:29:46 -0700 | [diff] [blame] | 2211 | int dc_sign_ctx = txb_ctx.dc_sign_ctx; |
| 2212 | |
| 2213 | ++td->counts->dc_sign[plane_type][dc_sign_ctx][sign]; |
Yunqing Wang | 0e141b5 | 2017-11-02 15:08:58 -0700 | [diff] [blame] | 2214 | if (allow_update_cdf) |
| 2215 | update_bin(ec_ctx->dc_sign_cdf[plane_type][dc_sign_ctx], sign, 2); |
Dake He | 43edb76 | 2017-10-26 10:29:46 -0700 | [diff] [blame] | 2216 | x->mbmi_ext->dc_sign_ctx[plane][block] = dc_sign_ctx; |
| 2217 | } |
| 2218 | |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 2219 | if (update_eob >= 0) { |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 2220 | for (c = update_eob; c >= 0; --c) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2221 | const int pos = scan[c]; |
| 2222 | const tran_low_t level = abs(tcoeff[pos]); |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 2223 | int idx; |
| 2224 | int ctx; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2225 | |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 2226 | if (level <= NUM_BASE_LEVELS) continue; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2227 | |
Sebastien Alaiwan | 78f7bb9 | 2018-01-11 11:02:43 +0100 | [diff] [blame] | 2228 | // level is above 1. |
Jingning Han | 87b01b5 | 2017-08-31 12:07:20 -0700 | [diff] [blame] | 2229 | |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2230 | const int base_range = level - 1 - NUM_BASE_LEVELS; |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 2231 | #if USE_CAUSAL_BR_CTX |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2232 | ctx = get_br_ctx(levels, pos, bwl, level_counts[pos], tx_type); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 2233 | #else |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2234 | ctx = get_br_ctx(levels, pos, bwl, level_counts[pos]); |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 2235 | #endif |
Ola Hugosson | e72a209 | 2017-11-12 09:11:53 +0100 | [diff] [blame] | 2236 | for (idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
Linfeng Zhang | db41d1e | 2017-12-05 11:06:20 -0800 | [diff] [blame] | 2237 | const int k = AOMMIN(base_range - idx, BR_CDF_SIZE - 1); |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 2238 | if (allow_update_cdf) { |
| 2239 | update_cdf( |
Dake He | e2d8f18 | 2017-12-14 13:28:00 -0800 | [diff] [blame] | 2240 | #if 0 |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 2241 | ec_ctx->coeff_br_cdf[AOMMIN(txsize_ctx, TX_16X16)][plane_type][ctx], |
Dake He | e2d8f18 | 2017-12-14 13:28:00 -0800 | [diff] [blame] | 2242 | #else |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 2243 | ec_ctx |
| 2244 | ->coeff_br_cdf[AOMMIN(txsize_ctx, TX_32X32)][plane_type][ctx], |
Dake He | e2d8f18 | 2017-12-14 13:28:00 -0800 | [diff] [blame] | 2245 | #endif |
Dake He | 4d44769 | 2017-12-15 09:10:06 -0800 | [diff] [blame] | 2246 | k, BR_CDF_SIZE); |
| 2247 | } |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 2248 | for (int lps = 0; lps < BR_CDF_SIZE - 1; lps++) { |
Dake He | e2d8f18 | 2017-12-14 13:28:00 -0800 | [diff] [blame] | 2249 | #if 0 |
Dake He | 7d01ab5 | 2017-11-24 17:53:28 -0800 | [diff] [blame] | 2250 | ++td->counts->coeff_lps[AOMMIN(txsize_ctx, TX_16X16)][plane_type][lps] |
| 2251 | [ctx][lps == k]; |
Dake He | e2d8f18 | 2017-12-14 13:28:00 -0800 | [diff] [blame] | 2252 | #else |
| 2253 | ++td->counts->coeff_lps[AOMMIN(txsize_ctx, TX_32X32)][plane_type][lps] |
| 2254 | [ctx][lps == k]; |
| 2255 | #endif |
Dake He | 5988177 | 2017-11-24 07:00:02 -0800 | [diff] [blame] | 2256 | if (lps == k) break; |
| 2257 | } |
Dake He | e2d8f18 | 2017-12-14 13:28:00 -0800 | [diff] [blame] | 2258 | ++td->counts->coeff_lps_multi[AOMMIN(txsize_ctx, TX_32X32)][plane_type] |
| 2259 | [ctx][k]; |
Dake He | 5988177 | 2017-11-24 07:00:02 -0800 | [diff] [blame] | 2260 | |
Ola Hugosson | e72a209 | 2017-11-12 09:11:53 +0100 | [diff] [blame] | 2261 | if (k < BR_CDF_SIZE - 1) break; |
| 2262 | } |
Linfeng Zhang | 97fc474 | 2017-11-07 12:57:25 -0800 | [diff] [blame] | 2263 | // use 0-th order Golomb code to handle the residual level. |
Jingning Han | 87b01b5 | 2017-08-31 12:07:20 -0700 | [diff] [blame] | 2264 | } |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2265 | } |
Angie Chiang | 36d616b | 2017-03-22 13:58:36 -0700 | [diff] [blame] | 2266 | |
Angie Chiang | 63d190a | 2017-10-23 15:43:05 -0700 | [diff] [blame] | 2267 | int cul_level = av1_get_txb_entropy_context(tcoeff, scan_order, eob); |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2268 | av1_set_contexts(xd, pd, plane, tx_size, cul_level, blk_col, blk_row); |
| 2269 | } |
| 2270 | |
| 2271 | void av1_update_txb_context(const AV1_COMP *cpi, ThreadData *td, |
| 2272 | RUN_TYPE dry_run, BLOCK_SIZE bsize, int *rate, |
Yunqing Wang | 0e141b5 | 2017-11-02 15:08:58 -0700 | [diff] [blame] | 2273 | int mi_row, int mi_col, uint8_t allow_update_cdf) { |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2274 | MACROBLOCK *const x = &td->mb; |
| 2275 | MACROBLOCKD *const xd = &x->e_mbd; |
| 2276 | MB_MODE_INFO *const mbmi = &xd->mi[0]->mbmi; |
Yunqing Wang | 0e141b5 | 2017-11-02 15:08:58 -0700 | [diff] [blame] | 2277 | struct tokenize_b_args arg = { cpi, td, NULL, 0, allow_update_cdf }; |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2278 | (void)rate; |
| 2279 | (void)mi_row; |
| 2280 | (void)mi_col; |
| 2281 | if (mbmi->skip) { |
Timothy B. Terriberry | a2d5cde | 2017-05-10 18:33:50 -0700 | [diff] [blame] | 2282 | av1_reset_skip_context(xd, mi_row, mi_col, bsize); |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2283 | return; |
| 2284 | } |
| 2285 | |
| 2286 | if (!dry_run) { |
Jingning Han | 94652b8 | 2017-04-04 09:45:02 -0700 | [diff] [blame] | 2287 | av1_foreach_transformed_block(xd, bsize, mi_row, mi_col, |
Jingning Han | 4fe5f67 | 2017-05-19 15:46:07 -0700 | [diff] [blame] | 2288 | av1_update_and_record_txb_context, &arg); |
Angie Chiang | c8af611 | 2017-03-16 16:11:22 -0700 | [diff] [blame] | 2289 | } else if (dry_run == DRY_RUN_NORMAL) { |
Jingning Han | 4fe5f67 | 2017-05-19 15:46:07 -0700 | [diff] [blame] | 2290 | av1_foreach_transformed_block(xd, bsize, mi_row, mi_col, |
| 2291 | av1_update_txb_context_b, &arg); |
Angie Chiang | c8af611 | 2017-03-16 16:11:22 -0700 | [diff] [blame] | 2292 | } else { |
| 2293 | printf("DRY_RUN_COSTCOEFFS is not supported yet\n"); |
| 2294 | assert(0); |
Angie Chiang | 0397eda | 2017-03-15 16:57:14 -0700 | [diff] [blame] | 2295 | } |
| 2296 | } |
Angie Chiang | 800df03 | 2017-03-22 11:14:12 -0700 | [diff] [blame] | 2297 | |
#if CONFIG_TXK_SEL
// Transforms and quantizes one block using the transform type currently in
// effect. Unless the speed feature selects FULL_TRELLIS_OPT the block is
// quantized with AV1_XFORM_QUANT_B; otherwise it is quantized with
// AV1_XFORM_QUANT_FP and then refined by av1_optimize_b().
static void txk_xform_quant_and_optimize(const AV1_COMP *cpi, MACROBLOCK *x,
                                         int plane, int block, int blk_row,
                                         int blk_col, BLOCK_SIZE plane_bsize,
                                         TX_SIZE tx_size,
                                         const ENTROPY_CONTEXT *a,
                                         const ENTROPY_CONTEXT *l) {
  const AV1_COMMON *cm = &cpi->common;

  if (cpi->sf.optimize_coefficients != FULL_TRELLIS_OPT) {
    av1_xform_quant(cm, x, plane, block, blk_row, blk_col, plane_bsize,
                    tx_size, AV1_XFORM_QUANT_B);
    return;
  }

  av1_xform_quant(cm, x, plane, block, blk_row, blk_col, plane_bsize, tx_size,
                  AV1_XFORM_QUANT_FP);
  av1_optimize_b(cpi, x, plane, blk_row, blk_col, block, plane_bsize, tx_size,
                 a, l, 1);
}

// Searches the transform types for one transform block and keeps the one
// with the lowest rate-distortion cost.
//
// Parameters:
//   cpi, x                - encoder instance and macroblock being coded.
//   plane, block          - plane index and block index within that plane.
//   blk_row, blk_col      - block position.
//   plane_bsize, tx_size  - plane block size and transform size.
//   a, l                  - above/left entropy contexts used for costing.
//   use_fast_coef_costing - forwarded to av1_cost_coeffs().
//   rd_stats              - receives the statistics of the best candidate via
//                           av1_merge_rd_stats().
//
// Returns the best RD cost found, or INT64_MAX when no candidate was
// evaluated.
//
// Side effects: for plane 0 the chosen type is stored in mbmi->txk_type; the
// block's eob and txb entropy context are set to those of the best candidate;
// for intra blocks the block is re-quantized and inverse transformed.
int64_t av1_search_txk_type(const AV1_COMP *cpi, MACROBLOCK *x, int plane,
                            int block, int blk_row, int blk_col,
                            BLOCK_SIZE plane_bsize, TX_SIZE tx_size,
                            const ENTROPY_CONTEXT *a, const ENTROPY_CONTEXT *l,
                            int use_fast_coef_costing, RD_STATS *rd_stats) {
  const AV1_COMMON *cm = &cpi->common;
  MACROBLOCKD *xd = &x->e_mbd;
  MB_MODE_INFO *mbmi = &xd->mi[0]->mbmi;
  TX_TYPE txk_start = DCT_DCT;
  TX_TYPE txk_end = TX_TYPES - 1;
  TX_TYPE best_tx_type = txk_start;
  int64_t best_rd = INT64_MAX;
  uint8_t best_txb_ctx = 0;
  uint16_t best_eob = 0;
  RD_STATS best_rd_stats;
  TX_TYPE tx_type;

  av1_invalid_rd_stats(&best_rd_stats);

  for (tx_type = txk_start; tx_type <= txk_end; ++tx_type) {
    // Install the candidate so that av1_get_tx_type() reflects it.
    if (plane == 0)
      mbmi->txk_type[(blk_row << MAX_MIB_SIZE_LOG2) + blk_col] = tx_type;
    TX_TYPE ref_tx_type =
        av1_get_tx_type(get_plane_type(plane), xd, blk_row, blk_col, tx_size);
    if (tx_type != ref_tx_type) {
      // use av1_get_tx_type() to check if the tx_type is valid for the current
      // mode if it's not, we skip it here.
      continue;
    }

    const int is_inter = is_inter_block(mbmi);
    const TxSetType tx_set_type = get_ext_tx_set_type(
        tx_size, mbmi->sb_type, is_inter, cm->reduced_tx_set_used);
    if (!av1_ext_tx_used[tx_set_type][tx_type]) continue;

    RD_STATS this_rd_stats;
    av1_invalid_rd_stats(&this_rd_stats);
    txk_xform_quant_and_optimize(cpi, x, plane, block, blk_row, blk_col,
                                 plane_bsize, tx_size, a, l);
    av1_dist_block(cpi, x, plane, plane_bsize, block, blk_row, blk_col, tx_size,
                   &this_rd_stats.dist, &this_rd_stats.sse,
                   OUTPUT_HAS_PREDICTED_PIXELS);
    const SCAN_ORDER *scan_order = get_scan(cm, tx_size, tx_type, mbmi);
    this_rd_stats.rate =
        av1_cost_coeffs(cpi, x, plane, blk_row, blk_col, block, tx_size,
                        scan_order, a, l, use_fast_coef_costing);
    int64_t rd = RDCOST(x->rdmult, this_rd_stats.rate, this_rd_stats.dist);

    if (rd < best_rd) {
      // Remember everything needed to restore this candidate afterwards.
      best_rd = rd;
      best_rd_stats = this_rd_stats;
      best_tx_type = tx_type;
      best_txb_ctx = x->plane[plane].txb_entropy_ctx[block];
      best_eob = x->plane[plane].eobs[block];
    }
  }

  av1_merge_rd_stats(rd_stats, &best_rd_stats);

  // With no coded coefficients the block falls back to DCT_DCT.
  if (best_eob == 0) best_tx_type = DCT_DCT;

  if (plane == 0)
    mbmi->txk_type[(blk_row << MAX_MIB_SIZE_LOG2) + blk_col] = best_tx_type;
  x->plane[plane].txb_entropy_ctx[block] = best_txb_ctx;
  x->plane[plane].eobs[block] = best_eob;

  if (!is_inter_block(mbmi)) {
    // intra mode needs decoded result such that the next transform block
    // can use it for prediction.
    txk_xform_quant_and_optimize(cpi, x, plane, block, blk_row, blk_col,
                                 plane_bsize, tx_size, a, l);

    av1_inverse_transform_block_facade(xd, plane, block, blk_row, blk_col,
                                       x->plane[plane].eobs[block],
                                       cm->reduced_tx_set_used);
  }
  return best_rd;
}
#endif  // CONFIG_TXK_SEL