| /* |
| * Copyright (c) 2017, Alliance for Open Media. All rights reserved |
| * |
| * This source code is subject to the terms of the BSD 2 Clause License and |
| * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
| * was not distributed with this source code in the LICENSE file, you can |
| * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
| * Media Patent License 1.0 was not distributed with this source code in the |
| * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
| */ |
| |
| #include "av1/decoder/decodetxb.h" |
| |
| #include "aom_ports/mem.h" |
| #include "av1/common/idct.h" |
| #include "av1/common/scan.h" |
| #include "av1/common/txb_common.h" |
| #include "av1/decoder/decodemv.h" |
| |
| #define ACCT_STR __func__ |
| |
| static int read_golomb(MACROBLOCKD *xd, aom_reader *r) { |
| int x = 1; |
| int length = 0; |
| int i = 0; |
| |
| while (!i) { |
| i = aom_read_bit(r, ACCT_STR); |
| ++length; |
| if (length > 20) { |
| aom_internal_error(xd->error_info, AOM_CODEC_CORRUPT_FRAME, |
| "Invalid length in read_golomb"); |
| break; |
| } |
| } |
| |
| for (i = 0; i < length - 1; ++i) { |
| x <<= 1; |
| x += aom_read_bit(r, ACCT_STR); |
| } |
| |
| return x - 1; |
| } |
| |
| static INLINE int rec_eob_pos(const int eob_token, const int extra) { |
| int eob = k_eob_group_start[eob_token]; |
| if (eob > 2) { |
| eob += extra; |
| } |
| return eob; |
| } |
| |
| static INLINE int get_dqv(const int16_t *dequant, int coeff_idx, |
| const qm_val_t *iqmatrix) { |
| int dqv = dequant[!!coeff_idx]; |
| if (iqmatrix != NULL) |
| dqv = |
| ((iqmatrix[coeff_idx] * dqv) + (1 << (AOM_QM_BITS - 1))) >> AOM_QM_BITS; |
| return dqv; |
| } |
| |
| static INLINE void read_coeffs_reverse_2d(aom_reader *r, TX_SIZE tx_size, |
| int start_si, int end_si, |
| const int16_t *scan, int bwl, |
| uint8_t *levels, |
| base_cdf_arr base_cdf, |
| br_cdf_arr br_cdf) { |
| for (int c = end_si; c >= start_si; --c) { |
| const int pos = scan[c]; |
| const int coeff_ctx = get_lower_levels_ctx_2d(levels, pos, bwl, tx_size); |
| const int nsymbs = 4; |
| int level = aom_read_symbol(r, base_cdf[coeff_ctx], nsymbs, ACCT_STR); |
| if (level > NUM_BASE_LEVELS) { |
| const int br_ctx = get_br_ctx_2d(levels, pos, bwl); |
| aom_cdf_prob *cdf = br_cdf[br_ctx]; |
| for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
| const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
| level += k; |
| if (k < BR_CDF_SIZE - 1) break; |
| } |
| } |
| levels[get_padded_idx(pos, bwl)] = level; |
| } |
| } |
| |
| static INLINE void read_coeffs_reverse(aom_reader *r, TX_SIZE tx_size, |
| TX_CLASS tx_class, int start_si, |
| int end_si, const int16_t *scan, int bwl, |
| uint8_t *levels, base_cdf_arr base_cdf, |
| br_cdf_arr br_cdf) { |
| for (int c = end_si; c >= start_si; --c) { |
| const int pos = scan[c]; |
| const int coeff_ctx = |
| get_lower_levels_ctx(levels, pos, bwl, tx_size, tx_class); |
| const int nsymbs = 4; |
| int level = aom_read_symbol(r, base_cdf[coeff_ctx], nsymbs, ACCT_STR); |
| if (level > NUM_BASE_LEVELS) { |
| const int br_ctx = get_br_ctx(levels, pos, bwl, tx_class); |
| aom_cdf_prob *cdf = br_cdf[br_ctx]; |
| for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
| const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
| level += k; |
| if (k < BR_CDF_SIZE - 1) break; |
| } |
| } |
| levels[get_padded_idx(pos, bwl)] = level; |
| } |
| } |
| |
| |
| #define USE_GPU_BLOCKS 1 |
| |
| uint8_t av1_read_coeffs_txb(const AV1_COMMON *const cm, MACROBLOCKD *const xd, |
| aom_reader *const r, const int blk_row, |
| const int blk_col, const int plane, |
| const TXB_CTX *const txb_ctx, |
| const TX_SIZE tx_size) { |
| FRAME_CONTEXT *const ec_ctx = xd->tile_ctx; |
| const int32_t max_value = (1 << (7 + xd->bd)) - 1; |
| const int32_t min_value = -(1 << (7 + xd->bd)); |
| const TX_SIZE txs_ctx = get_txsize_entropy_ctx(tx_size); |
| const PLANE_TYPE plane_type = get_plane_type(plane); |
| MB_MODE_INFO *const mbmi = xd->mi[0]; |
| struct macroblockd_plane *const pd = &xd->plane[plane]; |
| const int16_t *const dequant = pd->seg_dequant_QTX[mbmi->segment_id]; |
| av1_tile_data * tile_data = xd->tile_data; |
| tran_low_t *const tcoeffs_raw = tile_data->dq_buffer_base + tile_data->dq_buffer_ptr; |
| const int shift = av1_get_tx_scale(tx_size); |
| const int bwl = get_txb_bwl(tx_size); |
| const int width = get_txb_wide(tx_size); |
| const int height = get_txb_high(tx_size); |
| int cul_level = 0; |
| int dc_val = 0; |
| uint8_t levels_buf[TX_PAD_2D]; |
| uint8_t *const levels = set_levels(levels_buf, width); |
| const int all_zero = aom_read_symbol( |
| r, ec_ctx->txb_skip_cdf[txs_ctx][txb_ctx->txb_skip_ctx], 2, ACCT_STR); |
| eob_info *eob_data = pd->eob_data + xd->txb_offset[plane]; |
| uint16_t *const eob = &(eob_data->eob); |
| uint16_t *const max_scan_line = &(eob_data->max_scan_line); |
| *max_scan_line = 0; |
| *eob = 0; |
| |
| #if CONFIG_INSPECTION |
| if (plane == 0) { |
| const int txk_type_idx = |
| av1_get_txk_type_index(mbmi->sb_type, blk_row, blk_col); |
| mbmi->tx_skip[txk_type_idx] = all_zero; |
| } |
| #endif |
| |
| if (all_zero) { |
| *max_scan_line = 0; |
| if (plane == 0) { |
| const int txk_type_idx = |
| av1_get_txk_type_index(mbmi->sb_type, blk_row, blk_col); |
| xd->txk_type[txk_type_idx] = DCT_DCT; |
| } |
| return 0; |
| } |
| |
| if (plane == AOM_PLANE_Y) { |
| // only y plane's tx_type is transmitted |
| av1_read_tx_type(cm, xd, blk_row, blk_col, tx_size, r); |
| } |
| const TX_TYPE tx_type = av1_get_tx_type(plane_type, xd, blk_row, blk_col, |
| tx_size, cm->reduced_tx_set_used); |
| const TX_CLASS tx_class = tx_type_to_class[tx_type]; |
| const TX_SIZE qm_tx_size = av1_get_adjusted_tx_size(tx_size); |
| const qm_val_t *iqmatrix = |
| IS_2D_TRANSFORM(tx_type) |
| ? pd->seg_iqmatrix[mbmi->segment_id][qm_tx_size] |
| : cm->giqmatrix[NUM_QM_LEVELS - 1][0][qm_tx_size]; |
| const SCAN_ORDER *const scan_order = get_scan(tx_size, tx_type); |
| const int16_t *const scan = scan_order->scan; |
| int eob_extra = 0; |
| int eob_pt = 1; |
| |
| const int eob_multi_size = txsize_log2_minus4[tx_size]; |
| const int eob_multi_ctx = (tx_class == TX_CLASS_2D) ? 0 : 1; |
| switch (eob_multi_size) { |
| case 0: |
| eob_pt = |
| aom_read_symbol(r, ec_ctx->eob_flag_cdf16[plane_type][eob_multi_ctx], |
| 5, ACCT_STR) + |
| 1; |
| break; |
| case 1: |
| eob_pt = |
| aom_read_symbol(r, ec_ctx->eob_flag_cdf32[plane_type][eob_multi_ctx], |
| 6, ACCT_STR) + |
| 1; |
| break; |
| case 2: |
| eob_pt = |
| aom_read_symbol(r, ec_ctx->eob_flag_cdf64[plane_type][eob_multi_ctx], |
| 7, ACCT_STR) + |
| 1; |
| break; |
| case 3: |
| eob_pt = |
| aom_read_symbol(r, ec_ctx->eob_flag_cdf128[plane_type][eob_multi_ctx], |
| 8, ACCT_STR) + |
| 1; |
| break; |
| case 4: |
| eob_pt = |
| aom_read_symbol(r, ec_ctx->eob_flag_cdf256[plane_type][eob_multi_ctx], |
| 9, ACCT_STR) + |
| 1; |
| break; |
| case 5: |
| eob_pt = |
| aom_read_symbol(r, ec_ctx->eob_flag_cdf512[plane_type][eob_multi_ctx], |
| 10, ACCT_STR) + |
| 1; |
| break; |
| case 6: |
| default: |
| eob_pt = aom_read_symbol( |
| r, ec_ctx->eob_flag_cdf1024[plane_type][eob_multi_ctx], 11, |
| ACCT_STR) + |
| 1; |
| break; |
| } |
| |
| const int eob_offset_bits = k_eob_offset_bits[eob_pt]; |
| if (eob_offset_bits > 0) { |
| const int eob_ctx = eob_pt - 3; |
| int bit = aom_read_symbol( |
| r, ec_ctx->eob_extra_cdf[txs_ctx][plane_type][eob_ctx], 2, ACCT_STR); |
| if (bit) { |
| eob_extra += (1 << (eob_offset_bits - 1)); |
| } |
| |
| for (int i = 1; i < eob_offset_bits; i++) { |
| bit = aom_read_bit(r, ACCT_STR); |
| if (bit) { |
| eob_extra += (1 << (eob_offset_bits - 1 - i)); |
| } |
| } |
| } |
| *eob = rec_eob_pos(eob_pt, eob_extra); |
| |
| if (*eob > 1) { |
| memset(levels_buf, 0, |
| sizeof(*levels_buf) * |
| ((width + TX_PAD_HOR) * (height + TX_PAD_VER) + TX_PAD_END)); |
| } |
| |
| { |
| // Read the non-zero coefficient with scan index eob-1 |
| // TODO(angiebird): Put this into a function |
| const int c = *eob - 1; |
| const int pos = scan[c]; |
| const int coeff_ctx = get_lower_levels_ctx_eob(bwl, height, c); |
| const int nsymbs = 3; |
| aom_cdf_prob *cdf = |
| ec_ctx->coeff_base_eob_cdf[txs_ctx][plane_type][coeff_ctx]; |
| int level = aom_read_symbol(r, cdf, nsymbs, ACCT_STR) + 1; |
| if (level > NUM_BASE_LEVELS) { |
| const int br_ctx = get_br_ctx_eob(pos, bwl, tx_class); |
| cdf = ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][plane_type][br_ctx]; |
| for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
| const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
| level += k; |
| if (k < BR_CDF_SIZE - 1) break; |
| } |
| } |
| levels[get_padded_idx(pos, bwl)] = level; |
| } |
| if (*eob > 1) { |
| base_cdf_arr base_cdf = ec_ctx->coeff_base_cdf[txs_ctx][plane_type]; |
| br_cdf_arr br_cdf = |
| ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][plane_type]; |
| if (tx_class == TX_CLASS_2D) { |
| read_coeffs_reverse_2d(r, tx_size, 1, *eob - 1 - 1, scan, bwl, levels, |
| base_cdf, br_cdf); |
| read_coeffs_reverse(r, tx_size, tx_class, 0, 0, scan, bwl, levels, |
| base_cdf, br_cdf); |
| } else { |
| read_coeffs_reverse(r, tx_size, tx_class, 0, *eob - 1 - 1, scan, bwl, |
| levels, base_cdf, br_cdf); |
| } |
| } |
| |
| for (int c = 0; c < *eob; ++c) { |
| const int pos = scan[c]; |
| uint8_t sign; |
| tran_low_t level = levels[get_padded_idx(pos, bwl)]; |
| if (level) { |
| *max_scan_line = AOMMAX(*max_scan_line, pos); |
| if (c == 0) { |
| const int dc_sign_ctx = txb_ctx->dc_sign_ctx; |
| sign = aom_read_symbol(r, ec_ctx->dc_sign_cdf[plane_type][dc_sign_ctx], |
| 2, ACCT_STR); |
| } else { |
| sign = aom_read_bit(r, ACCT_STR); |
| } |
| if (level >= MAX_BASE_BR_RANGE) { |
| level += read_golomb(xd, r); |
| } |
| |
| if (c == 0) dc_val = sign ? -level : level; |
| |
| // Bitmasking to clamp level to valid range: |
| // The valid range for 8/10/12 bit vdieo is at most 14/16/18 bit |
| level &= 0xfffff; |
| cul_level += level; |
| tran_low_t dq_coeff; |
| // Bitmasking to clamp dq_coeff to valid range: |
| // The valid range for 8/10/12 bit video is at most 17/19/21 bit |
| dq_coeff = (tran_low_t)( |
| (int64_t)level * get_dqv(dequant, scan[c], iqmatrix) & 0xffffff); |
| dq_coeff = dq_coeff >> shift; |
| if (sign) { |
| dq_coeff = -dq_coeff; |
| } |
| tcoeffs_raw[c] = clamp(dq_coeff, min_value, max_value); |
| } |
| else |
| tcoeffs_raw[c] = 0; |
| |
| } |
| |
| cul_level = AOMMIN(COEFF_CONTEXT_MASK, cul_level); |
| |
| // DC value |
| set_dc_sign(&cul_level, dc_val); |
| { |
| const int tx_types_flags[] = { |
| 0, // DCT_DCT, |
| 0x080000, // ADST_DCT, |
| 0x020000, // DCT_ADST, |
| 0x0A0000, // ADST_ADST, |
| 0x090000, // FLIPADST_DCT, |
| 0x028000, // DCT_FLIPADST, |
| 0x0B8000, // FLIPADST_FLIPADST, |
| 0x0A8000, // ADST_FLIPADST, |
| 0x0B0000, // FLIPADST_ADST, |
| 0x140000, // IDTX, |
| 0x040000, // V_DCT, |
| 0x100000, // H_DCT, |
| 0x0C0000, // V_ADST, |
| 0x120000, // H_ADST, |
| 0x0D0000, // V_FLIPADST, |
| 0x128000 // H_FLIPADST, |
| }; |
| |
| int mi_col = mbmi->mi_col; |
| int mi_row = mbmi->mi_row; |
| if (pd->subsampling_y && (mi_row & 0x01) && (mi_size_high[mbmi->sb_type] == 1)) |
| mi_row -= 1; |
| if (pd->subsampling_x && (mi_col & 0x01) && (mi_size_wide[mbmi->sb_type] == 1)) |
| mi_col -= 1; |
| const uint32_t x = ((mi_col * MI_SIZE) >> (pd->subsampling_x + 2)) + blk_col; |
| const uint32_t y = ((mi_row * MI_SIZE) >> (pd->subsampling_y + 2)) + blk_row; |
| tx_block_info_gpu * block = tile_data->idct_blocks_host + tile_data->idct_blocks_ptr; |
| const uint32_t coef_count = ((*eob) + 3) >> 2; |
| const int av1_idct_scans_lut[TX_TYPES] = { |
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 2, 1, 2, 1, 2 |
| }; |
| |
| for (uint32_t c = *eob; c < (coef_count << 2); ++c) |
| tcoeffs_raw[c] = 0; |
| const int type_index = (xd->lossless[xd->mi[0]->segment_id] && tx_size == 0)? TX_SIZES_ALL : tx_size; |
| block->flags = coef_count | tx_types_flags[tx_type] | (plane << 21) | (av1_idct_scans_lut[tx_type] << 11); |
| block->input_offset = tile_data->dq_buffer_ptr; |
| block->output_pos = x | (y << 16); |
| block->sorting_idx = (tile_data->idct_blocks_sizes[type_index] << 8) + type_index; |
| ++tile_data->idct_blocks_sizes[type_index]; |
| ++tile_data->idct_blocks_ptr; |
| tile_data->dq_buffer_ptr += coef_count << 2; |
| } |
| return cul_level; |
| } |
| |
| void av1_read_coeffs_txb_facade(const AV1_COMMON *const cm, |
| MACROBLOCKD *const xd, aom_reader *const r, |
| const int plane, const int row, const int col, |
| const TX_SIZE tx_size) { |
| #if TXCOEFF_TIMER |
| struct aom_usec_timer timer; |
| aom_usec_timer_start(&timer); |
| #endif |
| MB_MODE_INFO *const mbmi = xd->mi[0]; |
| struct macroblockd_plane *const pd = &xd->plane[plane]; |
| |
| const BLOCK_SIZE bsize = mbmi->sb_type; |
| const BLOCK_SIZE plane_bsize = |
| get_plane_block_size(bsize, pd->subsampling_x, pd->subsampling_y); |
| |
| TXB_CTX txb_ctx; |
| get_txb_ctx(plane_bsize, tx_size, plane, pd->above_context + col, |
| pd->left_context + row, &txb_ctx); |
| const uint8_t cul_level = |
| av1_read_coeffs_txb(cm, xd, r, row, col, plane, &txb_ctx, tx_size); |
| |
| av1_set_contexts(xd, pd, plane, plane_bsize, tx_size, cul_level, col, row); |
| |
| if (is_inter_block(mbmi)) { |
| PLANE_TYPE plane_type = get_plane_type(plane); |
| // tx_type will be read out in av1_read_coeffs_txb_facade |
| const TX_TYPE tx_type = av1_get_tx_type(plane_type, xd, row, col, tx_size, |
| cm->reduced_tx_set_used); |
| |
| if (plane == 0) |
| update_txk_array(xd->txk_type, mbmi->sb_type, row, col, tx_size, |
| tx_type); |
| } |
| |
| #if TXCOEFF_TIMER |
| aom_usec_timer_mark(&timer); |
| const int64_t elapsed_time = aom_usec_timer_elapsed(&timer); |
| cm->txcoeff_timer += elapsed_time; |
| ++cm->txb_count; |
| #endif |
| } |