|  | /* | 
|  | * Copyright (c) 2021, Alliance for Open Media. All rights reserved | 
|  | * | 
|  | * This source code is subject to the terms of the BSD 3-Clause Clear License | 
|  | * and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear | 
|  | * License was not distributed with this source code in the LICENSE file, you | 
|  | * can obtain it at aomedia.org/license/software-license/bsd-3-c-c/.  If the | 
|  | * Alliance for Open Media Patent License 1.0 was not distributed with this | 
|  | * source code in the PATENTS file, you can obtain it at | 
|  | * aomedia.org/license/patent-license/. | 
|  | */ | 
|  |  | 
|  | #include "config/aom_config.h" | 
|  | #include "config/av1_rtcd.h" | 
|  | #include "config/aom_dsp_rtcd.h" | 
|  |  | 
|  | #include "av1/common/idct.h" | 
|  | #include "av1/encoder/hybrid_fwd_txfm.h" | 
|  | #include "av1/common/scan.h" | 
|  |  | 
|  | /* 4-point reversible, orthonormal Walsh-Hadamard in 3.5 adds, 0.5 shifts per | 
|  | pixel. */ | 
|  | void av1_fwht4x4_c(const int16_t *input, tran_low_t *output, int stride) { | 
|  | int i; | 
|  | tran_high_t a1, b1, c1, d1, e1; | 
|  | const int16_t *ip_pass0 = input; | 
|  | const tran_low_t *ip = NULL; | 
|  | tran_low_t *op = output; | 
|  |  | 
|  | for (i = 0; i < 4; i++) { | 
|  | a1 = ip_pass0[0 * stride]; | 
|  | b1 = ip_pass0[1 * stride]; | 
|  | c1 = ip_pass0[2 * stride]; | 
|  | d1 = ip_pass0[3 * stride]; | 
|  |  | 
|  | a1 += b1; | 
|  | d1 = d1 - c1; | 
|  | e1 = (a1 - d1) >> 1; | 
|  | b1 = e1 - b1; | 
|  | c1 = e1 - c1; | 
|  | a1 -= c1; | 
|  | d1 += b1; | 
|  | op[0] = (tran_low_t)a1; | 
|  | op[4] = (tran_low_t)c1; | 
|  | op[8] = (tran_low_t)d1; | 
|  | op[12] = (tran_low_t)b1; | 
|  |  | 
|  | ip_pass0++; | 
|  | op++; | 
|  | } | 
|  | ip = output; | 
|  | op = output; | 
|  |  | 
|  | for (i = 0; i < 4; i++) { | 
|  | a1 = ip[0]; | 
|  | b1 = ip[1]; | 
|  | c1 = ip[2]; | 
|  | d1 = ip[3]; | 
|  |  | 
|  | a1 += b1; | 
|  | d1 -= c1; | 
|  | e1 = (a1 - d1) >> 1; | 
|  | b1 = e1 - b1; | 
|  | c1 = e1 - c1; | 
|  | a1 -= c1; | 
|  | d1 += b1; | 
|  | op[0] = (tran_low_t)(a1 * UNIT_QUANT_FACTOR); | 
|  | op[1] = (tran_low_t)(c1 * UNIT_QUANT_FACTOR); | 
|  | op[2] = (tran_low_t)(d1 * UNIT_QUANT_FACTOR); | 
|  | op[3] = (tran_low_t)(b1 * UNIT_QUANT_FACTOR); | 
|  |  | 
|  | ip += 4; | 
|  | op += 4; | 
|  | } | 
|  | } | 
|  |  | 
|  | void av1_highbd_fwht4x4_c(const int16_t *input, tran_low_t *output, | 
|  | int stride) { | 
|  | av1_fwht4x4_c(input, output, stride); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_4x4(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const TX_TYPE tx_type = txfm_param->tx_type; | 
|  | const int bd = txfm_param->bd; | 
|  | if (txfm_param->lossless) { | 
|  | #if CONFIG_LOSSLESS_DPCM | 
|  | assert(tx_type == DCT_DCT || tx_type == IDTX); | 
|  | if (tx_type == IDTX) { | 
|  | av1_fwd_txfm2d_4x4(src_diff, dst_coeff, diff_stride, tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } else { | 
|  | av1_highbd_fwht4x4(src_diff, coeff, diff_stride); | 
|  | } | 
|  | #else   // CONFIG_LOSSLESS_DPCM | 
|  | assert(tx_type == DCT_DCT); | 
|  | av1_highbd_fwht4x4(src_diff, coeff, diff_stride); | 
|  | #endif  // CONFIG_LOSSLESS_DPCM | 
|  | return; | 
|  | } | 
|  | av1_fwd_txfm2d_4x4(src_diff, dst_coeff, diff_stride, tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_4x8(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | av1_fwd_txfm2d_4x8(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | txfm_param->bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_8x4(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | av1_fwd_txfm2d_8x4(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | txfm_param->bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_8x16(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const TX_TYPE tx_type = txfm_param->tx_type; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_8x16(src_diff, dst_coeff, diff_stride, tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_16x8(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const TX_TYPE tx_type = txfm_param->tx_type; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_16x8(src_diff, dst_coeff, diff_stride, tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_16x32(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | av1_fwd_txfm2d_16x32(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | txfm_param->bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_32x16(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | av1_fwd_txfm2d_32x16(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | txfm_param->bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_16x4(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | av1_fwd_txfm2d_16x4(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | txfm_param->bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_4x16(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | av1_fwd_txfm2d_4x16(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | txfm_param->bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_32x8(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | av1_fwd_txfm2d_32x8(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | txfm_param->bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_8x32(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | av1_fwd_txfm2d_8x32(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | txfm_param->bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_8x8(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const TX_TYPE tx_type = txfm_param->tx_type; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_8x8(src_diff, dst_coeff, diff_stride, tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_16x16(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const TX_TYPE tx_type = txfm_param->tx_type; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_16x16(src_diff, dst_coeff, diff_stride, tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_32x32(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const TX_TYPE tx_type = txfm_param->tx_type; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_32x32(src_diff, dst_coeff, diff_stride, tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_32x64(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | assert(txfm_param->tx_type == DCT_DCT); | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_32x64(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_64x32(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | assert(txfm_param->tx_type == DCT_DCT); | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_64x32(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_16x64(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_16x64(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_64x16(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_64x16(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_64x64(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | assert(txfm_param->tx_type == DCT_DCT); | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_64x64(src_diff, dst_coeff, diff_stride, DCT_DCT, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | #if CONFIG_EXT_RECUR_PARTITIONS | 
|  | static void highbd_fwd_txfm_4x32(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_4x32(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_32x4(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_32x4(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_8x64(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_8x64(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_64x8(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_64x8(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_4x64(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_4x64(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  |  | 
|  | static void highbd_fwd_txfm_64x4(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | int32_t *dst_coeff = (int32_t *)coeff; | 
|  | const int bd = txfm_param->bd; | 
|  | av1_fwd_txfm2d_64x4(src_diff, dst_coeff, diff_stride, txfm_param->tx_type, | 
|  | #if CONFIG_INTER_DDT | 
|  | txfm_param->use_ddt, | 
|  | #endif  // CONFIG_INTER_DDT | 
|  | bd); | 
|  | } | 
|  | #endif  // CONFIG_EXT_RECUR_PARTITIONS | 
|  |  | 
|  | void av1_fwd_txfm(const int16_t *src_diff, tran_low_t *coeff, int diff_stride, | 
|  | TxfmParam *txfm_param) { | 
|  | if (txfm_param->bd == 8) { | 
|  | av1_lowbd_fwd_txfm(src_diff, coeff, diff_stride, txfm_param); | 
|  | } else { | 
|  | av1_highbd_fwd_txfm(src_diff, coeff, diff_stride, txfm_param); | 
|  | } | 
|  | } | 
|  |  | 
|  | void av1_lowbd_fwd_txfm_c(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | av1_highbd_fwd_txfm(src_diff, coeff, diff_stride, txfm_param); | 
|  | } | 
|  |  | 
|  | void av1_highbd_fwd_txfm(const int16_t *src_diff, tran_low_t *coeff, | 
|  | int diff_stride, TxfmParam *txfm_param) { | 
|  | assert(av1_ext_tx_used[txfm_param->tx_set_type][txfm_param->tx_type]); | 
|  | const TX_SIZE tx_size = txfm_param->tx_size; | 
|  | switch (tx_size) { | 
|  | case TX_64X64: | 
|  | highbd_fwd_txfm_64x64(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_32X64: | 
|  | highbd_fwd_txfm_32x64(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_64X32: | 
|  | highbd_fwd_txfm_64x32(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_16X64: | 
|  | highbd_fwd_txfm_16x64(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_64X16: | 
|  | highbd_fwd_txfm_64x16(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_32X32: | 
|  | highbd_fwd_txfm_32x32(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_16X16: | 
|  | highbd_fwd_txfm_16x16(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_8X8: | 
|  | highbd_fwd_txfm_8x8(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_4X8: | 
|  | highbd_fwd_txfm_4x8(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_8X4: | 
|  | highbd_fwd_txfm_8x4(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_8X16: | 
|  | highbd_fwd_txfm_8x16(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_16X8: | 
|  | highbd_fwd_txfm_16x8(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_16X32: | 
|  | highbd_fwd_txfm_16x32(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_32X16: | 
|  | highbd_fwd_txfm_32x16(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_4X4: | 
|  | highbd_fwd_txfm_4x4(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_4X16: | 
|  | highbd_fwd_txfm_4x16(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_16X4: | 
|  | highbd_fwd_txfm_16x4(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_8X32: | 
|  | highbd_fwd_txfm_8x32(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_32X8: | 
|  | highbd_fwd_txfm_32x8(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | #if CONFIG_EXT_RECUR_PARTITIONS | 
|  | case TX_4X32: | 
|  | highbd_fwd_txfm_4x32(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_32X4: | 
|  | highbd_fwd_txfm_32x4(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_8X64: | 
|  | highbd_fwd_txfm_8x64(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_64X8: | 
|  | highbd_fwd_txfm_64x8(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_4X64: | 
|  | highbd_fwd_txfm_4x64(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | case TX_64X4: | 
|  | highbd_fwd_txfm_64x4(src_diff, coeff, diff_stride, txfm_param); | 
|  | break; | 
|  | #endif  // CONFIG_EXT_RECUR_PARTITIONS | 
|  | default: assert(0); break; | 
|  | } | 
|  | } | 
|  |  | 
|  | // Apply forward cross chroma component transform | 
|  | void av1_fwd_cross_chroma_tx_block_c(tran_low_t *coeff_c1, tran_low_t *coeff_c2, | 
|  | TX_SIZE tx_size, CctxType cctx_type) { | 
|  | if (cctx_type == CCTX_NONE) return; | 
|  | const int ncoeffs = av1_get_max_eob(tx_size); | 
|  | int32_t *src_c1 = (int32_t *)coeff_c1; | 
|  | int32_t *src_c2 = (int32_t *)coeff_c2; | 
|  | int64_t tmp[2] = { 0, 0 }; | 
|  |  | 
|  | const int angle_idx = cctx_type - CCTX_START; | 
|  | for (int i = 0; i < ncoeffs; i++) { | 
|  | tmp[0] = (int64_t)cctx_mtx[angle_idx][0] * (int64_t)src_c1[i] + | 
|  | (int64_t)cctx_mtx[angle_idx][1] * (int64_t)src_c2[i]; | 
|  | tmp[1] = (int64_t)-cctx_mtx[angle_idx][1] * (int64_t)src_c1[i] + | 
|  | (int64_t)cctx_mtx[angle_idx][0] * (int64_t)src_c2[i]; | 
|  | src_c1[i] = (int32_t)ROUND_POWER_OF_TWO_SIGNED_64(tmp[0], CCTX_PREC_BITS); | 
|  | src_c2[i] = (int32_t)ROUND_POWER_OF_TWO_SIGNED_64(tmp[1], CCTX_PREC_BITS); | 
|  | } | 
|  | } | 
|  |  | 
|  | void av1_fwd_stxfm(tran_low_t *coeff, TxfmParam *txfm_param) { | 
|  | const TX_TYPE stx_type = txfm_param->sec_tx_type; | 
|  |  | 
|  | const int width = tx_size_wide[txfm_param->tx_size] <= 32 | 
|  | ? tx_size_wide[txfm_param->tx_size] | 
|  | : 32; | 
|  | const int height = tx_size_high[txfm_param->tx_size] <= 32 | 
|  | ? tx_size_high[txfm_param->tx_size] | 
|  | : 32; | 
|  |  | 
|  | if ((width >= 4 && height >= 4) && stx_type) { | 
|  | const PREDICTION_MODE intra_mode = | 
|  | (txfm_param->is_inter ? DC_PRED : txfm_param->intra_mode); | 
|  | PREDICTION_MODE mode = 0, mode_t = 0; | 
|  | const int log2width = tx_size_wide_log2[txfm_param->tx_size]; | 
|  | const int sb_size = (width >= 8 && height >= 8) ? 8 : 4; | 
|  | const int16_t *scan_order_in; | 
|  | // Align scan order of IST with primary transform scan order | 
|  | const SCAN_ORDER *scan_order_out = | 
|  | get_scan(txfm_param->tx_size, txfm_param->tx_type); | 
|  | const int16_t *const scan = scan_order_out->scan; | 
|  | tran_low_t buf0[64] = { 0 }, buf1[64] = { 0 }; | 
|  | tran_low_t *tmp = buf0; | 
|  | tran_low_t *src = coeff; | 
|  | int8_t transpose = 0; | 
|  | mode = AOMMIN(intra_mode, SMOOTH_H_PRED); | 
|  | if ((mode == H_PRED) || (mode == D157_PRED) || (mode == D67_PRED) || | 
|  | (mode == SMOOTH_H_PRED)) | 
|  | transpose = 1; | 
|  | #if CONFIG_IST_SET_FLAG | 
|  | mode_t = txfm_param->sec_tx_set; | 
|  | #if !CONFIG_IST_INTER_MULTISET | 
|  | assert(mode_t < IST_SET_SIZE); | 
|  | #endif | 
|  | // If in debug mode, verify whether txfm_param->sec_tx_set == intra pred dir | 
|  | // based tx set id | 
|  | #if !CONFIG_IST_ANY_SET && !defined(NDEBUG) | 
|  | { | 
|  | int mode_t2 = (txfm_param->tx_type == ADST_ADST) | 
|  | ? stx_transpose_mapping[mode] + IST_DIR_SIZE | 
|  | : stx_transpose_mapping[mode]; | 
|  | assert(mode_t == mode_t2); | 
|  | } | 
|  | #endif  // !CONFIG_IST_ANY_SET && !defined(NDEBUG) | 
|  | #else   // CONFIG_IST_SET_FLAG | 
|  | mode_t = (txfm_param->tx_type == ADST_ADST) | 
|  | ? stx_transpose_mapping[mode] + 7 | 
|  | : stx_transpose_mapping[mode]; | 
|  | #endif  // CONFIG_IST_SET_FLAG | 
|  | if (transpose) { | 
|  | scan_order_in = (sb_size == 4) | 
|  | ? stx_scan_orders_transpose_4x4[log2width - 2] | 
|  | : stx_scan_orders_transpose_8x8[log2width - 2]; | 
|  | } else { | 
|  | scan_order_in = (sb_size == 4) ? stx_scan_orders_4x4[log2width - 2] | 
|  | : stx_scan_orders_8x8[log2width - 2]; | 
|  | } | 
|  | for (int r = 0; r < sb_size * sb_size; r++) { | 
|  | *tmp = src[scan_order_in[r]]; | 
|  | tmp++; | 
|  | } | 
|  | #if CONFIG_IST_INTER_MULTISET | 
|  | mode_t = (txfm_param->is_inter ? (mode_t == 0 ? 0 : IST_SET_SIZE) : mode_t); | 
|  | #endif | 
|  | #if CONFIG_IST_REDUCE_METHOD4 | 
|  | const int st_size_class = (width == 8 && height == 8) ? 1 : (width >= 8 && height >= 8) ? 2 : 0; | 
|  | fwd_stxfm(buf0, buf1, mode_t, stx_type - 1, st_size_class); | 
|  | #else | 
|  | fwd_stxfm(buf0, buf1, mode_t, stx_type - 1, sb_size); | 
|  | #endif | 
|  | memset(coeff, 0, width * height * sizeof(tran_low_t)); | 
|  | tmp = buf1; | 
|  | for (int i = 0; i < sb_size * sb_size; i++) { | 
|  | // Align scan order of IST with primary transform scan order | 
|  | coeff[scan[i]] = *tmp++; | 
|  | } | 
|  | } | 
|  | } |