Align a few buffers to 32 byte boundaries This better supports AVX2 operations. BUG=aomedia:1533 Change-Id: Ife789ac9193b13b3af7f979b33523b1e1db16f51
diff --git a/av1/common/idct.c b/av1/common/idct.c index be1ef7e..6bab6ef 100644 --- a/av1/common/idct.c +++ b/av1/common/idct.c
@@ -1683,7 +1683,7 @@ void av1_inv_txfm_add_c(const tran_low_t *dqcoeff, uint8_t *dst, int stride, const TxfmParam *txfm_param) { const TX_SIZE tx_size = txfm_param->tx_size; - DECLARE_ALIGNED(16, uint16_t, tmp[MAX_TX_SQUARE]); + DECLARE_ALIGNED(32, uint16_t, tmp[MAX_TX_SQUARE]); int tmp_stride = MAX_TX_SIZE; int w = tx_size_wide[tx_size]; int h = tx_size_high[tx_size];
diff --git a/av1/decoder/decoder.h b/av1/decoder/decoder.h index 5de74ce..e17e58d 100644 --- a/av1/decoder/decoder.h +++ b/av1/decoder/decoder.h
@@ -36,9 +36,9 @@ typedef struct TileData { AV1_COMMON *cm; aom_reader bit_reader; - DECLARE_ALIGNED(16, MACROBLOCKD, xd); + DECLARE_ALIGNED(32, MACROBLOCKD, xd); /* dqcoeff are shared by all the planes. So planes must be decoded serially */ - DECLARE_ALIGNED(16, tran_low_t, dqcoeff[MAX_TX_SQUARE]); + DECLARE_ALIGNED(32, tran_low_t, dqcoeff[MAX_TX_SQUARE]); DECLARE_ALIGNED(16, FRAME_CONTEXT, tctx); DECLARE_ALIGNED(16, uint8_t, color_index_map[2][MAX_PALETTE_SQUARE]); } TileData; @@ -52,9 +52,9 @@ } TileBufferDec; typedef struct AV1Decoder { - DECLARE_ALIGNED(16, MACROBLOCKD, mb); + DECLARE_ALIGNED(32, MACROBLOCKD, mb); - DECLARE_ALIGNED(16, AV1_COMMON, common); + DECLARE_ALIGNED(32, AV1_COMMON, common); int ready_for_new_data;