av1/encoder/block.h - aom - Git at Google

 /*
  * Copyright (c) 2016, Alliance for Open Media. All rights reserved
  *
  * This source code is subject to the terms of the BSD 2 Clause License and
  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
  * was not distributed with this source code in the LICENSE file, you can
  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
  * Media Patent License 1.0 was not distributed with this source code in the
  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
  */

 #ifndef AV1_ENCODER_BLOCK_H_
 #define AV1_ENCODER_BLOCK_H_

 #include "av1/common/entropymv.h"
 #include "av1/common/entropy.h"
 #if CONFIG_PVQ
 #include "av1/encoder/encint.h"
 #endif
 #if CONFIG_REF_MV
 #include "av1/common/mvref_common.h"
 #endif

 #ifdef __cplusplus
 extern "C" {
 #endif

 #if CONFIG_PVQ
 // Maximum possible # of tx blocks in luma plane, which is currently 256,
 // since there can be 16x16 of 4x4 tx.
 #define MAX_PVQ_BLOCKS_IN_SB (MAX_SB_SQUARE >> 2 * OD_LOG_BSIZE0)
 #endif

 typedef struct {
   unsigned int sse;
   int sum;
   unsigned int var;
 } DIFF;

 typedef struct macroblock_plane {
   DECLARE_ALIGNED(16, int16_t, src_diff[MAX_SB_SQUARE]);
 #if CONFIG_PVQ
   DECLARE_ALIGNED(16, int16_t, src_int16[MAX_SB_SQUARE]);
 #endif
   tran_low_t *qcoeff;
   tran_low_t *coeff;
   uint16_t *eobs;
   struct buf_2d src;

   // Quantizer setings
   const int16_t *quant_fp;
   const int16_t *round_fp;
   const int16_t *quant;
   const int16_t *quant_shift;
   const int16_t *zbin;
   const int16_t *round;
 #if CONFIG_NEW_QUANT
   const cuml_bins_type_nuq *cuml_bins_nuq[QUANT_PROFILES];
 #endif  // CONFIG_NEW_QUANT
 } MACROBLOCK_PLANE;

 /* The [2] dimension is for whether we skip the EOB node (i.e. if previous
  * coefficient in this block was zero) or not. */
 typedef unsigned int av1_coeff_cost[PLANE_TYPES][REF_TYPES][COEF_BANDS][2]
                                    [COEFF_CONTEXTS][ENTROPY_TOKENS];

 typedef struct {
   int_mv ref_mvs[MODE_CTX_REF_FRAMES][MAX_MV_REF_CANDIDATES];
   int16_t mode_context[MODE_CTX_REF_FRAMES];
 #if CONFIG_REF_MV
   uint8_t ref_mv_count[MODE_CTX_REF_FRAMES];
   CANDIDATE_MV ref_mv_stack[MODE_CTX_REF_FRAMES][MAX_REF_MV_STACK_SIZE];
 #if CONFIG_EXT_INTER
   int16_t compound_mode_context[MODE_CTX_REF_FRAMES];
 #endif  // CONFIG_EXT_INTER
 #endif
 } MB_MODE_INFO_EXT;

 #if CONFIG_PALETTE
 typedef struct {
   uint8_t best_palette_color_map[MAX_SB_SQUARE];
   float kmeans_data_buf[2 * MAX_SB_SQUARE];
 } PALETTE_BUFFER;
 #endif  // CONFIG_PALETTE

 typedef struct macroblock MACROBLOCK;
 struct macroblock {
   struct macroblock_plane plane[MAX_MB_PLANE];

   MACROBLOCKD e_mbd;
   MB_MODE_INFO_EXT *mbmi_ext;
   int skip_block;
   int qindex;

   // The equivalent error at the current rdmult of one whole bit (not one
   // bitcost unit).
   int errorperbit;
   // The equivalend SAD error of one (whole) bit at the current quantizer
   // for large blocks.
   int sadperbit16;
   // The equivalend SAD error of one (whole) bit at the current quantizer
   // for sub-8x8 blocks.
   int sadperbit4;
   int rddiv;
   int rdmult;
   int mb_energy;
   int *m_search_count_ptr;
   int *ex_search_count_ptr;

 #if CONFIG_VAR_TX
   unsigned int txb_split_count;
 #endif

   // These are set to their default values at the beginning, and then adjusted
   // further in the encoding process.
   BLOCK_SIZE min_partition_size;
   BLOCK_SIZE max_partition_size;

   int mv_best_ref_index[TOTAL_REFS_PER_FRAME];
   unsigned int max_mv_context[TOTAL_REFS_PER_FRAME];
   unsigned int source_variance;
   unsigned int recon_variance;
   unsigned int pred_sse[TOTAL_REFS_PER_FRAME];
   int pred_mv_sad[TOTAL_REFS_PER_FRAME];

 #if CONFIG_REF_MV
   int *nmvjointcost;
   int nmv_vec_cost[NMV_CONTEXTS][MV_JOINTS];
   int *nmvcost[NMV_CONTEXTS][2];
   int *nmvcost_hp[NMV_CONTEXTS][2];
   int **mv_cost_stack[NMV_CONTEXTS];
   int *nmvjointsadcost;
 #else
   int nmvjointcost[MV_JOINTS];
   int *nmvcost[2];
   int *nmvcost_hp[2];
   int nmvjointsadcost[MV_JOINTS];
 #endif

   int **mvcost;
   int *nmvsadcost[2];
   int *nmvsadcost_hp[2];
   int **mvsadcost;
 #if CONFIG_MOTION_VAR
   int32_t *wsrc_buf;
   int32_t *mask_buf;
 #endif  // CONFIG_MOTION_VAR

 #if CONFIG_PALETTE
   PALETTE_BUFFER *palette_buffer;
 #endif  // CONFIG_PALETTE

   // These define limits to motion vector components to prevent them
   // from extending outside the UMV borders
   int mv_col_min;
   int mv_col_max;
   int mv_row_min;
   int mv_row_max;

 #if CONFIG_VAR_TX
   uint8_t blk_skip[MAX_MB_PLANE][MAX_MIB_SIZE * MAX_MIB_SIZE * 8];
 #if CONFIG_REF_MV
   uint8_t blk_skip_drl[MAX_MB_PLANE][MAX_MIB_SIZE * MAX_MIB_SIZE * 8];
 #endif
 #endif

   int skip;

   // note that token_costs is the cost when eob node is skipped
   av1_coeff_cost token_costs[TX_SIZES];

   int optimize;

   // Used to store sub partition's choices.
   MV pred_mv[TOTAL_REFS_PER_FRAME];

   // Store the best motion vector during motion search
   int_mv best_mv;
   // Store the second best motion vector during full-pixel motion search
   int_mv second_best_mv;

   // use default transform and skip transform type search for intra modes
   int use_default_intra_tx_type;
   // use default transform and skip transform type search for inter modes
   int use_default_inter_tx_type;
 #if CONFIG_PVQ
   int rate;
   // 1 if neither AC nor DC is coded. Only used during RDO.
   int pvq_skip[MAX_MB_PLANE];
   PVQ_QUEUE *pvq_q;

   // Storage for PVQ tx block encodings in a superblock.
   // There can be max 16x16 of 4x4 blocks (and YUV) encode by PVQ
   // 256 is the max # of 4x4 blocks in a SB (64x64), which comes from:
   // 1) Since PVQ is applied to each trasnform-ed block
   // 2) 4x4 is the smallest tx size in AV1
   // 3) AV1 allows using smaller tx size than block (i.e. partition) size
   // TODO(yushin) : The memory usage could be improved a lot, since this has
   // storage for 10 bands and 128 coefficients for every 4x4 block,
   PVQ_INFO pvq[MAX_PVQ_BLOCKS_IN_SB][MAX_MB_PLANE];
   daala_enc_ctx daala_enc;
   int pvq_speed;
   int pvq_coded;  // Indicates whether pvq_info needs be stored to tokenize
 #endif
 #if CONFIG_DAALA_DIST
   // Keep rate of each 4x4 block in the current macroblock during RDO
   // This is needed when using the 8x8 Daala distortion metric during RDO,
   // because it evaluates distortion in a different order than the underlying
   // 4x4 blocks are coded.
   int rate_4x4[256];
 #endif
 };

 // Converts block_index for given transform size to index of the block in raster
 // order.
 static inline int av1_block_index_to_raster_order(TX_SIZE tx_size,
                                                   int block_idx) {
   // For transform size 4x8, the possible block_idx values are 0 & 2, because
   // block_idx values are incremented in steps of size 'tx_width_unit x
   // tx_height_unit'. But, for this transform size, block_idx = 2 corresponds to
   // block number 1 in raster order, inside an 8x8 MI block.
   // For any other transform size, the two indices are equivalent.
   return (tx_size == TX_4X8 && block_idx == 2) ? 1 : block_idx;
 }

 // Inverse of above function.
 // Note: only implemented for transform sizes 4x4, 4x8 and 8x4 right now.
 static inline int av1_raster_order_to_block_index(TX_SIZE tx_size,
                                                   int raster_order) {
   assert(tx_size == TX_4X4 || tx_size == TX_4X8 || tx_size == TX_8X4);
   // We ensure that block indices are 0 & 2 if tx size is 4x8 or 8x4.
   return (tx_size == TX_4X4) ? raster_order : (raster_order > 0) ? 2 : 0;
 }

 #ifdef __cplusplus
 }  // extern "C"
 #endif

 #endif  // AV1_ENCODER_BLOCK_H_
	/*
	* Copyright (c) 2016, Alliance for Open Media. All rights reserved
	*
	* This source code is subject to the terms of the BSD 2 Clause License and
	* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
	* was not distributed with this source code in the LICENSE file, you can
	* obtain it at www.aomedia.org/license/software. If the Alliance for Open
	* Media Patent License 1.0 was not distributed with this source code in the
	* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
	*/

	#ifndef AV1_ENCODER_BLOCK_H_
	#define AV1_ENCODER_BLOCK_H_

	#include "av1/common/entropymv.h"
	#include "av1/common/entropy.h"
	#if CONFIG_PVQ
	#include "av1/encoder/encint.h"
	#endif
	#if CONFIG_REF_MV
	#include "av1/common/mvref_common.h"
	#endif

	#ifdef __cplusplus
	extern "C" {
	#endif

	#if CONFIG_PVQ
	// Maximum possible # of tx blocks in luma plane, which is currently 256,
	// since there can be 16x16 of 4x4 tx.
	#define MAX_PVQ_BLOCKS_IN_SB (MAX_SB_SQUARE >> 2 * OD_LOG_BSIZE0)
	#endif

	typedef struct {
	unsigned int sse;
	int sum;
	unsigned int var;
	} DIFF;

	typedef struct macroblock_plane {
	DECLARE_ALIGNED(16, int16_t, src_diff[MAX_SB_SQUARE]);
	#if CONFIG_PVQ
	DECLARE_ALIGNED(16, int16_t, src_int16[MAX_SB_SQUARE]);
	#endif
	tran_low_t *qcoeff;
	tran_low_t *coeff;
	uint16_t *eobs;
	struct buf_2d src;

	// Quantizer setings
	const int16_t *quant_fp;
	const int16_t *round_fp;
	const int16_t *quant;
	const int16_t *quant_shift;
	const int16_t *zbin;
	const int16_t *round;
	#if CONFIG_NEW_QUANT
	const cuml_bins_type_nuq *cuml_bins_nuq[QUANT_PROFILES];
	#endif // CONFIG_NEW_QUANT
	} MACROBLOCK_PLANE;

	/* The [2] dimension is for whether we skip the EOB node (i.e. if previous
	* coefficient in this block was zero) or not. */
	typedef unsigned int av1_coeff_cost[PLANE_TYPES][REF_TYPES][COEF_BANDS][2]
	[COEFF_CONTEXTS][ENTROPY_TOKENS];

	typedef struct {
	int_mv ref_mvs[MODE_CTX_REF_FRAMES][MAX_MV_REF_CANDIDATES];
	int16_t mode_context[MODE_CTX_REF_FRAMES];
	#if CONFIG_REF_MV
	uint8_t ref_mv_count[MODE_CTX_REF_FRAMES];
	CANDIDATE_MV ref_mv_stack[MODE_CTX_REF_FRAMES][MAX_REF_MV_STACK_SIZE];
	#if CONFIG_EXT_INTER
	int16_t compound_mode_context[MODE_CTX_REF_FRAMES];
	#endif // CONFIG_EXT_INTER
	#endif
	} MB_MODE_INFO_EXT;

	#if CONFIG_PALETTE
	typedef struct {
	uint8_t best_palette_color_map[MAX_SB_SQUARE];
	float kmeans_data_buf[2 * MAX_SB_SQUARE];
	} PALETTE_BUFFER;
	#endif // CONFIG_PALETTE

	typedef struct macroblock MACROBLOCK;
	struct macroblock {
	struct macroblock_plane plane[MAX_MB_PLANE];

	MACROBLOCKD e_mbd;
	MB_MODE_INFO_EXT *mbmi_ext;
	int skip_block;
	int qindex;

	// The equivalent error at the current rdmult of one whole bit (not one
	// bitcost unit).
	int errorperbit;
	// The equivalend SAD error of one (whole) bit at the current quantizer
	// for large blocks.
	int sadperbit16;
	// The equivalend SAD error of one (whole) bit at the current quantizer
	// for sub-8x8 blocks.
	int sadperbit4;
	int rddiv;
	int rdmult;
	int mb_energy;
	int *m_search_count_ptr;
	int *ex_search_count_ptr;

	#if CONFIG_VAR_TX
	unsigned int txb_split_count;
	#endif

	// These are set to their default values at the beginning, and then adjusted
	// further in the encoding process.
	BLOCK_SIZE min_partition_size;
	BLOCK_SIZE max_partition_size;

	int mv_best_ref_index[TOTAL_REFS_PER_FRAME];
	unsigned int max_mv_context[TOTAL_REFS_PER_FRAME];
	unsigned int source_variance;
	unsigned int recon_variance;
	unsigned int pred_sse[TOTAL_REFS_PER_FRAME];
	int pred_mv_sad[TOTAL_REFS_PER_FRAME];

	#if CONFIG_REF_MV
	int *nmvjointcost;
	int nmv_vec_cost[NMV_CONTEXTS][MV_JOINTS];
	int *nmvcost[NMV_CONTEXTS][2];
	int *nmvcost_hp[NMV_CONTEXTS][2];
	int **mv_cost_stack[NMV_CONTEXTS];
	int *nmvjointsadcost;
	#else
	int nmvjointcost[MV_JOINTS];
	int *nmvcost[2];
	int *nmvcost_hp[2];
	int nmvjointsadcost[MV_JOINTS];
	#endif

	int **mvcost;
	int *nmvsadcost[2];
	int *nmvsadcost_hp[2];
	int **mvsadcost;
	#if CONFIG_MOTION_VAR
	int32_t *wsrc_buf;
	int32_t *mask_buf;
	#endif // CONFIG_MOTION_VAR

	#if CONFIG_PALETTE
	PALETTE_BUFFER *palette_buffer;
	#endif // CONFIG_PALETTE

	// These define limits to motion vector components to prevent them
	// from extending outside the UMV borders
	int mv_col_min;
	int mv_col_max;
	int mv_row_min;
	int mv_row_max;

	#if CONFIG_VAR_TX
	uint8_t blk_skip[MAX_MB_PLANE][MAX_MIB_SIZE * MAX_MIB_SIZE * 8];
	#if CONFIG_REF_MV
	uint8_t blk_skip_drl[MAX_MB_PLANE][MAX_MIB_SIZE * MAX_MIB_SIZE * 8];
	#endif
	#endif

	int skip;

	// note that token_costs is the cost when eob node is skipped
	av1_coeff_cost token_costs[TX_SIZES];

	int optimize;

	// Used to store sub partition's choices.
	MV pred_mv[TOTAL_REFS_PER_FRAME];

	// Store the best motion vector during motion search
	int_mv best_mv;
	// Store the second best motion vector during full-pixel motion search
	int_mv second_best_mv;

	// use default transform and skip transform type search for intra modes
	int use_default_intra_tx_type;
	// use default transform and skip transform type search for inter modes
	int use_default_inter_tx_type;
	#if CONFIG_PVQ
	int rate;
	// 1 if neither AC nor DC is coded. Only used during RDO.
	int pvq_skip[MAX_MB_PLANE];
	PVQ_QUEUE *pvq_q;

	// Storage for PVQ tx block encodings in a superblock.
	// There can be max 16x16 of 4x4 blocks (and YUV) encode by PVQ
	// 256 is the max # of 4x4 blocks in a SB (64x64), which comes from:
	// 1) Since PVQ is applied to each trasnform-ed block
	// 2) 4x4 is the smallest tx size in AV1
	// 3) AV1 allows using smaller tx size than block (i.e. partition) size
	// TODO(yushin) : The memory usage could be improved a lot, since this has
	// storage for 10 bands and 128 coefficients for every 4x4 block,
	PVQ_INFO pvq[MAX_PVQ_BLOCKS_IN_SB][MAX_MB_PLANE];
	daala_enc_ctx daala_enc;
	int pvq_speed;
	int pvq_coded; // Indicates whether pvq_info needs be stored to tokenize
	#endif
	#if CONFIG_DAALA_DIST
	// Keep rate of each 4x4 block in the current macroblock during RDO
	// This is needed when using the 8x8 Daala distortion metric during RDO,
	// because it evaluates distortion in a different order than the underlying
	// 4x4 blocks are coded.
	int rate_4x4[256];
	#endif
	};

	// Converts block_index for given transform size to index of the block in raster
	// order.
	static inline int av1_block_index_to_raster_order(TX_SIZE tx_size,
	int block_idx) {
	// For transform size 4x8, the possible block_idx values are 0 & 2, because
	// block_idx values are incremented in steps of size 'tx_width_unit x
	// tx_height_unit'. But, for this transform size, block_idx = 2 corresponds to
	// block number 1 in raster order, inside an 8x8 MI block.
	// For any other transform size, the two indices are equivalent.
	return (tx_size == TX_4X8 && block_idx == 2) ? 1 : block_idx;
	}

	// Inverse of above function.
	// Note: only implemented for transform sizes 4x4, 4x8 and 8x4 right now.
	static inline int av1_raster_order_to_block_index(TX_SIZE tx_size,
	int raster_order) {
	assert(tx_size == TX_4X4 \|\| tx_size == TX_4X8 \|\| tx_size == TX_8X4);
	// We ensure that block indices are 0 & 2 if tx size is 4x8 or 8x4.
	return (tx_size == TX_4X4) ? raster_order : (raster_order > 0) ? 2 : 0;
	}

	#ifdef __cplusplus
	} // extern "C"
	#endif

	#endif // AV1_ENCODER_BLOCK_H_