| /* |
| * Copyright (c) 2020, Alliance for Open Media. All rights reserved |
| * |
| * This source code is subject to the terms of the BSD 2 Clause License and |
| * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
| * was not distributed with this source code in the LICENSE file, you can |
| * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
| * Media Patent License 1.0 was not distributed with this source code in the |
| * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
| */ |
| |
| #ifndef AOM_AV1_ENCODER_ENCODEFRAME_UTILS_H_ |
| #define AOM_AV1_ENCODER_ENCODEFRAME_UTILS_H_ |
| |
| #include "aom_ports/aom_timer.h" |
| #include "aom_ports/system_state.h" |
| |
| #include "av1/common/reconinter.h" |
| |
| #include "av1/encoder/encoder.h" |
| #include "av1/encoder/partition_strategy.h" |
| #include "av1/encoder/rdopt.h" |
| |
| #ifdef __cplusplus |
| extern "C" { |
| #endif |
| |
// Selector for the mode-decision path. NOTE(review): the enumerator names
// suggest "rate-distortion search" vs. "non-RD search"; confirm at the use
// sites, which are outside this header.
enum { PICK_MODE_RD = 0, PICK_MODE_NONRD };
| |
// Pass type used when a superblock is encoded once (single pass) or twice
// (dry pass followed by wet pass). Stored as SB_MULTI_PASS_MODE via
// UENUM1BYTE.
enum {
  SB_SINGLE_PASS,  // Single pass encoding: all ctxs get updated normally
  SB_DRY_PASS,     // First pass of multi-pass: does not update the ctxs
  SB_WET_PASS      // Second pass of multi-pass: finalize and update the ctx
} UENUM1BYTE(SB_MULTI_PASS_MODE);
| |
// Buffer type taken by av1_save_context() (as output) and
// av1_restore_context() (as input), both declared in this header.
typedef struct {
  // Entropy contexts, with room for MAX_MB_PLANE planes of MAX_MIB_SIZE
  // entries each. NOTE(review): 'a' / 'l' presumably mean above / left.
  ENTROPY_CONTEXT a[MAX_MIB_SIZE * MAX_MB_PLANE];
  ENTROPY_CONTEXT l[MAX_MIB_SIZE * MAX_MB_PLANE];
  // Partition contexts (presumably above / left — confirm).
  PARTITION_CONTEXT sa[MAX_MIB_SIZE];
  PARTITION_CONTEXT sl[MAX_MIB_SIZE];
  // Pointers to transform contexts. NOTE(review): presumably the locations the
  // ta / tl copies below were taken from; confirm in av1_save_context().
  TXFM_CONTEXT *p_ta;
  TXFM_CONTEXT *p_tl;
  // Transform context storage.
  TXFM_CONTEXT ta[MAX_MIB_SIZE];
  TXFM_CONTEXT tl[MAX_MIB_SIZE];
} RD_SEARCH_MACROBLOCK_CONTEXT;
| |
// This struct stores the statistics used by superblock-level multi-pass
// encoding. Currently it is only used to hold a copy of the state taken before
// the first pass is performed. Pointers to it are taken by
// av1_backup_sb_state() and av1_restore_sb_state(), declared in this header.
typedef struct SB_FIRST_PASS_STATS {
  // Copy of the entropy / partition / transform contexts.
  RD_SEARCH_MACROBLOCK_CONTEXT x_ctx;
  // Copy of the RD counters.
  RD_COUNTS rd_count;

  int split_count;
  // Copy of the frame counts.
  FRAME_COUNTS fc;
  // One inter-mode RD model per block size.
  InterModeRdModel inter_mode_rd_models[BLOCK_SIZES_ALL];
  // Indexed by [block size][mode].
  int thresh_freq_fact[BLOCK_SIZES_ALL][MAX_MODES];
  int current_qindex;

#if CONFIG_INTERNAL_STATS
  // Per-mode counters; only present when internal stats are compiled in.
  unsigned int mode_chosen_counts[MAX_MODES];
#endif  // CONFIG_INTERNAL_STATS
} SB_FIRST_PASS_STATS;
| |
// Block-size related variables for use in rd_pick_partition(). An instance is
// embedded in PartitionSearchState as 'part_blk_params'.
typedef struct {
  // Half of the block width, used to determine the block edge.
  int mi_step;

  // Row and column indices of the block.
  int mi_row;
  int mi_col;

  // Row and column indices of the block edge.
  int mi_row_edge;
  int mi_col_edge;

  // Width of the current partition block.
  int width;

  // Block width of the minimum partition size allowed.
  int min_partition_size_1d;

  // Flag indicating whether the partition is 8x8 or larger.
  int bsize_at_least_8x8;

  // Indicates edge blocks in the frame.
  int has_rows;
  int has_cols;

  // Block size of the current partition.
  BLOCK_SIZE bsize;

  // Size of the current sub-partition.
  BLOCK_SIZE subsize;

  // Size of the split partition.
  BLOCK_SIZE split_bsize2;
} PartitionBlkParams;
| |
#if CONFIG_COLLECT_PARTITION_STATS
// Per-partition-type statistics gathered during one call to
// av1_rd_pick_partition. Only compiled in when CONFIG_COLLECT_PARTITION_STATS
// is enabled. Every array is indexed by partition type.
typedef struct PartitionTimingStats {
  // Tracks the number of partition decisions made in the current call to \ref
  // av1_rd_pick_partition
  int partition_decisions[EXT_PARTITION_TYPES];
  // Tracks the number of partition blocks searched in the current call to \ref
  // av1_rd_pick_partition
  int partition_attempts[EXT_PARTITION_TYPES];
  // Tracks the time spent on each partition search in the current call to \ref
  // av1_rd_pick_partition
  int64_t partition_times[EXT_PARTITION_TYPES];
  // Tracks the rdcost of each partition search in the current call to
  // \ref av1_rd_pick_partition
  int64_t partition_rdcost[EXT_PARTITION_TYPES];
  // Timer used to time the partitions.
  struct aom_usec_timer timer;
  // Whether the timer is currently running.
  int timer_is_on;
} PartitionTimingStats;
#endif  // CONFIG_COLLECT_PARTITION_STATS
| |
// Structure holding the state variables of a partition search.
typedef struct {
  // Intra partitioning related info.
  PartitionSearchInfo *intra_part_info;

  // Parameters related to the partition block size.
  PartitionBlkParams part_blk_params;

  // Win flags for HORZ and VERT partition evaluations, one entry per
  // sub-block of the split partition.
  RD_RECT_PART_WIN_INFO split_part_rect_win[SUB_PARTITIONS_SPLIT];

  // RD cost for the current block of the given partition type.
  RD_STATS this_rdc;

  // RD cost summed across all blocks of the partition type.
  RD_STATS sum_rdc;

  // Array holding the partition type costs.
  int tmp_partition_cost[PARTITION_TYPES];

  // Pointer to the partition cost buffer.
  // NOTE(review): may point at tmp_partition_cost above — confirm at the
  // initialization site.
  int *partition_cost;

  // RD costs for different partition types.
  int64_t none_rd;
  int64_t split_rd[SUB_PARTITIONS_SPLIT];
  // RD costs for rectangular partitions.
  // rect_part_rd[0][i] is the RD cost of ith partition index of PARTITION_HORZ.
  // rect_part_rd[1][i] is the RD cost of ith partition index of PARTITION_VERT.
  int64_t rect_part_rd[NUM_RECT_PARTS][SUB_PARTITIONS_RECT];

  // Flags indicating if the corresponding partition was the winner or not.
  // Used to bypass similar blocks during AB partition evaluation.
  int is_split_ctx_is_ready[2];
  int is_rect_ctx_is_ready[NUM_RECT_PARTS];

  // Flags to prune/skip the evaluation of particular partition sizes.
  int terminate_partition_search;
  int partition_none_allowed;
  int partition_rect_allowed[NUM_RECT_PARTS];
  int do_rectangular_split;
  int do_square_split;
  int prune_rect_part[NUM_RECT_PARTS];

  // Chroma subsampling in the x and y directions.
  int ss_x;
  int ss_y;

  // Partition plane context index.
  int pl_ctx_idx;

  // Set when the search has found a best partition.
  bool found_best_partition;

#if CONFIG_COLLECT_PARTITION_STATS
  // Timing/decision statistics; only present when partition stats collection
  // is compiled in.
  PartitionTimingStats part_timing_stats;
#endif  // CONFIG_COLLECT_PARTITION_STATS
} PartitionSearchState;
| |
| static AOM_INLINE void update_filter_type_cdf(const MACROBLOCKD *xd, |
| const MB_MODE_INFO *mbmi, |
| int dual_filter) { |
| for (int dir = 0; dir < 2; ++dir) { |
| if (dir && !dual_filter) break; |
| const int ctx = av1_get_pred_context_switchable_interp(xd, dir); |
| InterpFilter filter = av1_extract_interp_filter(mbmi->interp_filters, dir); |
| update_cdf(xd->tile_ctx->switchable_interp_cdf[ctx], filter, |
| SWITCHABLE_FILTERS); |
| } |
| } |
| |
| static AOM_INLINE int set_segment_rdmult(const AV1_COMP *const cpi, |
| MACROBLOCK *const x, |
| int8_t segment_id) { |
| const AV1_COMMON *const cm = &cpi->common; |
| av1_init_plane_quantizers(cpi, x, segment_id); |
| aom_clear_system_state(); |
| const int segment_qindex = |
| av1_get_qindex(&cm->seg, segment_id, cm->quant_params.base_qindex); |
| return av1_compute_rd_mult(cpi, |
| segment_qindex + cm->quant_params.y_dc_delta_q); |
| } |
| |
| static AOM_INLINE int do_slipt_check(BLOCK_SIZE bsize) { |
| return (bsize == BLOCK_16X16 || bsize == BLOCK_32X32); |
| } |
| |
| #if !CONFIG_REALTIME_ONLY |
| static AOM_INLINE const FIRSTPASS_STATS *read_one_frame_stats(const TWO_PASS *p, |
| int frm) { |
| assert(frm >= 0); |
| if (frm < 0 || |
| p->stats_buf_ctx->stats_in_start + frm > p->stats_buf_ctx->stats_in_end) { |
| return NULL; |
| } |
| |
| return &p->stats_buf_ctx->stats_in_start[frm]; |
| } |
| |
| static BLOCK_SIZE dim_to_size(int dim) { |
| switch (dim) { |
| case 4: return BLOCK_4X4; |
| case 8: return BLOCK_8X8; |
| case 16: return BLOCK_16X16; |
| case 32: return BLOCK_32X32; |
| case 64: return BLOCK_64X64; |
| case 128: return BLOCK_128X128; |
| default: assert(0); return 0; |
| } |
| } |
| |
| static AOM_INLINE void set_max_min_partition_size(SuperBlockEnc *sb_enc, |
| AV1_COMP *cpi, MACROBLOCK *x, |
| const SPEED_FEATURES *sf, |
| BLOCK_SIZE sb_size, |
| int mi_row, int mi_col) { |
| const AV1_COMMON *cm = &cpi->common; |
| |
| sb_enc->max_partition_size = |
| AOMMIN(sf->part_sf.default_max_partition_size, |
| dim_to_size(cpi->oxcf.part_cfg.max_partition_size)); |
| sb_enc->min_partition_size = |
| AOMMAX(sf->part_sf.default_min_partition_size, |
| dim_to_size(cpi->oxcf.part_cfg.min_partition_size)); |
| sb_enc->max_partition_size = |
| AOMMIN(sb_enc->max_partition_size, cm->seq_params->sb_size); |
| sb_enc->min_partition_size = |
| AOMMIN(sb_enc->min_partition_size, cm->seq_params->sb_size); |
| |
| if (use_auto_max_partition(cpi, sb_size, mi_row, mi_col)) { |
| float features[FEATURE_SIZE_MAX_MIN_PART_PRED] = { 0.0f }; |
| |
| av1_get_max_min_partition_features(cpi, x, mi_row, mi_col, features); |
| sb_enc->max_partition_size = |
| AOMMAX(AOMMIN(av1_predict_max_partition(cpi, x, features), |
| sb_enc->max_partition_size), |
| sb_enc->min_partition_size); |
| } |
| } |
| |
// The declarations below are only visible when CONFIG_REALTIME_ONLY is 0.
// Their definitions are not part of this header.

// NOTE(review): presumably returns an RD multiplier derived from orig_rdmult
// for the block of size bsize at (mi_row, mi_col); confirm in the definition.
int av1_get_rdmult_delta(AV1_COMP *cpi, BLOCK_SIZE bsize, int mi_row,
                         int mi_col, int orig_rdmult);

// NOTE(review): presumably tests for an active horizontal edge near mi_row
// within mi_step units; confirm in the definition.
int av1_active_h_edge(const AV1_COMP *cpi, int mi_row, int mi_step);

// Column counterpart of av1_active_h_edge (takes mi_col instead of mi_row).
int av1_active_v_edge(const AV1_COMP *cpi, int mi_col, int mi_step);

// Takes the superblock encoder state sb_enc as a non-const pointer.
// NOTE(review): presumably fills it with TPL statistics — confirm.
void av1_get_tpl_stats_sb(AV1_COMP *cpi, BLOCK_SIZE bsize, int mi_row,
                          int mi_col, SuperBlockEnc *sb_enc);

// NOTE(review): presumably returns the q index to use for the block when the
// delta-q objective mode is active; confirm in the definition.
int av1_get_q_for_deltaq_objective(AV1_COMP *const cpi, BLOCK_SIZE bsize,
                                   int mi_row, int mi_col);
| #endif // !CONFIG_REALTIME_ONLY |
| |
// Declarations of encode-frame helpers whose definitions are not part of this
// header. Semantics noted below are inferred from the signatures only and are
// marked for confirmation where they go beyond what the prototypes show.

// Takes rdmult and errorperbit as non-const pointers (outputs or in/outs).
// NOTE(review): presumably an SSIM-tuned RD multiplier adjustment — confirm.
void av1_set_ssim_rdmult(const AV1_COMP *const cpi, int *errorperbit,
                         const BLOCK_SIZE bsize, const int mi_row,
                         const int mi_col, int *const rdmult);

// NOTE(review): presumably returns an RD multiplier derived from orig_rdmult
// using hierarchical TPL data — confirm.
int av1_get_hier_tpl_rdmult(const AV1_COMP *const cpi, MACROBLOCK *const x,
                            const BLOCK_SIZE bsize, const int mi_row,
                            const int mi_col, int orig_rdmult);

// cpi and ctx are read-only here (const); td is mutable.
void av1_update_state(const AV1_COMP *const cpi, ThreadData *td,
                      const PICK_MODE_CONTEXT *const ctx, int mi_row,
                      int mi_col, BLOCK_SIZE bsize, RUN_TYPE dry_run);

// Takes the frame context and counts as mutable pointers.
void av1_update_inter_mode_stats(FRAME_CONTEXT *fc, FRAME_COUNTS *counts,
                                 PREDICTION_MODE mode, int16_t mode_context);

// Takes counts and xd as mutable pointers; the mode-info arguments are const.
void av1_sum_intra_stats(const AV1_COMMON *const cm, FRAME_COUNTS *counts,
                         MACROBLOCKD *xd, const MB_MODE_INFO *const mbmi,
                         const MB_MODE_INFO *above_mi,
                         const MB_MODE_INFO *left_mi, const int intraonly);

// ctx is read-only (const) and x is mutable: the direction is ctx -> x.
void av1_restore_context(MACROBLOCK *x, const RD_SEARCH_MACROBLOCK_CONTEXT *ctx,
                         int mi_row, int mi_col, BLOCK_SIZE bsize,
                         const int num_planes);

// x is read-only (const) and ctx is mutable: the direction is x -> ctx.
void av1_save_context(const MACROBLOCK *x, RD_SEARCH_MACROBLOCK_CONTEXT *ctx,
                      int mi_row, int mi_col, BLOCK_SIZE bsize,
                      const int num_planes);

// NOTE(review): presumably assigns bsize to the mode-info entries reachable
// through mib — confirm.
void av1_set_fixed_partitioning(AV1_COMP *cpi, const TileInfo *const tile,
                                MB_MODE_INFO **mib, int mi_row, int mi_col,
                                BLOCK_SIZE bsize);

// Returns an int; NOTE(review): presumably a boolean — confirm.
int av1_is_leaf_split_partition(AV1_COMMON *cm, int mi_row, int mi_col,
                                BLOCK_SIZE bsize);

void av1_reset_simple_motion_tree_partition(SIMPLE_MOTION_DATA_TREE *sms_tree,
                                            BLOCK_SIZE bsize);

void av1_update_picked_ref_frames_mask(MACROBLOCK *const x, int ref_type,
                                       BLOCK_SIZE bsize, int mib_size,
                                       int mi_row, int mi_col);

// Both contexts are mutable. NOTE(review): presumably a weighted average with
// weights wt_left and wt_tr; which context receives the result is not visible
// here — confirm.
void av1_avg_cdf_symbols(FRAME_CONTEXT *ctx_left, FRAME_CONTEXT *ctx_tr,
                         int wt_left, int wt_tr);

void av1_source_content_sb(AV1_COMP *cpi, MACROBLOCK *x, int offset);

void av1_reset_mbmi(CommonModeInfoParams *const mi_params, BLOCK_SIZE sb_size,
                    int mi_row, int mi_col);

// sb_fp_stats is mutable while cpi and tile_data are const: the direction is
// encoder state -> sb_fp_stats.
void av1_backup_sb_state(SB_FIRST_PASS_STATS *sb_fp_stats, const AV1_COMP *cpi,
                         ThreadData *td, const TileDataEnc *tile_data,
                         int mi_row, int mi_col);

// sb_fp_stats is const while cpi and tile_data are mutable: the direction is
// sb_fp_stats -> encoder state.
void av1_restore_sb_state(const SB_FIRST_PASS_STATS *sb_fp_stats, AV1_COMP *cpi,
                          ThreadData *td, TileDataEnc *tile_data, int mi_row,
                          int mi_col);

void av1_set_cost_upd_freq(AV1_COMP *cpi, ThreadData *td,
                           const TileInfo *const tile_info, const int mi_row,
                           const int mi_col);
| |
| static AOM_INLINE void av1_dealloc_mb_data(struct AV1Common *cm, |
| struct macroblock *mb) { |
| if (mb->txfm_search_info.txb_rd_records) { |
| aom_free(mb->txfm_search_info.txb_rd_records); |
| mb->txfm_search_info.txb_rd_records = NULL; |
| } |
| const int num_planes = av1_num_planes(cm); |
| for (int plane = 0; plane < num_planes; plane++) { |
| if (mb->plane[plane].src_diff) { |
| aom_free(mb->plane[plane].src_diff); |
| mb->plane[plane].src_diff = NULL; |
| } |
| } |
| if (mb->e_mbd.seg_mask) { |
| aom_free(mb->e_mbd.seg_mask); |
| mb->e_mbd.seg_mask = NULL; |
| } |
| if (mb->winner_mode_stats) { |
| aom_free(mb->winner_mode_stats); |
| mb->winner_mode_stats = NULL; |
| } |
| } |
| |
| static AOM_INLINE void av1_alloc_mb_data(struct AV1Common *cm, |
| struct macroblock *mb, |
| int use_nonrd_pick_mode) { |
| if (!use_nonrd_pick_mode) { |
| mb->txfm_search_info.txb_rd_records = |
| (TxbRdRecords *)aom_malloc(sizeof(TxbRdRecords)); |
| } |
| const int num_planes = av1_num_planes(cm); |
| for (int plane = 0; plane < num_planes; plane++) { |
| const int subsampling_xy = |
| plane ? cm->seq_params->subsampling_x + cm->seq_params->subsampling_y |
| : 0; |
| const int sb_size = MAX_SB_SQUARE >> subsampling_xy; |
| CHECK_MEM_ERROR(cm, mb->plane[plane].src_diff, |
| (int16_t *)aom_memalign( |
| 32, sizeof(*mb->plane[plane].src_diff) * sb_size)); |
| } |
| CHECK_MEM_ERROR(cm, mb->e_mbd.seg_mask, |
| (uint8_t *)aom_memalign( |
| 16, 2 * MAX_SB_SQUARE * sizeof(mb->e_mbd.seg_mask[0]))); |
| const int winner_mode_count = frame_is_intra_only(cm) |
| ? MAX_WINNER_MODE_COUNT_INTRA |
| : MAX_WINNER_MODE_COUNT_INTER; |
| CHECK_MEM_ERROR(cm, mb->winner_mode_stats, |
| (WinnerModeStats *)aom_malloc( |
| winner_mode_count * sizeof(mb->winner_mode_stats[0]))); |
| } |
| |
| // This function will compute the number of reference frames to be disabled |
| // based on selective_ref_frame speed feature. |
| static AOM_INLINE unsigned int get_num_refs_to_disable( |
| const AV1_COMP *cpi, const int *ref_frame_flags, |
| const unsigned int *ref_display_order_hint, |
| unsigned int cur_frame_display_index) { |
| unsigned int num_refs_to_disable = 0; |
| if (cpi->sf.inter_sf.selective_ref_frame >= 3) { |
| num_refs_to_disable++; |
| if (cpi->sf.inter_sf.selective_ref_frame >= 6) { |
| // Disable LAST2_FRAME and ALTREF2_FRAME |
| num_refs_to_disable += 2; |
| } else if (cpi->sf.inter_sf.selective_ref_frame == 5 && |
| *ref_frame_flags & av1_ref_frame_flag_list[LAST2_FRAME]) { |
| const int last2_frame_dist = av1_encoder_get_relative_dist( |
| ref_display_order_hint[LAST2_FRAME - LAST_FRAME], |
| cur_frame_display_index); |
| // Disable LAST2_FRAME if it is a temporally distant frame |
| if (abs(last2_frame_dist) > 2) { |
| num_refs_to_disable++; |
| } |
| #if !CONFIG_REALTIME_ONLY |
| else if (is_stat_consumption_stage_twopass(cpi)) { |
| const FIRSTPASS_STATS *const this_frame_stats = |
| read_one_frame_stats(&cpi->ppi->twopass, cur_frame_display_index); |
| aom_clear_system_state(); |
| const double coded_error_per_mb = |
| this_frame_stats->coded_error / cpi->frame_info.num_mbs; |
| // Disable LAST2_FRAME if the coded error of the current frame based on |
| // first pass stats is very low. |
| if (coded_error_per_mb < 100.0) num_refs_to_disable++; |
| } |
| #endif // CONFIG_REALTIME_ONLY |
| } |
| } |
| return num_refs_to_disable; |
| } |
| |
| static INLINE int get_max_allowed_ref_frames( |
| const AV1_COMP *cpi, const int *ref_frame_flags, |
| const unsigned int *ref_display_order_hint, |
| unsigned int cur_frame_display_index) { |
| const unsigned int max_reference_frames = |
| cpi->oxcf.ref_frm_cfg.max_reference_frames; |
| const unsigned int num_refs_to_disable = get_num_refs_to_disable( |
| cpi, ref_frame_flags, ref_display_order_hint, cur_frame_display_index); |
| const unsigned int max_allowed_refs_for_given_speed = |
| INTER_REFS_PER_FRAME - num_refs_to_disable; |
| return AOMMIN(max_allowed_refs_for_given_speed, max_reference_frames); |
| } |
| |
| // Enforce the number of references for each arbitrary frame based on user |
| // options and speed. |
| static AOM_INLINE void enforce_max_ref_frames( |
| AV1_COMP *cpi, int *ref_frame_flags, |
| const unsigned int *ref_display_order_hint, |
| unsigned int cur_frame_display_index) { |
| MV_REFERENCE_FRAME ref_frame; |
| int total_valid_refs = 0; |
| |
| for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) { |
| if (*ref_frame_flags & av1_ref_frame_flag_list[ref_frame]) { |
| total_valid_refs++; |
| } |
| } |
| |
| const int max_allowed_refs = get_max_allowed_ref_frames( |
| cpi, ref_frame_flags, ref_display_order_hint, cur_frame_display_index); |
| |
| for (int i = 0; i < 4 && total_valid_refs > max_allowed_refs; ++i) { |
| const MV_REFERENCE_FRAME ref_frame_to_disable = disable_order[i]; |
| |
| if (!(*ref_frame_flags & av1_ref_frame_flag_list[ref_frame_to_disable])) { |
| continue; |
| } |
| |
| switch (ref_frame_to_disable) { |
| case LAST3_FRAME: *ref_frame_flags &= ~AOM_LAST3_FLAG; break; |
| case LAST2_FRAME: *ref_frame_flags &= ~AOM_LAST2_FLAG; break; |
| case ALTREF2_FRAME: *ref_frame_flags &= ~AOM_ALT2_FLAG; break; |
| case GOLDEN_FRAME: *ref_frame_flags &= ~AOM_GOLD_FLAG; break; |
| default: assert(0); |
| } |
| --total_valid_refs; |
| } |
| assert(total_valid_refs <= max_allowed_refs); |
| } |
| |
| #ifdef __cplusplus |
| } // extern "C" |
| #endif |
| |
| #endif // AOM_AV1_ENCODER_ENCODEFRAME_UTILS_H_ |