| /* |
| * Copyright (c) 2016, Alliance for Open Media. All rights reserved |
| * |
| * This source code is subject to the terms of the BSD 2 Clause License and |
| * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
| * was not distributed with this source code in the LICENSE file, you can |
| * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
| * Media Patent License 1.0 was not distributed with this source code in the |
| * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
| */ |
| |
| #ifndef AOM_AV1_ENCODER_FIRSTPASS_H_ |
| #define AOM_AV1_ENCODER_FIRSTPASS_H_ |
| |
| #include "av1/common/av1_common_int.h" |
| #include "av1/common/enums.h" |
| #include "av1/encoder/lookahead.h" |
| #include "av1/encoder/ratectrl.h" |
| |
| #ifdef __cplusplus |
| extern "C" { |
| #endif |
| |
| #define DOUBLE_DIVIDE_CHECK(x) ((x) < 0 ? (x)-0.000001 : (x) + 0.000001) |
| |
| #define MIN_ZERO_MOTION 0.95 |
| #define MAX_SR_CODED_ERROR 40 |
| #define MAX_RAW_ERR_VAR 2000 |
| #define MIN_MV_IN_OUT 0.4 |
| |
| #define VLOW_MOTION_THRESHOLD 950 |
| struct ThreadData; |
| |
| /*! |
| * \brief The stucture of acummulated frame stats in the first pass. |
| * |
| * Errors (coded_error, intra_error, etc.) and counters (new_mv_count) are |
| * normalized to each MB. MV related stats (MVc, MVr, etc.) are normalized to |
| * the frame width and height. See function normalize_firstpass_stats. |
| */ |
| typedef struct { |
| /*! |
| * Frame number in display order, if stats are for a single frame. |
| * No real meaning for a collection of frames. |
| */ |
| double frame; |
| /*! |
| * Weight assigned to this frame (or total weight for the collection of |
| * frames) currently based on intra factor and brightness factor. This is used |
| * to distribute bits betweeen easier and harder frames. |
| */ |
| double weight; |
| /*! |
| * Intra prediction error. |
| */ |
| double intra_error; |
| /*! |
| * Average wavelet energy computed using Discrete Wavelet Transform (DWT). |
| */ |
| double frame_avg_wavelet_energy; |
| /*! |
| * Best of intra pred error and inter pred error using last frame as ref. |
| */ |
| double coded_error; |
| /*! |
| * Best of intra pred error and inter pred error using golden frame as ref. |
| */ |
| double sr_coded_error; |
| /*! |
| * Percentage of blocks with inter pred error < intra pred error. |
| */ |
| double pcnt_inter; |
| /*! |
| * Percentage of blocks using (inter prediction and) non-zero motion vectors. |
| */ |
| double pcnt_motion; |
| /*! |
| * Percentage of blocks where golden frame was better than last or intra: |
| * inter pred error using golden frame < inter pred error using last frame and |
| * inter pred error using golden frame < intra pred error |
| */ |
| double pcnt_second_ref; |
| /*! |
| * Percentage of blocks where intra and inter prediction errors were very |
| * close. Note that this is a 'weighted count', that is, the so blocks may be |
| * weighted by how close the two errors were. |
| */ |
| double pcnt_neutral; |
| /*! |
| * Percentage of blocks that have almost no intra error residual |
| * (i.e. are in effect completely flat and untextured in the intra |
| * domain). In natural videos this is uncommon, but it is much more |
| * common in animations, graphics and screen content, so may be used |
| * as a signal to detect these types of content. |
| */ |
| double intra_skip_pct; |
| /*! |
| * Image mask rows top and bottom. |
| */ |
| double inactive_zone_rows; |
| /*! |
| * Image mask columns at left and right edges. |
| */ |
| double inactive_zone_cols; |
| /*! |
| * Average of row motion vectors. |
| */ |
| double MVr; |
| /*! |
| * Mean of absolute value of row motion vectors. |
| */ |
| double mvr_abs; |
| /*! |
| * Mean of column motion vectors. |
| */ |
| double MVc; |
| /*! |
| * Mean of absolute value of column motion vectors. |
| */ |
| double mvc_abs; |
| /*! |
| * Variance of row motion vectors. |
| */ |
| double MVrv; |
| /*! |
| * Variance of column motion vectors. |
| */ |
| double MVcv; |
| /*! |
| * Value in range [-1,1] indicating fraction of row and column motion vectors |
| * that point inwards (negative MV value) or outwards (positive MV value). |
| * For example, value of 1 indicates, all row/column MVs are inwards. |
| */ |
| double mv_in_out_count; |
| /*! |
| * Count of unique non-zero motion vectors. |
| */ |
| double new_mv_count; |
| /*! |
| * Duration of the frame / collection of frames. |
| */ |
| double duration; |
| /*! |
| * 1.0 if stats are for a single frame, OR |
| * Number of frames in this collection for which the stats are accumulated. |
| */ |
| double count; |
| /*! |
| * standard deviation for (0, 0) motion prediction error |
| */ |
| double raw_error_stdev; |
| /*! |
| * Whether the frame contains a flash |
| */ |
| int64_t is_flash; |
| /*! |
| * Estimated noise variance |
| */ |
| double noise_var; |
| /*! |
| * Correlation coefficient with the previous frame |
| */ |
| double cor_coeff; |
| } FIRSTPASS_STATS; |
| |
| // We want to keep one past stats for key frame detection |
| // in test_candidate_kf() |
| #define FIRSTPASS_INFO_STATS_PAST_MIN 1 |
| |
| // The size of static buffer used in FIRSTPASS_INFO. |
| #define FIRSTPASS_INFO_STATIC_BUF_SIZE \ |
| (MAX_LAP_BUFFERS + FIRSTPASS_INFO_STATS_PAST_MIN) |
| |
| /*! |
| * \brief Data structure used for managing first pass stats |
| */ |
| typedef struct { |
| /*! |
| * A static buffer that will be used when no ext_stats_buf is assigned. The |
| * ext_stats_buf is assigned through av1_firstpass_info_init() when the user |
| * already has a pre-existing firstpass stats that is stored in an external |
| * buffer. The ext_stats_buf is usually used in two pass mode. When using one |
| * pass mode, we generate "firstpass" stats and encode the video in the same |
| * pass. In this scenario, the stats will be pushed and popped from |
| * static_stats_buf. |
| */ |
| FIRSTPASS_STATS static_stats_buf[FIRSTPASS_INFO_STATIC_BUF_SIZE]; |
| /*! |
| * A pointer to first pass stats. |
| * Note that this buffer will be used as ring buffer. |
| */ |
| FIRSTPASS_STATS *stats_buf; |
| /*! |
| * size of stats_buf |
| */ |
| int stats_buf_size; |
| /*! |
| * start index of the available frame stats |
| * Note that start_index doesn't always point to |
| * current frame's stats because we need to |
| * keep past stats as well. To access current |
| * frame's stats, please use cur_index. |
| */ |
| int start_index; |
| |
| /*! |
| * count available stats stored in stats_buf |
| * the following condition should stay true |
| * stats_count = future_stats_count + past_stats_count |
| */ |
| int stats_count; |
| |
| /*! |
| * index of the current frame's stats |
| */ |
| int cur_index; |
| |
| /*! |
| * count available future stats including current stats |
| */ |
| int future_stats_count; |
| |
| /*! |
| * count available past stats EXCLUDING current stats |
| */ |
| int past_stats_count; |
| |
| /*! |
| * Accumulation of the stats being pushed into firstpass_info |
| */ |
| FIRSTPASS_STATS total_stats; |
| } FIRSTPASS_INFO; |
| |
| /*!\brief Init firstpass_info |
| * |
| * If using ext_stats_buf, the buffer needs to stay available during encoding |
| * process. |
| * |
| * \ingroup rate_control |
| * \param[out] firstpass_info struct of firstpass_info. |
| * \param[in] ext_stats_buf external stats buffer. Pass in NULL if |
| * choose to use internal static_stats_buf. |
| * \param[in] ext_stats_buf_size external stats buffer size. Pass in 0 if |
| * choose to use internal static_stats_buf. \return status |
| */ |
| aom_codec_err_t av1_firstpass_info_init(FIRSTPASS_INFO *firstpass_info, |
| FIRSTPASS_STATS *ext_stats_buf, |
| int ext_stats_buf_size); |
| |
| /*!\brief Move cur_index by 1 |
| * |
| * \ingroup rate_control |
| * \param[out] firstpass_info struct of firstpass_info. |
| * \return status |
| */ |
| aom_codec_err_t av1_firstpass_info_move_cur_index( |
| FIRSTPASS_INFO *firstpass_info); |
| |
| /*!\brief Pop a stats from firstpass_info |
| * |
| * \ingroup rate_control |
| * \param[out] firstpass_info struct of firstpass_info. |
| * \return status |
| */ |
| aom_codec_err_t av1_firstpass_info_pop(FIRSTPASS_INFO *firstpass_info); |
| |
| /*!\brief Move cur_index by 1 and pop a stats from firstpass_info |
| * |
| * \ingroup rate_control |
| * \param[out] firstpass_info struct of firstpass_info. |
| * \return status |
| */ |
| aom_codec_err_t av1_firstpass_info_move_cur_index_and_pop( |
| FIRSTPASS_INFO *firstpass_info); |
| |
| /*!\brief Push a stats into firstpass_info |
| * |
| * Note that the input stats will be copied into firstpass_info. |
| * \ingroup rate_control |
| * \param[out] firstpass_info struct of firstpass_info. |
| * \param[in] input_stats input stats |
| * \return status |
| */ |
| aom_codec_err_t av1_firstpass_info_push(FIRSTPASS_INFO *firstpass_info, |
| const FIRSTPASS_STATS *input_stats); |
| |
| /*!\brief Peek at a stats from firstpass_info |
| * |
| * The target index is as follows. |
| * (cur_index + offset_from_cur) % firstpass_info->stats_buf_size |
| * |
| * \ingroup rate_control |
| * \param[in] firstpass_info struct of firstpass_info. |
| * \param[in] offset_from_cur index offset from cur_index. |
| * \return pointer to the stats. The pointer will be NULL if |
| * stats_index_offset is invalid. |
| */ |
| const FIRSTPASS_STATS *av1_firstpass_info_peek( |
| const FIRSTPASS_INFO *firstpass_info, int offset_from_cur); |
| |
| /*!\brief Count the future stats from the target in firstpass_info |
| * Note that the target stats will be counted as well. |
| * The target index is as follows. |
| * (cur_index + offset_from_cur) % firstpass_info->stats_buf_size |
| * |
| * \ingroup rate_control |
| * \param[in] firstpass_info struct of firstpass_info. |
| * \param[in] offset_from_cur target stats's inffset |
| * from cur_index. |
| * \return Number of stats in the future after the target stats |
| * including itself. |
| */ |
| int av1_firstpass_info_future_count(const FIRSTPASS_INFO *firstpass_info, |
| int offset_from_cur); |
| |
| /*!\brief Count the past stats before the target in firstpass_info |
| * Note that the target stats will NOT be counted. |
| * The target index is as follows. |
| * (cur_index + offset_from_cur) % firstpass_info->stats_buf_size |
| * |
| * \ingroup rate_control |
| * \param[in] firstpass_info struct of firstpass_info. |
| * \param[in] offset_from_cur target stats's index offset |
| * from cur_index. |
| * \return Number of stats in the past before the target stats |
| * excluding itself. |
| */ |
| int av1_firstpass_info_past_count(const FIRSTPASS_INFO *firstpass_info, |
| int offset_from_cur); |
| |
| /*!\cond */ |
| #define FC_ANIMATION_THRESH 0.15 |
| enum { |
| FC_NORMAL = 0, |
| FC_GRAPHICS_ANIMATION = 1, |
| FRAME_CONTENT_TYPES = 2 |
| } UENUM1BYTE(FRAME_CONTENT_TYPE); |
| /*!\endcond */ |
| |
| /*! |
| * \brief Data related to the current GF/ARF group and the |
| * individual frames within the group |
| */ |
| typedef struct GF_GROUP { |
| /*!\cond */ |
| // Frame update type, e.g. ARF/GF/LF/Overlay |
| FRAME_UPDATE_TYPE update_type[MAX_STATIC_GF_GROUP_LENGTH]; |
| unsigned char arf_src_offset[MAX_STATIC_GF_GROUP_LENGTH]; |
| // The number of frames displayed so far within the GOP at a given coding |
| // frame. |
| unsigned char cur_frame_idx[MAX_STATIC_GF_GROUP_LENGTH]; |
| int layer_depth[MAX_STATIC_GF_GROUP_LENGTH]; |
| int arf_boost[MAX_STATIC_GF_GROUP_LENGTH]; |
| int max_layer_depth; |
| int max_layer_depth_allowed; |
| // This is currently only populated for AOM_Q mode |
| int q_val[MAX_STATIC_GF_GROUP_LENGTH]; |
| int bit_allocation[MAX_STATIC_GF_GROUP_LENGTH]; |
| // The frame coding type - inter/intra frame |
| FRAME_TYPE frame_type[MAX_STATIC_GF_GROUP_LENGTH]; |
| // The reference frame buffer control - update or reset |
| REFBUF_STATE refbuf_state[MAX_STATIC_GF_GROUP_LENGTH]; |
| int arf_index; // the index in the gf group of ARF, if no arf, then -1 |
| int size; // The total length of a GOP |
| #if CONFIG_FRAME_PARALLEL_ENCODE |
| // Indicates the level of parallelism in frame parallel encodes. |
| // 0 : frame is independently encoded (not part of parallel encodes). |
| // 1 : frame is the first in encode order in a given parallel encode set. |
| // 2 : frame occurs later in encode order in a given parallel encode set. |
| int frame_parallel_level[MAX_STATIC_GF_GROUP_LENGTH]; |
| // Indicates whether a frame should act as non-reference frame. |
| // 0 : frame is a reference frame. |
| // 1 : frame is a non-reference frame. |
| int is_frame_non_ref[MAX_STATIC_GF_GROUP_LENGTH]; |
| |
| // The offset into lookahead_ctx for choosing |
| // source of frame parallel encodes. |
| int src_offset[MAX_STATIC_GF_GROUP_LENGTH]; |
| #if CONFIG_FRAME_PARALLEL_ENCODE_2 |
| // Stores the display order hint of each frame in the current GF_GROUP. |
| int display_idx[MAX_STATIC_GF_GROUP_LENGTH]; |
| // Stores the display order hint of the frames not to be |
| // refreshed by the current frame. |
| int skip_frame_refresh[MAX_STATIC_GF_GROUP_LENGTH][REF_FRAMES]; |
| // Stores the display order hint of the frame to be excluded during reference |
| // assignment. |
| int skip_frame_as_ref[MAX_STATIC_GF_GROUP_LENGTH]; |
| #endif // CONFIG_FRAME_PARALLEL_ENCODE_2 |
| #endif // CONFIG_FRAME_PARALLEL_ENCODE |
| /*!\endcond */ |
| } GF_GROUP; |
| /*!\cond */ |
| |
| typedef struct { |
| // Track if the last frame in a GOP has higher quality. |
| int arf_gf_boost_lst; |
| } GF_STATE; |
| |
| typedef struct { |
| FIRSTPASS_STATS *stats_in_start; |
| FIRSTPASS_STATS *stats_in_end; |
| FIRSTPASS_STATS *stats_in_buf_end; |
| FIRSTPASS_STATS *total_stats; |
| FIRSTPASS_STATS *total_left_stats; |
| } STATS_BUFFER_CTX; |
| |
| /*!\endcond */ |
| |
| /*! |
| * \brief Two pass status and control data. |
| */ |
| typedef struct { |
| /*!\cond */ |
| unsigned int section_intra_rating; |
| // Circular queue of first pass stats stored for most recent frames. |
| // cpi->output_pkt_list[i].data.twopass_stats.buf points to actual data stored |
| // here. |
| FIRSTPASS_STATS *frame_stats_arr[MAX_LAP_BUFFERS + 1]; |
| int frame_stats_next_idx; // Index to next unused element in frame_stats_arr. |
| STATS_BUFFER_CTX *stats_buf_ctx; |
| FIRSTPASS_INFO firstpass_info; // This is the first pass data structure |
| // intended to replace stats_in |
| int first_pass_done; |
| int64_t bits_left; |
| double modified_error_min; |
| double modified_error_max; |
| double modified_error_left; |
| |
| // Projected total bits available for a key frame group of frames |
| int64_t kf_group_bits; |
| |
| // Error score of frames still to be coded in kf group |
| double kf_group_error_left; |
| |
| // Over time correction for bits per macro block estimation |
| double bpm_factor; |
| |
| // Record of target and actual bits spent in current ARF group |
| int rolling_arf_group_target_bits; |
| int rolling_arf_group_actual_bits; |
| |
| int sr_update_lag; |
| |
| int kf_zeromotion_pct; |
| int last_kfgroup_zeromotion_pct; |
| int extend_minq; |
| int extend_maxq; |
| int extend_minq_fast; |
| /*!\endcond */ |
| } TWO_PASS; |
| |
| /*! |
| * \brief Frame level Two pass status and control data. |
| */ |
| typedef struct { |
| /*!\cond */ |
| const FIRSTPASS_STATS *stats_in; |
| // Pointer to the stats of the current frame. |
| const FIRSTPASS_STATS *this_frame; |
| double mb_av_energy; |
| // An indication of the content type of the current frame |
| FRAME_CONTENT_TYPE fr_content_type; |
| double frame_avg_haar_energy; |
| /*!\endcond */ |
| } TWO_PASS_FRAME; |
| |
| /*!\cond */ |
| |
| // This structure contains several key parameters to be accumulated for this |
| // frame. |
| typedef struct { |
| // Intra prediction error. |
| int64_t intra_error; |
| // Average wavelet energy computed using Discrete Wavelet Transform (DWT). |
| int64_t frame_avg_wavelet_energy; |
| // Best of intra pred error and inter pred error using last frame as ref. |
| int64_t coded_error; |
| // Best of intra pred error and inter pred error using golden frame as ref. |
| int64_t sr_coded_error; |
| // Count of motion vector. |
| int mv_count; |
| // Count of blocks that pick inter prediction (inter pred error is smaller |
| // than intra pred error). |
| int inter_count; |
| // Count of blocks that pick second ref (golden frame). |
| int second_ref_count; |
| // Count of blocks where the inter and intra are very close and very low. |
| double neutral_count; |
| // Count of blocks where intra error is very small. |
| int intra_skip_count; |
| // Start row. |
| int image_data_start_row; |
| // Count of unique non-zero motion vectors. |
| int new_mv_count; |
| // Sum of inward motion vectors. |
| int sum_in_vectors; |
| // Sum of motion vector row. |
| int sum_mvr; |
| // Sum of motion vector column. |
| int sum_mvc; |
| // Sum of absolute value of motion vector row. |
| int sum_mvr_abs; |
| // Sum of absolute value of motion vector column. |
| int sum_mvc_abs; |
| // Sum of the square of motion vector row. |
| int64_t sum_mvrs; |
| // Sum of the square of motion vector column. |
| int64_t sum_mvcs; |
| // A factor calculated using intra pred error. |
| double intra_factor; |
| // A factor that measures brightness. |
| double brightness_factor; |
| } FRAME_STATS; |
| |
| // This structure contains first pass data. |
| typedef struct { |
| // Buffer holding frame stats for all MACROBLOCKs. |
| // mb_stats[i] stores the FRAME_STATS of the ith |
| // MB in raster scan order. |
| FRAME_STATS *mb_stats; |
| // Buffer to store the prediction error of the (0,0) motion |
| // vector using the last source frame as the reference. |
| // raw_motion_err_list[i] stores the raw_motion_err of |
| // the ith MB in raster scan order. |
| int *raw_motion_err_list; |
| } FirstPassData; |
| |
| struct AV1_COMP; |
| struct EncodeFrameParams; |
| struct AV1EncoderConfig; |
| struct TileDataEnc; |
| |
| static INLINE int is_fp_wavelet_energy_invalid( |
| const FIRSTPASS_STATS *fp_stats) { |
| assert(fp_stats != NULL); |
| return (fp_stats->frame_avg_wavelet_energy < 0); |
| } |
| |
| static INLINE BLOCK_SIZE get_fp_block_size(int is_screen_content_type) { |
| return (is_screen_content_type ? BLOCK_8X8 : BLOCK_16X16); |
| } |
| |
| int av1_get_unit_rows_in_tile(TileInfo tile, const BLOCK_SIZE fp_block_size); |
| int av1_get_unit_cols_in_tile(TileInfo tile, const BLOCK_SIZE fp_block_size); |
| |
| void av1_rc_get_first_pass_params(struct AV1_COMP *cpi); |
| void av1_first_pass_row(struct AV1_COMP *cpi, struct ThreadData *td, |
| struct TileDataEnc *tile_data, const int mb_row, |
| const BLOCK_SIZE fp_block_size); |
| void av1_end_first_pass(struct AV1_COMP *cpi); |
| |
| void av1_twopass_zero_stats(FIRSTPASS_STATS *section); |
| void av1_accumulate_stats(FIRSTPASS_STATS *section, |
| const FIRSTPASS_STATS *frame); |
| /*!\endcond */ |
| |
| /*!\brief AV1 first pass encoding. |
| * |
| * \ingroup rate_control |
| * This function is the first encoding pass for the two pass encoding mode. |
| * It encodes the whole video and collect essential information. |
| * Two pass encoding is an encoding mode in the reference software (libaom) |
| * of AV1 for high performance encoding. The first pass is a fast encoding |
| * process to collect essential information to help the second pass make |
| * encoding decisions and improve coding quality. The collected stats is used |
| * in rate control, for example, to determine frame cut, the position of |
| * alternative reference frame (ARF), etc. |
| * |
| * \param[in] cpi Top-level encoder structure |
| * \param[in] ts_duration Duration of the frame / collection of frames |
| * |
| * \return Nothing is returned. Instead, the "TWO_PASS" structure inside "cpi" |
| * is modified to store information computed in this function. |
| */ |
| void av1_first_pass(struct AV1_COMP *cpi, const int64_t ts_duration); |
| |
| #ifdef __cplusplus |
| } // extern "C" |
| #endif |
| |
| #endif // AOM_AV1_ENCODER_FIRSTPASS_H_ |