/*
 * Copyright (c) 2021, Alliance for Open Media. All rights reserved
 *
 * This source code is subject to the terms of the BSD 3-Clause Clear License
 * and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear
 * License was not distributed with this source code in the LICENSE file, you
 * can obtain it at aomedia.org/license/software-license/bsd-3-c-c/. If the
 * Alliance for Open Media Patent License 1.0 was not distributed with this
 * source code in the PATENTS file, you can obtain it at
 * aomedia.org/license/patent-license/.
 */

#ifndef AOM_AV1_ENCODER_FIRSTPASS_H_
#define AOM_AV1_ENCODER_FIRSTPASS_H_

#include <stdint.h>

#include "av1/common/av1_common_int.h"
#include "av1/common/enums.h"
#include "av1/encoder/lookahead.h"
#include "av1/encoder/ratectrl.h"

#ifdef __cplusplus
extern "C" {
#endif

/*
 * Nudges x away from zero by 0.000001: subtracts it when x < 0 and adds it
 * otherwise, so the result is never exactly zero and can be used as a divisor.
 * Note: x is evaluated twice, so the argument must be free of side effects.
 */
#define DOUBLE_DIVIDE_CHECK(x) ((x) < 0 ? (x)-0.000001 : (x) + 0.000001)

// Tuning thresholds consumed by code outside this header.
// NOTE(review): units and consumers are not visible from this file; confirm
// against the rate-control sources before changing any of these values.
#define MIN_ZERO_MOTION 0.95
#define MAX_SR_CODED_ERROR 40
#define MAX_RAW_ERR_VAR 2000
#define MIN_MV_IN_OUT 0.4

#define VLOW_MOTION_THRESHOLD 950

// Size of first-pass macroblocks in terms of MIs.
// FP_MIB_SIZE must stay equal to (1 << FP_MIB_SIZE_LOG2).
#define FP_MIB_SIZE 4
#define FP_MIB_SIZE_LOG2 2

/*!
 * \brief The structure of accumulated frame stats in the first pass.
 */
typedef struct {
  /*!
   * Frame number in display order, if stats are for a single frame.
   * No real meaning for a collection of frames.
   */
  double frame;
  /*!
   * Weight assigned to this frame (or total weight for the collection of
   * frames) currently based on intra factor and brightness factor. This is used
   * to distribute bits between easier and harder frames.
   */
  double weight;
  /*!
   * Intra prediction error.
   */
  double intra_error;
  /*!
   * Average wavelet energy computed using Discrete Wavelet Transform (DWT).
   */
  double frame_avg_wavelet_energy;
  /*!
   * Best of intra pred error and inter pred error using last frame as ref.
   */
  double coded_error;
  /*!
   * Best of intra pred error and inter pred error using golden frame as ref.
   */
  double sr_coded_error;
  /*!
   * Best of intra pred error and inter pred error using altref frame as ref.
   */
  double tr_coded_error;
  /*!
   * Percentage of blocks with inter pred error < intra pred error.
   */
  double pcnt_inter;
  /*!
   * Percentage of blocks using (inter prediction and) non-zero motion vectors.
   */
  double pcnt_motion;
  /*!
   * Percentage of blocks where golden frame was better than last or intra:
   * inter pred error using golden frame < inter pred error using last frame and
   * inter pred error using golden frame < intra pred error
   */
  double pcnt_second_ref;
  /*!
   * Percentage of blocks where altref frame was better than intra, last, golden
   */
  double pcnt_third_ref;
  /*!
   * Percentage of blocks where intra and inter prediction errors were very
   * close. Note that this is a 'weighted count', that is, the blocks may be
   * weighted by how close the two errors were.
   */
  double pcnt_neutral;
  /*!
   * Percentage of blocks that have almost no intra error residual
   * (i.e. are in effect completely flat and untextured in the intra
   * domain). In natural videos this is uncommon, but it is much more
   * common in animations, graphics and screen content, so may be used
   * as a signal to detect these types of content.
   */
  double intra_skip_pct;
  /*!
   * Image mask rows top and bottom.
   */
  double inactive_zone_rows;
  /*!
   * Image mask columns at left and right edges.
   */
  double inactive_zone_cols;
  /*!
   * Average of row motion vectors.
   */
  double MVr;
  /*!
   * Mean of absolute value of row motion vectors.
   */
  double mvr_abs;
  /*!
   * Mean of column motion vectors.
   */
  double MVc;
  /*!
   * Mean of absolute value of column motion vectors.
   */
  double mvc_abs;
  /*!
   * Variance of row motion vectors.
   */
  double MVrv;
  /*!
   * Variance of column motion vectors.
   */
  double MVcv;
  /*!
   * Value in range [-1,1] indicating fraction of row and column motion vectors
   * that point inwards (negative MV value) or outwards (positive MV value).
   * For example, value of 1 indicates all row/column MVs are inwards.
   */
  double mv_in_out_count;
  /*!
   * Count of unique non-zero motion vectors.
   */
  double new_mv_count;
  /*!
   * Duration of the frame / collection of frames.
   */
  double duration;
  /*!
   * 1.0 if stats are for a single frame, OR
   * Number of frames in this collection for which the stats are accumulated.
   */
  double count;
  /*!
   * Standard deviation for (0, 0) motion prediction error.
   */
  double raw_error_stdev;
} FIRSTPASS_STATS;

/*!\cond */

// NOTE(review): presumably the cut-off used to classify a frame as
// FC_HIGHMOTION; the consumer is not visible in this header -- confirm.
#define FC_HIGHMOTION_THRESH 0.15
// Content classification of a frame. FRAME_CONTENT_TYPES is the number of
// classes. The type name is introduced through the UENUM1BYTE macro, which is
// defined outside this file.
enum {
  FC_NORMAL = 0,
  FC_HIGHMOTION = 1,
  FRAME_CONTENT_TYPES = 2
} UENUM1BYTE(FRAME_CONTENT_TYPE);

| typedef struct { |
| FIRSTPASS_STATS *stats_in_start; |
| FIRSTPASS_STATS *stats_in_end; |
| FIRSTPASS_STATS *stats_in_buf_end; |
| FIRSTPASS_STATS *total_stats; |
| FIRSTPASS_STATS *total_left_stats; |
| } STATS_BUFFER_CTX; |
| |
| /*!\endcond */ |
| |
| /*! |
| * \brief Two pass status and control data. |
| */ |
| typedef struct { |
| /*!\cond */ |
| unsigned int section_intra_rating; |
| // Circular queue of first pass stats stored for most recent frames. |
| // cpi->output_pkt_list[i].data.twopass_stats.buf points to actual data stored |
| // here. |
| FIRSTPASS_STATS *frame_stats_arr[MAX_LAP_BUFFERS + 1]; |
| int frame_stats_next_idx; // Index to next unused element in frame_stats_arr. |
| const FIRSTPASS_STATS *stats_in; |
| STATS_BUFFER_CTX *stats_buf_ctx; |
| int first_pass_done; |
| int64_t bits_left; |
| double modified_error_min; |
| double modified_error_max; |
| double modified_error_left; |
| double mb_av_energy; |
| double frame_avg_haar_energy; |
| |
| // An indication of the content type of the current frame |
| FRAME_CONTENT_TYPE fr_content_type; |
| |
| // Projected total bits available for a key frame group of frames |
| int64_t kf_group_bits; |
| |
| // Error score of frames still to be coded in kf group |
| int64_t kf_group_error_left; |
| |
| // Over time correction for bits per macro block estimation |
| double bpm_factor; |
| |
| // Record of target and actual bits spent in current ARF group |
| int rolling_arf_group_target_bits; |
| int rolling_arf_group_actual_bits; |
| |
| int sr_update_lag; |
| |
| int kf_zeromotion_pct; |
| int last_kfgroup_zeromotion_pct; |
| int extend_minq; |
| int extend_maxq; |
| int extend_minq_fast; |
| /*!\endcond */ |
| } TWO_PASS; |
| |
/*!\cond */

// This structure contains several key parameters to be accumulated for this
// frame.
typedef struct {
  // Intra prediction error.
  int64_t intra_error;
  // Average wavelet energy computed using Discrete Wavelet Transform (DWT).
  int64_t frame_avg_wavelet_energy;
  // Best of intra pred error and inter pred error using last frame as ref.
  int64_t coded_error;
  // Best of intra pred error and inter pred error using golden frame as ref.
  int64_t sr_coded_error;
  // Best of intra pred error and inter pred error using altref frame as ref.
  int64_t tr_coded_error;
  // Count of motion vectors.
  int mv_count;
  // Count of blocks that pick inter prediction (inter pred error is smaller
  // than intra pred error).
  int inter_count;
  // Count of blocks that pick second ref (golden frame).
  int second_ref_count;
  // Count of blocks that pick third ref (altref frame).
  int third_ref_count;
  // Count of blocks where the inter and intra are very close and very low.
  double neutral_count;
  // Count of blocks where intra error is very small.
  int intra_skip_count;
  // Start row.
  int image_data_start_row;
  // Count of unique non-zero motion vectors.
  int new_mv_count;
  // Sum of inward motion vectors.
  int sum_in_vectors;
  // Sum of motion vector row.
  int sum_mvr;
  // Sum of motion vector column.
  int sum_mvc;
  // Sum of absolute value of motion vector row.
  int sum_mvr_abs;
  // Sum of absolute value of motion vector column.
  int sum_mvc_abs;
  // Sum of the square of motion vector row.
  int64_t sum_mvrs;
  // Sum of the square of motion vector column.
  int64_t sum_mvcs;
  // A factor calculated using intra pred error.
  double intra_factor;
  // A factor that measures brightness.
  double brightness_factor;
} FRAME_STATS;

| // This structure contains first pass data. |
| typedef struct { |
| // Buffer holding frame stats for all MACROBLOCKs. |
| // mb_stats[i] stores the FRAME_STATS of the ith |
| // MB in raster scan order. |
| FRAME_STATS *mb_stats; |
| // Buffer to store the prediction error of the (0,0) motion |
| // vector using the last source frame as the reference. |
| // raw_motion_err_list[i] stores the raw_motion_err of |
| // the ith MB in raster scan order. |
| int *raw_motion_err_list; |
| } FirstPassData; |
| |
// Forward declarations of encoder types that this header only uses through
// pointers. ThreadData is listed explicitly so that the `struct ThreadData *`
// parameter in the prototypes below refers to the file-scope tag rather than
// one scoped to the prototype.
struct AV1_COMP;
struct EncodeFrameParams;
struct AV1EncoderConfig;
struct ThreadData;
struct TileDataEnc;

| int av1_get_mb_rows_in_tile(TileInfo tile); |
| int av1_get_mb_cols_in_tile(TileInfo tile); |
| |
// First-pass entry points that operate on the top-level encoder structure.
// av1_first_pass_row additionally takes per-thread data, per-tile encoder data
// and a macroblock row index.
// NOTE(review): detailed behaviour is defined in the implementation file and
// is not visible here.
void av1_rc_get_first_pass_params(struct AV1_COMP *cpi);
void av1_first_pass_row(struct AV1_COMP *cpi, struct ThreadData *td,
                        struct TileDataEnc *tile_data, int mb_row);
void av1_end_first_pass(struct AV1_COMP *cpi);

| void av1_twopass_zero_stats(FIRSTPASS_STATS *section); |
| void av1_accumulate_stats(FIRSTPASS_STATS *section, |
| const FIRSTPASS_STATS *frame); |
| /*!\endcond */ |
| |
/*!\brief AV1 first pass encoding.
 *
 * \ingroup rate_control
 * This function is the first encoding pass for the two pass encoding mode.
 * It encodes the whole video and collects essential information.
 * Two pass encoding is an encoding mode in the reference software (libaom)
 * of AV1 for high performance encoding. The first pass is a fast encoding
 * process to collect essential information to help the second pass make
 * encoding decisions and improve coding quality. The collected stats are used
 * in rate control, for example, to determine frame cut, the position of
 * alternative reference frame (ARF), etc.
 *
 * \param[in]    cpi            Top-level encoder structure
 * \param[in]    ts_duration    Duration of the frame / collection of frames
 *
 * Nothing is returned. Instead, the "TWO_PASS" structure inside "cpi"
 * is modified to store information computed in this function.
 */
void av1_first_pass(struct AV1_COMP *cpi, const int64_t ts_duration);

#ifdef __cplusplus
}  // extern "C"
#endif

#endif  // AOM_AV1_ENCODER_FIRSTPASS_H_