blob: 6d8e5c01e15595b72be601de00185bbcbe8056ba [file] [log] [blame]
/*
* Copyright (c) 2016, Alliance for Open Media. All rights reserved
*
* This source code is subject to the terms of the BSD 2 Clause License and
* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
* was not distributed with this source code in the LICENSE file, you can
* obtain it at www.aomedia.org/license/software. If the Alliance for Open
* Media Patent License 1.0 was not distributed with this source code in the
* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
*/
#ifndef AOM_AV1_ENCODER_FIRSTPASS_H_
#define AOM_AV1_ENCODER_FIRSTPASS_H_
#include <stdbool.h>
#include "av1/common/av1_common_int.h"
#include "av1/common/enums.h"
#include "av1/encoder/lookahead.h"
#include "av1/encoder/ratectrl.h"
#ifdef __cplusplus
extern "C" {
#endif
#define DOUBLE_DIVIDE_CHECK(x) ((x) < 0 ? (x)-0.000001 : (x) + 0.000001)
#define MIN_ZERO_MOTION 0.95
#define MAX_SR_CODED_ERROR 40
#define MAX_RAW_ERR_VAR 2000
#define MIN_MV_IN_OUT 0.4
#define VLOW_MOTION_THRESHOLD 950
struct ThreadData;
/*!
* \brief The stucture of acummulated frame stats in the first pass.
*
* Errors (coded_error, intra_error, etc.) and counters (new_mv_count) are
* normalized to each MB. MV related stats (MVc, MVr, etc.) are normalized to
* the frame width and height. See function normalize_firstpass_stats.
*/
typedef struct FIRSTPASS_STATS {
/*!
* Frame number in display order, if stats are for a single frame.
* No real meaning for a collection of frames.
*/
double frame;
/*!
* Weight assigned to this frame (or total weight for the collection of
* frames) currently based on intra factor and brightness factor. This is used
* to distribute bits betweeen easier and harder frames.
*/
double weight;
/*!
* Intra prediction error.
*/
double intra_error;
/*!
* Average wavelet energy computed using Discrete Wavelet Transform (DWT).
*/
double frame_avg_wavelet_energy;
/*!
* Best of intra pred error and inter pred error using last frame as ref.
*/
double coded_error;
/*!
* Best of intra pred error and inter pred error using golden frame as ref.
*/
double sr_coded_error;
/*!
* Percentage of blocks with inter pred error < intra pred error.
*/
double pcnt_inter;
/*!
* Percentage of blocks using (inter prediction and) non-zero motion vectors.
*/
double pcnt_motion;
/*!
* Percentage of blocks where golden frame was better than last or intra:
* inter pred error using golden frame < inter pred error using last frame and
* inter pred error using golden frame < intra pred error
*/
double pcnt_second_ref;
/*!
* Percentage of blocks where intra and inter prediction errors were very
* close. Note that this is a 'weighted count', that is, the so blocks may be
* weighted by how close the two errors were.
*/
double pcnt_neutral;
/*!
* Percentage of blocks that have almost no intra error residual
* (i.e. are in effect completely flat and untextured in the intra
* domain). In natural videos this is uncommon, but it is much more
* common in animations, graphics and screen content, so may be used
* as a signal to detect these types of content.
*/
double intra_skip_pct;
/*!
* Image mask rows top and bottom.
*/
double inactive_zone_rows;
/*!
* Image mask columns at left and right edges.
*/
double inactive_zone_cols;
/*!
* Average of row motion vectors.
*/
double MVr;
/*!
* Mean of absolute value of row motion vectors.
*/
double mvr_abs;
/*!
* Mean of column motion vectors.
*/
double MVc;
/*!
* Mean of absolute value of column motion vectors.
*/
double mvc_abs;
/*!
* Variance of row motion vectors.
*/
double MVrv;
/*!
* Variance of column motion vectors.
*/
double MVcv;
/*!
* Value in range [-1,1] indicating fraction of row and column motion vectors
* that point inwards (negative MV value) or outwards (positive MV value).
* For example, value of 1 indicates, all row/column MVs are inwards.
*/
double mv_in_out_count;
/*!
* Count of unique non-zero motion vectors.
*/
double new_mv_count;
/*!
* Duration of the frame / collection of frames.
*/
double duration;
/*!
* 1.0 if stats are for a single frame, OR
* Number of frames in this collection for which the stats are accumulated.
*/
double count;
/*!
* standard deviation for (0, 0) motion prediction error
*/
double raw_error_stdev;
/*!
* Whether the frame contains a flash
*/
int64_t is_flash;
/*!
* Estimated noise variance
*/
double noise_var;
/*!
* Correlation coefficient with the previous frame
*/
double cor_coeff;
/*!
* log of intra_error
*/
double log_intra_error;
/*!
* log of coded_error
*/
double log_coded_error;
} FIRSTPASS_STATS;
// We want to keep one past stats for key frame detection
// in test_candidate_kf()
#define FIRSTPASS_INFO_STATS_PAST_MIN 1
// The size of static buffer used in FIRSTPASS_INFO.
#define FIRSTPASS_INFO_STATIC_BUF_SIZE \
(MAX_LAP_BUFFERS + FIRSTPASS_INFO_STATS_PAST_MIN)
/*!
* \brief Data structure used for managing first pass stats
*/
typedef struct {
/*!
* A static buffer that will be used when no ext_stats_buf is assigned. The
* ext_stats_buf is assigned through av1_firstpass_info_init() when the user
* already has a pre-existing firstpass stats that is stored in an external
* buffer. The ext_stats_buf is usually used in two pass mode. When using one
* pass mode, we generate "firstpass" stats and encode the video in the same
* pass. In this scenario, the stats will be pushed and popped from
* static_stats_buf.
*/
FIRSTPASS_STATS static_stats_buf[FIRSTPASS_INFO_STATIC_BUF_SIZE];
/*!
* A pointer to first pass stats.
* Note that this buffer will be used as ring buffer.
*/
FIRSTPASS_STATS *stats_buf;
/*!
* size of stats_buf
*/
int stats_buf_size;
/*!
* start index of the available frame stats
* Note that start_index doesn't always point to
* current frame's stats because we need to
* keep past stats as well. To access current
* frame's stats, please use cur_index.
*/
int start_index;
/*!
* count available stats stored in stats_buf
* the following condition should stay true
* stats_count = future_stats_count + past_stats_count
*/
int stats_count;
/*!
* index of the current frame's stats
*/
int cur_index;
/*!
* count available future stats including current stats
*/
int future_stats_count;
/*!
* count available past stats EXCLUDING current stats
*/
int past_stats_count;
/*!
* Accumulation of the stats being pushed into firstpass_info
*/
FIRSTPASS_STATS total_stats;
} FIRSTPASS_INFO;
/*!\brief Init firstpass_info
*
* If using ext_stats_buf, the buffer needs to stay available during encoding
* process.
*
* \ingroup rate_control
* \param[out] firstpass_info struct of firstpass_info.
* \param[in] ext_stats_buf external stats buffer. Pass in NULL if
* choose to use internal static_stats_buf.
* \param[in] ext_stats_buf_size external stats buffer size. Pass in 0 if
* choose to use internal static_stats_buf. \return status
*/
aom_codec_err_t av1_firstpass_info_init(FIRSTPASS_INFO *firstpass_info,
FIRSTPASS_STATS *ext_stats_buf,
int ext_stats_buf_size);
/*!\brief Move cur_index by 1
*
* \ingroup rate_control
* \param[out] firstpass_info struct of firstpass_info.
* \return status
*/
aom_codec_err_t av1_firstpass_info_move_cur_index(
FIRSTPASS_INFO *firstpass_info);
/*!\brief Pop a stats from firstpass_info
*
* \ingroup rate_control
* \param[out] firstpass_info struct of firstpass_info.
* \return status
*/
aom_codec_err_t av1_firstpass_info_pop(FIRSTPASS_INFO *firstpass_info);
/*!\brief Move cur_index by 1 and pop a stats from firstpass_info
*
* \ingroup rate_control
* \param[out] firstpass_info struct of firstpass_info.
* \return status
*/
aom_codec_err_t av1_firstpass_info_move_cur_index_and_pop(
FIRSTPASS_INFO *firstpass_info);
/*!\brief Push a stats into firstpass_info
*
* Note that the input stats will be copied into firstpass_info.
* \ingroup rate_control
* \param[out] firstpass_info struct of firstpass_info.
* \param[in] input_stats input stats
* \return status
*/
aom_codec_err_t av1_firstpass_info_push(FIRSTPASS_INFO *firstpass_info,
const FIRSTPASS_STATS *input_stats);
/*!\brief Peek at a stats from firstpass_info
*
* The target index is as follows.
* (cur_index + offset_from_cur) % firstpass_info->stats_buf_size
*
* \ingroup rate_control
* \param[in] firstpass_info struct of firstpass_info.
* \param[in] offset_from_cur index offset from cur_index.
* \return pointer to the stats. The pointer will be NULL if
* stats_index_offset is invalid.
*/
const FIRSTPASS_STATS *av1_firstpass_info_peek(
const FIRSTPASS_INFO *firstpass_info, int offset_from_cur);
/*!\brief Count the future stats from the target in firstpass_info
* Note that the target stats will be counted as well.
* The target index is as follows.
* (cur_index + offset_from_cur) % firstpass_info->stats_buf_size
*
* \ingroup rate_control
* \param[in] firstpass_info struct of firstpass_info.
* \param[in] offset_from_cur target stats's inffset
* from cur_index.
* \return Number of stats in the future after the target stats
* including itself.
*/
int av1_firstpass_info_future_count(const FIRSTPASS_INFO *firstpass_info,
int offset_from_cur);
/*!\brief Count the past stats before the target in firstpass_info
* Note that the target stats will NOT be counted.
* The target index is as follows.
* (cur_index + offset_from_cur) % firstpass_info->stats_buf_size
*
* \ingroup rate_control
* \param[in] firstpass_info struct of firstpass_info.
* \param[in] offset_from_cur target stats's index offset
* from cur_index.
* \return Number of stats in the past before the target stats
* excluding itself.
*/
int av1_firstpass_info_past_count(const FIRSTPASS_INFO *firstpass_info,
int offset_from_cur);
/*!\cond */
#define FC_ANIMATION_THRESH 0.15
enum {
FC_NORMAL = 0,
FC_GRAPHICS_ANIMATION = 1,
FRAME_CONTENT_TYPES = 2
} UENUM1BYTE(FRAME_CONTENT_TYPE);
/*!\endcond */
/*!
* \brief Data related to the current GF/ARF group and the
* individual frames within the group
*/
typedef struct GF_GROUP {
/*!\cond */
// Frame update type, e.g. ARF/GF/LF/Overlay
FRAME_UPDATE_TYPE update_type[MAX_STATIC_GF_GROUP_LENGTH];
unsigned char arf_src_offset[MAX_STATIC_GF_GROUP_LENGTH];
// The number of frames displayed so far within the GOP at a given coding
// frame.
unsigned char cur_frame_idx[MAX_STATIC_GF_GROUP_LENGTH];
int layer_depth[MAX_STATIC_GF_GROUP_LENGTH];
int arf_boost[MAX_STATIC_GF_GROUP_LENGTH];
int max_layer_depth;
int max_layer_depth_allowed;
// This is currently only populated for AOM_Q mode
int q_val[MAX_STATIC_GF_GROUP_LENGTH];
int rdmult_val[MAX_STATIC_GF_GROUP_LENGTH];
int bit_allocation[MAX_STATIC_GF_GROUP_LENGTH];
// The frame coding type - inter/intra frame
FRAME_TYPE frame_type[MAX_STATIC_GF_GROUP_LENGTH];
// The reference frame buffer control - update or reset
REFBUF_STATE refbuf_state[MAX_STATIC_GF_GROUP_LENGTH];
int arf_index; // the index in the gf group of ARF, if no arf, then -1
int size; // The total length of a GOP
// The offset into lookahead_ctx for choosing
// source of frame parallel encodes.
int src_offset[MAX_STATIC_GF_GROUP_LENGTH];
// Stores the display order hint of each frame in the current GF_GROUP.
int display_idx[MAX_STATIC_GF_GROUP_LENGTH];
// The reference frame list maps the reference frame indexes to its
// buffer index in the decoded buffer. A value of -1 means the
// corresponding reference frame index doesn't point towards any
// previously decoded frame.
int8_t ref_frame_list[MAX_STATIC_GF_GROUP_LENGTH][REF_FRAMES];
// Update frame index
int update_ref_idx[MAX_STATIC_GF_GROUP_LENGTH];
// The map_idx of primary reference
int primary_ref_idx[MAX_STATIC_GF_GROUP_LENGTH];
// Indicates the level of parallelism in frame parallel encodes.
// 0 : frame is independently encoded (not part of parallel encodes).
// 1 : frame is the first in encode order in a given parallel encode set.
// 2 : frame occurs later in encode order in a given parallel encode set.
int frame_parallel_level[MAX_STATIC_GF_GROUP_LENGTH];
// Indicates whether a frame should act as non-reference frame.
bool is_frame_non_ref[MAX_STATIC_GF_GROUP_LENGTH];
// Indicates whether a frame is dropped.
bool is_frame_dropped[MAX_STATIC_GF_GROUP_LENGTH];
// Stores the display order hint of the frames not to be
// refreshed by the current frame.
int skip_frame_refresh[MAX_STATIC_GF_GROUP_LENGTH][REF_FRAMES];
// Stores the display order hint of the frame to be excluded during reference
// assignment.
int skip_frame_as_ref[MAX_STATIC_GF_GROUP_LENGTH];
/*!\endcond */
} GF_GROUP;
/*!\cond */
typedef struct {
// Track if the last frame in a GOP has higher quality.
int arf_gf_boost_lst;
} GF_STATE;
typedef struct {
FIRSTPASS_STATS *stats_in_start;
FIRSTPASS_STATS *stats_in_end;
FIRSTPASS_STATS *stats_in_buf_end;
FIRSTPASS_STATS *total_stats;
FIRSTPASS_STATS *total_left_stats;
} STATS_BUFFER_CTX;
/*!\endcond */
/*!
* \brief Two pass status and control data.
*/
typedef struct {
/*!\cond */
unsigned int section_intra_rating;
// Circular queue of first pass stats stored for most recent frames.
// cpi->output_pkt_list[i].data.twopass_stats.buf points to actual data stored
// here.
FIRSTPASS_STATS *frame_stats_arr[MAX_LAP_BUFFERS + 1];
int frame_stats_next_idx; // Index to next unused element in frame_stats_arr.
STATS_BUFFER_CTX *stats_buf_ctx;
FIRSTPASS_INFO firstpass_info; // This is the first pass data structure
// intended to replace stats_in
int first_pass_done;
int64_t bits_left;
double modified_error_min;
double modified_error_max;
double modified_error_left;
// Projected total bits available for a key frame group of frames
int64_t kf_group_bits;
// Error score of frames still to be coded in kf group
double kf_group_error_left;
// Over time correction for bits per macro block estimation
double bpm_factor;
// Record of target and actual bits spent in current ARF group
int rolling_arf_group_target_bits;
int rolling_arf_group_actual_bits;
int sr_update_lag;
int kf_zeromotion_pct;
int last_kfgroup_zeromotion_pct;
int extend_minq;
int extend_maxq;
int extend_minq_fast;
/*!\endcond */
} TWO_PASS;
/*!
* \brief Frame level Two pass status and control data.
*/
typedef struct {
/*!\cond */
const FIRSTPASS_STATS *stats_in;
// Pointer to the stats of the current frame.
const FIRSTPASS_STATS *this_frame;
double mb_av_energy;
// An indication of the content type of the current frame
FRAME_CONTENT_TYPE fr_content_type;
double frame_avg_haar_energy;
/*!\endcond */
} TWO_PASS_FRAME;
/*!\cond */
// This structure contains several key parameters to be accumulated for this
// frame.
typedef struct {
// Intra prediction error.
int64_t intra_error;
// Average wavelet energy computed using Discrete Wavelet Transform (DWT).
int64_t frame_avg_wavelet_energy;
// Best of intra pred error and inter pred error using last frame as ref.
int64_t coded_error;
// Best of intra pred error and inter pred error using golden frame as ref.
int64_t sr_coded_error;
// Count of motion vector.
int mv_count;
// Count of blocks that pick inter prediction (inter pred error is smaller
// than intra pred error).
int inter_count;
// Count of blocks that pick second ref (golden frame).
int second_ref_count;
// Count of blocks where the inter and intra are very close and very low.
double neutral_count;
// Count of blocks where intra error is very small.
int intra_skip_count;
// Start row.
int image_data_start_row;
// Count of unique non-zero motion vectors.
int new_mv_count;
// Sum of inward motion vectors.
int sum_in_vectors;
// Sum of motion vector row.
int sum_mvr;
// Sum of motion vector column.
int sum_mvc;
// Sum of absolute value of motion vector row.
int sum_mvr_abs;
// Sum of absolute value of motion vector column.
int sum_mvc_abs;
// Sum of the square of motion vector row.
int64_t sum_mvrs;
// Sum of the square of motion vector column.
int64_t sum_mvcs;
// A factor calculated using intra pred error.
double intra_factor;
// A factor that measures brightness.
double brightness_factor;
} FRAME_STATS;
// This structure contains first pass data.
typedef struct {
// Buffer holding frame stats for all MACROBLOCKs.
// mb_stats[i] stores the FRAME_STATS of the ith
// MB in raster scan order.
FRAME_STATS *mb_stats;
// Buffer to store the prediction error of the (0,0) motion
// vector using the last source frame as the reference.
// raw_motion_err_list[i] stores the raw_motion_err of
// the ith MB in raster scan order.
int *raw_motion_err_list;
} FirstPassData;
struct AV1_COMP;
struct EncodeFrameParams;
struct AV1EncoderConfig;
struct TileDataEnc;
static INLINE int is_fp_wavelet_energy_invalid(
const FIRSTPASS_STATS *fp_stats) {
assert(fp_stats != NULL);
return (fp_stats->frame_avg_wavelet_energy < 0);
}
static INLINE BLOCK_SIZE get_fp_block_size(int is_screen_content_type) {
return (is_screen_content_type ? BLOCK_8X8 : BLOCK_16X16);
}
int av1_get_unit_rows_in_tile(const TileInfo *tile,
const BLOCK_SIZE fp_block_size);
int av1_get_unit_cols_in_tile(const TileInfo *tile,
const BLOCK_SIZE fp_block_size);
void av1_first_pass_row(struct AV1_COMP *cpi, struct ThreadData *td,
struct TileDataEnc *tile_data, const int mb_row,
const BLOCK_SIZE fp_block_size);
void av1_end_first_pass(struct AV1_COMP *cpi);
void av1_twopass_zero_stats(FIRSTPASS_STATS *section);
void av1_accumulate_stats(FIRSTPASS_STATS *section,
const FIRSTPASS_STATS *frame);
/*!\endcond */
/*!\brief AV1 first pass encoding.
*
* \ingroup rate_control
* This function is the first encoding pass for the two pass encoding mode.
* It encodes the whole video and collect essential information.
* Two pass encoding is an encoding mode in the reference software (libaom)
* of AV1 for high performance encoding. The first pass is a fast encoding
* process to collect essential information to help the second pass make
* encoding decisions and improve coding quality. The collected stats is used
* in rate control, for example, to determine frame cut, the position of
* alternative reference frame (ARF), etc.
*
* \param[in] cpi Top-level encoder structure
* \param[in] ts_duration Duration of the frame / collection of frames
*
* \remark Nothing is returned. Instead, the "TWO_PASS" structure inside "cpi"
* is modified to store information computed in this function.
*/
void av1_first_pass(struct AV1_COMP *cpi, const int64_t ts_duration);
void av1_noop_first_pass_frame(struct AV1_COMP *cpi, const int64_t ts_duration);
#ifdef __cplusplus
} // extern "C"
#endif
#endif // AOM_AV1_ENCODER_FIRSTPASS_H_