blob: 5fa8492410a4f4e1e08cc4c3affc18ea936d459c [file] [log] [blame] [edit]
/*
* Copyright (c) 2022, Alliance for Open Media. All rights reserved
*
* This source code is subject to the terms of the BSD 2 Clause License and
* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
* was not distributed with this source code in the LICENSE file, you can
* obtain it at www.aomedia.org/license/software. If the Alliance for Open
* Media Patent License 1.0 was not distributed with this source code in the
* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
*/
#ifndef AOM_AV1_RATECTRL_QMODE_INTERFACE_H_
#define AOM_AV1_RATECTRL_QMODE_INTERFACE_H_
#include <array>
#include <vector>
#include "av1/encoder/firstpass.h"
namespace aom {
constexpr int kBlockRefCount = 2;
constexpr int kRefFrameTableSize = 7;
struct MotionVector {
int row; // subpel row
int col; // subpel col
int subpel_bits; // number of fractional bits used by row/col
};
struct RateControlParam {
int max_gop_show_frame_count;
int min_gop_show_frame_count;
int max_ref_frames;
int base_q_index;
int frame_width;
int frame_height;
};
struct TplBlockStats {
int height; // pixel height
int width; // pixel width
int row; // pixel row of the top left corner
int col; // pixel col of the top lef corner
int64_t intra_cost;
int64_t inter_cost;
std::array<MotionVector, kBlockRefCount> mv;
std::array<int, kBlockRefCount> ref_frame_index;
};
enum class EncodeRefMode {
kRegular,
kOverlay,
kShowExisting,
};
enum class ReferenceName {
kNoneFrame = -1,
kIntraFrame = 0,
kLastFrame = 1,
kLast2Frame = 2,
kLast3Frame = 3,
kGoldenFrame = 4,
kBwdrefFrame = 5,
kAltref2Frame = 6,
kAltrefFrame = 7,
};
struct ReferenceFrame {
int index; // Index of reference slot containing the reference frame
ReferenceName name;
};
struct GopFrame {
// basic info
bool is_valid;
int order_idx; // Index in display order in a GOP
int coding_idx; // Index in coding order in a GOP
int global_order_idx; // Index in display order in the whole video chunk
int global_coding_idx; // Index in coding order in the whole video chunk
bool is_key_frame; // If this is key frame, reset reference buffers are
// required
bool is_arf_frame; // Is this a forward frame, a frame with order_idx
// higher than the current display order
bool is_show_frame; // Is this frame a show frame after coding
bool is_golden_frame; // Is this a high quality frame
// reference frame info
EncodeRefMode encode_ref_mode;
int colocated_ref_idx; // colocated_ref_idx == -1 when encode_ref_mode ==
// EncodeRefMode::kRegular
int update_ref_idx; // The reference index that this frame should be
// updated to. update_ref_idx == -1 when this frame
// will not serve as a reference frame
std::vector<ReferenceFrame>
ref_frame_list; // A list of available reference frames in priority order
// for the current to-be-coded frame. The list size
// should be less or equal to kRefFrameTableSize. The
// reference frames with smaller indices are more likely
// to be a good reference frame. Therefore, they should
// be prioritized when the reference frame count is
// limited. For example, if we plan to use 3 reference
// frames, we should choose ref_frame_list[0],
// ref_frame_list[1] and ref_frame_list[2].
int layer_depth; // Layer depth in the GOP structure
ReferenceFrame primary_ref_frame; // We will use the primary reference frame
// to update current frame's initial
// probability model
};
struct GopStruct {
int show_frame_count;
int global_coding_idx_offset;
int global_order_idx_offset;
std::vector<GopFrame> gop_frame_list;
};
using GopStructList = std::vector<GopStruct>;
struct FrameEncodeParameters {
int q_index;
int rdmult;
};
struct FirstpassInfo {
int num_mbs_16x16; // Count of 16x16 unit blocks in each frame.
// FIRSTPASS_STATS's unit block size is 16x16
std::vector<FIRSTPASS_STATS> stats_list;
};
using RefFrameTable = std::array<GopFrame, kRefFrameTableSize>;
struct GopEncodeInfo {
std::vector<FrameEncodeParameters> param_list;
RefFrameTable final_snapshot; // RefFrameTable snapshot after coding this GOP
};
struct TplFrameStats {
int min_block_size;
int frame_width;
int frame_height;
std::vector<TplBlockStats> block_stats_list;
};
struct TplGopStats {
std::vector<TplFrameStats> frame_stats_list;
};
class AV1RateControlQModeInterface {
public:
AV1RateControlQModeInterface();
virtual ~AV1RateControlQModeInterface();
virtual void SetRcParam(const RateControlParam &rc_param) = 0;
virtual GopStructList DetermineGopInfo(
const FirstpassInfo &firstpass_info) = 0;
// Accept firstpass and tpl info from the encoder and return q index and
// rdmult. This needs to be called with consecutive GOPs as returned by
// DetermineGopInfo.
virtual GopEncodeInfo GetGopEncodeInfo(
const GopStruct &gop_struct, const TplGopStats &tpl_gop_stats,
const RefFrameTable &ref_frame_table_snapshot_init) = 0;
}; // class AV1RateCtrlQMode
} // namespace aom
#endif // AOM_AV1_RATECTRL_QMODE_INTERFACE_H_