blob: eaae19ea72a7e92fb953076ced014db617b262b0 [file] [log] [blame]
Yaowu Xuc27fc142016-08-22 16:08:15 -07001/*
Yaowu Xu2ab7ff02016-09-02 12:04:54 -07002 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
Yaowu Xuc27fc142016-08-22 16:08:15 -07003 *
Yaowu Xu2ab7ff02016-09-02 12:04:54 -07004 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
Yaowu Xuc27fc142016-08-22 16:08:15 -070010 */
11
James Zerne1cbb132018-08-22 14:10:36 -070012#ifndef AOM_AV1_ENCODER_RD_H_
13#define AOM_AV1_ENCODER_RD_H_
Yaowu Xuc27fc142016-08-22 16:08:15 -070014
15#include <limits.h>
16
Yaowu Xuc27fc142016-08-22 16:08:15 -070017#include "av1/common/blockd.h"
18
19#include "av1/encoder/block.h"
20#include "av1/encoder/context_tree.h"
21#include "av1/encoder/cost.h"
22
23#ifdef __cplusplus
24extern "C" {
25#endif
26
27#define RDDIV_BITS 7
28#define RD_EPB_SHIFT 6
29
Angie Chiange4ea7482018-03-15 11:36:41 -070030#define RDCOST(RM, R, D) \
31 (ROUND_POWER_OF_TWO(((int64_t)(R)) * (RM), AV1_PROB_COST_SHIFT) + \
32 ((D) * (1 << RDDIV_BITS)))
Yaowu Xuc27fc142016-08-22 16:08:15 -070033
sdeng256c4d32019-06-11 12:19:48 -070034#define RDCOST_NEG_R(RM, R, D) \
35 (((D) * (1 << RDDIV_BITS)) - \
36 ROUND_POWER_OF_TWO(((int64_t)(R)) * (RM), AV1_PROB_COST_SHIFT))
37
Urvang Joshi70006e42017-06-14 16:08:55 -070038#define RDCOST_DBL(RM, R, D) \
Yaowu Xuf883b422016-08-30 14:01:10 -070039 (((((double)(R)) * (RM)) / (double)(1 << AV1_PROB_COST_SHIFT)) + \
Urvang Joshi70006e42017-06-14 16:08:55 -070040 ((double)(D) * (1 << RDDIV_BITS)))
Yaowu Xuc27fc142016-08-22 16:08:15 -070041
42#define QIDX_SKIP_THRESH 115
43
44#define MV_COST_WEIGHT 108
45#define MV_COST_WEIGHT_SUB 120
46
Yaowu Xuc27fc142016-08-22 16:08:15 -070047#define RD_THRESH_MAX_FACT 64
48#define RD_THRESH_INC 1
49
Peng Binc7101aa2018-06-22 20:47:05 +080050// Factor to weigh the rate for switchable interp filters.
51#define SWITCHABLE_INTERP_RATE_FACTOR 1
52
Cherma Rajan A628efce2019-09-18 18:55:12 +053053enum {
54 // Default initialization
55 DEFAULT_EVAL = 0,
56 // Initialization for default mode evaluation
57 MODE_EVAL,
58 // Initialization for winner mode evaluation
59 WINNER_MODE_EVAL,
60 // All mode evaluation types
61 MODE_EVAL_TYPES,
62} UENUM1BYTE(MODE_EVAL_TYPE);
63
Yaowu Xuc27fc142016-08-22 16:08:15 -070064typedef struct RD_OPT {
65 // Thresh_mult is used to set a threshold for the rd score. A higher value
66 // means that we will accept the best mode so far more often. This number
67 // is used in combination with the current block size, and thresh_freq_fact
68 // to pick a threshold.
69 int thresh_mult[MAX_MODES];
Yaowu Xuc27fc142016-08-22 16:08:15 -070070
Rupert Swarbrick93c39e92017-07-12 11:11:02 +010071 int threshes[MAX_SEGMENTS][BLOCK_SIZES_ALL][MAX_MODES];
Yaowu Xuc27fc142016-08-22 16:08:15 -070072
Yaowu Xuc27fc142016-08-22 16:08:15 -070073 int RDMULT;
Yue Chen7cae98f2018-08-24 10:43:16 -070074
Debargha Mukherjeed0c0b772019-05-27 23:05:06 -070075 double r0, arf_r0;
Yue Chenbd934232019-08-05 14:23:39 -070076#if !USE_TPL_CLASSIC_MODEL
Debargha Mukherjee88ff7382019-05-01 12:36:10 -070077 double mc_saved_base, mc_count_base;
Yue Chenbd934232019-08-05 14:23:39 -070078#endif // !USE_TPL_CLASSIC_MODEL
Yaowu Xuc27fc142016-08-22 16:08:15 -070079} RD_OPT;
80
Angie Chiang2a2a7dd2017-04-25 16:08:47 -070081static INLINE void av1_init_rd_stats(RD_STATS *rd_stats) {
82#if CONFIG_RD_DEBUG
83 int plane;
84#endif
85 rd_stats->rate = 0;
86 rd_stats->dist = 0;
87 rd_stats->rdcost = 0;
88 rd_stats->sse = 0;
89 rd_stats->skip = 1;
Jingning Han3bce7542017-07-25 10:53:57 -070090 rd_stats->zero_rate = 0;
Angie Chiang2a2a7dd2017-04-25 16:08:47 -070091#if CONFIG_RD_DEBUG
Imdad Sardharwallaaf8e2642018-01-19 11:46:34 +000092 // This may run into problems when monochrome video is
93 // encoded, as there will only be 1 plane
Angie Chiang2a2a7dd2017-04-25 16:08:47 -070094 for (plane = 0; plane < MAX_MB_PLANE; ++plane) {
95 rd_stats->txb_coeff_cost[plane] = 0;
Angie Chiang2a2a7dd2017-04-25 16:08:47 -070096 {
97 int r, c;
98 for (r = 0; r < TXB_COEFF_COST_MAP_SIZE; ++r)
99 for (c = 0; c < TXB_COEFF_COST_MAP_SIZE; ++c)
100 rd_stats->txb_coeff_cost_map[plane][r][c] = 0;
101 }
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700102 }
103#endif
104}
Yaowu Xuc27fc142016-08-22 16:08:15 -0700105
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700106static INLINE void av1_invalid_rd_stats(RD_STATS *rd_stats) {
107#if CONFIG_RD_DEBUG
108 int plane;
109#endif
110 rd_stats->rate = INT_MAX;
111 rd_stats->dist = INT64_MAX;
112 rd_stats->rdcost = INT64_MAX;
113 rd_stats->sse = INT64_MAX;
114 rd_stats->skip = 0;
Jingning Han3bce7542017-07-25 10:53:57 -0700115 rd_stats->zero_rate = 0;
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700116#if CONFIG_RD_DEBUG
Imdad Sardharwallaaf8e2642018-01-19 11:46:34 +0000117 // This may run into problems when monochrome video is
118 // encoded, as there will only be 1 plane
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700119 for (plane = 0; plane < MAX_MB_PLANE; ++plane) {
120 rd_stats->txb_coeff_cost[plane] = INT_MAX;
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700121 {
122 int r, c;
123 for (r = 0; r < TXB_COEFF_COST_MAP_SIZE; ++r)
124 for (c = 0; c < TXB_COEFF_COST_MAP_SIZE; ++c)
Jingning Han46564ea2019-10-28 15:29:54 -0700125 rd_stats->txb_coeff_cost_map[plane][r][c] = INT16_MAX;
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700126 }
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700127 }
128#endif
129}
130
131static INLINE void av1_merge_rd_stats(RD_STATS *rd_stats_dst,
132 const RD_STATS *rd_stats_src) {
Hui Sucd735502019-04-08 11:23:02 -0700133 assert(rd_stats_dst->rate != INT_MAX && rd_stats_src->rate != INT_MAX);
Venkat72481752019-07-01 16:33:49 +0530134 rd_stats_dst->rate = (int)AOMMIN(
135 ((int64_t)rd_stats_dst->rate + (int64_t)rd_stats_src->rate), INT_MAX);
Debargha Mukherjeede80e762017-11-30 13:58:56 -0800136 if (!rd_stats_dst->zero_rate)
137 rd_stats_dst->zero_rate = rd_stats_src->zero_rate;
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700138 rd_stats_dst->dist += rd_stats_src->dist;
139 rd_stats_dst->sse += rd_stats_src->sse;
140 rd_stats_dst->skip &= rd_stats_src->skip;
141#if CONFIG_RD_DEBUG
Imdad Sardharwallaaf8e2642018-01-19 11:46:34 +0000142 // This may run into problems when monochrome video is
143 // encoded, as there will only be 1 plane
Hui Sucd735502019-04-08 11:23:02 -0700144 for (int plane = 0; plane < MAX_MB_PLANE; ++plane) {
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700145 rd_stats_dst->txb_coeff_cost[plane] += rd_stats_src->txb_coeff_cost[plane];
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700146 {
147 // TODO(angiebird): optimize this part
148 int r, c;
149 int ref_txb_coeff_cost = 0;
150 for (r = 0; r < TXB_COEFF_COST_MAP_SIZE; ++r)
151 for (c = 0; c < TXB_COEFF_COST_MAP_SIZE; ++c) {
152 rd_stats_dst->txb_coeff_cost_map[plane][r][c] +=
153 rd_stats_src->txb_coeff_cost_map[plane][r][c];
154 ref_txb_coeff_cost += rd_stats_dst->txb_coeff_cost_map[plane][r][c];
155 }
156 assert(ref_txb_coeff_cost == rd_stats_dst->txb_coeff_cost[plane]);
157 }
Angie Chiang2a2a7dd2017-04-25 16:08:47 -0700158 }
159#endif
160}
Yaowu Xuc27fc142016-08-22 16:08:15 -0700161
Venkatd5d823c2019-06-25 16:48:23 +0530162static INLINE void av1_accumulate_rd_stats(RD_STATS *rd_stats, int64_t dist,
163 int rate, int skip, int64_t sse,
164 int zero_rate) {
165 assert(rd_stats->rate != INT_MAX && rate != INT_MAX);
166 rd_stats->rate += rate;
167 if (!rd_stats->zero_rate) rd_stats->zero_rate = zero_rate;
168 rd_stats->dist += dist;
169 rd_stats->skip &= skip;
170 rd_stats->sse += sse;
171}
172
sdeng256c4d32019-06-11 12:19:48 -0700173static INLINE int64_t av1_calculate_rd_cost(int mult, int rate, int64_t dist) {
174 assert(mult >= 0);
175 if (rate >= 0) {
176 return RDCOST(mult, rate, dist);
177 }
178 return RDCOST_NEG_R(mult, -rate, dist);
179}
180
181static INLINE void av1_rd_cost_update(int mult, RD_STATS *rd_cost) {
sdengafdb8512019-06-12 16:15:56 -0700182 if (rd_cost->rate < INT_MAX && rd_cost->dist < INT64_MAX &&
183 rd_cost->rdcost < INT64_MAX) {
sdeng256c4d32019-06-11 12:19:48 -0700184 rd_cost->rdcost = av1_calculate_rd_cost(mult, rd_cost->rate, rd_cost->dist);
185 } else {
186 av1_invalid_rd_stats(rd_cost);
187 }
188}
189
sdengafdb8512019-06-12 16:15:56 -0700190static INLINE void av1_rd_stats_subtraction(int mult,
191 const RD_STATS *const left,
sdengeff3bb42019-06-11 15:56:04 -0700192 const RD_STATS *const right,
193 RD_STATS *result) {
194 if (left->rate == INT_MAX || right->rate == INT_MAX ||
195 left->dist == INT64_MAX || right->dist == INT64_MAX ||
196 left->rdcost == INT64_MAX || right->rdcost == INT64_MAX) {
197 av1_invalid_rd_stats(result);
198 } else {
199 result->rate = left->rate - right->rate;
200 result->dist = left->dist - right->dist;
sdengafdb8512019-06-12 16:15:56 -0700201 result->rdcost = av1_calculate_rd_cost(mult, result->rate, result->dist);
sdengeff3bb42019-06-11 15:56:04 -0700202 }
203}
204
Yaowu Xuc27fc142016-08-22 16:08:15 -0700205struct TileInfo;
206struct TileDataEnc;
Yaowu Xuf883b422016-08-30 14:01:10 -0700207struct AV1_COMP;
Yaowu Xuc27fc142016-08-22 16:08:15 -0700208struct macroblock;
209
Yaowu Xuea8a6ca2018-11-07 14:53:46 -0800210int av1_compute_rd_mult_based_on_qindex(const struct AV1_COMP *cpi, int qindex);
Ravi Chaudhary95492052018-10-24 11:51:28 +0530211
Yaowu Xuf883b422016-08-30 14:01:10 -0700212int av1_compute_rd_mult(const struct AV1_COMP *cpi, int qindex);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700213
Yaowu Xuf883b422016-08-30 14:01:10 -0700214void av1_initialize_rd_consts(struct AV1_COMP *cpi);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700215
Yaowu Xuf883b422016-08-30 14:01:10 -0700216void av1_initialize_me_consts(const struct AV1_COMP *cpi, MACROBLOCK *x,
217 int qindex);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700218
Yaowu Xuf883b422016-08-30 14:01:10 -0700219void av1_model_rd_from_var_lapndz(int64_t var, unsigned int n,
220 unsigned int qstep, int *rate, int64_t *dist);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700221
Debargha Mukherjee00079832019-01-17 11:28:52 -0800222void av1_model_rd_curvfit(BLOCK_SIZE bsize, double sse_norm, double xqr,
Debargha Mukherjeea7b37312019-01-14 15:15:49 -0800223 double *rate_f, double *distbysse_f);
Debargha Mukherjee00079832019-01-17 11:28:52 -0800224void av1_model_rd_surffit(BLOCK_SIZE bsize, double sse_norm, double xm,
225 double yl, double *rate_f, double *distbysse_f);
Debargha Mukherjee483e2952018-07-25 07:34:26 -0700226
Yue Chenb23d00a2017-07-28 17:01:21 -0700227int av1_get_switchable_rate(const AV1_COMMON *const cm, MACROBLOCK *x,
228 const MACROBLOCKD *xd);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700229
Yaowu Xuf883b422016-08-30 14:01:10 -0700230YV12_BUFFER_CONFIG *av1_get_scaled_ref_frame(const struct AV1_COMP *cpi,
231 int ref_frame);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700232
Yaowu Xuf883b422016-08-30 14:01:10 -0700233void av1_init_me_luts(void);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700234
Yaowu Xu901d6222018-02-21 21:40:48 -0800235void av1_set_mvcost(MACROBLOCK *x, int ref, int ref_mv_idx);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700236
Yunqing Wangef2afb42018-05-01 09:41:00 -0700237void av1_get_entropy_contexts(BLOCK_SIZE bsize,
Yaowu Xuf883b422016-08-30 14:01:10 -0700238 const struct macroblockd_plane *pd,
Wan-Teh Chang660f8ed2018-05-11 17:28:08 -0700239 ENTROPY_CONTEXT t_above[MAX_MIB_SIZE],
240 ENTROPY_CONTEXT t_left[MAX_MIB_SIZE]);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700241
Yaowu Xuf883b422016-08-30 14:01:10 -0700242void av1_set_rd_speed_thresholds(struct AV1_COMP *cpi);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700243
Yaowu Xuf883b422016-08-30 14:01:10 -0700244void av1_update_rd_thresh_fact(const AV1_COMMON *const cm,
245 int (*fact)[MAX_MODES], int rd_thresh, int bsize,
246 int best_mode_index);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700247
Yaowu Xuc27fc142016-08-22 16:08:15 -0700248static INLINE int rd_less_than_thresh(int64_t best_rd, int thresh,
249 int thresh_fact) {
250 return best_rd < ((int64_t)thresh * thresh_fact >> 5) || thresh == INT_MAX;
251}
252
Urvang Joshi52648442016-10-13 17:27:51 -0700253void av1_mv_pred(const struct AV1_COMP *cpi, MACROBLOCK *x,
254 uint8_t *ref_y_buffer, int ref_y_stride, int ref_frame,
255 BLOCK_SIZE block_size);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700256
257static INLINE void set_error_per_bit(MACROBLOCK *x, int rdmult) {
258 x->errorperbit = rdmult >> RD_EPB_SHIFT;
259 x->errorperbit += (x->errorperbit == 0);
260}
261
Ranjit Kumar Tulabandu824f9db2019-07-05 15:16:37 +0530262// Get the threshold for R-D optimization of coefficients depending upon mode
263// decision/winner mode processing
264static INLINE uint32_t get_rd_opt_coeff_thresh(
265 const uint32_t *const coeff_opt_dist_threshold,
266 int enable_winner_mode_for_coeff_opt, int is_winner_mode) {
267 // Default initialization of threshold
Cherma Rajan A628efce2019-09-18 18:55:12 +0530268 uint32_t coeff_opt_thresh = coeff_opt_dist_threshold[DEFAULT_EVAL];
Ranjit Kumar Tulabandu824f9db2019-07-05 15:16:37 +0530269 // TODO(any): Experiment with coeff_opt_dist_threshold values when
270 // enable_winner_mode_for_coeff_opt is ON
271 // TODO(any): Skip the winner mode processing for blocks with lower residual
272 // energy as R-D optimization of coefficients would have been enabled during
273 // mode decision
274 if (enable_winner_mode_for_coeff_opt) {
275 // Use conservative threshold during mode decision and perform R-D
276 // optimization of coeffs always for winner modes
277 if (is_winner_mode)
Cherma Rajan A628efce2019-09-18 18:55:12 +0530278 coeff_opt_thresh = coeff_opt_dist_threshold[WINNER_MODE_EVAL];
Ranjit Kumar Tulabandu824f9db2019-07-05 15:16:37 +0530279 else
Cherma Rajan A628efce2019-09-18 18:55:12 +0530280 coeff_opt_thresh = coeff_opt_dist_threshold[MODE_EVAL];
Ranjit Kumar Tulabandu824f9db2019-07-05 15:16:37 +0530281 }
282 return coeff_opt_thresh;
283}
284
Yaowu Xuf883b422016-08-30 14:01:10 -0700285void av1_setup_pred_block(const MACROBLOCKD *xd,
286 struct buf_2d dst[MAX_MB_PLANE],
287 const YV12_BUFFER_CONFIG *src, int mi_row, int mi_col,
288 const struct scale_factors *scale,
Imdad Sardharwallaaf8e2642018-01-19 11:46:34 +0000289 const struct scale_factors *scale_uv,
290 const int num_planes);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700291
Yaowu Xuf883b422016-08-30 14:01:10 -0700292int av1_get_intra_cost_penalty(int qindex, int qdelta,
293 aom_bit_depth_t bit_depth);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700294
Yue Chenb23d00a2017-07-28 17:01:21 -0700295void av1_fill_mode_rates(AV1_COMMON *const cm, MACROBLOCK *x,
296 FRAME_CONTEXT *fc);
297
Imdad Sardharwallaaf8e2642018-01-19 11:46:34 +0000298void av1_fill_coeff_costs(MACROBLOCK *x, FRAME_CONTEXT *fc,
299 const int num_planes);
Jingning Handfd72322017-08-09 14:04:12 -0700300
Wan-Teh Changec5cb192019-09-16 08:50:06 -0700301void av1_fill_mv_costs(const FRAME_CONTEXT *fc, int integer_mv, int usehp,
Debargha Mukherjee8d273412019-09-11 10:36:50 -0700302 MACROBLOCK *x);
303
Yue Chen7cae98f2018-08-24 10:43:16 -0700304int av1_get_adaptive_rdmult(const struct AV1_COMP *cpi, double beta);
305
Debargha Mukherjeecfcd5ad2019-05-20 20:27:17 -0700306int av1_get_deltaq_offset(const struct AV1_COMP *cpi, int qindex, double beta);
307
Yaowu Xuc27fc142016-08-22 16:08:15 -0700308#ifdef __cplusplus
309} // extern "C"
310#endif
311
James Zerne1cbb132018-08-22 14:10:36 -0700312#endif // AOM_AV1_ENCODER_RD_H_