ext_tile: add 2 tile encoding modes
Added 2 tile encoding modes:
TILE_NORMAL mode supports the large-scale tile coding up to 1024 x 1024
tiles;
TILE_VR mode supports the large-scale tile coding and also the decoding
of a single tile.
TILE_NORMAL mode allows non-VR content to be encoded in multiple tiles
without using the coding tools that are designed for VR applications.
Change-Id: Id804806a1bbcb916b7f5dc7e2c5509d88f3defcb
diff --git a/av1/av1_cx_iface.c b/av1/av1_cx_iface.c
index 4ec146e..6389572 100644
--- a/av1/av1_cx_iface.c
+++ b/av1/av1_cx_iface.c
@@ -75,6 +75,9 @@
#if CONFIG_ANS && ANS_MAX_SYMBOLS
int ans_window_size_log2;
#endif
+#if CONFIG_EXT_TILE
+ unsigned int tile_encoding_mode;
+#endif // CONFIG_EXT_TILE
};
static struct av1_extracfg default_extra_cfg = {
@@ -134,6 +137,9 @@
#if CONFIG_ANS && ANS_MAX_SYMBOLS
23, // ans_window_size_log2
#endif
+#if CONFIG_EXT_TILE
+ 0, // Tile encoding mode is TILE_NORMAL by default.
+#endif // CONFIG_EXT_TILE
};
struct aom_codec_alg_priv {
@@ -270,6 +276,7 @@
if (extra_cfg->tile_rows != UINT_MAX)
RANGE_CHECK(extra_cfg, tile_rows, 1, 64);
}
+ RANGE_CHECK_HI(extra_cfg, tile_encoding_mode, 1);
#else
RANGE_CHECK_HI(extra_cfg, tile_columns, 6);
RANGE_CHECK_HI(extra_cfg, tile_rows, 2);
@@ -520,6 +527,7 @@
#endif // CONFIG_EXT_PARTITION
oxcf->tile_columns = AOMMIN(extra_cfg->tile_columns, max);
oxcf->tile_rows = AOMMIN(extra_cfg->tile_rows, max);
+ oxcf->tile_encoding_mode = extra_cfg->tile_encoding_mode;
}
#else
oxcf->tile_columns = extra_cfg->tile_columns;
@@ -822,6 +830,15 @@
return update_extra_cfg(ctx, &extra_cfg);
}
+#if CONFIG_EXT_TILE
+static aom_codec_err_t ctrl_set_tile_encoding_mode(aom_codec_alg_priv_t *ctx,
+ va_list args) {
+ struct av1_extracfg extra_cfg = ctx->extra_cfg;
+ extra_cfg.tile_encoding_mode = CAST(AV1E_SET_TILE_ENCODING_MODE, args);
+ return update_extra_cfg(ctx, &extra_cfg);
+}
+#endif // CONFIG_EXT_TILE
+
static aom_codec_err_t ctrl_set_aq_mode(aom_codec_alg_priv_t *ctx,
va_list args) {
struct av1_extracfg extra_cfg = ctx->extra_cfg;
@@ -1449,6 +1466,9 @@
#if CONFIG_ANS && ANS_MAX_SYMBOLS
{ AV1E_SET_ANS_WINDOW_SIZE_LOG2, ctrl_set_ans_window_size_log2 },
#endif
+#if CONFIG_EXT_TILE
+ { AV1E_SET_TILE_ENCODING_MODE, ctrl_set_tile_encoding_mode },
+#endif // CONFIG_EXT_TILE
// Getters
{ AOME_GET_LAST_QUANTIZER, ctrl_get_quantizer },
diff --git a/av1/av1_dx_iface.c b/av1/av1_dx_iface.c
index 8cd40a3..f20ea48 100644
--- a/av1/av1_dx_iface.c
+++ b/av1/av1_dx_iface.c
@@ -759,7 +759,8 @@
yuvconfig2image(&ctx->img, &sd, frame_worker_data->user_priv);
#if CONFIG_EXT_TILE
- if (frame_worker_data->pbi->dec_tile_row >= 0) {
+ if (cm->tile_encoding_mode &&
+ frame_worker_data->pbi->dec_tile_row >= 0) {
const int tile_row =
AOMMIN(frame_worker_data->pbi->dec_tile_row, cm->tile_rows - 1);
const int mi_row = tile_row * cm->tile_height;
@@ -774,7 +775,8 @@
AOMMIN(cm->tile_height, cm->mi_rows - mi_row) * MI_SIZE;
}
- if (frame_worker_data->pbi->dec_tile_col >= 0) {
+ if (cm->tile_encoding_mode &&
+ frame_worker_data->pbi->dec_tile_col >= 0) {
const int tile_col =
AOMMIN(frame_worker_data->pbi->dec_tile_col, cm->tile_cols - 1);
const int mi_col = tile_col * cm->tile_width;
diff --git a/av1/common/blockd.h b/av1/common/blockd.h
index eae726c..b2be442 100644
--- a/av1/common/blockd.h
+++ b/av1/common/blockd.h
@@ -861,11 +861,7 @@
#endif // CONFIG_INTRA_INTERP
#endif // CONFIG_EXT_INTRA
-#if CONFIG_EXT_TILE
-#define FIXED_TX_TYPE 1
-#else
#define FIXED_TX_TYPE 0
-#endif
// Converts block_index for given transform size to index of the block in raster
// order.
diff --git a/av1/common/enums.h b/av1/common/enums.h
index b42a326..acfcafd 100644
--- a/av1/common/enums.h
+++ b/av1/common/enums.h
@@ -55,6 +55,9 @@
// Maximum number of tile rows and tile columns
#if CONFIG_EXT_TILE
+#define TILE_NORMAL 0
+#define TILE_VR 1
+
#define MAX_TILE_ROWS 1024
#define MAX_TILE_COLS 1024
#else
diff --git a/av1/common/onyxc_int.h b/av1/common/onyxc_int.h
index 6c28678..5fc92f0 100644
--- a/av1/common/onyxc_int.h
+++ b/av1/common/onyxc_int.h
@@ -356,6 +356,9 @@
#endif // !CONFIG_EXT_TILE
int tile_cols, tile_rows;
int tile_width, tile_height; // In MI units
+#if CONFIG_EXT_TILE
+ unsigned int tile_encoding_mode;
+#endif // CONFIG_EXT_TILE
#if CONFIG_DEPENDENT_HORZTILES
int dependent_horz_tiles;
diff --git a/av1/decoder/decodeframe.c b/av1/decoder/decodeframe.c
index 61fc82f..91b140d 100644
--- a/av1/decoder/decodeframe.c
+++ b/av1/decoder/decodeframe.c
@@ -2934,6 +2934,7 @@
struct aom_read_bit_buffer *const rb) {
AV1_COMMON *const cm = &pbi->common;
#if CONFIG_EXT_TILE
+ cm->tile_encoding_mode = aom_rb_read_literal(rb, 1);
// Read the tile width/height
#if CONFIG_EXT_PARTITION
if (cm->sb_size == BLOCK_128X128) {
@@ -3051,7 +3052,8 @@
const uint8_t **data, aom_decrypt_cb decrypt_cb,
void *decrypt_state,
TileBufferDec (*const tile_buffers)[MAX_TILE_COLS],
- int tile_size_bytes, int col, int row) {
+ int tile_size_bytes, int col, int row,
+ unsigned int tile_encoding_mode) {
size_t size;
size_t copy_size = 0;
@@ -3070,8 +3072,9 @@
size = mem_get_varsize(*data, tile_size_bytes);
}
- // The top bit indicates copy mode
- if ((size >> (tile_size_bytes * 8 - 1)) == 1) {
+ // If cm->tile_encoding_mode = 1 (i.e. TILE_VR), then the top bit of the tile
+ // header indicates copy mode.
+ if (tile_encoding_mode && (size >> (tile_size_bytes * 8 - 1)) == 1) {
// The remaining bits in the top byte signal the row offset
int offset = (size >> (tile_size_bytes - 1) * 8) & 0x7f;
@@ -3167,7 +3170,7 @@
get_tile_buffer(tile_col_data_end[c], &pbi->common.error, &data,
pbi->decrypt_cb, pbi->decrypt_state, tile_buffers,
- tile_size_bytes, c, r);
+ tile_size_bytes, c, r, cm->tile_encoding_mode);
}
}
@@ -3182,7 +3185,7 @@
get_tile_buffer(tile_col_data_end[c], &pbi->common.error, &data,
pbi->decrypt_cb, pbi->decrypt_state, tile_buffers,
- tile_size_bytes, c, r);
+ tile_size_bytes, c, r, cm->tile_encoding_mode);
}
}
}
@@ -3548,7 +3551,9 @@
// after the entire frame is decoded.
#if !CONFIG_VAR_TX && !CONFIG_PARALLEL_DEBLOCKING && !CONFIG_CB4X4
// Loopfilter one tile row.
- if (cm->lf.filter_level && !cm->skip_loop_filter) {
+ // Note: If out-of-order tile decoding is used (for example, inv_row_order
+ // = 1), loop filtering has to be done after all tile rows are decoded.
+ if (!inv_row_order && cm->lf.filter_level && !cm->skip_loop_filter) {
LFWorkerData *const lf_data = (LFWorkerData *)pbi->lf_worker.data1;
const int lf_start = AOMMAX(0, tile_info.mi_row_start - cm->mib_size);
const int lf_end = tile_info.mi_row_end - cm->mib_size;
@@ -4842,6 +4847,17 @@
first_partition_size = read_uncompressed_header(
pbi, init_read_bit_buffer(pbi, &rb, data, data_end, clear_data));
+
+#if CONFIG_EXT_TILE
+ // If cm->tile_encoding_mode == TILE_NORMAL, the independent decoding of a
+ // single tile or a section of a frame is not allowed.
+ if (!cm->tile_encoding_mode &&
+ (pbi->dec_tile_row >= 0 || pbi->dec_tile_col >= 0)) {
+ pbi->dec_tile_row = -1;
+ pbi->dec_tile_col = -1;
+ }
+#endif // CONFIG_EXT_TILE
+
#if CONFIG_TILE_GROUPS
pbi->first_partition_size = first_partition_size;
pbi->uncomp_hdr_size = aom_rb_bytes_read(&rb);
diff --git a/av1/encoder/bitstream.c b/av1/encoder/bitstream.c
index 993ac99..ce518e6 100644
--- a/av1/encoder/bitstream.c
+++ b/av1/encoder/bitstream.c
@@ -3731,6 +3731,8 @@
assert(tile_width > 0);
assert(tile_height > 0);
+ aom_wb_write_literal(wb, cm->tile_encoding_mode, 1);
+
// Write the tile sizes
#if CONFIG_EXT_PARTITION
if (cm->sb_size == BLOCK_128X128) {
@@ -3990,10 +3992,11 @@
// tile header: size of this tile, or copy offset
uint32_t tile_header = tile_size;
- // Check if this tile is a copy tile.
+ // If the tile_encoding_mode is 1 (i.e. TILE_VR), check if this tile is
+ // a copy tile.
// Very low chances to have copy tiles on the key frames, so don't
// search on key frames to reduce unnecessary search.
- if (cm->frame_type != KEY_FRAME) {
+ if (cm->frame_type != KEY_FRAME && cm->tile_encoding_mode) {
const int idendical_tile_offset =
find_identical_tile(tile_row, tile_col, tile_buffers);
diff --git a/av1/encoder/encoder.c b/av1/encoder/encoder.c
index e430ed4..27a6801 100644
--- a/av1/encoder/encoder.c
+++ b/av1/encoder/encoder.c
@@ -4824,6 +4824,10 @@
}
#endif
+#if CONFIG_EXT_TILE
+ cm->tile_encoding_mode = cpi->oxcf.tile_encoding_mode;
+#endif // CONFIG_EXT_TILE
+
#if CONFIG_XIPHRC
if (drop_this_frame) {
av1_rc_postencode_update_drop_frame(cpi);
diff --git a/av1/encoder/encoder.h b/av1/encoder/encoder.h
index 2299f01..76edaa7 100644
--- a/av1/encoder/encoder.h
+++ b/av1/encoder/encoder.h
@@ -267,6 +267,9 @@
#if CONFIG_ANS && ANS_MAX_SYMBOLS
int ans_window_size_log2;
#endif // CONFIG_ANS && ANS_MAX_SYMBOLS
+#if CONFIG_EXT_TILE
+ unsigned int tile_encoding_mode;
+#endif // CONFIG_EXT_TILE
} AV1EncoderConfig;
static INLINE int is_lossless_requested(const AV1EncoderConfig *cfg) {
diff --git a/av1/encoder/picklpf.c b/av1/encoder/picklpf.c
index b925451..fc0ea48 100644
--- a/av1/encoder/picklpf.c
+++ b/av1/encoder/picklpf.c
@@ -206,6 +206,6 @@
// TODO(any): 0 loopfilter level is only necessary if individual tile
// decoding is required. We need to communicate this requirement to this
// code and force loop filter level 0 only if required.
- lf->filter_level = 0;
+ if (cm->tile_encoding_mode) lf->filter_level = 0;
#endif // CONFIG_EXT_TILE
}
diff --git a/av1/encoder/speed_features.c b/av1/encoder/speed_features.c
index bf99c5d..0f9ea75 100644
--- a/av1/encoder/speed_features.c
+++ b/av1/encoder/speed_features.c
@@ -371,11 +371,7 @@
sf->disable_filter_search_var_thresh = 0;
sf->adaptive_interp_filter_search = 0;
sf->allow_partition_search_skip = 0;
-#if CONFIG_EXT_TILE
- sf->use_upsampled_references = 0;
-#else
sf->use_upsampled_references = 1;
-#endif // CONFIG_EXT_TILE
#if CONFIG_EXT_INTER
sf->disable_wedge_search_var_thresh = 0;
sf->fast_wedge_sign_estimate = 0;
@@ -406,12 +402,8 @@
sf->partition_search_breakout_rate_thr = 0;
sf->simple_model_rd_from_var = 0;
-// Set this at the appropriate speed levels
-#if CONFIG_EXT_TILE
- sf->use_transform_domain_distortion = 1;
-#else
+ // Set this at the appropriate speed levels
sf->use_transform_domain_distortion = 0;
-#endif // CONFIG_EXT_TILE
if (oxcf->mode == GOOD
#if CONFIG_XIPHRC