blob: ec654db1151e63c7f62405a1d253682f0125472d [file] [log] [blame]
Ryan Overbecka5fefa72017-09-19 11:39:10 -07001/*
2 * Copyright (c) 2017, Alliance for Open Media. All rights reserved
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
12// Lightfield Encoder
13// ==================
14//
15// This is an example of a simple lightfield encoder. It builds upon the
16// twopass_encoder.c example. It takes an input file in YV12 format,
17// treating it as a planar lightfield instead of a video. The img_width
18// and img_height arguments are the dimensions of the lightfield images,
19// while the lf_width and lf_height arguments are the number of
20// lightfield images in each dimension. The lf_blocksize determines the
21// number of reference images used for MCP. For example, 5 means that there
22// is a reference image for every 5x5 lightfield image block. All images
23// within a block will use the center image in that block as the reference
24// image for MCP.
25// Run "make test" to download lightfield test data: vase10x10.yuv.
26// Run lightfield encoder to encode whole lightfield:
Yunqing Wangd417bb52018-06-03 14:13:38 -070027// examples/lightfield_encoder 1024 1024 vase10x10.yuv vase10x10.ivf 10 10 5
Ryan Overbecka5fefa72017-09-19 11:39:10 -070028
// Note: In bitstream.c and encoder.c, defining EXT_TILE_DEBUG as 1 will print
// out the uncompressed header and the frame contexts, which can be used to
// test the bit exactness of the headers and the frame contexts for large scale
// tile coded frames.
33
Ryan Overbecka5fefa72017-09-19 11:39:10 -070034#include <stdio.h>
35#include <stdlib.h>
36#include <string.h>
37
38#include "aom/aom_encoder.h"
39#include "aom/aomcx.h"
Urvang Joshi6077b182018-08-21 11:49:38 -070040#include "aom_scale/yv12config.h"
Ryan Overbecka5fefa72017-09-19 11:39:10 -070041#include "av1/common/enums.h"
Tom Finegan77902132018-05-21 10:19:15 -070042#include "common/tools_common.h"
43#include "common/video_writer.h"
Ryan Overbecka5fefa72017-09-19 11:39:10 -070044
// Program name shown in the usage message; main() assigns argv[0] to it.
static const char *exec_name;

// Writes the command-line synopsis to stderr and terminates the process with
// EXIT_FAILURE. This function does not return.
void usage_exit(void) {
  FILE *const out = stderr;
  fprintf(out,
          "Usage: %s <img_width> <img_height> <infile> <outfile> "
          "<lf_width> <lf_height> <lf_blocksize>\n",
          exec_name);
  exit(EXIT_FAILURE);
}
54
Yaowu Xu413566e2019-05-17 09:36:48 -070055static int img_size_bytes(aom_image_t *img) {
Ryan Overbecka5fefa72017-09-19 11:39:10 -070056 int image_size_bytes = 0;
57 int plane;
58 for (plane = 0; plane < 3; ++plane) {
Ryan Overbecka5fefa72017-09-19 11:39:10 -070059 const int w = aom_img_plane_width(img, plane) *
60 ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
61 const int h = aom_img_plane_height(img, plane);
Yunqing Wang17d9d432018-05-27 15:08:04 -070062 image_size_bytes += w * h;
Ryan Overbecka5fefa72017-09-19 11:39:10 -070063 }
64 return image_size_bytes;
65}
66
67static int get_frame_stats(aom_codec_ctx_t *ctx, const aom_image_t *img,
68 aom_codec_pts_t pts, unsigned int duration,
Sean DuBois47cc2552018-01-23 07:44:16 +000069 aom_enc_frame_flags_t flags,
Ryan Overbecka5fefa72017-09-19 11:39:10 -070070 aom_fixed_buf_t *stats) {
71 int got_pkts = 0;
72 aom_codec_iter_t iter = NULL;
73 const aom_codec_cx_pkt_t *pkt = NULL;
Sean DuBois47cc2552018-01-23 07:44:16 +000074 const aom_codec_err_t res = aom_codec_encode(ctx, img, pts, duration, flags);
Ryan Overbecka5fefa72017-09-19 11:39:10 -070075 if (res != AOM_CODEC_OK) die_codec(ctx, "Failed to get frame stats.");
76
77 while ((pkt = aom_codec_get_cx_data(ctx, &iter)) != NULL) {
78 got_pkts = 1;
79
Debargha Mukherjee7118f422020-06-29 15:49:06 -070080#if CONFIG_SINGLEPASS
81 (void)stats;
82#else
Ryan Overbecka5fefa72017-09-19 11:39:10 -070083 if (pkt->kind == AOM_CODEC_STATS_PKT) {
84 const uint8_t *const pkt_buf = pkt->data.twopass_stats.buf;
85 const size_t pkt_size = pkt->data.twopass_stats.sz;
86 stats->buf = realloc(stats->buf, stats->sz + pkt_size);
87 memcpy((uint8_t *)stats->buf + stats->sz, pkt_buf, pkt_size);
88 stats->sz += pkt_size;
89 }
Debargha Mukherjee7118f422020-06-29 15:49:06 -070090#endif // !CONFIG_SINGLEPASS
Ryan Overbecka5fefa72017-09-19 11:39:10 -070091 }
92
93 return got_pkts;
94}
95
96static int encode_frame(aom_codec_ctx_t *ctx, const aom_image_t *img,
97 aom_codec_pts_t pts, unsigned int duration,
Yunqing Wangb97cfae2018-05-11 14:19:05 -070098 aom_enc_frame_flags_t flags, AvxVideoWriter *writer) {
Ryan Overbecka5fefa72017-09-19 11:39:10 -070099 int got_pkts = 0;
100 aom_codec_iter_t iter = NULL;
101 const aom_codec_cx_pkt_t *pkt = NULL;
Sean DuBois47cc2552018-01-23 07:44:16 +0000102 const aom_codec_err_t res = aom_codec_encode(ctx, img, pts, duration, flags);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700103 if (res != AOM_CODEC_OK) die_codec(ctx, "Failed to encode frame.");
104
105 while ((pkt = aom_codec_get_cx_data(ctx, &iter)) != NULL) {
106 got_pkts = 1;
107 if (pkt->kind == AOM_CODEC_CX_FRAME_PKT) {
108 const int keyframe = (pkt->data.frame.flags & AOM_FRAME_IS_KEY) != 0;
109
110 if (!aom_video_writer_write_frame(writer, pkt->data.frame.buf,
111 pkt->data.frame.sz,
112 pkt->data.frame.pts))
113 die_codec(ctx, "Failed to write compressed frame.");
114 printf(keyframe ? "K" : ".");
115 fflush(stdout);
116 }
117 }
118
119 return got_pkts;
120}
121
Yunqing Wang17d9d432018-05-27 15:08:04 -0700122static void get_raw_image(aom_image_t **frame_to_encode, aom_image_t *raw,
123 aom_image_t *raw_shift) {
Jerome Jiang5fad3fb2019-08-14 10:16:12 -0700124 if (FORCE_HIGHBITDEPTH_DECODING) {
Yunqing Wang17d9d432018-05-27 15:08:04 -0700125 // Need to allocate larger buffer to use hbd internal.
126 int input_shift = 0;
127 aom_img_upshift(raw_shift, raw, input_shift);
128 *frame_to_encode = raw_shift;
129 } else {
130 *frame_to_encode = raw;
131 }
132}
133
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700134static aom_fixed_buf_t pass0(aom_image_t *raw, FILE *infile,
Elliott Karpilovsky67e84d42020-04-26 16:03:39 -0700135 aom_codec_iface_t *encoder,
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700136 const aom_codec_enc_cfg_t *cfg, int lf_width,
Yunqing Wang17d9d432018-05-27 15:08:04 -0700137 int lf_height, int lf_blocksize, int flags,
138 aom_image_t *raw_shift) {
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700139 aom_codec_ctx_t codec;
140 int frame_count = 0;
Yaowu Xu413566e2019-05-17 09:36:48 -0700141 int image_size_bytes = img_size_bytes(raw);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700142 int u_blocks, v_blocks;
143 int bu, bv;
144 aom_fixed_buf_t stats = { NULL, 0 };
Yunqing Wang17d9d432018-05-27 15:08:04 -0700145 aom_image_t *frame_to_encode;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700146
Elliott Karpilovskycbe219b2020-04-22 16:21:06 -0700147 if (aom_codec_enc_init(&codec, encoder, cfg, flags))
James Zerndad374f2020-05-06 19:13:19 -0700148 die("Failed to initialize encoder");
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700149 if (aom_codec_control(&codec, AOME_SET_ENABLEAUTOALTREF, 0))
150 die_codec(&codec, "Failed to turn off auto altref");
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800151 if (aom_codec_control(&codec, AV1E_SET_FRAME_PARALLEL_DECODING, 0))
152 die_codec(&codec, "Failed to set frame parallel decoding");
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700153
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700154 // How many reference images we need to encode.
155 u_blocks = (lf_width + lf_blocksize - 1) / lf_blocksize;
156 v_blocks = (lf_height + lf_blocksize - 1) / lf_blocksize;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700157
158 printf("\n First pass: ");
159
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700160 for (bv = 0; bv < v_blocks; ++bv) {
161 for (bu = 0; bu < u_blocks; ++bu) {
162 const int block_u_min = bu * lf_blocksize;
163 const int block_v_min = bv * lf_blocksize;
164 int block_u_end = (bu + 1) * lf_blocksize;
165 int block_v_end = (bv + 1) * lf_blocksize;
166 int u_block_size, v_block_size;
167 int block_ref_u, block_ref_v;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700168
169 block_u_end = block_u_end < lf_width ? block_u_end : lf_width;
170 block_v_end = block_v_end < lf_height ? block_v_end : lf_height;
171 u_block_size = block_u_end - block_u_min;
172 v_block_size = block_v_end - block_v_min;
173 block_ref_u = block_u_min + u_block_size / 2;
174 block_ref_v = block_v_min + v_block_size / 2;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700175
176 printf("A%d, ", (block_ref_u + block_ref_v * lf_width));
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700177 fseek(infile, (block_ref_u + block_ref_v * lf_width) * image_size_bytes,
178 SEEK_SET);
179 aom_img_read(raw, infile);
Yunqing Wang17d9d432018-05-27 15:08:04 -0700180 get_raw_image(&frame_to_encode, raw, raw_shift);
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800181
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700182 // Reference frames can be encoded encoded without tiles.
183 ++frame_count;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700184 get_frame_stats(&codec, frame_to_encode, frame_count, 1,
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800185 AOM_EFLAG_NO_REF_LAST2 | AOM_EFLAG_NO_REF_LAST3 |
186 AOM_EFLAG_NO_REF_GF | AOM_EFLAG_NO_REF_ARF |
187 AOM_EFLAG_NO_REF_BWD | AOM_EFLAG_NO_REF_ARF2 |
188 AOM_EFLAG_NO_UPD_LAST | AOM_EFLAG_NO_UPD_GF |
189 AOM_EFLAG_NO_UPD_ARF,
Sean DuBois47cc2552018-01-23 07:44:16 +0000190 &stats);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700191 }
192 }
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800193
194 if (aom_codec_control(&codec, AV1E_SET_FRAME_PARALLEL_DECODING, 1))
195 die_codec(&codec, "Failed to set frame parallel decoding");
196
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700197 for (bv = 0; bv < v_blocks; ++bv) {
198 for (bu = 0; bu < u_blocks; ++bu) {
199 const int block_u_min = bu * lf_blocksize;
200 const int block_v_min = bv * lf_blocksize;
201 int block_u_end = (bu + 1) * lf_blocksize;
202 int block_v_end = (bv + 1) * lf_blocksize;
203 int u, v;
204 block_u_end = block_u_end < lf_width ? block_u_end : lf_width;
205 block_v_end = block_v_end < lf_height ? block_v_end : lf_height;
206 for (v = block_v_min; v < block_v_end; ++v) {
207 for (u = block_u_min; u < block_u_end; ++u) {
Yunqing Wang17d9d432018-05-27 15:08:04 -0700208 printf("C%d, ", (u + v * lf_width));
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700209 fseek(infile, (u + v * lf_width) * image_size_bytes, SEEK_SET);
210 aom_img_read(raw, infile);
Yunqing Wang17d9d432018-05-27 15:08:04 -0700211 get_raw_image(&frame_to_encode, raw, raw_shift);
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800212
Yunqing Wang17d9d432018-05-27 15:08:04 -0700213 ++frame_count;
214 get_frame_stats(&codec, frame_to_encode, frame_count, 1,
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800215 AOM_EFLAG_NO_REF_LAST2 | AOM_EFLAG_NO_REF_LAST3 |
216 AOM_EFLAG_NO_REF_GF | AOM_EFLAG_NO_REF_ARF |
217 AOM_EFLAG_NO_REF_BWD | AOM_EFLAG_NO_REF_ARF2 |
218 AOM_EFLAG_NO_UPD_LAST | AOM_EFLAG_NO_UPD_GF |
219 AOM_EFLAG_NO_UPD_ARF | AOM_EFLAG_NO_UPD_ENTROPY,
Sean DuBois47cc2552018-01-23 07:44:16 +0000220 &stats);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700221 }
222 }
223 }
224 }
225 // Flush encoder.
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800226 // No ARF, this should not be needed.
Sean DuBois47cc2552018-01-23 07:44:16 +0000227 while (get_frame_stats(&codec, NULL, frame_count, 1, 0, &stats)) {
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700228 }
229
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700230 if (aom_codec_destroy(&codec)) die_codec(&codec, "Failed to destroy codec.");
231
Yunqing Wang17d9d432018-05-27 15:08:04 -0700232 printf("\nFirst pass complete. Processed %d frames.\n", frame_count);
233
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700234 return stats;
235}
236
237static void pass1(aom_image_t *raw, FILE *infile, const char *outfile_name,
Elliott Karpilovsky67e84d42020-04-26 16:03:39 -0700238 aom_codec_iface_t *encoder, aom_codec_enc_cfg_t *cfg,
Yunqing Wang17d9d432018-05-27 15:08:04 -0700239 int lf_width, int lf_height, int lf_blocksize, int flags,
240 aom_image_t *raw_shift) {
Elliott Karpilovskycbe219b2020-04-22 16:21:06 -0700241 AvxVideoInfo info = { get_fourcc_by_aom_encoder(encoder),
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700242 cfg->g_w,
243 cfg->g_h,
Jonathan Matthewsa6e4f962018-07-13 16:01:28 +0100244 { cfg->g_timebase.num, cfg->g_timebase.den },
245 0 };
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700246 AvxVideoWriter *writer = NULL;
247 aom_codec_ctx_t codec;
248 int frame_count = 0;
Yaowu Xu413566e2019-05-17 09:36:48 -0700249 int image_size_bytes = img_size_bytes(raw);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700250 int bu, bv;
251 int u_blocks, v_blocks;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700252 aom_image_t *frame_to_encode;
Yunqing Wang93b18f32018-06-08 21:08:29 -0700253 aom_image_t reference_images[MAX_EXTERNAL_REFERENCES];
Yunqing Wang17d9d432018-05-27 15:08:04 -0700254 int reference_image_num = 0;
255 int i;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700256
257 writer = aom_video_writer_open(outfile_name, kContainerIVF, &info);
258 if (!writer) die("Failed to open %s for writing", outfile_name);
259
Elliott Karpilovskycbe219b2020-04-22 16:21:06 -0700260 if (aom_codec_enc_init(&codec, encoder, cfg, flags))
James Zerndad374f2020-05-06 19:13:19 -0700261 die("Failed to initialize encoder");
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700262 if (aom_codec_control(&codec, AOME_SET_ENABLEAUTOALTREF, 0))
263 die_codec(&codec, "Failed to turn off auto altref");
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800264 if (aom_codec_control(&codec, AV1E_SET_FRAME_PARALLEL_DECODING, 0))
265 die_codec(&codec, "Failed to set frame parallel decoding");
Yunqing Wangd8fd9e72019-12-26 15:36:31 -0800266 if (aom_codec_control(&codec, AV1E_ENABLE_EXT_TILE_DEBUG, 1))
267 die_codec(&codec, "Failed to enable encoder ext_tile debug");
Yaowu Xu8d9fecb2020-04-27 15:21:02 -0700268 if (aom_codec_control(&codec, AOME_SET_CPUUSED, 3))
Yunqing Wangd8fd9e72019-12-26 15:36:31 -0800269 die_codec(&codec, "Failed to set cpu-used");
Yunqing Wangd0f0d3b2019-12-23 12:15:44 -0800270
Yunqing Wange3de2d82018-05-15 13:43:41 -0700271 // Note: The superblock is a sequence parameter and has to be the same for 1
272 // sequence. In lightfield application, must choose the superblock size(either
273 // 64x64 or 128x128) before the encoding starts. Otherwise, the default is
274 // AOM_SUPERBLOCK_SIZE_DYNAMIC, and the superblock size will be set to 64x64
275 // internally.
276 if (aom_codec_control(&codec, AV1E_SET_SUPERBLOCK_SIZE,
277 AOM_SUPERBLOCK_SIZE_64X64))
278 die_codec(&codec, "Failed to set SB size");
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700279
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700280 u_blocks = (lf_width + lf_blocksize - 1) / lf_blocksize;
281 v_blocks = (lf_height + lf_blocksize - 1) / lf_blocksize;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700282
283 reference_image_num = u_blocks * v_blocks;
Sarah Parker9feb1582019-04-25 12:29:52 -0700284 // Set the max gf group length so the references are guaranteed to be in
285 // a different gf group than any of the regular frames. This avoids using
Sarah Parker48b46b42019-04-23 20:43:02 -0700286 // both vbr and constant quality mode in a single group. The number of
287 // references now cannot surpass 17 because of the enforced MAX_GF_INTERVAL of
288 // 16. If it is necessary to exceed this reference frame limit, one will have
289 // to do some additional handling to ensure references are in separate gf
290 // groups from the regular frames.
291 if (aom_codec_control(&codec, AV1E_SET_MAX_GF_INTERVAL,
292 reference_image_num - 1))
293 die_codec(&codec, "Failed to set max gf interval");
Yunqing Wang17d9d432018-05-27 15:08:04 -0700294 aom_img_fmt_t ref_fmt = AOM_IMG_FMT_I420;
Jerome Jiang5fad3fb2019-08-14 10:16:12 -0700295 if (FORCE_HIGHBITDEPTH_DECODING) ref_fmt |= AOM_IMG_FMT_HIGHBITDEPTH;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700296 // Allocate memory with the border so that it can be used as a reference.
Satish Kumar Suman29909962019-01-09 10:31:21 +0530297 int border_in_pixels =
298 (codec.config.enc->rc_resize_mode || codec.config.enc->rc_superres_mode)
299 ? AOM_BORDER_IN_PIXELS
300 : AOM_ENC_NO_SCALE_BORDER;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700301 for (i = 0; i < reference_image_num; i++) {
302 if (!aom_img_alloc_with_border(&reference_images[i], ref_fmt, cfg->g_w,
Satish Kumar Suman29909962019-01-09 10:31:21 +0530303 cfg->g_h, 32, 8, border_in_pixels)) {
Yunqing Wang17d9d432018-05-27 15:08:04 -0700304 die("Failed to allocate image.");
305 }
306 }
307
308 printf("\n Second pass: ");
309
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700310 // Encode reference images first.
311 printf("Encoding Reference Images\n");
312 for (bv = 0; bv < v_blocks; ++bv) {
313 for (bu = 0; bu < u_blocks; ++bu) {
314 const int block_u_min = bu * lf_blocksize;
315 const int block_v_min = bv * lf_blocksize;
316 int block_u_end = (bu + 1) * lf_blocksize;
317 int block_v_end = (bv + 1) * lf_blocksize;
318 int u_block_size, v_block_size;
319 int block_ref_u, block_ref_v;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700320
321 block_u_end = block_u_end < lf_width ? block_u_end : lf_width;
322 block_v_end = block_v_end < lf_height ? block_v_end : lf_height;
323 u_block_size = block_u_end - block_u_min;
324 v_block_size = block_v_end - block_v_min;
325 block_ref_u = block_u_min + u_block_size / 2;
326 block_ref_v = block_v_min + v_block_size / 2;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700327
328 printf("A%d, ", (block_ref_u + block_ref_v * lf_width));
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700329 fseek(infile, (block_ref_u + block_ref_v * lf_width) * image_size_bytes,
330 SEEK_SET);
331 aom_img_read(raw, infile);
Yunqing Wang17d9d432018-05-27 15:08:04 -0700332
333 get_raw_image(&frame_to_encode, raw, raw_shift);
334
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700335 // Reference frames may be encoded without tiles.
336 ++frame_count;
337 printf("Encoding reference image %d of %d\n", bv * u_blocks + bu,
338 u_blocks * v_blocks);
Yunqing Wang17d9d432018-05-27 15:08:04 -0700339 encode_frame(&codec, frame_to_encode, frame_count, 1,
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800340 AOM_EFLAG_NO_REF_LAST2 | AOM_EFLAG_NO_REF_LAST3 |
341 AOM_EFLAG_NO_REF_GF | AOM_EFLAG_NO_REF_ARF |
342 AOM_EFLAG_NO_REF_BWD | AOM_EFLAG_NO_REF_ARF2 |
343 AOM_EFLAG_NO_UPD_LAST | AOM_EFLAG_NO_UPD_GF |
344 AOM_EFLAG_NO_UPD_ARF | AOM_EFLAG_NO_UPD_ENTROPY,
Sean DuBois47cc2552018-01-23 07:44:16 +0000345 writer);
Yunqing Wang17d9d432018-05-27 15:08:04 -0700346
Yunqing Wang946ec2b2018-06-06 12:34:23 -0700347 if (aom_codec_control(&codec, AV1_COPY_NEW_FRAME_IMAGE,
Yunqing Wang17d9d432018-05-27 15:08:04 -0700348 &reference_images[frame_count - 1]))
Yunqing Wang946ec2b2018-06-06 12:34:23 -0700349 die_codec(&codec, "Failed to copy decoder reference frame");
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700350 }
351 }
352
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800353 cfg->large_scale_tile = 1;
354 // Fixed q encoding for camera frames.
355 cfg->rc_end_usage = AOM_Q;
356 if (aom_codec_enc_config_set(&codec, cfg))
357 die_codec(&codec, "Failed to configure encoder");
358
359 // The fixed q value used in encoding.
Urvang Joshi3d3535b2020-07-14 11:01:30 -0700360 if (aom_codec_control(&codec, AOME_SET_QP, 36))
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800361 die_codec(&codec, "Failed to set cq level");
362 if (aom_codec_control(&codec, AV1E_SET_FRAME_PARALLEL_DECODING, 1))
363 die_codec(&codec, "Failed to set frame parallel decoding");
364 if (aom_codec_control(&codec, AV1E_SET_SINGLE_TILE_DECODING, 1))
365 die_codec(&codec, "Failed to turn on single tile decoding");
Yunqing Wang75e20e82018-06-16 12:10:48 -0700366 // Set tile_columns and tile_rows to MAX values, which guarantees the tile
367 // size of 64 x 64 pixels(i.e. 1 SB) for <= 4k resolution.
368 if (aom_codec_control(&codec, AV1E_SET_TILE_COLUMNS, 6))
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800369 die_codec(&codec, "Failed to set tile width");
Yunqing Wang75e20e82018-06-16 12:10:48 -0700370 if (aom_codec_control(&codec, AV1E_SET_TILE_ROWS, 6))
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800371 die_codec(&codec, "Failed to set tile height");
372
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700373 for (bv = 0; bv < v_blocks; ++bv) {
374 for (bu = 0; bu < u_blocks; ++bu) {
375 const int block_u_min = bu * lf_blocksize;
376 const int block_v_min = bv * lf_blocksize;
377 int block_u_end = (bu + 1) * lf_blocksize;
378 int block_v_end = (bv + 1) * lf_blocksize;
379 int u, v;
380 block_u_end = block_u_end < lf_width ? block_u_end : lf_width;
381 block_v_end = block_v_end < lf_height ? block_v_end : lf_height;
382 for (v = block_v_min; v < block_v_end; ++v) {
383 for (u = block_u_min; u < block_u_end; ++u) {
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700384 av1_ref_frame_t ref;
385 ref.idx = 0;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700386 ref.use_external_ref = 1;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700387 ref.img = reference_images[bv * u_blocks + bu];
388 if (aom_codec_control(&codec, AV1_SET_REFERENCE, &ref))
389 die_codec(&codec, "Failed to set reference frame");
Yunqing Wang17d9d432018-05-27 15:08:04 -0700390
391 printf("C%d, ", (u + v * lf_width));
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700392 fseek(infile, (u + v * lf_width) * image_size_bytes, SEEK_SET);
393 aom_img_read(raw, infile);
Yunqing Wang17d9d432018-05-27 15:08:04 -0700394 get_raw_image(&frame_to_encode, raw, raw_shift);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700395
Yunqing Wang17d9d432018-05-27 15:08:04 -0700396 ++frame_count;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700397 printf("Encoding image %d of %d\n",
398 frame_count - (u_blocks * v_blocks), lf_width * lf_height);
Yunqing Wang17d9d432018-05-27 15:08:04 -0700399 encode_frame(&codec, frame_to_encode, frame_count, 1,
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800400 AOM_EFLAG_NO_REF_LAST2 | AOM_EFLAG_NO_REF_LAST3 |
401 AOM_EFLAG_NO_REF_GF | AOM_EFLAG_NO_REF_ARF |
402 AOM_EFLAG_NO_REF_BWD | AOM_EFLAG_NO_REF_ARF2 |
403 AOM_EFLAG_NO_UPD_LAST | AOM_EFLAG_NO_UPD_GF |
404 AOM_EFLAG_NO_UPD_ARF | AOM_EFLAG_NO_UPD_ENTROPY,
Sean DuBois47cc2552018-01-23 07:44:16 +0000405 writer);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700406 }
407 }
408 }
409 }
410
411 // Flush encoder.
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800412 // No ARF, this should not be needed.
Sean DuBois47cc2552018-01-23 07:44:16 +0000413 while (encode_frame(&codec, NULL, -1, 1, 0, writer)) {
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700414 }
415
Yunqing Wang17d9d432018-05-27 15:08:04 -0700416 for (i = 0; i < reference_image_num; i++) aom_img_free(&reference_images[i]);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700417
Yunqing Wang17d9d432018-05-27 15:08:04 -0700418 if (aom_codec_destroy(&codec)) die_codec(&codec, "Failed to destroy codec.");
Yunqing Wang3ae70c92019-01-25 17:34:07 -0800419
420 // Modify large_scale_file fourcc.
421 if (cfg->large_scale_tile == 1)
422 aom_video_writer_set_fourcc(writer, LST_FOURCC);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700423 aom_video_writer_close(writer);
424
Yunqing Wang17d9d432018-05-27 15:08:04 -0700425 printf("\nSecond pass complete. Processed %d frames.\n", frame_count);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700426}
427
428int main(int argc, char **argv) {
429 FILE *infile = NULL;
430 int w, h;
431 // The number of lightfield images in the u and v dimensions.
432 int lf_width, lf_height;
433 // Defines how many images refer to the same reference image for MCP.
434 // lf_blocksize X lf_blocksize images will all use the reference image
435 // in the middle of the block of images.
436 int lf_blocksize;
437 aom_codec_ctx_t codec;
438 aom_codec_enc_cfg_t cfg;
439 aom_image_t raw;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700440 aom_image_t raw_shift;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700441 aom_codec_err_t res;
442 aom_fixed_buf_t stats;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700443 int flags = 0;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700444
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700445 const int fps = 30;
446 const int bitrate = 200; // kbit/s
447 const char *const width_arg = argv[1];
448 const char *const height_arg = argv[2];
449 const char *const infile_arg = argv[3];
450 const char *const outfile_arg = argv[4];
451 const char *const lf_width_arg = argv[5];
452 const char *const lf_height_arg = argv[6];
453 const char *lf_blocksize_arg = argv[7];
454 exec_name = argv[0];
455
456 if (argc < 8) die("Invalid number of arguments");
457
Elliott Karpilovskycbe219b2020-04-22 16:21:06 -0700458 aom_codec_iface_t *encoder = get_aom_encoder_by_short_name("av1");
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700459 if (!encoder) die("Unsupported codec.");
460
461 w = (int)strtol(width_arg, NULL, 0);
462 h = (int)strtol(height_arg, NULL, 0);
463 lf_width = (int)strtol(lf_width_arg, NULL, 0);
464 lf_height = (int)strtol(lf_height_arg, NULL, 0);
465 lf_blocksize = (int)strtol(lf_blocksize_arg, NULL, 0);
466 lf_blocksize = lf_blocksize < lf_width ? lf_blocksize : lf_width;
467 lf_blocksize = lf_blocksize < lf_height ? lf_blocksize : lf_height;
468
469 if (w <= 0 || h <= 0 || (w % 2) != 0 || (h % 2) != 0)
470 die("Invalid frame size: %dx%d", w, h);
471 if (lf_width <= 0 || lf_height <= 0)
472 die("Invalid lf_width and/or lf_height: %dx%d", lf_width, lf_height);
473 if (lf_blocksize <= 0) die("Invalid lf_blocksize: %d", lf_blocksize);
474
Yunqing Wang17d9d432018-05-27 15:08:04 -0700475 if (!aom_img_alloc(&raw, AOM_IMG_FMT_I420, w, h, 32)) {
476 die("Failed to allocate image.");
477 }
Jerome Jiang5fad3fb2019-08-14 10:16:12 -0700478 if (FORCE_HIGHBITDEPTH_DECODING) {
Yunqing Wang17d9d432018-05-27 15:08:04 -0700479 // Need to allocate larger buffer to use hbd internal.
480 aom_img_alloc(&raw_shift, AOM_IMG_FMT_I420 | AOM_IMG_FMT_HIGHBITDEPTH, w, h,
481 32);
482 }
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700483
Elliott Karpilovskycbe219b2020-04-22 16:21:06 -0700484 printf("Using %s\n", aom_codec_iface_name(encoder));
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700485
486 // Configuration
Elliott Karpilovskycbe219b2020-04-22 16:21:06 -0700487 res = aom_codec_enc_config_default(encoder, &cfg, 0);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700488 if (res) die_codec(&codec, "Failed to get default codec config.");
489
490 cfg.g_w = w;
491 cfg.g_h = h;
492 cfg.g_timebase.num = 1;
493 cfg.g_timebase.den = fps;
494 cfg.rc_target_bitrate = bitrate;
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800495 cfg.g_error_resilient = 0; // This is required.
496 cfg.g_lag_in_frames = 0; // need to set this since default is 19.
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700497 cfg.kf_mode = AOM_KF_DISABLED;
Yunqing Wangb041d8a2017-11-15 12:31:18 -0800498 cfg.large_scale_tile = 0; // Only set it to 1 for camera frame encoding.
Yunqing Wang17d9d432018-05-27 15:08:04 -0700499 cfg.g_bit_depth = AOM_BITS_8;
Jerome Jiang5fad3fb2019-08-14 10:16:12 -0700500 flags |= (cfg.g_bit_depth > AOM_BITS_8 || FORCE_HIGHBITDEPTH_DECODING)
Yunqing Wang17d9d432018-05-27 15:08:04 -0700501 ? AOM_CODEC_USE_HIGHBITDEPTH
502 : 0;
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700503
504 if (!(infile = fopen(infile_arg, "rb")))
505 die("Failed to open %s for reading", infile_arg);
506
507 // Pass 0
508 cfg.g_pass = AOM_RC_FIRST_PASS;
Yunqing Wang17d9d432018-05-27 15:08:04 -0700509 stats = pass0(&raw, infile, encoder, &cfg, lf_width, lf_height, lf_blocksize,
510 flags, &raw_shift);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700511
512 // Pass 1
513 rewind(infile);
514 cfg.g_pass = AOM_RC_LAST_PASS;
515 cfg.rc_twopass_stats_in = stats;
516 pass1(&raw, infile, outfile_arg, encoder, &cfg, lf_width, lf_height,
Yunqing Wang17d9d432018-05-27 15:08:04 -0700517 lf_blocksize, flags, &raw_shift);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700518 free(stats.buf);
519
Jerome Jiang5fad3fb2019-08-14 10:16:12 -0700520 if (FORCE_HIGHBITDEPTH_DECODING) aom_img_free(&raw_shift);
Ryan Overbecka5fefa72017-09-19 11:39:10 -0700521 aom_img_free(&raw);
522 fclose(infile);
523
524 return EXIT_SUCCESS;
525}