/*
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
 *
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */

12 13
#include "./aomenc.h"
#include "./aom_config.h"
John Koleszar's avatar
John Koleszar committed
14

15 16
#include <assert.h>
#include <limits.h>
17
#include <math.h>
18
#include <stdarg.h>
John Koleszar's avatar
John Koleszar committed
19 20 21
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
22

23 24 25 26
#if CONFIG_LIBYUV
#include "third_party/libyuv/include/libyuv/scale.h"
#endif

27
#include "aom/aom_encoder.h"
28
#if CONFIG_AV1_DECODER
29
#include "aom/aom_decoder.h"
30
#endif
31

32 33
#include "./args.h"
#include "./ivfenc.h"
34
#include "./tools_common.h"
35
#include "examples/encoder_util.h"
36

37 38
#if CONFIG_AV1_ENCODER
#include "aom/aomcx.h"
39
#endif
40 41
#if CONFIG_AV1_DECODER
#include "aom/aomdx.h"
42 43
#endif

44
#include "./aomstats.h"
45
#include "./rate_hist.h"
46
#include "./warnings.h"
47
#include "aom/aom_integer.h"
48
#include "aom_dsp/aom_dsp_common.h"
49 50
#include "aom_ports/aom_timer.h"
#include "aom_ports/mem_ops.h"
51
#if CONFIG_WEBM_IO
52
#include "./webmenc.h"
53
#endif
54
#include "./y4minput.h"
55

56
/* Swallow warnings about unused results of fread/fwrite */
57
/* Forwards to fread() unchanged. Calling through an ordinary function lets
 * callers ignore the returned item count without triggering an
 * unused-result warning. Returns exactly what fread() returns for the same
 * arguments. */
static size_t wrap_fread(void *ptr, size_t size, size_t nmemb, FILE *stream) {
  return fread(ptr, size, nmemb, stream);
}
#define fread wrap_fread

/* Forwards to fwrite() unchanged. Calling through an ordinary function lets
 * callers ignore the returned item count without triggering an
 * unused-result warning. Returns exactly what fwrite() returns for the same
 * arguments. */
static size_t wrap_fwrite(const void *ptr, size_t size, size_t nmemb,
                          FILE *stream) {
  return fwrite(ptr, size, nmemb, stream);
}
#define fwrite wrap_fwrite

John Koleszar's avatar
John Koleszar committed
68 69
/* Program name inserted into the usage line printed by show_help(). */
static const char *exec_name;

70
/* Reports a pending codec error on stderr and optionally terminates.
 *
 * Does nothing when ctx->err is zero. Otherwise prints the caller's
 * printf-style message (format s, arguments ap), then ": " followed by the
 * string from aom_codec_error(), and finally the string from
 * aom_codec_error_detail() on its own indented line when that is non-NULL.
 * When fatal is non-zero the process exits with EXIT_FAILURE after the
 * message has been printed. */
static void warn_or_exit_on_errorv(aom_codec_ctx_t *ctx, int fatal,
                                   const char *s, va_list ap) {
  if (!ctx->err) return;

  const char *detail = aom_codec_error_detail(ctx);

  vfprintf(stderr, s, ap);
  fprintf(stderr, ": %s\n", aom_codec_error(ctx));

  if (detail) fprintf(stderr, "    %s\n", detail);

  if (fatal) exit(EXIT_FAILURE);
}

84
/* Variadic front end to warn_or_exit_on_errorv() with fatal fixed to 1:
 * if ctx carries an error, the printf-style message s is reported and the
 * process exits. */
static void ctx_exit_on_error(aom_codec_ctx_t *ctx, const char *s, ...) {
  va_list ap;

  va_start(ap, s);
  warn_or_exit_on_errorv(ctx, 1, s, ap);
  va_end(ap);
}

92
/* Variadic front end to warn_or_exit_on_errorv(): forwards ctx, the fatal
 * flag and the printf-style message s (with its arguments) unchanged. */
static void warn_or_exit_on_error(aom_codec_ctx_t *ctx, int fatal,
                                  const char *s, ...) {
  va_list ap;

  va_start(ap, s);
  warn_or_exit_on_errorv(ctx, fatal, s, ap);
  va_end(ap);
}

101
/* Reads the next input frame into img.
 *
 * For Y4M input the frame is fetched with y4m_input_fetch_frame(); a result
 * below 1 is reported as failure. For any other file type the frame is read
 * with read_yuv_frame(), whose non-zero result is treated as a short read.
 *
 * Returns 1 when a frame was read, 0 otherwise. */
static int read_frame(struct AvxInputContext *input_ctx, aom_image_t *img) {
  if (input_ctx->file_type == FILE_TYPE_Y4M) {
    return y4m_input_fetch_frame(&input_ctx->y4m, input_ctx->file, img) >= 1;
  }

  return !read_yuv_frame(input_ctx, img);
}

115
/* Returns 1 when the four bytes at detect are "YUV4", otherwise 0. */
static int file_is_y4m(const char detect[4]) {
  return memcmp(detect, "YUV4", 4) == 0;
}

122
/* Returns 1 when the four bytes at detect are "DKIF", otherwise 0. */
static int fourcc_is_ivf(const char detect[4]) {
  return memcmp(detect, "DKIF", 4) == 0;
}
128

James Zern's avatar
James Zern committed
129 130
static const arg_def_t help =
    ARG_DEF(NULL, "help", 0, "Show usage options and exit");
131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151
/* General command-line option descriptors (debug, output file, raw input
 * pixel layout, codec selection, pass control, first-pass stats file).
 * NOTE(review): ARG_DEF's arguments look like (short name, long name,
 * takes-a-value flag, help text) -- confirm against args.h. */
static const arg_def_t debugmode =
    ARG_DEF("D", "debug", 0, "Debug mode (makes output deterministic)");
static const arg_def_t outputfile =
    ARG_DEF("o", "output", 1, "Output filename");
static const arg_def_t use_yv12 =
    ARG_DEF(NULL, "yv12", 0, "Input file is YV12 ");
static const arg_def_t use_i420 =
    ARG_DEF(NULL, "i420", 0, "Input file is I420 (default)");
static const arg_def_t use_i422 =
    ARG_DEF(NULL, "i422", 0, "Input file is I422");
static const arg_def_t use_i444 =
    ARG_DEF(NULL, "i444", 0, "Input file is I444");
static const arg_def_t use_i440 =
    ARG_DEF(NULL, "i440", 0, "Input file is I440");
static const arg_def_t codecarg = ARG_DEF(NULL, "codec", 1, "Codec to use");
static const arg_def_t passes =
    ARG_DEF("p", "passes", 1, "Number of passes (1/2)");
static const arg_def_t pass_arg =
    ARG_DEF(NULL, "pass", 1, "Pass to execute (1/2)");
static const arg_def_t fpf_name =
    ARG_DEF(NULL, "fpf", 1, "First pass statistics file name");
152
#if CONFIG_FP_MB_STATS
153 154
static const arg_def_t fpmbf_name =
    ARG_DEF(NULL, "fpmbf", 1, "First pass block statistics file name");
155
#endif
156 157 158 159 160 161 162 163 164 165 166 167 168 169
static const arg_def_t limit =
    ARG_DEF(NULL, "limit", 1, "Stop encoding after n input frames");
static const arg_def_t skip =
    ARG_DEF(NULL, "skip", 1, "Skip the first n input frames");
static const arg_def_t deadline =
    ARG_DEF("d", "deadline", 1, "Deadline per frame (usec)");
static const arg_def_t good_dl =
    ARG_DEF(NULL, "good", 0, "Use Good Quality Deadline");
static const arg_def_t quietarg =
    ARG_DEF("q", "quiet", 0, "Do not print encode progress");
static const arg_def_t verbosearg =
    ARG_DEF("v", "verbose", 0, "Show encoder parameters");
static const arg_def_t psnrarg =
    ARG_DEF(NULL, "psnr", 0, "Show PSNR in status line");
170

171
static const struct arg_enum_list test_decode_enum[] = {
172 173 174 175
  { "off", TEST_DECODE_OFF },
  { "fatal", TEST_DECODE_FATAL },
  { "warn", TEST_DECODE_WARN },
  { NULL, 0 }
176
};
177 178
static const arg_def_t recontest = ARG_DEF_ENUM(
    NULL, "test-decode", 1, "Test encode/decode mismatch", test_decode_enum);
179 180 181 182 183
static const arg_def_t framerate =
    ARG_DEF(NULL, "fps", 1, "Stream frame rate (rate/scale)");
static const arg_def_t use_webm =
    ARG_DEF(NULL, "webm", 0, "Output WebM (default when WebM IO is enabled)");
static const arg_def_t use_ivf = ARG_DEF(NULL, "ivf", 0, "Output IVF");
184 185 186
#if CONFIG_OBU_NO_IVF
static const arg_def_t use_obu = ARG_DEF(NULL, "obu", 0, "Output OBU");
#endif
187 188 189 190 191 192 193 194 195 196 197 198 199
static const arg_def_t out_part =
    ARG_DEF("P", "output-partitions", 0,
            "Makes encoder output partitions. Requires IVF output!");
static const arg_def_t q_hist_n =
    ARG_DEF(NULL, "q-hist", 1, "Show quantizer histogram (n-buckets)");
static const arg_def_t rate_hist_n =
    ARG_DEF(NULL, "rate-hist", 1, "Show rate histogram (n-buckets)");
static const arg_def_t disable_warnings =
    ARG_DEF(NULL, "disable-warnings", 0,
            "Disable warnings about potentially incorrect encode settings.");
static const arg_def_t disable_warning_prompt =
    ARG_DEF("y", "disable-warning-prompt", 0,
            "Display warnings, but do not prompt user to continue.");
200

201
#if CONFIG_HIGHBITDEPTH
202 203 204 205 206 207 208 209 210 211
static const struct arg_enum_list bitdepth_enum[] = {
  { "8", AOM_BITS_8 }, { "10", AOM_BITS_10 }, { "12", AOM_BITS_12 }, { NULL, 0 }
};

static const arg_def_t bitdeptharg = ARG_DEF_ENUM(
    "b", "bit-depth", 1,
    "Bit depth for codec (8 for version <=1, 10 or 12 for version 2)",
    bitdepth_enum);
static const arg_def_t inbitdeptharg =
    ARG_DEF(NULL, "input-bit-depth", 1, "Bit depth of input");
212
#endif
213

James Zern's avatar
James Zern committed
214 215
static const arg_def_t *main_args[] = { &help,
                                        &debugmode,
216 217 218 219 220 221 222 223 224 225 226 227 228 229
                                        &outputfile,
                                        &codecarg,
                                        &passes,
                                        &pass_arg,
                                        &fpf_name,
                                        &limit,
                                        &skip,
                                        &deadline,
                                        &good_dl,
                                        &quietarg,
                                        &verbosearg,
                                        &psnrarg,
                                        &use_webm,
                                        &use_ivf,
230 231 232
#if CONFIG_OBU_NO_IVF
                                        &use_obu,
#endif
233 234 235 236 237 238 239 240 241 242 243 244 245 246
                                        &out_part,
                                        &q_hist_n,
                                        &rate_hist_n,
                                        &disable_warnings,
                                        &disable_warning_prompt,
                                        &recontest,
                                        NULL };

static const arg_def_t usage =
    ARG_DEF("u", "usage", 1, "Usage profile number to use");
static const arg_def_t threads =
    ARG_DEF("t", "threads", 1, "Max number of threads to use");
static const arg_def_t profile =
    ARG_DEF(NULL, "profile", 1, "Bitstream profile number to use");
247 248
static const arg_def_t width = ARG_DEF("w", "width", 1, "Frame width");
static const arg_def_t height = ARG_DEF("h", "height", 1, "Frame height");
249
#if CONFIG_WEBM_IO
250
static const struct arg_enum_list stereo_mode_enum[] = {
251 252 253 254 255 256
  { "mono", STEREO_FORMAT_MONO },
  { "left-right", STEREO_FORMAT_LEFT_RIGHT },
  { "bottom-top", STEREO_FORMAT_BOTTOM_TOP },
  { "top-bottom", STEREO_FORMAT_TOP_BOTTOM },
  { "right-left", STEREO_FORMAT_RIGHT_LEFT },
  { NULL, 0 }
257
};
258 259
static const arg_def_t stereo_mode = ARG_DEF_ENUM(
    NULL, "stereo-mode", 1, "Stereo 3D video format", stereo_mode_enum);
260
#endif
261 262
static const arg_def_t timebase = ARG_DEF(
    NULL, "timebase", 1, "Output timestamp precision (fractional seconds)");
263 264 265 266
static const arg_def_t error_resilient =
    ARG_DEF(NULL, "error-resilient", 1, "Enable error resiliency features");
static const arg_def_t lag_in_frames =
    ARG_DEF(NULL, "lag-in-frames", 1, "Max number of frames to lag");
267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282
#if CONFIG_EXT_TILE
static const arg_def_t large_scale_tile =
    ARG_DEF(NULL, "large-scale-tile", 1,
            "Large scale tile coding (0: off (default), 1: on)");
#endif  // CONFIG_EXT_TILE

static const arg_def_t *global_args[] = { &use_yv12,
                                          &use_i420,
                                          &use_i422,
                                          &use_i444,
                                          &use_i440,
                                          &usage,
                                          &threads,
                                          &profile,
                                          &width,
                                          &height,
283
#if CONFIG_WEBM_IO
284
                                          &stereo_mode,
285
#endif
286 287 288
                                          &timebase,
                                          &framerate,
                                          &error_resilient,
289
#if CONFIG_HIGHBITDEPTH
290
                                          &bitdeptharg,
291
#endif
292 293 294 295 296
                                          &lag_in_frames,
#if CONFIG_EXT_TILE
                                          &large_scale_tile,
#endif  // CONFIG_EXT_TILE
                                          NULL };
297 298 299

static const arg_def_t dropframe_thresh =
    ARG_DEF(NULL, "drop-frame", 1, "Temporal resampling threshold (buf %)");
300 301
static const arg_def_t resize_mode =
    ARG_DEF(NULL, "resize-mode", 1, "Frame resize mode");
302 303 304 305
static const arg_def_t resize_denominator =
    ARG_DEF(NULL, "resize-denominator", 1, "Frame resize denominator");
static const arg_def_t resize_kf_denominator = ARG_DEF(
    NULL, "resize-kf-denominator", 1, "Frame resize keyframe denominator");
306
#if CONFIG_HORZONLY_FRAME_SUPERRES
307 308
static const arg_def_t superres_mode =
    ARG_DEF(NULL, "superres-mode", 1, "Frame super-resolution mode");
309 310 311 312 313
static const arg_def_t superres_denominator = ARG_DEF(
    NULL, "superres-denominator", 1, "Frame super-resolution denominator");
static const arg_def_t superres_kf_denominator =
    ARG_DEF(NULL, "superres-kf-denominator", 1,
            "Frame super-resolution keyframe denominator");
314 315 316 317 318
static const arg_def_t superres_qthresh = ARG_DEF(
    NULL, "superres-qthresh", 1, "Frame super-resolution qindex threshold");
static const arg_def_t superres_kf_qthresh =
    ARG_DEF(NULL, "superres-kf-qthresh", 1,
            "Frame super-resolution keyframe qindex threshold");
319
#endif  // CONFIG_HORZONLY_FRAME_SUPERRES
320 321 322 323 324
static const struct arg_enum_list end_usage_enum[] = { { "vbr", AOM_VBR },
                                                       { "cbr", AOM_CBR },
                                                       { "cq", AOM_CQ },
                                                       { "q", AOM_Q },
                                                       { NULL, 0 } };
325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342
static const arg_def_t end_usage =
    ARG_DEF_ENUM(NULL, "end-usage", 1, "Rate control mode", end_usage_enum);
static const arg_def_t target_bitrate =
    ARG_DEF(NULL, "target-bitrate", 1, "Bitrate (kbps)");
static const arg_def_t min_quantizer =
    ARG_DEF(NULL, "min-q", 1, "Minimum (best) quantizer");
static const arg_def_t max_quantizer =
    ARG_DEF(NULL, "max-q", 1, "Maximum (worst) quantizer");
static const arg_def_t undershoot_pct =
    ARG_DEF(NULL, "undershoot-pct", 1, "Datarate undershoot (min) target (%)");
static const arg_def_t overshoot_pct =
    ARG_DEF(NULL, "overshoot-pct", 1, "Datarate overshoot (max) target (%)");
static const arg_def_t buf_sz =
    ARG_DEF(NULL, "buf-sz", 1, "Client buffer size (ms)");
static const arg_def_t buf_initial_sz =
    ARG_DEF(NULL, "buf-initial-sz", 1, "Client initial buffer size (ms)");
static const arg_def_t buf_optimal_sz =
    ARG_DEF(NULL, "buf-optimal-sz", 1, "Client optimal buffer size (ms)");
343 344
static const arg_def_t *rc_args[] = { &dropframe_thresh,
                                      &resize_mode,
345 346
                                      &resize_denominator,
                                      &resize_kf_denominator,
347
#if CONFIG_HORZONLY_FRAME_SUPERRES
348
                                      &superres_mode,
349 350
                                      &superres_denominator,
                                      &superres_kf_denominator,
351 352
                                      &superres_qthresh,
                                      &superres_kf_qthresh,
353
#endif  // CONFIG_HORZONLY_FRAME_SUPERRES
354 355 356 357 358 359 360 361 362 363
                                      &end_usage,
                                      &target_bitrate,
                                      &min_quantizer,
                                      &max_quantizer,
                                      &undershoot_pct,
                                      &overshoot_pct,
                                      &buf_sz,
                                      &buf_initial_sz,
                                      &buf_optimal_sz,
                                      NULL };
John Koleszar's avatar
John Koleszar committed
364

365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394
static const arg_def_t bias_pct =
    ARG_DEF(NULL, "bias-pct", 1, "CBR/VBR bias (0=CBR, 100=VBR)");
static const arg_def_t minsection_pct =
    ARG_DEF(NULL, "minsection-pct", 1, "GOP min bitrate (% of target)");
static const arg_def_t maxsection_pct =
    ARG_DEF(NULL, "maxsection-pct", 1, "GOP max bitrate (% of target)");
static const arg_def_t *rc_twopass_args[] = { &bias_pct, &minsection_pct,
                                              &maxsection_pct, NULL };

static const arg_def_t kf_min_dist =
    ARG_DEF(NULL, "kf-min-dist", 1, "Minimum keyframe interval (frames)");
static const arg_def_t kf_max_dist =
    ARG_DEF(NULL, "kf-max-dist", 1, "Maximum keyframe interval (frames)");
static const arg_def_t kf_disabled =
    ARG_DEF(NULL, "disable-kf", 0, "Disable keyframe placement");
static const arg_def_t *kf_args[] = { &kf_min_dist, &kf_max_dist, &kf_disabled,
                                      NULL };

static const arg_def_t noise_sens =
    ARG_DEF(NULL, "noise-sensitivity", 1, "Noise sensitivity (frames to blur)");
static const arg_def_t sharpness =
    ARG_DEF(NULL, "sharpness", 1, "Loop filter sharpness (0..7)");
static const arg_def_t static_thresh =
    ARG_DEF(NULL, "static-thresh", 1, "Motion detection threshold");
static const arg_def_t auto_altref =
    ARG_DEF(NULL, "auto-alt-ref", 1, "Enable automatic alt reference frames");
static const arg_def_t arnr_maxframes =
    ARG_DEF(NULL, "arnr-maxframes", 1, "AltRef max frames (0..15)");
static const arg_def_t arnr_strength =
    ARG_DEF(NULL, "arnr-strength", 1, "AltRef filter strength (0..6)");
395
static const struct arg_enum_list tuning_enum[] = {
396 397 398 399 400 401 402
  { "psnr", AOM_TUNE_PSNR },
  { "ssim", AOM_TUNE_SSIM },
#ifdef CONFIG_DIST_8X8
  { "cdef-dist", AOM_TUNE_CDEF_DIST },
  { "daala-dist", AOM_TUNE_DAALA_DIST },
#endif
  { NULL, 0 }
403
};
404 405
static const arg_def_t tune_metric =
    ARG_DEF_ENUM(NULL, "tune", 1, "Distortion metric tuned with", tuning_enum);
406 407 408 409
static const arg_def_t cq_level =
    ARG_DEF(NULL, "cq-level", 1, "Constant/Constrained Quality level");
static const arg_def_t max_intra_rate_pct =
    ARG_DEF(NULL, "max-intra-rate", 1, "Max I-frame bitrate (pct)");
410

411 412
#if CONFIG_AV1_ENCODER
static const arg_def_t cpu_used_av1 =
Yaowu Xu's avatar
Yaowu Xu committed
413
    ARG_DEF(NULL, "cpu-used", 1, "CPU Used (0..8)");
414 415
static const arg_def_t dev_sf_av1 =
    ARG_DEF(NULL, "dev-sf", 1, "Dev Speed (0..255)");
416 417 418 419 420
#if CONFIG_EXT_TILE
static const arg_def_t single_tile_decoding =
    ARG_DEF(NULL, "single-tile-decoding", 1,
            "Single tile decoding (0: off (default), 1: on)");
#endif  // CONFIG_EXT_TILE
421 422 423 424 425
static const arg_def_t tile_cols =
    ARG_DEF(NULL, "tile-columns", 1, "Number of tile columns to use, log2");
static const arg_def_t tile_rows =
    ARG_DEF(NULL, "tile-rows", 1,
            "Number of tile rows to use, log2 (set to 0 while threads > 1)");
426 427
#if CONFIG_MAX_TILE
static const arg_def_t tile_width =
428
    ARG_DEF(NULL, "tile-width", 1, "Tile widths (comma separated)");
429
static const arg_def_t tile_height =
430
    ARG_DEF(NULL, "tile-height", 1, "Tile heights (command separated)");
431
#endif
432 433 434 435
#if CONFIG_DEPENDENT_HORZTILES
static const arg_def_t tile_dependent_rows =
    ARG_DEF(NULL, "tile-dependent-rows", 1, "Enable dependent Tile rows");
#endif
436
#if CONFIG_LOOPFILTERING_ACROSS_TILES
437 438
static const arg_def_t tile_loopfilter = ARG_DEF(
    NULL, "tile-loopfilter", 1, "Enable loop filter across tile boundary");
439
#endif  // CONFIG_LOOPFILTERING_ACROSS_TILES
440 441
static const arg_def_t lossless =
    ARG_DEF(NULL, "lossless", 1, "Lossless mode (0: false (default), 1: true)");
442 443 444 445
static const arg_def_t enable_cdef =
    ARG_DEF(NULL, "enable-cdef", 1,
            "Enable the constrained directional enhancement filter (0: false, "
            "1: true (default))");
446 447
#if CONFIG_AOM_QM
static const arg_def_t enable_qm =
448
    ARG_DEF(NULL, "enable-qm", 1,
449 450
            "Enable quantisation matrices (0: false (default), 1: true)");
static const arg_def_t qm_min = ARG_DEF(
451
    NULL, "qm-min", 1, "Min quant matrix flatness (0..15), default is 8");
452
static const arg_def_t qm_max = ARG_DEF(
453
    NULL, "qm-max", 1, "Max quant matrix flatness (0..15), default is 16");
454
#endif
455 456 457 458 459
#if CONFIG_DIST_8X8
static const arg_def_t enable_dist_8x8 =
    ARG_DEF(NULL, "enable-dist-8x8", 1,
            "Enable dist-8x8 (0: false (default), 1: true)");
#endif  // CONFIG_DIST_8X8
Yaowu Xu's avatar
Yaowu Xu committed
460 461
static const arg_def_t num_tg = ARG_DEF(
    NULL, "num-tile-groups", 1, "Maximum number of tile groups, default is 1");
462 463
static const arg_def_t mtu_size =
    ARG_DEF(NULL, "mtu-size", 1,
Yaowu Xu's avatar
Yaowu Xu committed
464 465
            "MTU size for a tile group, default is 0 (no MTU targeting), "
            "overrides maximum number of tile groups");
466 467 468 469
#if CONFIG_TEMPMV_SIGNALING
static const arg_def_t disable_tempmv = ARG_DEF(
    NULL, "disable-tempmv", 1, "Disable temporal mv prediction (default is 0)");
#endif
Yaowu Xu's avatar
Yaowu Xu committed
470 471 472 473
static const arg_def_t frame_parallel_decoding =
    ARG_DEF(NULL, "frame-parallel", 1,
            "Enable frame parallel decodability features "
            "(0: false (default), 1: true)");
474
#if !CONFIG_EXT_DELTA_Q
475 476 477
static const arg_def_t aq_mode = ARG_DEF(
    NULL, "aq-mode", 1,
    "Adaptive quantization mode (0: off (default), 1: variance 2: complexity, "
478
    "3: cyclic refresh, 4: delta quant)");
479
#else
Thomas's avatar
Thomas committed
480 481 482
static const arg_def_t aq_mode = ARG_DEF(
    NULL, "aq-mode", 1,
    "Adaptive quantization mode (0: off (default), 1: variance 2: complexity, "
483
    "3: cyclic refresh)");
484
#endif
485 486 487 488 489
#if CONFIG_EXT_DELTA_Q
static const arg_def_t deltaq_mode = ARG_DEF(
    NULL, "deltaq-mode", 1,
    "Delta qindex mode (0: off (default), 1: deltaq 2: deltaq + deltalf)");
#endif
490 491 492
static const arg_def_t frame_periodic_boost =
    ARG_DEF(NULL, "frame-boost", 1,
            "Enable frame periodic boost (0: off (default), 1: on)");
493 494
static const arg_def_t gf_cbr_boost_pct = ARG_DEF(
    NULL, "gf-cbr-boost", 1, "Boost for Golden Frame in CBR mode (pct)");
495 496
static const arg_def_t max_inter_rate_pct =
    ARG_DEF(NULL, "max-inter-rate", 1, "Max P-frame bitrate (pct)");
497 498 499 500 501 502
static const arg_def_t min_gf_interval = ARG_DEF(
    NULL, "min-gf-interval", 1,
    "min gf/arf frame interval (default 0, indicating in-built behavior)");
static const arg_def_t max_gf_interval = ARG_DEF(
    NULL, "max-gf-interval", 1,
    "max gf/arf frame interval (default 0, indicating in-built behavior)");
503

Yaowu Xu's avatar
Yaowu Xu committed
504
static const struct arg_enum_list color_space_enum[] = {
505 506 507 508 509 510 511 512 513 514 515
  { "unknown", AOM_CS_UNKNOWN },
  { "bt601", AOM_CS_BT_601 },
  { "bt709", AOM_CS_BT_709 },
  { "smpte170", AOM_CS_SMPTE_170 },
  { "smpte240", AOM_CS_SMPTE_240 },
  { "bt2020ncl", AOM_CS_BT_2020_NCL },
  { "bt2020cl", AOM_CS_BT_2020_CL },
  { "sRGB", AOM_CS_SRGB },
  { "ICtCp", AOM_CS_ICTCP },
  { "monochrome", AOM_CS_MONOCHROME },
  { NULL, 0 }
Yaowu Xu's avatar
Yaowu Xu committed
516 517
};

518
static const arg_def_t input_color_space =
clang-format's avatar
clang-format committed
519 520
    ARG_DEF_ENUM(NULL, "color-space", 1,
                 "The color space of input content:", color_space_enum);
Yaowu Xu's avatar
Yaowu Xu committed
521

522 523 524 525 526 527 528 529 530
static const struct arg_enum_list transfer_function_enum[] = {
  { "unknown", AOM_TF_UNKNOWN },
  { "bt709", AOM_TF_BT_709 },
  { "pq", AOM_TF_PQ },
  { "hlg", AOM_TF_HLG },
  { NULL, 0 }
};

static const arg_def_t input_transfer_function = ARG_DEF_ENUM(
clang-format's avatar
clang-format committed
531 532
    NULL, "transfer-function", 1,
    "The transfer function of input content:", transfer_function_enum);
533 534 535 536 537 538 539 540 541 542 543 544 545

static const struct arg_enum_list chroma_sample_position_enum[] = {
  { "unknown", AOM_CSP_UNKNOWN },
  { "vertical", AOM_CSP_VERTICAL },
  { "colocated", AOM_CSP_COLOCATED },
  { NULL, 0 }
};

static const arg_def_t input_chroma_sample_position =
    ARG_DEF_ENUM(NULL, "chroma-sample-position", 1,
                 "The chroma sample position when chroma 4:2:0 is signaled:",
                 chroma_sample_position_enum);

546
static const struct arg_enum_list tune_content_enum[] = {
547 548
  { "default", AOM_CONTENT_DEFAULT },
  { "screen", AOM_CONTENT_SCREEN },
549
  { NULL, 0 }
550 551 552 553
};

static const arg_def_t tune_content = ARG_DEF_ENUM(
    NULL, "tune-content", 1, "Tune content type", tune_content_enum);
hui su's avatar
hui su committed
554
#endif
555

556
#if CONFIG_AV1_ENCODER
557 558
#if CONFIG_EXT_PARTITION
static const struct arg_enum_list superblock_size_enum[] = {
559 560 561
  { "dynamic", AOM_SUPERBLOCK_SIZE_DYNAMIC },
  { "64", AOM_SUPERBLOCK_SIZE_64X64 },
  { "128", AOM_SUPERBLOCK_SIZE_128X128 },
562
  { NULL, 0 }
563 564 565 566 567
};
static const arg_def_t superblock_size = ARG_DEF_ENUM(
    NULL, "sb-size", 1, "Superblock size to use", superblock_size_enum);
#endif  // CONFIG_EXT_PARTITION

568
static const arg_def_t *av1_args[] = { &cpu_used_av1,
569
                                       &dev_sf_av1,
570 571 572
                                       &auto_altref,
                                       &sharpness,
                                       &static_thresh,
573 574 575
#if CONFIG_EXT_TILE
                                       &single_tile_decoding,
#endif  // CONFIG_EXT_TILE
576 577
                                       &tile_cols,
                                       &tile_rows,
578 579 580
#if CONFIG_DEPENDENT_HORZTILES
                                       &tile_dependent_rows,
#endif
581
#if CONFIG_LOOPFILTERING_ACROSS_TILES
582
                                       &tile_loopfilter,
583
#endif  // CONFIG_LOOPFILTERING_ACROSS_TILES
584 585
                                       &arnr_maxframes,
                                       &arnr_strength,
586
                                       &tune_metric,
587 588 589 590 591
                                       &cq_level,
                                       &max_intra_rate_pct,
                                       &max_inter_rate_pct,
                                       &gf_cbr_boost_pct,
                                       &lossless,
592
                                       &enable_cdef,
593 594 595 596
#if CONFIG_AOM_QM
                                       &enable_qm,
                                       &qm_min,
                                       &qm_max,
597 598 599
#endif
#if CONFIG_DIST_8X8
                                       &enable_dist_8x8,
600
#endif
601 602
                                       &frame_parallel_decoding,
                                       &aq_mode,
603 604 605
#if CONFIG_EXT_DELTA_Q
                                       &deltaq_mode,
#endif
606 607 608 609
                                       &frame_periodic_boost,
                                       &noise_sens,
                                       &tune_content,
                                       &input_color_space,
610 611
                                       &input_transfer_function,
                                       &input_chroma_sample_position,
612 613
                                       &min_gf_interval,
                                       &max_gf_interval,
614
#if CONFIG_EXT_PARTITION
615
                                       &superblock_size,
616
#endif  // CONFIG_EXT_PARTITION
617 618
                                       &num_tg,
                                       &mtu_size,
619 620 621
#if CONFIG_TEMPMV_SIGNALING
                                       &disable_tempmv,
#endif
622
#if CONFIG_HIGHBITDEPTH
623 624
                                       &bitdeptharg,
                                       &inbitdeptharg,
625
#endif  // CONFIG_HIGHBITDEPTH
626 627
                                       NULL };
static const int av1_arg_ctrl_map[] = { AOME_SET_CPUUSED,
628
                                        AOME_SET_DEVSF,
629 630 631
                                        AOME_SET_ENABLEAUTOALTREF,
                                        AOME_SET_SHARPNESS,
                                        AOME_SET_STATIC_THRESHOLD,
632 633 634
#if CONFIG_EXT_TILE
                                        AV1E_SET_SINGLE_TILE_DECODING,
#endif  // CONFIG_EXT_TILE
635 636
                                        AV1E_SET_TILE_COLUMNS,
                                        AV1E_SET_TILE_ROWS,
637 638 639
#if CONFIG_DEPENDENT_HORZTILES
                                        AV1E_SET_TILE_DEPENDENT_ROWS,
#endif
640
#if CONFIG_LOOPFILTERING_ACROSS_TILES
641
                                        AV1E_SET_TILE_LOOPFILTER,
642
#endif  // CONFIG_LOOPFILTERING_ACROSS_TILES
643 644 645 646 647 648 649 650
                                        AOME_SET_ARNR_MAXFRAMES,
                                        AOME_SET_ARNR_STRENGTH,
                                        AOME_SET_TUNING,
                                        AOME_SET_CQ_LEVEL,
                                        AOME_SET_MAX_INTRA_BITRATE_PCT,
                                        AV1E_SET_MAX_INTER_BITRATE_PCT,
                                        AV1E_SET_GF_CBR_BOOST_PCT,
                                        AV1E_SET_LOSSLESS,
651
                                        AV1E_SET_ENABLE_CDEF,
652 653 654 655
#if CONFIG_AOM_QM
                                        AV1E_SET_ENABLE_QM,
                                        AV1E_SET_QM_MIN,
                                        AV1E_SET_QM_MAX,
656 657 658
#endif
#if CONFIG_DIST_8X8
                                        AV1E_SET_ENABLE_DIST_8X8,
659
#endif
660 661
                                        AV1E_SET_FRAME_PARALLEL_DECODING,
                                        AV1E_SET_AQ_MODE,
662 663 664
#if CONFIG_EXT_DELTA_Q
                                        AV1E_SET_DELTAQ_MODE,
#endif
665 666 667 668
                                        AV1E_SET_FRAME_PERIODIC_BOOST,
                                        AV1E_SET_NOISE_SENSITIVITY,
                                        AV1E_SET_TUNE_CONTENT,
                                        AV1E_SET_COLOR_SPACE,
669 670
                                        AV1E_SET_TRANSFER_FUNCTION,
                                        AV1E_SET_CHROMA_SAMPLE_POSITION,
671 672
                                        AV1E_SET_MIN_GF_INTERVAL,
                                        AV1E_SET_MAX_GF_INTERVAL,
673
#if CONFIG_EXT_PARTITION
674
                                        AV1E_SET_SUPERBLOCK_SIZE,
675
#endif  // CONFIG_EXT_PARTITION
676 677
                                        AV1E_SET_NUM_TG,
                                        AV1E_SET_MTU,
678 679
#if CONFIG_TEMPMV_SIGNALING
                                        AV1E_SET_DISABLE_TEMPMV,
680
#endif
681
                                        0 };
hui su's avatar
hui su committed
682 683
#endif

John Koleszar's avatar
John Koleszar committed
684 685
/* Empty, NULL-terminated argument table. parse_stream_params() uses it as the
 * codec-specific control list until a codec-specific table is selected. */
static const arg_def_t *no_args[] = { NULL };

James Zern's avatar
James Zern committed
686 687
void show_help(FILE *fout, int shorthelp) {
  fprintf(fout, "Usage: %s <options> -o dst_filename src_filename \n",
John Koleszar's avatar
John Koleszar committed
688 689
          exec_name);

James Zern's avatar
James Zern committed
690 691 692 693 694 695 696 697 698 699 700 701 702 703 704
  if (shorthelp) {
    fprintf(fout, "Use --help to see the full list of options.\n");
    return;
  }

  fprintf(fout, "\nOptions:\n");
  arg_show_usage(fout, main_args);
  fprintf(fout, "\nEncoder Global Options:\n");
  arg_show_usage(fout, global_args);
  fprintf(fout, "\nRate Control Options:\n");
  arg_show_usage(fout, rc_args);
  fprintf(fout, "\nTwopass Rate Control Options:\n");
  arg_show_usage(fout, rc_twopass_args);
  fprintf(fout, "\nKeyframe Placement Options:\n");
  arg_show_usage(fout, kf_args);
705
#if CONFIG_AV1_ENCODER
James Zern's avatar
James Zern committed
706 707
  fprintf(fout, "\nAV1 Specific Options:\n");
  arg_show_usage(fout, av1_args);
John Koleszar's avatar
John Koleszar committed
708
#endif
James Zern's avatar
James Zern committed
709
  fprintf(fout,
710
          "\nStream timebase (--timebase):\n"
John Koleszar's avatar
John Koleszar committed
711 712
          "  The desired precision of timestamps in the output, expressed\n"
          "  in fractional seconds. Default is 1/1000.\n");
James Zern's avatar
James Zern committed
713
  fprintf(fout, "\nIncluded encoders:\n\n");
John Koleszar's avatar
John Koleszar committed
714

James Zern's avatar
James Zern committed
715 716
  const int num_encoder = get_aom_encoder_count();
  for (int i = 0; i < num_encoder; ++i) {
717
    const AvxInterface *const encoder = get_aom_encoder_by_index(i);
718
    const char *defstr = (i == (num_encoder - 1)) ? "(default)" : "";
James Zern's avatar
James Zern committed
719
    fprintf(fout, "    %-6s - %s %s\n", encoder->name,
720
            aom_codec_iface_name(encoder->codec_interface()), defstr);
721
  }
James Zern's avatar
James Zern committed
722 723 724
  fprintf(fout, "\n        ");
  fprintf(fout, "Use --codec to switch to a non-default encoder.\n\n");
}
John Koleszar's avatar
John Koleszar committed
725

James Zern's avatar
James Zern committed
726 727
/* Prints the short usage summary to stderr, then terminates the process with
 * EXIT_FAILURE. */
void usage_exit(void) {
  const int short_form = 1;

  show_help(stderr, short_form);
  exit(EXIT_FAILURE);
}

731 732
#if CONFIG_AV1_ENCODER
/* Number of entries in av1_arg_ctrl_map; used as the row count of
 * stream_config.arg_ctrls. */
#define ARG_CTRL_CNT_MAX NELEMENTS(av1_arg_ctrl_map)
#endif

#if !CONFIG_WEBM_IO
/* Stand-ins for the WebM types when WebM I/O is compiled out, so that
 * stream_config and stream_state (and the webm_ctx.debug assignment in
 * new_stream()) still compile. */
typedef int stereo_format_t;
struct WebmOutputContext {
  int debug;
};
#endif

742
/* Per-stream configuration */
743
struct stream_config {
744
  struct aom_codec_enc_cfg cfg;
745 746
  const char *out_fn;
  const char *stats_fn;
747
#if CONFIG_FP_MB_STATS
748
  const char *fpmb_stats_fn;
749
#endif
750 751 752 753
  stereo_format_t stereo_fmt;
  int arg_ctrls[ARG_CTRL_CNT_MAX][2];
  int arg_ctrl_cnt;
  int write_webm;
754 755 756
#if CONFIG_OBU_NO_IVF
  int write_ivf;
#endif
757
  // whether to use 16bit internal buffers
758
  int use_16bit_internal;
759 760
};

761
struct stream_state {
762 763 764 765 766 767 768 769 770 771 772
  int index;
  struct stream_state *next;
  struct stream_config config;
  FILE *file;
  struct rate_hist *rate_hist;
  struct WebmOutputContext webm_ctx;
  uint64_t psnr_sse_total;
  uint64_t psnr_samples_total;
  double psnr_totals[4];
  int psnr_count;
  int counts[64];
773
  aom_codec_ctx_t encoder;
774 775 776 777
  unsigned int frames_out;
  uint64_t cx_time;
  size_t nbytes;
  stats_io_t stats;
778
#if CONFIG_FP_MB_STATS
779
  stats_io_t fpmb_stats;
780
#endif
781 782
  struct aom_image *img;
  aom_codec_ctx_t decoder;
783
  int mismatch_seen;
784 785
};

786
static void validate_positive_rational(const char *msg,
787
                                       struct aom_rational *rat) {
788 789 790 791
  if (rat->den < 0) {
    rat->num *= -1;
    rat->den *= -1;
  }
792

793
  if (rat->num < 0) die("Error: %s must be positive\n", msg);
794

795
  if (!rat->den) die("Error: %s has zero denominator\n", msg);
796 797
}

798
static void parse_global_config(struct AvxEncoderConfig *global, char **argv) {
799 800
  char **argi, **argj;
  struct arg arg;
801
  const int num_encoder = get_aom_encoder_count();
802

803
  if (num_encoder < 1) die("Error: no valid encoder available\n");
804 805 806

  /* Initialize default parameters */
  memset(global, 0, sizeof(*global));
807
  global->codec = get_aom_encoder_by_index(num_encoder - 1);
808
  global->passes = 0;
809
  global->color_type = I420;
810
  /* Assign default deadline to good quality */
811
  global->deadline = AOM_DL_GOOD_QUALITY;
John Koleszar's avatar
John Koleszar committed
812 813 814 815

  for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
    arg.argv_step = 1;

James Zern's avatar
James Zern committed
816 817 818 819
    if (arg_match(&arg, &help, argi)) {
      show_help(stdout, 0);
      exit(EXIT_SUCCESS);
    } else if (arg_match(&arg, &codecarg, argi)) {
820
      global->codec = get_aom_encoder_by_name(arg.val);
821 822
      if (!global->codec)
        die("Error: Unrecognized argument (%s) to --codec\n", arg.val);
John Koleszar's avatar
John Koleszar committed
823
    } else if (arg_match(&arg, &passes, argi)) {
824
      global->passes = arg_parse_uint(&arg);
John Koleszar's avatar
John Koleszar committed
825

826 827
      if (global->passes < 1 || global->passes > 2)
        die("Error: Invalid number of passes (%d)\n", global->passes);
John Koleszar's avatar
John Koleszar committed
828
    } else if (arg_match(&arg, &pass_arg, argi)) {
829 830 831
      global->pass = arg_parse_uint(&arg);

      if (global->pass < 1 || global->pass > 2)
832
        die("Error: Invalid pass selected (%d)\n", global->pass);
833 834
    } else if (arg_match(&arg, &usage, argi))
      global->usage = arg_parse_uint(&arg);
John Koleszar's avatar
John Koleszar committed
835
    else if (arg_match(&arg, &deadline, argi))
836
      global->deadline = arg_parse_uint(&arg);
John Koleszar's avatar
John Koleszar committed
837
    else if (arg_match(&arg, &good_dl, argi))
838
      global->deadline = AOM_DL_GOOD_QUALITY;
839
    else if (arg_match(&arg, &use_yv12, argi))
840
      global->color_type = YV12;
841
    else if (arg_match(&arg, &use_i420, argi))
842 843 844 845 846
      global->color_type = I420;
    else if (arg_match(&arg, &use_i422, argi))
      global->color_type = I422;
    else if (arg_match(&arg, &use_i444, argi))
      global->color_type = I444;
847 848
    else if (arg_match(&arg, &use_i440, argi))
      global->color_type = I440;
849 850 851 852
    else if (arg_match(&arg, &quietarg, argi))
      global->quiet = 1;
    else if (arg_match(&arg, &verbosearg, argi))
      global->verbose = 1;
John Koleszar's avatar
John Koleszar committed
853
    else if (arg_match(&arg, &limit, argi))
854
      global->limit = arg_parse_uint(&arg);
John Koleszar's avatar
John Koleszar committed
855
    else if (arg_match(&arg, &skip, argi))
856
      global->skip_frames = arg_parse_uint(&arg);
John Koleszar's avatar
John Koleszar committed
857
    else if (arg_match(&arg, &psnrarg, argi))
858
      global->show_psnr = 1;
John Koleszar's avatar
John Koleszar committed
859
    else if (arg_match(&arg, &recontest, argi))
860
      global->test_decode = arg_parse_enum_or_int(&arg);
John Koleszar's avatar
John Koleszar committed
861
    else if (arg_match(&arg, &framerate, argi)) {
862 863 864 865 866
      global->framerate = arg_parse_rational(&arg);
      validate_positive_rational(arg.name, &global->framerate);
      global->have_framerate = 1;
    } else if (arg_match(&arg, &out_part, argi))
      global->out_part = 1;
John Koleszar's avatar
John Koleszar committed
867
    else if (arg_match(&arg, &debugmode, argi))
868
      global->debug = 1;
John Koleszar's avatar
John Koleszar committed
869
    else if (arg_match(&arg, &q_hist_n, argi))
870
      global->show_q_hist_buckets = arg_parse_uint(&arg);
John Koleszar's avatar
John Koleszar committed
871
    else if (arg_match(&arg, &rate_hist_n, argi))
872
      global->show_rate_hist_buckets = arg_parse_uint(&arg);
873 874 875 876
    else if (arg_match(&arg, &disable_warnings, argi))
      global->disable_warnings = 1;
    else if (arg_match(&arg, &disable_warning_prompt, argi))
      global->disable_warning_prompt = 1;
John Koleszar's avatar
John Koleszar committed
877 878 879
    else
      argj++;
  }
John Koleszar's avatar
John Koleszar committed
880

881 882 883
  if (global->pass) {
    /* DWIM: Assume the user meant passes=2 if pass=2 is specified */
    if (global->pass > global->passes) {
884 885
      warn("Assuming --pass=%d implies --passes=%d\n", global->pass,
           global->pass);
886 887 888
      global->passes = global->pass;
    }
  }
889
  /* Validate global config */
890
  if (global->passes == 0) {
891 892
#if CONFIG_AV1_ENCODER
    // Make default AV1 passes = 2 until there is a better quality 1-pass
893
    // encoder
894
    if (global->codec != NULL && global->codec->name != NULL)
Thomas Daede's avatar
Thomas Daede committed
895
      global->passes = (strcmp(global->codec->name, "av1") == 0) ? 2 : 1;
James Zern's avatar
James Zern committed
896 897 898
#else
    global->passes = 1;
#endif
899
  }
900 901
}

902
static void open_input_file(struct AvxInputContext *input) {
903
  /* Parse certain options from the input file, if possible */
904 905
  input->file = strcmp(input->filename, "-") ? fopen(input->filename, "rb")
                                             : set_binary_mode(stdin);
906

907
  if (!input->file) fatal("Failed to open input file");
John Koleszar's avatar
John Koleszar committed
908

909 910 911 912 913 914 915 916
  if (!fseeko(input->file, 0, SEEK_END)) {
    /* Input file is seekable. Figure out how long it is, so we can get
     * progress info.
     */
    input->length = ftello(input->file);
    rewind(input->file);
  }

917 918 919 920
  /* Default to 1:1 pixel aspect ratio. */
  input->pixel_aspect_ratio.numerator = 1;
  input->pixel_aspect_ratio.denominator = 1;

921 922 923 924 925 926
  /* For RAW input sources, these bytes will applied on the first frame
   *  in read_frame().
   */
  input->detect.buf_read = fread(input->detect.buf, 1, 4, input->file);
  input->detect.position = 0;

927
  if (input->detect.buf_read == 4 && file_is_y4m(input->detect.buf)) {
928 929
    if (y4m_input_open(&input->y4m, input->file, input->detect.buf, 4,
                       input->only_i420) >= 0) {
930
      input->file_type = FILE_TYPE_Y4M;
931 932
      input->width = input->y4m.pic_w;
      input->height = input->y4m.pic_h;
933 934
      input->pixel_aspect_ratio.numerator = input->y4m.par_n;
      input->pixel_aspect_ratio.denominator = input->y4m.par_d;
935 936
      input->framerate.numerator = input->y4m.fps_n;
      input->framerate.denominator = input->y4m.fps_d;
937
      input->fmt = input->y4m.aom_fmt;
938
      input->bit_depth = input->y4m.bit_depth;
939 940
    } else
      fatal("Unsupported Y4M stream.");
941
  } else if (input->detect.buf_read == 4 && fourcc_is_ivf(input->detect.buf)) {
942
    fatal("IVF is not supported as input.");
943 944
  } else {
    input->file_type = FILE_TYPE_RAW;
John Koleszar's avatar
John Koleszar committed
945
  }
946 947
}

948
static void close_input_file(struct AvxInputContext *input) {
949
  fclose(input->file);
950
  if (input->file_type == FILE_TYPE_Y4M) y4m_input_close(&input->y4m);
951 952
}

953
static struct stream_state *new_stream(struct AvxEncoderConfig *global,
954
                                       struct stream_state *prev) {
955 956 957
  struct stream_state *stream;

  stream = calloc(1, sizeof(*stream));
958
  if (stream == NULL) {
959
    fatal("Failed to allocate new stream.");
960 961
  }

962 963 964 965 966
  if (prev) {
    memcpy(stream, prev, sizeof(*stream));
    stream->index++;
    prev->next = stream;
  } else {
967
    aom_codec_err_t res;
968 969

    /* Populate encoder configuration */
970
    res = aom_codec_enc_config_default(global->codec->codec_interface(),
971
                                       &stream->config.cfg, global->usage);
972
    if (res) fatal("Failed to get config: %s\n", aom_codec_err_to_string(res));
John Koleszar's avatar
John Koleszar committed
973

974 975 976 977
    /* Change the default timebase to a high enough value so that the
     * encoder will always create strictly increasing timestamps.
     */
    stream->config.cfg.g_timebase.den = 1000;
978

979 980 981 982 983
    /* Never use the library's default resolution, require it be parsed
     * from the file or set on the command line.
     */
    stream->config.cfg.g_w = 0;
    stream->config.cfg.g_h = 0;
John Koleszar's avatar
John Koleszar committed
984

985 986
    /* Initialize remaining stream parameters */
    stream->config.write_webm = 1;
987 988 989
#if CONFIG_OBU_NO_IVF
    stream->config.write_ivf = 0;
#endif
990
#if CONFIG_WEBM_IO
991
    stream->config.stereo_fmt = STEREO_FORMAT_MONO;
992 993 994
    stream->webm_ctx.last_pts_ns = -1;
    stream->webm_ctx.writer = NULL;
    stream->webm_ctx.segment = NULL;
995
#endif
John Koleszar's avatar
John Koleszar committed
996

997
    /* Allows removal of the application version from the EBML tags */
998
    stream->webm_ctx.debug = global->debug;
John Koleszar's avatar
John Koleszar committed
999
  }
John Koleszar's avatar
John Koleszar committed
1000

1001 1002
  /* Output files must be specified for each stream */
  stream->config.out_fn = NULL;
John Koleszar's avatar
John Koleszar committed
1003

1004 1005
  stream->next = NULL;
  return stream;
1006
}
John Koleszar's avatar
John Koleszar committed
1007

1008
static int parse_stream_params(struct AvxEncoderConfig *global,
1009 1010 1011
                               struct stream_state *stream, char **argv) {
  char **argi, **argj;
  struct arg arg;
1012
  static const arg_def_t **ctrl_args = no_args;
1013 1014 1015
  static const int *ctrl_args_map = NULL;
  struct stream_config *config = &stream->config;
  int eos_mark_found = 0;
1016
  int webm_forced = 0;
1017

1018
  // Handle codec specific options
1019
  if (0) {
1020 1021 1022 1023 1024 1025
#if CONFIG_AV1_ENCODER
  } else if (strcmp(global->codec->name, "av1") == 0) {
    // TODO(jingning): Reuse AV1 specific encoder configuration parameters.
    // Consider to expand this set for AV1 encoder control.
    ctrl_args = av1_args;
    ctrl_args_map = av1_arg_ctrl_map;
1026
#endif
1027
  }
1028

John Koleszar's avatar
John Koleszar committed
1029 1030
  for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
    arg.argv_step = 1;
John Koleszar's avatar
John Koleszar committed
1031

1032 1033 1034 1035 1036 1037 1038 1039 1040 1041
    /* Once we've found an end-of-stream marker (--) we want to continue
     * shifting arguments but not consuming them.
     */
    if (eos_mark_found) {
      argj++;
      continue;
    } else if (!strcmp(*argj, "--")) {
      eos_mark_found = 1;
      continue;
    }
John Koleszar's avatar
John Koleszar committed
1042

Adrian Grange's avatar
Adrian Grange committed
1043
    if (arg_match(&arg, &outputfile, argi)) {
1044
      config->out_fn = arg.val;
1045 1046 1047 1048 1049
      if (!webm_forced) {
        const size_t out_fn_len = strlen(config->out_fn);
        if (out_fn_len >= 4 &&
            !strcmp(config->out_fn + out_fn_len - 4, ".ivf")) {
          config->write_webm = 0;
1050 1051 1052
#if CONFIG_OBU_NO_IVF
          config->write_ivf = 1;
#endif
1053
        }
1054 1055 1056 1057 1058 1059 1060
#if CONFIG_OBU_NO_IVF
        else if (out_fn_len >= 4 &&
                 !strcmp(config->out_fn + out_fn_len - 4, ".obu")) {
          config->write_webm = 0;
          config->write_ivf = 0;
        }
#endif
1061
      }
1062
    } else if (arg_match(&arg, &fpf_name, argi)) {
1063
      config->stats_fn = arg.val;
1064 1065 1066
#if CONFIG_FP_MB_STATS
    } else if (arg_match(&arg, &fpmbf_name, argi)) {
      config->fpmb_stats_fn = arg.val;
1067 1068 1069 1070
#endif
    } else if (arg_match(&arg, &use_webm, argi)) {
#if CONFIG_WEBM_IO
      config->write_webm = 1;
1071
      webm_forced = 1;
1072 1073
#else
      die("Error: --webm specified but webm is disabled.");
1074
#endif
1075
    } else if (arg_match(&arg, &use_ivf, argi)) {
1076
      config->write_webm = 0;
1077 1078 1079 1080 1081 1082 1083 1084
#if CONFIG_OBU_NO_IVF
      config->write_ivf = 1;
#endif
#if CONFIG_OBU_NO_IVF
    } else if (arg_match(&arg, &use_obu, argi)) {
      config->write_webm = 0;
      config->write_ivf = 0;
#endif
1085
    } else if (arg_match(&arg, &threads, argi)) {
1086
      config->cfg.g_threads = arg_parse_uint(&arg);
1087
    } else if (arg_match(&arg, &profile, argi)) {
1088
      config->cfg.g_profile = arg_parse_uint(&arg);
1089
    } else if (arg_match(&arg, &width, argi)) {
1090
      config->cfg.g_w = arg_parse_uint(&arg);
1091
    } else if (arg_match(&arg, &height, argi)) {
1092
      config->cfg.g_h = arg_parse_uint(&arg);
1093
#if CONFIG_HIGHBITDEPTH
1094 1095 1096 1097 1098
    } else if (arg_match(&arg, &bitdeptharg, argi)) {
      config->cfg.g_bit_depth = arg_parse_enum_or_int(&arg);
    } else if (arg_match(&arg, &inbitdeptharg, argi)) {
      config->cfg.g_input_bit_depth = arg_parse_uint(&arg);
#endif
1099
#if CONFIG_WEBM_IO
1100
    } else if (arg_match(&arg, &stereo_mode, argi)) {
1101
      config->stereo_fmt = arg_parse_enum_or_int(&arg);
1102
#endif
1103
    } else if (arg_match(&arg, &timebase, argi)) {
1104 1105
      config->cfg.g_timebase = arg_parse_rational(&arg);
      validate_positive_rational(arg.name, &config->cfg.g_timebase);
1106
    } else if (arg_match(&arg, &error_resilient, argi)) {
1107
      config->cfg.g_error_resilient = arg_parse_uint(&arg);
1108
    } else if (arg_match(&arg, &lag_in_frames, argi)) {
1109
      config->cfg.g_lag_in_frames = arg_parse_uint(&arg);
1110 1111 1112 1113
#if CONFIG_EXT_TILE
    } else if (arg_match(&arg, &large_scale_tile, argi)) {
      config->cfg.large_scale_tile = arg_parse_uint(&arg);
#endif  // CONFIG_EXT_TILE
1114
    } else if (arg_match(&arg, &dropframe_thresh, argi)) {
1115
      config->cfg.rc_dropframe_thresh = arg_parse_uint(&arg);
1116 1117
    } else if (arg_match(&arg, &resize_mode, argi)) {
      config->cfg.rc_resize_mode = arg_parse_uint(&arg);
1118 1119 1120 1121
    } else if (arg_match(&arg, &resize_denominator, argi)) {
      config->cfg.rc_resize_denominator = arg_parse_uint(&arg);
    } else if (arg_match(&arg, &resize_kf_denominator, argi)) {
      config->cfg.rc_resize_kf_denominator = arg_parse_uint(&arg);
1122
#if CONFIG_HORZONLY_FRAME_SUPERRES
1123 1124
    } else if (arg_match(&arg, &superres_mode, argi)) {
      config->cfg.rc_superres_mode = arg_parse_uint(&arg);
1125 1126 1127 1128
    } else if (arg_match(&arg, &superres_denominator, argi)) {
      config->cfg.rc_superres_denominator = arg_parse_uint(&arg);
    } else if (arg_match(&arg, &superres_kf_denominator, argi)) {
      config->cfg.rc_superres_kf_denominator = arg_parse_uint(&arg);
1129 1130 1131 1132
    } else if (arg_match(&arg, &superres_qthresh, argi)) {
      config->cfg.rc_superres_qthresh = arg_parse_uint(&arg);
    } else if (arg_match(&arg, &superres_kf_qthresh, argi)) {
      config->cfg.rc_superres_kf_qthresh = arg_parse_uint(&arg);
1133
#endif  // CONFIG_HORZONLY_FRAME_SUPERRES
1134
    } else if (arg_match(&arg, &end_usage, argi)) {
1135
      config->cfg.rc_end_usage = arg_parse_enum_or_int(&arg);
1136
    } else if (arg_match(&arg, &target_bitrate, argi)) {
1137
      config->cfg.rc_target_bitrate = arg_parse_uint(&arg);
1138
    } else if (arg_match(&arg, &min_quantizer, argi)) {
1139
      config->cfg.rc_min_quantizer = arg_parse_uint(&arg);
1140
    } else if (arg_match(&arg, &max_quantizer, argi)) {
1141
      config->cfg.rc_max_quantizer = arg_parse_uint(&arg);
1142
    } else if (arg_match(&arg, &undershoot_pct, argi)) {
1143
      config->cfg.rc_undershoot_pct = arg_parse_uint(&arg);
1144
    } else if (arg_match(&arg, &overshoot_pct, argi)) {
1145
      config->cfg.rc_overshoot_pct = arg_parse_uint(&arg);
1146
    } else if (arg_match(&arg, &buf_sz, argi)) {
1147
      config->cfg.rc_buf_sz = arg_parse_uint(&arg);
1148
    } else if (arg_match(&arg, &buf_initial_sz, argi)) {
1149
      config->cfg.rc_buf_initial_sz = arg_parse_uint(&arg);
1150
    } else if (arg_match(&arg, &buf_optimal_sz, argi)) {
1151
      config->cfg.rc_buf_optimal_sz = arg_parse_uint(&arg);
1152
    } else if (arg_match(&arg, &bias_pct, argi)) {
1153
      config->cfg.rc_2pass_vbr_bias_pct = arg_parse_uint(&arg);
1154 1155
      if (global->passes < 2)
        warn("option %s ignored in one-pass mode.\n", arg.name);
John Koleszar's avatar
John Koleszar committed
1156
    } else if (arg_match(&arg, &minsection_pct, argi)) {
1157
      config->cfg.rc_2pass_vbr_minsection_pct = arg_parse_uint(&arg);
John Koleszar's avatar
John Koleszar committed
1158

1159 1160
      if (global->passes < 2)
        warn("option %s ignored in one-pass mode.\n", arg.name);
John Koleszar's avatar
John Koleszar committed
1161
    } else if (arg_match(&arg, &maxsection_pct, argi)) {