/*
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
 *
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */

12
#include <assert.h>
John Koleszar's avatar
John Koleszar committed
13 14 15 16
#include <stdio.h>
#include <stdlib.h>
#include <stdarg.h>
#include <string.h>
17
#include <limits.h>
18

19
#include "./aom_config.h"
20

James Zern's avatar
James Zern committed
21 22 23 24 25 26 27 28
#if CONFIG_OS_SUPPORT
#if HAVE_UNISTD_H
#include <unistd.h>  // NOLINT
#elif !defined(STDOUT_FILENO)
#define STDOUT_FILENO 1
#endif
#endif

29
#if CONFIG_LIBYUV
30
#include "third_party/libyuv/include/libyuv/scale.h"
31
#endif
32 33

#include "./args.h"
34 35
#include "./ivfdec.h"

36
#include "aom/aom_decoder.h"
37
#include "aom_ports/mem_ops.h"
38
#include "aom_ports/aom_timer.h"
39

40 41
#if CONFIG_AV1_DECODER
#include "aom/aomdx.h"
John Koleszar's avatar
John Koleszar committed
42
#endif
43

44
#include "./md5_utils.h"
45 46

#include "./tools_common.h"
47
#if CONFIG_WEBM_IO
48
#include "./webmdec.h"
49
#endif
50
#include "./y4menc.h"
John Koleszar's avatar
John Koleszar committed
51 52 53

/* Program name; set from argv[0] in main_loop() and printed by show_help(). */
static const char *exec_name;

54 55
/* Input state handed to read_frame(): the generic input context plus the
 * WebM-specific context (left NULL when CONFIG_WEBM_IO is disabled). */
struct AvxDecInputContext {
  struct AvxInputContext *aom_input_ctx; /* file handle, file type, fourcc */
  struct WebmInputContext *webm_ctx;     /* used only for FILE_TYPE_WEBM */
};

James Zern's avatar
James Zern committed
59 60
/* Command-line option definitions.
 * NOTE(review): ARG_DEF comes from args.h; from its use here the arguments
 * look like (short name, long name, takes-a-value flag, help text) -- confirm
 * against args.h. */
static const arg_def_t help =
    ARG_DEF(NULL, "help", 0, "Show usage options and exit");
/* --loops is accepted by main_loop() as a no-op and is not listed in
 * all_args, so it does not appear in the --help output. */
static const arg_def_t looparg =
    ARG_DEF(NULL, "loops", 1, "Number of times to decode the file");
static const arg_def_t codecarg = ARG_DEF(NULL, "codec", 1, "Codec to use");
static const arg_def_t use_yv12 =
    ARG_DEF(NULL, "yv12", 0, "Output raw YV12 frames");
static const arg_def_t use_i420 =
    ARG_DEF(NULL, "i420", 0, "Output raw I420 frames");
static const arg_def_t flipuvarg =
    ARG_DEF(NULL, "flipuv", 0, "Flip the chroma planes in the output");
static const arg_def_t rawvideo =
    ARG_DEF(NULL, "rawvideo", 0, "Output raw YUV frames");
static const arg_def_t noblitarg =
    ARG_DEF(NULL, "noblit", 0, "Don't process the decoded frames");
static const arg_def_t progressarg =
    ARG_DEF(NULL, "progress", 0, "Show progress after each frame decodes");
static const arg_def_t limitarg =
    ARG_DEF(NULL, "limit", 1, "Stop decoding after n frames");
static const arg_def_t skiparg =
    ARG_DEF(NULL, "skip", 1, "Skip the first n input frames");
static const arg_def_t postprocarg =
    ARG_DEF(NULL, "postproc", 0, "Postprocess decoded frames");
static const arg_def_t summaryarg =
    ARG_DEF(NULL, "summary", 0, "Show timing summary");
static const arg_def_t outputfile =
    ARG_DEF("o", "output", 1, "Output file name pattern (see below)");
static const arg_def_t threadsarg =
    ARG_DEF("t", "threads", 1, "Max threads to use");
static const arg_def_t frameparallelarg =
    ARG_DEF(NULL, "frame-parallel", 0, "Frame parallel decode");
static const arg_def_t verbosearg =
    ARG_DEF("v", "verbose", 0, "Show version string");
static const arg_def_t scalearg =
    ARG_DEF("S", "scale", 0, "Scale output frames uniformly");
static const arg_def_t continuearg =
    ARG_DEF("k", "keep-going", 0, "(debug) Continue decoding after error");
static const arg_def_t fb_arg =
    ARG_DEF(NULL, "frame-buffers", 1, "Number of frame buffers to use");
static const arg_def_t md5arg =
    ARG_DEF(NULL, "md5", 0, "Compute the MD5 sum of the decoded frame");
static const arg_def_t framestatsarg =
    ARG_DEF(NULL, "framestats", 1, "Output per-frame stats (.csv format)");
#if CONFIG_HIGHBITDEPTH
static const arg_def_t outbitdeptharg =
    ARG_DEF(NULL, "output-bit-depth", 1, "Output bit-depth for decoded frames");
#endif
#if CONFIG_EXT_TILE
static const arg_def_t tiler = ARG_DEF(NULL, "tile-row", 1,
                                       "Row index of tile to decode "
                                       "(-1 for all rows)");
static const arg_def_t tilec = ARG_DEF(NULL, "tile-column", 1,
                                       "Column index of tile to decode "
                                       "(-1 for all columns)");
#endif  // CONFIG_EXT_TILE
Dmitry Kovalev's avatar
Dmitry Kovalev committed
114

James Zern's avatar
James Zern committed
115 116
static const arg_def_t *all_args[] = { &help,
                                       &codecarg,
clang-format's avatar
clang-format committed
117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133
                                       &use_yv12,
                                       &use_i420,
                                       &flipuvarg,
                                       &rawvideo,
                                       &noblitarg,
                                       &progressarg,
                                       &limitarg,
                                       &skiparg,
                                       &postprocarg,
                                       &summaryarg,
                                       &outputfile,
                                       &threadsarg,
                                       &frameparallelarg,
                                       &verbosearg,
                                       &scalearg,
                                       &fb_arg,
                                       &md5arg,
134
                                       &framestatsarg,
clang-format's avatar
clang-format committed
135
                                       &continuearg,
136
#if CONFIG_HIGHBITDEPTH
clang-format's avatar
clang-format committed
137
                                       &outbitdeptharg,
138
#endif
139
#if CONFIG_EXT_TILE
clang-format's avatar
clang-format committed
140 141
                                       &tiler,
                                       &tilec,
142
#endif  // CONFIG_EXT_TILE
clang-format's avatar
clang-format committed
143
                                       NULL };
John Koleszar's avatar
John Koleszar committed
144

145
#if CONFIG_LIBYUV
/* Scales |src| into |dst| with libyuv using filter |mode| and returns the
 * libyuv result code.
 *
 * In high-bitdepth builds an AOM_IMG_FMT_I42016 source is routed to
 * I420Scale_16(); every other image is expected to be AOM_IMG_FMT_I420
 * (enforced only by assert). Source and destination sizes are taken from
 * the images' d_w / d_h fields. */
static INLINE int libyuv_scale(aom_image_t *src, aom_image_t *dst,
                               FilterModeEnum mode) {
#if CONFIG_HIGHBITDEPTH
  if (src->fmt == AOM_IMG_FMT_I42016) {
    assert(dst->fmt == AOM_IMG_FMT_I42016);
    /* NOTE(review): strides are halved here, presumably converting byte
     * strides into uint16_t element strides -- confirm against libyuv. */
    return I420Scale_16(
        (uint16_t *)src->planes[AOM_PLANE_Y], src->stride[AOM_PLANE_Y] / 2,
        (uint16_t *)src->planes[AOM_PLANE_U], src->stride[AOM_PLANE_U] / 2,
        (uint16_t *)src->planes[AOM_PLANE_V], src->stride[AOM_PLANE_V] / 2,
        src->d_w, src->d_h, (uint16_t *)dst->planes[AOM_PLANE_Y],
        dst->stride[AOM_PLANE_Y] / 2, (uint16_t *)dst->planes[AOM_PLANE_U],
        dst->stride[AOM_PLANE_U] / 2, (uint16_t *)dst->planes[AOM_PLANE_V],
        dst->stride[AOM_PLANE_V] / 2, dst->d_w, dst->d_h, mode);
  }
#endif
  assert(src->fmt == AOM_IMG_FMT_I420);
  assert(dst->fmt == AOM_IMG_FMT_I420);
  return I420Scale(src->planes[AOM_PLANE_Y], src->stride[AOM_PLANE_Y],
                   src->planes[AOM_PLANE_U], src->stride[AOM_PLANE_U],
                   src->planes[AOM_PLANE_V], src->stride[AOM_PLANE_V], src->d_w,
                   src->d_h, dst->planes[AOM_PLANE_Y], dst->stride[AOM_PLANE_Y],
                   dst->planes[AOM_PLANE_U], dst->stride[AOM_PLANE_U],
                   dst->planes[AOM_PLANE_V], dst->stride[AOM_PLANE_V], dst->d_w,
                   dst->d_h, mode);
}
#endif
172

James Zern's avatar
James Zern committed
173 174
void show_help(FILE *fout, int shorthelp) {
  fprintf(fout, "Usage: %s <options> filename\n\n", exec_name);
John Koleszar's avatar
John Koleszar committed
175

James Zern's avatar
James Zern committed
176 177 178 179 180 181 182 183
  if (shorthelp) {
    fprintf(fout, "Use --help to see the full list of options.\n");
    return;
  }

  fprintf(fout, "Options:\n");
  arg_show_usage(fout, all_args);
  fprintf(fout,
John Koleszar's avatar
John Koleszar committed
184 185 186 187 188
          "\nOutput File Patterns:\n\n"
          "  The -o argument specifies the name of the file(s) to "
          "write to. If the\n  argument does not include any escape "
          "characters, the output will be\n  written to a single file. "
          "Otherwise, the filename will be calculated by\n  expanding "
John Koleszar's avatar
John Koleszar committed
189
          "the following escape characters:\n");
James Zern's avatar
James Zern committed
190
  fprintf(fout,
John Koleszar's avatar
John Koleszar committed
191 192 193 194 195
          "\n\t%%w   - Frame width"
          "\n\t%%h   - Frame height"
          "\n\t%%<n> - Frame number, zero padded to <n> places (1..9)"
          "\n\n  Pattern arguments are only supported in conjunction "
          "with the --yv12 and\n  --i420 options. If the -o option is "
clang-format's avatar
clang-format committed
196
          "not specified, the output will be\n  directed to stdout.\n");
James Zern's avatar
James Zern committed
197
  fprintf(fout, "\nIncluded decoders:\n\n");
John Koleszar's avatar
John Koleszar committed
198

James Zern's avatar
James Zern committed
199
  for (int i = 0; i < get_aom_decoder_count(); ++i) {
200
    const AvxInterface *const decoder = get_aom_decoder_by_index(i);
James Zern's avatar
James Zern committed
201
    fprintf(fout, "    %-6s - %s\n", decoder->name,
202
            aom_codec_iface_name(decoder->codec_interface()));
203
  }
James Zern's avatar
James Zern committed
204
}
John Koleszar's avatar
John Koleszar committed
205

James Zern's avatar
James Zern committed
206 207
/* Prints the short usage text to stderr and terminates the process with
 * EXIT_FAILURE. */
void usage_exit(void) {
  show_help(stderr, 1);
  exit(EXIT_FAILURE);
}

clang-format's avatar
clang-format committed
211 212
static int raw_read_frame(FILE *infile, uint8_t **buffer, size_t *bytes_read,
                          size_t *buffer_size) {
213
  char raw_hdr[RAW_FRAME_HDR_SZ];
214
  size_t frame_size = 0;
John Koleszar's avatar
John Koleszar committed
215

216
  if (fread(raw_hdr, RAW_FRAME_HDR_SZ, 1, infile) != 1) {
clang-format's avatar
clang-format committed
217
    if (!feof(infile)) warn("Failed to read RAW frame size\n");
218
  } else {
219 220
    const size_t kCorruptFrameThreshold = 256 * 1024 * 1024;
    const size_t kFrameTooSmallThreshold = 256 * 1024;
221
    frame_size = mem_get_le32(raw_hdr);
John Koleszar's avatar
John Koleszar committed
222

223 224 225 226
    if (frame_size > kCorruptFrameThreshold) {
      warn("Read invalid frame size (%u)\n", (unsigned int)frame_size);
      frame_size = 0;
    }
John Koleszar's avatar
John Koleszar committed
227

228 229 230
    if (frame_size < kFrameTooSmallThreshold) {
      warn("Warning: Read invalid frame size (%u) - not a raw file?\n",
           (unsigned int)frame_size);
John Koleszar's avatar
John Koleszar committed
231
    }
John Koleszar's avatar
John Koleszar committed
232

233 234 235 236 237 238 239 240
    if (frame_size > *buffer_size) {
      uint8_t *new_buf = realloc(*buffer, 2 * frame_size);
      if (new_buf) {
        *buffer = new_buf;
        *buffer_size = 2 * frame_size;
      } else {
        warn("Failed to allocate compressed data buffer\n");
        frame_size = 0;
241
      }
John Koleszar's avatar
John Koleszar committed
242
    }
243
  }
John Koleszar's avatar
John Koleszar committed
244

245 246 247 248 249 250
  if (!feof(infile)) {
    if (fread(*buffer, 1, frame_size, infile) != frame_size) {
      warn("Failed to read full frame\n");
      return 1;
    }
    *bytes_read = frame_size;
John Koleszar's avatar
John Koleszar committed
251 252
  }

253 254 255
  return 0;
}

256
static int read_frame(struct AvxDecInputContext *input, uint8_t **buf,
257
                      size_t *bytes_in_buffer, size_t *buffer_size) {
258
  switch (input->aom_input_ctx->file_type) {
259
#if CONFIG_WEBM_IO
260
    case FILE_TYPE_WEBM:
261
      return webm_read_frame(input->webm_ctx, buf, bytes_in_buffer);
262
#endif
263
    case FILE_TYPE_RAW:
264
      return raw_read_frame(input->aom_input_ctx->file, buf, bytes_in_buffer,
clang-format's avatar
clang-format committed
265
                            buffer_size);
266
    case FILE_TYPE_IVF:
267
      return ivf_read_frame(input->aom_input_ctx->file, buf, bytes_in_buffer,
clang-format's avatar
clang-format committed
268 269
                            buffer_size);
    default: return 1;
270
  }
John Koleszar's avatar
John Koleszar committed
271 272
}

273
static void update_image_md5(const aom_image_t *img, const int planes[3],
274 275 276 277 278 279 280
                             MD5Context *md5) {
  int i, y;

  for (i = 0; i < 3; ++i) {
    const int plane = planes[i];
    const unsigned char *buf = img->planes[plane];
    const int stride = img->stride[plane];
281 282 283
    const int w = aom_img_plane_width(img, plane) *
                  ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
    const int h = aom_img_plane_height(img, plane);
284 285 286 287 288 289 290 291

    for (y = 0; y < h; ++y) {
      MD5Update(md5, buf, w);
      buf += stride;
    }
  }
}

292
static void write_image_file(const aom_image_t *img, const int planes[3],
293 294
                             FILE *file) {
  int i, y;
295
#if CONFIG_HIGHBITDEPTH
296
  const int bytes_per_sample = ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
297 298 299
#else
  const int bytes_per_sample = 1;
#endif
300 301 302 303 304

  for (i = 0; i < 3; ++i) {
    const int plane = planes[i];
    const unsigned char *buf = img->planes[plane];
    const int stride = img->stride[plane];
305 306
    const int w = aom_img_plane_width(img, plane);
    const int h = aom_img_plane_height(img, plane);
307 308

    for (y = 0; y < h; ++y) {
309
      fwrite(buf, bytes_per_sample, w, file);
310 311
      buf += stride;
    }
John Koleszar's avatar
John Koleszar committed
312
  }
John Koleszar's avatar
John Koleszar committed
313 314
}

315
static int file_is_raw(struct AvxInputContext *input) {
316
  uint8_t buf[32];
John Koleszar's avatar
John Koleszar committed
317
  int is_raw = 0;
318
  aom_codec_stream_info_t si;
319

320
  if (fread(buf, 1, 32, input->file) == 32) {
John Koleszar's avatar
John Koleszar committed
321 322
    int i;

323
    if (mem_get_le32(buf) < 256 * 1024 * 1024) {
324 325 326
      for (i = 0; i < get_aom_decoder_count(); ++i) {
        const AvxInterface *const decoder = get_aom_decoder_by_index(i);
        if (!aom_codec_peek_stream_info(decoder->codec_interface(), buf + 4,
clang-format's avatar
clang-format committed
327
                                        32 - 4, &si)) {
John Koleszar's avatar
John Koleszar committed
328
          is_raw = 1;
329
          input->fourcc = decoder->fourcc;
330 331 332 333
          input->width = si.w;
          input->height = si.h;
          input->framerate.numerator = 30;
          input->framerate.denominator = 1;
John Koleszar's avatar
John Koleszar committed
334 335
          break;
        }
336 337
      }
    }
John Koleszar's avatar
John Koleszar committed
338 339
  }

340
  rewind(input->file);
John Koleszar's avatar
John Koleszar committed
341
  return is_raw;
342 343
}

344
/* Prints a one-line progress report to stderr, ending in '\r' so successive
 * reports overwrite each other.
 *
 * |frame_in| is the number of frames decoded, |frame_out| the number shown
 * and |dx_time| the accumulated decode time in microseconds. */
static void show_progress(int frame_in, int frame_out, uint64_t dx_time) {
  /* dx_time is unsigned, so it must be printed with PRIu64. */
  fprintf(stderr,
          "%d decoded frames/%d showed frames in %" PRIu64 " us (%.2f fps)\r",
          frame_in, frame_out, dx_time,
          (double)frame_out * 1000000.0 / (double)dx_time);
}

351
/* One application-owned frame buffer lent to the decoder. */
struct ExternalFrameBuffer {
  uint8_t *data; /* heap storage, allocated on demand by the get callback */
  size_t size;   /* size of |data| in bytes */
  int in_use;    /* non-zero while the decoder holds the buffer */
};

/* Pool of external frame buffers passed to the frame buffer callbacks as
 * their private data. */
struct ExternalFrameBufferList {
  int num_external_frame_buffers;      /* number of entries in |ext_fb| */
  struct ExternalFrameBuffer *ext_fb;  /* array of buffers in the pool */
};

362
// Callback used by libaom to request an external frame buffer. |cb_priv|
363 364 365
// Application private data passed into the set function. |min_size| is the
// minimum size in bytes needed to decode the next frame. |fb| pointer to the
// frame buffer.
366 367
static int get_av1_frame_buffer(void *cb_priv, size_t min_size,
                                aom_codec_frame_buffer_t *fb) {
368 369 370
  int i;
  struct ExternalFrameBufferList *const ext_fb_list =
      (struct ExternalFrameBufferList *)cb_priv;
clang-format's avatar
clang-format committed
371
  if (ext_fb_list == NULL) return -1;
372 373 374

  // Find a free frame buffer.
  for (i = 0; i < ext_fb_list->num_external_frame_buffers; ++i) {
clang-format's avatar
clang-format committed
375
    if (!ext_fb_list->ext_fb[i].in_use) break;
376 377
  }

clang-format's avatar
clang-format committed
378
  if (i == ext_fb_list->num_external_frame_buffers) return -1;
379 380 381

  if (ext_fb_list->ext_fb[i].size < min_size) {
    free(ext_fb_list->ext_fb[i].data);
382
    ext_fb_list->ext_fb[i].data = (uint8_t *)calloc(min_size, sizeof(uint8_t));
clang-format's avatar
clang-format committed
383
    if (!ext_fb_list->ext_fb[i].data) return -1;
384 385 386 387 388 389 390 391 392 393 394 395 396

    ext_fb_list->ext_fb[i].size = min_size;
  }

  fb->data = ext_fb_list->ext_fb[i].data;
  fb->size = ext_fb_list->ext_fb[i].size;
  ext_fb_list->ext_fb[i].in_use = 1;

  // Set the frame buffer's private data to point at the external frame buffer.
  fb->priv = &ext_fb_list->ext_fb[i];
  return 0;
}

397
// Callback used by libaom when there are no references to the frame buffer.
398 399
// |cb_priv| user private data passed into the set function. |fb| pointer
// to the frame buffer.
400 401
static int release_av1_frame_buffer(void *cb_priv,
                                    aom_codec_frame_buffer_t *fb) {
402 403 404 405 406 407 408
  struct ExternalFrameBuffer *const ext_fb =
      (struct ExternalFrameBuffer *)fb->priv;
  (void)cb_priv;
  ext_fb->in_use = 0;
  return 0;
}

409 410 411
/* Expands the output file name |pattern| into |out| (capacity |q_len| bytes,
 * including the terminating NUL).
 *
 * Recognized escapes:
 *   %w      frame width  (|d_w|)
 *   %h      frame height (|d_h|)
 *   %1..%9  frame number (|frame_in|), zero padded to that many digits
 * All other text is copied verbatim. Any other character after '%' is
 * reported through die(), as is a result that does not fit in |out|. */
static void generate_filename(const char *pattern, char *out, size_t q_len,
                              unsigned int d_w, unsigned int d_h,
                              unsigned int frame_in) {
  const char *p = pattern;
  char *q = out;

  /* Guards the "q_len - 1" arithmetic below against wrap-around. */
  if (q_len == 0) die("Output filename too long.\n");

  do {
    const char *next_pat = strchr(p, '%');

    if (p == next_pat) {
      int written;

      /* parse the pattern */
      switch (p[1]) {
        case 'w': written = snprintf(q, q_len, "%u", d_w); break;
        case 'h': written = snprintf(q, q_len, "%u", d_h); break;
        case '1':
        case '2':
        case '3':
        case '4':
        case '5':
        case '6':
        case '7':
        case '8':
        case '9':
          /* The digit is the minimum, zero-padded field width. */
          written = snprintf(q, q_len, "%0*u", p[1] - '0', frame_in);
          break;
        default:
          die("Unrecognized pattern %%%c\n", p[1]);
          /* die() is expected not to return; bail out rather than use an
           * unset length if it ever does. */
          return;
      }

      /* snprintf() reports the untruncated length, so truncation is
       * detected here instead of silently producing a clipped name. */
      if (written < 0 || (size_t)written >= q_len - 1)
        die("Output filename too long.\n");
      q += written;
      p += 2;
      q_len -= (size_t)written;
    } else {
      size_t copy_len;

      /* copy the next segment */
      if (!next_pat)
        copy_len = strlen(p);
      else
        copy_len = (size_t)(next_pat - p);

      if (copy_len >= q_len - 1) die("Output filename too long.\n");

      memcpy(q, p, copy_len);
      q[copy_len] = '\0';
      q += copy_len;
      p += copy_len;
      q_len -= copy_len;
    }
  } while (*p);
}

463 464 465 466 467 468 469
/* Returns 0 when |outfile_pattern| contains a frame-number escape (%1..%9),
 * meaning every frame gets its own file, and 1 otherwise. */
static int is_single_file(const char *outfile_pattern) {
  const char *p;

  /* Visit every '%' in turn; only a following digit 1..9 matters. */
  for (p = strchr(outfile_pattern, '%'); p; p = strchr(p + 1, '%')) {
    if (p[1] >= '1' && p[1] <= '9')
      return 0;  // pattern contains sequence number, so it's not unique
  }

  return 1;
}

/* Prints the 16-byte |digest| to stdout as 32 lowercase hex digits, followed
 * by two spaces, |filename| and a newline. */
static void print_md5(unsigned char digest[16], const char *filename) {
  int i;

  for (i = 0; i < 16; ++i) printf("%02x", digest[i]);
  printf("  %s\n", filename);
}

/* Opens the output destination |name| for binary writing.
 *
 * The name "-" selects stdout, which is switched to binary mode first. Any
 * other name is opened with fopen(name, "wb"); failure is reported through
 * fatal().
 * NOTE(review): fatal() presumably does not return -- confirm in
 * tools_common; otherwise NULL is returned to the caller. */
static FILE *open_outfile(const char *name) {
  if (strcmp("-", name) == 0) {
    set_binary_mode(stdout);
    return stdout;
  } else {
    FILE *file = fopen(name, "wb");
    if (!file) fatal("Failed to open output file '%s'", name);
    return file;
  }
}

494
#if CONFIG_HIGHBITDEPTH
/* Returns non-zero when |shifted| cannot be reused for |img|: its display
 * width or height differs from |img|'s, or its format is not
 * |required_fmt|. */
static int img_shifted_realloc_required(const aom_image_t *img,
                                        const aom_image_t *shifted,
                                        aom_img_fmt_t required_fmt) {
  return img->d_w != shifted->d_w || img->d_h != shifted->d_h ||
         required_fmt != shifted->fmt;
}
#endif

503
static int main_loop(int argc, const char **argv_) {
504
  aom_codec_ctx_t decoder;
clang-format's avatar
clang-format committed
505 506
  char *fn = NULL;
  int i;
James Zern's avatar
James Zern committed
507
  int ret = EXIT_FAILURE;
clang-format's avatar
clang-format committed
508 509 510 511 512 513 514 515
  uint8_t *buf = NULL;
  size_t bytes_in_buffer = 0, buffer_size = 0;
  FILE *infile;
  int frame_in = 0, frame_out = 0, flipuv = 0, noblit = 0;
  int do_md5 = 0, progress = 0, frame_parallel = 0;
  int stop_after = 0, postproc = 0, summary = 0, quiet = 1;
  int arg_skip = 0;
  int keep_going = 0;
516 517
  const AvxInterface *interface = NULL;
  const AvxInterface *fourcc_interface = NULL;
518
  uint64_t dx_time = 0;
clang-format's avatar
clang-format committed
519 520 521 522 523 524 525
  struct arg arg;
  char **argv, **argi, **argj;

  int single_file;
  int use_y4m = 1;
  int opt_yv12 = 0;
  int opt_i420 = 0;
526
  aom_codec_dec_cfg_t cfg = { 0, 0, 0, CONFIG_LOWBITDEPTH };
527
#if CONFIG_HIGHBITDEPTH
clang-format's avatar
clang-format committed
528
  unsigned int output_bit_depth = 0;
529
#endif
530
#if CONFIG_EXT_TILE
clang-format's avatar
clang-format committed
531 532
  int tile_row = -1;
  int tile_col = -1;
533
#endif  // CONFIG_EXT_TILE
clang-format's avatar
clang-format committed
534 535 536
  int frames_corrupted = 0;
  int dec_flags = 0;
  int do_scale = 0;
537
  aom_image_t *scaled_img = NULL;
538
#if CONFIG_HIGHBITDEPTH
539
  aom_image_t *img_shifted = NULL;
540
#endif
clang-format's avatar
clang-format committed
541 542 543
  int frame_avail, got_data, flush_decoder = 0;
  int num_external_frame_buffers = 0;
  struct ExternalFrameBufferList ext_fb_list = { 0, NULL };
John Koleszar's avatar
John Koleszar committed
544

545
  const char *outfile_pattern = NULL;
clang-format's avatar
clang-format committed
546
  char outfile_name[PATH_MAX] = { 0 };
547 548
  FILE *outfile = NULL;

549 550
  FILE *framestats_file = NULL;

551 552 553
  MD5Context md5_ctx;
  unsigned char md5_digest[16];

554 555
  struct AvxDecInputContext input = { NULL, NULL };
  struct AvxInputContext aom_input_ctx;
556
#if CONFIG_WEBM_IO
557 558
  struct WebmInputContext webm_ctx;
  memset(&(webm_ctx), 0, sizeof(webm_ctx));
559
  input.webm_ctx = &webm_ctx;
560
#endif
561
  input.aom_input_ctx = &aom_input_ctx;
562

John Koleszar's avatar
John Koleszar committed
563 564 565 566 567 568 569 570
  /* Parse command line */
  exec_name = argv_[0];
  argv = argv_dup(argc - 1, argv_ + 1);

  for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
    memset(&arg, 0, sizeof(arg));
    arg.argv_step = 1;

James Zern's avatar
James Zern committed
571 572 573 574
    if (arg_match(&arg, &help, argi)) {
      show_help(stdout, 0);
      exit(EXIT_SUCCESS);
    } else if (arg_match(&arg, &codecarg, argi)) {
575
      interface = get_aom_decoder_by_name(arg.val);
576 577
      if (!interface)
        die("Error: Unrecognized argument (%s) to --codec\n", arg.val);
John Koleszar's avatar
John Koleszar committed
578 579
    } else if (arg_match(&arg, &looparg, argi)) {
      // no-op
580
    } else if (arg_match(&arg, &outputfile, argi)) {
John Koleszar's avatar
John Koleszar committed
581
      outfile_pattern = arg.val;
582
    } else if (arg_match(&arg, &use_yv12, argi)) {
John Koleszar's avatar
John Koleszar committed
583 584
      use_y4m = 0;
      flipuv = 1;
585
      opt_yv12 = 1;
John Koleszar's avatar
John Koleszar committed
586 587 588
    } else if (arg_match(&arg, &use_i420, argi)) {
      use_y4m = 0;
      flipuv = 0;
589 590 591
      opt_i420 = 1;
    } else if (arg_match(&arg, &rawvideo, argi)) {
      use_y4m = 0;
592
    } else if (arg_match(&arg, &flipuvarg, argi)) {
John Koleszar's avatar
John Koleszar committed
593
      flipuv = 1;
594
    } else if (arg_match(&arg, &noblitarg, argi)) {
John Koleszar's avatar
John Koleszar committed
595
      noblit = 1;
596
    } else if (arg_match(&arg, &progressarg, argi)) {
John Koleszar's avatar
John Koleszar committed
597
      progress = 1;
598
    } else if (arg_match(&arg, &limitarg, argi)) {
John Koleszar's avatar
John Koleszar committed
599
      stop_after = arg_parse_uint(&arg);
600
    } else if (arg_match(&arg, &skiparg, argi)) {
601
      arg_skip = arg_parse_uint(&arg);
602
    } else if (arg_match(&arg, &postprocarg, argi)) {
John Koleszar's avatar
John Koleszar committed
603
      postproc = 1;
604
    } else if (arg_match(&arg, &md5arg, argi)) {
John Koleszar's avatar
John Koleszar committed
605
      do_md5 = 1;
606 607 608 609 610 611 612
    } else if (arg_match(&arg, &framestatsarg, argi)) {
      framestats_file = fopen(arg.val, "w");
      if (!framestats_file) {
        die("Error: Could not open --framestats file (%s) for writing.\n",
            arg.val);
      }
    } else if (arg_match(&arg, &summaryarg, argi)) {
John Koleszar's avatar
John Koleszar committed
613
      summary = 1;
614
    } else if (arg_match(&arg, &threadsarg, argi)) {
John Koleszar's avatar
John Koleszar committed
615
      cfg.threads = arg_parse_uint(&arg);
616
    }
617
#if CONFIG_AV1_DECODER
618 619 620
    else if (arg_match(&arg, &frameparallelarg, argi))
      frame_parallel = 1;
#endif
John Koleszar's avatar
John Koleszar committed
621 622
    else if (arg_match(&arg, &verbosearg, argi))
      quiet = 0;
623 624
    else if (arg_match(&arg, &scalearg, argi))
      do_scale = 1;
625 626
    else if (arg_match(&arg, &fb_arg, argi))
      num_external_frame_buffers = arg_parse_uint(&arg);
627 628
    else if (arg_match(&arg, &continuearg, argi))
      keep_going = 1;
629
#if CONFIG_HIGHBITDEPTH
630 631 632 633
    else if (arg_match(&arg, &outbitdeptharg, argi)) {
      output_bit_depth = arg_parse_uint(&arg);
    }
#endif
634 635 636 637 638 639
#if CONFIG_EXT_TILE
    else if (arg_match(&arg, &tiler, argi))
      tile_row = arg_parse_int(&arg);
    else if (arg_match(&arg, &tilec, argi))
      tile_col = arg_parse_int(&arg);
#endif  // CONFIG_EXT_TILE
John Koleszar's avatar
John Koleszar committed
640 641 642
    else
      argj++;
  }
John Koleszar's avatar
John Koleszar committed
643

John Koleszar's avatar
John Koleszar committed
644 645 646 647
  /* Check for unrecognized options */
  for (argi = argv; *argi; argi++)
    if (argi[0][0] == '-' && strlen(argi[0]) > 1)
      die("Error: Unrecognized option %s\n", *argi);
John Koleszar's avatar
John Koleszar committed
648

John Koleszar's avatar
John Koleszar committed
649 650
  /* Handle non-option arguments */
  fn = argv[0];
John Koleszar's avatar
John Koleszar committed
651

hanno's avatar
hanno committed
652 653
  if (!fn) {
    free(argv);
James Zern's avatar
James Zern committed
654
    fprintf(stderr, "No input file specified!\n");
John Koleszar's avatar
John Koleszar committed
655
    usage_exit();
hanno's avatar
hanno committed
656
  }
John Koleszar's avatar
John Koleszar committed
657 658
  /* Open file */
  infile = strcmp(fn, "-") ? fopen(fn, "rb") : set_binary_mode(stdin);
John Koleszar's avatar
John Koleszar committed
659

John Koleszar's avatar
John Koleszar committed
660
  if (!infile) {
661
    fatal("Failed to open input file '%s'", strcmp(fn, "-") ? fn : "stdin");
John Koleszar's avatar
John Koleszar committed
662
  }
663
#if CONFIG_OS_SUPPORT
John Koleszar's avatar
John Koleszar committed
664
  /* Make sure we don't dump to the terminal, unless forced to with -o - */
James Zern's avatar
James Zern committed
665
  if (!outfile_pattern && isatty(STDOUT_FILENO) && !do_md5 && !noblit) {
John Koleszar's avatar
John Koleszar committed
666 667 668 669 670
    fprintf(stderr,
            "Not dumping raw video to your terminal. Use '-o -' to "
            "override.\n");
    return EXIT_FAILURE;
  }
671
#endif
672 673 674
  input.aom_input_ctx->file = infile;
  if (file_is_ivf(input.aom_input_ctx))
    input.aom_input_ctx->file_type = FILE_TYPE_IVF;
675
#if CONFIG_WEBM_IO
676 677
  else if (file_is_webm(input.webm_ctx, input.aom_input_ctx))
    input.aom_input_ctx->file_type = FILE_TYPE_WEBM;
678
#endif
679 680
  else if (file_is_raw(input.aom_input_ctx))
    input.aom_input_ctx->file_type = FILE_TYPE_RAW;
John Koleszar's avatar
John Koleszar committed
681 682
  else {
    fprintf(stderr, "Unrecognized input file type.\n");
683
#if !CONFIG_WEBM_IO
684
    fprintf(stderr, "aomdec was built without WebM container support.\n");
685
#endif
John Koleszar's avatar
John Koleszar committed
686 687 688 689
    return EXIT_FAILURE;
  }

  outfile_pattern = outfile_pattern ? outfile_pattern : "-";
690
  single_file = is_single_file(outfile_pattern);
John Koleszar's avatar
John Koleszar committed
691

692 693
  if (!noblit && single_file) {
    generate_filename(outfile_pattern, outfile_name, PATH_MAX,
694
                      aom_input_ctx.width, aom_input_ctx.height, 0);
695 696 697 698
    if (do_md5)
      MD5Init(&md5_ctx);
    else
      outfile = open_outfile(outfile_name);
John Koleszar's avatar
John Koleszar committed
699 700 701 702
  }

  if (use_y4m && !noblit) {
    if (!single_file) {
clang-format's avatar
clang-format committed
703 704
      fprintf(stderr,
              "YUV4MPEG2 not supported with output patterns,"
Deb Mukherjee's avatar
Deb Mukherjee committed
705
              " try --i420 or --yv12 or --rawvideo.\n");
John Koleszar's avatar
John Koleszar committed
706
      return EXIT_FAILURE;
707
    }
John Koleszar's avatar
John Koleszar committed
708

709
#if CONFIG_WEBM_IO
710 711
    if (aom_input_ctx.file_type == FILE_TYPE_WEBM) {
      if (webm_guess_framerate(input.webm_ctx, input.aom_input_ctx)) {
clang-format's avatar
clang-format committed
712 713
        fprintf(stderr,
                "Failed to guess framerate -- error parsing "
John Koleszar's avatar
John Koleszar committed
714 715 716
                "webm file?\n");
        return EXIT_FAILURE;
      }
717
    }
718
#endif
John Koleszar's avatar
John Koleszar committed
719 720
  }

721
  fourcc_interface = get_aom_decoder_by_fourcc(aom_input_ctx.fourcc);
722 723 724 725
  if (interface && fourcc_interface && interface != fourcc_interface)
    warn("Header indicates codec: %s\n", fourcc_interface->name);
  else
    interface = fourcc_interface;
John Koleszar's avatar
John Koleszar committed
726

727
  if (!interface) interface = get_aom_decoder_by_index(0);
728

729 730 731
  dec_flags = (postproc ? AOM_CODEC_USE_POSTPROC : 0) |
              (frame_parallel ? AOM_CODEC_USE_FRAME_THREADING : 0);
  if (aom_codec_dec_init(&decoder, interface->codec_interface(), &cfg,
clang-format's avatar
clang-format committed
732
                         dec_flags)) {
733
    fprintf(stderr, "Failed to initialize decoder: %s\n",
734
            aom_codec_error(&decoder));
James Zern's avatar
James Zern committed
735
    goto fail2;
John Koleszar's avatar
John Koleszar committed
736
  }
John Koleszar's avatar
John Koleszar committed
737

clang-format's avatar
clang-format committed
738
  if (!quiet) fprintf(stderr, "%s\n", decoder.name);
John Koleszar's avatar
John Koleszar committed
739

740
#if CONFIG_AV1_DECODER && CONFIG_EXT_TILE
741 742 743 744 745
  if (aom_codec_control(&decoder, AV1_SET_DECODE_TILE_ROW, tile_row)) {
    fprintf(stderr, "Failed to set decode_tile_row: %s\n",
            aom_codec_error(&decoder));
    goto fail;
  }
746

747 748 749 750
  if (aom_codec_control(&decoder, AV1_SET_DECODE_TILE_COL, tile_col)) {
    fprintf(stderr, "Failed to set decode_tile_col: %s\n",
            aom_codec_error(&decoder));
    goto fail;
751 752
  }
#endif
753

clang-format's avatar
clang-format committed
754
  if (arg_skip) fprintf(stderr, "Skipping first %d frames.\n", arg_skip);
755
  while (arg_skip) {
clang-format's avatar
clang-format committed
756
    if (read_frame(&input, &buf, &bytes_in_buffer, &buffer_size)) break;
757 758 759
    arg_skip--;
  }

760 761 762 763
  if (num_external_frame_buffers > 0) {
    ext_fb_list.num_external_frame_buffers = num_external_frame_buffers;
    ext_fb_list.ext_fb = (struct ExternalFrameBuffer *)calloc(
        num_external_frame_buffers, sizeof(*ext_fb_list.ext_fb));
764 765
    if (aom_codec_set_frame_buffer_functions(&decoder, get_av1_frame_buffer,
                                             release_av1_frame_buffer,
clang-format's avatar
clang-format committed
766
                                             &ext_fb_list)) {
767
      fprintf(stderr, "Failed to configure external frame buffers: %s\n",
768
              aom_codec_error(&decoder));
James Zern's avatar
James Zern committed
769
      goto fail;
770 771 772
    }
  }

Scott LaVarnway's avatar
Scott LaVarnway committed
773 774 775
  frame_avail = 1;
  got_data = 0;

776 777
  if (framestats_file) fprintf(framestats_file, "bytes,qp\r\n");

John Koleszar's avatar
John Koleszar committed
778
  /* Decode file */
Scott LaVarnway's avatar
Scott LaVarnway committed
779
  while (frame_avail || got_data) {
780 781 782
    aom_codec_iter_t iter = NULL;
    aom_image_t *img;
    struct aom_usec_timer timer;
clang-format's avatar
clang-format committed
783
    int corrupted = 0;
John Koleszar's avatar
John Koleszar committed
784

Scott LaVarnway's avatar
Scott LaVarnway committed
785 786
    frame_avail = 0;
    if (!stop_after || frame_in < stop_after) {
787
      if (!read_frame(&input, &buf, &bytes_in_buffer, &buffer_size)) {
Scott LaVarnway's avatar
Scott LaVarnway committed
788 789
        frame_avail = 1;
        frame_in++;
John Koleszar's avatar
John Koleszar committed
790

791
        aom_usec_timer_start(&timer);
John Koleszar's avatar
John Koleszar committed
792

793
        if (aom_codec_decode(&decoder, buf, (unsigned int)bytes_in_buffer, NULL,
clang-format's avatar
clang-format committed
794
                             0)) {
795
          const char *detail = aom_codec_error_detail(&decoder);
clang-format's avatar
clang-format committed
796
          warn("Failed to decode frame %d: %s", frame_in,
797
               aom_codec_error(&decoder));
798

clang-format's avatar
clang-format committed
799 800
          if (detail) warn("Additional information: %s", detail);
          if (!keep_going) goto fail;
Scott LaVarnway's avatar
Scott LaVarnway committed
801 802
        }

803 804 805 806 807 808 809 810 811 812
        if (framestats_file) {
          int qp;
          if (aom_codec_control(&decoder, AOMD_GET_LAST_QUANTIZER, &qp)) {
            warn("Failed AOMD_GET_LAST_QUANTIZER: %s",
                 aom_codec_error(&decoder));
            if (!keep_going) goto fail;
          }
          fprintf(framestats_file, "%d,%d\r\n", (int)bytes_in_buffer, qp);
        }

813 814
        aom_usec_timer_mark(&timer);
        dx_time += aom_usec_timer_elapsed(&timer);
815 816
      } else {
        flush_decoder = 1;
Scott LaVarnway's avatar
Scott LaVarnway committed
817
      }
818 819
    } else {
      flush_decoder = 1;
Scott LaVarnway's avatar
Scott LaVarnway committed
820 821
    }

822
    aom_usec_timer_start(&timer);
Scott LaVarnway's avatar
Scott LaVarnway committed
823

824 825
    if (flush_decoder) {
      // Flush the decoder in frame parallel decode.
826 827
      if (aom_codec_decode(&decoder, NULL, 0, NULL, 0)) {
        warn("Failed to flush decoder: %s", aom_codec_error(&decoder));
828 829 830
      }
    }

Scott LaVarnway's avatar
Scott LaVarnway committed
831
    got_data = 0;
832
    if ((img = aom_codec_get_frame(&decoder, &iter))) {
Scott LaVarnway's avatar
Scott LaVarnway committed
833 834
      ++frame_out;
      got_data = 1;
835 836
    }

837 838
    aom_usec_timer_mark(&timer);
    dx_time += (unsigned int)aom_usec_timer_elapsed(&timer);
839

840
    if (!frame_parallel &&
841 842
        aom_codec_control(&decoder, AOMD_GET_FRAME_CORRUPTED, &corrupted)) {
      warn("Failed AOM_GET_FRAME_CORRUPTED: %s", aom_codec_error(&decoder));
clang-format's avatar
clang-format committed
843
      if (!keep_going) goto fail;
844
    }
John Koleszar's avatar
John Koleszar committed
845
    frames_corrupted += corrupted;
John Koleszar's avatar
John Koleszar committed
846

clang-format's avatar
clang-format committed
847
    if (progress) show_progress(frame_in, frame_out, dx_time);
John Koleszar's avatar
John Koleszar committed
848

849
    if (!noblit && img) {
850 851
      const int PLANES_YUV[] = { AOM_PLANE_Y, AOM_PLANE_U, AOM_PLANE_V };
      const int PLANES_YVU[] = { AOM_PLANE_Y, AOM_PLANE_V, AOM_PLANE_U };
852
      const int *planes = flipuv ? PLANES_YVU : PLANES_YUV;
853

854
      if (do_scale) {
855 856 857 858
        if (frame_out == 1) {
          // If the output frames are to be scaled to a fixed display size then
          // use the width and height specified in the container. If either of
          // these is set to 0, use the display size set in the first frame
859 860
          // header. If that is unavailable, use the raw decoded size of the
          // first decoded frame.
861 862
          int render_width = aom_input_ctx.width;
          int render_height = aom_input_ctx.height;
863 864
          if (!render_width || !render_height) {
            int render_size[2];
865
            if (aom_codec_control(&decoder, AV1D_GET_DISPLAY_SIZE,
866
                                  render_size)) {
867
              // As last resort use size of first frame as display size.
868 869
              render_width = img->d_w;
              render_height = img->d_h;
870
            } else {
871 872
              render_width = render_size[0];
              render_height = render_size[1];
873
            }
874
          }
clang-format's avatar
clang-format committed
875
          scaled_img =
876
              aom_img_alloc(NULL, img->fmt, render_width, render_height, 16);
877
          scaled_img->bit_depth = img->bit_depth;
878
        }
879

880
        if (img->d_w != scaled_img->d_w || img->d_h != scaled_img->d_h) {
881
#if CONFIG_LIBYUV
882
          libyuv_scale(img, scaled_img, kFilterBox);
883
          img = scaled_img;
884
#else
clang-format's avatar
clang-format committed
885 886
          fprintf(stderr,
                  "Failed  to scale output frame: %s.\n"
887 888
                  "Scaling is disabled in this configuration. "
                  "To enable scaling, configure with --enable-libyuv\n",
889
                  aom_codec_error(&decoder));
James Zern's avatar
James Zern committed
890
          goto fail;
891
#endif
892 893
        }
      }
894
#if CONFIG_HIGHBITDEPTH
895
      // Default to codec bit depth if output bit depth not set
896
      if (!output_bit_depth && single_file && !do_md5) {
897 898 899
        output_bit_depth = img->bit_depth;
      }
      // Shift up or down if necessary
Sebastien Alaiwan's avatar
Sebastien Alaiwan committed
900
      if (output_bit_depth != 0) {
901
        const aom_img_fmt_t shifted_fmt =
clang-format's avatar
clang-format committed
902
            output_bit_depth == 8
903 904
                ? img->fmt ^ (img->fmt & AOM_IMG_FMT_HIGHBITDEPTH)
                : img->fmt | AOM_IMG_FMT_HIGHBITDEPTH;
Sebastien Alaiwan's avatar
Sebastien Alaiwan committed
905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924

        if (shifted_fmt != img->fmt || output_bit_depth != img->bit_depth) {
          if (img_shifted &&
              img_shifted_realloc_required(img, img_shifted, shifted_fmt)) {
            aom_img_free(img_shifted);
            img_shifted = NULL;
          }
          if (!img_shifted) {
            img_shifted =
                aom_img_alloc(NULL, shifted_fmt, img->d_w, img->d_h, 16);
            img_shifted->bit_depth = output_bit_depth;
          }
          if (output_bit_depth > img->bit_depth) {
            aom_img_upshift(img_shifted, img,
                            output_bit_depth - img->bit_depth);
          } else {
            aom_img_downshift(img_shifted, img,
                              img->bit_depth - output_bit_depth);
          }
          img = img_shifted;
925 926 927
        }
      }
#endif
928

929
#if CONFIG_EXT_TILE
930 931
      aom_input_ctx.width = img->d_w;
      aom_input_ctx.height = img->d_h;
932 933
#endif  // CONFIG_EXT_TILE

934
      if (single_file) {
935
        if (use_y4m) {
936
          char y4m_buf[Y4M_BUFFER_SIZE] = { 0 };
937
          size_t len = 0;
938
          if (img->fmt == AOM_IMG_FMT_I440 || img->fmt == AOM_IMG_FMT_I44016) {
Deb Mukherjee's avatar
Deb Mukherjee committed
939 940 941
            fprintf(stderr, "Cannot produce y4m output for 440 sampling.\n");
            goto fail;
          }
942 943
          if (frame_out == 1) {
            // Y4M file header
clang-format's avatar
clang-format committed
944
            len = y4m_write_file_header(
945 946 947
                y4m_buf, sizeof(y4m_buf), aom_input_ctx.width,
                aom_input_ctx.height, &aom_input_ctx.framerate, img->fmt,
                img->bit_depth);
948
            if (do_md5) {
949
              MD5Update(&md5_ctx, (md5byte *)y4m_buf, (unsigned int)len);
950
            } else {
951
              fputs(y4m_buf, outfile);
952 953 954 955
            }
          }

          // Y4M frame header
956
          len = y4m_write_frame_header(y4m_buf, sizeof(y4m_buf));
957
          if (do_md5) {
958
            MD5Update(&md5_ctx, (md5byte *)y4m_buf, (unsigned int)len);
959
          } else {
960
            fputs(y4m_buf, outfile);
961
          }
962 963 964 965 966
        } else {
          if (frame_out == 1) {
            // Check if --yv12 or --i420 options are consistent with the
            // bit-stream decoded
            if (opt_i420) {
967 968
              if (img->fmt != AOM_IMG_FMT_I420 &&
                  img->fmt != AOM_IMG_FMT_I42016) {
969 970 971 972 973
                fprintf(stderr, "Cannot produce i420 output for bit-stream.\n");
                goto fail;
              }
            }
            if (opt_yv12) {
974 975
              if ((img->fmt != AOM_IMG_FMT_I420 &&
                   img->fmt != AOM_IMG_FMT_YV12) ||
clang-format's avatar