OSUOSL/Nero are experiencing Internet connectivity problems. This affects us as we're hosted with OSUOSL. We apologize for the inconvenience.

aomdec.c 35.1 KB
Newer Older
John Koleszar's avatar
John Koleszar committed
1
/*
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
John Koleszar's avatar
John Koleszar committed
3
 *
4 5 6 7 8 9
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
John Koleszar's avatar
John Koleszar committed
10 11
 */

12
#include <assert.h>
John Koleszar's avatar
John Koleszar committed
13 14 15 16
#include <stdio.h>
#include <stdlib.h>
#include <stdarg.h>
#include <string.h>
17
#include <limits.h>
18

19
#include "./aom_config.h"
20

James Zern's avatar
James Zern committed
21 22 23 24 25 26 27 28
#if CONFIG_OS_SUPPORT
#if HAVE_UNISTD_H
#include <unistd.h>  // NOLINT
#elif !defined(STDOUT_FILENO)
#define STDOUT_FILENO 1
#endif
#endif

29
#if CONFIG_LIBYUV
30
#include "third_party/libyuv/include/libyuv/scale.h"
31
#endif
32 33

#include "./args.h"
34 35
#include "./ivfdec.h"

36
#include "aom/aom_decoder.h"
37
#include "aom_ports/mem_ops.h"
38
#include "aom_ports/aom_timer.h"
39

40 41
#if CONFIG_AV1_DECODER
#include "aom/aomdx.h"
John Koleszar's avatar
John Koleszar committed
42
#endif
43

44
#include "./md5_utils.h"
45

46 47 48 49
#if CONFIG_OBU_NO_IVF
#include "./obudec.h"
#endif

50
#include "./tools_common.h"
51
#if CONFIG_WEBM_IO
52
#include "./webmdec.h"
53
#endif
54

55
#include "./y4menc.h"
John Koleszar's avatar
John Koleszar committed
56 57 58

/* Program name printed in the usage banner; main_loop() sets it from its
 * first argv entry. */
static const char *exec_name;

/* Bundles the generic input context with the WebM-specific one so that
 * read_frame() can dispatch on the detected file type. |webm_ctx| is only
 * pointed at real state when the tool is built with CONFIG_WEBM_IO. */
struct AvxDecInputContext {
  struct AvxInputContext *aom_input_ctx;
  struct WebmInputContext *webm_ctx;
};

James Zern's avatar
James Zern committed
64 65
/* Command-line option definitions.
 * NOTE(review): the ARG_DEF fields appear to be short name, long name,
 * whether the option takes a value (1) or is a plain flag (0), and the help
 * text -- confirm against args.h. */
static const arg_def_t help =
    ARG_DEF(NULL, "help", 0, "Show usage options and exit");
static const arg_def_t looparg =
    ARG_DEF(NULL, "loops", 1, "Number of times to decode the file");
static const arg_def_t codecarg = ARG_DEF(NULL, "codec", 1, "Codec to use");
static const arg_def_t use_yv12 =
    ARG_DEF(NULL, "yv12", 0, "Output raw YV12 frames");
static const arg_def_t use_i420 =
    ARG_DEF(NULL, "i420", 0, "Output raw I420 frames");
static const arg_def_t flipuvarg =
    ARG_DEF(NULL, "flipuv", 0, "Flip the chroma planes in the output");
static const arg_def_t rawvideo =
    ARG_DEF(NULL, "rawvideo", 0, "Output raw YUV frames");
static const arg_def_t noblitarg =
    ARG_DEF(NULL, "noblit", 0, "Don't process the decoded frames");
static const arg_def_t progressarg =
    ARG_DEF(NULL, "progress", 0, "Show progress after each frame decodes");
static const arg_def_t limitarg =
    ARG_DEF(NULL, "limit", 1, "Stop decoding after n frames");
static const arg_def_t skiparg =
    ARG_DEF(NULL, "skip", 1, "Skip the first n input frames");
static const arg_def_t postprocarg =
    ARG_DEF(NULL, "postproc", 0, "Postprocess decoded frames");
static const arg_def_t summaryarg =
    ARG_DEF(NULL, "summary", 0, "Show timing summary");
static const arg_def_t outputfile =
    ARG_DEF("o", "output", 1, "Output file name pattern (see below)");
static const arg_def_t threadsarg =
    ARG_DEF("t", "threads", 1, "Max threads to use");
static const arg_def_t frameparallelarg =
    ARG_DEF(NULL, "frame-parallel", 0, "Frame parallel decode");
static const arg_def_t verbosearg =
    ARG_DEF("v", "verbose", 0, "Show version string");
static const arg_def_t scalearg =
    ARG_DEF("S", "scale", 0, "Scale output frames uniformly");
static const arg_def_t continuearg =
    ARG_DEF("k", "keep-going", 0, "(debug) Continue decoding after error");
static const arg_def_t fb_arg =
    ARG_DEF(NULL, "frame-buffers", 1, "Number of frame buffers to use");
static const arg_def_t md5arg =
    ARG_DEF(NULL, "md5", 0, "Compute the MD5 sum of the decoded frame");
static const arg_def_t framestatsarg =
    ARG_DEF(NULL, "framestats", 1, "Output per-frame stats (.csv format)");
#if CONFIG_HIGHBITDEPTH
static const arg_def_t outbitdeptharg =
    ARG_DEF(NULL, "output-bit-depth", 1, "Output bit-depth for decoded frames");
#endif
#if CONFIG_EXT_TILE
static const arg_def_t tiler = ARG_DEF(NULL, "tile-row", 1,
                                       "Row index of tile to decode "
                                       "(-1 for all rows)");
static const arg_def_t tilec = ARG_DEF(NULL, "tile-column", 1,
                                       "Column index of tile to decode "
                                       "(-1 for all columns)");
#endif  // CONFIG_EXT_TILE
Dmitry Kovalev's avatar
Dmitry Kovalev committed
119

James Zern's avatar
James Zern committed
120 121
static const arg_def_t *all_args[] = { &help,
                                       &codecarg,
clang-format's avatar
clang-format committed
122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138
                                       &use_yv12,
                                       &use_i420,
                                       &flipuvarg,
                                       &rawvideo,
                                       &noblitarg,
                                       &progressarg,
                                       &limitarg,
                                       &skiparg,
                                       &postprocarg,
                                       &summaryarg,
                                       &outputfile,
                                       &threadsarg,
                                       &frameparallelarg,
                                       &verbosearg,
                                       &scalearg,
                                       &fb_arg,
                                       &md5arg,
139
                                       &framestatsarg,
clang-format's avatar
clang-format committed
140
                                       &continuearg,
141
#if CONFIG_HIGHBITDEPTH
clang-format's avatar
clang-format committed
142
                                       &outbitdeptharg,
143
#endif
144
#if CONFIG_EXT_TILE
clang-format's avatar
clang-format committed
145 146
                                       &tiler,
                                       &tilec,
147
#endif  // CONFIG_EXT_TILE
clang-format's avatar
clang-format committed
148
                                       NULL };
John Koleszar's avatar
John Koleszar committed
149

150
#if CONFIG_LIBYUV
/* Scales |src| into |dst| with libyuv using filter |mode| and returns the
 * libyuv call's result. Both images must share the same format: I420, or
 * I42016 when built with CONFIG_HIGHBITDEPTH (checked with assert only). */
static INLINE int libyuv_scale(aom_image_t *src, aom_image_t *dst,
                               FilterModeEnum mode) {
#if CONFIG_HIGHBITDEPTH
  if (src->fmt == AOM_IMG_FMT_I42016) {
    assert(dst->fmt == AOM_IMG_FMT_I42016);
    // Planes are handed over as uint16_t samples, so every stride is halved.
    // NOTE(review): this presumes aom_image_t strides are in bytes -- confirm.
    return I420Scale_16(
        (uint16_t *)src->planes[AOM_PLANE_Y], src->stride[AOM_PLANE_Y] / 2,
        (uint16_t *)src->planes[AOM_PLANE_U], src->stride[AOM_PLANE_U] / 2,
        (uint16_t *)src->planes[AOM_PLANE_V], src->stride[AOM_PLANE_V] / 2,
        src->d_w, src->d_h, (uint16_t *)dst->planes[AOM_PLANE_Y],
        dst->stride[AOM_PLANE_Y] / 2, (uint16_t *)dst->planes[AOM_PLANE_U],
        dst->stride[AOM_PLANE_U] / 2, (uint16_t *)dst->planes[AOM_PLANE_V],
        dst->stride[AOM_PLANE_V] / 2, dst->d_w, dst->d_h, mode);
  }
#endif
  assert(src->fmt == AOM_IMG_FMT_I420);
  assert(dst->fmt == AOM_IMG_FMT_I420);
  return I420Scale(src->planes[AOM_PLANE_Y], src->stride[AOM_PLANE_Y],
                   src->planes[AOM_PLANE_U], src->stride[AOM_PLANE_U],
                   src->planes[AOM_PLANE_V], src->stride[AOM_PLANE_V], src->d_w,
                   src->d_h, dst->planes[AOM_PLANE_Y], dst->stride[AOM_PLANE_Y],
                   dst->planes[AOM_PLANE_U], dst->stride[AOM_PLANE_U],
                   dst->planes[AOM_PLANE_V], dst->stride[AOM_PLANE_V], dst->d_w,
                   dst->d_h, mode);
}
#endif
177

James Zern's avatar
James Zern committed
178 179
void show_help(FILE *fout, int shorthelp) {
  fprintf(fout, "Usage: %s <options> filename\n\n", exec_name);
John Koleszar's avatar
John Koleszar committed
180

James Zern's avatar
James Zern committed
181 182 183 184 185 186 187 188
  if (shorthelp) {
    fprintf(fout, "Use --help to see the full list of options.\n");
    return;
  }

  fprintf(fout, "Options:\n");
  arg_show_usage(fout, all_args);
  fprintf(fout,
John Koleszar's avatar
John Koleszar committed
189 190 191 192 193
          "\nOutput File Patterns:\n\n"
          "  The -o argument specifies the name of the file(s) to "
          "write to. If the\n  argument does not include any escape "
          "characters, the output will be\n  written to a single file. "
          "Otherwise, the filename will be calculated by\n  expanding "
John Koleszar's avatar
John Koleszar committed
194
          "the following escape characters:\n");
James Zern's avatar
James Zern committed
195
  fprintf(fout,
John Koleszar's avatar
John Koleszar committed
196 197 198 199 200
          "\n\t%%w   - Frame width"
          "\n\t%%h   - Frame height"
          "\n\t%%<n> - Frame number, zero padded to <n> places (1..9)"
          "\n\n  Pattern arguments are only supported in conjunction "
          "with the --yv12 and\n  --i420 options. If the -o option is "
clang-format's avatar
clang-format committed
201
          "not specified, the output will be\n  directed to stdout.\n");
James Zern's avatar
James Zern committed
202
  fprintf(fout, "\nIncluded decoders:\n\n");
John Koleszar's avatar
John Koleszar committed
203

James Zern's avatar
James Zern committed
204
  for (int i = 0; i < get_aom_decoder_count(); ++i) {
205
    const AvxInterface *const decoder = get_aom_decoder_by_index(i);
James Zern's avatar
James Zern committed
206
    fprintf(fout, "    %-6s - %s\n", decoder->name,
207
            aom_codec_iface_name(decoder->codec_interface()));
208
  }
James Zern's avatar
James Zern committed
209
}
John Koleszar's avatar
John Koleszar committed
210

James Zern's avatar
James Zern committed
211 212
/* Prints the short usage text to stderr and terminates the process with
 * EXIT_FAILURE. */
void usage_exit(void) {
  show_help(stderr, 1);
  exit(EXIT_FAILURE);
}

clang-format's avatar
clang-format committed
216 217
static int raw_read_frame(FILE *infile, uint8_t **buffer, size_t *bytes_read,
                          size_t *buffer_size) {
218
  char raw_hdr[RAW_FRAME_HDR_SZ];
219
  size_t frame_size = 0;
John Koleszar's avatar
John Koleszar committed
220

221
  if (fread(raw_hdr, RAW_FRAME_HDR_SZ, 1, infile) != 1) {
clang-format's avatar
clang-format committed
222
    if (!feof(infile)) warn("Failed to read RAW frame size\n");
223
  } else {
224 225
    const size_t kCorruptFrameThreshold = 256 * 1024 * 1024;
    const size_t kFrameTooSmallThreshold = 256 * 1024;
226
    frame_size = mem_get_le32(raw_hdr);
John Koleszar's avatar
John Koleszar committed
227

228 229 230 231
    if (frame_size > kCorruptFrameThreshold) {
      warn("Read invalid frame size (%u)\n", (unsigned int)frame_size);
      frame_size = 0;
    }
John Koleszar's avatar
John Koleszar committed
232

233 234 235
    if (frame_size < kFrameTooSmallThreshold) {
      warn("Warning: Read invalid frame size (%u) - not a raw file?\n",
           (unsigned int)frame_size);
John Koleszar's avatar
John Koleszar committed
236
    }
John Koleszar's avatar
John Koleszar committed
237

238 239 240 241 242 243 244 245
    if (frame_size > *buffer_size) {
      uint8_t *new_buf = realloc(*buffer, 2 * frame_size);
      if (new_buf) {
        *buffer = new_buf;
        *buffer_size = 2 * frame_size;
      } else {
        warn("Failed to allocate compressed data buffer\n");
        frame_size = 0;
246
      }
John Koleszar's avatar
John Koleszar committed
247
    }
248
  }
John Koleszar's avatar
John Koleszar committed
249

250 251 252 253 254 255
  if (!feof(infile)) {
    if (fread(*buffer, 1, frame_size, infile) != frame_size) {
      warn("Failed to read full frame\n");
      return 1;
    }
    *bytes_read = frame_size;
John Koleszar's avatar
John Koleszar committed
256 257
  }

258 259 260
  return 0;
}

261
static int read_frame(struct AvxDecInputContext *input, uint8_t **buf,
262
                      size_t *bytes_in_buffer, size_t *buffer_size) {
263
  switch (input->aom_input_ctx->file_type) {
264
#if CONFIG_WEBM_IO
265
    case FILE_TYPE_WEBM:
266
      return webm_read_frame(input->webm_ctx, buf, bytes_in_buffer);
267
#endif
268
    case FILE_TYPE_RAW:
269
      return raw_read_frame(input->aom_input_ctx->file, buf, bytes_in_buffer,
clang-format's avatar
clang-format committed
270
                            buffer_size);
271
    case FILE_TYPE_IVF:
272
      return ivf_read_frame(input->aom_input_ctx->file, buf, bytes_in_buffer,
clang-format's avatar
clang-format committed
273
                            buffer_size);
274 275 276 277 278
#if CONFIG_OBU_NO_IVF
    case FILE_TYPE_OBU:
      return obu_read_temporal_unit(input->aom_input_ctx->file, buf,
                                    bytes_in_buffer, buffer_size);
#endif
clang-format's avatar
clang-format committed
279
    default: return 1;
280
  }
John Koleszar's avatar
John Koleszar committed
281 282
}

283
static void update_image_md5(const aom_image_t *img, const int planes[3],
284 285 286 287 288 289 290
                             MD5Context *md5) {
  int i, y;

  for (i = 0; i < 3; ++i) {
    const int plane = planes[i];
    const unsigned char *buf = img->planes[plane];
    const int stride = img->stride[plane];
291 292 293
    const int w = aom_img_plane_width(img, plane) *
                  ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
    const int h = aom_img_plane_height(img, plane);
294 295 296 297 298 299 300 301

    for (y = 0; y < h; ++y) {
      MD5Update(md5, buf, w);
      buf += stride;
    }
  }
}

302 303
static void write_image_file(const aom_image_t *img, const int *planes,
                             const int num_planes, FILE *file) {
304
  int i, y;
305
#if CONFIG_HIGHBITDEPTH
306
  const int bytes_per_sample = ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) ? 2 : 1);
307 308 309
#else
  const int bytes_per_sample = 1;
#endif
310

311
  for (i = 0; i < num_planes; ++i) {
312 313 314
    const int plane = planes[i];
    const unsigned char *buf = img->planes[plane];
    const int stride = img->stride[plane];
315 316
    const int w = aom_img_plane_width(img, plane);
    const int h = aom_img_plane_height(img, plane);
317 318

    for (y = 0; y < h; ++y) {
319
      fwrite(buf, bytes_per_sample, w, file);
320 321
      buf += stride;
    }
John Koleszar's avatar
John Koleszar committed
322
  }
John Koleszar's avatar
John Koleszar committed
323 324
}

325
static int file_is_raw(struct AvxInputContext *input) {
326
  uint8_t buf[32];
John Koleszar's avatar
John Koleszar committed
327
  int is_raw = 0;
328
  aom_codec_stream_info_t si;
329

330
  if (fread(buf, 1, 32, input->file) == 32) {
John Koleszar's avatar
John Koleszar committed
331 332
    int i;

333
    if (mem_get_le32(buf) < 256 * 1024 * 1024) {
334 335 336
      for (i = 0; i < get_aom_decoder_count(); ++i) {
        const AvxInterface *const decoder = get_aom_decoder_by_index(i);
        if (!aom_codec_peek_stream_info(decoder->codec_interface(), buf + 4,
clang-format's avatar
clang-format committed
337
                                        32 - 4, &si)) {
John Koleszar's avatar
John Koleszar committed
338
          is_raw = 1;
339
          input->fourcc = decoder->fourcc;
340 341 342 343
          input->width = si.w;
          input->height = si.h;
          input->framerate.numerator = 30;
          input->framerate.denominator = 1;
John Koleszar's avatar
John Koleszar committed
344 345
          break;
        }
346 347
      }
    }
John Koleszar's avatar
John Koleszar committed
348 349
  }

350
  rewind(input->file);
John Koleszar's avatar
John Koleszar committed
351
  return is_raw;
352 353
}

354
/* Prints a one-line progress report to stderr, ending in '\r' so that the
 * next report overwrites it. |dx_time| is the accumulated decode time in
 * microseconds. The fps figure is |frame_out| per second of decode time. */
static void show_progress(int frame_in, int frame_out, uint64_t dx_time) {
  // dx_time is unsigned, so it is printed with the unsigned 64-bit conversion.
  fprintf(stderr,
          "%d decoded frames/%d showed frames in %" PRIu64 " us (%.2f fps)\r",
          frame_in, frame_out, dx_time,
          (double)frame_out * 1000000.0 / (double)dx_time);
}

361
/* One application-owned frame buffer lent to the decoder. */
struct ExternalFrameBuffer {
  uint8_t *data;  // Buffer memory, allocated on demand by the get callback.
  size_t size;    // Number of bytes allocated at |data|.
  int in_use;     // Non-zero while the decoder holds the buffer.
};

/* Pool of external frame buffers, passed to the frame-buffer callbacks as
 * their private data. */
struct ExternalFrameBufferList {
  int num_external_frame_buffers;      // Number of entries in |ext_fb|.
  struct ExternalFrameBuffer *ext_fb;  // Array of pool entries.
};

372
// Callback used by libaom to request an external frame buffer. |cb_priv|
373 374 375
// Application private data passed into the set function. |min_size| is the
// minimum size in bytes needed to decode the next frame. |fb| pointer to the
// frame buffer.
376 377
static int get_av1_frame_buffer(void *cb_priv, size_t min_size,
                                aom_codec_frame_buffer_t *fb) {
378 379 380
  int i;
  struct ExternalFrameBufferList *const ext_fb_list =
      (struct ExternalFrameBufferList *)cb_priv;
clang-format's avatar
clang-format committed
381
  if (ext_fb_list == NULL) return -1;
382 383 384

  // Find a free frame buffer.
  for (i = 0; i < ext_fb_list->num_external_frame_buffers; ++i) {
clang-format's avatar
clang-format committed
385
    if (!ext_fb_list->ext_fb[i].in_use) break;
386 387
  }

clang-format's avatar
clang-format committed
388
  if (i == ext_fb_list->num_external_frame_buffers) return -1;
389 390 391

  if (ext_fb_list->ext_fb[i].size < min_size) {
    free(ext_fb_list->ext_fb[i].data);
392
    ext_fb_list->ext_fb[i].data = (uint8_t *)calloc(min_size, sizeof(uint8_t));
clang-format's avatar
clang-format committed
393
    if (!ext_fb_list->ext_fb[i].data) return -1;
394 395 396 397 398 399 400 401 402 403 404 405 406

    ext_fb_list->ext_fb[i].size = min_size;
  }

  fb->data = ext_fb_list->ext_fb[i].data;
  fb->size = ext_fb_list->ext_fb[i].size;
  ext_fb_list->ext_fb[i].in_use = 1;

  // Set the frame buffer's private data to point at the external frame buffer.
  fb->priv = &ext_fb_list->ext_fb[i];
  return 0;
}

407
// Callback used by libaom when there are no references to the frame buffer.
408 409
// |cb_priv| user private data passed into the set function. |fb| pointer
// to the frame buffer.
410 411
static int release_av1_frame_buffer(void *cb_priv,
                                    aom_codec_frame_buffer_t *fb) {
412 413 414 415 416 417 418
  struct ExternalFrameBuffer *const ext_fb =
      (struct ExternalFrameBuffer *)fb->priv;
  (void)cb_priv;
  ext_fb->in_use = 0;
  return 0;
}

419 420 421
/* Expands the output-file |pattern| into |out|, a buffer of |q_len| bytes.
 *
 * Recognized escapes:
 *   %w      frame width  (|d_w|)
 *   %h      frame height (|d_h|)
 *   %1..%9  frame number (|frame_in|), zero padded to that many digits
 * All other text is copied verbatim. Any other character after '%',
 * including the end of the string, is reported through die(), as is an
 * expansion that does not fit in |out|.
 */
static void generate_filename(const char *pattern, char *out, size_t q_len,
                              unsigned int d_w, unsigned int d_h,
                              unsigned int frame_in) {
  const char *p = pattern;
  char *q = out;

  do {
    const char *next_pat = strchr(p, '%');

    if (p == next_pat) {
      int written = -1;

      /* parse the pattern */
      switch (p[1]) {
        case 'w': written = snprintf(q, q_len, "%u", d_w); break;
        case 'h': written = snprintf(q, q_len, "%u", d_h); break;
        case '1':
        case '2':
        case '3':
        case '4':
        case '5':
        case '6':
        case '7':
        case '8':
        case '9':
          /* The digit after '%' is the zero-padded field width. */
          written = snprintf(q, q_len, "%0*u", p[1] - '0', frame_in);
          break;
        default: die("Unrecognized pattern %%%c\n", p[1]); break;
      }

      /* snprintf returns the untruncated length, so this detects overflow
       * instead of silently cutting the name short. The threshold matches
       * the literal-copy branch below. */
      if (written < 0 || (size_t)written >= q_len - 1)
        die("Output filename too long.\n");
      q += written;
      p += 2;
      q_len -= (size_t)written;
    } else {
      size_t copy_len;

      /* copy the next segment */
      if (!next_pat)
        copy_len = strlen(p);
      else
        copy_len = (size_t)(next_pat - p);

      if (copy_len >= q_len - 1) die("Output filename too long.\n");

      memcpy(q, p, copy_len);
      q[copy_len] = '\0';
      q += copy_len;
      p += copy_len;
      q_len -= copy_len;
    }
  } while (*p);
}

473 474 475 476 477 478 479
/* Returns 0 if |outfile_pattern| contains a frame-number escape ('%'
 * followed by a digit 1..9), meaning it expands to a different name per
 * frame. Returns 1 otherwise. Any other character after '%' is ignored
 * here. */
static int is_single_file(const char *outfile_pattern) {
  const char *p = outfile_pattern;

  do {
    p = strchr(p, '%');
    if (p && p[1] >= '1' && p[1] <= '9')
      return 0;  // pattern contains sequence number, so it's not unique
    if (p) p++;  // step past this '%' and keep searching
  } while (p);

  return 1;
}

/* Prints the 16-byte |digest| to stdout as 32 lowercase hex digits, followed
 * by two spaces, |filename| and a newline. */
static void print_md5(unsigned char digest[16], const char *filename) {
  int i;

  for (i = 0; i < 16; ++i) printf("%02x", digest[i]);
  printf("  %s\n", filename);
}

/* Opens the output stream for |name|. The name "-" selects stdout, switched
 * to binary mode. Any other name is opened with fopen in "wb" mode, and a
 * failure to open is reported through fatal(). */
static FILE *open_outfile(const char *name) {
  if (strcmp("-", name) == 0) {
    set_binary_mode(stdout);
    return stdout;
  } else {
    FILE *file = fopen(name, "wb");
    if (!file) fatal("Failed to open output file '%s'", name);
    return file;
  }
}

504
#if CONFIG_HIGHBITDEPTH
/* Returns non-zero when |shifted| cannot be reused for |img|: its display
 * width or height differs from |img|'s, or its format is not
 * |required_fmt|. */
static int img_shifted_realloc_required(const aom_image_t *img,
                                        const aom_image_t *shifted,
                                        aom_img_fmt_t required_fmt) {
  return img->d_w != shifted->d_w || img->d_h != shifted->d_h ||
         required_fmt != shifted->fmt;
}
#endif

513
static int main_loop(int argc, const char **argv_) {
514
  aom_codec_ctx_t decoder;
clang-format's avatar
clang-format committed
515 516
  char *fn = NULL;
  int i;
James Zern's avatar
James Zern committed
517
  int ret = EXIT_FAILURE;
clang-format's avatar
clang-format committed
518 519 520 521 522 523 524 525
  uint8_t *buf = NULL;
  size_t bytes_in_buffer = 0, buffer_size = 0;
  FILE *infile;
  int frame_in = 0, frame_out = 0, flipuv = 0, noblit = 0;
  int do_md5 = 0, progress = 0, frame_parallel = 0;
  int stop_after = 0, postproc = 0, summary = 0, quiet = 1;
  int arg_skip = 0;
  int keep_going = 0;
526 527
  const AvxInterface *interface = NULL;
  const AvxInterface *fourcc_interface = NULL;
528
  uint64_t dx_time = 0;
clang-format's avatar
clang-format committed
529 530 531 532 533 534 535
  struct arg arg;
  char **argv, **argi, **argj;

  int single_file;
  int use_y4m = 1;
  int opt_yv12 = 0;
  int opt_i420 = 0;
536
  aom_codec_dec_cfg_t cfg = { 0, 0, 0, CONFIG_LOWBITDEPTH };
537
#if CONFIG_HIGHBITDEPTH
clang-format's avatar
clang-format committed
538
  unsigned int output_bit_depth = 0;
539
#endif
540
#if CONFIG_EXT_TILE
clang-format's avatar
clang-format committed
541 542
  int tile_row = -1;
  int tile_col = -1;
543
#endif  // CONFIG_EXT_TILE
clang-format's avatar
clang-format committed
544 545 546
  int frames_corrupted = 0;
  int dec_flags = 0;
  int do_scale = 0;
547
  aom_image_t *scaled_img = NULL;
548
#if CONFIG_HIGHBITDEPTH
549
  aom_image_t *img_shifted = NULL;
550
#endif
clang-format's avatar
clang-format committed
551 552 553
  int frame_avail, got_data, flush_decoder = 0;
  int num_external_frame_buffers = 0;
  struct ExternalFrameBufferList ext_fb_list = { 0, NULL };
John Koleszar's avatar
John Koleszar committed
554

555
  const char *outfile_pattern = NULL;
clang-format's avatar
clang-format committed
556
  char outfile_name[PATH_MAX] = { 0 };
557 558
  FILE *outfile = NULL;

559 560
  FILE *framestats_file = NULL;

561 562 563
  MD5Context md5_ctx;
  unsigned char md5_digest[16];

564 565
  struct AvxDecInputContext input = { NULL, NULL };
  struct AvxInputContext aom_input_ctx;
566
#if CONFIG_WEBM_IO
567 568
  struct WebmInputContext webm_ctx;
  memset(&(webm_ctx), 0, sizeof(webm_ctx));
569
  input.webm_ctx = &webm_ctx;
570
#endif
571
  input.aom_input_ctx = &aom_input_ctx;
572

John Koleszar's avatar
John Koleszar committed
573 574 575 576 577 578 579 580
  /* Parse command line */
  exec_name = argv_[0];
  argv = argv_dup(argc - 1, argv_ + 1);

  for (argi = argj = argv; (*argj = *argi); argi += arg.argv_step) {
    memset(&arg, 0, sizeof(arg));
    arg.argv_step = 1;

James Zern's avatar
James Zern committed
581 582 583 584
    if (arg_match(&arg, &help, argi)) {
      show_help(stdout, 0);
      exit(EXIT_SUCCESS);
    } else if (arg_match(&arg, &codecarg, argi)) {
585
      interface = get_aom_decoder_by_name(arg.val);
586 587
      if (!interface)
        die("Error: Unrecognized argument (%s) to --codec\n", arg.val);
John Koleszar's avatar
John Koleszar committed
588 589
    } else if (arg_match(&arg, &looparg, argi)) {
      // no-op
590
    } else if (arg_match(&arg, &outputfile, argi)) {
John Koleszar's avatar
John Koleszar committed
591
      outfile_pattern = arg.val;
592
    } else if (arg_match(&arg, &use_yv12, argi)) {
John Koleszar's avatar
John Koleszar committed
593 594
      use_y4m = 0;
      flipuv = 1;
595
      opt_yv12 = 1;
John Koleszar's avatar
John Koleszar committed
596 597 598
    } else if (arg_match(&arg, &use_i420, argi)) {
      use_y4m = 0;
      flipuv = 0;
599 600 601
      opt_i420 = 1;
    } else if (arg_match(&arg, &rawvideo, argi)) {
      use_y4m = 0;
602
    } else if (arg_match(&arg, &flipuvarg, argi)) {
John Koleszar's avatar
John Koleszar committed
603
      flipuv = 1;
604
    } else if (arg_match(&arg, &noblitarg, argi)) {
John Koleszar's avatar
John Koleszar committed
605
      noblit = 1;
606
    } else if (arg_match(&arg, &progressarg, argi)) {
John Koleszar's avatar
John Koleszar committed
607
      progress = 1;
608
    } else if (arg_match(&arg, &limitarg, argi)) {
John Koleszar's avatar
John Koleszar committed
609
      stop_after = arg_parse_uint(&arg);
610
    } else if (arg_match(&arg, &skiparg, argi)) {
611
      arg_skip = arg_parse_uint(&arg);
612
    } else if (arg_match(&arg, &postprocarg, argi)) {
John Koleszar's avatar
John Koleszar committed
613
      postproc = 1;
614
    } else if (arg_match(&arg, &md5arg, argi)) {
John Koleszar's avatar
John Koleszar committed
615
      do_md5 = 1;
616 617 618 619 620 621 622
    } else if (arg_match(&arg, &framestatsarg, argi)) {
      framestats_file = fopen(arg.val, "w");
      if (!framestats_file) {
        die("Error: Could not open --framestats file (%s) for writing.\n",
            arg.val);
      }
    } else if (arg_match(&arg, &summaryarg, argi)) {
John Koleszar's avatar
John Koleszar committed
623
      summary = 1;
624
    } else if (arg_match(&arg, &threadsarg, argi)) {
John Koleszar's avatar
John Koleszar committed
625
      cfg.threads = arg_parse_uint(&arg);
626
    }
627
#if CONFIG_AV1_DECODER
628 629 630
    else if (arg_match(&arg, &frameparallelarg, argi))
      frame_parallel = 1;
#endif
John Koleszar's avatar
John Koleszar committed
631 632
    else if (arg_match(&arg, &verbosearg, argi))
      quiet = 0;
633 634
    else if (arg_match(&arg, &scalearg, argi))
      do_scale = 1;
635 636
    else if (arg_match(&arg, &fb_arg, argi))
      num_external_frame_buffers = arg_parse_uint(&arg);
637 638
    else if (arg_match(&arg, &continuearg, argi))
      keep_going = 1;
639
#if CONFIG_HIGHBITDEPTH
640 641 642 643
    else if (arg_match(&arg, &outbitdeptharg, argi)) {
      output_bit_depth = arg_parse_uint(&arg);
    }
#endif
644 645 646 647 648 649
#if CONFIG_EXT_TILE
    else if (arg_match(&arg, &tiler, argi))
      tile_row = arg_parse_int(&arg);
    else if (arg_match(&arg, &tilec, argi))
      tile_col = arg_parse_int(&arg);
#endif  // CONFIG_EXT_TILE
John Koleszar's avatar
John Koleszar committed
650 651 652
    else
      argj++;
  }
John Koleszar's avatar
John Koleszar committed
653

John Koleszar's avatar
John Koleszar committed
654 655 656 657
  /* Check for unrecognized options */
  for (argi = argv; *argi; argi++)
    if (argi[0][0] == '-' && strlen(argi[0]) > 1)
      die("Error: Unrecognized option %s\n", *argi);
John Koleszar's avatar
John Koleszar committed
658

John Koleszar's avatar
John Koleszar committed
659 660
  /* Handle non-option arguments */
  fn = argv[0];
John Koleszar's avatar
John Koleszar committed
661

hanno's avatar
hanno committed
662 663
  if (!fn) {
    free(argv);
James Zern's avatar
James Zern committed
664
    fprintf(stderr, "No input file specified!\n");
John Koleszar's avatar
John Koleszar committed
665
    usage_exit();
hanno's avatar
hanno committed
666
  }
John Koleszar's avatar
John Koleszar committed
667 668
  /* Open file */
  infile = strcmp(fn, "-") ? fopen(fn, "rb") : set_binary_mode(stdin);
John Koleszar's avatar
John Koleszar committed
669

John Koleszar's avatar
John Koleszar committed
670
  if (!infile) {
671
    fatal("Failed to open input file '%s'", strcmp(fn, "-") ? fn : "stdin");
John Koleszar's avatar
John Koleszar committed
672
  }
673
#if CONFIG_OS_SUPPORT
John Koleszar's avatar
John Koleszar committed
674
  /* Make sure we don't dump to the terminal, unless forced to with -o - */
James Zern's avatar
James Zern committed
675
  if (!outfile_pattern && isatty(STDOUT_FILENO) && !do_md5 && !noblit) {
John Koleszar's avatar
John Koleszar committed
676 677 678 679 680
    fprintf(stderr,
            "Not dumping raw video to your terminal. Use '-o -' to "
            "override.\n");
    return EXIT_FAILURE;
  }
681
#endif
682 683 684
  input.aom_input_ctx->file = infile;
  if (file_is_ivf(input.aom_input_ctx))
    input.aom_input_ctx->file_type = FILE_TYPE_IVF;
685
#if CONFIG_WEBM_IO
686 687
  else if (file_is_webm(input.webm_ctx, input.aom_input_ctx))
    input.aom_input_ctx->file_type = FILE_TYPE_WEBM;
688 689 690 691
#endif
#if CONFIG_OBU_NO_IVF
  else if (file_is_obu(input.aom_input_ctx))
    input.aom_input_ctx->file_type = FILE_TYPE_OBU;
692
#endif
693 694
  else if (file_is_raw(input.aom_input_ctx))
    input.aom_input_ctx->file_type = FILE_TYPE_RAW;
John Koleszar's avatar
John Koleszar committed
695 696
  else {
    fprintf(stderr, "Unrecognized input file type.\n");
697
#if !CONFIG_WEBM_IO
698
    fprintf(stderr, "aomdec was built without WebM container support.\n");
699
#endif
John Koleszar's avatar
John Koleszar committed
700 701 702 703
    return EXIT_FAILURE;
  }

  outfile_pattern = outfile_pattern ? outfile_pattern : "-";
704
  single_file = is_single_file(outfile_pattern);
John Koleszar's avatar
John Koleszar committed
705

706 707
  if (!noblit && single_file) {
    generate_filename(outfile_pattern, outfile_name, PATH_MAX,
708
                      aom_input_ctx.width, aom_input_ctx.height, 0);
709 710 711 712
    if (do_md5)
      MD5Init(&md5_ctx);
    else
      outfile = open_outfile(outfile_name);
John Koleszar's avatar
John Koleszar committed
713 714 715 716
  }

  if (use_y4m && !noblit) {
    if (!single_file) {
clang-format's avatar
clang-format committed
717 718
      fprintf(stderr,
              "YUV4MPEG2 not supported with output patterns,"
Deb Mukherjee's avatar
Deb Mukherjee committed
719
              " try --i420 or --yv12 or --rawvideo.\n");
John Koleszar's avatar
John Koleszar committed
720
      return EXIT_FAILURE;
721
    }
John Koleszar's avatar
John Koleszar committed
722

723
#if CONFIG_WEBM_IO
724 725
    if (aom_input_ctx.file_type == FILE_TYPE_WEBM) {
      if (webm_guess_framerate(input.webm_ctx, input.aom_input_ctx)) {
clang-format's avatar
clang-format committed
726 727
        fprintf(stderr,
                "Failed to guess framerate -- error parsing "
John Koleszar's avatar
John Koleszar committed
728 729 730
                "webm file?\n");
        return EXIT_FAILURE;
      }
731
    }
732
#endif
John Koleszar's avatar
John Koleszar committed
733 734
  }

735
  fourcc_interface = get_aom_decoder_by_fourcc(aom_input_ctx.fourcc);
736 737 738 739
  if (interface && fourcc_interface && interface != fourcc_interface)
    warn("Header indicates codec: %s\n", fourcc_interface->name);
  else
    interface = fourcc_interface;
John Koleszar's avatar
John Koleszar committed
740

741
  if (!interface) interface = get_aom_decoder_by_index(0);
742

743 744 745
  dec_flags = (postproc ? AOM_CODEC_USE_POSTPROC : 0) |
              (frame_parallel ? AOM_CODEC_USE_FRAME_THREADING : 0);
  if (aom_codec_dec_init(&decoder, interface->codec_interface(), &cfg,
clang-format's avatar
clang-format committed
746
                         dec_flags)) {
747
    fprintf(stderr, "Failed to initialize decoder: %s\n",
748
            aom_codec_error(&decoder));
James Zern's avatar
James Zern committed
749
    goto fail2;
John Koleszar's avatar
John Koleszar committed
750
  }
John Koleszar's avatar
John Koleszar committed
751

clang-format's avatar
clang-format committed
752
  if (!quiet) fprintf(stderr, "%s\n", decoder.name);
John Koleszar's avatar
John Koleszar committed
753

754
#if CONFIG_AV1_DECODER && CONFIG_EXT_TILE
755 756 757 758 759
  if (aom_codec_control(&decoder, AV1_SET_DECODE_TILE_ROW, tile_row)) {
    fprintf(stderr, "Failed to set decode_tile_row: %s\n",
            aom_codec_error(&decoder));
    goto fail;
  }
760

761 762 763 764
  if (aom_codec_control(&decoder, AV1_SET_DECODE_TILE_COL, tile_col)) {
    fprintf(stderr, "Failed to set decode_tile_col: %s\n",
            aom_codec_error(&decoder));
    goto fail;
765 766
  }
#endif
767

clang-format's avatar
clang-format committed
768
  if (arg_skip) fprintf(stderr, "Skipping first %d frames.\n", arg_skip);
769
  while (arg_skip) {
clang-format's avatar
clang-format committed
770
    if (read_frame(&input, &buf, &bytes_in_buffer, &buffer_size)) break;
771 772 773
    arg_skip--;
  }

774 775 776 777
  if (num_external_frame_buffers > 0) {
    ext_fb_list.num_external_frame_buffers = num_external_frame_buffers;
    ext_fb_list.ext_fb = (struct ExternalFrameBuffer *)calloc(
        num_external_frame_buffers, sizeof(*ext_fb_list.ext_fb));
778 779
    if (aom_codec_set_frame_buffer_functions(&decoder, get_av1_frame_buffer,
                                             release_av1_frame_buffer,
clang-format's avatar
clang-format committed
780
                                             &ext_fb_list)) {
781
      fprintf(stderr, "Failed to configure external frame buffers: %s\n",
782
              aom_codec_error(&decoder));
James Zern's avatar
James Zern committed
783
      goto fail;
784 785 786
    }
  }

Scott LaVarnway's avatar
Scott LaVarnway committed
787 788 789
  frame_avail = 1;
  got_data = 0;

790 791
  if (framestats_file) fprintf(framestats_file, "bytes,qp\r\n");

John Koleszar's avatar
John Koleszar committed
792
  /* Decode file */
Scott LaVarnway's avatar
Scott LaVarnway committed
793
  while (frame_avail || got_data) {
794 795 796
    aom_codec_iter_t iter = NULL;
    aom_image_t *img;
    struct aom_usec_timer timer;
clang-format's avatar
clang-format committed
797
    int corrupted = 0;
John Koleszar's avatar
John Koleszar committed
798

Scott LaVarnway's avatar
Scott LaVarnway committed
799 800
    frame_avail = 0;
    if (!stop_after || frame_in < stop_after) {
801
      if (!read_frame(&input, &buf, &bytes_in_buffer, &buffer_size)) {
Scott LaVarnway's avatar
Scott LaVarnway committed
802 803
        frame_avail = 1;
        frame_in++;
John Koleszar's avatar
John Koleszar committed
804

805
        aom_usec_timer_start(&timer);
John Koleszar's avatar
John Koleszar committed
806

807
        if (aom_codec_decode(&decoder, buf, (unsigned int)bytes_in_buffer, NULL,
clang-format's avatar
clang-format committed
808
                             0)) {
809
          const char *detail = aom_codec_error_detail(&decoder);
clang-format's avatar
clang-format committed
810
          warn("Failed to decode frame %d: %s", frame_in,
811
               aom_codec_error(&decoder));
812

clang-format's avatar
clang-format committed
813 814
          if (detail) warn("Additional information: %s", detail);
          if (!keep_going) goto fail;
Scott LaVarnway's avatar
Scott LaVarnway committed
815 816
        }

817 818 819 820 821 822 823 824 825 826
        if (framestats_file) {
          int qp;
          if (aom_codec_control(&decoder, AOMD_GET_LAST_QUANTIZER, &qp)) {
            warn("Failed AOMD_GET_LAST_QUANTIZER: %s",
                 aom_codec_error(&decoder));
            if (!keep_going) goto fail;
          }
          fprintf(framestats_file, "%d,%d\r\n", (int)bytes_in_buffer, qp);
        }

827 828
        aom_usec_timer_mark(&timer);
        dx_time += aom_usec_timer_elapsed(&timer);
829 830
      } else {
        flush_decoder = 1;
Scott LaVarnway's avatar
Scott LaVarnway committed
831
      }
832 833
    } else {
      flush_decoder = 1;
Scott LaVarnway's avatar
Scott LaVarnway committed
834 835
    }

836
    aom_usec_timer_start(&timer);
Scott LaVarnway's avatar
Scott LaVarnway committed
837

838 839
    if (flush_decoder) {
      // Flush the decoder in frame parallel decode.
840 841
      if (aom_codec_decode(&decoder, NULL, 0, NULL, 0)) {
        warn("Failed to flush decoder: %s", aom_codec_error(&decoder));
842 843 844
      }
    }

Scott LaVarnway's avatar
Scott LaVarnway committed
845
    got_data = 0;
846
    if ((img = aom_codec_get_frame(&decoder, &iter))) {
Scott LaVarnway's avatar
Scott LaVarnway committed
847 848
      ++frame_out;
      got_data = 1;
849 850
    }

851 852
    aom_usec_timer_mark(&timer);
    dx_time += (unsigned int)aom_usec_timer_elapsed(&timer);
853

854
    if (!frame_parallel &&
855 856
        aom_codec_control(&decoder, AOMD_GET_FRAME_CORRUPTED, &corrupted)) {
      warn("Failed AOM_GET_FRAME_CORRUPTED: %s", aom_codec_error(&decoder));
clang-format's avatar
clang-format committed
857
      if (!keep_going) goto fail;
858
    }
John Koleszar's avatar
John Koleszar committed
859
    frames_corrupted += corrupted;
John Koleszar's avatar
John Koleszar committed
860

clang-format's avatar
clang-format committed
861
    if (progress) show_progress(frame_in, frame_out, dx_time);
John Koleszar's avatar
John Koleszar committed
862

863
    if (!noblit && img) {
864 865
      const int PLANES_YUV[] = { AOM_PLANE_Y, AOM_PLANE_U, AOM_PLANE_V };
      const int PLANES_YVU[] = { AOM_PLANE_Y, AOM_PLANE_V, AOM_PLANE_U };
866
      const int *planes = flipuv ? PLANES_YVU : PLANES_YUV;
867

868
      if (do_scale) {
869 870 871 872
        if (frame_out == 1) {
          // If the output frames are to be scaled to a fixed display size then
          // use the width and height specified in the container. If either of
          // these is set to 0, use the display size set in the first frame
873 874
          // header. If that is unavailable, use the raw decoded size of the
          // first decoded frame.
875 876
          int render_width = aom_input_ctx.width;
          int render_height = aom_input_ctx.height;
877 878
          if (!render_width || !render_height) {
            int render_size[2];
879
            if (aom_codec_control(&decoder, AV1D_GET_DISPLAY_SIZE,
880
                                  render_size)) {
881
              // As a last resort, use size of first frame as display size.
882 883
              render_width = img->d_w;
              render_height = img->d_h;
884
            } else {
885 886
              render_width = render_size[0];
              render_height = render_size[1];
887
            }
888
          }
clang-format's avatar
clang-format committed
889
          scaled_img =
890
              aom_img_alloc(NULL, img->fmt, render_width, render_height, 16);
891
          scaled_img->bit_depth = img->bit_depth;
892
        }
893

894
        if (img->d_w != scaled_img->d_w || img->d_h != scaled_img->d_h) {
895
#if CONFIG_LIBYUV
896
          libyuv_scale(img, scaled_img, kFilterBox);
897
          img = scaled_img;
898
#else
clang-format's avatar
clang-format committed
899 900
          fprintf(stderr,
                  "Failed  to scale output frame: %s.\n"
901 902
                  "Scaling is disabled in this configuration. "
                  "To enable scaling, configure with --enable-libyuv\n",
903
                  aom_codec_error(&decoder));
James Zern's avatar
James Zern committed
904
          goto fail;
905
#endif
906 907
        }
      }
908
#if CONFIG_HIGHBITDEPTH
909
      // Default to codec bit depth if output bit depth not set
910
      if (!output_bit_depth && single_file && !do_md5) {
911 912 913
        output_bit_depth = img->bit_depth;
      }
      // Shift up or down if necessary
Sebastien Alaiwan's avatar
Sebastien Alaiwan committed
914
      if (output_bit_depth != 0) {
915
        const aom_img_fmt_t shifted_fmt =
clang-format's avatar
clang-format committed
916
            output_bit_depth == 8
917 918
                ? img->fmt ^ (img->fmt & AOM_IMG_FMT_HIGHBITDEPTH)
                : img->fmt | AOM_IMG_FMT_HIGHBITDEPTH;
Sebastien Alaiwan's avatar
Sebastien Alaiwan committed
919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938

        if (shifted_fmt != img->fmt || output_bit_depth != img->bit_depth) {
          if (img_shifted &&
              img_shifted_realloc_required(img, img_shifted, shifted_fmt)) {
            aom_img_free(img_shifted);
            img_shifted = NULL;
          }
          if (!img_shifted) {
            img_shifted =
                aom_img_alloc(NULL, shifted_fmt, img->d_w, img->d_h, 16);
            img_shifted->bit_depth = output_bit_depth;
          }
          if (output_bit_depth > img->bit_depth) {
            aom_img_upshift(img_shifted, img,
                            output_bit_depth - img->bit_depth);
          } else {
            aom_img_downshift(img_shifted, img,
                              img->bit_depth - output_bit_depth);
          }
          img = img_shifted;
939 940 941
        }
      }
#endif
942

943
#if CONFIG_EXT_TILE
944 945
      aom_input_ctx.width = img->d_w;
      aom_input_ctx.height = img->d_h;
946 947
#endif  // CONFIG_EXT_TILE

948
#if CONFIG_MONO_VIDEO
949
      int num_planes = (!use_y4m && img->cs == AOM_CS_MONOCHROME) ? 1 : 3;
950 951 952 953
#else
      int num_planes = 3;
#endif

954
      if (single_file) {
955
        if (use_y4m) {
956
          char y4m_buf[Y4M_BUFFER_SIZE] = { 0 };
957
          size_t len = 0;
958
          if (img->fmt == AOM_IMG_FMT_I440 || img->fmt == AOM_IMG_FMT_I44016) {
Deb Mukherjee's avatar
Deb Mukherjee committed
959 960 961
            fprintf(stderr, "Cannot produce y4m output for 440 sampling.\n");
            goto fail;
          }
962 963
          if (frame_out == 1) {
            // Y4M file header
clang-format's avatar
clang-format committed
964
            len = y4m_write_file_header(
965 966 967
                y4m_buf, sizeof(y4m_buf), aom_input_ctx.width,
                aom_input_ctx.height, &aom_input_ctx.framerate, img->fmt,
                img->bit_depth);
968
            if (do_md5) {
969
              MD5Update(&md5_ctx, (md5byte *)y4m_buf, (unsigned int)len);
970
            } else {
971
              fputs(y4m_buf, outfile);