vpxenc.c 66.3 KB
Newer Older
John Koleszar's avatar
John Koleszar committed
1
/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

Christian Duvivier's avatar
Christian Duvivier committed
11
#include "vpx_config.h"
John Koleszar's avatar
John Koleszar committed
12
13
14
15

/* This is a simple program that encodes YV12 files and generates ivf
 * files using the new interface.
 */
16
#if defined(_WIN32) || !CONFIG_OS_SUPPORT
17
18
19
20
#define USE_POSIX_MMAP 0
#else
#define USE_POSIX_MMAP 1
#endif
John Koleszar's avatar
John Koleszar committed
21
22
23
24
25

#include <stdio.h>
#include <stdlib.h>
#include <stdarg.h>
#include <string.h>
John Koleszar's avatar
John Koleszar committed
26
#include <limits.h>
27
#include <assert.h>
28
#include "vpx/vpx_encoder.h"
John Koleszar's avatar
John Koleszar committed
29
30
31
32
33
34
35
#if USE_POSIX_MMAP
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/mman.h>
#include <fcntl.h>
#include <unistd.h>
#endif
36
#include "vpx_config.h"
John Koleszar's avatar
John Koleszar committed
37
#include "vpx_version.h"
38
#include "vpx/vp8cx.h"
39
40
#include "vpx/vp8dx.h"
#include "vpx/vpx_decoder.h"
John Koleszar's avatar
John Koleszar committed
41
42
#include "vpx_ports/mem_ops.h"
#include "vpx_ports/vpx_timer.h"
John Koleszar's avatar
John Koleszar committed
43
#include "tools_common.h"
44
#include "y4minput.h"
John Koleszar's avatar
John Koleszar committed
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
#include "libmkv/EbmlWriter.h"
#include "libmkv/EbmlIDs.h"

/* Need special handling of these functions on Windows */
#if defined(_MSC_VER)
/* MSVS doesn't define off_t, and uses _f{seek,tell}i64 */
typedef __int64 off_t;
#define fseeko _fseeki64
#define ftello _ftelli64
#elif defined(_WIN32)
/* MinGW defines off_t, and uses f{seek,tell}o64 */
#define fseeko fseeko64
#define ftello ftello64
#endif

#if defined(_MSC_VER)
#define LITERALU64(n) n
#else
#define LITERALU64(n) n##LLU
#endif
John Koleszar's avatar
John Koleszar committed
65

66
67
68
69
70
71
72
73
/* We should use 32-bit file operations in WebM file format
 * when building ARM executable file (.axf) with RVCT */
#if !CONFIG_OS_SUPPORT
typedef long off_t;
#define fseeko fseek
#define ftello ftell
#endif

John Koleszar's avatar
John Koleszar committed
74
75
76
static const char *exec_name;


Jim Bankoski's avatar
Jim Bankoski committed
77
78

#define VP8_FOURCC (0x78385056)
John Koleszar's avatar
John Koleszar committed
79
80
static const struct {
  char const *name;
Jim Bankoski's avatar
Jim Bankoski committed
81
  const vpx_codec_iface_t *(*iface)(void);
John Koleszar's avatar
John Koleszar committed
82
83
84
  unsigned int             fourcc;
  unsigned int             fourcc_mask;
} ifaces[] = {
85
86
#if CONFIG_VP9_DECODER
  {"vp9",  &vpx_codec_vp8_dx,   VP8_FOURCC, 0x00FFFFFF},
Jim Bankoski's avatar
Jim Bankoski committed
87
88
89
90
91
92
93
94
95
#endif
};

/* Table of encoder interfaces compiled into this binary.
 *
 * Rows have the same layout as the decoder table: codec name, interface
 * getter, FourCC and FourCC mask.
 */
static const struct codec_item {
  char const *name;
  const vpx_codec_iface_t *(*iface)(void);
  unsigned int fourcc;
  unsigned int fourcc_mask;
} codecs[] = {
#if CONFIG_VP9_ENCODER
  { "vp9", vpx_codec_vp8x_cx, VP8_FOURCC, 0x00FFFFFF },
#endif
};


John Koleszar's avatar
John Koleszar committed
102
103
static void usage_exit();

John Koleszar's avatar
John Koleszar committed
104
105
106
107
108
109
/* Prints a printf-style message followed by a newline to stderr, then
 * hands control to usage_exit().
 *
 * fmt - printf-style format string; the remaining arguments are its values.
 */
void die(const char *fmt, ...) {
  va_list ap;

  va_start(ap, fmt);
  vfprintf(stderr, fmt, ap);
  /* Every va_start must be paired with va_end; do it before usage_exit()
   * so the pairing holds regardless of whether that call returns. */
  va_end(ap);
  fprintf(stderr, "\n");
  usage_exit();
}

John Koleszar's avatar
John Koleszar committed
112
113
114
/* Terminates the program if the codec context reports an error.
 *
 * ctx - codec context whose err field is inspected
 * s   - caller-supplied prefix printed in front of the codec's error string
 *
 * Does nothing when ctx->err is zero. Otherwise prints the error (and the
 * detail string, when one is available) to stderr and exits with
 * EXIT_FAILURE.
 */
static void ctx_exit_on_error(vpx_codec_ctx_t *ctx, const char *s) {
  const char *extra;

  if (!ctx->err)
    return;

  extra = vpx_codec_error_detail(ctx);
  fprintf(stderr, "%s: %s\n", s, vpx_codec_error(ctx));

  if (extra != NULL)
    fprintf(stderr, "    %s\n", extra);

  exit(EXIT_FAILURE);
}

/* This structure is used to abstract the different ways of handling
 * first pass statistics.
 */
John Koleszar's avatar
John Koleszar committed
128
129
130
131
132
133
typedef struct {
  vpx_fixed_buf_t buf;
  int             pass;
  FILE           *file;
  char           *buf_ptr;
  size_t          buf_alloc_sz;
John Koleszar's avatar
John Koleszar committed
134
135
} stats_io_t;

John Koleszar's avatar
John Koleszar committed
136
137
/* Opens the file-backed first-pass statistics store.
 *
 * stats - store to initialise
 * fpf   - path of the statistics file
 * pass  - 0 creates/truncates fpf for writing; any other value loads the
 *         existing contents of fpf into stats->buf (memory-mapped when
 *         USE_POSIX_MMAP is set, otherwise read into a malloc'd buffer)
 *
 * Returns nonzero on success and 0 on failure. When loading fails in the
 * mmap path the stream is closed again and stats->file / stats->buf.buf are
 * left NULL. As before, the non-mmap path exits the process if the file is
 * not seekable or the buffer cannot be allocated.
 */
int stats_open_file(stats_io_t *stats, const char *fpf, int pass) {
  int res;

  stats->pass = pass;

  if (pass == 0) {
    stats->file = fopen(fpf, "wb");
    stats->buf.sz = 0;
    stats->buf.buf = NULL;
    res = (stats->file != NULL);
  } else {
#if USE_POSIX_MMAP
    struct stat stat_buf;
    int fd;

    stats->file = NULL;
    stats->buf.sz = 0;
    stats->buf.buf = NULL;

    fd = open(fpf, O_RDONLY);
    if (fd < 0)
      return 0;

    stats->file = fdopen(fd, "rb");
    if (!stats->file) {
      close(fd);
      return 0;
    }

    if (fstat(fd, &stat_buf) == 0) {
      void *map = mmap(NULL, stat_buf.st_size, PROT_READ, MAP_PRIVATE,
                       fd, 0);

      /* mmap() signals failure with MAP_FAILED, never with NULL. */
      if (map != MAP_FAILED) {
        stats->buf.buf = map;
        stats->buf.sz = stat_buf.st_size;
      }
    }

    res = (stats->buf.buf != NULL);
    if (!res) {
      /* fclose() also releases fd, which the stream owns after fdopen(). */
      fclose(stats->file);
      stats->file = NULL;
    }
#else
    size_t nbytes;
    long file_sz;

    stats->buf.sz = 0;
    stats->buf.buf = NULL;

    stats->file = fopen(fpf, "rb");
    if (!stats->file)
      return 0;

    if (fseek(stats->file, 0, SEEK_END)
        || (file_sz = ftell(stats->file)) < 0) {
      fprintf(stderr, "First-pass stats file must be seekable!\n");
      exit(EXIT_FAILURE);
    }

    stats->buf.sz = stats->buf_alloc_sz = (size_t)file_sz;
    rewind(stats->file);

    stats->buf.buf = malloc(stats->buf_alloc_sz);

    if (!stats->buf.buf) {
      fprintf(stderr, "Failed to allocate first-pass stats buffer (%lu bytes)\n",
              (unsigned long)stats->buf_alloc_sz);
      exit(EXIT_FAILURE);
    }

    nbytes = fread(stats->buf.buf, 1, stats->buf.sz, stats->file);
    res = (nbytes == stats->buf.sz);
#endif
  }

  return res;
}

John Koleszar's avatar
John Koleszar committed
188
189
190
/* Opens the in-memory first-pass statistics store.
 *
 * On pass 0 a fresh 64 KiB buffer is allocated and marked empty. On any
 * other pass the buffer already held by `stats` is reused untouched. In both
 * cases the write cursor is reset to the start of the buffer.
 *
 * Returns nonzero when a buffer is available, 0 otherwise.
 */
int stats_open_mem(stats_io_t *stats, int pass) {
  stats->pass = pass;

  if (pass == 0) {
    stats->buf_alloc_sz = 64 * 1024;
    stats->buf.buf = malloc(stats->buf_alloc_sz);
    stats->buf.sz = 0;
  }

  stats->buf_ptr = stats->buf.buf;
  return stats->buf.buf != NULL;
}


John Koleszar's avatar
John Koleszar committed
204
205
206
/* Closes a statistics store.
 *
 * stats     - store to close
 * last_pass - pass number after which the stats data is no longer needed
 *
 * The data buffer is released only when the store was opened for
 * `last_pass`; a file-backed store always has its stream closed.
 */
void stats_close(stats_io_t *stats, int last_pass) {
  const int release_data = (stats->pass == last_pass);

  if (!stats->file) {
    /* Memory-backed store: nothing but the buffer to give back. */
    if (release_data)
      free(stats->buf.buf);
    return;
  }

  if (release_data) {
#if USE_POSIX_MMAP
    munmap(stats->buf.buf, stats->buf.sz);
#else
    free(stats->buf.buf);
#endif
  }

  fclose(stats->file);
  stats->file = NULL;
}

John Koleszar's avatar
John Koleszar committed
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
/* Appends one statistics packet to the store.
 *
 * stats - destination store
 * pkt   - packet bytes
 * len   - number of bytes at pkt
 *
 * File-backed stores write straight to the stream; a short write is
 * reported on stderr but is not fatal. Memory-backed stores grow their
 * buffer in 64 KiB steps until the packet fits; the process exits if the
 * buffer cannot be grown.
 */
void stats_write(stats_io_t *stats, const void *pkt, size_t len) {
  if (stats->file) {
    if (fwrite(pkt, 1, len, stats->file) != len)
      fprintf(stderr, "\nWarning: short write to firstpass stats file.\n");
    return;
  }

  if (stats->buf.sz + len > stats->buf_alloc_sz) {
    /* Remember the cursor as an offset: the old base pointer must not be
     * used once realloc() has succeeded. */
    const size_t cursor = (size_t)(stats->buf_ptr - (char *)stats->buf.buf);
    size_t new_sz = stats->buf_alloc_sz;
    char *new_ptr;

    /* A single 64 KiB step is not enough for packets larger than that. */
    do {
      new_sz += 64 * 1024;
    } while (stats->buf.sz + len > new_sz);

    new_ptr = realloc(stats->buf.buf, new_sz);

    if (!new_ptr) {
      fprintf(stderr,
              "\nFailed to realloc firstpass stats buffer.\n");
      exit(EXIT_FAILURE);
    }

    stats->buf_ptr = new_ptr + cursor;
    stats->buf.buf = new_ptr;
    stats->buf_alloc_sz = new_sz;
  }

  memcpy(stats->buf_ptr, pkt, len);
  stats->buf.sz += len;
  stats->buf_ptr += len;
}

John Koleszar's avatar
John Koleszar committed
248
249
/* Returns a by-value copy of the store's buffer descriptor (pointer and
 * size); the underlying data is not copied.
 */
vpx_fixed_buf_t stats_get(stats_io_t *stats) {
  const vpx_fixed_buf_t snapshot = stats->buf;

  return snapshot;
}

252
/* Stereo 3D packed frame format */
John Koleszar's avatar
John Koleszar committed
253
254
255
256
257
258
/* Frame-packing layouts for stereo 3D video. The numeric value is what gets
 * written into the WebM StereoMode element, so the values must not change.
 */
typedef enum stereo_format {
  STEREO_FORMAT_MONO = 0,
  STEREO_FORMAT_LEFT_RIGHT = 1,
  STEREO_FORMAT_BOTTOM_TOP = 2,
  STEREO_FORMAT_TOP_BOTTOM = 3,
  STEREO_FORMAT_RIGHT_LEFT = 11
} stereo_format_t;

John Koleszar's avatar
John Koleszar committed
261
262
263
264
/* Container/layout of the input video file. */
enum video_file_type {
  FILE_TYPE_RAW = 0,  /* headerless planar frames */
  FILE_TYPE_IVF = 1,  /* IVF container */
  FILE_TYPE_Y4M = 2   /* YUV4MPEG2 stream */
};

267
/* Bytes read from the start of the input for format detection, kept so they
 * can be handed back to the frame reader instead of being lost.
 */
struct detect_buffer {
  char buf[4];      /* the bytes that were read for detection */
  size_t buf_read;  /* how many bytes of buf are valid */
  size_t position;  /* how many bytes of buf have already been consumed */
};


John Koleszar's avatar
John Koleszar committed
274
#define IVF_FRAME_HDR_SZ (4+8) /* 4 byte size + 8 byte timestamp */
275
static int read_frame(FILE *f, vpx_image_t *img, unsigned int file_type,
John Koleszar's avatar
John Koleszar committed
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
                      y4m_input *y4m, struct detect_buffer *detect) {
  int plane = 0;
  int shortread = 0;

  if (file_type == FILE_TYPE_Y4M) {
    if (y4m_input_fetch_frame(y4m, f, img) < 1)
      return 0;
  } else {
    if (file_type == FILE_TYPE_IVF) {
      char junk[IVF_FRAME_HDR_SZ];

      /* Skip the frame header. We know how big the frame should be. See
       * write_ivf_frame_header() for documentation on the frame header
       * layout.
       */
      if (fread(junk, 1, IVF_FRAME_HDR_SZ, f));
John Koleszar's avatar
John Koleszar committed
292
    }
293

John Koleszar's avatar
John Koleszar committed
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
    for (plane = 0; plane < 3; plane++) {
      unsigned char *ptr;
      int w = (plane ? (1 + img->d_w) / 2 : img->d_w);
      int h = (plane ? (1 + img->d_h) / 2 : img->d_h);
      int r;

      /* Determine the correct plane based on the image format. The for-loop
       * always counts in Y,U,V order, but this may not match the order of
       * the data on disk.
       */
      switch (plane) {
        case 1:
          ptr = img->planes[img->fmt == VPX_IMG_FMT_YV12 ? VPX_PLANE_V : VPX_PLANE_U];
          break;
        case 2:
          ptr = img->planes[img->fmt == VPX_IMG_FMT_YV12 ? VPX_PLANE_U : VPX_PLANE_V];
          break;
        default:
          ptr = img->planes[plane];
      }

      for (r = 0; r < h; r++) {
        size_t needed = w;
        size_t buf_position = 0;
        const size_t left = detect->buf_read - detect->position;
        if (left > 0) {
          const size_t more = (left < needed) ? left : needed;
          memcpy(ptr, detect->buf + detect->position, more);
          buf_position = more;
          needed -= more;
          detect->position += more;
John Koleszar's avatar
John Koleszar committed
325
        }
John Koleszar's avatar
John Koleszar committed
326
327
        if (needed > 0) {
          shortread |= (fread(ptr + buf_position, 1, needed, f) < needed);
John Koleszar's avatar
John Koleszar committed
328
        }
John Koleszar's avatar
John Koleszar committed
329
330
331

        ptr += img->stride[plane];
      }
John Koleszar's avatar
John Koleszar committed
332
    }
John Koleszar's avatar
John Koleszar committed
333
  }
John Koleszar's avatar
John Koleszar committed
334

John Koleszar's avatar
John Koleszar committed
335
  return !shortread;
John Koleszar's avatar
John Koleszar committed
336
337
338
}


339
unsigned int file_is_y4m(FILE      *infile,
340
                         y4m_input *y4m,
John Koleszar's avatar
John Koleszar committed
341
342
343
344
345
                         char       detect[4]) {
  if (memcmp(detect, "YUV4", 4) == 0) {
    return 1;
  }
  return 0;
346
347
}

John Koleszar's avatar
John Koleszar committed
348
349
350
351
#define IVF_FILE_HDR_SZ (32)
unsigned int file_is_ivf(FILE *infile,
                         unsigned int *fourcc,
                         unsigned int *width,
352
                         unsigned int *height,
John Koleszar's avatar
John Koleszar committed
353
354
355
                         struct detect_buffer *detect) {
  char raw_hdr[IVF_FILE_HDR_SZ];
  int is_ivf = 0;
John Koleszar's avatar
John Koleszar committed
356

John Koleszar's avatar
John Koleszar committed
357
358
  if (memcmp(detect->buf, "DKIF", 4) != 0)
    return 0;
359

John Koleszar's avatar
John Koleszar committed
360
361
362
363
364
  /* See write_ivf_file_header() for more documentation on the file header
   * layout.
   */
  if (fread(raw_hdr + 4, 1, IVF_FILE_HDR_SZ - 4, infile)
      == IVF_FILE_HDR_SZ - 4) {
John Koleszar's avatar
John Koleszar committed
365
    {
John Koleszar's avatar
John Koleszar committed
366
      is_ivf = 1;
John Koleszar's avatar
John Koleszar committed
367

John Koleszar's avatar
John Koleszar committed
368
369
370
      if (mem_get_le16(raw_hdr + 4) != 0)
        fprintf(stderr, "Error: Unrecognized IVF version! This file may not"
                " decode properly.");
John Koleszar's avatar
John Koleszar committed
371

John Koleszar's avatar
John Koleszar committed
372
      *fourcc = mem_get_le32(raw_hdr + 8);
John Koleszar's avatar
John Koleszar committed
373
    }
John Koleszar's avatar
John Koleszar committed
374
  }
John Koleszar's avatar
John Koleszar committed
375

John Koleszar's avatar
John Koleszar committed
376
377
378
379
380
  if (is_ivf) {
    *width = mem_get_le16(raw_hdr + 12);
    *height = mem_get_le16(raw_hdr + 14);
    detect->position = 4;
  }
John Koleszar's avatar
John Koleszar committed
381

John Koleszar's avatar
John Koleszar committed
382
  return is_ivf;
John Koleszar's avatar
John Koleszar committed
383
384
385
386
387
388
}


static void write_ivf_file_header(FILE *outfile,
                                  const vpx_codec_enc_cfg_t *cfg,
                                  unsigned int fourcc,
John Koleszar's avatar
John Koleszar committed
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
                                  int frame_cnt) {
  char header[32];

  if (cfg->g_pass != VPX_RC_ONE_PASS && cfg->g_pass != VPX_RC_LAST_PASS)
    return;

  header[0] = 'D';
  header[1] = 'K';
  header[2] = 'I';
  header[3] = 'F';
  mem_put_le16(header + 4,  0);                 /* version */
  mem_put_le16(header + 6,  32);                /* headersize */
  mem_put_le32(header + 8,  fourcc);            /* headersize */
  mem_put_le16(header + 12, cfg->g_w);          /* width */
  mem_put_le16(header + 14, cfg->g_h);          /* height */
  mem_put_le32(header + 16, cfg->g_timebase.den); /* rate */
  mem_put_le32(header + 20, cfg->g_timebase.num); /* scale */
  mem_put_le32(header + 24, frame_cnt);         /* length */
  mem_put_le32(header + 28, 0);                 /* unused */

  if (fwrite(header, 1, 32, outfile));
John Koleszar's avatar
John Koleszar committed
410
411
412
413
}


static void write_ivf_frame_header(FILE *outfile,
John Koleszar's avatar
John Koleszar committed
414
415
416
                                   const vpx_codec_cx_pkt_t *pkt) {
  char             header[12];
  vpx_codec_pts_t  pts;
John Koleszar's avatar
John Koleszar committed
417

John Koleszar's avatar
John Koleszar committed
418
419
  if (pkt->kind != VPX_CODEC_CX_FRAME_PKT)
    return;
John Koleszar's avatar
John Koleszar committed
420

John Koleszar's avatar
John Koleszar committed
421
422
423
424
  pts = pkt->data.frame.pts;
  mem_put_le32(header, pkt->data.frame.sz);
  mem_put_le32(header + 4, pts & 0xFFFFFFFF);
  mem_put_le32(header + 8, pts >> 32);
John Koleszar's avatar
John Koleszar committed
425

John Koleszar's avatar
John Koleszar committed
426
  if (fwrite(header, 1, 12, outfile));
John Koleszar's avatar
John Koleszar committed
427
428
}

John Koleszar's avatar
John Koleszar committed
429
430
431
432

/* Stream offset (as returned by ftello) remembering where an element's
 * size field was written, so it can be patched once the size is known. */
typedef off_t EbmlLoc;


John Koleszar's avatar
John Koleszar committed
433
434
435
/* One seek cue: the timecode of a cluster and where that cluster starts in
 * the output stream.
 */
struct cue_entry {
  unsigned int time;  /* cluster timecode */
  uint64_t loc;       /* stream offset of the cluster */
};


John Koleszar's avatar
John Koleszar committed
439
440
struct EbmlGlobal {
  int debug;
441

John Koleszar's avatar
John Koleszar committed
442
443
444
  FILE    *stream;
  int64_t last_pts_ms;
  vpx_rational_t  framerate;
John Koleszar's avatar
John Koleszar committed
445

John Koleszar's avatar
John Koleszar committed
446
447
448
449
450
451
452
  /* These pointers are to the start of an element */
  off_t    position_reference;
  off_t    seek_info_pos;
  off_t    segment_info_pos;
  off_t    track_pos;
  off_t    cue_pos;
  off_t    cluster_pos;
John Koleszar's avatar
John Koleszar committed
453

John Koleszar's avatar
John Koleszar committed
454
455
  /* This pointer is to a specific element to be serialized */
  off_t    track_id_pos;
John Koleszar's avatar
John Koleszar committed
456

John Koleszar's avatar
John Koleszar committed
457
458
459
  /* These pointers are to the size field of the element */
  EbmlLoc  startSegment;
  EbmlLoc  startCluster;
John Koleszar's avatar
John Koleszar committed
460

John Koleszar's avatar
John Koleszar committed
461
462
  uint32_t cluster_timecode;
  int      cluster_open;
John Koleszar's avatar
John Koleszar committed
463

John Koleszar's avatar
John Koleszar committed
464
465
  struct cue_entry *cue_list;
  unsigned int      cues;
John Koleszar's avatar
John Koleszar committed
466
467
468
469

};


John Koleszar's avatar
John Koleszar committed
470
471
/* Writes `len` raw bytes from `buffer_in` to the output stream. The result
 * of fwrite() is not checked.
 */
void Ebml_Write(EbmlGlobal *glob, const void *buffer_in, unsigned long len) {
  FILE *const out = glob->stream;

  if (fwrite(buffer_in, 1, len, out)) {
    /* result intentionally ignored */
  }
}

474
/* Writes the low-order `len` bytes of an integer-sized value to the stream,
 * most significant byte first.
 *
 * glob        - writer state
 * buffer_in   - address of the value to serialize
 * buffer_size - width of that value in bytes: 1, 2, 4 or 8; any other width
 *               writes nothing
 * len         - number of bytes to emit
 *
 * The value is copied out with memcpy() so objects of any type of the given
 * width may be passed without violating aliasing rules. If `len` exceeds the
 * value's width, the extra leading bytes are written as zero rather than
 * shifting by more than the type's width.
 */
void Ebml_Serialize(EbmlGlobal *glob, const void *buffer_in, int buffer_size, unsigned long len) {
  uint64_t value;
  unsigned long remaining;

  switch (buffer_size) {
    case 1: {
      uint8_t v;
      memcpy(&v, buffer_in, sizeof(v));
      value = v;
      break;
    }
    case 2: {
      uint16_t v;
      memcpy(&v, buffer_in, sizeof(v));
      value = v;
      break;
    }
    case 4: {
      uint32_t v;
      memcpy(&v, buffer_in, sizeof(v));
      value = v;
      break;
    }
    case 8:
      memcpy(&value, buffer_in, sizeof(value));
      break;
    default:
      return;
  }

  for (remaining = len; remaining > 0; remaining--) {
    const unsigned long shift = (remaining - 1) * CHAR_BIT;
    const unsigned char byte =
        (shift < sizeof(value) * CHAR_BIT) ? (unsigned char)(value >> shift)
                                           : 0;

    Ebml_Write(glob, &byte, 1);
  }
}
John Koleszar's avatar
John Koleszar committed
508

509
/* Need a fixed size serializer for the track ID. libmkv provides a 64 bit
John Koleszar's avatar
John Koleszar committed
510
511
 * one, but not a 32 bit one.
 */
John Koleszar's avatar
John Koleszar committed
512
513
514
515
516
static void Ebml_SerializeUnsigned32(EbmlGlobal *glob, unsigned long class_id, uint64_t ui) {
  unsigned char sizeSerialized = 4 | 0x80;
  Ebml_WriteID(glob, class_id);
  Ebml_Serialize(glob, &sizeSerialized, sizeof(sizeSerialized), 1);
  Ebml_Serialize(glob, &ui, sizeof(ui), 4);
John Koleszar's avatar
John Koleszar committed
517
518
519
}


John Koleszar's avatar
John Koleszar committed
520
521
/* Opens an element whose size is not yet known.
 *
 * Writes the element ID, records in *ebmlLoc the stream offset at which the
 * size field begins, and writes an 8-byte placeholder there.
 * Ebml_EndSubElement() later overwrites the placeholder with the real size.
 */
static void
Ebml_StartSubElement(EbmlGlobal *glob, EbmlLoc *ebmlLoc,
                     unsigned long class_id) {
  /* TODO: the size field always takes 8 bytes; this could be optimized.
   * This particular value is the key meaning "length unknown". */
  uint64_t placeholder = LITERALU64(0x01FFFFFFFFFFFFFF);

  Ebml_WriteID(glob, class_id);
  *ebmlLoc = ftello(glob->stream);
  Ebml_Serialize(glob, &placeholder, sizeof(placeholder), 8);
}

static void
John Koleszar's avatar
John Koleszar committed
533
534
535
Ebml_EndSubElement(EbmlGlobal *glob, EbmlLoc *ebmlLoc) {
  off_t pos;
  uint64_t size;
John Koleszar's avatar
John Koleszar committed
536

John Koleszar's avatar
John Koleszar committed
537
538
  /* Save the current stream pointer */
  pos = ftello(glob->stream);
John Koleszar's avatar
John Koleszar committed
539

John Koleszar's avatar
John Koleszar committed
540
541
542
  /* Calculate the size of this element */
  size = pos - *ebmlLoc - 8;
  size |=  LITERALU64(0x0100000000000000);
John Koleszar's avatar
John Koleszar committed
543

John Koleszar's avatar
John Koleszar committed
544
545
546
  /* Seek back to the beginning of the element and write the new size */
  fseeko(glob->stream, *ebmlLoc, SEEK_SET);
  Ebml_Serialize(glob, &size, sizeof(size), 8);
John Koleszar's avatar
John Koleszar committed
547

John Koleszar's avatar
John Koleszar committed
548
549
  /* Reset the stream pointer */
  fseeko(glob->stream, pos, SEEK_SET);
John Koleszar's avatar
John Koleszar committed
550
551
}

John Koleszar's avatar
John Koleszar committed
552
553

static void
John Koleszar's avatar
John Koleszar committed
554
555
556
557
558
559
560
write_webm_seek_element(EbmlGlobal *ebml, unsigned long id, off_t pos) {
  uint64_t offset = pos - ebml->position_reference;
  EbmlLoc start;
  Ebml_StartSubElement(ebml, &start, Seek);
  Ebml_SerializeBinary(ebml, SeekID, id);
  Ebml_SerializeUnsigned64(ebml, SeekPosition, offset);
  Ebml_EndSubElement(ebml, &start);
John Koleszar's avatar
John Koleszar committed
561
562
563
564
}


static void
John Koleszar's avatar
John Koleszar committed
565
write_webm_seek_info(EbmlGlobal *ebml) {
John Koleszar's avatar
John Koleszar committed
566

John Koleszar's avatar
John Koleszar committed
567
  off_t pos;
John Koleszar's avatar
John Koleszar committed
568

John Koleszar's avatar
John Koleszar committed
569
570
  /* Save the current stream pointer */
  pos = ftello(ebml->stream);
John Koleszar's avatar
John Koleszar committed
571

John Koleszar's avatar
John Koleszar committed
572
573
574
575
  if (ebml->seek_info_pos)
    fseeko(ebml->stream, ebml->seek_info_pos, SEEK_SET);
  else
    ebml->seek_info_pos = pos;
John Koleszar's avatar
John Koleszar committed
576

John Koleszar's avatar
John Koleszar committed
577
578
  {
    EbmlLoc start;
John Koleszar's avatar
John Koleszar committed
579

John Koleszar's avatar
John Koleszar committed
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
    Ebml_StartSubElement(ebml, &start, SeekHead);
    write_webm_seek_element(ebml, Tracks, ebml->track_pos);
    write_webm_seek_element(ebml, Cues,   ebml->cue_pos);
    write_webm_seek_element(ebml, Info,   ebml->segment_info_pos);
    Ebml_EndSubElement(ebml, &start);
  }
  {
    // segment info
    EbmlLoc startInfo;
    uint64_t frame_time;

    frame_time = (uint64_t)1000 * ebml->framerate.den
                 / ebml->framerate.num;
    ebml->segment_info_pos = ftello(ebml->stream);
    Ebml_StartSubElement(ebml, &startInfo, Info);
    Ebml_SerializeUnsigned(ebml, TimecodeScale, 1000000);
    Ebml_SerializeFloat(ebml, Segment_Duration,
                        ebml->last_pts_ms + frame_time);
    Ebml_SerializeString(ebml, 0x4D80,
                         ebml->debug ? "vpxenc" : "vpxenc" VERSION_STRING);
    Ebml_SerializeString(ebml, 0x5741,
                         ebml->debug ? "vpxenc" : "vpxenc" VERSION_STRING);
    Ebml_EndSubElement(ebml, &startInfo);
  }
John Koleszar's avatar
John Koleszar committed
604
605
606
607
608
609
}


static void
write_webm_file_header(EbmlGlobal                *glob,
                       const vpx_codec_enc_cfg_t *cfg,
610
                       const struct vpx_rational *fps,
John Koleszar's avatar
John Koleszar committed
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
                       stereo_format_t            stereo_fmt) {
  {
    EbmlLoc start;
    Ebml_StartSubElement(glob, &start, EBML);
    Ebml_SerializeUnsigned(glob, EBMLVersion, 1);
    Ebml_SerializeUnsigned(glob, EBMLReadVersion, 1); // EBML Read Version
    Ebml_SerializeUnsigned(glob, EBMLMaxIDLength, 4); // EBML Max ID Length
    Ebml_SerializeUnsigned(glob, EBMLMaxSizeLength, 8); // EBML Max Size Length
    Ebml_SerializeString(glob, DocType, "webm"); // Doc Type
    Ebml_SerializeUnsigned(glob, DocTypeVersion, 2); // Doc Type Version
    Ebml_SerializeUnsigned(glob, DocTypeReadVersion, 2); // Doc Type Read Version
    Ebml_EndSubElement(glob, &start);
  }
  {
    Ebml_StartSubElement(glob, &glob->startSegment, Segment); // segment
    glob->position_reference = ftello(glob->stream);
    glob->framerate = *fps;
    write_webm_seek_info(glob);

John Koleszar's avatar
John Koleszar committed
630
    {
John Koleszar's avatar
John Koleszar committed
631
632
633
634
635
636
      EbmlLoc trackStart;
      glob->track_pos = ftello(glob->stream);
      Ebml_StartSubElement(glob, &trackStart, Tracks);
      {
        unsigned int trackNumber = 1;
        uint64_t     trackID = 0;
John Koleszar's avatar
John Koleszar committed
637

John Koleszar's avatar
John Koleszar committed
638
639
640
641
642
643
644
        EbmlLoc start;
        Ebml_StartSubElement(glob, &start, TrackEntry);
        Ebml_SerializeUnsigned(glob, TrackNumber, trackNumber);
        glob->track_id_pos = ftello(glob->stream);
        Ebml_SerializeUnsigned32(glob, TrackUID, trackID);
        Ebml_SerializeUnsigned(glob, TrackType, 1); // video is always 1
        Ebml_SerializeString(glob, CodecID, "V_VP8");
John Koleszar's avatar
John Koleszar committed
645
        {
John Koleszar's avatar
John Koleszar committed
646
647
648
649
650
651
652
653
654
655
656
          unsigned int pixelWidth = cfg->g_w;
          unsigned int pixelHeight = cfg->g_h;
          float        frameRate   = (float)fps->num / (float)fps->den;

          EbmlLoc videoStart;
          Ebml_StartSubElement(glob, &videoStart, Video);
          Ebml_SerializeUnsigned(glob, PixelWidth, pixelWidth);
          Ebml_SerializeUnsigned(glob, PixelHeight, pixelHeight);
          Ebml_SerializeUnsigned(glob, StereoMode, stereo_fmt);
          Ebml_SerializeFloat(glob, FrameRate, frameRate);
          Ebml_EndSubElement(glob, &videoStart); // Video
John Koleszar's avatar
John Koleszar committed
657
        }
John Koleszar's avatar
John Koleszar committed
658
659
660
        Ebml_EndSubElement(glob, &start); // Track Entry
      }
      Ebml_EndSubElement(glob, &trackStart);
John Koleszar's avatar
John Koleszar committed
661
    }
John Koleszar's avatar
John Koleszar committed
662
663
    // segment element is open
  }
John Koleszar's avatar
John Koleszar committed
664
665
666
667
668
669
}


static void
write_webm_block(EbmlGlobal                *glob,
                 const vpx_codec_enc_cfg_t *cfg,
John Koleszar's avatar
John Koleszar committed
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
                 const vpx_codec_cx_pkt_t  *pkt) {
  unsigned long  block_length;
  unsigned char  track_number;
  unsigned short block_timecode = 0;
  unsigned char  flags;
  int64_t        pts_ms;
  int            start_cluster = 0, is_keyframe;

  /* Calculate the PTS of this frame in milliseconds */
  pts_ms = pkt->data.frame.pts * 1000
           * (uint64_t)cfg->g_timebase.num / (uint64_t)cfg->g_timebase.den;
  if (pts_ms <= glob->last_pts_ms)
    pts_ms = glob->last_pts_ms + 1;
  glob->last_pts_ms = pts_ms;

  /* Calculate the relative time of this block */
  if (pts_ms - glob->cluster_timecode > SHRT_MAX)
    start_cluster = 1;
  else
    block_timecode = pts_ms - glob->cluster_timecode;

  is_keyframe = (pkt->data.frame.flags & VPX_FRAME_IS_KEY);
  if (start_cluster || is_keyframe) {
    if (glob->cluster_open)
      Ebml_EndSubElement(glob, &glob->startCluster);

    /* Open the new cluster */
    block_timecode = 0;
    glob->cluster_open = 1;
    glob->cluster_timecode = pts_ms;
    glob->cluster_pos = ftello(glob->stream);
    Ebml_StartSubElement(glob, &glob->startCluster, Cluster); // cluster
    Ebml_SerializeUnsigned(glob, Timecode, glob->cluster_timecode);

    /* Save a cue point if this is a keyframe. */
    if (is_keyframe) {
      struct cue_entry *cue, *new_cue_list;

      new_cue_list = realloc(glob->cue_list,
                             (glob->cues + 1) * sizeof(struct cue_entry));
      if (new_cue_list)
        glob->cue_list = new_cue_list;
      else {
        fprintf(stderr, "\nFailed to realloc cue list.\n");
        exit(EXIT_FAILURE);
      }
John Koleszar's avatar
John Koleszar committed
716

John Koleszar's avatar
John Koleszar committed
717
718
719
720
      cue = &glob->cue_list[glob->cues];
      cue->time = glob->cluster_timecode;
      cue->loc = glob->cluster_pos;
      glob->cues++;
John Koleszar's avatar
John Koleszar committed
721
    }
John Koleszar's avatar
John Koleszar committed
722
  }
John Koleszar's avatar
John Koleszar committed
723

John Koleszar's avatar
John Koleszar committed
724
725
  /* Write the Simple Block */
  Ebml_WriteID(glob, SimpleBlock);
John Koleszar's avatar
John Koleszar committed
726

John Koleszar's avatar
John Koleszar committed
727
728
729
  block_length = pkt->data.frame.sz + 4;
  block_length |= 0x10000000;
  Ebml_Serialize(glob, &block_length, sizeof(block_length), 4);
John Koleszar's avatar
John Koleszar committed
730

John Koleszar's avatar
John Koleszar committed
731
732
733
  track_number = 1;
  track_number |= 0x80;
  Ebml_Write(glob, &track_number, 1);
John Koleszar's avatar
John Koleszar committed
734

John Koleszar's avatar
John Koleszar committed
735
  Ebml_Serialize(glob, &block_timecode, sizeof(block_timecode), 2);
John Koleszar's avatar
John Koleszar committed
736

John Koleszar's avatar
John Koleszar committed
737
738
739
740
741
742
  flags = 0;
  if (is_keyframe)
    flags |= 0x80;
  if (pkt->data.frame.flags & VPX_FRAME_IS_INVISIBLE)
    flags |= 0x08;
  Ebml_Write(glob, &flags, 1);
John Koleszar's avatar
John Koleszar committed
743

John Koleszar's avatar
John Koleszar committed
744
  Ebml_Write(glob, pkt->data.frame.buf, pkt->data.frame.sz);
John Koleszar's avatar
John Koleszar committed
745
746
747
748
}


static void
John Koleszar's avatar
John Koleszar committed
749
write_webm_file_footer(EbmlGlobal *glob, long hash) {
John Koleszar's avatar
John Koleszar committed
750

John Koleszar's avatar
John Koleszar committed
751
752
  if (glob->cluster_open)
    Ebml_EndSubElement(glob, &glob->startCluster);
John Koleszar's avatar
John Koleszar committed
753

John Koleszar's avatar
John Koleszar committed
754
755
756
  {
    EbmlLoc start;
    int i;
John Koleszar's avatar
John Koleszar committed
757

John Koleszar's avatar
John Koleszar committed
758
759
760
761
762
    glob->cue_pos = ftello(glob->stream);
    Ebml_StartSubElement(glob, &start, Cues);
    for (i = 0; i < glob->cues; i++) {
      struct cue_entry *cue = &glob->cue_list[i];
      EbmlLoc start;
John Koleszar's avatar
John Koleszar committed
763

John Koleszar's avatar
John Koleszar committed
764
765
766
      Ebml_StartSubElement(glob, &start, CuePoint);
      {
        EbmlLoc start;
John Koleszar's avatar
John Koleszar committed
767

John Koleszar's avatar
John Koleszar committed
768
        Ebml_SerializeUnsigned(glob, CueTime, cue->time);
John Koleszar's avatar
John Koleszar committed
769

John Koleszar's avatar
John Koleszar committed
770
771
772
773
774
        Ebml_StartSubElement(glob, &start, CueTrackPositions);
        Ebml_SerializeUnsigned(glob, CueTrack, 1);
        Ebml_SerializeUnsigned64(glob, CueClusterPosition,
                                 cue->loc - glob->position_reference);
        // Ebml_SerializeUnsigned(glob, CueBlockNumber, cue->blockNumber);
John Koleszar's avatar
John Koleszar committed
775
        Ebml_EndSubElement(glob, &start);
John Koleszar's avatar
John Koleszar committed
776
777
      }
      Ebml_EndSubElement(glob, &start);
John Koleszar's avatar
John Koleszar committed
778
    }
John Koleszar's avatar
John Koleszar committed
779
780
    Ebml_EndSubElement(glob, &start);
  }
John Koleszar's avatar
John Koleszar committed
781

John Koleszar's avatar
John Koleszar committed
782
  Ebml_EndSubElement(glob, &glob->startSegment);
John Koleszar's avatar
John Koleszar committed
783

John Koleszar's avatar
John Koleszar committed
784
785
  /* Patch up the seek info block */
  write_webm_seek_info(glob);
John Koleszar's avatar
John Koleszar committed
786

John Koleszar's avatar
John Koleszar committed
787
788
789
  /* Patch up the track id */
  fseeko(glob->stream, glob->track_id_pos, SEEK_SET);
  Ebml_SerializeUnsigned32(glob, TrackUID, glob->debug ? 0xDEADBEEF : hash);
John Koleszar's avatar
John Koleszar committed
790

John Koleszar's avatar
John Koleszar committed
791
  fseeko(glob->stream, 0, SEEK_END);
John Koleszar's avatar
John Koleszar committed
792
793
794
}


John Koleszar's avatar
John Koleszar committed
795
/* Murmur hash derived from public domain reference implementation at
 *   http://sites.google.com/site/murmurhash/
 *
 *   key  - bytes to hash.
 *   len  - number of bytes readable at key. Values <= 0 hash no data; the
 *          result then depends only on seed and len.
 *   seed - initial hash state.
 *
 * Returns the 32-bit hash. Input bytes are assembled explicitly in
 * little-endian order, so the result does not depend on host byte order.
 */
static unsigned int murmur(const void *key, int len, unsigned int seed) {
  const unsigned int m = 0x5bd1e995;
  const int r = 24;
  const unsigned char *data = (const unsigned char *)key;
  unsigned int h = seed ^ len;

  /* Mix four bytes at a time. */
  while (len >= 4) {
    unsigned int k;

    /* Widen to unsigned before shifting: an unsigned char promotes to
     * (signed) int, and shifting a byte >= 0x80 left by 24 would overflow
     * int, which is undefined behaviour.
     */
    k  = (unsigned int)data[0];
    k |= (unsigned int)data[1] << 8;
    k |= (unsigned int)data[2] << 16;
    k |= (unsigned int)data[3] << 24;

    k *= m;
    k ^= k >> r;
    k *= m;

    h *= m;
    h ^= k;

    data += 4;
    len -= 4;
  }

  /* Fold in the remaining 0..3 tail bytes. */
  switch (len) {
    case 3:
      h ^= (unsigned int)data[2] << 16;
      /* fallthrough */
    case 2:
      h ^= (unsigned int)data[1] << 8;
      /* fallthrough */
    case 1:
      h ^= (unsigned int)data[0];
      h *= m;
      break;
    default:
      break;
  }

  /* Final avalanche. */
  h ^= h >> 13;
  h *= m;
  h ^= h >> 15;

  return h;
}

842
#include "math.h"
843
#define MAX_PSNR 100
John Koleszar's avatar
John Koleszar committed
844
845
static double vp8_mse2psnr(double Samples, double Peak, double Mse) {
  double psnr;
846

John Koleszar's avatar
John Koleszar committed
847
848
849
850
  if ((double)Mse > 0.0)
    psnr = 10.0 * log10(Peak * Peak * Samples / Mse);
  else
    psnr = MAX_PSNR;      // Limit to prevent / 0
851

John Koleszar's avatar
John Koleszar committed
852
853
  if (psnr > MAX_PSNR)
    psnr = MAX_PSNR;
854

John Koleszar's avatar
John Koleszar committed
855
  return psnr;
856
857
}

John Koleszar's avatar
John Koleszar committed
858

John Koleszar's avatar
John Koleszar committed
859
860
#include "args.h"

861
static const arg_def_t debugmode = ARG_DEF("D", "debug", 0,
John Koleszar's avatar
John Koleszar committed
862
                                           "Debug mode (makes output deterministic)");
863
static const arg_def_t outputfile = ARG_DEF("o", "output", 1,
John Koleszar's avatar
John Koleszar committed
864
                                            "Output filename");
John Koleszar's avatar
John Koleszar committed
865
static const arg_def_t use_yv12 = ARG_DEF(NULL, "yv12", 0,
John Koleszar's avatar
John Koleszar committed
866
                                          "Input file is YV12 ");
John Koleszar's avatar
John Koleszar committed
867
static const arg_def_t use_i420 = ARG_DEF(NULL, "i420", 0,
John Koleszar's avatar
John Koleszar committed
868
                                          "Input file is I420 (default)");
John Koleszar's avatar
John Koleszar committed
869
static const arg_def_t codecarg = ARG_DEF(NULL, "codec", 1,
John Koleszar's avatar
John Koleszar committed
870
                                          "Codec to use");
John Koleszar's avatar
John Koleszar committed
871
static const arg_def_t passes           = ARG_DEF("p", "passes", 1,
John Koleszar's avatar
John Koleszar committed
872
                                                  "Number of passes (1/2)");
John Koleszar's avatar
John Koleszar committed
873
static const arg_def_t pass_arg         = ARG_DEF(NULL, "pass", 1,
John Koleszar's avatar
John Koleszar committed
874
                                                  "Pass to execute (1/2)");
John Koleszar's avatar
John Koleszar committed
875
static const arg_def_t fpf_name         = ARG_DEF(NULL, "fpf", 1,
John Koleszar's avatar
John Koleszar committed
876
                                                  "First pass statistics file name");
John Koleszar's avatar
John Koleszar committed
877
878
static const arg_def_t limit = ARG_DEF(NULL, "limit", 1,
                                       "Stop encoding after n input frames");
879
static const arg_def_t skip = ARG_DEF(NULL, "skip", 1,
John Koleszar's avatar
John Koleszar committed
880
                                      "Skip the first n input frames");
John Koleszar's avatar
John Koleszar committed
881
static const arg_def_t deadline         = ARG_DEF("d", "deadline", 1,
John Koleszar's avatar
John Koleszar committed
882
                                                  "Deadline per frame (usec)");
John Koleszar's avatar
John Koleszar committed
883
static const arg_def_t best_dl          = ARG_DEF(NULL, "best", 0,
John Koleszar's avatar
John Koleszar committed
884
                                                  "Use Best Quality Deadline");
John Koleszar's avatar
John Koleszar committed
885
static const arg_def_t good_dl          = ARG_DEF(NULL, "good", 0,
John Koleszar's avatar
John Koleszar committed
886
                                                  "Use Good Quality Deadline");
John Koleszar's avatar
John Koleszar committed
887
static const arg_def_t rt_dl            = ARG_DEF(NULL, "rt", 0,
John Koleszar's avatar
John Koleszar committed
888
                                                  "Use Realtime Quality Deadline");
John Koleszar's avatar
John Koleszar committed
889
static const arg_def_t verbosearg       = ARG_DEF("v", "verbose", 0,
John Koleszar's avatar
John Koleszar committed
890
                                                  "Show encoder parameters");
John Koleszar's avatar
John Koleszar committed
891
static const arg_def_t psnrarg          = ARG_DEF(NULL, "psnr", 0,
John Koleszar's avatar
John Koleszar committed
892
                                                  "Show PSNR in status line");
893
static const arg_def_t recontest        = ARG_DEF(NULL, "test-decode", 0,
John Koleszar's avatar
John Koleszar committed
894
                                                  "Test enocde/decode have machted recon buffer");
895
static const arg_def_t framerate        = ARG_DEF(NULL, "fps", 1,
John Koleszar's avatar
John Koleszar committed
896
                                                  "Stream frame rate (rate/scale)");
John Koleszar's avatar
John Koleszar committed
897
static const arg_def_t use_ivf          = ARG_DEF(NULL, "ivf", 0,
John Koleszar's avatar
John Koleszar committed
898
                                                  "Output IVF (default is WebM)");
899
static const arg_def_t q_hist_n         = ARG_DEF(NULL, "q-hist", 1,
John Koleszar's avatar
John Koleszar committed
900
                                                  "Show quantizer histogram (n-buckets)");
901
static const arg_def_t rate_hist_n         = ARG_DEF(NULL, "rate-hist", 1,
John Koleszar's avatar
John Koleszar committed
902
                                                     "Show rate histogram (n-buckets)");
Hui Su's avatar
Hui Su committed
903
904
#if CONFIG_LOSSLESS
static const arg_def_t lossless_enabled = ARG_DEF(NULL, "lossless", 0,
John Koleszar's avatar
John Koleszar committed
905
                                                  "Enable lossless compression");
Hui Su's avatar
Hui Su committed
906
#endif
John Koleszar's avatar
John Koleszar committed
907
908
909
910
911
912
static const arg_def_t *main_args[] = {
  &debugmode,
  &outputfile, &codecarg, &passes, &pass_arg, &fpf_name, &limit, &skip,
  &deadline,
  &best_dl, &good_dl, &rt_dl,
  &verbosearg, &psnrarg, &recontest, &use_ivf, &q_hist_n, &rate_hist_n,
Hui Su's avatar
Hui Su committed
913
#if CONFIG_LOSSLESS
John Koleszar's avatar
John Koleszar committed
914
  &lossless_enabled,
Hui Su's avatar
Hui Su committed
915
#endif
John Koleszar's avatar
John Koleszar committed
916
  NULL
John Koleszar's avatar
John Koleszar committed
917
918
919
};

static const arg_def_t usage            = ARG_DEF("u", "usage", 1,
John Koleszar's avatar
John Koleszar committed
920
                                                  "Usage profile number to use");
John Koleszar's avatar
John Koleszar committed
921
static const arg_def_t threads          = ARG_DEF("t", "threads", 1,
John Koleszar's avatar
John Koleszar committed
922
                                                  "Max number of threads to use");
John Koleszar's avatar
John Koleszar committed
923
static const arg_def_t profile          = ARG_DEF(NULL, "profile", 1,
John Koleszar's avatar
John Koleszar committed
924
                                                  "Bitstream profile number to use");
John Koleszar's avatar
John Koleszar committed
925
static const arg_def_t width            = ARG_DEF("w", "width", 1,
John Koleszar's avatar
John Koleszar committed
926
                                                  "Frame width");
John Koleszar's avatar
John Koleszar committed
927
static const arg_def_t height           = ARG_DEF("h", "height", 1,
John Koleszar's avatar
John Koleszar committed
928
                                                  "Frame height");
929
static const struct arg_enum_list stereo_mode_enum[] = {
John Koleszar's avatar
John Koleszar committed
930
931
932
933
934
935
  {"mono", STEREO_FORMAT_MONO},
  {"left-right", STEREO_FORMAT_LEFT_RIGHT},
  {"bottom-top", STEREO_FORMAT_BOTTOM_TOP},
  {"top-bottom", STEREO_FORMAT_TOP_BOTTOM},
  {"right-left", STEREO_FORMAT_RIGHT_LEFT},
  {NULL, 0}
936
937
};
static const arg_def_t stereo_mode      = ARG_DEF_ENUM(NULL, "stereo-mode", 1,
John Koleszar's avatar
John Koleszar committed
938
                                                       "Stereo 3D video format", stereo_mode_enum);
John Koleszar's avatar
John Koleszar committed
939
static const arg_def_t timebase         = ARG_DEF(NULL, "timebase", 1,
John Koleszar's avatar
John Koleszar committed
940
                                                  "Output timestamp precision (fractional seconds)");
John Koleszar's avatar
John Koleszar committed
941
static const arg_def_t error_resilient  = ARG_DEF(NULL, "error-resilient", 1,
John Koleszar's avatar
John Koleszar committed
942
                                                  "Enable error resiliency features");
John Koleszar's avatar
John Koleszar committed
943
static const arg_def_t lag_in_frames    = ARG_DEF(NULL, "lag-in-frames", 1,
John Koleszar's avatar
John Koleszar committed
944
                                                  "Max number of frames to lag");
John Koleszar's avatar
John Koleszar committed
945

John Koleszar's avatar
John Koleszar committed
946
947
948
949
static const arg_def_t *global_args[] = {
  &use_yv12, &use_i420, &usage, &threads, &profile,
  &width, &height, &stereo_mode, &timebase, &framerate, &error_resilient,
  &lag_in_frames, NULL
John Koleszar's avatar
John Koleszar committed
950
951
952
};

static const arg_def_t dropframe_thresh   = ARG_DEF(NULL, "drop-frame", 1,
John Koleszar's avatar
John Koleszar committed
953
                                                    "Temporal resampling threshold (buf %)");
John Koleszar's avatar
John Koleszar committed
954
static const arg_def_t resize_allowed     = ARG_DEF(NULL, "resize-allowed", 1,
John Koleszar's avatar
John Koleszar committed
955
                                                    "Spatial resampling enabled (bool)");
John Koleszar's avatar
John Koleszar committed
956
static const arg_def_t resize_up_thresh   = ARG_DEF(NULL, "resize-up", 1,
John Koleszar's avatar
John Koleszar committed
957
                                                    "Upscale threshold (buf %)");
John Koleszar's avatar
John Koleszar committed
958
static const arg_def_t resize_down_thresh = ARG_DEF(NULL, "resize-down", 1,
John Koleszar's avatar
John Koleszar committed
959
                                                    "Downscale threshold (buf %)");
960
static const struct arg_enum_list end_usage_enum[] = {
John Koleszar's avatar
John Koleszar committed
961
962
963
964
  {"vbr", VPX_VBR},
  {"cbr", VPX_CBR},
  {"cq",  VPX_CQ},
  {NULL, 0}
965
966
};
static const arg_def_t end_usage          = ARG_DEF_ENUM(NULL, "end-usage", 1,
John Koleszar's avatar
John Koleszar committed
967
                                                         "Rate control mode", end_usage_enum);
John Koleszar's avatar
John Koleszar committed
968
static const arg_def_t target_bitrate     = ARG_DEF(NULL, "target-bitrate", 1,
John Koleszar's avatar
John Koleszar committed
969
                                                    "Bitrate (kbps)");
John Koleszar's avatar
John Koleszar committed
970
static const arg_def_t min_quantizer      = ARG_DEF(NULL, "min-q", 1,
John Koleszar's avatar
John Koleszar committed
971
                                                    "Minimum (best) quantizer");
John Koleszar's avatar
John Koleszar committed
972
static const arg_def_t max_quantizer      = ARG_DEF(NULL, "max-q", 1,
John Koleszar's avatar
John Koleszar committed
973
                                                    "Maximum (worst) quantizer");
John Koleszar's avatar
John Koleszar committed
974
static const arg_def_t undershoot_pct     = ARG_DEF(NULL, "undershoot-pct", 1,
John Koleszar's avatar
John Koleszar committed
975
                                                    "Datarate undershoot (min) target (%)");
John Koleszar's avatar
John Koleszar committed
976
static const arg_def_t overshoot_pct      = ARG_DEF(NULL, "overshoot-pct", 1,
John Koleszar's avatar
John Koleszar committed
977
                                                    "Datarate overshoot (max) target (%)");
John Koleszar's avatar
John Koleszar committed
978
static const arg_def_t buf_sz             = ARG_DEF(NULL, "buf-sz", 1,
John Koleszar's avatar
John Koleszar committed
979
                                                    "Client buffer size (ms)");
John Koleszar's avatar
John Koleszar committed
980
static const arg_def_t buf_initial_sz     = ARG_DEF(NULL, "buf-initial-sz", 1,
John Koleszar's avatar
John Koleszar committed
981
                                                    "Client initial buffer size (ms)");
John Koleszar's avatar
John Koleszar committed
982
static const arg_def_t buf_optimal_sz     = ARG_DEF(NULL, "buf-optimal-sz", 1,
John Koleszar's avatar
John Koleszar committed
983
984
985
986
987
988
                                                    "Client optimal buffer size (ms)");
static const arg_def_t *rc_args[] = {
  &dropframe_thresh, &resize_allowed, &resize_up_thresh, &resize_down_thresh,
  &end_usage, &target_bitrate, &min_quantizer, &max_quantizer,
  &undershoot_pct, &overshoot_pct, &buf_sz, &buf_initial_sz, &buf_optimal_sz,
  NULL
John Koleszar's avatar
John Koleszar committed
989
990
991
992
};


static const arg_def_t bias_pct = ARG_DEF(NULL, "bias-pct", 1,
John Koleszar's avatar
John Koleszar committed
993
                                          "CBR/VBR bias (0=CBR, 100=VBR)");
John Koleszar's avatar
John Koleszar committed
994
static const arg_def_t minsection_pct = ARG_DEF(NULL, "minsection-pct", 1,
John Koleszar's avatar
John Koleszar committed
995
                                                "GOP min bitrate (% of target)");
John Koleszar's avatar
John Koleszar committed
996
static const arg_def_t maxsection_pct = ARG_DEF(NULL, "maxsection-pct", 1,
John Koleszar's avatar
John Koleszar committed
997
998
999
                                                "GOP max bitrate (% of target)");
static const arg_def_t *rc_twopass_args[] = {
  &bias_pct, &minsection_pct, &maxsection_pct, NULL
John Koleszar's avatar
John Koleszar committed
1000
1001
1002
1003
};


static const arg_def_t kf_min_dist = ARG_DEF(NULL, "kf-min-dist", 1,
John Koleszar's avatar
John Koleszar committed
1004
                                             "Minimum keyframe interval (frames)");
John Koleszar's avatar
John Koleszar committed
1005
static const arg_def_t kf_max_dist = ARG_DEF(NULL, "kf-max-dist", 1,
John Koleszar's avatar
John Koleszar committed
1006
                                             "Maximum keyframe interval (frames)");
1007
static const arg_def_t kf_disabled = ARG_DEF(NULL, "disable-kf", 0,
John Koleszar's avatar
John Koleszar committed
1008
1009
1010
                                             "Disable keyframe placement");
static const arg_def_t *kf_args[] = {
  &kf_min_dist, &kf_max_dist, &kf_disabled, NULL
John Koleszar's avatar
John Koleszar committed
1011
1012
1013
};


1014
#if CONFIG_VP9_ENCODER
/* Codec-specific options, only built when CONFIG_VP9_ENCODER is set. */
static const arg_def_t noise_sens = ARG_DEF(
    NULL, "noise-sensitivity", 1, "Noise sensitivity (frames to blur)");
static const arg_def_t sharpness = ARG_DEF(
    NULL, "sharpness", 1, "Filter sharpness (0-7)");
static const arg_def_t static_thresh = ARG_DEF(
    NULL, "static-thresh", 1, "Motion detection threshold");
static const arg_def_t cpu_used = ARG_DEF(
    NULL, "cpu-used", 1, "CPU Used (-16..16)");
static const arg_def_t token_parts = ARG_DEF(
    NULL, "token-parts", 1, "Number of token partitions to use, log2");
static const arg_def_t auto_altref = ARG_DEF(
    NULL, "auto-alt-ref", 1, "Enable automatic alt reference frames");
static const arg_def_t arnr_maxframes = ARG_DEF(
    NULL, "arnr-maxframes", 1, "AltRef Max Frames");
static const arg_def_t arnr_strength = ARG_DEF(
    NULL, "arnr-strength", 1, "AltRef Strength");
static const arg_def_t arnr_type = ARG_DEF(
    NULL, "arnr-type", 1, "AltRef Type");

/* Accepted names for --tune and the value each one selects. */
static const struct arg_enum_list tuning_enum[] = {
  {"psnr", VP8_TUNE_PSNR},
  {"ssim", VP8_TUNE_SSIM},
  {NULL, 0}
};
static const arg_def_t tune_ssim = ARG_DEF_ENUM(
    NULL, "tune", 1, "Material to favor", tuning_enum);
static const arg_def_t cq_level = ARG_DEF(
    NULL, "cq-level", 1, "Constrained Quality Level");
static const arg_def_t max_intra_rate_pct = ARG_DEF(
    NULL, "max-intra-rate", 1, "Max I-frame bitrate (pct)");

/* NULL-terminated table of the codec-specific options. */
static const arg_def_t *vp8_args[] = {
  &cpu_used,
  &auto_altref,
  &noise_sens,
  &sharpness,
  &static_thresh,
  &token_parts,
  &arnr_maxframes,
  &arnr_strength,
  &arnr_type,
  &tune_ssim,
  &cq_level,
  &max_intra_rate_pct,
  NULL
};

/* Encoder control IDs, 0-terminated. Entries are listed in the same order as
 * vp8_args; keep the two tables in step when adding or removing options.
 */
static const int vp8_arg_ctrl_map[] = {
  VP8E_SET_CPUUSED,
  VP8E_SET_ENABLEAUTOALTREF,
  VP8E_SET_NOISE_SENSITIVITY,
  VP8E_SET_SHARPNESS,
  VP8E_SET_STATIC_THRESHOLD,
  VP8E_SET_TOKEN_PARTITIONS,
  VP8E_SET_ARNR_MAXFRAMES,
  VP8E_SET_ARNR_STRENGTH,
  VP8E_SET_ARNR_TYPE,
  VP8E_SET_TUNING,
  VP8E_SET_CQ_LEVEL,
  VP8E_SET_MAX_INTRA_BITRATE_PCT,
  0
};
#endif

/* Empty option table: contains only the NULL terminator. */
static const arg_def_t *no_args[] = { NULL };

John Koleszar's avatar
John Koleszar committed
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
/* Print the full usage text (every option group, the timebase note and the
 * list of included encoders) to stderr, then terminate the process with
 * EXIT_FAILURE. Does not return.
 *
 * Headings and option tables are all written to the same stream so the help
 * text stays in order and is captured as a whole when redirected.
 */
static void usage_exit() {
  size_t i;

  fprintf(stderr, "Usage: %s <options> -o dst_filename src_filename \n",
          exec_name);

  fprintf(stderr, "\nOptions:\n");
  arg_show_usage(stderr, main_args);
  fprintf(stderr, "\nEncoder Global Options:\n");
  arg_show_usage(stderr, global_args);
  fprintf(stderr, "\nRate Control Options:\n");
  arg_show_usage(stderr, rc_args);
  fprintf(stderr, "\nTwopass Rate Control Options:\n");
  arg_show_usage(stderr, rc_twopass_args);
  fprintf(stderr, "\nKeyframe Placement Options:\n");
  arg_show_usage(stderr, kf_args);
#if CONFIG_VP9_ENCODER
  fprintf(stderr, "\nVP8 Specific Options:\n");
  arg_show_usage(stderr, vp8_args);
#endif
  fprintf(stderr, "\nStream timebase (--timebase):\n"
          "  The desired precision of timestamps in the output, expressed\n"
          "  in fractional seconds. Default is 1/1000.\n");
  fprintf(stderr, "\n"
          "Included encoders:\n"
          "\n");

  /* size_t index: the bound is a sizeof expression (unsigned). */
  for (i = 0; i < sizeof(codecs) / sizeof(codecs[0]); i++)
    fprintf(stderr, "    %-6s - %s\n",
            codecs[i].name,
            vpx_codec_iface_name(codecs[i].iface()));

  exit(EXIT_FAILURE);
}

1103
1104

#define HIST_BAR_MAX 40
John Koleszar's avatar
John Koleszar committed
1105
1106
/* One histogram bucket. Presumably [low, high] is the value range covered
 * and count the number of samples in it -- confirm against the histogram
 * code that fills these in.
 */
struct hist_bucket {
  int low;
  int high;
  int count;
};


static int merge_hist_buckets(struct hist_bucket *bucket,
                              int *buckets_,
John Koleszar's avatar
John Koleszar committed
1112
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134