/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */


/* This is a simple program that encodes YV12 files and generates ivf
 * files using the new interface.
 */
15
#if defined(_WIN32) || !CONFIG_OS_SUPPORT
16
17
18
19
#define USE_POSIX_MMAP 0
#else
#define USE_POSIX_MMAP 1
#endif
John Koleszar's avatar
John Koleszar committed
20
21
22
23
24

#include <stdio.h>
#include <stdlib.h>
#include <stdarg.h>
#include <string.h>
John Koleszar's avatar
John Koleszar committed
25
#include <limits.h>
26
#include <assert.h>
27
#include "vpx/vpx_encoder.h"
John Koleszar's avatar
John Koleszar committed
28
29
30
31
32
33
34
#if USE_POSIX_MMAP
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/mman.h>
#include <fcntl.h>
#include <unistd.h>
#endif
35
#include "vpx_config.h"
John Koleszar's avatar
John Koleszar committed
36
#include "vpx_version.h"
37
#include "vpx/vp8cx.h"
38
39
#include "vpx/vp8dx.h"
#include "vpx/vpx_decoder.h"
John Koleszar's avatar
John Koleszar committed
40
41
#include "vpx_ports/mem_ops.h"
#include "vpx_ports/vpx_timer.h"
John Koleszar's avatar
John Koleszar committed
42
#include "tools_common.h"
43
#include "y4minput.h"
John Koleszar's avatar
John Koleszar committed
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
#include "libmkv/EbmlWriter.h"
#include "libmkv/EbmlIDs.h"

/* Need special handling of these functions on Windows */
#if defined(_MSC_VER)
/* MSVS doesn't define off_t, and uses _f{seek,tell}i64 */
typedef __int64 off_t;
#define fseeko _fseeki64
#define ftello _ftelli64
#elif defined(_WIN32)
/* MinGW defines off_t, and uses f{seek,tell}o64 */
#define fseeko fseeko64
#define ftello ftello64
#endif

/* Spell a 64-bit unsigned literal: MSVC takes it bare, everyone else needs
 * the LLU suffix. */
#if defined(_MSC_VER)
#define LITERALU64(n) n
#else
#define LITERALU64(n) n##LLU
#endif

/* We should use 32-bit file operations in WebM file format
 * when building ARM executable file (.axf) with RVCT */
#if !CONFIG_OS_SUPPORT
typedef long off_t;
#define fseeko fseek
#define ftello ftell
#endif

John Koleszar's avatar
John Koleszar committed
73
74
static const char *exec_name;

John Koleszar's avatar
John Koleszar committed
75
76
77
78
79
/* Table of the encoder interfaces compiled into this binary. Each entry
 * pairs a short name with the codec interface and the FourCC associated
 * with it (0x78385056 is "VP8x", 0x30385056 is "VP80" when stored
 * little-endian).
 */
static const struct codec_item {
  char const              *name;
  const vpx_codec_iface_t *iface;
  unsigned int             fourcc;
} codecs[] = {
#if CONFIG_EXPERIMENTAL && CONFIG_VP8_ENCODER
  {"vp8x",  &vpx_codec_vp8x_cx_algo, 0x78385056},
#endif
#if CONFIG_VP8_ENCODER
  {"vp8",  &vpx_codec_vp8_cx_algo, 0x30385056},
#endif
};

88
#define VP8_FOURCC (0x00385056)
John Koleszar's avatar
John Koleszar committed
89
90
91
92
93
94
/* Table of the decoder interfaces compiled into this binary. fourcc_mask
 * selects which bits of a stream's FourCC are compared against fourcc; the
 * VP8 entry masks off the top byte, so only the first three characters
 * have to match.
 */
static const struct {
  char const *name;
  const vpx_codec_iface_t *iface;
  unsigned int             fourcc;
  unsigned int             fourcc_mask;
} ifaces[] = {
#if CONFIG_VP8_DECODER
  {"vp8",  &vpx_codec_vp8_dx_algo,   VP8_FOURCC, 0x00FFFFFF},
#endif
};


John Koleszar's avatar
John Koleszar committed
101
102
static void usage_exit();

John Koleszar's avatar
John Koleszar committed
103
104
105
106
107
108
/* Print a printf-style message, followed by a newline, to stderr and then
 * call usage_exit().
 *
 * fmt: printf-style format string; the remaining arguments are its values.
 */
void die(const char *fmt, ...) {
  va_list ap;

  va_start(ap, fmt);
  vfprintf(stderr, fmt, ap);
  va_end(ap);  /* every va_start() must be matched by va_end() */
  fprintf(stderr, "\n");
  usage_exit();
}

John Koleszar's avatar
John Koleszar committed
111
112
113
/* If the codec context has recorded an error, report it on stderr and
 * terminate the process with EXIT_FAILURE; otherwise do nothing.
 *
 * ctx: codec context whose err field is inspected.
 * s:   caller-supplied prefix printed before the error string.
 */
static void ctx_exit_on_error(vpx_codec_ctx_t *ctx, const char *s) {
  const char *detail;

  if (!ctx->err)
    return;

  detail = vpx_codec_error_detail(ctx);

  fprintf(stderr, "%s: %s\n", s, vpx_codec_error(ctx));

  /* The detail string is optional; print it indented when present. */
  if (detail)
    fprintf(stderr, "    %s\n", detail);

  exit(EXIT_FAILURE);
}

/* This structure is used to abstract the different ways of handling
 * first pass statistics.
 */
John Koleszar's avatar
John Koleszar committed
127
128
129
130
131
132
typedef struct {
  vpx_fixed_buf_t buf;
  int             pass;
  FILE           *file;
  char           *buf_ptr;
  size_t          buf_alloc_sz;
John Koleszar's avatar
John Koleszar committed
133
134
} stats_io_t;

John Koleszar's avatar
John Koleszar committed
135
136
/* Open a file-backed first-pass stats store.
 *
 * stats: store to initialise.
 * fpf:   path of the stats file.
 * pass:  0 opens the file for writing; any other value loads the whole
 *        file for reading (mmap when USE_POSIX_MMAP, otherwise malloc +
 *        fread).
 *
 * Returns nonzero on success and 0 on failure. On a read-side failure that
 * returns 0, stats->file and stats->buf.buf are left NULL so a later
 * stats_close() has nothing invalid to release. As before, an unseekable
 * file or a failed allocation on the fread path terminates the process.
 */
int stats_open_file(stats_io_t *stats, const char *fpf, int pass) {
  int res;

  stats->pass = pass;

  if (pass == 0) {
    stats->file = fopen(fpf, "wb");
    stats->buf.sz = 0;
    stats->buf.buf = NULL;
    res = (stats->file != NULL);
  } else {
#if USE_POSIX_MMAP
    struct stat stat_buf;
    int fd;

    stats->file = NULL;
    stats->buf.buf = NULL;
    stats->buf.sz = 0;

    fd = open(fpf, O_RDONLY);
    if (fd < 0)
      return 0;

    stats->file = fdopen(fd, "rb");
    if (!stats->file) {
      close(fd);
      return 0;
    }

    if (fstat(fd, &stat_buf)) {
      fclose(stats->file);
      stats->file = NULL;
      return 0;
    }

    stats->buf.sz = stat_buf.st_size;
    stats->buf.buf = mmap(NULL, stats->buf.sz, PROT_READ, MAP_PRIVATE,
                          fd, 0);

    /* mmap() signals failure with MAP_FAILED, not NULL. */
    if (stats->buf.buf == MAP_FAILED) {
      stats->buf.buf = NULL;
      stats->buf.sz = 0;
      fclose(stats->file);
      stats->file = NULL;
      return 0;
    }

    res = 1;
#else
    size_t nbytes;
    long   file_sz;

    stats->buf.buf = NULL;
    stats->buf.sz = 0;

    stats->file = fopen(fpf, "rb");
    if (!stats->file)
      return 0;

    if (fseek(stats->file, 0, SEEK_END)) {
      fprintf(stderr, "First-pass stats file must be seekable!\n");
      exit(EXIT_FAILURE);
    }

    file_sz = ftell(stats->file);
    if (file_sz < 0) {
      fprintf(stderr, "First-pass stats file must be seekable!\n");
      exit(EXIT_FAILURE);
    }

    stats->buf.sz = stats->buf_alloc_sz = (size_t)file_sz;
    rewind(stats->file);

    stats->buf.buf = malloc(stats->buf_alloc_sz);

    if (!stats->buf.buf) {
      fprintf(stderr, "Failed to allocate first-pass stats buffer (%lu bytes)\n",
              (unsigned long)stats->buf_alloc_sz);
      exit(EXIT_FAILURE);
    }

    nbytes = fread(stats->buf.buf, 1, stats->buf.sz, stats->file);
    res = (nbytes == stats->buf.sz);
#endif
  }

  return res;
}

John Koleszar's avatar
John Koleszar committed
187
188
189
/* Open a memory-backed first-pass stats store.
 *
 * For pass 0 a fresh 64 KiB buffer is allocated and the valid size reset.
 * For any other pass the buffer already held in stats->buf is reused
 * untouched. In both cases the cursor is rewound to the buffer start.
 *
 * NOTE(review): stats->file is not written here; the in-memory paths of
 * stats_write()/stats_close() rely on it being NULL - confirm the caller
 * zero-initialises the structure.
 *
 * Returns nonzero when a buffer is available, 0 otherwise.
 */
int stats_open_mem(stats_io_t *stats, int pass) {
  stats->pass = pass;

  if (pass == 0) {
    stats->buf.sz = 0;
    stats->buf_alloc_sz = 64 * 1024;
    stats->buf.buf = malloc(stats->buf_alloc_sz);
  }

  stats->buf_ptr = stats->buf.buf;
  return stats->buf.buf != NULL;
}


John Koleszar's avatar
John Koleszar committed
203
204
205
/* Release a stats store.
 *
 * stats:     store to close.
 * last_pass: index of the final pass. The stats buffer is released only
 *            when the store's own pass equals this value; on earlier passes
 *            it is left in place.
 *
 * A file-backed store also closes its FILE. After the buffer is released
 * the pointer is cleared so it cannot be released twice.
 */
void stats_close(stats_io_t *stats, int last_pass) {
  const int release_buf = (stats->pass == last_pass);

  if (stats->file) {
    if (release_buf) {
#if USE_POSIX_MMAP
      if (stats->buf.buf)
        munmap(stats->buf.buf, stats->buf.sz);
#else
      free(stats->buf.buf);
#endif
      stats->buf.buf = NULL;
    }

    fclose(stats->file);
    stats->file = NULL;
  } else if (release_buf) {
    free(stats->buf.buf);
    stats->buf.buf = NULL;
  }
}

John Koleszar's avatar
John Koleszar committed
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
/* Append one stats packet to the store.
 *
 * stats: destination store.
 * pkt:   packet bytes.
 * len:   number of bytes in pkt.
 *
 * File-backed stores write straight to the file (best effort, as before).
 * Memory-backed stores grow their buffer as needed; a failed realloc
 * terminates the process.
 */
void stats_write(stats_io_t *stats, const void *pkt, size_t len) {
  if (stats->file) {
    /* Deliberately best-effort: a short write is not reported. */
    const size_t written = fwrite(pkt, 1, len, stats->file);
    (void)written;
  } else {
    const size_t needed = stats->buf.sz + len;

    if (needed > stats->buf_alloc_sz) {
      /* Grow by 64 KiB as usual, but never by less than this packet needs;
       * a single fixed-size step would overflow on packets larger than the
       * step. */
      size_t  new_sz = stats->buf_alloc_sz + 64 * 1024;
      char   *new_ptr;

      if (new_sz < needed)
        new_sz = needed;

      new_ptr = realloc(stats->buf.buf, new_sz);

      if (new_ptr) {
        /* Re-base the cursor onto the (possibly moved) allocation. */
        stats->buf_ptr = new_ptr + (stats->buf_ptr - (char *)stats->buf.buf);
        stats->buf.buf = new_ptr;
        stats->buf_alloc_sz = new_sz;
      } else {
        fprintf(stderr,
                "\nFailed to realloc firstpass stats buffer.\n");
        exit(EXIT_FAILURE);
      }
    }

    memcpy(stats->buf_ptr, pkt, len);
    stats->buf.sz += len;
    stats->buf_ptr += len;
  }
}

John Koleszar's avatar
John Koleszar committed
247
248
/* Return, by value, the buffer descriptor (pointer and size) currently held
 * by the store. The data itself is not copied. */
vpx_fixed_buf_t stats_get(stats_io_t *stats) {
  const vpx_fixed_buf_t snapshot = stats->buf;

  return snapshot;
}

251
/* Stereo 3D packed frame format. The numeric values are written verbatim
 * into the WebM StereoMode element, so they must not be renumbered. */
typedef enum stereo_format {
  STEREO_FORMAT_MONO       = 0,
  STEREO_FORMAT_LEFT_RIGHT = 1,
  STEREO_FORMAT_BOTTOM_TOP = 2,
  STEREO_FORMAT_TOP_BOTTOM = 3,
  STEREO_FORMAT_RIGHT_LEFT = 11
} stereo_format_t;

John Koleszar's avatar
John Koleszar committed
260
261
262
263
/* Container type of the input file, as passed to read_frame(). */
enum video_file_type {
  FILE_TYPE_RAW,  /* bare planar frames, no headers */
  FILE_TYPE_IVF,  /* IVF: each frame is preceded by a frame header */
  FILE_TYPE_Y4M   /* YUV4MPEG2, read through y4m_input */
};

266
/* The first bytes of the input, read ahead for file-type detection and
 * later handed back to the frame reader. */
struct detect_buffer {
  char buf[4];      /* bytes read ahead from the start of the input */
  size_t buf_read;  /* number of valid bytes in buf */
  size_t position;  /* number of those bytes already consumed */
};


John Koleszar's avatar
John Koleszar committed
273
#define IVF_FRAME_HDR_SZ (4+8) /* 4 byte size + 8 byte timestamp */
274
static int read_frame(FILE *f, vpx_image_t *img, unsigned int file_type,
John Koleszar's avatar
John Koleszar committed
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
                      y4m_input *y4m, struct detect_buffer *detect) {
  int plane = 0;
  int shortread = 0;

  if (file_type == FILE_TYPE_Y4M) {
    if (y4m_input_fetch_frame(y4m, f, img) < 1)
      return 0;
  } else {
    if (file_type == FILE_TYPE_IVF) {
      char junk[IVF_FRAME_HDR_SZ];

      /* Skip the frame header. We know how big the frame should be. See
       * write_ivf_frame_header() for documentation on the frame header
       * layout.
       */
      if (fread(junk, 1, IVF_FRAME_HDR_SZ, f));
John Koleszar's avatar
John Koleszar committed
291
    }
292

John Koleszar's avatar
John Koleszar committed
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
    for (plane = 0; plane < 3; plane++) {
      unsigned char *ptr;
      int w = (plane ? (1 + img->d_w) / 2 : img->d_w);
      int h = (plane ? (1 + img->d_h) / 2 : img->d_h);
      int r;

      /* Determine the correct plane based on the image format. The for-loop
       * always counts in Y,U,V order, but this may not match the order of
       * the data on disk.
       */
      switch (plane) {
        case 1:
          ptr = img->planes[img->fmt == VPX_IMG_FMT_YV12 ? VPX_PLANE_V : VPX_PLANE_U];
          break;
        case 2:
          ptr = img->planes[img->fmt == VPX_IMG_FMT_YV12 ? VPX_PLANE_U : VPX_PLANE_V];
          break;
        default:
          ptr = img->planes[plane];
      }

      for (r = 0; r < h; r++) {
        size_t needed = w;
        size_t buf_position = 0;
        const size_t left = detect->buf_read - detect->position;
        if (left > 0) {
          const size_t more = (left < needed) ? left : needed;
          memcpy(ptr, detect->buf + detect->position, more);
          buf_position = more;
          needed -= more;
          detect->position += more;
John Koleszar's avatar
John Koleszar committed
324
        }
John Koleszar's avatar
John Koleszar committed
325
326
        if (needed > 0) {
          shortread |= (fread(ptr + buf_position, 1, needed, f) < needed);
John Koleszar's avatar
John Koleszar committed
327
        }
John Koleszar's avatar
John Koleszar committed
328
329
330

        ptr += img->stride[plane];
      }
John Koleszar's avatar
John Koleszar committed
331
    }
John Koleszar's avatar
John Koleszar committed
332
  }
John Koleszar's avatar
John Koleszar committed
333

John Koleszar's avatar
John Koleszar committed
334
  return !shortread;
John Koleszar's avatar
John Koleszar committed
335
336
337
}


338
unsigned int file_is_y4m(FILE      *infile,
339
                         y4m_input *y4m,
John Koleszar's avatar
John Koleszar committed
340
341
342
343
344
                         char       detect[4]) {
  if (memcmp(detect, "YUV4", 4) == 0) {
    return 1;
  }
  return 0;
345
346
}

John Koleszar's avatar
John Koleszar committed
347
348
349
350
#define IVF_FILE_HDR_SZ (32)
unsigned int file_is_ivf(FILE *infile,
                         unsigned int *fourcc,
                         unsigned int *width,
351
                         unsigned int *height,
John Koleszar's avatar
John Koleszar committed
352
353
354
                         struct detect_buffer *detect) {
  char raw_hdr[IVF_FILE_HDR_SZ];
  int is_ivf = 0;
John Koleszar's avatar
John Koleszar committed
355

John Koleszar's avatar
John Koleszar committed
356
357
  if (memcmp(detect->buf, "DKIF", 4) != 0)
    return 0;
358

John Koleszar's avatar
John Koleszar committed
359
360
361
362
363
  /* See write_ivf_file_header() for more documentation on the file header
   * layout.
   */
  if (fread(raw_hdr + 4, 1, IVF_FILE_HDR_SZ - 4, infile)
      == IVF_FILE_HDR_SZ - 4) {
John Koleszar's avatar
John Koleszar committed
364
    {
John Koleszar's avatar
John Koleszar committed
365
      is_ivf = 1;
John Koleszar's avatar
John Koleszar committed
366

John Koleszar's avatar
John Koleszar committed
367
368
369
      if (mem_get_le16(raw_hdr + 4) != 0)
        fprintf(stderr, "Error: Unrecognized IVF version! This file may not"
                " decode properly.");
John Koleszar's avatar
John Koleszar committed
370

John Koleszar's avatar
John Koleszar committed
371
      *fourcc = mem_get_le32(raw_hdr + 8);
John Koleszar's avatar
John Koleszar committed
372
    }
John Koleszar's avatar
John Koleszar committed
373
  }
John Koleszar's avatar
John Koleszar committed
374

John Koleszar's avatar
John Koleszar committed
375
376
377
378
379
  if (is_ivf) {
    *width = mem_get_le16(raw_hdr + 12);
    *height = mem_get_le16(raw_hdr + 14);
    detect->position = 4;
  }
John Koleszar's avatar
John Koleszar committed
380

John Koleszar's avatar
John Koleszar committed
381
  return is_ivf;
John Koleszar's avatar
John Koleszar committed
382
383
384
385
386
387
}


static void write_ivf_file_header(FILE *outfile,
                                  const vpx_codec_enc_cfg_t *cfg,
                                  unsigned int fourcc,
John Koleszar's avatar
John Koleszar committed
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
                                  int frame_cnt) {
  char header[32];

  if (cfg->g_pass != VPX_RC_ONE_PASS && cfg->g_pass != VPX_RC_LAST_PASS)
    return;

  header[0] = 'D';
  header[1] = 'K';
  header[2] = 'I';
  header[3] = 'F';
  mem_put_le16(header + 4,  0);                 /* version */
  mem_put_le16(header + 6,  32);                /* headersize */
  mem_put_le32(header + 8,  fourcc);            /* headersize */
  mem_put_le16(header + 12, cfg->g_w);          /* width */
  mem_put_le16(header + 14, cfg->g_h);          /* height */
  mem_put_le32(header + 16, cfg->g_timebase.den); /* rate */
  mem_put_le32(header + 20, cfg->g_timebase.num); /* scale */
  mem_put_le32(header + 24, frame_cnt);         /* length */
  mem_put_le32(header + 28, 0);                 /* unused */

  if (fwrite(header, 1, 32, outfile));
John Koleszar's avatar
John Koleszar committed
409
410
411
412
}


static void write_ivf_frame_header(FILE *outfile,
John Koleszar's avatar
John Koleszar committed
413
414
415
                                   const vpx_codec_cx_pkt_t *pkt) {
  char             header[12];
  vpx_codec_pts_t  pts;
John Koleszar's avatar
John Koleszar committed
416

John Koleszar's avatar
John Koleszar committed
417
418
  if (pkt->kind != VPX_CODEC_CX_FRAME_PKT)
    return;
John Koleszar's avatar
John Koleszar committed
419

John Koleszar's avatar
John Koleszar committed
420
421
422
423
  pts = pkt->data.frame.pts;
  mem_put_le32(header, pkt->data.frame.sz);
  mem_put_le32(header + 4, pts & 0xFFFFFFFF);
  mem_put_le32(header + 8, pts >> 32);
John Koleszar's avatar
John Koleszar committed
424

John Koleszar's avatar
John Koleszar committed
425
  if (fwrite(header, 1, 12, outfile));
John Koleszar's avatar
John Koleszar committed
426
427
}

John Koleszar's avatar
John Koleszar committed
428
429
430
431

typedef off_t EbmlLoc;


John Koleszar's avatar
John Koleszar committed
432
433
434
/* One seek cue: the timecode of a cluster and where that cluster starts in
 * the output file. */
struct cue_entry {
  unsigned int time;  /* cluster timecode */
  uint64_t     loc;   /* file offset of the cluster element */
};


John Koleszar's avatar
John Koleszar committed
438
439
struct EbmlGlobal {
  int debug;
440

John Koleszar's avatar
John Koleszar committed
441
442
443
  FILE    *stream;
  int64_t last_pts_ms;
  vpx_rational_t  framerate;
John Koleszar's avatar
John Koleszar committed
444

John Koleszar's avatar
John Koleszar committed
445
446
447
448
449
450
451
  /* These pointers are to the start of an element */
  off_t    position_reference;
  off_t    seek_info_pos;
  off_t    segment_info_pos;
  off_t    track_pos;
  off_t    cue_pos;
  off_t    cluster_pos;
John Koleszar's avatar
John Koleszar committed
452

John Koleszar's avatar
John Koleszar committed
453
454
  /* This pointer is to a specific element to be serialized */
  off_t    track_id_pos;
John Koleszar's avatar
John Koleszar committed
455

John Koleszar's avatar
John Koleszar committed
456
457
458
  /* These pointers are to the size field of the element */
  EbmlLoc  startSegment;
  EbmlLoc  startCluster;
John Koleszar's avatar
John Koleszar committed
459

John Koleszar's avatar
John Koleszar committed
460
461
  uint32_t cluster_timecode;
  int      cluster_open;
John Koleszar's avatar
John Koleszar committed
462

John Koleszar's avatar
John Koleszar committed
463
464
  struct cue_entry *cue_list;
  unsigned int      cues;
John Koleszar's avatar
John Koleszar committed
465
466
467
468

};


John Koleszar's avatar
John Koleszar committed
469
470
/* Write len raw bytes from buffer_in to the writer's output stream.
 * Deliberately best-effort: a short write is not reported. */
void Ebml_Write(EbmlGlobal *glob, const void *buffer_in, unsigned long len) {
  const size_t written = fwrite(buffer_in, 1, len, glob->stream);

  (void)written;
}

473
/* Write the low len bytes of an integer to the stream, most significant
 * byte first.
 *
 * glob:        writer state.
 * buffer_in:   address of the integer to serialize.
 * buffer_size: size in bytes of the object at buffer_in:
 *                1 - int8_t;
 *                2 - int16_t;
 *                4 - int32_t;
 *                8 - int64_t;
 *              any other value writes nothing.
 * len:         number of bytes to emit.
 *
 * The value is loaded with memcpy (no aliasing or alignment assumptions)
 * and sign-extended to 64 bits; bytes requested beyond the 64-bit value
 * repeat the sign, so no shift count ever reaches the operand width.
 */
void Ebml_Serialize(EbmlGlobal *glob, const void *buffer_in, int buffer_size, unsigned long len) {
  uint64_t bits;
  int i;

  switch (buffer_size) {
    case 1: {
      int8_t v;
      memcpy(&v, buffer_in, sizeof(v));
      bits = (uint64_t)(int64_t)v;
      break;
    }
    case 2: {
      int16_t v;
      memcpy(&v, buffer_in, sizeof(v));
      bits = (uint64_t)(int64_t)v;
      break;
    }
    case 4: {
      int32_t v;
      memcpy(&v, buffer_in, sizeof(v));
      bits = (uint64_t)(int64_t)v;
      break;
    }
    case 8: {
      int64_t v;
      memcpy(&v, buffer_in, sizeof(v));
      bits = (uint64_t)v;
      break;
    }
    default:
      return;
  }

  for (i = (int)len - 1; i >= 0; i--) {
    const unsigned int shift = (unsigned int)i * CHAR_BIT;
    unsigned char x;

    if (shift < 64)
      x = (unsigned char)(bits >> shift);
    else
      x = (bits >> 63) ? 0xFF : 0x00;

    Ebml_Write(glob, &x, 1);
  }
}
John Koleszar's avatar
John Koleszar committed
507

508
/* Need a fixed size serializer for the track ID. libmkv provides a 64 bit
John Koleszar's avatar
John Koleszar committed
509
510
 * one, but not a 32 bit one.
 */
John Koleszar's avatar
John Koleszar committed
511
512
513
514
515
static void Ebml_SerializeUnsigned32(EbmlGlobal *glob, unsigned long class_id, uint64_t ui) {
  unsigned char sizeSerialized = 4 | 0x80;
  Ebml_WriteID(glob, class_id);
  Ebml_Serialize(glob, &sizeSerialized, sizeof(sizeSerialized), 1);
  Ebml_Serialize(glob, &ui, sizeof(ui), 4);
John Koleszar's avatar
John Koleszar committed
516
517
518
}


John Koleszar's avatar
John Koleszar committed
519
520
/* Begin an element whose size is not yet known.
 *
 * Writes the element ID, records in *ebmlLoc the stream offset of the size
 * field, and writes an 8-byte "length unknown" placeholder there.
 * Ebml_EndSubElement() later overwrites the placeholder.
 */
static void
Ebml_StartSubElement(EbmlGlobal *glob, EbmlLoc *ebmlLoc,
                     unsigned long class_id) {
  // todo this is always taking 8 bytes, this may need later optimization
  // this is a key that says length unknown
  uint64_t placeholder = LITERALU64(0x01FFFFFFFFFFFFFF);

  Ebml_WriteID(glob, class_id);
  *ebmlLoc = ftello(glob->stream);
  Ebml_Serialize(glob, &placeholder, sizeof(placeholder), 8);
}

static void
John Koleszar's avatar
John Koleszar committed
532
533
534
Ebml_EndSubElement(EbmlGlobal *glob, EbmlLoc *ebmlLoc) {
  off_t pos;
  uint64_t size;
John Koleszar's avatar
John Koleszar committed
535

John Koleszar's avatar
John Koleszar committed
536
537
  /* Save the current stream pointer */
  pos = ftello(glob->stream);
John Koleszar's avatar
John Koleszar committed
538

John Koleszar's avatar
John Koleszar committed
539
540
541
  /* Calculate the size of this element */
  size = pos - *ebmlLoc - 8;
  size |=  LITERALU64(0x0100000000000000);
John Koleszar's avatar
John Koleszar committed
542

John Koleszar's avatar
John Koleszar committed
543
544
545
  /* Seek back to the beginning of the element and write the new size */
  fseeko(glob->stream, *ebmlLoc, SEEK_SET);
  Ebml_Serialize(glob, &size, sizeof(size), 8);
John Koleszar's avatar
John Koleszar committed
546

John Koleszar's avatar
John Koleszar committed
547
548
  /* Reset the stream pointer */
  fseeko(glob->stream, pos, SEEK_SET);
John Koleszar's avatar
John Koleszar committed
549
550
}

John Koleszar's avatar
John Koleszar committed
551
552

static void
John Koleszar's avatar
John Koleszar committed
553
554
555
556
557
558
559
write_webm_seek_element(EbmlGlobal *ebml, unsigned long id, off_t pos) {
  uint64_t offset = pos - ebml->position_reference;
  EbmlLoc start;
  Ebml_StartSubElement(ebml, &start, Seek);
  Ebml_SerializeBinary(ebml, SeekID, id);
  Ebml_SerializeUnsigned64(ebml, SeekPosition, offset);
  Ebml_EndSubElement(ebml, &start);
John Koleszar's avatar
John Koleszar committed
560
561
562
563
}


static void
John Koleszar's avatar
John Koleszar committed
564
write_webm_seek_info(EbmlGlobal *ebml) {
John Koleszar's avatar
John Koleszar committed
565

John Koleszar's avatar
John Koleszar committed
566
  off_t pos;
John Koleszar's avatar
John Koleszar committed
567

John Koleszar's avatar
John Koleszar committed
568
569
  /* Save the current stream pointer */
  pos = ftello(ebml->stream);
John Koleszar's avatar
John Koleszar committed
570

John Koleszar's avatar
John Koleszar committed
571
572
573
574
  if (ebml->seek_info_pos)
    fseeko(ebml->stream, ebml->seek_info_pos, SEEK_SET);
  else
    ebml->seek_info_pos = pos;
John Koleszar's avatar
John Koleszar committed
575

John Koleszar's avatar
John Koleszar committed
576
577
  {
    EbmlLoc start;
John Koleszar's avatar
John Koleszar committed
578

John Koleszar's avatar
John Koleszar committed
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
    Ebml_StartSubElement(ebml, &start, SeekHead);
    write_webm_seek_element(ebml, Tracks, ebml->track_pos);
    write_webm_seek_element(ebml, Cues,   ebml->cue_pos);
    write_webm_seek_element(ebml, Info,   ebml->segment_info_pos);
    Ebml_EndSubElement(ebml, &start);
  }
  {
    // segment info
    EbmlLoc startInfo;
    uint64_t frame_time;

    frame_time = (uint64_t)1000 * ebml->framerate.den
                 / ebml->framerate.num;
    ebml->segment_info_pos = ftello(ebml->stream);
    Ebml_StartSubElement(ebml, &startInfo, Info);
    Ebml_SerializeUnsigned(ebml, TimecodeScale, 1000000);
    Ebml_SerializeFloat(ebml, Segment_Duration,
                        ebml->last_pts_ms + frame_time);
    Ebml_SerializeString(ebml, 0x4D80,
                         ebml->debug ? "vpxenc" : "vpxenc" VERSION_STRING);
    Ebml_SerializeString(ebml, 0x5741,
                         ebml->debug ? "vpxenc" : "vpxenc" VERSION_STRING);
    Ebml_EndSubElement(ebml, &startInfo);
  }
John Koleszar's avatar
John Koleszar committed
603
604
605
606
607
608
}


static void
write_webm_file_header(EbmlGlobal                *glob,
                       const vpx_codec_enc_cfg_t *cfg,
609
                       const struct vpx_rational *fps,
John Koleszar's avatar
John Koleszar committed
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
                       stereo_format_t            stereo_fmt) {
  {
    EbmlLoc start;
    Ebml_StartSubElement(glob, &start, EBML);
    Ebml_SerializeUnsigned(glob, EBMLVersion, 1);
    Ebml_SerializeUnsigned(glob, EBMLReadVersion, 1); // EBML Read Version
    Ebml_SerializeUnsigned(glob, EBMLMaxIDLength, 4); // EBML Max ID Length
    Ebml_SerializeUnsigned(glob, EBMLMaxSizeLength, 8); // EBML Max Size Length
    Ebml_SerializeString(glob, DocType, "webm"); // Doc Type
    Ebml_SerializeUnsigned(glob, DocTypeVersion, 2); // Doc Type Version
    Ebml_SerializeUnsigned(glob, DocTypeReadVersion, 2); // Doc Type Read Version
    Ebml_EndSubElement(glob, &start);
  }
  {
    Ebml_StartSubElement(glob, &glob->startSegment, Segment); // segment
    glob->position_reference = ftello(glob->stream);
    glob->framerate = *fps;
    write_webm_seek_info(glob);

John Koleszar's avatar
John Koleszar committed
629
    {
John Koleszar's avatar
John Koleszar committed
630
631
632
633
634
635
      EbmlLoc trackStart;
      glob->track_pos = ftello(glob->stream);
      Ebml_StartSubElement(glob, &trackStart, Tracks);
      {
        unsigned int trackNumber = 1;
        uint64_t     trackID = 0;
John Koleszar's avatar
John Koleszar committed
636

John Koleszar's avatar
John Koleszar committed
637
638
639
640
641
642
643
        EbmlLoc start;
        Ebml_StartSubElement(glob, &start, TrackEntry);
        Ebml_SerializeUnsigned(glob, TrackNumber, trackNumber);
        glob->track_id_pos = ftello(glob->stream);
        Ebml_SerializeUnsigned32(glob, TrackUID, trackID);
        Ebml_SerializeUnsigned(glob, TrackType, 1); // video is always 1
        Ebml_SerializeString(glob, CodecID, "V_VP8");
John Koleszar's avatar
John Koleszar committed
644
        {
John Koleszar's avatar
John Koleszar committed
645
646
647
648
649
650
651
652
653
654
655
          unsigned int pixelWidth = cfg->g_w;
          unsigned int pixelHeight = cfg->g_h;
          float        frameRate   = (float)fps->num / (float)fps->den;

          EbmlLoc videoStart;
          Ebml_StartSubElement(glob, &videoStart, Video);
          Ebml_SerializeUnsigned(glob, PixelWidth, pixelWidth);
          Ebml_SerializeUnsigned(glob, PixelHeight, pixelHeight);
          Ebml_SerializeUnsigned(glob, StereoMode, stereo_fmt);
          Ebml_SerializeFloat(glob, FrameRate, frameRate);
          Ebml_EndSubElement(glob, &videoStart); // Video
John Koleszar's avatar
John Koleszar committed
656
        }
John Koleszar's avatar
John Koleszar committed
657
658
659
        Ebml_EndSubElement(glob, &start); // Track Entry
      }
      Ebml_EndSubElement(glob, &trackStart);
John Koleszar's avatar
John Koleszar committed
660
    }
John Koleszar's avatar
John Koleszar committed
661
662
    // segment element is open
  }
John Koleszar's avatar
John Koleszar committed
663
664
665
666
667
668
}


static void
write_webm_block(EbmlGlobal                *glob,
                 const vpx_codec_enc_cfg_t *cfg,
John Koleszar's avatar
John Koleszar committed
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
                 const vpx_codec_cx_pkt_t  *pkt) {
  unsigned long  block_length;
  unsigned char  track_number;
  unsigned short block_timecode = 0;
  unsigned char  flags;
  int64_t        pts_ms;
  int            start_cluster = 0, is_keyframe;

  /* Calculate the PTS of this frame in milliseconds */
  pts_ms = pkt->data.frame.pts * 1000
           * (uint64_t)cfg->g_timebase.num / (uint64_t)cfg->g_timebase.den;
  if (pts_ms <= glob->last_pts_ms)
    pts_ms = glob->last_pts_ms + 1;
  glob->last_pts_ms = pts_ms;

  /* Calculate the relative time of this block */
  if (pts_ms - glob->cluster_timecode > SHRT_MAX)
    start_cluster = 1;
  else
    block_timecode = pts_ms - glob->cluster_timecode;

  is_keyframe = (pkt->data.frame.flags & VPX_FRAME_IS_KEY);
  if (start_cluster || is_keyframe) {
    if (glob->cluster_open)
      Ebml_EndSubElement(glob, &glob->startCluster);

    /* Open the new cluster */
    block_timecode = 0;
    glob->cluster_open = 1;
    glob->cluster_timecode = pts_ms;
    glob->cluster_pos = ftello(glob->stream);
    Ebml_StartSubElement(glob, &glob->startCluster, Cluster); // cluster
    Ebml_SerializeUnsigned(glob, Timecode, glob->cluster_timecode);

    /* Save a cue point if this is a keyframe. */
    if (is_keyframe) {
      struct cue_entry *cue, *new_cue_list;

      new_cue_list = realloc(glob->cue_list,
                             (glob->cues + 1) * sizeof(struct cue_entry));
      if (new_cue_list)
        glob->cue_list = new_cue_list;
      else {
        fprintf(stderr, "\nFailed to realloc cue list.\n");
        exit(EXIT_FAILURE);
      }
John Koleszar's avatar
John Koleszar committed
715

John Koleszar's avatar
John Koleszar committed
716
717
718
719
      cue = &glob->cue_list[glob->cues];
      cue->time = glob->cluster_timecode;
      cue->loc = glob->cluster_pos;
      glob->cues++;
John Koleszar's avatar
John Koleszar committed
720
    }
John Koleszar's avatar
John Koleszar committed
721
  }
John Koleszar's avatar
John Koleszar committed
722

John Koleszar's avatar
John Koleszar committed
723
724
  /* Write the Simple Block */
  Ebml_WriteID(glob, SimpleBlock);
John Koleszar's avatar
John Koleszar committed
725

John Koleszar's avatar
John Koleszar committed
726
727
728
  block_length = pkt->data.frame.sz + 4;
  block_length |= 0x10000000;
  Ebml_Serialize(glob, &block_length, sizeof(block_length), 4);
John Koleszar's avatar
John Koleszar committed
729

John Koleszar's avatar
John Koleszar committed
730
731
732
  track_number = 1;
  track_number |= 0x80;
  Ebml_Write(glob, &track_number, 1);
John Koleszar's avatar
John Koleszar committed
733

John Koleszar's avatar
John Koleszar committed
734
  Ebml_Serialize(glob, &block_timecode, sizeof(block_timecode), 2);
John Koleszar's avatar
John Koleszar committed
735

John Koleszar's avatar
John Koleszar committed
736
737
738
739
740
741
  flags = 0;
  if (is_keyframe)
    flags |= 0x80;
  if (pkt->data.frame.flags & VPX_FRAME_IS_INVISIBLE)
    flags |= 0x08;
  Ebml_Write(glob, &flags, 1);
John Koleszar's avatar
John Koleszar committed
742

John Koleszar's avatar
John Koleszar committed
743
  Ebml_Write(glob, pkt->data.frame.buf, pkt->data.frame.sz);
John Koleszar's avatar
John Koleszar committed
744
745
746
747
}


static void
John Koleszar's avatar
John Koleszar committed
748
write_webm_file_footer(EbmlGlobal *glob, long hash) {
John Koleszar's avatar
John Koleszar committed
749

John Koleszar's avatar
John Koleszar committed
750
751
  if (glob->cluster_open)
    Ebml_EndSubElement(glob, &glob->startCluster);
John Koleszar's avatar
John Koleszar committed
752

John Koleszar's avatar
John Koleszar committed
753
754
755
  {
    EbmlLoc start;
    int i;
John Koleszar's avatar
John Koleszar committed
756

John Koleszar's avatar
John Koleszar committed
757
758
759
760
761
    glob->cue_pos = ftello(glob->stream);
    Ebml_StartSubElement(glob, &start, Cues);
    for (i = 0; i < glob->cues; i++) {
      struct cue_entry *cue = &glob->cue_list[i];
      EbmlLoc start;
John Koleszar's avatar
John Koleszar committed
762

John Koleszar's avatar
John Koleszar committed
763
764
765
      Ebml_StartSubElement(glob, &start, CuePoint);
      {
        EbmlLoc start;
John Koleszar's avatar
John Koleszar committed
766

John Koleszar's avatar
John Koleszar committed
767
        Ebml_SerializeUnsigned(glob, CueTime, cue->time);
John Koleszar's avatar
John Koleszar committed
768

John Koleszar's avatar
John Koleszar committed
769
770
771
772
773
        Ebml_StartSubElement(glob, &start, CueTrackPositions);
        Ebml_SerializeUnsigned(glob, CueTrack, 1);
        Ebml_SerializeUnsigned64(glob, CueClusterPosition,
                                 cue->loc - glob->position_reference);
        // Ebml_SerializeUnsigned(glob, CueBlockNumber, cue->blockNumber);
John Koleszar's avatar
John Koleszar committed
774
        Ebml_EndSubElement(glob, &start);
John Koleszar's avatar
John Koleszar committed
775
776
      }
      Ebml_EndSubElement(glob, &start);
John Koleszar's avatar
John Koleszar committed
777
    }
John Koleszar's avatar
John Koleszar committed
778
779
    Ebml_EndSubElement(glob, &start);
  }
John Koleszar's avatar
John Koleszar committed
780

John Koleszar's avatar
John Koleszar committed
781
  Ebml_EndSubElement(glob, &glob->startSegment);
John Koleszar's avatar
John Koleszar committed
782

John Koleszar's avatar
John Koleszar committed
783
784
  /* Patch up the seek info block */
  write_webm_seek_info(glob);
John Koleszar's avatar
John Koleszar committed
785

John Koleszar's avatar
John Koleszar committed
786
787
788
  /* Patch up the track id */
  fseeko(glob->stream, glob->track_id_pos, SEEK_SET);
  Ebml_SerializeUnsigned32(glob, TrackUID, glob->debug ? 0xDEADBEEF : hash);
John Koleszar's avatar
John Koleszar committed
789

John Koleszar's avatar
John Koleszar committed
790
  fseeko(glob->stream, 0, SEEK_END);
John Koleszar's avatar
John Koleszar committed
791
792
793
}


John Koleszar's avatar
John Koleszar committed
794
/* Murmur hash derived from public domain reference implementation at
 *   http://sites.google.com/site/murmurhash/
 *
 * Hashes the len bytes starting at key, mixing in seed, and returns the
 * resulting hash value. Whole 4-byte groups are assembled byte by byte
 * (lowest byte first), so key needs no particular alignment and the
 * result does not depend on host byte order. A len of zero or less reads
 * no input bytes.
 */
static unsigned int murmur(const void *key, int len, unsigned int seed) {
  const unsigned int m = 0x5bd1e995;
  const int r = 24;

  unsigned int h = seed ^ len;

  const unsigned char *data = (const unsigned char *)key;

  while (len >= 4) {
    unsigned int k;

    /* Widen each byte to unsigned before shifting: an unsigned char
     * promotes to (signed) int, and shifting a value >= 0x80 left by 24
     * would move a bit into the sign position, which is undefined.
     */
    k  = (unsigned int)data[0];
    k |= (unsigned int)data[1] << 8;
    k |= (unsigned int)data[2] << 16;
    k |= (unsigned int)data[3] << 24;

    k *= m;
    k ^= k >> r;
    k *= m;

    h *= m;
    h ^= k;

    data += 4;
    len -= 4;
  }

  /* Fold in the 1-3 trailing bytes; each case deliberately continues
   * into the next one.
   */
  switch (len) {
    case 3:
      h ^= (unsigned int)data[2] << 16;
      /* fallthrough */
    case 2:
      h ^= (unsigned int)data[1] << 8;
      /* fallthrough */
    case 1:
      h ^= data[0];
      h *= m;
      break;
    default:
      break;
  }

  /* Final avalanche. */
  h ^= h >> 13;
  h *= m;
  h ^= h >> 15;

  return h;
}

841
#include "math.h"
842
#define MAX_PSNR 100
John Koleszar's avatar
John Koleszar committed
843
844
static double vp8_mse2psnr(double Samples, double Peak, double Mse) {
  double psnr;
845

John Koleszar's avatar
John Koleszar committed
846
847
848
849
  if ((double)Mse > 0.0)
    psnr = 10.0 * log10(Peak * Peak * Samples / Mse);
  else
    psnr = MAX_PSNR;      // Limit to prevent / 0
850

John Koleszar's avatar
John Koleszar committed
851
852
  if (psnr > MAX_PSNR)
    psnr = MAX_PSNR;
853

John Koleszar's avatar
John Koleszar committed
854
  return psnr;
855
856
}

John Koleszar's avatar
John Koleszar committed
857

John Koleszar's avatar
John Koleszar committed
858
859
#include "args.h"

860
static const arg_def_t debugmode = ARG_DEF("D", "debug", 0,
John Koleszar's avatar
John Koleszar committed
861
                                           "Debug mode (makes output deterministic)");
862
static const arg_def_t outputfile = ARG_DEF("o", "output", 1,
John Koleszar's avatar
John Koleszar committed
863
                                            "Output filename");
John Koleszar's avatar
John Koleszar committed
864
static const arg_def_t use_yv12 = ARG_DEF(NULL, "yv12", 0,
John Koleszar's avatar
John Koleszar committed
865
                                          "Input file is YV12 ");
John Koleszar's avatar
John Koleszar committed
866
static const arg_def_t use_i420 = ARG_DEF(NULL, "i420", 0,
John Koleszar's avatar
John Koleszar committed
867
                                          "Input file is I420 (default)");
John Koleszar's avatar
John Koleszar committed
868
static const arg_def_t codecarg = ARG_DEF(NULL, "codec", 1,
John Koleszar's avatar
John Koleszar committed
869
                                          "Codec to use");
John Koleszar's avatar
John Koleszar committed
870
static const arg_def_t passes           = ARG_DEF("p", "passes", 1,
John Koleszar's avatar
John Koleszar committed
871
                                                  "Number of passes (1/2)");
John Koleszar's avatar
John Koleszar committed
872
static const arg_def_t pass_arg         = ARG_DEF(NULL, "pass", 1,
John Koleszar's avatar
John Koleszar committed
873
                                                  "Pass to execute (1/2)");
John Koleszar's avatar
John Koleszar committed
874
static const arg_def_t fpf_name         = ARG_DEF(NULL, "fpf", 1,
John Koleszar's avatar
John Koleszar committed
875
                                                  "First pass statistics file name");
John Koleszar's avatar
John Koleszar committed
876
877
static const arg_def_t limit = ARG_DEF(NULL, "limit", 1,
                                       "Stop encoding after n input frames");
878
static const arg_def_t skip = ARG_DEF(NULL, "skip", 1,
John Koleszar's avatar
John Koleszar committed
879
                                      "Skip the first n input frames");
John Koleszar's avatar
John Koleszar committed
880
static const arg_def_t deadline         = ARG_DEF("d", "deadline", 1,
John Koleszar's avatar
John Koleszar committed
881
                                                  "Deadline per frame (usec)");
John Koleszar's avatar
John Koleszar committed
882
static const arg_def_t best_dl          = ARG_DEF(NULL, "best", 0,
John Koleszar's avatar
John Koleszar committed
883
                                                  "Use Best Quality Deadline");
John Koleszar's avatar
John Koleszar committed
884
static const arg_def_t good_dl          = ARG_DEF(NULL, "good", 0,
John Koleszar's avatar
John Koleszar committed
885
                                                  "Use Good Quality Deadline");
John Koleszar's avatar
John Koleszar committed
886
static const arg_def_t rt_dl            = ARG_DEF(NULL, "rt", 0,
John Koleszar's avatar
John Koleszar committed
887
                                                  "Use Realtime Quality Deadline");
John Koleszar's avatar
John Koleszar committed
888
static const arg_def_t verbosearg       = ARG_DEF("v", "verbose", 0,
John Koleszar's avatar
John Koleszar committed
889
                                                  "Show encoder parameters");
John Koleszar's avatar
John Koleszar committed
890
static const arg_def_t psnrarg          = ARG_DEF(NULL, "psnr", 0,
John Koleszar's avatar
John Koleszar committed
891
                                                  "Show PSNR in status line");
892
static const arg_def_t recontest        = ARG_DEF(NULL, "test-decode", 0,
John Koleszar's avatar
John Koleszar committed
893
                                                  "Test enocde/decode have machted recon buffer");
894
static const arg_def_t framerate        = ARG_DEF(NULL, "fps", 1,
John Koleszar's avatar
John Koleszar committed
895
                                                  "Stream frame rate (rate/scale)");
John Koleszar's avatar
John Koleszar committed
896
static const arg_def_t use_ivf          = ARG_DEF(NULL, "ivf", 0,
John Koleszar's avatar
John Koleszar committed
897
                                                  "Output IVF (default is WebM)");
898
static const arg_def_t q_hist_n         = ARG_DEF(NULL, "q-hist", 1,
John Koleszar's avatar
John Koleszar committed
899
                                                  "Show quantizer histogram (n-buckets)");
900
static const arg_def_t rate_hist_n         = ARG_DEF(NULL, "rate-hist", 1,
John Koleszar's avatar
John Koleszar committed
901
                                                     "Show rate histogram (n-buckets)");
Hui Su's avatar
Hui Su committed
902
903
#if CONFIG_LOSSLESS
static const arg_def_t lossless_enabled = ARG_DEF(NULL, "lossless", 0,
John Koleszar's avatar
John Koleszar committed
904
                                                  "Enable lossless compression");
Hui Su's avatar
Hui Su committed
905
#endif
John Koleszar's avatar
John Koleszar committed
906
907
908
909
910
911
static const arg_def_t *main_args[] = {
  &debugmode,
  &outputfile, &codecarg, &passes, &pass_arg, &fpf_name, &limit, &skip,
  &deadline,
  &best_dl, &good_dl, &rt_dl,
  &verbosearg, &psnrarg, &recontest, &use_ivf, &q_hist_n, &rate_hist_n,
Hui Su's avatar
Hui Su committed
912
#if CONFIG_LOSSLESS
John Koleszar's avatar
John Koleszar committed
913
  &lossless_enabled,
Hui Su's avatar
Hui Su committed
914
#endif
John Koleszar's avatar
John Koleszar committed
915
  NULL
John Koleszar's avatar
John Koleszar committed
916
917
918
};

static const arg_def_t usage            = ARG_DEF("u", "usage", 1,
John Koleszar's avatar
John Koleszar committed
919
                                                  "Usage profile number to use");
John Koleszar's avatar
John Koleszar committed
920
static const arg_def_t threads          = ARG_DEF("t", "threads", 1,
John Koleszar's avatar
John Koleszar committed
921
                                                  "Max number of threads to use");
John Koleszar's avatar
John Koleszar committed
922
static const arg_def_t profile          = ARG_DEF(NULL, "profile", 1,
John Koleszar's avatar
John Koleszar committed
923
                                                  "Bitstream profile number to use");
John Koleszar's avatar
John Koleszar committed
924
static const arg_def_t width            = ARG_DEF("w", "width", 1,
John Koleszar's avatar
John Koleszar committed
925
                                                  "Frame width");
John Koleszar's avatar
John Koleszar committed
926
static const arg_def_t height           = ARG_DEF("h", "height", 1,
John Koleszar's avatar
John Koleszar committed
927
                                                  "Frame height");
928
static const struct arg_enum_list stereo_mode_enum[] = {
John Koleszar's avatar
John Koleszar committed
929
930
931
932
933
934
  {"mono", STEREO_FORMAT_MONO},
  {"left-right", STEREO_FORMAT_LEFT_RIGHT},
  {"bottom-top", STEREO_FORMAT_BOTTOM_TOP},
  {"top-bottom", STEREO_FORMAT_TOP_BOTTOM},
  {"right-left", STEREO_FORMAT_RIGHT_LEFT},
  {NULL, 0}
935
936
};
static const arg_def_t stereo_mode      = ARG_DEF_ENUM(NULL, "stereo-mode", 1,
John Koleszar's avatar
John Koleszar committed
937
                                                       "Stereo 3D video format", stereo_mode_enum);
John Koleszar's avatar
John Koleszar committed
938
static const arg_def_t timebase         = ARG_DEF(NULL, "timebase", 1,
John Koleszar's avatar
John Koleszar committed
939
                                                  "Output timestamp precision (fractional seconds)");
John Koleszar's avatar
John Koleszar committed
940
static const arg_def_t error_resilient  = ARG_DEF(NULL, "error-resilient", 1,
John Koleszar's avatar
John Koleszar committed
941
                                                  "Enable error resiliency features");
John Koleszar's avatar
John Koleszar committed
942
static const arg_def_t lag_in_frames    = ARG_DEF(NULL, "lag-in-frames", 1,
John Koleszar's avatar
John Koleszar committed
943
                                                  "Max number of frames to lag");
John Koleszar's avatar
John Koleszar committed
944

John Koleszar's avatar
John Koleszar committed
945
946
947
948
static const arg_def_t *global_args[] = {
  &use_yv12, &use_i420, &usage, &threads, &profile,
  &width, &height, &stereo_mode, &timebase, &framerate, &error_resilient,
  &lag_in_frames, NULL
John Koleszar's avatar
John Koleszar committed
949
950
951
};

static const arg_def_t dropframe_thresh   = ARG_DEF(NULL, "drop-frame", 1,
John Koleszar's avatar
John Koleszar committed
952
                                                    "Temporal resampling threshold (buf %)");
John Koleszar's avatar
John Koleszar committed
953
static const arg_def_t resize_allowed     = ARG_DEF(NULL, "resize-allowed", 1,
John Koleszar's avatar
John Koleszar committed
954
                                                    "Spatial resampling enabled (bool)");
John Koleszar's avatar
John Koleszar committed
955
static const arg_def_t resize_up_thresh   = ARG_DEF(NULL, "resize-up", 1,
John Koleszar's avatar
John Koleszar committed
956
                                                    "Upscale threshold (buf %)");
John Koleszar's avatar
John Koleszar committed
957
static const arg_def_t resize_down_thresh = ARG_DEF(NULL, "resize-down", 1,
John Koleszar's avatar
John Koleszar committed
958
                                                    "Downscale threshold (buf %)");
959
static const struct arg_enum_list end_usage_enum[] = {
John Koleszar's avatar
John Koleszar committed
960
961
962
963
  {"vbr", VPX_VBR},
  {"cbr", VPX_CBR},
  {"cq",  VPX_CQ},
  {NULL, 0}
964
965
};
static const arg_def_t end_usage          = ARG_DEF_ENUM(NULL, "end-usage", 1,
John Koleszar's avatar
John Koleszar committed
966
                                                         "Rate control mode", end_usage_enum);
John Koleszar's avatar
John Koleszar committed
967
static const arg_def_t target_bitrate     = ARG_DEF(NULL, "target-bitrate", 1,
John Koleszar's avatar
John Koleszar committed
968
                                                    "Bitrate (kbps)");
John Koleszar's avatar
John Koleszar committed
969
static const arg_def_t min_quantizer      = ARG_DEF(NULL, "min-q", 1,
John Koleszar's avatar
John Koleszar committed
970
                                                    "Minimum (best) quantizer");
John Koleszar's avatar
John Koleszar committed
971
static const arg_def_t max_quantizer      = ARG_DEF(NULL, "max-q", 1,
John Koleszar's avatar
John Koleszar committed
972
                                                    "Maximum (worst) quantizer");
John Koleszar's avatar
John Koleszar committed
973
static const arg_def_t undershoot_pct     = ARG_DEF(NULL, "undershoot-pct", 1,
John Koleszar's avatar
John Koleszar committed
974
                                                    "Datarate undershoot (min) target (%)");
John Koleszar's avatar
John Koleszar committed
975
static const arg_def_t overshoot_pct      = ARG_DEF(NULL, "overshoot-pct", 1,
John Koleszar's avatar
John Koleszar committed
976
                                                    "Datarate overshoot (max) target (%)");
John Koleszar's avatar
John Koleszar committed
977
static const arg_def_t buf_sz             = ARG_DEF(NULL, "buf-sz", 1,
John Koleszar's avatar
John Koleszar committed
978
                                                    "Client buffer size (ms)");
John Koleszar's avatar
John Koleszar committed
979
static const arg_def_t buf_initial_sz     = ARG_DEF(NULL, "buf-initial-sz", 1,
John Koleszar's avatar
John Koleszar committed
980
                                                    "Client initial buffer size (ms)");
John Koleszar's avatar
John Koleszar committed
981
static const arg_def_t buf_optimal_sz     = ARG_DEF(NULL, "buf-optimal-sz", 1,
John Koleszar's avatar
John Koleszar committed
982
983
984
985
986
987
                                                    "Client optimal buffer size (ms)");
static const arg_def_t *rc_args[] = {
  &dropframe_thresh, &resize_allowed, &resize_up_thresh, &resize_down_thresh,
  &end_usage, &target_bitrate, &min_quantizer, &max_quantizer,
  &undershoot_pct, &overshoot_pct, &buf_sz, &buf_initial_sz, &buf_optimal_sz,
  NULL
John Koleszar's avatar
John Koleszar committed
988
989
990
991
};


/* Two-pass rate control options (shown under
 * "Twopass Rate Control Options").
 */
static const arg_def_t bias_pct =
    ARG_DEF(NULL, "bias-pct", 1, "CBR/VBR bias (0=CBR, 100=VBR)");
static const arg_def_t minsection_pct =
    ARG_DEF(NULL, "minsection-pct", 1, "GOP min bitrate (% of target)");
static const arg_def_t maxsection_pct =
    ARG_DEF(NULL, "maxsection-pct", 1, "GOP max bitrate (% of target)");

/* NULL-terminated list of the two-pass rate control options. */
static const arg_def_t *rc_twopass_args[] = {
  &bias_pct,
  &minsection_pct,
  &maxsection_pct,
  NULL
};


/* Keyframe placement options (shown under "Keyframe Placement Options"). */
static const arg_def_t kf_min_dist =
    ARG_DEF(NULL, "kf-min-dist", 1, "Minimum keyframe interval (frames)");
static const arg_def_t kf_max_dist =
    ARG_DEF(NULL, "kf-max-dist", 1, "Maximum keyframe interval (frames)");
static const arg_def_t kf_disabled =
    ARG_DEF(NULL, "disable-kf", 0, "Disable keyframe placement");

/* NULL-terminated list of the keyframe placement options. */
static const arg_def_t *kf_args[] = {
  &kf_min_dist,
  &kf_max_dist,
  &kf_disabled,
  NULL
};


#if CONFIG_VP8_ENCODER
/* VP8-specific options (shown under "VP8 Specific Options"). */
static const arg_def_t noise_sens =
    ARG_DEF(NULL, "noise-sensitivity", 1,
            "Noise sensitivity (frames to blur)");
static const arg_def_t sharpness =
    ARG_DEF(NULL, "sharpness", 1, "Filter sharpness (0-7)");
static const arg_def_t static_thresh =
    ARG_DEF(NULL, "static-thresh", 1, "Motion detection threshold");
static const arg_def_t cpu_used =
    ARG_DEF(NULL, "cpu-used", 1, "CPU Used (-16..16)");
static const arg_def_t token_parts =
    ARG_DEF(NULL, "token-parts", 1,
            "Number of token partitions to use, log2");
static const arg_def_t auto_altref =
    ARG_DEF(NULL, "auto-alt-ref", 1,
            "Enable automatic alt reference frames");
static const arg_def_t arnr_maxframes =
    ARG_DEF(NULL, "arnr-maxframes", 1, "AltRef Max Frames");
static const arg_def_t arnr_strength =
    ARG_DEF(NULL, "arnr-strength", 1, "AltRef Strength");
static const arg_def_t arnr_type =
    ARG_DEF(NULL, "arnr-type", 1, "AltRef Type");

/* Names accepted by --tune and the value each maps to;
 * terminated by a {NULL, 0} entry.
 */
static const struct arg_enum_list tuning_enum[] = {
  { "psnr", VP8_TUNE_PSNR },
  { "ssim", VP8_TUNE_SSIM },
  { NULL, 0 }
};
static const arg_def_t tune_ssim =
    ARG_DEF_ENUM(NULL, "tune", 1, "Material to favor", tuning_enum);
static const arg_def_t cq_level =
    ARG_DEF(NULL, "cq-level", 1, "Constrained Quality Level");
static const arg_def_t max_intra_rate_pct =
    ARG_DEF(NULL, "max-intra-rate", 1, "Max I-frame bitrate (pct)");

/* NULL-terminated list of the VP8-specific options.
 * NOTE(review): the entries appear to be index-matched with
 * vp8_arg_ctrl_map below -- keep both tables in the same order and
 * confirm at the use site.
 */
static const arg_def_t *vp8_args[] = {
  &cpu_used,
  &auto_altref,
  &noise_sens,
  &sharpness,
  &static_thresh,
  &token_parts,
  &arnr_maxframes,
  &arnr_strength,
  &arnr_type,
  &tune_ssim,
  &cq_level,
  &max_intra_rate_pct,
  NULL
};

/* Encoder control identifiers, one per vp8_args entry in the same
 * order, terminated by 0.
 */
static const int vp8_arg_ctrl_map[] = {
  VP8E_SET_CPUUSED,
  VP8E_SET_ENABLEAUTOALTREF,
  VP8E_SET_NOISE_SENSITIVITY,
  VP8E_SET_SHARPNESS,
  VP8E_SET_STATIC_THRESHOLD,
  VP8E_SET_TOKEN_PARTITIONS,
  VP8E_SET_ARNR_MAXFRAMES,
  VP8E_SET_ARNR_STRENGTH,
  VP8E_SET_ARNR_TYPE,
  VP8E_SET_TUNING,
  VP8E_SET_CQ_LEVEL,
  VP8E_SET_MAX_INTRA_BITRATE_PCT,
  0
};
#endif

/* Empty, NULL-terminated option list. */
static const arg_def_t *no_args[] = { NULL };

John Koleszar's avatar
John Koleszar committed
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
/* Print the full command line help and terminate the program.
 *
 * Writes the usage line, every option group, the timebase note and the
 * list of compiled-in encoders, then calls exit(EXIT_FAILURE); this
 * function does not return.
 *
 * All output goes to stderr. The section headings were already written
 * there; sending the option tables to the same stream keeps the help text
 * in one piece when a stream is redirected.
 */
static void usage_exit(void) {
  size_t i;

  fprintf(stderr, "Usage: %s <options> -o dst_filename src_filename \n",
          exec_name);

  fprintf(stderr, "\nOptions:\n");
  arg_show_usage(stderr, main_args);
  fprintf(stderr, "\nEncoder Global Options:\n");
  arg_show_usage(stderr, global_args);
  fprintf(stderr, "\nRate Control Options:\n");
  arg_show_usage(stderr, rc_args);
  fprintf(stderr, "\nTwopass Rate Control Options:\n");
  arg_show_usage(stderr, rc_twopass_args);
  fprintf(stderr, "\nKeyframe Placement Options:\n");
  arg_show_usage(stderr, kf_args);
#if CONFIG_VP8_ENCODER
  fprintf(stderr, "\nVP8 Specific Options:\n");
  arg_show_usage(stderr, vp8_args);
#endif
  fprintf(stderr, "\nStream timebase (--timebase):\n"
          "  The desired precision of timestamps in the output, expressed\n"
          "  in fractional seconds. Default is 1/1000.\n");
  fprintf(stderr, "\n"
          "Included encoders:\n"
          "\n");

  /* size_t index: the bound is a sizeof expression, i.e. unsigned. */
  for (i = 0; i < sizeof(codecs) / sizeof(codecs[0]); i++)
    fprintf(stderr, "    %-6s - %s\n",
            codecs[i].name,
            vpx_codec_iface_name(codecs[i].iface));

  exit(EXIT_FAILURE);
}

1102
1103

#define HIST_BAR_MAX 40
John Koleszar's avatar
John Koleszar committed
1104
1105
/* One bucket of a histogram. */
struct hist_bucket {
  int low;    /* presumably the lower bound of the bucket's range -- confirm */
  int high;   /* presumably the upper bound of the bucket's range -- confirm */
  int count;  /* tally for this bucket; compared when buckets are merged */
};


static int merge_hist_buckets(struct hist_bucket *bucket,
                              int *buckets_,
John Koleszar's avatar
John Koleszar committed
1111
1112
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
                              int max_buckets) {
  int small_bucket = 0, merge_bucket = INT_MAX, big_bucket = 0;
  int buckets = *buckets_;
  int i;

  /* Find the extrema for this list of buckets */
  big_bucket = small_bucket = 0;
  for (i = 0; i < buckets; i++) {
    if (bucket[i].count < bucket[small_bucket].count)
      small_bucket = i;
    if (bucket[i].count > bucket[big_bucket].count)
      big_bucket = i;
  }

  /* If we have too many buckets, merge the smallest with an adjacent
   * bucket.