vp9_firstpass.c 91 KB
Newer Older
John Koleszar's avatar
John Koleszar committed
1
/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

#include "math.h"
#include "limits.h"
13
14
15
16
17
18
#include "vp9/encoder/vp9_block.h"
#include "vp9/encoder/vp9_onyx_int.h"
#include "vp9/encoder/vp9_variance.h"
#include "vp9/encoder/vp9_encodeintra.h"
#include "vp9/encoder/vp9_mcomp.h"
#include "vp9/encoder/vp9_firstpass.h"
Johann's avatar
Johann committed
19
#include "vpx_scale/vpx_scale.h"
20
#include "vp9/encoder/vp9_encodeframe.h"
21
#include "vp9/encoder/vp9_encodemb.h"
22
23
#include "vp9/common/vp9_extend.h"
#include "vp9/common/vp9_systemdependent.h"
John Koleszar's avatar
John Koleszar committed
24
#include "vpx_mem/vpx_mem.h"
25
#include "vpx_scale/yv12config.h"
John Koleszar's avatar
John Koleszar committed
26
#include <stdio.h>
27
#include "vp9/encoder/vp9_quantize.h"
28
29
#include "vp9/encoder/vp9_rdopt.h"
#include "vp9/encoder/vp9_ratectrl.h"
30
31
#include "vp9/common/vp9_quant_common.h"
#include "vp9/common/vp9_entropymv.h"
32
#include "vp9/encoder/vp9_encodemv.h"
33
#include "./vpx_scale_rtcd.h"
34
35
// TODO(jkoleszar): for setup_dst_planes
#include "vp9/common/vp9_reconinter.h"
John Koleszar's avatar
John Koleszar committed
36

37
// Set to 1 to compile in the temporary first-pass stats text dump guarded by
// "#if OUTPUT_FPF" in this file.
#define OUTPUT_FPF 0

// Tuning constants. Their consumers are not all visible in the part of the
// file reviewed here, so their meaning is not restated.
#define IIFACTOR   12.5
#define IIKFACTOR1 12.5
#define IIKFACTOR2 15.0
#define RMAX       512.0
#define GF_RMAX    96.0
#define ERR_DIVISOR   150.0
#define MIN_DECAY_FACTOR 0.1

#define KF_MB_INTRA_MIN 150
#define GF_MB_INTRA_MIN 100

// Moves x away from zero by 0.000001 (keeping its sign side) so that the
// result can be used as a divisor.
#define DOUBLE_DIVIDE_CHECK(x) ((x) < 0 ? (x) - 0.000001 : (x) + 0.000001)

// two_pass_vbrbias expressed as a fraction. Both macros read a variable named
// "cpi" at the point of expansion. The expansion is fully parenthesized so it
// behaves as a single operand in any surrounding expression
// (e.g. "1.0 / POW1").
#define POW1 ((double)cpi->oxcf.two_pass_vbrbias / 100.0)
#define POW2 ((double)cpi->oxcf.two_pass_vbrbias / 100.0)

55
56
57
58
59
60
// Exchanges the contents of two frame buffer descriptors (struct copy, by
// value).
static void swap_yv12(YV12_BUFFER_CONFIG *a, YV12_BUFFER_CONFIG *b) {
  const YV12_BUFFER_CONFIG saved_b = *b;
  *b = *a;
  *a = saved_b;
}

61
static void find_next_key_frame(VP9_COMP *cpi, FIRSTPASS_STATS *this_frame);
Paul Wilkins's avatar
Paul Wilkins committed
62

John Koleszar's avatar
John Koleszar committed
63
64
65
// Returns the smallest quantizer index whose real Q value (as reported by
// vp9_convert_qindex_to_q) is at least q(qindex) * 0.5847 + 1.0, or
// QINDEX_RANGE - 1 when no index satisfies that.
static int select_cq_level(int qindex) {
  const double target_q = (vp9_convert_qindex_to_q(qindex) * 0.5847) + 1.0;
  int level = 0;

  // Written as !(a <= b) so the comparison behaves the same for every input,
  // including unordered values.
  while (level < QINDEX_RANGE &&
         !(target_q <= vp9_convert_qindex_to_q(level))) {
    ++level;
  }

  return (level < QINDEX_RANGE) ? level : QINDEX_RANGE - 1;
}
Paul Wilkins's avatar
CQ Mode    
Paul Wilkins committed
78

John Koleszar's avatar
John Koleszar committed
79
80

// Resets the first pass file to the given position using a relative seek from the current position
81
82
static void reset_fpf_position(VP9_COMP *cpi, FIRSTPASS_STATS *position) {
  cpi->twopass.stats_in = position;
John Koleszar's avatar
John Koleszar committed
83
84
}

85
// Copies the stats entry under the read cursor into *next_frame without
// advancing the cursor. Returns 1 on success, EOF when the cursor is at or
// past stats_in_end.
static int lookup_next_frame_stats(VP9_COMP *cpi, FIRSTPASS_STATS *next_frame) {
  if (cpi->twopass.stats_in < cpi->twopass.stats_in_end) {
    *next_frame = *cpi->twopass.stats_in;
    return 1;
  }

  return EOF;
}

93
// Read frame stats at an offset from the current position
94
static int read_frame_stats(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
                            FIRSTPASS_STATS *frame_stats,
                            int offset) {
  FIRSTPASS_STATS *fps_ptr = cpi->twopass.stats_in;

  // Check legality of offset
  if (offset >= 0) {
    if (&fps_ptr[offset] >= cpi->twopass.stats_in_end)
      return EOF;
  } else if (offset < 0) {
    if (&fps_ptr[offset] < cpi->twopass.stats_in_start)
      return EOF;
  }

  *frame_stats = fps_ptr[offset];
  return 1;
110
111
}

112
// Copies the stats entry under the read cursor into *fps and then advances
// the cursor by one FIRSTPASS_STATS entry. Returns 1 on success, EOF when the
// cursor is at or past stats_in_end (the cursor is not moved in that case).
static int input_stats(VP9_COMP *cpi, FIRSTPASS_STATS *fps) {
  if (cpi->twopass.stats_in < cpi->twopass.stats_in_end) {
    *fps = *cpi->twopass.stats_in;
    ++cpi->twopass.stats_in;
    return 1;
  }

  return EOF;
}

122
static void output_stats(const VP9_COMP            *cpi,
123
                         struct vpx_codec_pkt_list *pktlist,
John Koleszar's avatar
John Koleszar committed
124
125
126
127
128
129
                         FIRSTPASS_STATS            *stats) {
  struct vpx_codec_cx_pkt pkt;
  pkt.kind = VPX_CODEC_STATS_PKT;
  pkt.data.twopass_stats.buf = stats;
  pkt.data.twopass_stats.sz = sizeof(FIRSTPASS_STATS);
  vpx_codec_pkt_list_add(pktlist, &pkt);
130
131
132
133

// TEMP debug code
#if OUTPUT_FPF

John Koleszar's avatar
John Koleszar committed
134
135
136
137
  {
    FILE *fpfile;
    fpfile = fopen("firstpass.stt", "a");

138
    fprintf(stdout, "%12.0f %12.0f %12.0f %12.0f %12.0f %12.4f %12.4f"
John Koleszar's avatar
John Koleszar committed
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
            "%12.4f %12.4f %12.4f %12.4f %12.4f %12.4f %12.4f"
            "%12.0f %12.0f %12.4f %12.0f %12.0f %12.4f\n",
            stats->frame,
            stats->intra_error,
            stats->coded_error,
            stats->sr_coded_error,
            stats->ssim_weighted_pred_err,
            stats->pcnt_inter,
            stats->pcnt_motion,
            stats->pcnt_second_ref,
            stats->pcnt_neutral,
            stats->MVr,
            stats->mvr_abs,
            stats->MVc,
            stats->mvc_abs,
            stats->MVrv,
            stats->MVcv,
            stats->mv_in_out_count,
            stats->new_mv_count,
            stats->count,
            stats->duration);
    fclose(fpfile);
  }
162
163
164
#endif
}

John Koleszar's avatar
John Koleszar committed
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
// Resets a stats record: every accumulated field listed below is set to 0.0,
// except duration, which is set to 1.0.
static void zero_stats(FIRSTPASS_STATS *section) {
  // Frame index and frame count.
  section->frame = 0.0;
  section->count = 0.0;

  // Error scores.
  section->intra_error = 0.0;
  section->coded_error = 0.0;
  section->sr_coded_error = 0.0;
  section->ssim_weighted_pred_err = 0.0;

  // Percentage style fields.
  section->pcnt_inter = 0.0;
  section->pcnt_motion = 0.0;
  section->pcnt_second_ref = 0.0;
  section->pcnt_neutral = 0.0;

  // Motion vector statistics.
  section->MVr = 0.0;
  section->mvr_abs = 0.0;
  section->MVc = 0.0;
  section->mvc_abs = 0.0;
  section->MVrv = 0.0;
  section->MVcv = 0.0;
  section->mv_in_out_count = 0.0;
  section->new_mv_count = 0.0;

  section->duration = 1.0;
}

John Koleszar's avatar
John Koleszar committed
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
// Adds every field of *frame to the corresponding field of *section.
static void accumulate_stats(FIRSTPASS_STATS *section, FIRSTPASS_STATS *frame) {
#define FPS_ADD_FIELD(field) (section->field += frame->field)
  FPS_ADD_FIELD(frame);
  FPS_ADD_FIELD(intra_error);
  FPS_ADD_FIELD(coded_error);
  FPS_ADD_FIELD(sr_coded_error);
  FPS_ADD_FIELD(ssim_weighted_pred_err);
  FPS_ADD_FIELD(pcnt_inter);
  FPS_ADD_FIELD(pcnt_motion);
  FPS_ADD_FIELD(pcnt_second_ref);
  FPS_ADD_FIELD(pcnt_neutral);
  FPS_ADD_FIELD(MVr);
  FPS_ADD_FIELD(mvr_abs);
  FPS_ADD_FIELD(MVc);
  FPS_ADD_FIELD(mvc_abs);
  FPS_ADD_FIELD(MVrv);
  FPS_ADD_FIELD(MVcv);
  FPS_ADD_FIELD(mv_in_out_count);
  FPS_ADD_FIELD(new_mv_count);
  FPS_ADD_FIELD(count);
  FPS_ADD_FIELD(duration);
#undef FPS_ADD_FIELD
}

John Koleszar's avatar
John Koleszar committed
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
// Subtracts every field of *frame from the corresponding field of *section.
static void subtract_stats(FIRSTPASS_STATS *section, FIRSTPASS_STATS *frame) {
#define FPS_SUB_FIELD(field) (section->field -= frame->field)
  FPS_SUB_FIELD(frame);
  FPS_SUB_FIELD(intra_error);
  FPS_SUB_FIELD(coded_error);
  FPS_SUB_FIELD(sr_coded_error);
  FPS_SUB_FIELD(ssim_weighted_pred_err);
  FPS_SUB_FIELD(pcnt_inter);
  FPS_SUB_FIELD(pcnt_motion);
  FPS_SUB_FIELD(pcnt_second_ref);
  FPS_SUB_FIELD(pcnt_neutral);
  FPS_SUB_FIELD(MVr);
  FPS_SUB_FIELD(mvr_abs);
  FPS_SUB_FIELD(MVc);
  FPS_SUB_FIELD(mvc_abs);
  FPS_SUB_FIELD(MVrv);
  FPS_SUB_FIELD(MVcv);
  FPS_SUB_FIELD(mv_in_out_count);
  FPS_SUB_FIELD(new_mv_count);
  FPS_SUB_FIELD(count);
  FPS_SUB_FIELD(duration);
#undef FPS_SUB_FIELD
}

John Koleszar's avatar
John Koleszar committed
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
// Converts accumulated totals in *section into per-frame averages by dividing
// by section->count. Does nothing when count is below 1.0. The fields frame,
// new_mv_count and count itself are left untouched.
static void avg_stats(FIRSTPASS_STATS *section) {
  double frames;

  if (section->count < 1.0)
    return;

  // count is never modified below, so it can be read once.
  frames = section->count;

  section->intra_error /= frames;
  section->coded_error /= frames;
  section->sr_coded_error /= frames;
  section->ssim_weighted_pred_err /= frames;

  section->pcnt_inter /= frames;
  section->pcnt_second_ref /= frames;
  section->pcnt_neutral /= frames;
  section->pcnt_motion /= frames;

  section->MVr /= frames;
  section->mvr_abs /= frames;
  section->MVc /= frames;
  section->mvc_abs /= frames;
  section->MVrv /= frames;
  section->MVcv /= frames;
  section->mv_in_out_count /= frames;

  section->duration /= frames;
}

John Koleszar's avatar
John Koleszar committed
253
// Calculate a modified Error used in distributing bits between easier and harder frames
254
static double calculate_modified_err(VP9_COMP *cpi, FIRSTPASS_STATS *this_frame) {
255
256
257
258
259
  const FIRSTPASS_STATS *const stats = &cpi->twopass.total_stats;
  const double av_err = stats->ssim_weighted_pred_err / stats->count;
  const double this_err = this_frame->ssim_weighted_pred_err;
  return av_err * pow(this_err / DOUBLE_DIVIDE_CHECK(av_err),
                      this_err > av_err ? POW1 : POW2);
John Koleszar's avatar
John Koleszar committed
260
261
}

262
// Per-pixel-value weights indexed by an 8 bit sample value:
//   values   0..32  -> 0.02
//   values  33..63  -> (value - 32) / 32, i.e. a linear ramp in 1/32 steps
//   values  64..255 -> 1.0
static const double weight_table[256] = {
  /*   0 */ 0.02, 0.02, 0.02, 0.02, 0.02, 0.02, 0.02, 0.02,
  /*   8 */ 0.02, 0.02, 0.02, 0.02, 0.02, 0.02, 0.02, 0.02,
  /*  16 */ 0.02, 0.02, 0.02, 0.02, 0.02, 0.02, 0.02, 0.02,
  /*  24 */ 0.02, 0.02, 0.02, 0.02, 0.02, 0.02, 0.02, 0.02,
  /*  32 */ 0.02, 0.03125, 0.0625, 0.09375, 0.125, 0.15625, 0.1875, 0.21875,
  /*  40 */ 0.25, 0.28125, 0.3125, 0.34375, 0.375, 0.40625, 0.4375, 0.46875,
  /*  48 */ 0.5, 0.53125, 0.5625, 0.59375, 0.625, 0.65625, 0.6875, 0.71875,
  /*  56 */ 0.75, 0.78125, 0.8125, 0.84375, 0.875, 0.90625, 0.9375, 0.96875,
  /*  64 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /*  72 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /*  80 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /*  88 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /*  96 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 104 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 112 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 120 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 128 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 136 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 144 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 152 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 160 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 168 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 176 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 184 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 192 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 200 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 208 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 216 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 224 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 232 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 240 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0,
  /* 248 */ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0
};

John Koleszar's avatar
John Koleszar committed
297
298
299
// Returns the mean of weight_table[] taken over every sample of the Y plane
// of "source" (y_width x y_height samples, rows y_stride apart).
//
// A plane with a non-positive width or height has no samples; 0.0 is
// returned for it instead of walking memory or dividing by zero.
static double simple_weight(YV12_BUFFER_CONFIG *source) {
  const int width = source->y_width;
  const int height = source->y_height;
  double sum_weights = 0.0;
  int row, col;

  if (width <= 0 || height <= 0)
    return 0.0;

  // Loop through the raw Y plane examining levels and accumulating a weight
  // for the image.
  for (row = 0; row < height; ++row) {
    const uint8_t *src = source->y_buffer + row * source->y_stride;

    for (col = 0; col < width; ++col)
      sum_weights += weight_table[src[col]];
  }

  // The sample count is formed in double so it cannot overflow int.
  return sum_weights / ((double)width * height);
}

320

321
// This function returns the current per frame maximum bitrate target.
322
static int frame_max_bits(VP9_COMP *cpi) {
323
324
325
326
  // Max allocation for a single frame based on the max section guidelines
  // passed in and how many bits are left.
  // For VBR base this on the bits and frames left plus the
  // two_pass_vbrmax_section rate passed in by the user.
327
328
329
  const double max_bits = (1.0 * cpi->twopass.bits_left /
      (cpi->twopass.total_stats.count - cpi->common.current_video_frame)) *
      (cpi->oxcf.two_pass_vbrmax_section / 100.0);
John Koleszar's avatar
John Koleszar committed
330

331
  // Trap case where we are out of bits.
332
  return MAX((int)max_bits, 0);
John Koleszar's avatar
John Koleszar committed
333
334
}

335
// Prepares for a first pass by resetting the running totals kept in
// cpi->twopass.total_stats.
void vp9_init_first_pass(VP9_COMP *cpi) {
  FIRSTPASS_STATS *const totals = &cpi->twopass.total_stats;

  zero_stats(totals);
}

339
// Finishes a first pass by emitting the running totals kept in
// cpi->twopass.total_stats to cpi->output_pkt_list.
void vp9_end_first_pass(VP9_COMP *cpi) {
  FIRSTPASS_STATS *const totals = &cpi->twopass.total_stats;

  output_stats(cpi, cpi->output_pkt_list, totals);
}
John Koleszar's avatar
John Koleszar committed
342

343
// Zero motion (0,0) "search": points plane 0's first prediction buffer at
// recon_buffer's Y plane plus recon_yoffset, then runs the vp9_mse* routine
// selected by the block's sb_type (8x8, 16x8, 8x16, otherwise 16x16) on the
// source block and that buffer. *best_motion_err is passed to the routine as
// its final (unsigned int *) argument; the routine's return value is not
// used.
static void zz_motion_search(VP9_COMP *cpi, MACROBLOCK *x,
                             YV12_BUFFER_CONFIG *recon_buffer,
                             int *best_motion_err, int recon_yoffset) {
  MACROBLOCKD *const xd = &x->e_mbd;
  unsigned int *const err_out = (unsigned int *)(best_motion_err);
  const uint8_t *src;
  const uint8_t *ref;
  int src_stride;
  int ref_stride;

  // Set up pointers for this macro block recon buffer
  xd->plane[0].pre[0].buf = recon_buffer->y_buffer + recon_yoffset;

  src = x->plane[0].src.buf;
  src_stride = x->plane[0].src.stride;
  ref = xd->plane[0].pre[0].buf;
  ref_stride = xd->plane[0].pre[0].stride;

  switch (xd->mode_info_context->mbmi.sb_type) {
    case BLOCK_SIZE_SB8X8:
      vp9_mse8x8(src, src_stride, ref, ref_stride, err_out);
      break;
    case BLOCK_SIZE_SB16X8:
      vp9_mse16x8(src, src_stride, ref, ref_stride, err_out);
      break;
    case BLOCK_SIZE_SB8X16:
      vp9_mse8x16(src, src_stride, ref, ref_stride, err_out);
      break;
    default:
      vp9_mse16x16(src, src_stride, ref, ref_stride, err_out);
      break;
  }
}

// Maps a BLOCK_SIZE_TYPE to the enum BlockSize value of the same dimensions.
// Only 8x8, 16x8 and 8x16 are distinguished; every other input yields
// BLOCK_16X16.
static enum BlockSize get_bs(BLOCK_SIZE_TYPE b) {
  if (b == BLOCK_SIZE_SB8X8)
    return BLOCK_8X8;
  if (b == BLOCK_SIZE_SB16X8)
    return BLOCK_16X8;
  if (b == BLOCK_SIZE_SB8X16)
    return BLOCK_8X16;

  return BLOCK_16X16;
}

386
static void first_pass_motion_search(VP9_COMP *cpi, MACROBLOCK *x,
Scott LaVarnway's avatar
Scott LaVarnway committed
387
388
                                     int_mv *ref_mv, MV *best_mv,
                                     YV12_BUFFER_CONFIG *recon_buffer,
John Koleszar's avatar
John Koleszar committed
389
                                     int *best_motion_err, int recon_yoffset) {
John Koleszar's avatar
John Koleszar committed
390
  MACROBLOCKD *const xd = &x->e_mbd;
John Koleszar's avatar
John Koleszar committed
391
392
393
394
395
396
397
398
399
  int num00;

  int_mv tmp_mv;
  int_mv ref_mv_full;

  int tmp_err;
  int step_param = 3;
  int further_steps = (MAX_MVSEARCH_STEPS - 1) - step_param;
  int n;
400
401
  vp9_variance_fn_ptr_t v_fn_ptr =
      cpi->fn_ptr[get_bs(xd->mode_info_context->mbmi.sb_type)];
John Koleszar's avatar
John Koleszar committed
402
403
  int new_mv_mode_penalty = 256;

404
  int sr = 0;
405
  int quart_frm = MIN(cpi->common.width, cpi->common.height);
406
407
408
409
410
411
412
413
414
415
416

  // refine the motion search range accroding to the frame dimension
  // for first pass test
  while ((quart_frm << sr) < MAX_FULL_PEL_VAL)
    sr++;
  if (sr)
    sr--;

  step_param    += sr;
  further_steps -= sr;

John Koleszar's avatar
John Koleszar committed
417
  // override the default variance function to use MSE
418
419
420
421
422
423
424
425
426
427
428
429
430
431
  switch (xd->mode_info_context->mbmi.sb_type) {
    case BLOCK_SIZE_SB8X8:
      v_fn_ptr.vf = vp9_mse8x8;
      break;
    case BLOCK_SIZE_SB16X8:
      v_fn_ptr.vf = vp9_mse16x8;
      break;
    case BLOCK_SIZE_SB8X16:
      v_fn_ptr.vf = vp9_mse8x16;
      break;
    default:
      v_fn_ptr.vf = vp9_mse16x16;
      break;
  }
John Koleszar's avatar
John Koleszar committed
432
433

  // Set up pointers for this macro block recon buffer
434
  xd->plane[0].pre[0].buf = recon_buffer->y_buffer + recon_yoffset;
John Koleszar's avatar
John Koleszar committed
435
436
437
438
439

  // Initial step/diamond search centred on best mv
  tmp_mv.as_int = 0;
  ref_mv_full.as_mv.col = ref_mv->as_mv.col >> 3;
  ref_mv_full.as_mv.row = ref_mv->as_mv.row >> 3;
John Koleszar's avatar
John Koleszar committed
440
  tmp_err = cpi->diamond_search_sad(x, &ref_mv_full, &tmp_mv, step_param,
John Koleszar's avatar
John Koleszar committed
441
                                    x->sadperbit16, &num00, &v_fn_ptr,
442
443
                                    x->nmvjointcost,
                                    x->mvcost, ref_mv);
John Koleszar's avatar
John Koleszar committed
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
  if (tmp_err < INT_MAX - new_mv_mode_penalty)
    tmp_err += new_mv_mode_penalty;

  if (tmp_err < *best_motion_err) {
    *best_motion_err = tmp_err;
    best_mv->row = tmp_mv.as_mv.row;
    best_mv->col = tmp_mv.as_mv.col;
  }

  // Further step/diamond searches as necessary
  n = num00;
  num00 = 0;

  while (n < further_steps) {
    n++;

    if (num00)
      num00--;
    else {
John Koleszar's avatar
John Koleszar committed
463
      tmp_err = cpi->diamond_search_sad(x, &ref_mv_full, &tmp_mv,
John Koleszar's avatar
John Koleszar committed
464
465
                                        step_param + n, x->sadperbit16,
                                        &num00, &v_fn_ptr,
466
467
                                        x->nmvjointcost,
                                        x->mvcost, ref_mv);
John Koleszar's avatar
John Koleszar committed
468
      if (tmp_err < INT_MAX - new_mv_mode_penalty)
John Koleszar's avatar
John Koleszar committed
469
470
        tmp_err += new_mv_mode_penalty;

John Koleszar's avatar
John Koleszar committed
471
      if (tmp_err < *best_motion_err) {
John Koleszar's avatar
John Koleszar committed
472
        *best_motion_err = tmp_err;
Scott LaVarnway's avatar
Scott LaVarnway committed
473
474
        best_mv->row = tmp_mv.as_mv.row;
        best_mv->col = tmp_mv.as_mv.col;
John Koleszar's avatar
John Koleszar committed
475
      }
John Koleszar's avatar
John Koleszar committed
476
    }
John Koleszar's avatar
John Koleszar committed
477
  }
John Koleszar's avatar
John Koleszar committed
478
479
}

480
void vp9_first_pass(VP9_COMP *cpi) {
John Koleszar's avatar
John Koleszar committed
481
  int mb_row, mb_col;
John Koleszar's avatar
John Koleszar committed
482
  MACROBLOCK *const x = &cpi->mb;
483
  VP9_COMMON *const cm = &cpi->common;
John Koleszar's avatar
John Koleszar committed
484
  MACROBLOCKD *const xd = &x->e_mbd;
John Koleszar's avatar
John Koleszar committed
485
486

  int recon_yoffset, recon_uvoffset;
487
488
489
490
491
492
493
  const int lst_yv12_idx = cm->ref_frame_map[cpi->lst_fb_idx];
  const int gld_yv12_idx = cm->ref_frame_map[cpi->gld_fb_idx];
  YV12_BUFFER_CONFIG *const lst_yv12 = &cm->yv12_fb[lst_yv12_idx];
  YV12_BUFFER_CONFIG *const new_yv12 = &cm->yv12_fb[cm->new_fb_idx];
  YV12_BUFFER_CONFIG *const gld_yv12 = &cm->yv12_fb[gld_yv12_idx];
  const int recon_y_stride = lst_yv12->y_stride;
  const int recon_uv_stride = lst_yv12->uv_stride;
John Koleszar's avatar
John Koleszar committed
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
  int64_t intra_error = 0;
  int64_t coded_error = 0;
  int64_t sr_coded_error = 0;

  int sum_mvr = 0, sum_mvc = 0;
  int sum_mvr_abs = 0, sum_mvc_abs = 0;
  int sum_mvrs = 0, sum_mvcs = 0;
  int mvcount = 0;
  int intercount = 0;
  int second_ref_count = 0;
  int intrapenalty = 256;
  int neutral_count = 0;
  int new_mv_count = 0;
  int sum_in_vectors = 0;
  uint32_t lastmv_as_int = 0;

  int_mv zero_ref_mv;

  zero_ref_mv.as_int = 0;

514
  vp9_clear_system_state();  // __asm emms;
John Koleszar's avatar
John Koleszar committed
515

John Koleszar's avatar
John Koleszar committed
516
  vp9_setup_src_planes(x, cpi->Source, 0, 0);
517
  setup_pre_planes(xd, lst_yv12, NULL, 0, 0, NULL, NULL);
518
  setup_dst_planes(xd, new_yv12, 0, 0);
John Koleszar's avatar
John Koleszar committed
519
520
521
522
523

  x->partition_info = x->pi;

  xd->mode_info_context = cm->mi;

524
  vp9_setup_block_dptrs(&x->e_mbd, cm->subsampling_x, cm->subsampling_y);
John Koleszar's avatar
John Koleszar committed
525

526
  vp9_frame_init_quantizer(cpi);
John Koleszar's avatar
John Koleszar committed
527
528
529
530
531

  // Initialise the MV cost table to the defaults
  // if( cm->current_video_frame == 0)
  // if ( 0 )
  {
532
    vp9_init_mv_probs(cm);
533
    vp9_initialize_rd_consts(cpi, cm->base_qindex + cm->y_dc_delta_q);
John Koleszar's avatar
John Koleszar committed
534
535
536
537
538
539
540
541
542
543
544
545
546
547
  }

  // for each macroblock row in image
  for (mb_row = 0; mb_row < cm->mb_rows; mb_row++) {
    int_mv best_ref_mv;

    best_ref_mv.as_int = 0;

    // reset above block coeffs
    xd->up_available = (mb_row != 0);
    recon_yoffset = (mb_row * recon_y_stride * 16);
    recon_uvoffset = (mb_row * recon_uv_stride * 8);

    // Set up limit values for motion vectors to prevent them extending outside the UMV borders
Jingning Han's avatar
Jingning Han committed
548
    x->mv_row_min = -((mb_row * 16) + (VP9BORDERINPIXELS - 8));
John Koleszar's avatar
John Koleszar committed
549
    x->mv_row_max = ((cm->mb_rows - 1 - mb_row) * 16)
Jingning Han's avatar
Jingning Han committed
550
                    + (VP9BORDERINPIXELS - 8);
John Koleszar's avatar
John Koleszar committed
551
552
553
554
555
556
557

    // for each macroblock col in image
    for (mb_col = 0; mb_col < cm->mb_cols; mb_col++) {
      int this_error;
      int gf_motion_error = INT_MAX;
      int use_dc_pred = (mb_col || mb_row) && (!mb_col || !mb_row);

558
559
560
      xd->plane[0].dst.buf = new_yv12->y_buffer + recon_yoffset;
      xd->plane[1].dst.buf = new_yv12->u_buffer + recon_uvoffset;
      xd->plane[2].dst.buf = new_yv12->v_buffer + recon_uvoffset;
John Koleszar's avatar
John Koleszar committed
561
562
      xd->left_available = (mb_col != 0);

563
564
565
566
567
568
569
570
571
572
573
574
575
      if (mb_col * 2 + 1 < cm->mi_cols) {
        if (mb_row * 2 + 1 < cm->mi_rows) {
          xd->mode_info_context->mbmi.sb_type = BLOCK_SIZE_MB16X16;
        } else {
          xd->mode_info_context->mbmi.sb_type = BLOCK_SIZE_SB16X8;
        }
      } else {
        if (mb_row * 2 + 1 < cm->mi_rows) {
          xd->mode_info_context->mbmi.sb_type = BLOCK_SIZE_SB8X16;
        } else {
          xd->mode_info_context->mbmi.sb_type = BLOCK_SIZE_SB8X8;
        }
      }
Ronald S. Bultje's avatar
Ronald S. Bultje committed
576
      xd->mode_info_context->mbmi.ref_frame[0] = INTRA_FRAME;
577
578
579
580
581
      set_mi_row_col(cm, xd,
                     mb_row << 1,
                     1 << mi_height_log2(xd->mode_info_context->mbmi.sb_type),
                     mb_col << 1,
                     1 << mi_height_log2(xd->mode_info_context->mbmi.sb_type));
Jingning Han's avatar
Jingning Han committed
582

John Koleszar's avatar
John Koleszar committed
583
      // do intra 16x16 prediction
584
      this_error = vp9_encode_intra(cpi, x, use_dc_pred);
John Koleszar's avatar
John Koleszar committed
585
586
587
588
589
590
591
592
593
594
595

      // "intrapenalty" below deals with situations where the intra and inter error scores are very low (eg a plain black frame)
      // We do not have special cases in first pass for 0,0 and nearest etc so all inter modes carry an overhead cost estimate fot the mv.
      // When the error score is very low this causes us to pick all or lots of INTRA modes and throw lots of key frames.
      // This penalty adds a cost matching that of a 0,0 mv to the intra case.
      this_error += intrapenalty;

      // Cumulative intra error total
      intra_error += (int64_t)this_error;

      // Set up limit values for motion vectors to prevent them extending outside the UMV borders
Jingning Han's avatar
Jingning Han committed
596
      x->mv_col_min = -((mb_col * 16) + (VP9BORDERINPIXELS - 8));
John Koleszar's avatar
John Koleszar committed
597
      x->mv_col_max = ((cm->mb_cols - 1 - mb_col) * 16)
Jingning Han's avatar
Jingning Han committed
598
                      + (VP9BORDERINPIXELS - 8);
John Koleszar's avatar
John Koleszar committed
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626

      // Other than for the first frame do a motion search
      if (cm->current_video_frame > 0) {
        int tmp_err;
        int motion_error = INT_MAX;
        int_mv mv, tmp_mv;

        // Simple 0,0 motion with no mv overhead
        zz_motion_search(cpi, x, lst_yv12, &motion_error, recon_yoffset);
        mv.as_int = tmp_mv.as_int = 0;

        // Test last reference frame using the previous best mv as the
        // starting point (best reference) for the search
        first_pass_motion_search(cpi, x, &best_ref_mv,
                                 &mv.as_mv, lst_yv12,
                                 &motion_error, recon_yoffset);

        // If the current best reference mv is not centred on 0,0 then do a 0,0 based search as well
        if (best_ref_mv.as_int) {
          tmp_err = INT_MAX;
          first_pass_motion_search(cpi, x, &zero_ref_mv, &tmp_mv.as_mv,
                                   lst_yv12, &tmp_err, recon_yoffset);

          if (tmp_err < motion_error) {
            motion_error = tmp_err;
            mv.as_int = tmp_mv.as_int;
          }
        }
John Koleszar's avatar
John Koleszar committed
627

John Koleszar's avatar
John Koleszar committed
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
        // Experimental search in an older reference frame
        if (cm->current_video_frame > 1) {
          // Simple 0,0 motion with no mv overhead
          zz_motion_search(cpi, x, gld_yv12,
                           &gf_motion_error, recon_yoffset);

          first_pass_motion_search(cpi, x, &zero_ref_mv,
                                   &tmp_mv.as_mv, gld_yv12,
                                   &gf_motion_error, recon_yoffset);

          if ((gf_motion_error < motion_error) &&
              (gf_motion_error < this_error)) {
            second_ref_count++;
          }

          // Reset to last frame as reference buffer
644
645
646
          xd->plane[0].pre[0].buf = lst_yv12->y_buffer + recon_yoffset;
          xd->plane[1].pre[0].buf = lst_yv12->u_buffer + recon_uvoffset;
          xd->plane[2].pre[0].buf = lst_yv12->v_buffer + recon_uvoffset;
John Koleszar's avatar
John Koleszar committed
647
648
649
650
651
652
653
654
655
656
657

          // In accumulating a score for the older reference frame
          // take the best of the motion predicted score and
          // the intra coded error (just as will be done for)
          // accumulation of "coded_error" for the last frame.
          if (gf_motion_error < this_error)
            sr_coded_error += gf_motion_error;
          else
            sr_coded_error += this_error;
        } else
          sr_coded_error += motion_error;
658

John Koleszar's avatar
John Koleszar committed
659
        /* Intra assumed best */
660
        best_ref_mv.as_int = 0;
John Koleszar's avatar
John Koleszar committed
661

John Koleszar's avatar
John Koleszar committed
662
663
664
665
666
667
668
669
670
671
672
673
674
675
        if (motion_error <= this_error) {
          // Keep a count of cases where the inter and intra were
          // very close and very low. This helps with scene cut
          // detection for example in cropped clips with black bars
          // at the sides or top and bottom.
          if ((((this_error - intrapenalty) * 9) <=
               (motion_error * 10)) &&
              (this_error < (2 * intrapenalty))) {
            neutral_count++;
          }

          mv.as_mv.row <<= 3;
          mv.as_mv.col <<= 3;
          this_error = motion_error;
676
          vp9_set_mbmode_and_mvs(x, NEWMV, &mv);
677
          xd->mode_info_context->mbmi.txfm_size = TX_4X4;
Ronald S. Bultje's avatar
Ronald S. Bultje committed
678
679
          xd->mode_info_context->mbmi.ref_frame[0] = LAST_FRAME;
          xd->mode_info_context->mbmi.ref_frame[1] = NONE;
Jingning Han's avatar
Jingning Han committed
680
681
          vp9_build_inter_predictors_sby(xd, mb_row << 1,
                                         mb_col << 1,
682
683
                                         xd->mode_info_context->mbmi.sb_type);
          vp9_encode_sby(cm, x, xd->mode_info_context->mbmi.sb_type);
John Koleszar's avatar
John Koleszar committed
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
          sum_mvr += mv.as_mv.row;
          sum_mvr_abs += abs(mv.as_mv.row);
          sum_mvc += mv.as_mv.col;
          sum_mvc_abs += abs(mv.as_mv.col);
          sum_mvrs += mv.as_mv.row * mv.as_mv.row;
          sum_mvcs += mv.as_mv.col * mv.as_mv.col;
          intercount++;

          best_ref_mv.as_int = mv.as_int;

          // Was the vector non-zero
          if (mv.as_int) {
            mvcount++;

            // Was it different from the last non zero vector
            if (mv.as_int != lastmv_as_int)
              new_mv_count++;
            lastmv_as_int = mv.as_int;

            // Does the Row vector point inwards or outwards
            if (mb_row < cm->mb_rows / 2) {
              if (mv.as_mv.row > 0)
                sum_in_vectors--;
              else if (mv.as_mv.row < 0)
                sum_in_vectors++;
            } else if (mb_row > cm->mb_rows / 2) {
              if (mv.as_mv.row > 0)
                sum_in_vectors++;
              else if (mv.as_mv.row < 0)
                sum_in_vectors--;
John Koleszar's avatar
John Koleszar committed
714
715
            }

John Koleszar's avatar
John Koleszar committed
716
717
718
719
720
721
722
723
724
725
726
727
728
            // Does the Col vector point inwards or outwards
            if (mb_col < cm->mb_cols / 2) {
              if (mv.as_mv.col > 0)
                sum_in_vectors--;
              else if (mv.as_mv.col < 0)
                sum_in_vectors++;
            } else if (mb_col > cm->mb_cols / 2) {
              if (mv.as_mv.col > 0)
                sum_in_vectors++;
              else if (mv.as_mv.col < 0)
                sum_in_vectors--;
            }
          }
John Koleszar's avatar
John Koleszar committed
729
        }
John Koleszar's avatar
John Koleszar committed
730
731
      } else
        sr_coded_error += (int64_t)this_error;
John Koleszar's avatar
John Koleszar committed
732

John Koleszar's avatar
John Koleszar committed
733
      coded_error += (int64_t)this_error;
John Koleszar's avatar
John Koleszar committed
734

John Koleszar's avatar
John Koleszar committed
735
      // adjust to the next column of macroblocks
John Koleszar's avatar
John Koleszar committed
736
737
738
      x->plane[0].src.buf += 16;
      x->plane[1].src.buf += 8;
      x->plane[2].src.buf += 8;
John Koleszar's avatar
John Koleszar committed
739

John Koleszar's avatar
John Koleszar committed
740
741
      recon_yoffset += 16;
      recon_uvoffset += 8;
John Koleszar's avatar
John Koleszar committed
742
743
    }

John Koleszar's avatar
John Koleszar committed
744
    // adjust to the next row of mbs
John Koleszar's avatar
John Koleszar committed
745
746
747
    x->plane[0].src.buf += 16 * x->plane[0].src.stride - 16 * cm->mb_cols;
    x->plane[1].src.buf += 8 * x->plane[1].src.stride - 8 * cm->mb_cols;
    x->plane[2].src.buf += 8 * x->plane[1].src.stride - 8 * cm->mb_cols;
John Koleszar's avatar
John Koleszar committed
748

749
    vp9_clear_system_state();  // __asm emms;
John Koleszar's avatar
John Koleszar committed
750
751
  }

752
  vp9_clear_system_state();  // __asm emms;
John Koleszar's avatar
John Koleszar committed
753
754
755
756
757
758
  {
    double weight = 0.0;

    FIRSTPASS_STATS fps;

    fps.frame      = cm->current_video_frame;
759
760
761
    fps.intra_error = (double)(intra_error >> 8);
    fps.coded_error = (double)(coded_error >> 8);
    fps.sr_coded_error = (double)(sr_coded_error >> 8);
John Koleszar's avatar
John Koleszar committed
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
    weight = simple_weight(cpi->Source);


    if (weight < 0.1)
      weight = 0.1;

    fps.ssim_weighted_pred_err = fps.coded_error * weight;

    fps.pcnt_inter  = 0.0;
    fps.pcnt_motion = 0.0;
    fps.MVr        = 0.0;
    fps.mvr_abs     = 0.0;
    fps.MVc        = 0.0;
    fps.mvc_abs     = 0.0;
    fps.MVrv       = 0.0;
    fps.MVcv       = 0.0;
    fps.mv_in_out_count  = 0.0;
    fps.new_mv_count = 0.0;
    fps.count      = 1.0;

    fps.pcnt_inter   = 1.0 * (double)intercount / cm->MBs;
    fps.pcnt_second_ref = 1.0 * (double)second_ref_count / cm->MBs;
    fps.pcnt_neutral = 1.0 * (double)neutral_count / cm->MBs;

    if (mvcount > 0) {
      fps.MVr = (double)sum_mvr / (double)mvcount;
      fps.mvr_abs = (double)sum_mvr_abs / (double)mvcount;
      fps.MVc = (double)sum_mvc / (double)mvcount;
      fps.mvc_abs = (double)sum_mvc_abs / (double)mvcount;
      fps.MVrv = ((double)sum_mvrs - (fps.MVr * fps.MVr / (double)mvcount)) / (double)mvcount;
      fps.MVcv = ((double)sum_mvcs - (fps.MVc * fps.MVc / (double)mvcount)) / (double)mvcount;
      fps.mv_in_out_count = (double)sum_in_vectors / (double)(mvcount * 2);
      fps.new_mv_count = new_mv_count;

      fps.pcnt_motion = 1.0 * (double)mvcount / cpi->common.MBs;
Paul Wilkins's avatar
Paul Wilkins committed
797
    }
John Koleszar's avatar
John Koleszar committed
798

John Koleszar's avatar
John Koleszar committed
799
    // TODO:  handle the case when duration is set to 0, or something less
800
    // than the full time between subsequent values of cpi->source_time_stamp.
801
802
    fps.duration = (double)(cpi->source->ts_end
                            - cpi->source->ts_start);
John Koleszar's avatar
John Koleszar committed
803
804

    // don't want to do output stats with a stack variable!
805
    cpi->twopass.this_frame_stats = fps;
806
807
    output_stats(cpi, cpi->output_pkt_list, &cpi->twopass.this_frame_stats);
    accumulate_stats(&cpi->twopass.total_stats, &fps);
John Koleszar's avatar
John Koleszar committed
808
809
810
811
812
813
  }

  // Copy the previous Last Frame back into gf and arf buffers if
  // the prediction is good enough... but also don't allow it to lag too far
  if ((cpi->twopass.sr_update_lag > 3) ||
      ((cm->current_video_frame > 0) &&
814
815
816
       (cpi->twopass.this_frame_stats.pcnt_inter > 0.20) &&
       ((cpi->twopass.this_frame_stats.intra_error /
         DOUBLE_DIVIDE_CHECK(cpi->twopass.this_frame_stats.coded_error)) >
817
        2.0))) {
John Koleszar's avatar
John Koleszar committed
818
    vp8_yv12_copy_frame(lst_yv12, gld_yv12);
John Koleszar's avatar
John Koleszar committed
819
820
821
    cpi->twopass.sr_update_lag = 1;
  } else
    cpi->twopass.sr_update_lag++;
John Koleszar's avatar
John Koleszar committed
822

John Koleszar's avatar
John Koleszar committed
823
  // swap frame pointers so last frame refers to the frame we just compressed
824
825
  swap_yv12(lst_yv12, new_yv12);

John Koleszar's avatar
John Koleszar committed
826
  vp9_extend_frame_borders(lst_yv12, cm->subsampling_x, cm->subsampling_y);
John Koleszar's avatar
John Koleszar committed
827

John Koleszar's avatar
John Koleszar committed
828
  // Special case for the first frame. Copy into the GF buffer as a second reference.
829
  if (cm->current_video_frame == 0)
John Koleszar's avatar
John Koleszar committed
830
    vp8_yv12_copy_frame(lst_yv12, gld_yv12);
John Koleszar's avatar
John Koleszar committed
831

John Koleszar's avatar
John Koleszar committed
832
833
834
835
836
  // use this to see what the first pass reconstruction looks like
  if (0) {
    char filename[512];
    FILE *recon_file;
    sprintf(filename, "enc%04d.yuv", (int) cm->current_video_frame);
John Koleszar's avatar
John Koleszar committed
837

John Koleszar's avatar
John Koleszar committed
838
839
840
841
842
    if (cm->current_video_frame == 0)
      recon_file = fopen(filename, "wb");
    else
      recon_file = fopen(filename, "ab");

Frank Galligan's avatar
Frank Galligan committed
843
    (void)fwrite(lst_yv12->buffer_alloc, lst_yv12->frame_size, 1, recon_file);
John Koleszar's avatar
John Koleszar committed
844
845
    fclose(recon_file);
  }
John Koleszar's avatar
John Koleszar committed
846

John Koleszar's avatar
John Koleszar committed
847
  cm->current_video_frame++;
John Koleszar's avatar
John Koleszar committed
848
849
850

}

851
852
853
854
855
856
// Estimate a cost per mb attributable to overheads such as the coding of
// modes and motion vectors.
// Currently simplistic in its assumptions for testing.
//


857
static double bitcost(double prob) {
John Koleszar's avatar
John Koleszar committed
858
  return -(log(prob) / log(2.0));
859
}
860

861
static int64_t estimate_modemvcost(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
862
                                     FIRSTPASS_STATS *fpstats) {
863
#if 0
John Koleszar's avatar
John Koleszar committed
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
  int mv_cost;
  int mode_cost;

  double av_pct_inter = fpstats->pcnt_inter / fpstats->count;
  double av_pct_motion = fpstats->pcnt_motion / fpstats->count;
  double av_intra = (1.0 - av_pct_inter);

  double zz_cost;
  double motion_cost;
  double intra_cost;

  zz_cost = bitcost(av_pct_inter - av_pct_motion);
  motion_cost = bitcost(av_pct_motion);
  intra_cost = bitcost(av_intra);

  // Estimate of extra bits per mv overhead for mbs
880
  // << 9 is the normalization to the (bits * 512) used in vp9_bits_per_mb
John Koleszar's avatar
John Koleszar committed
881
882
883
  mv_cost = ((int)(fpstats->new_mv_count / fpstats->count) * 8) << 9;

  // Crude estimate of overhead cost from modes
884
  // << 9 is the normalization to (bits * 512) used in vp9_bits_per_mb
John Koleszar's avatar
John Koleszar committed
885
886
887
888
889
890
891
  mode_cost =
    (int)((((av_pct_inter - av_pct_motion) * zz_cost) +
           (av_pct_motion * motion_cost) +
           (av_intra * intra_cost)) * cpi->common.MBs) << 9;

  // return mv_cost + mode_cost;
  // TODO PGW Fix overhead costs for extended Q range
892
#endif
John Koleszar's avatar
John Koleszar committed
893
  return 0;
894
895
}

John Koleszar's avatar
John Koleszar committed
896
897
898
899
// Computes a correction factor from an error-per-MB figure and a quantizer
// index: (err_per_mb / err_divisor) raised to a quantizer dependent power,
// with the result passed through fclamp() using bounds 0.05 and 5.0.
//
//   err_per_mb   numerator of the error term
//   err_divisor  denominator of the error term
//   pt_low       offset added to the quantizer derived power
//   pt_high      upper limit applied to the power (via MIN)
//   q            quantizer index handed to vp9_convert_qindex_to_q()
static double calc_correction_factor(double err_per_mb,
                                     double err_divisor,
                                     double pt_low,
                                     double pt_high,
                                     int q) {
  const double error_term = err_per_mb / err_divisor;

  // The power grows with the actual quantizer value (not the index) and is
  // capped at pt_high.
  const double q_based_power = vp9_convert_qindex_to_q(q) * 0.01 + pt_low;
  const double power_term = MIN(q_based_power, pt_high);

  // Debug-only sanity check on the base of the fractional power below.
  if (power_term < 1.0) {
    assert(error_term >= 0.0);
  }

  return fclamp(pow(error_term, power_term), 0.05, 5.0);
}

Paul Wilkins's avatar
Paul Wilkins committed
914
915
// Given a current maxQ value sets a range for future values.
// PGW TODO..
916
// This code removes direct dependency on QIndex to determine the range
Paul Wilkins's avatar
Paul Wilkins committed
917
// (now uses the actual quantizer) but has not been tuned.
918
static void adjust_maxq_qrange(VP9_COMP *cpi) {
John Koleszar's avatar
John Koleszar committed
919
920
  int i;
  // Set the max corresponding to cpi->avg_q * 2.0
921
  double q = cpi->avg_q * 2.0;
John Koleszar's avatar
John Koleszar committed
922
923
924
  cpi->twopass.maxq_max_limit = cpi->worst_quality;
  for (i = cpi->best_quality; i <= cpi->worst_quality; i++) {
    cpi->twopass.maxq_max_limit = i;
925
    if (vp9_convert_qindex_to_q(i) >= q)
John Koleszar's avatar
John Koleszar committed
926
927
928
929
930
931
932
933
      break;
  }

  // Set the min corresponding to cpi->avg_q * 0.5
  q = cpi->avg_q * 0.5;
  cpi->twopass.maxq_min_limit = cpi->best_quality;
  for (i = cpi->worst_quality; i >= cpi->best_quality; i--) {
    cpi->twopass.maxq_min_limit = i;
934
    if (vp9_convert_qindex_to_q(i) <= q)
John Koleszar's avatar
John Koleszar committed
935
936
      break;
  }
Paul Wilkins's avatar
Paul Wilkins committed
937
}
Paul Wilkins's avatar
Paul Wilkins committed
938

939
static int estimate_max_q(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
940
                          FIRSTPASS_STATS *fpstats,
941
                          int section_target_bandwitdh) {
942
  int q;
John Koleszar's avatar
John Koleszar committed
943
944
945
  int num_mbs = cpi->common.MBs;
  int target_norm_bits_per_mb;

946
  double section_err = fpstats->coded_error / fpstats->count;
John Koleszar's avatar
John Koleszar committed
947
948
949
950
951
952
953
954
  double sr_correction;
  double err_per_mb = section_err / num_mbs;
  double err_correction_factor;
  double speed_correction = 1.0;

  if (section_target_bandwitdh <= 0)
    return cpi->twopass.maxq_max_limit;          // Highest value allowed

955
956
957
  target_norm_bits_per_mb = section_target_bandwitdh < (1 << 20)
                              ? (512 * section_target_bandwitdh) / num_mbs
                              : 512 * (section_target_bandwitdh / num_mbs);
John Koleszar's avatar
John Koleszar committed
958
959
960

  // Look at the drop in prediction quality between the last frame
  // and the GF buffer (which contained an older frame).
John Koleszar's avatar
John Koleszar committed
961
  if (fpstats->sr_coded_error > fpstats->coded_error) {
962
963
964
    double sr_err_diff = (fpstats->sr_coded_error - fpstats->coded_error) /
                             (fpstats->count * cpi->common.MBs);
    sr_correction = fclamp(pow(sr_err_diff / 32.0, 0.25), 0.75, 1.25);
John Koleszar's avatar
John Koleszar committed
965
  } else {
John Koleszar's avatar
John Koleszar committed
966
    sr_correction = 0.75;
John Koleszar's avatar
John Koleszar committed
967
  }
John Koleszar's avatar
John Koleszar committed
968
969
970

  // Calculate a corrective factor based on a rolling ratio of bits spent
  // vs target bits
971
972
973
974
  if (cpi->rolling_target_bits > 0 &&
      cpi->active_worst_quality < cpi->worst_quality) {
    double rolling_ratio = (double)cpi->rolling_actual_bits /
                               (double)cpi->rolling_target_bits;
John Koleszar's avatar
John Koleszar committed
975
976
977
978
979
980

    if (rolling_ratio < 0.95)
      cpi->twopass.est_max_qcorrection_factor -= 0.005;
    else if (rolling_ratio > 1.05)
      cpi->twopass.est_max_qcorrection_factor += 0.005;

981
982
    cpi->twopass.est_max_qcorrection_factor = fclamp(
        cpi->twopass.est_max_qcorrection_factor, 0.1, 10.0);
John Koleszar's avatar
John Koleszar committed
983
984
985
986
  }

  // Corrections for higher compression speed settings
  // (reduced compression expected)
987
988
  // FIXME(jimbankoski): Once we settle on vp9 speed features we need to
  // change this code.
989
990
  if (cpi->compressor_speed == 1)
    speed_correction = cpi->oxcf.cpu_used <= 5 ?
991
                          1.04 + (/*cpi->oxcf.cpu_used*/0 * 0.04) :
992
                          1.25;
John Koleszar's avatar
John Koleszar committed
993
994
995

  // Try and pick a max Q that will be high enough to encode the
  // content at the given rate.
996
  for (q = cpi->twopass.maxq_min_limit; q < cpi->twopass.maxq_max_limit; q++) {
John Koleszar's avatar
John Koleszar committed
997
998
    int bits_per_mb_at_this_q;

999
1000
1001
1002
    err_correction_factor = calc_correction_factor(err_per_mb,
                                                   ERR_DIVISOR, 0.4, 0.90, q) *
                                sr_correction * speed_correction *
                                cpi->twopass.est_max_qcorrection_factor;
John Koleszar's avatar
John Koleszar committed
1003

1004
1005
    bits_per_mb_at_this_q = vp9_bits_per_mb(INTER_FRAME, q,
                                            err_correction_factor);
John Koleszar's avatar
John Koleszar committed
1006
1007
1008
1009
1010
1011

    if (bits_per_mb_at_this_q <= target_norm_bits_per_mb)
      break;
  }

  // Restriction on active max q for constrained quality mode.
1012
1013
1014
  if (cpi->oxcf.end_usage == USAGE_CONSTRAINED_QUALITY &&
      q < cpi->cq_target_quality)
    q = cpi->cq_target_quality;
John Koleszar's avatar
John Koleszar committed
1015
1016

  // Adjust maxq_min_limit and maxq_max_limit limits based on
1017
  // average q observed in clip for non kf/gf/arf frames
John Koleszar's avatar
John Koleszar committed
1018
1019
  // Give average a chance to settle though.
  // PGW TODO.. This code is broken for the extended Q range
1020
1021
  if (cpi->ni_frames > ((int)cpi->twopass.total_stats.count >> 8) &&
      cpi->ni_frames > 25)
John Koleszar's avatar
John Koleszar committed
1022
1023
    adjust_maxq_qrange(cpi);

1024
  return q;
John Koleszar's avatar
John Koleszar committed
1025
}
1026
1027
1028

// For cq mode estimate a cq level that matches the observed
// complexity and data rate.
1029
static int estimate_cq(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
1030
                       FIRSTPASS_STATS *fpstats,
1031
                       int section_target_bandwitdh) {
1032
  int q;
John Koleszar's avatar
John Koleszar committed
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
  int num_mbs = cpi->common.MBs;
  int target_norm_bits_per_mb;

  double section_err = (fpstats->coded_error / fpstats->count);
  double err_per_mb = section_err / num_mbs;
  double err_correction_factor;
  double sr_err_diff;
  double sr_correction;
  double speed_correction = 1.0;
  double clip_iiratio;
  double clip_iifactor;

  target_norm_bits_per_mb = (section_target_bandwitdh < (1 << 20))
                            ? (512 * section_target_bandwitdh) / num_mbs
                            : 512 * (section_target_bandwitdh / num_mbs);


  // Corrections for higher compression speed settings
  // (reduced compression expected)
  if (cpi->compressor_speed == 1) {
    if (cpi->oxcf.cpu_used <= 5)
1054
      speed_correction = 1.04 + (/*cpi->oxcf.cpu_used*/ 0 * 0.04);
John Koleszar's avatar
John Koleszar committed
1055
1056
1057
1058
1059
1060
    else
      speed_correction = 1.25;
  }

  // Look at the drop in prediction quality between the last frame
  // and the GF buffer (which contained an older frame).
John Koleszar's avatar
John Koleszar committed
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
  if (fpstats->sr_coded_error > fpstats->coded_error) {
    sr_err_diff =
      (fpstats->sr_coded_error - fpstats->coded_error) /
      (fpstats->count * cpi->common.MBs);
    sr_correction = (sr_err_diff / 32.0);
    sr_correction = pow(sr_correction, 0.25);
    if (sr_correction < 0.75)
      sr_correction = 0.75;
    else if (sr_correction > 1.25)
      sr_correction = 1.25;
  } else {
John Koleszar's avatar
John Koleszar committed
1072
    sr_correction = 0.75;
John Koleszar's avatar
John Koleszar committed
1073
  }
John Koleszar's avatar
John Koleszar committed
1074
1075

  // II ratio correction factor for clip as a whole
1076
1077
  clip_iiratio = cpi->twopass.total_stats.intra_error /
                 DOUBLE_DIVIDE_CHECK(cpi->twopass.total_stats.coded_error);
John Koleszar's avatar
John Koleszar committed
1078
1079
1080
1081
1082
  clip_iifactor = 1.0 - ((clip_iiratio - 10.0) * 0.025);
  if (clip_iifactor < 0.80)
    clip_iifactor = 0.80;

  // Try and pick a Q that can encode the content at the given rate.
1083
  for (q = 0; q < MAXQ; q++) {
John Koleszar's avatar
John Koleszar committed
1084
1085
1086
1087
    int bits_per_mb_at_this_q;

    // Error per MB based correction factor
    err_correction_factor =
1088
      calc_correction_factor(err_per_mb, 100.0, 0.4, 0.90, q) *
John Koleszar's avatar
John Koleszar committed
1089
1090
1091
      sr_correction * speed_correction * clip_iifactor;

    bits_per_mb_at_this_q =
1092
      vp9_bits_per_mb(INTER_FRAME, q, err_correction_factor);
1093

John Koleszar's avatar
John Koleszar committed
1094
1095
1096
    if (bits_per_mb_at_this_q <= target_norm_bits_per_mb)
      break;
  }
1097

John Koleszar's avatar
John Koleszar committed
1098
  // Clip value to range "best allowed to (worst allowed - 1)"
1099
1100
1101
1102
1103
  q = select_cq_level(q);
  if (q >= cpi->worst_quality)
    q = cpi->worst_quality - 1;
  if (q < cpi->best_quality)
    q = cpi->best_quality;
1104

1105
  return q;
1106
1107
}

Paul Wilkins's avatar
CQ Mode    
Paul Wilkins committed
1108

1109
extern void vp9_new_frame_rate(VP9_COMP *cpi, double framerate);
John Koleszar's avatar
John Koleszar committed
1110

1111
void vp9_init_second_pass(VP9_COMP *cpi) {
John Koleszar's avatar
John Koleszar committed
1112
1113
  FIRSTPASS_STATS this_frame;
  FIRSTPASS_STATS *start_pos;
John Koleszar's avatar
John Koleszar committed
1114

John Koleszar's avatar
John Koleszar committed
1115
1116
1117
  double lower_bounds_min_rate = FRAME_OVERHEAD_BITS * cpi->oxcf.frame_rate;
  double two_pass_min_rate = (double)(cpi->oxcf.target_bandwidth
                                      * cpi->oxcf.two_pass_vbrmin_section / 100);
1118

John Koleszar's avatar
John Koleszar committed
1119
1120
  if (two_pass_min_rate < lower_bounds_min_rate)
    two_pass_min_rate = lower_bounds_min_rate;
John Koleszar's avatar
John Koleszar committed
1121

1122
1123
  zero_stats(&cpi->twopass.total_stats);
  zero_stats(&cpi->twopass.total_left_stats);
John Koleszar's avatar
John Koleszar committed
1124

John Koleszar's avatar
John Koleszar committed
1125
1126
  if (!cpi->twopass.stats_in_end)
    return;
John Koleszar's avatar
John Koleszar committed
1127

1128
1129
  cpi->twopass.total_stats = *cpi->twopass.stats_in_end;
  cpi->twopass.total_left_stats = cpi->twopass.total_stats;
John Koleszar's avatar
John Koleszar committed
1130

John Koleszar's avatar
John Koleszar committed
1131
1132
1133
1134
1135
  // each frame can have a different duration, as the frame rate in the source
  // isn't guaranteed to be constant.   The frame rate prior to the first frame
  // encoded in the second pass is a guess.  However the sum duration is not.
  // Its calculated based on the actual durations of all frames from the first
  // pass.
1136
1137
  vp9_new_frame_rate(cpi, 10000000.0 * cpi->twopass.total_stats.count /
                       cpi->twopass.total_stats.duration);
John Koleszar's avatar
John Koleszar committed
1138

John Koleszar's avatar
John Koleszar committed
1139
  cpi->output_frame_rate = cpi->oxcf.frame_rate;
1140
  cpi->twopass.bits_left = (int64_t)(cpi->twopass.total_stats.duration *
1141
                                     cpi->oxcf.target_bandwidth / 10000000.0);
1142
  cpi->twopass.bits_left -= (int64_t)(cpi->twopass.total_stats.duration *
1143
                                      two_pass_min_rate / 10000000.0);
Paul Wilkins's avatar
Paul Wilkins committed
1144

John Koleszar's avatar
John Koleszar committed
1145
1146
1147
1148
1149
1150
  // Calculate a minimum intra value to be used in determining the IIratio
  // scores used in the second pass. We have this minimum to make sure
  // that clips that are static but "low complexity" in the intra domain
  // are still boosted appropriately for KF/GF/ARF
  cpi->twopass.kf_intra_err_min = KF_MB_INTRA_MIN * cpi->common.MBs;
  cpi->twopass.gf_intra_err_min = GF_MB_INTRA_MIN * cpi->common.MBs;
John Koleszar's avatar
John Koleszar committed
1151

John Koleszar's avatar
John Koleszar committed
1152
1153
  // This variable monitors how far behind the second ref update is lagging
  cpi->twopass.sr_update_lag = 1;
John Koleszar's avatar
John Koleszar committed
1154

John Koleszar's avatar
John Koleszar committed
1155
1156
1157
1158
  // Scan the first pass file and calculate an average Intra / Inter error score ratio for the sequence
  {
    double sum_iiratio = 0.0;
    double IIRatio;
John Koleszar's avatar
John Koleszar committed
1159

John Koleszar's avatar
John Koleszar committed
1160
    start_pos = cpi->twopass.stats_in;               // Note starting "file" position
John Koleszar's avatar
John Koleszar committed
1161