/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

#include "math.h"
#include "limits.h"
13
14
15
16
17
18
19
#include "vp9_block.h"
#include "vp9_onyx_int.h"
#include "vp9_variance.h"
#include "vp9_encodeintra.h"
#include "vp9/common/vp9_setupintrarecon.h"
#include "vp9_mcomp.h"
#include "vp9_firstpass.h"
John Koleszar's avatar
John Koleszar committed
20
#include "vpx_scale/vpxscale.h"
21
22
23
24
#include "vp9/encoder/vp9_encodeframe.h"
#include "vp9_encodemb.h"
#include "vp9/common/vp9_extend.h"
#include "vp9/common/vp9_systemdependent.h"
John Koleszar's avatar
John Koleszar committed
25
#include "vpx_mem/vpx_mem.h"
26
#include "vp9/common/vp9_swapyv12buffer.h"
John Koleszar's avatar
John Koleszar committed
27
#include <stdio.h>
28
29
30
31
32
33
#include "vp9/encoder/vp9_quantize.h"
#include "vp9_rdopt.h"
#include "vp9_ratectrl.h"
#include "vp9/common/vp9_quant_common.h"
#include "vp9/common/vp9_entropymv.h"
#include "vp9_encodemv.h"
John Koleszar's avatar
John Koleszar committed
34

35
// Set to 1 to make output_stats() also append each stats record to the
// text file "firstpass.stt" (debug aid).
#define OUTPUT_FPF 0

#if CONFIG_RUNTIME_CPU_DETECT
#define IF_RTCD(x) (x)
#else
#define IF_RTCD(x) NULL
#endif

// Tuning constants. Their consumers are outside the part of the file
// reviewed here, so no semantics are asserted for them.
#define IIFACTOR   12.5
#define IIKFACTOR1 12.5
#define IIKFACTOR2 15.0
#define RMAX       128.0
#define GF_RMAX    96.0
#define ERR_DIVISOR   150.0

#define KF_MB_INTRA_MIN 300
#define GF_MB_INTRA_MIN 200

// Nudges X away from zero by 0.000001 so it can safely be used as a divisor.
// X is evaluated more than once: do not pass expressions with side effects.
#define DOUBLE_DIVIDE_CHECK(X) ((X) < 0 ? (X) - .000001 : (X) + .000001)

// Exponents used by calculate_modified_err(). Both expand to
// two_pass_vbrbias / 100 and require a variable named "cpi" in scope.
// The expansions are fully parenthesized so they keep their value when used
// inside a larger expression (e.g. "1.0 / POW1").
#define POW1 ((double)cpi->oxcf.two_pass_vbrbias / 100.0)
#define POW2 ((double)cpi->oxcf.two_pass_vbrbias / 100.0)

58
static void find_next_key_frame(VP9_COMP *cpi, FIRSTPASS_STATS *this_frame);
Paul Wilkins's avatar
Paul Wilkins committed
59

John Koleszar's avatar
John Koleszar committed
60
61
62
// Derives a CQ level (a q index) from the supplied q index.
//
// The value vp9_convert_qindex_to_q(qindex) is scaled by 0.5847 and offset
// by 1.0 to form a target; the function returns the lowest index in
// [0, QINDEX_RANGE) whose vp9_convert_qindex_to_q() value is at least that
// target. If no index qualifies, QINDEX_RANGE - 1 is returned.
static int select_cq_level(int qindex) {
  const double target_q = (vp9_convert_qindex_to_q(qindex) * 0.5847) + 1.0;
  int i;

  for (i = 0; i < QINDEX_RANGE; i++) {
    if (target_q <= vp9_convert_qindex_to_q(i))
      return i;
  }

  return QINDEX_RANGE - 1;
}
Paul Wilkins's avatar
CQ Mode    
Paul Wilkins committed
75

John Koleszar's avatar
John Koleszar committed
76
77

// Resets the first pass file to the given position using a relative seek from the current position
78
static void reset_fpf_position(VP9_COMP *cpi, FIRSTPASS_STATS *Position) {
John Koleszar's avatar
John Koleszar committed
79
  cpi->twopass.stats_in = Position;
John Koleszar's avatar
John Koleszar committed
80
81
}

82
// Peeks at the stats entry at the current read position.
//
// Copies the entry into *next_frame without advancing the read position.
// Returns 1 on success, or EOF (leaving *next_frame untouched) when the read
// position is at or beyond cpi->twopass.stats_in_end.
static int lookup_next_frame_stats(VP9_COMP *cpi, FIRSTPASS_STATS *next_frame) {
  if (cpi->twopass.stats_in >= cpi->twopass.stats_in_end)
    return EOF;

  *next_frame = *cpi->twopass.stats_in;
  return 1;
}

90
// Read frame stats at an offset from the current position
91
static int read_frame_stats(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
                            FIRSTPASS_STATS *frame_stats,
                            int offset) {
  FIRSTPASS_STATS *fps_ptr = cpi->twopass.stats_in;

  // Check legality of offset
  if (offset >= 0) {
    if (&fps_ptr[offset] >= cpi->twopass.stats_in_end)
      return EOF;
  } else if (offset < 0) {
    if (&fps_ptr[offset] < cpi->twopass.stats_in_start)
      return EOF;
  }

  *frame_stats = fps_ptr[offset];
  return 1;
107
108
}

109
// Reads the stats entry at the current read position and advances past it.
//
// Copies the entry into *fps and moves cpi->twopass.stats_in forward by one
// FIRSTPASS_STATS element. Returns 1 on success, or EOF (leaving *fps and the
// read position untouched) when the position is at or beyond stats_in_end.
static int input_stats(VP9_COMP *cpi, FIRSTPASS_STATS *fps) {
  if (cpi->twopass.stats_in >= cpi->twopass.stats_in_end)
    return EOF;

  *fps = *cpi->twopass.stats_in;
  // stats_in is dereferenced as a FIRSTPASS_STATS above, so a typed increment
  // advances by exactly sizeof(FIRSTPASS_STATS) bytes.
  cpi->twopass.stats_in++;
  return 1;
}

119
static void output_stats(const VP9_COMP            *cpi,
120
                         struct vpx_codec_pkt_list *pktlist,
John Koleszar's avatar
John Koleszar committed
121
122
123
124
125
126
                         FIRSTPASS_STATS            *stats) {
  struct vpx_codec_cx_pkt pkt;
  pkt.kind = VPX_CODEC_STATS_PKT;
  pkt.data.twopass_stats.buf = stats;
  pkt.data.twopass_stats.sz = sizeof(FIRSTPASS_STATS);
  vpx_codec_pkt_list_add(pktlist, &pkt);
127
128
129
130

// TEMP debug code
#if OUTPUT_FPF

John Koleszar's avatar
John Koleszar committed
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
  {
    FILE *fpfile;
    fpfile = fopen("firstpass.stt", "a");

    fprintf(fpfile, "%12.0f %12.0f %12.0f %12.0f %12.0f %12.4f %12.4f"
            "%12.4f %12.4f %12.4f %12.4f %12.4f %12.4f %12.4f"
            "%12.0f %12.0f %12.4f %12.0f %12.0f %12.4f\n",
            stats->frame,
            stats->intra_error,
            stats->coded_error,
            stats->sr_coded_error,
            stats->ssim_weighted_pred_err,
            stats->pcnt_inter,
            stats->pcnt_motion,
            stats->pcnt_second_ref,
            stats->pcnt_neutral,
            stats->MVr,
            stats->mvr_abs,
            stats->MVc,
            stats->mvc_abs,
            stats->MVrv,
            stats->MVcv,
            stats->mv_in_out_count,
            stats->new_mv_count,
            stats->count,
            stats->duration);
    fclose(fpfile);
  }
159
160
161
#endif
}

John Koleszar's avatar
John Koleszar committed
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
// Resets a stats record: every field is set to 0.0 except duration, which is
// set to 1.0.
// NOTE(review): the non-zero duration is presumably there so that later
// divisions by duration are safe - confirm with the callers.
static void zero_stats(FIRSTPASS_STATS *section) {
  section->frame                  = 0.0;
  section->intra_error            = 0.0;
  section->coded_error            = 0.0;
  section->sr_coded_error         = 0.0;
  section->ssim_weighted_pred_err = 0.0;
  section->pcnt_inter             = 0.0;
  section->pcnt_motion            = 0.0;
  section->pcnt_second_ref        = 0.0;
  section->pcnt_neutral           = 0.0;
  section->MVr                    = 0.0;
  section->mvr_abs                = 0.0;
  section->MVc                    = 0.0;
  section->mvc_abs                = 0.0;
  section->MVrv                   = 0.0;
  section->MVcv                   = 0.0;
  section->mv_in_out_count        = 0.0;
  section->new_mv_count           = 0.0;
  section->count                  = 0.0;
  section->duration               = 1.0;
}

John Koleszar's avatar
John Koleszar committed
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
// Adds every field of *frame to the corresponding field of *section.
// *frame is only read.
static void accumulate_stats(FIRSTPASS_STATS *section, FIRSTPASS_STATS *frame) {
  section->frame                  += frame->frame;
  section->intra_error            += frame->intra_error;
  section->coded_error            += frame->coded_error;
  section->sr_coded_error         += frame->sr_coded_error;
  section->ssim_weighted_pred_err += frame->ssim_weighted_pred_err;
  section->pcnt_inter             += frame->pcnt_inter;
  section->pcnt_motion            += frame->pcnt_motion;
  section->pcnt_second_ref        += frame->pcnt_second_ref;
  section->pcnt_neutral           += frame->pcnt_neutral;
  section->MVr                    += frame->MVr;
  section->mvr_abs                += frame->mvr_abs;
  section->MVc                    += frame->MVc;
  section->mvc_abs                += frame->mvc_abs;
  section->MVrv                   += frame->MVrv;
  section->MVcv                   += frame->MVcv;
  section->mv_in_out_count        += frame->mv_in_out_count;
  section->new_mv_count           += frame->new_mv_count;
  section->count                  += frame->count;
  section->duration               += frame->duration;
}

John Koleszar's avatar
John Koleszar committed
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
// Subtracts every field of *frame from the corresponding field of *section
// (the inverse of accumulate_stats()). *frame is only read.
static void subtract_stats(FIRSTPASS_STATS *section, FIRSTPASS_STATS *frame) {
  section->frame                  -= frame->frame;
  section->intra_error            -= frame->intra_error;
  section->coded_error            -= frame->coded_error;
  section->sr_coded_error         -= frame->sr_coded_error;
  section->ssim_weighted_pred_err -= frame->ssim_weighted_pred_err;
  section->pcnt_inter             -= frame->pcnt_inter;
  section->pcnt_motion            -= frame->pcnt_motion;
  section->pcnt_second_ref        -= frame->pcnt_second_ref;
  section->pcnt_neutral           -= frame->pcnt_neutral;
  section->MVr                    -= frame->MVr;
  section->mvr_abs                -= frame->mvr_abs;
  section->MVc                    -= frame->MVc;
  section->mvc_abs                -= frame->mvc_abs;
  section->MVrv                   -= frame->MVrv;
  section->MVcv                   -= frame->MVcv;
  section->mv_in_out_count        -= frame->mv_in_out_count;
  section->new_mv_count           -= frame->new_mv_count;
  section->count                  -= frame->count;
  section->duration               -= frame->duration;
}

John Koleszar's avatar
John Koleszar committed
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
// Converts accumulated totals in *section into per-frame averages by dividing
// by section->count. Does nothing when count is below 1.0.
//
// The fields frame, new_mv_count and count itself are deliberately left as
// they are: the code below does not divide them.
static void avg_stats(FIRSTPASS_STATS *section) {
  // count is not modified here, so it can be read once up front.
  const double frames = section->count;

  if (frames < 1.0)
    return;

  section->intra_error            /= frames;
  section->coded_error            /= frames;
  section->sr_coded_error         /= frames;
  section->ssim_weighted_pred_err /= frames;
  section->pcnt_inter             /= frames;
  section->pcnt_second_ref        /= frames;
  section->pcnt_neutral           /= frames;
  section->pcnt_motion            /= frames;
  section->MVr                    /= frames;
  section->mvr_abs                /= frames;
  section->MVc                    /= frames;
  section->mvc_abs                /= frames;
  section->MVrv                   /= frames;
  section->MVcv                   /= frames;
  section->mv_in_out_count        /= frames;
  section->duration               /= frames;
}

John Koleszar's avatar
John Koleszar committed
250
// Calculate a modified Error used in distributing bits between easier and harder frames
251
static double calculate_modified_err(VP9_COMP *cpi, FIRSTPASS_STATS *this_frame) {
John Koleszar's avatar
John Koleszar committed
252
253
254
255
256
257
258
259
260
261
262
  double av_err = (cpi->twopass.total_stats->ssim_weighted_pred_err /
                   cpi->twopass.total_stats->count);
  double this_err = this_frame->ssim_weighted_pred_err;
  double modified_err;

  if (this_err > av_err)
    modified_err = av_err * pow((this_err / DOUBLE_DIVIDE_CHECK(av_err)), POW1);
  else
    modified_err = av_err * pow((this_err / DOUBLE_DIVIDE_CHECK(av_err)), POW2);

  return modified_err;
John Koleszar's avatar
John Koleszar committed
263
264
}

265
// Per-sample weights, indexed by an 8-bit Y sample value in simple_weight().
//   indices   0..32 : 0.02
//   indices  33..63 : (index - 32) / 32, i.e. 0.03125 .. 0.96875
//   indices 64..255 : 1.0
static const double weight_table[256] = {
  0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000,
  0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000,
  0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000,
  0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000, 0.020000,
  0.020000, 0.031250, 0.062500, 0.093750, 0.125000, 0.156250, 0.187500, 0.218750,
  0.250000, 0.281250, 0.312500, 0.343750, 0.375000, 0.406250, 0.437500, 0.468750,
  0.500000, 0.531250, 0.562500, 0.593750, 0.625000, 0.656250, 0.687500, 0.718750,
  0.750000, 0.781250, 0.812500, 0.843750, 0.875000, 0.906250, 0.937500, 0.968750,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000,
  1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000, 1.000000
};

John Koleszar's avatar
John Koleszar committed
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
// Returns the mean of weight_table[] over all samples of the Y plane of
// *source (y_width x y_height samples, rows y_stride bytes apart).
//
// An empty plane (non-positive width or height) yields 0.0 instead of
// running off the buffer or dividing by zero.
static double simple_weight(YV12_BUFFER_CONFIG *source) {
  const int width = source->y_width;
  const int height = source->y_height;
  const unsigned char *row = source->y_buffer;
  double sum_weights = 0.0;
  int i, j;

  if (width <= 0 || height <= 0)
    return 0.0;

  // Loop through the raw Y plane examining levels and creating a weight for
  // the image. Samples are visited in the same order as before, so the
  // floating point sum is unchanged for valid frames.
  for (i = 0; i < height; i++) {
    for (j = 0; j < width; j++)
      sum_weights += weight_table[row[j]];

    row += source->y_stride;
  }

  // Form the sample count in double so that large frames cannot overflow int.
  return sum_weights / ((double)height * (double)width);
}

323

John Koleszar's avatar
John Koleszar committed
324
// This function returns the current per frame maximum bitrate target
325
static int frame_max_bits(VP9_COMP *cpi) {
John Koleszar's avatar
John Koleszar committed
326
327
  // Max allocation for a single frame based on the max section guidelines passed in and how many bits are left
  int max_bits;
John Koleszar's avatar
John Koleszar committed
328

John Koleszar's avatar
John Koleszar committed
329
330
  // For VBR base this on the bits and frames left plus the two_pass_vbrmax_section rate passed in by the user
  max_bits = (int)(((double)cpi->twopass.bits_left / (cpi->twopass.total_stats->count - (double)cpi->common.current_video_frame)) * ((double)cpi->oxcf.two_pass_vbrmax_section / 100.0));
John Koleszar's avatar
John Koleszar committed
331

John Koleszar's avatar
John Koleszar committed
332
333
334
  // Trap case where we are out of bits
  if (max_bits < 0)
    max_bits = 0;
John Koleszar's avatar
John Koleszar committed
335

John Koleszar's avatar
John Koleszar committed
336
  return max_bits;
John Koleszar's avatar
John Koleszar committed
337
338
}

339
// Prepares for a first pass by resetting the running totals held in
// cpi->twopass.total_stats (see zero_stats()).
void vp9_init_first_pass(VP9_COMP *cpi) {
  zero_stats(cpi->twopass.total_stats);
}

343
// Finishes a first pass by emitting cpi->twopass.total_stats as a stats
// packet on cpi->output_pkt_list (see output_stats()).
void vp9_end_first_pass(VP9_COMP *cpi) {
  output_stats(cpi, cpi->output_pkt_list, cpi->twopass.total_stats);
}
John Koleszar's avatar
John Koleszar committed
346

347
// Measures the 16x16 MSE between the current source block and the block at
// the same position (zero motion vector) in recon_buffer.
//
// recon_yoffset is the offset of the macroblock inside the Y plane of
// recon_buffer. The error is written to *best_motion_err. As a side effect
// xd->pre.y_buffer is pointed at the macroblock in recon_buffer.
// cpi is not used by this function.
static void zz_motion_search(VP9_COMP *cpi, MACROBLOCK *x,
                             YV12_BUFFER_CONFIG *recon_buffer,
                             int *best_motion_err, int recon_yoffset) {
  MACROBLOCKD *const xd = &x->e_mbd;
  BLOCK *b = &x->block[0];
  BLOCKD *d = &x->e_mbd.block[0];

  unsigned char *src_ptr = (*(b->base_src) + b->src);
  int src_stride = b->src_stride;
  unsigned char *ref_ptr;
  int ref_stride = d->pre_stride;

  // Set up pointers for this macro block recon buffer
  xd->pre.y_buffer = recon_buffer->y_buffer + recon_yoffset;

  // Must be read after the assignment above.
  // NOTE(review): presumably d->base_pre refers to xd->pre.y_buffer - confirm.
  ref_ptr = (unsigned char *)(*(d->base_pre) + d->pre);

  vp9_mse16x16(src_ptr, src_stride, ref_ptr, ref_stride,
               (unsigned int *)(best_motion_err));
}

366
static void first_pass_motion_search(VP9_COMP *cpi, MACROBLOCK *x,
Scott LaVarnway's avatar
Scott LaVarnway committed
367
368
                                     int_mv *ref_mv, MV *best_mv,
                                     YV12_BUFFER_CONFIG *recon_buffer,
John Koleszar's avatar
John Koleszar committed
369
                                     int *best_motion_err, int recon_yoffset) {
John Koleszar's avatar
John Koleszar committed
370
  MACROBLOCKD *const xd = &x->e_mbd;
John Koleszar's avatar
John Koleszar committed
371
372
373
374
375
376
377
378
379
380
381
  BLOCK *b = &x->block[0];
  BLOCKD *d = &x->e_mbd.block[0];
  int num00;

  int_mv tmp_mv;
  int_mv ref_mv_full;

  int tmp_err;
  int step_param = 3;
  int further_steps = (MAX_MVSEARCH_STEPS - 1) - step_param;
  int n;
382
  vp9_variance_fn_ptr_t v_fn_ptr = cpi->fn_ptr[BLOCK_16X16];
John Koleszar's avatar
John Koleszar committed
383
384
385
  int new_mv_mode_penalty = 256;

  // override the default variance function to use MSE
386
  v_fn_ptr.vf = vp9_mse16x16;
John Koleszar's avatar
John Koleszar committed
387
388
389
390
391
392
393
394
395
396

  // Set up pointers for this macro block recon buffer
  xd->pre.y_buffer = recon_buffer->y_buffer + recon_yoffset;

  // Initial step/diamond search centred on best mv
  tmp_mv.as_int = 0;
  ref_mv_full.as_mv.col = ref_mv->as_mv.col >> 3;
  ref_mv_full.as_mv.row = ref_mv->as_mv.row >> 3;
  tmp_err = cpi->diamond_search_sad(x, b, d, &ref_mv_full, &tmp_mv, step_param,
                                    x->sadperbit16, &num00, &v_fn_ptr,
397
398
                                    x->nmvjointcost,
                                    x->mvcost, ref_mv);
John Koleszar's avatar
John Koleszar committed
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
  if (tmp_err < INT_MAX - new_mv_mode_penalty)
    tmp_err += new_mv_mode_penalty;

  if (tmp_err < *best_motion_err) {
    *best_motion_err = tmp_err;
    best_mv->row = tmp_mv.as_mv.row;
    best_mv->col = tmp_mv.as_mv.col;
  }

  // Further step/diamond searches as necessary
  n = num00;
  num00 = 0;

  while (n < further_steps) {
    n++;

    if (num00)
      num00--;
    else {
      tmp_err = cpi->diamond_search_sad(x, b, d, &ref_mv_full, &tmp_mv,
                                        step_param + n, x->sadperbit16,
                                        &num00, &v_fn_ptr,
421
422
                                        x->nmvjointcost,
                                        x->mvcost, ref_mv);
John Koleszar's avatar
John Koleszar committed
423
      if (tmp_err < INT_MAX - new_mv_mode_penalty)
John Koleszar's avatar
John Koleszar committed
424
425
        tmp_err += new_mv_mode_penalty;

John Koleszar's avatar
John Koleszar committed
426
      if (tmp_err < *best_motion_err) {
John Koleszar's avatar
John Koleszar committed
427
        *best_motion_err = tmp_err;
Scott LaVarnway's avatar
Scott LaVarnway committed
428
429
        best_mv->row = tmp_mv.as_mv.row;
        best_mv->col = tmp_mv.as_mv.col;
John Koleszar's avatar
John Koleszar committed
430
      }
John Koleszar's avatar
John Koleszar committed
431
    }
John Koleszar's avatar
John Koleszar committed
432
  }
John Koleszar's avatar
John Koleszar committed
433
434
}

435
void vp9_first_pass(VP9_COMP *cpi) {
John Koleszar's avatar
John Koleszar committed
436
  int mb_row, mb_col;
John Koleszar's avatar
John Koleszar committed
437
  MACROBLOCK *const x = &cpi->mb;
438
  VP9_COMMON *const cm = &cpi->common;
John Koleszar's avatar
John Koleszar committed
439
  MACROBLOCKD *const xd = &x->e_mbd;
John Koleszar's avatar
John Koleszar committed
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466

  int recon_yoffset, recon_uvoffset;
  YV12_BUFFER_CONFIG *lst_yv12 = &cm->yv12_fb[cm->lst_fb_idx];
  YV12_BUFFER_CONFIG *new_yv12 = &cm->yv12_fb[cm->new_fb_idx];
  YV12_BUFFER_CONFIG *gld_yv12 = &cm->yv12_fb[cm->gld_fb_idx];
  int recon_y_stride = lst_yv12->y_stride;
  int recon_uv_stride = lst_yv12->uv_stride;
  int64_t intra_error = 0;
  int64_t coded_error = 0;
  int64_t sr_coded_error = 0;

  int sum_mvr = 0, sum_mvc = 0;
  int sum_mvr_abs = 0, sum_mvc_abs = 0;
  int sum_mvrs = 0, sum_mvcs = 0;
  int mvcount = 0;
  int intercount = 0;
  int second_ref_count = 0;
  int intrapenalty = 256;
  int neutral_count = 0;
  int new_mv_count = 0;
  int sum_in_vectors = 0;
  uint32_t lastmv_as_int = 0;

  int_mv zero_ref_mv;

  zero_ref_mv.as_int = 0;

467
  vp9_clear_system_state();  // __asm emms;
John Koleszar's avatar
John Koleszar committed
468
469
470
471
472
473
474
475
476

  x->src = * cpi->Source;
  xd->pre = *lst_yv12;
  xd->dst = *new_yv12;

  x->partition_info = x->pi;

  xd->mode_info_context = cm->mi;

477
  vp9_build_block_offsets(x);
John Koleszar's avatar
John Koleszar committed
478

479
  vp9_setup_block_dptrs(&x->e_mbd);
John Koleszar's avatar
John Koleszar committed
480

481
  vp9_setup_block_ptrs(x);
John Koleszar's avatar
John Koleszar committed
482
483

  // set up frame new frame for intra coded blocks
484
  vp9_setup_intra_recon(new_yv12);
485
  vp9_frame_init_quantizer(cpi);
John Koleszar's avatar
John Koleszar committed
486
487
488
489
490
491

  // Initialise the MV cost table to the defaults
  // if( cm->current_video_frame == 0)
  // if ( 0 )
  {
    int flag[2] = {1, 1};
492
    vp9_init_mv_probs(cm);
493
    vp9_initialize_rd_consts(cpi, cm->base_qindex + cm->y1dc_delta_q);
John Koleszar's avatar
John Koleszar committed
494
495
496
497
498
499
500
501
502
503
504
505
506
507
  }

  // for each macroblock row in image
  for (mb_row = 0; mb_row < cm->mb_rows; mb_row++) {
    int_mv best_ref_mv;

    best_ref_mv.as_int = 0;

    // reset above block coeffs
    xd->up_available = (mb_row != 0);
    recon_yoffset = (mb_row * recon_y_stride * 16);
    recon_uvoffset = (mb_row * recon_uv_stride * 8);

    // Set up limit values for motion vectors to prevent them extending outside the UMV borders
John Koleszar's avatar
John Koleszar committed
508
509
510
    x->mv_row_min = -((mb_row * 16) + (VP9BORDERINPIXELS - 16));
    x->mv_row_max = ((cm->mb_rows - 1 - mb_row) * 16)
                    + (VP9BORDERINPIXELS - 16);
John Koleszar's avatar
John Koleszar committed
511
512
513
514
515
516
517
518
519
520
521
522
523


    // for each macroblock col in image
    for (mb_col = 0; mb_col < cm->mb_cols; mb_col++) {
      int this_error;
      int gf_motion_error = INT_MAX;
      int use_dc_pred = (mb_col || mb_row) && (!mb_col || !mb_row);

      xd->dst.y_buffer = new_yv12->y_buffer + recon_yoffset;
      xd->dst.u_buffer = new_yv12->u_buffer + recon_uvoffset;
      xd->dst.v_buffer = new_yv12->v_buffer + recon_uvoffset;
      xd->left_available = (mb_col != 0);

524
#if !CONFIG_SUPERBLOCKS
John Koleszar's avatar
John Koleszar committed
525
      // Copy current mb to a buffer
526
      vp9_copy_mem16x16(x->src.y_buffer, x->src.y_stride, x->thismb, 16);
527
#endif
John Koleszar's avatar
John Koleszar committed
528
529

      // do intra 16x16 prediction
530
      this_error = vp9_encode_intra(cpi, x, use_dc_pred);
John Koleszar's avatar
John Koleszar committed
531
532
533
534
535
536
537
538
539
540
541

      // "intrapenalty" below deals with situations where the intra and inter error scores are very low (eg a plain black frame)
      // We do not have special cases in first pass for 0,0 and nearest etc so all inter modes carry an overhead cost estimate fot the mv.
      // When the error score is very low this causes us to pick all or lots of INTRA modes and throw lots of key frames.
      // This penalty adds a cost matching that of a 0,0 mv to the intra case.
      this_error += intrapenalty;

      // Cumulative intra error total
      intra_error += (int64_t)this_error;

      // Set up limit values for motion vectors to prevent them extending outside the UMV borders
John Koleszar's avatar
John Koleszar committed
542
543
544
      x->mv_col_min = -((mb_col * 16) + (VP9BORDERINPIXELS - 16));
      x->mv_col_max = ((cm->mb_cols - 1 - mb_col) * 16)
                      + (VP9BORDERINPIXELS - 16);
John Koleszar's avatar
John Koleszar committed
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572

      // Other than for the first frame do a motion search
      if (cm->current_video_frame > 0) {
        int tmp_err;
        int motion_error = INT_MAX;
        int_mv mv, tmp_mv;

        // Simple 0,0 motion with no mv overhead
        zz_motion_search(cpi, x, lst_yv12, &motion_error, recon_yoffset);
        mv.as_int = tmp_mv.as_int = 0;

        // Test last reference frame using the previous best mv as the
        // starting point (best reference) for the search
        first_pass_motion_search(cpi, x, &best_ref_mv,
                                 &mv.as_mv, lst_yv12,
                                 &motion_error, recon_yoffset);

        // If the current best reference mv is not centred on 0,0 then do a 0,0 based search as well
        if (best_ref_mv.as_int) {
          tmp_err = INT_MAX;
          first_pass_motion_search(cpi, x, &zero_ref_mv, &tmp_mv.as_mv,
                                   lst_yv12, &tmp_err, recon_yoffset);

          if (tmp_err < motion_error) {
            motion_error = tmp_err;
            mv.as_int = tmp_mv.as_int;
          }
        }
John Koleszar's avatar
John Koleszar committed
573

John Koleszar's avatar
John Koleszar committed
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
        // Experimental search in an older reference frame
        if (cm->current_video_frame > 1) {
          // Simple 0,0 motion with no mv overhead
          zz_motion_search(cpi, x, gld_yv12,
                           &gf_motion_error, recon_yoffset);

          first_pass_motion_search(cpi, x, &zero_ref_mv,
                                   &tmp_mv.as_mv, gld_yv12,
                                   &gf_motion_error, recon_yoffset);

          if ((gf_motion_error < motion_error) &&
              (gf_motion_error < this_error)) {
            second_ref_count++;
          }

          // Reset to last frame as reference buffer
          xd->pre.y_buffer = lst_yv12->y_buffer + recon_yoffset;
          xd->pre.u_buffer = lst_yv12->u_buffer + recon_uvoffset;
          xd->pre.v_buffer = lst_yv12->v_buffer + recon_uvoffset;

          // In accumulating a score for the older reference frame
          // take the best of the motion predicted score and
          // the intra coded error (just as will be done for)
          // accumulation of "coded_error" for the last frame.
          if (gf_motion_error < this_error)
            sr_coded_error += gf_motion_error;
          else
            sr_coded_error += this_error;
        } else
          sr_coded_error += motion_error;
604

John Koleszar's avatar
John Koleszar committed
605
        /* Intra assumed best */
606
        best_ref_mv.as_int = 0;
John Koleszar's avatar
John Koleszar committed
607

John Koleszar's avatar
John Koleszar committed
608
609
610
611
612
613
614
615
616
617
618
619
620
621
        if (motion_error <= this_error) {
          // Keep a count of cases where the inter and intra were
          // very close and very low. This helps with scene cut
          // detection for example in cropped clips with black bars
          // at the sides or top and bottom.
          if ((((this_error - intrapenalty) * 9) <=
               (motion_error * 10)) &&
              (this_error < (2 * intrapenalty))) {
            neutral_count++;
          }

          mv.as_mv.row <<= 3;
          mv.as_mv.col <<= 3;
          this_error = motion_error;
622
          vp9_set_mbmode_and_mvs(x, NEWMV, &mv);
623
          xd->mode_info_context->mbmi.txfm_size = TX_4X4;
624
          vp9_encode_inter16x16y(x);
John Koleszar's avatar
John Koleszar committed
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
          sum_mvr += mv.as_mv.row;
          sum_mvr_abs += abs(mv.as_mv.row);
          sum_mvc += mv.as_mv.col;
          sum_mvc_abs += abs(mv.as_mv.col);
          sum_mvrs += mv.as_mv.row * mv.as_mv.row;
          sum_mvcs += mv.as_mv.col * mv.as_mv.col;
          intercount++;

          best_ref_mv.as_int = mv.as_int;

          // Was the vector non-zero
          if (mv.as_int) {
            mvcount++;

            // Was it different from the last non zero vector
            if (mv.as_int != lastmv_as_int)
              new_mv_count++;
            lastmv_as_int = mv.as_int;

            // Does the Row vector point inwards or outwards
            if (mb_row < cm->mb_rows / 2) {
              if (mv.as_mv.row > 0)
                sum_in_vectors--;
              else if (mv.as_mv.row < 0)
                sum_in_vectors++;
            } else if (mb_row > cm->mb_rows / 2) {
              if (mv.as_mv.row > 0)
                sum_in_vectors++;
              else if (mv.as_mv.row < 0)
                sum_in_vectors--;
John Koleszar's avatar
John Koleszar committed
655
656
            }

John Koleszar's avatar
John Koleszar committed
657
658
659
660
661
662
663
664
665
666
667
668
669
            // Does the Row vector point inwards or outwards
            if (mb_col < cm->mb_cols / 2) {
              if (mv.as_mv.col > 0)
                sum_in_vectors--;
              else if (mv.as_mv.col < 0)
                sum_in_vectors++;
            } else if (mb_col > cm->mb_cols / 2) {
              if (mv.as_mv.col > 0)
                sum_in_vectors++;
              else if (mv.as_mv.col < 0)
                sum_in_vectors--;
            }
          }
John Koleszar's avatar
John Koleszar committed
670
        }
John Koleszar's avatar
John Koleszar committed
671
672
      } else
        sr_coded_error += (int64_t)this_error;
John Koleszar's avatar
John Koleszar committed
673

John Koleszar's avatar
John Koleszar committed
674
      coded_error += (int64_t)this_error;
John Koleszar's avatar
John Koleszar committed
675

John Koleszar's avatar
John Koleszar committed
676
677
678
679
      // adjust to the next column of macroblocks
      x->src.y_buffer += 16;
      x->src.u_buffer += 8;
      x->src.v_buffer += 8;
John Koleszar's avatar
John Koleszar committed
680

John Koleszar's avatar
John Koleszar committed
681
682
      recon_yoffset += 16;
      recon_uvoffset += 8;
John Koleszar's avatar
John Koleszar committed
683
684
    }

John Koleszar's avatar
John Koleszar committed
685
686
687
688
689
690
    // adjust to the next row of mbs
    x->src.y_buffer += 16 * x->src.y_stride - 16 * cm->mb_cols;
    x->src.u_buffer += 8 * x->src.uv_stride - 8 * cm->mb_cols;
    x->src.v_buffer += 8 * x->src.uv_stride - 8 * cm->mb_cols;

    // extend the recon for intra prediction
691
692
    vp9_extend_mb_row(new_yv12, xd->dst.y_buffer + 16,
                      xd->dst.u_buffer + 8, xd->dst.v_buffer + 8);
693
    vp9_clear_system_state();  // __asm emms;
John Koleszar's avatar
John Koleszar committed
694
695
  }

696
  vp9_clear_system_state();  // __asm emms;
John Koleszar's avatar
John Koleszar committed
697
698
699
700
701
702
  {
    double weight = 0.0;

    FIRSTPASS_STATS fps;

    fps.frame      = cm->current_video_frame;
703
704
705
    fps.intra_error = (double)(intra_error >> 8);
    fps.coded_error = (double)(coded_error >> 8);
    fps.sr_coded_error = (double)(sr_coded_error >> 8);
John Koleszar's avatar
John Koleszar committed
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
    weight = simple_weight(cpi->Source);


    if (weight < 0.1)
      weight = 0.1;

    fps.ssim_weighted_pred_err = fps.coded_error * weight;

    fps.pcnt_inter  = 0.0;
    fps.pcnt_motion = 0.0;
    fps.MVr        = 0.0;
    fps.mvr_abs     = 0.0;
    fps.MVc        = 0.0;
    fps.mvc_abs     = 0.0;
    fps.MVrv       = 0.0;
    fps.MVcv       = 0.0;
    fps.mv_in_out_count  = 0.0;
    fps.new_mv_count = 0.0;
    fps.count      = 1.0;

    fps.pcnt_inter   = 1.0 * (double)intercount / cm->MBs;
    fps.pcnt_second_ref = 1.0 * (double)second_ref_count / cm->MBs;
    fps.pcnt_neutral = 1.0 * (double)neutral_count / cm->MBs;

    if (mvcount > 0) {
      fps.MVr = (double)sum_mvr / (double)mvcount;
      fps.mvr_abs = (double)sum_mvr_abs / (double)mvcount;
      fps.MVc = (double)sum_mvc / (double)mvcount;
      fps.mvc_abs = (double)sum_mvc_abs / (double)mvcount;
      fps.MVrv = ((double)sum_mvrs - (fps.MVr * fps.MVr / (double)mvcount)) / (double)mvcount;
      fps.MVcv = ((double)sum_mvcs - (fps.MVc * fps.MVc / (double)mvcount)) / (double)mvcount;
      fps.mv_in_out_count = (double)sum_in_vectors / (double)(mvcount * 2);
      fps.new_mv_count = new_mv_count;

      fps.pcnt_motion = 1.0 * (double)mvcount / cpi->common.MBs;
Paul Wilkins's avatar
Paul Wilkins committed
741
    }
John Koleszar's avatar
John Koleszar committed
742

John Koleszar's avatar
John Koleszar committed
743
744
    // TODO:  handle the case when duration is set to 0, or something less
    // than the full time between subsequent cpi->source_time_stamp s  .
745
746
    fps.duration = (double)(cpi->source->ts_end
                            - cpi->source->ts_start);
John Koleszar's avatar
John Koleszar committed
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762

    // don't want to do output stats with a stack variable!
    memcpy(cpi->twopass.this_frame_stats,
           &fps,
           sizeof(FIRSTPASS_STATS));
    output_stats(cpi, cpi->output_pkt_list, cpi->twopass.this_frame_stats);
    accumulate_stats(cpi->twopass.total_stats, &fps);
  }

  // Copy the previous Last Frame back into the gf and arf buffers if
  // the prediction is good enough... but also don't allow it to lag too far
  if ((cpi->twopass.sr_update_lag > 3) ||
      ((cm->current_video_frame > 0) &&
       (cpi->twopass.this_frame_stats->pcnt_inter > 0.20) &&
       ((cpi->twopass.this_frame_stats->intra_error /
         cpi->twopass.this_frame_stats->coded_error) > 2.0))) {
John Koleszar's avatar
John Koleszar committed
763
    vp8_yv12_copy_frame(lst_yv12, gld_yv12);
John Koleszar's avatar
John Koleszar committed
764
765
766
    cpi->twopass.sr_update_lag = 1;
  } else
    cpi->twopass.sr_update_lag++;
John Koleszar's avatar
John Koleszar committed
767

John Koleszar's avatar
John Koleszar committed
768
  // swap frame pointers so last frame refers to the frame we just compressed
769
  vp9_swap_yv12_buffer(lst_yv12, new_yv12);
John Koleszar's avatar
John Koleszar committed
770
  vp8_yv12_extend_frame_borders(lst_yv12);
John Koleszar's avatar
John Koleszar committed
771

John Koleszar's avatar
John Koleszar committed
772
773
  // Special case for the first frame. Copy into the GF buffer as a second reference.
  if (cm->current_video_frame == 0) {
John Koleszar's avatar
John Koleszar committed
774
    vp8_yv12_copy_frame(lst_yv12, gld_yv12);
John Koleszar's avatar
John Koleszar committed
775
  }
John Koleszar's avatar
John Koleszar committed
776
777


John Koleszar's avatar
John Koleszar committed
778
779
780
781
782
  // use this to see what the first pass reconstruction looks like
  if (0) {
    char filename[512];
    FILE *recon_file;
    sprintf(filename, "enc%04d.yuv", (int) cm->current_video_frame);
John Koleszar's avatar
John Koleszar committed
783

John Koleszar's avatar
John Koleszar committed
784
785
786
787
788
789
790
791
    if (cm->current_video_frame == 0)
      recon_file = fopen(filename, "wb");
    else
      recon_file = fopen(filename, "ab");

    if (fwrite(lst_yv12->buffer_alloc, lst_yv12->frame_size, 1, recon_file));
    fclose(recon_file);
  }
John Koleszar's avatar
John Koleszar committed
792

John Koleszar's avatar
John Koleszar committed
793
  cm->current_video_frame++;
John Koleszar's avatar
John Koleszar committed
794
795
796

}

797
798
799
800
801
802
// Estimate a cost per mb attributable to overheads such as the coding of
// modes and motion vectors.
// Currently simplistic in its assumptions for testing.
//


803
static double bitcost(double prob) {
John Koleszar's avatar
John Koleszar committed
804
  return -(log(prob) / log(2.0));
805
}
806

807
static long long estimate_modemvcost(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
                                     FIRSTPASS_STATS *fpstats) {
  int mv_cost;
  int mode_cost;

  double av_pct_inter = fpstats->pcnt_inter / fpstats->count;
  double av_pct_motion = fpstats->pcnt_motion / fpstats->count;
  double av_intra = (1.0 - av_pct_inter);

  double zz_cost;
  double motion_cost;
  double intra_cost;

  zz_cost = bitcost(av_pct_inter - av_pct_motion);
  motion_cost = bitcost(av_pct_motion);
  intra_cost = bitcost(av_intra);

  // Estimate of extra bits per mv overhead for mbs
825
  // << 9 is the normalization to the (bits * 512) used in vp9_bits_per_mb
John Koleszar's avatar
John Koleszar committed
826
827
828
  mv_cost = ((int)(fpstats->new_mv_count / fpstats->count) * 8) << 9;

  // Crude estimate of overhead cost from modes
829
  // << 9 is the normalization to (bits * 512) used in vp9_bits_per_mb
John Koleszar's avatar
John Koleszar committed
830
831
832
833
834
835
836
837
  mode_cost =
    (int)((((av_pct_inter - av_pct_motion) * zz_cost) +
           (av_pct_motion * motion_cost) +
           (av_intra * intra_cost)) * cpi->common.MBs) << 9;

  // return mv_cost + mode_cost;
  // TODO PGW Fix overhead costs for extended Q range
  return 0;
838
839
}

John Koleszar's avatar
John Koleszar committed
840
841
842
843
844
845
846
847
// Computes a multiplicative correction factor from the error per MB.
//
// The factor is (err_per_mb / err_divisor) raised to a power that grows
// with the real quantizer for index Q: it starts at pt_low and is capped at
// pt_high. The result is limited to the range [0.05, 2.0].
static double calc_correction_factor(double err_per_mb,
                                     double err_divisor,
                                     double pt_low,
                                     double pt_high,
                                     int Q) {
  const double scaled_error = err_per_mb / err_divisor;
  double exponent;
  double factor;

  // Exponent follows the actual quantizer, capped at pt_high.
  exponent = (vp9_convert_qindex_to_q(Q) * 0.01) + pt_low;
  if (exponent > pt_high)
    exponent = pt_high;

  // Adjustments to error term
  // TBD

  factor = pow(scaled_error, exponent);

  // Keep the factor inside its permitted range.
  if (factor < 0.05)
    factor = 0.05;
  else if (factor > 2.0)
    factor = 2.0;

  return factor;
}

Paul Wilkins's avatar
Paul Wilkins committed
867
868
869
870
// Given a current maxQ value sets a range for future values.
// PGW TODO..
// This code removes direct dependency on QIndex to determine the range
// (now uses the actual quantizer) but has not been tuned.
871
// Re-derives cpi->twopass.maxq_max_limit and maxq_min_limit from the
// running average quantizer cpi->avg_q.
//
// The upper limit becomes the lowest q index in [best_quality,
// worst_quality] whose real quantizer is at least 2.0 * avg_q (or
// worst_quality if there is none). The lower limit becomes the highest q
// index in that range whose real quantizer is at most 0.5 * avg_q (or
// best_quality if there is none).
static void adjust_maxq_qrange(VP9_COMP *cpi) {
  const int best = cpi->best_quality;
  const int worst = cpi->worst_quality;
  const double upper_q = cpi->avg_q * 2.0;
  const double lower_q = cpi->avg_q * 0.5;
  int qindex;
  int limit;

  // Scan upwards for the first index that reaches upper_q.
  limit = worst;
  for (qindex = best; qindex <= worst; ++qindex) {
    if (vp9_convert_qindex_to_q(qindex) >= upper_q) {
      limit = qindex;
      break;
    }
  }
  cpi->twopass.maxq_max_limit = limit;

  // Scan downwards for the first index that drops to lower_q.
  limit = best;
  for (qindex = worst; qindex >= best; --qindex) {
    if (vp9_convert_qindex_to_q(qindex) <= lower_q) {
      limit = qindex;
      break;
    }
  }
  cpi->twopass.maxq_min_limit = limit;
}
Paul Wilkins's avatar
Paul Wilkins committed
893

894
static int estimate_max_q(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
895
                          FIRSTPASS_STATS *fpstats,
896
                          int section_target_bandwitdh,
John Koleszar's avatar
John Koleszar committed
897
898
899
900
901
902
903
904
905
906
907
                          int overhead_bits) {
  int Q;
  int num_mbs = cpi->common.MBs;
  int target_norm_bits_per_mb;

  double section_err = (fpstats->coded_error / fpstats->count);
  double sr_err_diff;
  double sr_correction;
  double err_per_mb = section_err / num_mbs;
  double err_correction_factor;
  double speed_correction = 1.0;
908
  double overhead_bits_per_mb;
John Koleszar's avatar
John Koleszar committed
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982

  if (section_target_bandwitdh <= 0)
    return cpi->twopass.maxq_max_limit;          // Highest value allowed

  target_norm_bits_per_mb =
    (section_target_bandwitdh < (1 << 20))
    ? (512 * section_target_bandwitdh) / num_mbs
    : 512 * (section_target_bandwitdh / num_mbs);

  // Look at the drop in prediction quality between the last frame
  // and the GF buffer (which contained an older frame).
  sr_err_diff =
    (fpstats->sr_coded_error - fpstats->coded_error) /
    (fpstats->count * cpi->common.MBs);
  sr_correction = (sr_err_diff / 32.0);
  sr_correction = pow(sr_correction, 0.25);
  if (sr_correction < 0.75)
    sr_correction = 0.75;
  else if (sr_correction > 1.25)
    sr_correction = 1.25;

  // Calculate a corrective factor based on a rolling ratio of bits spent
  // vs target bits
  if ((cpi->rolling_target_bits > 0) &&
      (cpi->active_worst_quality < cpi->worst_quality)) {
    double rolling_ratio;

    rolling_ratio = (double)cpi->rolling_actual_bits /
                    (double)cpi->rolling_target_bits;

    if (rolling_ratio < 0.95)
      cpi->twopass.est_max_qcorrection_factor -= 0.005;
    else if (rolling_ratio > 1.05)
      cpi->twopass.est_max_qcorrection_factor += 0.005;

    cpi->twopass.est_max_qcorrection_factor =
      (cpi->twopass.est_max_qcorrection_factor < 0.1)
      ? 0.1
      : (cpi->twopass.est_max_qcorrection_factor > 10.0)
      ? 10.0 : cpi->twopass.est_max_qcorrection_factor;
  }

  // Corrections for higher compression speed settings
  // (reduced compression expected)
  if (cpi->compressor_speed == 1) {
    if (cpi->oxcf.cpu_used <= 5)
      speed_correction = 1.04 + (cpi->oxcf.cpu_used * 0.04);
    else
      speed_correction = 1.25;
  }

  // Estimate of overhead bits per mb
  // Correction to overhead bits for min allowed Q.
  // PGW TODO.. This code is broken for the extended Q range
  //            for now overhead set to 0.
  overhead_bits_per_mb = overhead_bits / num_mbs;
  overhead_bits_per_mb *= pow(0.98, (double)cpi->twopass.maxq_min_limit);

  // Try and pick a max Q that will be high enough to encode the
  // content at the given rate.
  for (Q = cpi->twopass.maxq_min_limit; Q < cpi->twopass.maxq_max_limit; Q++) {
    int bits_per_mb_at_this_q;

    err_correction_factor =
      calc_correction_factor(err_per_mb, ERR_DIVISOR, 0.4, 0.90, Q) *
      sr_correction * speed_correction *
      cpi->twopass.est_max_qcorrection_factor;

    if (err_correction_factor < 0.05)
      err_correction_factor = 0.05;
    else if (err_correction_factor > 5.0)
      err_correction_factor = 5.0;

    bits_per_mb_at_this_q =
983
      vp9_bits_per_mb(INTER_FRAME, Q) + (int)overhead_bits_per_mb;
John Koleszar's avatar
John Koleszar committed
984
985
986
987
988
989
990

    bits_per_mb_at_this_q = (int)(.5 + err_correction_factor *
                                  (double)bits_per_mb_at_this_q);

    // Mode and motion overhead
    // As Q rises in real encode loop rd code will force overhead down
    // We make a crude adjustment for this here as *.98 per Q step.
991
    // PGW TODO.. This code is broken for the extended Q range
Paul Wilkins's avatar
Paul Wilkins committed
992
    //            for now overhead set to 0.
John Koleszar's avatar
John Koleszar committed
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
    // overhead_bits_per_mb = (int)((double)overhead_bits_per_mb * 0.98);

    if (bits_per_mb_at_this_q <= target_norm_bits_per_mb)
      break;
  }

  // Restriction on active max q for constrained quality mode.
  if ((cpi->oxcf.end_usage == USAGE_CONSTRAINED_QUALITY) &&
      (Q < cpi->cq_target_quality)) {
    Q = cpi->cq_target_quality;
  }

  // Adjust maxq_min_limit and maxq_max_limit limits based on
  // averaga q observed in clip for non kf/gf/arf frames
  // Give average a chance to settle though.
  // PGW TODO.. This code is broken for the extended Q range
  if ((cpi->ni_frames >
1010
       ((int)cpi->twopass.total_stats->count >> 8)) &&
John Koleszar's avatar
John Koleszar committed
1011
1012
1013
1014
1015
      (cpi->ni_frames > 150)) {
    adjust_maxq_qrange(cpi);
  }

  return Q;
John Koleszar's avatar
John Koleszar committed
1016
}
1017
1018
1019

// For cq mode estimate a cq level that matches the observed
// complexity and data rate.
1020
static int estimate_cq(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
                       FIRSTPASS_STATS *fpstats,
                       int section_target_bandwitdh,
                       int overhead_bits) {
  int Q;
  int num_mbs = cpi->common.MBs;
  int target_norm_bits_per_mb;

  double section_err = (fpstats->coded_error / fpstats->count);
  double err_per_mb = section_err / num_mbs;
  double err_correction_factor;
  double sr_err_diff;
  double sr_correction;
  double speed_correction = 1.0;
  double clip_iiratio;
  double clip_iifactor;
1036
  double overhead_bits_per_mb;
John Koleszar's avatar
John Koleszar committed
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
1088


  target_norm_bits_per_mb = (section_target_bandwitdh < (1 << 20))
                            ? (512 * section_target_bandwitdh) / num_mbs
                            : 512 * (section_target_bandwitdh / num_mbs);

  // Estimate of overhead bits per mb
  overhead_bits_per_mb = overhead_bits / num_mbs;

  // Corrections for higher compression speed settings
  // (reduced compression expected)
  if (cpi->compressor_speed == 1) {
    if (cpi->oxcf.cpu_used <= 5)
      speed_correction = 1.04 + (cpi->oxcf.cpu_used * 0.04);
    else
      speed_correction = 1.25;
  }

  // Look at the drop in prediction quality between the last frame
  // and the GF buffer (which contained an older frame).
  sr_err_diff =
    (fpstats->sr_coded_error - fpstats->coded_error) /
    (fpstats->count * cpi->common.MBs);
  sr_correction = (sr_err_diff / 32.0);
  sr_correction = pow(sr_correction, 0.25);
  if (sr_correction < 0.75)
    sr_correction = 0.75;
  else if (sr_correction > 1.25)
    sr_correction = 1.25;

  // II ratio correction factor for clip as a whole
  clip_iiratio = cpi->twopass.total_stats->intra_error /
                 DOUBLE_DIVIDE_CHECK(cpi->twopass.total_stats->coded_error);
  clip_iifactor = 1.0 - ((clip_iiratio - 10.0) * 0.025);
  if (clip_iifactor < 0.80)
    clip_iifactor = 0.80;

  // Try and pick a Q that can encode the content at the given rate.
  for (Q = 0; Q < MAXQ; Q++) {
    int bits_per_mb_at_this_q;

    // Error per MB based correction factor
    err_correction_factor =
      calc_correction_factor(err_per_mb, 100.0, 0.4, 0.90, Q) *
      sr_correction * speed_correction * clip_iifactor;

    if (err_correction_factor < 0.05)
      err_correction_factor = 0.05;
    else if (err_correction_factor > 5.0)
      err_correction_factor = 5.0;

    bits_per_mb_at_this_q =
1089
      vp9_bits_per_mb(INTER_FRAME, Q) + (int)overhead_bits_per_mb;
John Koleszar's avatar
John Koleszar committed
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099

    bits_per_mb_at_this_q = (int)(.5 + err_correction_factor *
                                  (double)bits_per_mb_at_this_q);

    // Mode and motion overhead
    // As Q rises in real encode loop rd code will force overhead down
    // We make a crude adjustment for this here as *.98 per Q step.
    // PGW TODO.. This code is broken for the extended Q range
    //            for now overhead set to 0.
    overhead_bits_per_mb = (int)((double)overhead_bits_per_mb * 0.98);
1100

John Koleszar's avatar
John Koleszar committed
1101
1102
1103
    if (bits_per_mb_at_this_q <= target_norm_bits_per_mb)
      break;
  }
1104

John Koleszar's avatar
John Koleszar committed
1105
1106
1107
1108
1109
1110
  // Clip value to range "best allowed to (worst allowed - 1)"
  Q = select_cq_level(Q);
  if (Q >= cpi->worst_quality)
    Q = cpi->worst_quality - 1;
  if (Q < cpi->best_quality)
    Q = cpi->best_quality;
1111

John Koleszar's avatar
John Koleszar committed
1112
  return Q;
1113
1114
}

Paul Wilkins's avatar
CQ Mode    
Paul Wilkins committed
1115

1116
extern void vp9_new_frame_rate(VP9_COMP *cpi, double framerate);
John Koleszar's avatar
John Koleszar committed
1117

1118
// Initializes the two-pass rate control state in cpi->twopass from the
// first pass stats.
//
// Clears the running totals and returns early if there is no end-of-stats
// record. Otherwise it loads the totals from stats_in_end, derives the frame
// rate and the bit budget (bits_left) from the total duration, sets the
// minimum intra error thresholds, and scans the stats twice to compute
// avg_iiratio and modified_error_total. The stats read position is restored
// after each scan.
void vp9_init_second_pass(VP9_COMP *cpi) {
  FIRSTPASS_STATS this_frame;
  FIRSTPASS_STATS *start_pos;

  double lower_bounds_min_rate = FRAME_OVERHEAD_BITS * cpi->oxcf.frame_rate;
  // Widen before multiplying: if both settings are plain ints, their
  // product can overflow for large bandwidths before the division by 100.
  double two_pass_min_rate =
    (double)((int64_t)cpi->oxcf.target_bandwidth *
             cpi->oxcf.two_pass_vbrmin_section / 100);

  if (two_pass_min_rate < lower_bounds_min_rate)
    two_pass_min_rate = lower_bounds_min_rate;

  zero_stats(cpi->twopass.total_stats);
  zero_stats(cpi->twopass.total_left_stats);

  if (!cpi->twopass.stats_in_end)
    return;

  *cpi->twopass.total_stats = *cpi->twopass.stats_in_end;
  *cpi->twopass.total_left_stats = *cpi->twopass.total_stats;

  // each frame can have a different duration, as the frame rate in the source
  // isn't guaranteed to be constant.   The frame rate prior to the first frame
  // encoded in the second pass is a guess.  However the sum duration is not.
  // Its calculated based on the actual durations of all frames from the first
  // pass.
  // NOTE(review): a total duration of 0 is not guarded against here.
  vp9_new_frame_rate(cpi,
                     10000000.0 * cpi->twopass.total_stats->count /
                     cpi->twopass.total_stats->duration);

  cpi->output_frame_rate = cpi->oxcf.frame_rate;
  cpi->twopass.bits_left = (int64_t)(cpi->twopass.total_stats->duration *
                                     cpi->oxcf.target_bandwidth / 10000000.0);
  cpi->twopass.bits_left -= (int64_t)(cpi->twopass.total_stats->duration *
                                      two_pass_min_rate / 10000000.0);

  // Calculate a minimum intra value to be used in determining the IIratio
  // scores used in the second pass. We have this minimum to make sure
  // that clips that are static but "low complexity" in the intra domain
  // are still boosted appropriately for KF/GF/ARF
  cpi->twopass.kf_intra_err_min = KF_MB_INTRA_MIN * cpi->common.MBs;
  cpi->twopass.gf_intra_err_min = GF_MB_INTRA_MIN * cpi->common.MBs;

  // This variable monitors how far behind the second ref update is lagging
  cpi->twopass.sr_update_lag = 1;

  // Scan the first pass file and calculate an average Intra / Inter error
  // score ratio for the sequence
  {
    double sum_iiratio = 0.0;
    double IIRatio;

    start_pos = cpi->twopass.stats_in;               // Note starting "file" position

    while (input_stats(cpi, &this_frame) != EOF) {
      IIRatio = this_frame.intra_error / DOUBLE_DIVIDE_CHECK(this_frame.coded_error);
      // Each frame's ratio is limited to [1.0, 20.0] before averaging.
      IIRatio = (IIRatio < 1.0) ? 1.0 : (IIRatio > 20.0) ? 20.0 : IIRatio;
      sum_iiratio += IIRatio;
    }

    cpi->twopass.avg_iiratio = sum_iiratio / DOUBLE_DIVIDE_CHECK((double)cpi->twopass.total_stats->count);

    // Reset file position
    reset_fpf_position(cpi, start_pos);
  }

  // Scan the first pass file and calculate a modified total error based upon
  // the bias/power function used to allocate bits
  {
    start_pos = cpi->twopass.stats_in;               // Note starting "file" position

    cpi->twopass.modified_error_total = 0.0;
    cpi->twopass.modified_error_used = 0.0;

    while (input_stats(cpi, &this_frame) != EOF) {
      cpi->twopass.modified_error_total += calculate_modified_err(cpi, &this_frame);
    }
    cpi->twopass.modified_error_left = cpi->twopass.modified_error_total;

    reset_fpf_position(cpi, start_pos);            // Reset file position

  }
}

1200
// Second pass teardown hook. It currently performs no work.
void vp9_end_second_pass(VP9_COMP *cpi) {
  (void)cpi;
}

Paul Wilkins's avatar
Paul Wilkins committed
1203
// This function gives an estimate of how badly we believe
Adrian Grange's avatar
Adrian Grange committed
1204
// the prediction quality is decaying from frame to frame.
1205
static double get_prediction_decay_rate(VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
1206
1207
1208
1209
1210
1211
1212
1213
1214
1215
1216
1217
1218
1219
1220
1221
1222
1223
1224
1225
1226
1227
1228
1229
                                        FIRSTPASS_STATS *next_frame) {
  double prediction_decay_rate;
  double second_ref_decay;
  double mb_sr_err_diff;

  // Initial basis is the % mbs inter coded
  prediction_decay_rate = next_frame->pcnt_inter;

  // Look at the observed drop in prediction quality between the last frame
  // and the GF buffer (which contains an older frame).
  mb_sr_err_diff =
    (next_frame->sr_coded_error - next_frame->coded_error) /
    (cpi->common.MBs);
  second_ref_decay = 1.0 - (mb_sr_err_diff / 512.0);
  second_ref_decay = pow(second_ref_decay, 0.5);
  if (second_ref_decay < 0.85)
    second_ref_decay = 0.85;
  else if (second_ref_decay > 1.0)
    second_ref_decay = 1.0;

  if (second_ref_decay < prediction_decay_rate)
    prediction_decay_rate = second_ref_decay;

  return prediction_decay_rate;
Paul Wilkins's avatar
Paul Wilkins committed
1230
1231
}

Paul Wilkins's avatar
Paul Wilkins committed
1232
// Function to test for a condition where a complex transition is followed
1233
1234
// by a static section. For example in slide shows where there is a fade
// between slides. This is to help with more optimal kf and gf positioning.
1235
static int detect_transition_to_still(
1236
  VP9_COMP *cpi,
John Koleszar's avatar
John Koleszar committed
1237
1238
1239
1240
1241
1242
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
1258
  int frame_interval,
  int still_interval,
  double loop_decay_rate,
  double last_decay_rate) {
  BOOL trans_to_still = FALSE;

  // Break clause to detect very still sections after motion
  // For example a static image after a fade or other transition
  // instead of a clean scene cut.
  if ((frame_interval > MIN_GF_INTERVAL) &&
      (loop_decay_rate >= 0.999) &&
      (last_decay_rate < 0.9)) {
    int j;
    FIRSTPASS_STATS *position = cpi->twopass.stats_in;
    FIRSTPASS_STATS tmp_next_frame;
    double zz_inter;

    // Look ahead a few frames to see if static condition
    // persists...
    for (j = 0; j < still_interval; j++) {
      if (EOF == input_stats(cpi, &tmp_next_frame))
        break;
1259

John Koleszar's avatar
John Koleszar committed
1260
1261
1262
1263
      zz_inter =
        (tmp_next_frame.pcnt_inter - tmp_next_frame.pcnt_motion);
      if (zz_inter < 0.999)
        break;
1264
    }
John Koleszar's avatar
John Koleszar committed
1265
1266
    // Reset file position
    reset_fpf_position(cpi, position);
1267

John Koleszar's avatar
John Koleszar committed
1268
1269
1270
1271
1272
1273
    // Only if it does do we signal a transition to still
    if (j == still_interval)
      trans_to_still = TRUE;
  }

  return trans_to_still;
1274
}
Paul Wilkins's avatar
Paul Wilkins committed
1275

1276
1277
1278
// This function detects a flash through the high relative pcnt_second_ref
// score in the frame following a flash frame. The offset passed in should
// reflect this
1279
// Reports whether the stats record at `offset` indicates recovery from a
// flash.
//
// Returns FALSE if no record can be read at that offset. Otherwise returns
// TRUE when pcnt_second_ref is both greater than pcnt_inter and at least
// 0.5.
static BOOL detect_flash(VP9_COMP *cpi, int offset) {
  FIRSTPASS_STATS stats;

  // No valid frame at this offset means no flash.
  if (read_frame_stats(cpi, &stats, offset) == EOF)
    return FALSE;

  // A flash briefly breaks prediction, but the frames after it are again
  // well predicted by an earlier (pre flash) frame. That recovery shows up
  // as a high pcnt_second_ref compared to pcnt_inter.
  return ((stats.pcnt_second_ref > stats.pcnt_inter) &&
          (stats.pcnt_second_ref >= 0.5)) ? TRUE : FALSE;
}

// Update the motion related elements to the GF arf boost calculation
static void accumulate_frame_motion_stats(