vp9_encodeframe.c 123 KB
Newer Older
John Koleszar's avatar
John Koleszar committed
1
/*
2
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
John Koleszar's avatar
John Koleszar committed
3
 *
4
 *  Use of this source code is governed by a BSD-style license
5
6
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
7
 *  in the file PATENTS.  All contributing project authors may
8
 *  be found in the AUTHORS file in the root of the source tree.
John Koleszar's avatar
John Koleszar committed
9
10
 */

Dmitry Kovalev's avatar
Dmitry Kovalev committed
11
12
13
14
#include <limits.h>
#include <math.h>
#include <stdio.h>

Jim Bankoski's avatar
Jim Bankoski committed
15
#include "./vp9_rtcd.h"
Dmitry Kovalev's avatar
Dmitry Kovalev committed
16
17
18
19
#include "./vpx_config.h"

#include "vpx_ports/vpx_timer.h"

20
#include "vp9/common/vp9_common.h"
Yaowu Xu's avatar
Yaowu Xu committed
21
#include "vp9/common/vp9_entropy.h"
22
#include "vp9/common/vp9_entropymode.h"
23
#include "vp9/common/vp9_idct.h"
Dmitry Kovalev's avatar
Dmitry Kovalev committed
24
25
26
#include "vp9/common/vp9_mvref_common.h"
#include "vp9/common/vp9_pred_common.h"
#include "vp9/common/vp9_quant_common.h"
27
#include "vp9/common/vp9_reconintra.h"
Dmitry Kovalev's avatar
Dmitry Kovalev committed
28
#include "vp9/common/vp9_reconinter.h"
29
#include "vp9/common/vp9_seg_common.h"
30
#include "vp9/common/vp9_systemdependent.h"
31
#include "vp9/common/vp9_tile_common.h"
32

33
#include "vp9/encoder/vp9_aq_complexity.h"
Marco Paniconi's avatar
Marco Paniconi committed
34
35
#include "vp9/encoder/vp9_aq_cyclicrefresh.h"
#include "vp9/encoder/vp9_aq_variance.h"
Dmitry Kovalev's avatar
Dmitry Kovalev committed
36
37
38
#include "vp9/encoder/vp9_encodeframe.h"
#include "vp9/encoder/vp9_encodemb.h"
#include "vp9/encoder/vp9_encodemv.h"
39
#include "vp9/encoder/vp9_extend.h"
40
#include "vp9/encoder/vp9_pickmode.h"
Dmitry Kovalev's avatar
Dmitry Kovalev committed
41
42
#include "vp9/encoder/vp9_rdopt.h"
#include "vp9/encoder/vp9_segmentation.h"
43
#include "vp9/encoder/vp9_tokenize.h"
44

45
46
47
48
49
50
// Per-category zero-bin boost constants; every one of them is currently 0.
// NOTE(review): none of these are referenced in the visible part of this
// file - confirm they are still needed.
#define GF_ZEROMV_ZBIN_BOOST 0
#define LF_ZEROMV_ZBIN_BOOST 0
#define MV_ZBIN_BOOST        0
#define SPLIT_MV_ZBIN_BOOST  0
#define INTRA_ZBIN_BOOST     0

Jim Bankoski's avatar
Jim Bankoski committed
51
static void encode_superblock(VP9_COMP *cpi, TOKENEXTRA **t, int output_enabled,
52
53
                              int mi_row, int mi_col, BLOCK_SIZE bsize,
                              PICK_MODE_CONTEXT *ctx);
54

55
// Motion vector component magnitude threshold for defining fast motion.
56
#define FAST_MOTION_MV_THRESH 24
57

58
59
60
61
// This is used as a reference when computing the source variance for the
//  purposes of activity masking.
// Eventually this should be replaced by custom no-reference routines,
//  which will be faster.
62
63
64
65
66
67
68
69
70
71
72
// 64 samples, all 128. Callers in this file pass it as the reference block
// with a stride of 0, so the same 64 values stand in for every row.
static const uint8_t VP9_VAR_OFFS[64] = {
  128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128,
  128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128,
  128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128,
  128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128, 128
};

73
74
75
76
77
78
79
80
81
82
83
84
// Forwards to variance() with a fixed 8x8 block size. The results are
// written through `sse` and `sum`.
static void get_sse_sum_8x8(const uint8_t *src, int src_stride,
                            const uint8_t *ref, int ref_stride,
                            unsigned int *sse, int *sum) {
  const int block_dim = 8;
  variance(src, src_stride, ref, ref_stride, block_dim, block_dim, sse, sum);
}

// Forwards to variance() with a fixed 16x16 block size. The results are
// written through `sse` and `sum`.
static void get_sse_sum_16x16(const uint8_t *src, int src_stride,
                              const uint8_t *ref, int ref_stride,
                              unsigned int *sse, int *sum) {
  const int block_dim = 16;
  variance(src, src_stride, ref, ref_stride, block_dim, block_dim, sse, sum);
}

85
static unsigned int get_sby_perpixel_variance(VP9_COMP *cpi,
86
                                              const struct buf_2d *ref,
87
                                              BLOCK_SIZE bs) {
88
89
90
  unsigned int sse;
  const unsigned int var = cpi->fn_ptr[bs].vf(ref->buf, ref->stride,
                                              VP9_VAR_OFFS, 0, &sse);
91
  return ROUND_POWER_OF_TWO(var, num_pels_log2_lookup[bs]);
92
93
}

94
static unsigned int get_sby_perpixel_diff_variance(VP9_COMP *cpi,
95
96
                                                   const struct buf_2d *ref,
                                                   int mi_row, int mi_col,
97
                                                   BLOCK_SIZE bs) {
98
99
100
101
102
103
  const YV12_BUFFER_CONFIG *last = get_ref_frame_buffer(cpi, LAST_FRAME);
  const uint8_t* last_y = &last->y_buffer[mi_row * MI_SIZE * last->y_stride +
                                              mi_col * MI_SIZE];
  unsigned int sse;
  const unsigned int var = cpi->fn_ptr[bs].vf(ref->buf, ref->stride,
                                              last_y, last->y_stride, &sse);
104
105
106
107
108
109
  return ROUND_POWER_OF_TWO(var, num_pels_log2_lookup[bs]);
}

// Maps the 64x64 source-vs-last-frame per-pixel variance to a fixed block
// size: the smaller the variance, the larger the block.
static BLOCK_SIZE get_rd_var_based_fixed_partition(VP9_COMP *cpi,
                                                   int mi_row,
                                                   int mi_col) {
  const unsigned int diff_var =
      get_sby_perpixel_diff_variance(cpi, &cpi->mb.plane[0].src,
                                     mi_row, mi_col, BLOCK_64X64);

  if (diff_var < 8)
    return BLOCK_64X64;
  if (diff_var < 128)
    return BLOCK_32X32;
  if (diff_var < 2048)
    return BLOCK_16X16;
  return BLOCK_8X8;
}

123
124
125
// Same idea as the RD variant, but with tighter thresholds and never
// choosing a block smaller than 16x16.
static BLOCK_SIZE get_nonrd_var_based_fixed_partition(VP9_COMP *cpi,
                                                      int mi_row,
                                                      int mi_col) {
  const unsigned int diff_var =
      get_sby_perpixel_diff_variance(cpi, &cpi->mb.plane[0].src,
                                     mi_row, mi_col, BLOCK_64X64);

  if (diff_var < 4)
    return BLOCK_64X64;
  if (diff_var < 10)
    return BLOCK_32X32;
  return BLOCK_16X16;
}

137
138
// Lighter version of set_offsets that only sets the mode info
// pointers.
139
static INLINE void set_modeinfo_offsets(VP9_COMMON *const cm,
140
141
142
                                        MACROBLOCKD *const xd,
                                        int mi_row,
                                        int mi_col) {
143
144
145
  const int idx_str = xd->mi_stride * mi_row + mi_col;
  xd->mi = cm->mi_grid_visible + idx_str;
  xd->mi[0] = cm->mi + idx_str;
146
147
}

Alex Converse's avatar
Alex Converse committed
148
static int is_block_in_mb_map(const VP9_COMP *cpi, int mi_row, int mi_col,
149
                              BLOCK_SIZE bsize) {
Alex Converse's avatar
Alex Converse committed
150
  const VP9_COMMON *const cm = &cpi->common;
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
  const int mb_rows = cm->mb_rows;
  const int mb_cols = cm->mb_cols;
  const int mb_row = mi_row >> 1;
  const int mb_col = mi_col >> 1;
  const int mb_width = num_8x8_blocks_wide_lookup[bsize] >> 1;
  const int mb_height = num_8x8_blocks_high_lookup[bsize] >> 1;
  int r, c;
  if (bsize <= BLOCK_16X16) {
    return cpi->active_map[mb_row * mb_cols + mb_col];
  }
  for (r = 0; r < mb_height; ++r) {
    for (c = 0; c < mb_width; ++c) {
      int row = mb_row + r;
      int col = mb_col + c;
      if (row >= mb_rows || col >= mb_cols)
        continue;
      if (cpi->active_map[row * mb_cols + col])
        return 1;
    }
  }
  return 0;
}

Alex Converse's avatar
Alex Converse committed
174
175
176
177
178
179
180
181
182
183
// Returns 1 unless the active map is enabled for a non-lossless encode, in
// which case the answer comes from is_block_in_mb_map().
static int check_active_map(const VP9_COMP *cpi, const MACROBLOCK *x,
                            int mi_row, int mi_col,
                            BLOCK_SIZE bsize) {
  if (!cpi->active_map_enabled || x->e_mbd.lossless)
    return 1;

  return is_block_in_mb_map(cpi, mi_row, mi_col, bsize);
}

184
185
186
187
188
189
190
191
192
193
// Prepares the encoder's macroblock state (cpi->mb and its e_mbd) for the
// block of size `bsize` at (mi_row, mi_col): mode-info pointers, destination
// and source plane pointers, motion-vector limits, edge distances, RD
// constants, segment id and encode breakout.
static void set_offsets(VP9_COMP *cpi, const TileInfo *const tile,
                        int mi_row, int mi_col, BLOCK_SIZE bsize) {
  VP9_COMMON *const cm = &cpi->common;
  MACROBLOCK *const x = &cpi->mb;
  MACROBLOCKD *const xd = &x->e_mbd;
  const struct segmentation *const seg = &cm->seg;
  const int blk_cols = num_8x8_blocks_wide_lookup[bsize];
  const int blk_rows = num_8x8_blocks_high_lookup[bsize];
  MB_MODE_INFO *mbmi;

  set_skip_context(xd, mi_row, mi_col);

  // Record whether this block is covered by the active map.
  x->in_active_map = check_active_map(cpi, x, mi_row, mi_col, bsize);

  set_modeinfo_offsets(cm, xd, mi_row, mi_col);
  mbmi = &xd->mi[0]->mbmi;

  // Set up destination pointers.
  vp9_setup_dst_planes(xd, get_frame_new_buffer(cm), mi_row, mi_col);

  // Set up limit values for MV components.
  // Mv beyond the range do not produce new/different prediction block.
  x->mv_row_min = -((mi_row + blk_rows) * MI_SIZE + VP9_INTERP_EXTEND);
  x->mv_col_min = -((mi_col + blk_cols) * MI_SIZE + VP9_INTERP_EXTEND);
  x->mv_row_max = (cm->mi_rows - mi_row) * MI_SIZE + VP9_INTERP_EXTEND;
  x->mv_col_max = (cm->mi_cols - mi_col) * MI_SIZE + VP9_INTERP_EXTEND;

  // Set up distance of MB to edge of frame in 1/8th pel units.
  // The block position must be aligned to its own size.
  assert(!(mi_col & (blk_cols - 1)) && !(mi_row & (blk_rows - 1)));
  set_mi_row_col(xd, tile, mi_row, blk_rows, mi_col, blk_cols,
                 cm->mi_rows, cm->mi_cols);

  // Set up source buffers.
  vp9_setup_src_planes(x, cpi->Source, mi_row, mi_col);

  // R/D setup.
  x->rddiv = cpi->rd.RDDIV;
  x->rdmult = cpi->rd.RDMULT;

  // Setup segment ID.
  if (!seg->enabled) {
    mbmi->segment_id = 0;
    x->encode_breakout = cpi->encode_breakout;
    return;
  }

  // With VARIANCE_AQ the segment id is not assigned here.
  if (cpi->oxcf.aq_mode != VARIANCE_AQ) {
    const uint8_t *const seg_map = seg->update_map ? cpi->segmentation_map
                                                   : cm->last_frame_seg_map;
    mbmi->segment_id = vp9_get_segment_id(cm, seg_map, bsize, mi_row, mi_col);
  }
  vp9_init_plane_quantizers(cpi, x);
  x->encode_breakout = cpi->segment_encode_breakout[mbmi->segment_id];
}

241
static void duplicate_mode_info_in_sb(VP9_COMMON * const cm,
242
243
244
245
246
247
248
249
250
251
                                     MACROBLOCKD *const xd,
                                     int mi_row,
                                     int mi_col,
                                     BLOCK_SIZE bsize) {
  const int block_width = num_8x8_blocks_wide_lookup[bsize];
  const int block_height = num_8x8_blocks_high_lookup[bsize];
  int i, j;
  for (j = 0; j < block_height; ++j)
    for (i = 0; i < block_width; ++i) {
      if (mi_row + j < cm->mi_rows && mi_col + i < cm->mi_cols)
252
        xd->mi[j * xd->mi_stride + i] = xd->mi[0];
253
254
255
256
257
258
259
260
261
262
    }
}

// Records `bsize` as the block size at (mi_row, mi_col) and propagates the
// mode-info pointer across the block. Does nothing when the position lies
// outside the frame. `tile` is not used.
static void set_block_size(VP9_COMP * const cpi,
                           const TileInfo *const tile,
                           int mi_row, int mi_col,
                           BLOCK_SIZE bsize) {
  VP9_COMMON *const cm = &cpi->common;
  MACROBLOCKD *xd;

  if (mi_col >= cm->mi_cols || mi_row >= cm->mi_rows)
    return;

  xd = &cpi->mb.e_mbd;
  set_modeinfo_offsets(cm, xd, mi_row, mi_col);
  xd->mi[0]->mbmi.sb_type = bsize;
  duplicate_mode_info_in_sb(cm, xd, mi_row, mi_col, bsize);
}

// Accumulated error statistics for one region, plus the variance derived
// from them by fill_variance().
typedef struct {
  int64_t sum_square_error;  // Sum of squared errors.
  int64_t sum_error;         // Sum of errors.
  int count;                 // Number of samples accumulated.
  int variance;              // 256 * (sse - sum^2 / count) / count; 0 if count <= 0.
} var;

// Variances of one block under each candidate partitioning, as filled in by
// fill_variance_tree() from the block's four children.
typedef struct {
  var none;     // Whole block (vert[0] + vert[1]).
  var horz[2];  // Children 0+1 and children 2+3.
  var vert[2];  // Children 0+2 and children 1+3.
} partition_variance;

// Lowest level of the variance tree: its four children are plain `var`
// entries rather than further tree nodes.
typedef struct {
  partition_variance part_variances;
  var split[4];
} v8x8;

// Variance tree node whose four children are v8x8 nodes.
typedef struct {
  partition_variance part_variances;
  v8x8 split[4];
} v16x16;

// Variance tree node whose four children are v16x16 nodes.
typedef struct {
  partition_variance part_variances;
  v16x16 split[4];
} v32x32;

// Root of the variance tree; its four children are v32x32 nodes.
typedef struct {
  partition_variance part_variances;
  v32x32 split[4];
} v64x64;

// Size-independent view of one tree node, populated by tree_to_node():
// pointers to the node's own partition variances and to the whole-block
// `var` of each of its four children.
typedef struct {
  partition_variance *part_variances;
  var *split[4];
} variance_node;

// Identifiers for the levels of the variance tree.
// NOTE(review): not referenced in the visible part of this file - confirm
// it is still used.
typedef enum {
  V16X16,
  V32X32,
  V64X64,
} TREE_LEVEL;

// Fills `node` with pointers into the tree level that `data` points to.
// `bsize` selects how `data` is interpreted (v64x64, v32x32, v16x16 or
// v8x8). Any other size trips the assert and leaves `node` untouched.
static void tree_to_node(void *data, BLOCK_SIZE bsize, variance_node *node) {
  int child;

  if (bsize == BLOCK_64X64) {
    v64x64 *const tree = (v64x64 *) data;
    node->part_variances = &tree->part_variances;
    for (child = 0; child < 4; ++child)
      node->split[child] = &tree->split[child].part_variances.none;
  } else if (bsize == BLOCK_32X32) {
    v32x32 *const tree = (v32x32 *) data;
    node->part_variances = &tree->part_variances;
    for (child = 0; child < 4; ++child)
      node->split[child] = &tree->split[child].part_variances.none;
  } else if (bsize == BLOCK_16X16) {
    v16x16 *const tree = (v16x16 *) data;
    node->part_variances = &tree->part_variances;
    for (child = 0; child < 4; ++child)
      node->split[child] = &tree->split[child].part_variances.none;
  } else if (bsize == BLOCK_8X8) {
    // Lowest level: the children are the `var` entries themselves.
    v8x8 *const tree = (v8x8 *) data;
    node->part_variances = &tree->part_variances;
    for (child = 0; child < 4; ++child)
      node->split[child] = &tree->split[child];
  } else {
    assert(0);
  }
}

// Stores the accumulators (sum of squared errors `s2`, sum of errors `s`,
// sample count `c`) in *v and derives the variance from them, scaled by 256.
// A non-positive count yields a variance of 0.
static void fill_variance(int64_t s2, int64_t s, int c, var *v) {
  v->sum_square_error = s2;
  v->sum_error = s;
  v->count = c;
  v->variance = 0;

  if (c > 0) {
    const int64_t sq_sum_over_count = s * s / c;
    v->variance = (int)(256 * (s2 - sq_sum_over_count) / c);
  }
}

// Combines the accumulators of `a` and `b` and writes the merged statistics,
// with the recomputed variance, to `r`.
void sum_2_variances(const var *a, const var *b, var *r) {
  const int64_t total_sq_error = a->sum_square_error + b->sum_square_error;
  const int64_t total_error = a->sum_error + b->sum_error;
  const int total_count = a->count + b->count;

  fill_variance(total_sq_error, total_error, total_count, r);
}

// Derives the horz/vert/none partition variances of the node at `data`
// (interpreted according to `bsize`) from its four children.
static void fill_variance_tree(void *data, BLOCK_SIZE bsize) {
  variance_node node;
  partition_variance *pv;

  tree_to_node(data, bsize, &node);
  pv = node.part_variances;

  sum_2_variances(node.split[0], node.split[1], &pv->horz[0]);
  sum_2_variances(node.split[2], node.split[3], &pv->horz[1]);
  sum_2_variances(node.split[0], node.split[2], &pv->vert[0]);
  sum_2_variances(node.split[1], node.split[3], &pv->vert[1]);
  // The whole block is the sum of the two vert halves.
  sum_2_variances(&pv->vert[0], &pv->vert[1], &pv->none);
}

// Tries to settle the partitioning of the square `bsize` block at
// (mi_row, mi_col) without splitting it into four: first as a single block,
// then as a PARTITION_VERT pair, then as a PARTITION_HORZ pair. A candidate
// is accepted when its variances are below 25 * base_qindex.
// Returns 1 if block sizes were set, 0 if the caller must split further.
// `mi_size` is not used.
static int set_vt_partitioning(VP9_COMP *cpi,
                               void *data,
                               const TileInfo *const tile,
                               BLOCK_SIZE bsize,
                               int mi_row,
                               int mi_col,
                               int mi_size) {
  VP9_COMMON * const cm = &cpi->common;
  const int block_width = num_8x8_blocks_wide_lookup[bsize];
  const int block_height = num_8x8_blocks_high_lookup[bsize];
  const int half_width = block_width / 2;
  const int half_height = block_height / 2;
  // TODO(debargha): Choose this more intelligently.
  const int64_t threshold_multiplier = 25;
  const int64_t threshold = threshold_multiplier * cm->base_qindex;
  // Whether the block's mid column / mid row is inside the visible image.
  const int mid_col_visible = mi_col + half_width < cm->mi_cols;
  const int mid_row_visible = mi_row + half_height < cm->mi_rows;
  variance_node vt;
  const partition_variance *pv;
  BLOCK_SIZE subsize;

  assert(block_height == block_width);

  tree_to_node(data, bsize, &vt);
  pv = vt.part_variances;

  // Split none is available only if we have more than half a block size
  // in width and height inside the visible image.
  if (mid_col_visible && mid_row_visible && pv->none.variance < threshold) {
    set_block_size(cpi, tile, mi_row, mi_col, bsize);
    return 1;
  }

  // Vertical split is available on all but the bottom border.
  if (mid_row_visible &&
      pv->vert[0].variance < threshold &&
      pv->vert[1].variance < threshold) {
    subsize = get_subsize(bsize, PARTITION_VERT);
    set_block_size(cpi, tile, mi_row, mi_col, subsize);
    set_block_size(cpi, tile, mi_row, mi_col + half_width, subsize);
    return 1;
  }

  // Horizontal split is available on all but the right border.
  if (mid_col_visible &&
      pv->horz[0].variance < threshold &&
      pv->horz[1].variance < threshold) {
    subsize = get_subsize(bsize, PARTITION_HORZ);
    set_block_size(cpi, tile, mi_row, mi_col, subsize);
    set_block_size(cpi, tile, mi_row + half_height, mi_col, subsize);
    return 1;
  }

  return 0;
}

// TODO(debargha): Fix this function and make it work as expected.
//
// Chooses block sizes for the 64x64 superblock at (mi_row, mi_col) from a
// tree of 8x8 variances:
//   1. On non-key frames, build a 64x64 inter prediction from LAST_FRAME
//      using the nearest reference MV; on key frames use the flat
//      VP9_VAR_OFFS reference (stride 0) instead.
//   2. Measure sse/sum of source vs. that reference for every 8x8 block that
//      starts inside the frame, then sum upwards to 16x16, 32x32 and 64x64.
//   3. Walk the tree top-down with set_vt_partitioning(), descending only
//      where a level's variance is too high.
static void choose_partitioning(VP9_COMP *cpi,
                                const TileInfo *const tile,
                                int mi_row, int mi_col) {
  VP9_COMMON * const cm = &cpi->common;
  MACROBLOCK *x = &cpi->mb;
  MACROBLOCKD *xd = &cpi->mb.e_mbd;

  int i, j, k;
  v64x64 vt;
  uint8_t *s;        // Source luma.
  const uint8_t *d;  // Reference (prediction or flat block).
  int sp;            // Source stride.
  int dp;            // Reference stride.
  int pixels_wide = 64, pixels_high = 64;
  int_mv nearest_mv, near_mv;
  const YV12_BUFFER_CONFIG *yv12 = get_ref_frame_buffer(cpi, LAST_FRAME);
  const struct scale_factors *const sf = &cm->frame_refs[LAST_FRAME - 1].sf;

  vp9_zero(vt);
  set_offsets(cpi, tile, mi_row, mi_col, BLOCK_64X64);

  // Clip the measured area to the frame; the edge distances are in 1/8 pel,
  // hence the >> 3.
  if (xd->mb_to_right_edge < 0)
    pixels_wide += (xd->mb_to_right_edge >> 3);
  if (xd->mb_to_bottom_edge < 0)
    pixels_high += (xd->mb_to_bottom_edge >> 3);

  s = x->plane[0].src.buf;
  sp = x->plane[0].src.stride;

  if (cm->frame_type != KEY_FRAME) {
    vp9_setup_pre_planes(xd, 0, yv12, mi_row, mi_col, sf);

    xd->mi[0]->mbmi.ref_frame[0] = LAST_FRAME;
    xd->mi[0]->mbmi.sb_type = BLOCK_64X64;
    vp9_find_best_ref_mvs(xd, cm->allow_high_precision_mv,
                          xd->mi[0]->mbmi.ref_mvs[LAST_FRAME],
                          &nearest_mv, &near_mv);

    xd->mi[0]->mbmi.mv[0] = nearest_mv;
    vp9_build_inter_predictors_sby(xd, mi_row, mi_col, BLOCK_64X64);

    d = xd->plane[0].dst.buf;
    dp = xd->plane[0].dst.stride;
  } else {
    d = VP9_VAR_OFFS;
    dp = 0;
  }

  // Fill in the entire tree of 8x8 variances for splits.
  for (i = 0; i < 4; i++) {
    const int x32_idx = ((i & 1) << 5);
    const int y32_idx = ((i >> 1) << 5);
    for (j = 0; j < 4; j++) {
      const int x16_idx = x32_idx + ((j & 1) << 4);
      const int y16_idx = y32_idx + ((j >> 1) << 4);
      v16x16 *vst = &vt.split[i].split[j];
      for (k = 0; k < 4; k++) {
        int x_idx = x16_idx + ((k & 1) << 3);
        int y_idx = y16_idx + ((k >> 1) << 3);
        unsigned int sse = 0;
        int sum = 0;
        // 8x8 blocks starting outside the frame contribute zero error.
        if (x_idx < pixels_wide && y_idx < pixels_high)
          get_sse_sum_8x8(s + y_idx * sp + x_idx, sp,
                          d + y_idx * dp + x_idx, dp, &sse, &sum);
        fill_variance(sse, sum, 64, &vst->split[k].part_variances.none);
      }
    }
  }
  // Fill the rest of the variance tree by summing split partition values.
  for (i = 0; i < 4; i++) {
    for (j = 0; j < 4; j++) {
      fill_variance_tree(&vt.split[i].split[j], BLOCK_16X16);
    }
    fill_variance_tree(&vt.split[i], BLOCK_32X32);
  }
  fill_variance_tree(&vt, BLOCK_64X64);

  // Now go through the entire structure,  splitting every block size until
  // we get to one that's got a variance lower than our threshold,  or we
  // hit 8x8.
  if (!set_vt_partitioning(cpi, &vt, tile, BLOCK_64X64,
                           mi_row, mi_col, 8)) {
    for (i = 0; i < 4; ++i) {
      // From here on the offsets are in mode-info (8x8) units.
      const int x32_idx = ((i & 1) << 2);
      const int y32_idx = ((i >> 1) << 2);
      if (!set_vt_partitioning(cpi, &vt.split[i], tile, BLOCK_32X32,
                               (mi_row + y32_idx), (mi_col + x32_idx), 4)) {
        for (j = 0; j < 4; ++j) {
          const int x16_idx = ((j & 1) << 1);
          const int y16_idx = ((j >> 1) << 1);
          // NOTE: This is a temporary hack to disable 8x8 partitions,
          // since it works really bad - possibly due to a bug
#define DISABLE_8X8_VAR_BASED_PARTITION
#ifdef DISABLE_8X8_VAR_BASED_PARTITION
          // Use 16x16 only when the whole 16x16 block is inside the frame.
          // The column test must be based on mi_col (it previously used
          // mi_row, which compared the wrong coordinate against mi_cols).
          if (mi_row + y32_idx + y16_idx + 1 < cm->mi_rows &&
              mi_col + x32_idx + x16_idx + 1 < cm->mi_cols) {
            set_block_size(cpi, tile,
                           (mi_row + y32_idx + y16_idx),
                           (mi_col + x32_idx + x16_idx),
                           BLOCK_16X16);
          } else {
            for (k = 0; k < 4; ++k) {
              const int x8_idx = (k & 1);
              const int y8_idx = (k >> 1);
              set_block_size(cpi, tile,
                             (mi_row + y32_idx + y16_idx + y8_idx),
                             (mi_col + x32_idx + x16_idx + x8_idx),
                             BLOCK_8X8);
            }
          }
#else
          if (!set_vt_partitioning(cpi, &vt.split[i].split[j], tile,
                                   BLOCK_16X16,
                                   (mi_row + y32_idx + y16_idx),
                                   (mi_col + x32_idx + x16_idx), 2)) {
            for (k = 0; k < 4; ++k) {
              const int x8_idx = (k & 1);
              const int y8_idx = (k >> 1);
              set_block_size(cpi, tile,
                             (mi_row + y32_idx + y16_idx + y8_idx),
                             (mi_col + x32_idx + x16_idx + x8_idx),
                             BLOCK_8X8);
            }
          }
#endif
        }
      }
    }
  }
}

559
// Original activity measure from Tim T's code.
560
static unsigned int tt_activity_measure(MACROBLOCK *x) {
John Koleszar's avatar
John Koleszar committed
561
  unsigned int sse;
562
563
564
565
566
567
568
569
570
  // TODO: This could also be done over smaller areas (8x8), but that would
  // require extensive changes elsewhere, as lambda is assumed to be fixed
  // over an entire MB in most of the code.
  // Another option is to compute four 8x8 variances, and pick a single
  // lambda using a non-linear combination (e.g., the smallest, or second
  // smallest, etc.).
  const unsigned int act = vp9_variance16x16(x->plane[0].src.buf,
                                             x->plane[0].src.stride,
                                             VP9_VAR_OFFS, 0, &sse) << 4;
571
  // If the region is flat, lower the activity some more.
572
  return act < (8 << 12) ? MIN(act, 5 << 12) : act;
573
574
}

Jim Bankoski's avatar
Jim Bankoski committed
575
// Commits the mode decision stored in `ctx` for the `bsize` block at
// (mi_row, mi_col) into the encoder state: copies the chosen MODE_INFO into
// the frame's mode-info storage, selects the coefficient buffers, propagates
// the mode-info pointer across the block and restores the skip and
// zcoeff_blk state. When `output_enabled` is non-zero it also updates
// segment ids and the frame-level RD / mode statistics.
static void update_state(VP9_COMP *cpi, PICK_MODE_CONTEXT *ctx,
                         int mi_row, int mi_col, BLOCK_SIZE bsize,
                         int output_enabled) {
  VP9_COMMON *const cm = &cpi->common;
  RD_OPT *const rd_opt = &cpi->rd;
  MACROBLOCK *const x = &cpi->mb;
  MACROBLOCKD *const xd = &x->e_mbd;
  struct macroblock_plane *const p = x->plane;
  struct macroblockd_plane *const pd = xd->plane;
  const struct segmentation *const seg = &cm->seg;
  MODE_INFO *mi = &ctx->mic;
  MODE_INFO *mi_addr = xd->mi[0];
  MB_MODE_INFO *const mbmi = &mi_addr->mbmi;
  const int mis = cm->mi_stride;
  const int mi_width = num_8x8_blocks_wide_lookup[bsize];
  const int mi_height = num_8x8_blocks_high_lookup[bsize];
  int i, row, col;
  int max_plane;

  assert(mi->mbmi.sb_type == bsize);

  *mi_addr = *mi;

  // If segmentation in use
  if (seg->enabled && output_enabled) {
    if (cpi->oxcf.aq_mode == COMPLEXITY_AQ) {
      // For in frame complexity AQ copy the segment id from the segment map.
      const uint8_t *const map = seg->update_map ? cpi->segmentation_map
                                                 : cm->last_frame_seg_map;
      mbmi->segment_id = vp9_get_segment_id(cm, map, bsize, mi_row, mi_col);
    } else if (cpi->oxcf.aq_mode == CYCLIC_REFRESH_AQ) {
      // Else for cyclic refresh mode update the segment map, set the segment
      // id and then update the quantizer.
      vp9_cyclic_refresh_update_segment(cpi, mbmi, mi_row, mi_col, bsize, 1);
      vp9_init_plane_quantizers(cpi, x);
    }
  }

  // The first `max_plane` planes take buffer set 1 of the context and the
  // remaining planes take buffer set 2.
  max_plane = is_inter_block(mbmi) ? MAX_MB_PLANE : 1;
  for (i = 0; i < MAX_MB_PLANE; ++i) {
    const int buf_idx = (i < max_plane) ? 1 : 2;
    p[i].coeff = ctx->coeff_pbuf[i][buf_idx];
    p[i].qcoeff = ctx->qcoeff_pbuf[i][buf_idx];
    pd[i].dqcoeff = ctx->dqcoeff_pbuf[i][buf_idx];
    p[i].eobs = ctx->eobs_pbuf[i][buf_idx];
  }

  // Restore the coding context of the MB to that that was in place
  // when the mode was picked for it
  {
    // Number of mode-info columns / rows of this block inside the frame.
    const int cols_in_frame =
        (xd->mb_to_right_edge >> (3 + MI_SIZE_LOG2)) + mi_width;
    const int rows_in_frame =
        (xd->mb_to_bottom_edge >> (3 + MI_SIZE_LOG2)) + mi_height;
    for (row = 0; row < mi_height; row++) {
      for (col = 0; col < mi_width; col++) {
        if (cols_in_frame > col && rows_in_frame > row)
          xd->mi[col + row * mis] = mi_addr;
      }
    }
  }

  if (cpi->oxcf.aq_mode)
    vp9_init_plane_quantizers(cpi, x);

  // FIXME(rbultje) I'm pretty sure this should go to the end of this block
  // (i.e. after the output_enabled)
  if (bsize < BLOCK_32X32) {
    if (bsize < BLOCK_16X16)
      ctx->tx_rd_diff[ALLOW_16X16] = ctx->tx_rd_diff[ALLOW_8X8];
    ctx->tx_rd_diff[ALLOW_32X32] = ctx->tx_rd_diff[ALLOW_16X16];
  }

  // For sub-8x8 inter blocks the block-level MVs are taken from bmi[3].
  if (is_inter_block(mbmi) && mbmi->sb_type < BLOCK_8X8) {
    mbmi->mv[0].as_int = mi->bmi[3].as_mv[0].as_int;
    mbmi->mv[1].as_int = mi->bmi[3].as_mv[1].as_int;
  }

  x->skip = ctx->skip;
  vpx_memcpy(x->zcoeff_blk[mbmi->tx_size], ctx->zcoeff_blk,
             sizeof(uint8_t) * ctx->num_4x4_blk);

  // Everything below only updates frame-level statistics.
  if (!output_enabled)
    return;

  if (!vp9_segfeature_active(&cm->seg, mbmi->segment_id, SEG_LVL_SKIP)) {
    for (i = 0; i < TX_MODES; i++)
      rd_opt->tx_select_diff[i] += ctx->tx_rd_diff[i];
  }

#if CONFIG_INTERNAL_STATS
  if (frame_is_intra_only(cm)) {
    static const int kf_mode_index[] = {
      THR_DC        /*DC_PRED*/,
      THR_V_PRED    /*V_PRED*/,
      THR_H_PRED    /*H_PRED*/,
      THR_D45_PRED  /*D45_PRED*/,
      THR_D135_PRED /*D135_PRED*/,
      THR_D117_PRED /*D117_PRED*/,
      THR_D153_PRED /*D153_PRED*/,
      THR_D207_PRED /*D207_PRED*/,
      THR_D63_PRED  /*D63_PRED*/,
      THR_TM        /*TM_PRED*/,
    };
    ++cpi->mode_chosen_counts[kf_mode_index[mbmi->mode]];
  } else {
    // Note how often each mode chosen as best
    ++cpi->mode_chosen_counts[ctx->best_mode_index];
  }
#endif
  if (!frame_is_intra_only(cm)) {
    if (is_inter_block(mbmi)) {
      vp9_update_mv_count(cm, xd);

      if (cm->interp_filter == SWITCHABLE) {
        const int interp_ctx = vp9_get_pred_context_switchable_interp(xd);
        ++cm->counts.switchable_interp[interp_ctx][mbmi->interp_filter];
      }
    }

    rd_opt->comp_pred_diff[SINGLE_REFERENCE] += ctx->single_pred_diff;
    rd_opt->comp_pred_diff[COMPOUND_REFERENCE] += ctx->comp_pred_diff;
    rd_opt->comp_pred_diff[REFERENCE_MODE_SELECT] += ctx->hybrid_pred_diff;

    for (i = 0; i < SWITCHABLE_FILTER_CONTEXTS; ++i)
      rd_opt->filter_diff[i] += ctx->best_filter_diff[i];
  }
}

Jim Bankoski's avatar
Jim Bankoski committed
708
// Records `src` as the current frame buffer and points the source buffer of
// each of the MAX_MB_PLANE planes at position (mi_row, mi_col) of `src`,
// using that plane's subsampling. The alpha entries are listed in the
// tables, but the loop only covers the first MAX_MB_PLANE planes.
void vp9_setup_src_planes(MACROBLOCK *x, const YV12_BUFFER_CONFIG *src,
                          int mi_row, int mi_col) {
  uint8_t *const plane_bufs[4] = {src->y_buffer, src->u_buffer, src->v_buffer,
                                  src->alpha_buffer};
  const int plane_strides[4] = {src->y_stride, src->uv_stride, src->uv_stride,
                                src->alpha_stride};
  int plane;

  // Set current frame pointer.
  x->e_mbd.cur_buf = src;

  for (plane = 0; plane < MAX_MB_PLANE; plane++) {
    const struct macroblockd_plane *const pd = &x->e_mbd.plane[plane];
    setup_pred_plane(&x->plane[plane].src, plane_bufs[plane],
                     plane_strides[plane], mi_row, mi_col,
                     NULL, pd->subsampling_x, pd->subsampling_y);
  }
}

725
726
727
728
// Runs the rate-distortion mode search for the block of size |bsize| located
// at (mi_row, mi_col) and returns the resulting rate and distortion through
// |totalrate| and |totaldist|. The per-block search buffers are taken from
// |ctx|.
//
// For sub-8x8 block sizes only the call with block == 0 does any work; every
// other call reports zero rate/distortion and returns immediately.
//
// x->rdmult may be adjusted for the duration of the search depending on the
// adaptive-quantization mode, and is always restored before returning.
static void rd_pick_sb_modes(VP9_COMP *cpi, const TileInfo *const tile,
                             int mi_row, int mi_col,
                             int *totalrate, int64_t *totaldist,
                             BLOCK_SIZE bsize, PICK_MODE_CONTEXT *ctx,
                             int64_t best_rd, int block) {
  VP9_COMMON *const cm = &cpi->common;
  MACROBLOCK *const x = &cpi->mb;
  MACROBLOCKD *const xd = &x->e_mbd;
  struct macroblock_plane *const p = x->plane;
  struct macroblockd_plane *const pd = xd->plane;
  const AQ_MODE aq_mode = cpi->oxcf.aq_mode;
  MB_MODE_INFO *mbmi;
  int plane, saved_rdmult;
  double rdmult_ratio;

  // Keep the floating-point assignment after the system-state reset, exactly
  // as the statement order requires.
  vp9_clear_system_state();
  rdmult_ratio = 1.0;  // avoid uninitialized warnings

  // Use the lower precision, but faster, 32x32 fdct for mode selection.
  x->use_lp32x32fdct = 1;

  // TODO(JBB): Most other places in the code instead of calling the function
  // and then checking if its not the first 8x8 we put the check in the
  // calling function.  Do that here.
  //
  // When block == 0 all sub-blocks are handled, so for block != 0 there is
  // nothing to be done.
  if (bsize < BLOCK_8X8 && block != 0) {
    *totalrate = 0;
    *totaldist = 0;
    return;
  }

  set_offsets(cpi, tile, mi_row, mi_col, bsize);
  mbmi = &xd->mi[0]->mbmi;
  mbmi->sb_type = bsize;

  // Route the coefficient buffers of every plane to the first buffer set of
  // this pick-mode context.
  for (plane = 0; plane < MAX_MB_PLANE; ++plane) {
    p[plane].coeff = ctx->coeff_pbuf[plane][0];
    p[plane].qcoeff = ctx->qcoeff_pbuf[plane][0];
    pd[plane].dqcoeff = ctx->dqcoeff_pbuf[plane][0];
    p[plane].eobs = ctx->eobs_pbuf[plane][0];
  }
  ctx->is_coded = 0;
  x->skip_recode = 0;

  // Set to zero to make sure we do not use the previous encoded frame stats
  mbmi->skip = 0;

  x->source_variance = get_sby_perpixel_variance(cpi, &x->plane[0].src, bsize);

  // Save rdmult before it might be changed, so it can be restored later.
  saved_rdmult = x->rdmult;

  if (aq_mode == VARIANCE_AQ) {
    const int energy = bsize <= BLOCK_16X16 ? x->mb_energy
                                            : vp9_block_energy(cpi, x, bsize);
    // On these frame types the segment id is derived from the block energy;
    // otherwise it is read back from a segmentation map.
    const int segment_from_energy =
        cm->frame_type == KEY_FRAME ||
        cpi->refresh_alt_ref_frame ||
        (cpi->refresh_golden_frame && !cpi->rc.is_src_frame_alt_ref);

    if (segment_from_energy) {
      mbmi->segment_id = vp9_vaq_segment_id(energy);
    } else {
      const uint8_t *const map = cm->seg.update_map ? cpi->segmentation_map
                                                    : cm->last_frame_seg_map;
      mbmi->segment_id = vp9_get_segment_id(cm, map, bsize, mi_row, mi_col);
    }

    rdmult_ratio = vp9_vaq_rdmult_ratio(energy);
    vp9_init_plane_quantizers(cpi, x);
    vp9_clear_system_state();
    x->rdmult = (int)round(x->rdmult * rdmult_ratio);
  } else if (aq_mode == COMPLEXITY_AQ) {
    const int mi_offset = mi_row * cm->mi_cols + mi_col;
    unsigned char complexity = cpi->complexity_map[mi_offset];
    // A block is interior when it is more than one mi unit away from the
    // first row/column and at least three away from the last.
    const int is_interior = (mi_row > 1) && (mi_row < (cm->mi_rows - 2)) &&
                            (mi_col > 1) && (mi_col < (cm->mi_cols - 2));

    if (is_interior && (complexity > 128))
      x->rdmult += ((x->rdmult * (complexity - 128)) / 256);
  } else if (aq_mode == CYCLIC_REFRESH_AQ) {
    const uint8_t *const map = cm->seg.update_map ? cpi->segmentation_map
                                                  : cm->last_frame_seg_map;

    // If segment 1, use rdmult for that segment.
    if (vp9_get_segment_id(cm, map, bsize, mi_row, mi_col))
      x->rdmult = vp9_cyclic_refresh_get_rdmult(cpi->cyclic_refresh);
  }

  // Find best coding mode & reconstruct the MB so it is available
  // as a predictor for MBs that follow in the SB
  if (frame_is_intra_only(cm)) {
    vp9_rd_pick_intra_mode_sb(cpi, x, totalrate, totaldist, bsize, ctx,
                              best_rd);
  } else if (bsize >= BLOCK_8X8) {
    vp9_rd_pick_inter_mode_sb(cpi, x, tile, mi_row, mi_col,
                              totalrate, totaldist, bsize, ctx, best_rd);
  } else {
    vp9_rd_pick_inter_mode_sub8x8(cpi, x, tile, mi_row, mi_col, totalrate,
                                  totaldist, bsize, ctx, best_rd);
  }

  // Undo any adaptive-quantization adjustment made above.
  x->rdmult = saved_rdmult;

  // With variance AQ the reported rate is scaled by the same ratio that was
  // applied to rdmult, unless the search reported INT_MAX.
  if (aq_mode == VARIANCE_AQ && *totalrate != INT_MAX) {
    vp9_clear_system_state();
    *totalrate = (int)round(*totalrate * rdmult_ratio);
  }
}
Adrian Grange's avatar
Adrian Grange committed
833

834
835
// Accumulates the intra/inter and reference-frame symbol counts in
// cm->counts for the block currently referenced by xd->mi[0].
//
// Nothing is counted on intra-only frames, nor when the block's segment has
// the SEG_LVL_REF_FRAME feature active.
static void update_stats(VP9_COMP *cpi) {
  VP9_COMMON *const cm = &cpi->common;
  const MACROBLOCK *const x = &cpi->mb;
  const MACROBLOCKD *const xd = &x->e_mbd;
  const MODE_INFO *const mi = xd->mi[0];
  const MB_MODE_INFO *const mbmi = &mi->mbmi;
  FRAME_COUNTS *counts;
  int inter_block;

  if (frame_is_intra_only(cm))
    return;

  // If the segment reference feature is enabled we have only a single
  // reference frame allowed for the segment so exclude it from
  // the reference frame counts used to work out probabilities.
  if (vp9_segfeature_active(&cm->seg, mbmi->segment_id, SEG_LVL_REF_FRAME))
    return;

  counts = &cm->counts;
  inter_block = is_inter_block(mbmi);

  ++counts->intra_inter[vp9_get_intra_inter_context(xd)][inter_block];

  if (inter_block) {
    const MV_REFERENCE_FRAME ref0 = mbmi->ref_frame[0];
    const int is_compound = has_second_ref(mbmi);

    // The single/compound choice is only counted when it is selectable per
    // block.
    if (cm->reference_mode == REFERENCE_MODE_SELECT)
      ++counts->comp_inter[vp9_get_reference_mode_context(cm, xd)]
                          [is_compound];

    if (is_compound) {
      ++counts->comp_ref[vp9_get_pred_context_comp_ref_p(cm, xd)]
                        [ref0 == GOLDEN_FRAME];
    } else {
      // First decision: LAST_FRAME versus anything else.
      ++counts->single_ref[vp9_get_pred_context_single_ref_p1(xd)][0]
                          [ref0 != LAST_FRAME];
      // Second decision, only when not LAST_FRAME: GOLDEN_FRAME versus the
      // remaining reference.
      if (ref0 != LAST_FRAME)
        ++counts->single_ref[vp9_get_pred_context_single_ref_p2(xd)][1]
                            [ref0 != GOLDEN_FRAME];
    }
  }
}
John Koleszar's avatar
John Koleszar committed
874

875
876
877
static void restore_context(VP9_COMP *cpi, int mi_row, int mi_col,
                            ENTROPY_CONTEXT a[16 * MAX_MB_PLANE],
                            ENTROPY_CONTEXT l[16 * MAX_MB_PLANE],
Jim Bankoski's avatar
Jim Bankoski committed
878
                            PARTITION_CONTEXT sa[8], PARTITION_CONTEXT sl[8],
879
                            BLOCK_SIZE bsize) {
Jim Bankoski's avatar
Jim Bankoski committed
880
881
  MACROBLOCK *const x = &cpi->mb;
  MACROBLOCKD *const xd = &x->e_mbd;
882
  int p;
Jim Bankoski's avatar
Jim Bankoski committed
883
884
  const int num_4x4_blocks_wide = num_4x4_blocks_wide_lookup[bsize];
  const int num_4x4_blocks_high = num_4x4_blocks_high_lookup[bsize];
Jim Bankoski's avatar
Jim Bankoski committed
885
886
  int mi_width = num_8x8_blocks_wide_lookup[bsize];
  int mi_height = num_8x8_blocks_high_lookup[bsize];
887
  for (p = 0; p < MAX_MB_PLANE; p++) {
Jim Bankoski's avatar
Jim Bankoski committed
888
    vpx_memcpy(
889
        xd->above_context[p] + ((mi_col * 2) >> xd->plane[p].subsampling_x),
Jim Bankoski's avatar
Jim Bankoski committed
890
891
892
        a + num_4x4_blocks_wide * p,
        (sizeof(ENTROPY_CONTEXT) * num_4x4_blocks_wide) >>
        xd->plane[p].subsampling_x);
Jim Bankoski's avatar
Jim Bankoski committed
893
    vpx_memcpy(
894
        xd->left_context[p]
Jim Bankoski's avatar
Jim Bankoski committed
895
896
897
898
899
            + ((mi_row & MI_MASK) * 2 >> xd->plane[p].subsampling_y),
        l + num_4x4_blocks_high * p,
        (sizeof(ENTROPY_CONTEXT) * num_4x4_blocks_high) >>
        xd->plane[p].subsampling_y);
  }
900
901
902
903
  vpx_memcpy(xd->above_seg_context + mi_col, sa,
             sizeof(*xd->above_seg_context) * mi_width);
  vpx_memcpy(xd->left_seg_context + (mi_row & MI_MASK), sl,
             sizeof(xd->left_seg_context[0]) * mi_height);
904
}
Jim Bankoski's avatar
Jim Bankoski committed
905
static void save_context(VP9_COMP *cpi, int mi_row, int mi_col,
Jim Bankoski's avatar
Jim Bankoski committed
906
907
908
                         ENTROPY_CONTEXT a[16 * MAX_MB_PLANE],
                         ENTROPY_CONTEXT l[16 * MAX_MB_PLANE],
                         PARTITION_CONTEXT sa[8], PARTITION_CONTEXT sl[8],
909
                         BLOCK_SIZE bsize) {
Jim Bankoski's avatar
Jim Bankoski committed
910
911
  const MACROBLOCK *const x = &cpi->mb;
  const MACROBLOCKD *const xd = &x->e_mbd;
Jim Bankoski's avatar
Jim Bankoski committed
912
  int p;
Jim Bankoski's avatar
Jim Bankoski committed
913
914
  const int num_4x4_blocks_wide = num_4x4_blocks_wide_lookup[bsize];
  const int num_4x4_blocks_high = num_4x4_blocks_high_lookup[bsize];
Jim Bankoski's avatar
Jim Bankoski committed
915
916
  int mi_width = num_8x8_blocks_wide_lookup[bsize];
  int mi_height = num_8x8_blocks_high_lookup[bsize];
Jim Bankoski's avatar
Jim Bankoski committed
917
918
919

  // buffer the above/left context information of the block in search.
  for (p = 0; p < MAX_MB_PLANE; ++p) {
Jim Bankoski's avatar
Jim Bankoski committed
920
    vpx_memcpy(
Jim Bankoski's avatar
Jim Bankoski committed
921
        a + num_4x4_blocks_wide * p,
922
        xd->above_context[p] + (mi_col * 2 >> xd->plane[p].subsampling_x),
Jim Bankoski's avatar
Jim Bankoski committed
923
924
        (sizeof(ENTROPY_CONTEXT) * num_4x4_blocks_wide) >>
        xd->plane[p].subsampling_x);
Jim Bankoski's avatar
Jim Bankoski committed
925
    vpx_memcpy(
Jim Bankoski's avatar
Jim Bankoski committed
926
        l + num_4x4_blocks_high * p,
927
        xd->left_context[p]
Jim Bankoski's avatar
Jim Bankoski committed
928
929
930
931
            + ((mi_row & MI_MASK) * 2 >> xd->plane[p].subsampling_y),
        (sizeof(ENTROPY_CONTEXT) * num_4x4_blocks_high) >>
        xd->plane[p].subsampling_y);
  }
932
933
934
935
  vpx_memcpy(sa, xd->above_seg_context + mi_col,
             sizeof(*xd->above_seg_context) * mi_width);
  vpx_memcpy(sl, xd->left_seg_context + (mi_row & MI_MASK),
             sizeof(xd->left_seg_context[0]) * mi_height);
Jim Bankoski's avatar
Jim Bankoski committed
936
}
937

James Zern's avatar
James Zern committed
938
939
// Encodes a single block of size |bsize| at (mi_row, mi_col) using the mode
// decision stored in |ctx|.
//
// When |output_enabled| is non-zero the frame statistics are updated as well
// and an EOSB_TOKEN is written at *tp, which is then advanced by one entry.
static void encode_b(VP9_COMP *cpi, const TileInfo *const tile,
                     TOKENEXTRA **tp, int mi_row, int mi_col,
                     int output_enabled, BLOCK_SIZE bsize,
                     PICK_MODE_CONTEXT *ctx) {
  TOKENEXTRA *end_marker;

  set_offsets(cpi, tile, mi_row, mi_col, bsize);
  update_state(cpi, ctx, mi_row, mi_col, bsize, output_enabled);
  encode_superblock(cpi, tp, output_enabled, mi_row, mi_col, bsize, ctx);

  if (!output_enabled)
    return;

  update_stats(cpi);

  // Terminate this block's token run and step past the marker.
  end_marker = *tp;
  end_marker->token = EOSB_TOKEN;
  *tp = end_marker + 1;
}

James Zern's avatar
James Zern committed
955
956
// Recursively encodes the partition tree |pc_tree| rooted at the block of
// size |bsize| at (mi_row, mi_col).
//
// Blocks whose origin lies outside the frame are skipped. For VERT/HORZ
// partitions the second half is only encoded when it starts inside the frame
// and |bsize| is larger than 8x8. A SPLIT of an 8x8 block is encoded as one
// leaf (pc_tree->leaf_split[0]); larger splits recurse into the four
// quadrants.
//
// When |output_enabled| is non-zero the partition-type counter is updated
// (except for BLOCK_4X4) and the leaf encoders emit their statistics/tokens.
static void encode_sb(VP9_COMP *cpi, const TileInfo *const tile,
                      TOKENEXTRA **tp, int mi_row, int mi_col,
                      int output_enabled, BLOCK_SIZE bsize,
                      PC_TREE *pc_tree) {
  VP9_COMMON *const cm = &cpi->common;
  MACROBLOCK *const x = &cpi->mb;
  MACROBLOCKD *const xd = &x->e_mbd;

  // hbs: half of the block size, in the units used by mi_row / mi_col.
  const int bsl = b_width_log2(bsize), hbs = (1 << bsl) / 4;
  int ctx;
  PARTITION_TYPE partition;
  BLOCK_SIZE subsize = bsize;

  if (mi_row >= cm->mi_rows || mi_col >= cm->mi_cols)
    return;

  if (bsize >= BLOCK_8X8) {
    ctx = partition_plane_context(xd, mi_row, mi_col, bsize);
    subsize = get_subsize(bsize, pc_tree->partitioning);
  } else {
    ctx = 0;
    subsize = BLOCK_4X4;
  }

  partition = partition_lookup[bsl][subsize];
  if (output_enabled && bsize != BLOCK_4X4)
    cm->counts.partition[ctx][partition]++;

  switch (partition) {
    case PARTITION_NONE:
      encode_b(cpi, tile, tp, mi_row, mi_col, output_enabled, subsize,
               &pc_tree->none);
      break;
    case PARTITION_VERT:
      encode_b(cpi, tile, tp, mi_row, mi_col, output_enabled, subsize,
               &pc_tree->vertical[0]);
      if (mi_col + hbs < cm->mi_cols && bsize > BLOCK_8X8) {
        encode_b(cpi, tile, tp, mi_row, mi_col + hbs, output_enabled, subsize,
                 &pc_tree->vertical[1]);
      }
      break;
    case PARTITION_HORZ:
      encode_b(cpi, tile, tp, mi_row, mi_col, output_enabled, subsize,
               &pc_tree->horizontal[0]);
      if (mi_row + hbs < cm->mi_rows && bsize > BLOCK_8X8) {
        encode_b(cpi, tile, tp, mi_row + hbs, mi_col, output_enabled, subsize,
                 &pc_tree->horizontal[1]);
      }
      break;
    case PARTITION_SPLIT:
      if (bsize == BLOCK_8X8) {
        encode_b(cpi, tile, tp, mi_row, mi_col, output_enabled, subsize,
                 pc_tree->leaf_split[0]);
      } else {
        encode_sb(cpi, tile, tp, mi_row, mi_col, output_enabled, subsize,
                  pc_tree->split[0]);
        encode_sb(cpi, tile, tp, mi_row, mi_col + hbs, output_enabled, subsize,
                  pc_tree->split[1]);
        encode_sb(cpi, tile, tp, mi_row + hbs, mi_col, output_enabled, subsize,
                  pc_tree->split[2]);
        encode_sb(cpi, tile, tp, mi_row + hbs, mi_col + hbs, output_enabled,
                  subsize, pc_tree->split[3]);
      }
      break;
    default:
      // A bare string literal is a non-null pointer and would make the
      // assertion always pass; "0 &&" makes it actually fire in debug builds.
      assert(0 && "Invalid partition type.");
      break;
  }

  // For splits larger than 8x8 the recursive calls above have already
  // updated the partition context of their sub-blocks.
  if (partition != PARTITION_SPLIT || bsize == BLOCK_8X8)
    update_partition_context(xd, mi_row, mi_col, subsize, bsize);
}
John Koleszar's avatar
John Koleszar committed
1026

Paul Wilkins's avatar
Paul Wilkins committed
1027
1028
1029
1030
1031
1032
// Checks whether the partition size |bsize| fits within the given number of
// 8x8 block rows (|rows_left|) and columns (|cols_left|) remaining in the
// image. If it does not, the size is stepped down until one fits or the
// value reaches 0, and that size is returned.
//
// On the search path *bh and *bw receive the height and width, in 8x8
// blocks, of the last size examined. When no rows or columns remain the
// function returns MIN(bsize, BLOCK_8X8) and leaves *bh / *bw untouched.
//
// NOTE(review): the step of 3 presumably moves to the next smaller square
// block size; confirm against the BLOCK_SIZE enum ordering.
static BLOCK_SIZE find_partition_size(BLOCK_SIZE bsize,
                                      int rows_left, int cols_left,
                                      int *bh, int *bw) {
  if (rows_left <= 0 || cols_left <= 0)
    return MIN(bsize, BLOCK_8X8);

  while (bsize > 0) {
    *bh = num_8x8_blocks_high_lookup[bsize];
    *bw = num_8x8_blocks_wide_lookup[bsize];
    if (*bh <= rows_left && *bw <= cols_left)
      break;
    bsize -= 3;
  }

  return bsize;
}

1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
static void set_partial_b64x64_partition(MODE_INFO *mi, int mis,
    int bh_in, int bw_in, int row8x8_remaining, int col8x8_remaining,
    BLOCK_SIZE bsize, MODE_INFO **mi_8x8) {
  int bh = bh_in;
  int r, c;
  for (r = 0; r < MI_BLOCK_SIZE; r += bh) {
    int bw = bw_in;