reconinter.c 85.2 KB
Newer Older
Jingning Han's avatar
Jingning Han committed
1
/*
Yaowu Xu's avatar
Yaowu Xu committed
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
Jingning Han's avatar
Jingning Han committed
3
 *
Yaowu Xu's avatar
Yaowu Xu committed
4 5 6 7 8 9
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
Jingning Han's avatar
Jingning Han committed
10 11 12 13
 */

#include <assert.h>

Yaowu Xu's avatar
Yaowu Xu committed
14 15 16
#include "./aom_scale_rtcd.h"
#include "./aom_dsp_rtcd.h"
#include "./aom_config.h"
Jingning Han's avatar
Jingning Han committed
17

Yaowu Xu's avatar
Yaowu Xu committed
18
#include "aom/aom_integer.h"
19
#include "aom_dsp/blend.h"
Jingning Han's avatar
Jingning Han committed
20

21 22 23
#include "av1/common/blockd.h"
#include "av1/common/reconinter.h"
#include "av1/common/reconintra.h"
Yue Chen's avatar
Yue Chen committed
24
#if CONFIG_MOTION_VAR
25
#include "av1/common/onyxc_int.h"
Yue Chen's avatar
Yue Chen committed
26
#endif  // CONFIG_MOTION_VAR
27
#if CONFIG_GLOBAL_MOTION
28
#include "av1/common/warped_motion.h"
29
#endif  // CONFIG_GLOBAL_MOTION
Jingning Han's avatar
Jingning Han committed
30

31
#if CONFIG_EXT_INTER
32

clang-format's avatar
clang-format committed
33
#define NSMOOTHERS 1
34
static int get_masked_weight(int m, int smoothness) {
clang-format's avatar
clang-format committed
35 36
#define SMOOTHER_LEN 32
  static const uint8_t smoothfn[NSMOOTHERS][2 * SMOOTHER_LEN + 1] = { {
clang-format's avatar
clang-format committed
37 38 39 40
      0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
      0,  0,  0,  0,  0,  0,  0,  0,  0,  1,  2,  4,  7,  13, 21, 32, 43,
      51, 57, 60, 62, 63, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64,
      64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64,
clang-format's avatar
clang-format committed
41
  } };
42 43 44 45 46
  if (m < -SMOOTHER_LEN)
    return 0;
  else if (m > SMOOTHER_LEN)
    return (1 << WEDGE_WEIGHT_BITS);
  else
47
    return smoothfn[smoothness][m + SMOOTHER_LEN];
48 49
}

50
// [smoother][negative][direction]
clang-format's avatar
clang-format committed
51 52 53
DECLARE_ALIGNED(16, static uint8_t,
                wedge_mask_obl[NSMOOTHERS][2][WEDGE_DIRECTIONS]
                              [MASK_MASTER_SIZE * MASK_MASTER_SIZE]);
54

clang-format's avatar
clang-format committed
55 56
DECLARE_ALIGNED(16, static uint8_t,
                wedge_signflip_lookup[BLOCK_SIZES][MAX_WEDGE_TYPES]);
57

58 59
// 3 * MAX_WEDGE_SQUARE is an easy to compute and fairly tight upper bound
// on the sum of all mask sizes up to an including MAX_WEDGE_SQUARE.
clang-format's avatar
clang-format committed
60 61
DECLARE_ALIGNED(16, static uint8_t,
                wedge_mask_buf[2 * MAX_WEDGE_TYPES * 3 * MAX_WEDGE_SQUARE]);
62 63 64

static wedge_masks_type wedge_masks[BLOCK_SIZES][2];

65 66 67
// Some unused wedge codebooks left temporarily to facilitate experiments.
// To be removed when setteld.
static wedge_code_type wedge_codebook_8_hgtw[8] = {
clang-format's avatar
clang-format committed
68 69 70 71
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_OBLIQUE27, 4, 2 },  { WEDGE_OBLIQUE27, 4, 6 },
  { WEDGE_OBLIQUE153, 4, 2 }, { WEDGE_OBLIQUE153, 4, 6 },
72 73
};

74
static wedge_code_type wedge_codebook_8_hltw[8] = {
clang-format's avatar
clang-format committed
75 76 77 78
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_OBLIQUE63, 2, 4 },  { WEDGE_OBLIQUE63, 6, 4 },
  { WEDGE_OBLIQUE117, 2, 4 }, { WEDGE_OBLIQUE117, 6, 4 },
79 80
};

81
static wedge_code_type wedge_codebook_8_heqw[8] = {
clang-format's avatar
clang-format committed
82 83 84 85
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_HORIZONTAL, 4, 2 }, { WEDGE_HORIZONTAL, 4, 6 },
  { WEDGE_VERTICAL, 2, 4 },   { WEDGE_VERTICAL, 6, 4 },
86 87
};

88 89
#if !USE_LARGE_WEDGE_CODEBOOK
static const wedge_code_type wedge_codebook_16_hgtw[16] = {
clang-format's avatar
clang-format committed
90 91 92 93 94 95 96 97
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_HORIZONTAL, 4, 2 }, { WEDGE_HORIZONTAL, 4, 4 },
  { WEDGE_HORIZONTAL, 4, 6 }, { WEDGE_VERTICAL, 4, 4 },
  { WEDGE_OBLIQUE27, 4, 2 },  { WEDGE_OBLIQUE27, 4, 6 },
  { WEDGE_OBLIQUE153, 4, 2 }, { WEDGE_OBLIQUE153, 4, 6 },
  { WEDGE_OBLIQUE63, 2, 4 },  { WEDGE_OBLIQUE63, 6, 4 },
  { WEDGE_OBLIQUE117, 2, 4 }, { WEDGE_OBLIQUE117, 6, 4 },
Debargha Mukherjee's avatar
Debargha Mukherjee committed
98
};
99

100
static const wedge_code_type wedge_codebook_16_hltw[16] = {
clang-format's avatar
clang-format committed
101 102 103 104 105 106 107 108
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_VERTICAL, 2, 4 },   { WEDGE_VERTICAL, 4, 4 },
  { WEDGE_VERTICAL, 6, 4 },   { WEDGE_HORIZONTAL, 4, 4 },
  { WEDGE_OBLIQUE27, 4, 2 },  { WEDGE_OBLIQUE27, 4, 6 },
  { WEDGE_OBLIQUE153, 4, 2 }, { WEDGE_OBLIQUE153, 4, 6 },
  { WEDGE_OBLIQUE63, 2, 4 },  { WEDGE_OBLIQUE63, 6, 4 },
  { WEDGE_OBLIQUE117, 2, 4 }, { WEDGE_OBLIQUE117, 6, 4 },
109 110
};

111
static const wedge_code_type wedge_codebook_16_heqw[16] = {
clang-format's avatar
clang-format committed
112 113 114 115 116 117 118 119
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_HORIZONTAL, 4, 2 }, { WEDGE_HORIZONTAL, 4, 6 },
  { WEDGE_VERTICAL, 2, 4 },   { WEDGE_VERTICAL, 6, 4 },
  { WEDGE_OBLIQUE27, 4, 2 },  { WEDGE_OBLIQUE27, 4, 6 },
  { WEDGE_OBLIQUE153, 4, 2 }, { WEDGE_OBLIQUE153, 4, 6 },
  { WEDGE_OBLIQUE63, 2, 4 },  { WEDGE_OBLIQUE63, 6, 4 },
  { WEDGE_OBLIQUE117, 2, 4 }, { WEDGE_OBLIQUE117, 6, 4 },
120 121
};

122
const wedge_params_type wedge_params_lookup[BLOCK_SIZES] = {
clang-format's avatar
clang-format committed
123 124 125 126 127 128 129 130 131 132 133 134 135
  { 0, NULL, NULL, 0, NULL },
  { 0, NULL, NULL, 0, NULL },
  { 0, NULL, NULL, 0, NULL },
  { 4, wedge_codebook_16_heqw, wedge_signflip_lookup[3], 0, wedge_masks[3] },
  { 4, wedge_codebook_16_hgtw, wedge_signflip_lookup[4], 0, wedge_masks[4] },
  { 4, wedge_codebook_16_hltw, wedge_signflip_lookup[5], 0, wedge_masks[5] },
  { 4, wedge_codebook_16_heqw, wedge_signflip_lookup[6], 0, wedge_masks[6] },
  { 4, wedge_codebook_16_hgtw, wedge_signflip_lookup[7], 0, wedge_masks[7] },
  { 4, wedge_codebook_16_hltw, wedge_signflip_lookup[8], 0, wedge_masks[8] },
  { 4, wedge_codebook_16_heqw, wedge_signflip_lookup[9], 0, wedge_masks[9] },
  { 0, wedge_codebook_8_hgtw, wedge_signflip_lookup[10], 0, wedge_masks[10] },
  { 0, wedge_codebook_8_hltw, wedge_signflip_lookup[11], 0, wedge_masks[11] },
  { 0, wedge_codebook_8_heqw, wedge_signflip_lookup[12], 0, wedge_masks[12] },
136
#if CONFIG_EXT_PARTITION
clang-format's avatar
clang-format committed
137 138 139
  { 0, NULL, NULL, 0, NULL },
  { 0, NULL, NULL, 0, NULL },
  { 0, NULL, NULL, 0, NULL },
140
#endif  // CONFIG_EXT_PARTITION
141 142
};

143 144 145
#else

static const wedge_code_type wedge_codebook_32_hgtw[32] = {
clang-format's avatar
clang-format committed
146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_HORIZONTAL, 4, 2 }, { WEDGE_HORIZONTAL, 4, 4 },
  { WEDGE_HORIZONTAL, 4, 6 }, { WEDGE_VERTICAL, 4, 4 },
  { WEDGE_OBLIQUE27, 4, 1 },  { WEDGE_OBLIQUE27, 4, 2 },
  { WEDGE_OBLIQUE27, 4, 3 },  { WEDGE_OBLIQUE27, 4, 5 },
  { WEDGE_OBLIQUE27, 4, 6 },  { WEDGE_OBLIQUE27, 4, 7 },
  { WEDGE_OBLIQUE153, 4, 1 }, { WEDGE_OBLIQUE153, 4, 2 },
  { WEDGE_OBLIQUE153, 4, 3 }, { WEDGE_OBLIQUE153, 4, 5 },
  { WEDGE_OBLIQUE153, 4, 6 }, { WEDGE_OBLIQUE153, 4, 7 },
  { WEDGE_OBLIQUE63, 1, 4 },  { WEDGE_OBLIQUE63, 2, 4 },
  { WEDGE_OBLIQUE63, 3, 4 },  { WEDGE_OBLIQUE63, 5, 4 },
  { WEDGE_OBLIQUE63, 6, 4 },  { WEDGE_OBLIQUE63, 7, 4 },
  { WEDGE_OBLIQUE117, 1, 4 }, { WEDGE_OBLIQUE117, 2, 4 },
  { WEDGE_OBLIQUE117, 3, 4 }, { WEDGE_OBLIQUE117, 5, 4 },
  { WEDGE_OBLIQUE117, 6, 4 }, { WEDGE_OBLIQUE117, 7, 4 },
162 163
};

164
static const wedge_code_type wedge_codebook_32_hltw[32] = {
clang-format's avatar
clang-format committed
165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_VERTICAL, 2, 4 },   { WEDGE_VERTICAL, 4, 4 },
  { WEDGE_VERTICAL, 6, 4 },   { WEDGE_HORIZONTAL, 4, 4 },
  { WEDGE_OBLIQUE27, 4, 1 },  { WEDGE_OBLIQUE27, 4, 2 },
  { WEDGE_OBLIQUE27, 4, 3 },  { WEDGE_OBLIQUE27, 4, 5 },
  { WEDGE_OBLIQUE27, 4, 6 },  { WEDGE_OBLIQUE27, 4, 7 },
  { WEDGE_OBLIQUE153, 4, 1 }, { WEDGE_OBLIQUE153, 4, 2 },
  { WEDGE_OBLIQUE153, 4, 3 }, { WEDGE_OBLIQUE153, 4, 5 },
  { WEDGE_OBLIQUE153, 4, 6 }, { WEDGE_OBLIQUE153, 4, 7 },
  { WEDGE_OBLIQUE63, 1, 4 },  { WEDGE_OBLIQUE63, 2, 4 },
  { WEDGE_OBLIQUE63, 3, 4 },  { WEDGE_OBLIQUE63, 5, 4 },
  { WEDGE_OBLIQUE63, 6, 4 },  { WEDGE_OBLIQUE63, 7, 4 },
  { WEDGE_OBLIQUE117, 1, 4 }, { WEDGE_OBLIQUE117, 2, 4 },
  { WEDGE_OBLIQUE117, 3, 4 }, { WEDGE_OBLIQUE117, 5, 4 },
  { WEDGE_OBLIQUE117, 6, 4 }, { WEDGE_OBLIQUE117, 7, 4 },
181 182
};

183
static const wedge_code_type wedge_codebook_32_heqw[32] = {
clang-format's avatar
clang-format committed
184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199
  { WEDGE_OBLIQUE27, 4, 4 },  { WEDGE_OBLIQUE63, 4, 4 },
  { WEDGE_OBLIQUE117, 4, 4 }, { WEDGE_OBLIQUE153, 4, 4 },
  { WEDGE_HORIZONTAL, 4, 2 }, { WEDGE_HORIZONTAL, 4, 6 },
  { WEDGE_VERTICAL, 2, 4 },   { WEDGE_VERTICAL, 6, 4 },
  { WEDGE_OBLIQUE27, 4, 1 },  { WEDGE_OBLIQUE27, 4, 2 },
  { WEDGE_OBLIQUE27, 4, 3 },  { WEDGE_OBLIQUE27, 4, 5 },
  { WEDGE_OBLIQUE27, 4, 6 },  { WEDGE_OBLIQUE27, 4, 7 },
  { WEDGE_OBLIQUE153, 4, 1 }, { WEDGE_OBLIQUE153, 4, 2 },
  { WEDGE_OBLIQUE153, 4, 3 }, { WEDGE_OBLIQUE153, 4, 5 },
  { WEDGE_OBLIQUE153, 4, 6 }, { WEDGE_OBLIQUE153, 4, 7 },
  { WEDGE_OBLIQUE63, 1, 4 },  { WEDGE_OBLIQUE63, 2, 4 },
  { WEDGE_OBLIQUE63, 3, 4 },  { WEDGE_OBLIQUE63, 5, 4 },
  { WEDGE_OBLIQUE63, 6, 4 },  { WEDGE_OBLIQUE63, 7, 4 },
  { WEDGE_OBLIQUE117, 1, 4 }, { WEDGE_OBLIQUE117, 2, 4 },
  { WEDGE_OBLIQUE117, 3, 4 }, { WEDGE_OBLIQUE117, 5, 4 },
  { WEDGE_OBLIQUE117, 6, 4 }, { WEDGE_OBLIQUE117, 7, 4 },
200 201
};

202
const wedge_params_type wedge_params_lookup[BLOCK_SIZES] = {
clang-format's avatar
clang-format committed
203 204 205 206 207 208 209 210 211 212 213 214 215
  { 0, NULL, NULL, 0, NULL },
  { 0, NULL, NULL, 0, NULL },
  { 0, NULL, NULL, 0, NULL },
  { 5, wedge_codebook_32_heqw, wedge_signflip_lookup[3], 0, wedge_masks[3] },
  { 5, wedge_codebook_32_hgtw, wedge_signflip_lookup[4], 0, wedge_masks[4] },
  { 5, wedge_codebook_32_hltw, wedge_signflip_lookup[5], 0, wedge_masks[5] },
  { 5, wedge_codebook_32_heqw, wedge_signflip_lookup[6], 0, wedge_masks[6] },
  { 5, wedge_codebook_32_hgtw, wedge_signflip_lookup[7], 0, wedge_masks[7] },
  { 5, wedge_codebook_32_hltw, wedge_signflip_lookup[8], 0, wedge_masks[8] },
  { 5, wedge_codebook_32_heqw, wedge_signflip_lookup[9], 0, wedge_masks[9] },
  { 0, wedge_codebook_8_hgtw, wedge_signflip_lookup[10], 0, wedge_masks[10] },
  { 0, wedge_codebook_8_hltw, wedge_signflip_lookup[11], 0, wedge_masks[11] },
  { 0, wedge_codebook_8_heqw, wedge_signflip_lookup[12], 0, wedge_masks[12] },
Debargha Mukherjee's avatar
Debargha Mukherjee committed
216
#if CONFIG_EXT_PARTITION
clang-format's avatar
clang-format committed
217 218 219
  { 0, NULL, NULL, 0, NULL },
  { 0, NULL, NULL, 0, NULL },
  { 0, NULL, NULL, 0, NULL },
Debargha Mukherjee's avatar
Debargha Mukherjee committed
220
#endif  // CONFIG_EXT_PARTITION
221
};
222
#endif  // USE_LARGE_WEDGE_CODEBOOK
223

clang-format's avatar
clang-format committed
224
static const uint8_t *get_wedge_mask_inplace(int wedge_index, int neg,
225
                                             BLOCK_SIZE sb_type) {
Debargha Mukherjee's avatar
Debargha Mukherjee committed
226
  const uint8_t *master;
227 228
  const int bh = 4 << b_height_log2_lookup[sb_type];
  const int bw = 4 << b_width_log2_lookup[sb_type];
229 230 231
  const wedge_code_type *a =
      wedge_params_lookup[sb_type].codebook + wedge_index;
  const int smoother = wedge_params_lookup[sb_type].smoother;
232
  int woff, hoff;
233 234 235 236 237 238 239
  const uint8_t wsignflip = wedge_params_lookup[sb_type].signflip[wedge_index];

  assert(wedge_index >= 0 &&
         wedge_index < (1 << get_wedge_bits_lookup(sb_type)));
  woff = (a->x_offset * bw) >> 3;
  hoff = (a->y_offset * bh) >> 3;
  master = wedge_mask_obl[smoother][neg ^ wsignflip][a->direction] +
clang-format's avatar
clang-format committed
240 241
           MASK_MASTER_STRIDE * (MASK_MASTER_SIZE / 2 - hoff) +
           MASK_MASTER_SIZE / 2 - woff;
Debargha Mukherjee's avatar
Debargha Mukherjee committed
242 243 244
  return master;
}

Yaowu Xu's avatar
Yaowu Xu committed
245 246 247
const uint8_t *av1_get_soft_mask(int wedge_index, int wedge_sign,
                                 BLOCK_SIZE sb_type, int offset_x,
                                 int offset_y) {
248
  const uint8_t *mask =
249
      get_wedge_mask_inplace(wedge_index, wedge_sign, sb_type);
clang-format's avatar
clang-format committed
250
  if (mask) mask -= (offset_x + offset_y * MASK_MASTER_STRIDE);
251
  return mask;
252 253
}

254
static void init_wedge_master_masks() {
255 256 257 258
  int i, j, s;
  const int w = MASK_MASTER_SIZE;
  const int h = MASK_MASTER_SIZE;
  const int stride = MASK_MASTER_STRIDE;
clang-format's avatar
clang-format committed
259
  const int a[2] = { 2, 1 };
260 261 262 263 264 265 266 267
  const double asqrt = sqrt(a[0] * a[0] + a[1] * a[1]);
  for (s = 0; s < NSMOOTHERS; s++) {
    for (i = 0; i < h; ++i)
      for (j = 0; j < w; ++j) {
        int x = (2 * j + 1 - w);
        int y = (2 * i + 1 - h);
        int m = (int)rint((a[0] * x + a[1] * y) / asqrt);
        wedge_mask_obl[s][1][WEDGE_OBLIQUE63][i * stride + j] =
clang-format's avatar
clang-format committed
268 269
            wedge_mask_obl[s][1][WEDGE_OBLIQUE27][j * stride + i] =
                get_masked_weight(m, s);
270
        wedge_mask_obl[s][1][WEDGE_OBLIQUE117][i * stride + w - 1 - j] =
clang-format's avatar
clang-format committed
271 272
            wedge_mask_obl[s][1][WEDGE_OBLIQUE153][(w - 1 - j) * stride + i] =
                (1 << WEDGE_WEIGHT_BITS) - get_masked_weight(m, s);
273
        wedge_mask_obl[s][0][WEDGE_OBLIQUE63][i * stride + j] =
clang-format's avatar
clang-format committed
274 275
            wedge_mask_obl[s][0][WEDGE_OBLIQUE27][j * stride + i] =
                (1 << WEDGE_WEIGHT_BITS) - get_masked_weight(m, s);
276
        wedge_mask_obl[s][0][WEDGE_OBLIQUE117][i * stride + w - 1 - j] =
clang-format's avatar
clang-format committed
277 278
            wedge_mask_obl[s][0][WEDGE_OBLIQUE153][(w - 1 - j) * stride + i] =
                get_masked_weight(m, s);
279
        wedge_mask_obl[s][1][WEDGE_VERTICAL][i * stride + j] =
clang-format's avatar
clang-format committed
280 281
            wedge_mask_obl[s][1][WEDGE_HORIZONTAL][j * stride + i] =
                get_masked_weight(x, s);
282
        wedge_mask_obl[s][0][WEDGE_VERTICAL][i * stride + j] =
clang-format's avatar
clang-format committed
283 284
            wedge_mask_obl[s][0][WEDGE_HORIZONTAL][j * stride + i] =
                (1 << WEDGE_WEIGHT_BITS) - get_masked_weight(x, s);
285 286
      }
  }
287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305
}

// If the signs for the wedges for various blocksizes are
// inconsistent flip the sign flag. Do it only once for every
// wedge codebook.
static void init_wedge_signs() {
  BLOCK_SIZE sb_type;
  memset(wedge_signflip_lookup, 0, sizeof(wedge_signflip_lookup));
  for (sb_type = BLOCK_4X4; sb_type < BLOCK_SIZES; ++sb_type) {
    const int bw = 4 * num_4x4_blocks_wide_lookup[sb_type];
    const int bh = 4 * num_4x4_blocks_high_lookup[sb_type];
    const wedge_params_type wedge_params = wedge_params_lookup[sb_type];
    const int wbits = wedge_params.bits;
    const int wtypes = 1 << wbits;
    int i, w;
    if (wbits == 0) continue;
    for (w = 0; w < wtypes; ++w) {
      const uint8_t *mask = get_wedge_mask_inplace(w, 0, sb_type);
      int sum = 0;
clang-format's avatar
clang-format committed
306 307
      for (i = 0; i < bw; ++i) sum += mask[i];
      for (i = 0; i < bh; ++i) sum += mask[i * MASK_MASTER_STRIDE];
308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328
      sum = (sum + (bw + bh) / 2) / (bw + bh);
      wedge_params.signflip[w] = (sum < 32);
    }
  }
}

static void init_wedge_masks() {
  uint8_t *dst = wedge_mask_buf;
  BLOCK_SIZE bsize;
  memset(wedge_masks, 0, sizeof(wedge_masks));
  for (bsize = BLOCK_4X4; bsize < BLOCK_SIZES; ++bsize) {
    const uint8_t *mask;
    const int bw = 4 * num_4x4_blocks_wide_lookup[bsize];
    const int bh = 4 * num_4x4_blocks_high_lookup[bsize];
    const wedge_params_type *wedge_params = &wedge_params_lookup[bsize];
    const int wbits = wedge_params->bits;
    const int wtypes = 1 << wbits;
    int w;
    if (wbits == 0) continue;
    for (w = 0; w < wtypes; ++w) {
      mask = get_wedge_mask_inplace(w, 0, bsize);
Yaowu Xu's avatar
Yaowu Xu committed
329
      aom_convolve_copy(mask, MASK_MASTER_STRIDE, dst, bw, NULL, 0, NULL, 0, bw,
clang-format's avatar
clang-format committed
330
                        bh);
331 332 333 334
      wedge_params->masks[0][w] = dst;
      dst += bw * bh;

      mask = get_wedge_mask_inplace(w, 1, bsize);
Yaowu Xu's avatar
Yaowu Xu committed
335
      aom_convolve_copy(mask, MASK_MASTER_STRIDE, dst, bw, NULL, 0, NULL, 0, bw,
clang-format's avatar
clang-format committed
336
                        bh);
337 338 339 340 341 342 343 344
      wedge_params->masks[1][w] = dst;
      dst += bw * bh;
    }
    assert(sizeof(wedge_mask_buf) >= (size_t)(dst - wedge_mask_buf));
  }
}

// Equation of line: f(x, y) = a[0]*(x - a[2]*w/8) + a[1]*(y - a[3]*h/8) = 0
Yaowu Xu's avatar
Yaowu Xu committed
345
void av1_init_wedge_masks() {
346
  init_wedge_master_masks();
347
  init_wedge_signs();
348
  init_wedge_masks();
349 350
}

351 352
#if CONFIG_SUPERTX
static void build_masked_compound_wedge_extend(
clang-format's avatar
clang-format committed
353 354 355
    uint8_t *dst, int dst_stride, const uint8_t *src0, int src0_stride,
    const uint8_t *src1, int src1_stride, int wedge_index, int wedge_sign,
    BLOCK_SIZE sb_type, int wedge_offset_x, int wedge_offset_y, int h, int w) {
356 357
  const int subh = (2 << b_height_log2_lookup[sb_type]) == h;
  const int subw = (2 << b_width_log2_lookup[sb_type]) == w;
Yaowu Xu's avatar
Yaowu Xu committed
358 359 360
  const uint8_t *mask = av1_get_soft_mask(wedge_index, wedge_sign, sb_type,
                                          wedge_offset_x, wedge_offset_y);
  aom_blend_a64_mask(dst, dst_stride, src0, src0_stride, src1, src1_stride,
clang-format's avatar
clang-format committed
361
                     mask, MASK_MASTER_STRIDE, h, w, subh, subw);
362 363
}

Yaowu Xu's avatar
Yaowu Xu committed
364
#if CONFIG_AOM_HIGHBITDEPTH
365
static void build_masked_compound_wedge_extend_highbd(
clang-format's avatar
clang-format committed
366 367 368 369
    uint8_t *dst_8, int dst_stride, const uint8_t *src0_8, int src0_stride,
    const uint8_t *src1_8, int src1_stride, int wedge_index, int wedge_sign,
    BLOCK_SIZE sb_type, int wedge_offset_x, int wedge_offset_y, int h, int w,
    int bd) {
370 371
  const int subh = (2 << b_height_log2_lookup[sb_type]) == h;
  const int subw = (2 << b_width_log2_lookup[sb_type]) == w;
Yaowu Xu's avatar
Yaowu Xu committed
372 373 374
  const uint8_t *mask = av1_get_soft_mask(wedge_index, wedge_sign, sb_type,
                                          wedge_offset_x, wedge_offset_y);
  aom_highbd_blend_a64_mask(dst_8, dst_stride, src0_8, src0_stride, src1_8,
clang-format's avatar
clang-format committed
375 376
                            src1_stride, mask, MASK_MASTER_STRIDE, h, w, subh,
                            subw, bd);
377
}
Yaowu Xu's avatar
Yaowu Xu committed
378
#endif  // CONFIG_AOM_HIGHBITDEPTH
379
#endif  // CONFIG_SUPERTX
380

clang-format's avatar
clang-format committed
381 382 383 384 385
static void build_masked_compound_wedge(uint8_t *dst, int dst_stride,
                                        const uint8_t *src0, int src0_stride,
                                        const uint8_t *src1, int src1_stride,
                                        int wedge_index, int wedge_sign,
                                        BLOCK_SIZE sb_type, int h, int w) {
386 387 388 389
  // Derive subsampling from h and w passed in. May be refactored to
  // pass in subsampling factors directly.
  const int subh = (2 << b_height_log2_lookup[sb_type]) == h;
  const int subw = (2 << b_width_log2_lookup[sb_type]) == w;
clang-format's avatar
clang-format committed
390
  const uint8_t *mask =
Yaowu Xu's avatar
Yaowu Xu committed
391 392
      av1_get_contiguous_soft_mask(wedge_index, wedge_sign, sb_type);
  aom_blend_a64_mask(dst, dst_stride, src0, src0_stride, src1, src1_stride,
clang-format's avatar
clang-format committed
393 394
                     mask, 4 * num_4x4_blocks_wide_lookup[sb_type], h, w, subh,
                     subw);
395 396
}

Yaowu Xu's avatar
Yaowu Xu committed
397
#if CONFIG_AOM_HIGHBITDEPTH
Geza Lore's avatar
Geza Lore committed
398
static void build_masked_compound_wedge_highbd(
clang-format's avatar
clang-format committed
399 400 401
    uint8_t *dst_8, int dst_stride, const uint8_t *src0_8, int src0_stride,
    const uint8_t *src1_8, int src1_stride, int wedge_index, int wedge_sign,
    BLOCK_SIZE sb_type, int h, int w, int bd) {
402 403 404 405
  // Derive subsampling from h and w passed in. May be refactored to
  // pass in subsampling factors directly.
  const int subh = (2 << b_height_log2_lookup[sb_type]) == h;
  const int subw = (2 << b_width_log2_lookup[sb_type]) == w;
clang-format's avatar
clang-format committed
406
  const uint8_t *mask =
Yaowu Xu's avatar
Yaowu Xu committed
407 408
      av1_get_contiguous_soft_mask(wedge_index, wedge_sign, sb_type);
  aom_highbd_blend_a64_mask(
clang-format's avatar
clang-format committed
409 410
      dst_8, dst_stride, src0_8, src0_stride, src1_8, src1_stride, mask,
      4 * num_4x4_blocks_wide_lookup[sb_type], h, w, subh, subw, bd);
411
}
Yaowu Xu's avatar
Yaowu Xu committed
412
#endif  // CONFIG_AOM_HIGHBITDEPTH
413

Yaowu Xu's avatar
Yaowu Xu committed
414 415 416 417 418
void av1_make_masked_inter_predictor(const uint8_t *pre, int pre_stride,
                                     uint8_t *dst, int dst_stride,
                                     const int subpel_x, const int subpel_y,
                                     const struct scale_factors *sf, int w,
                                     int h,
419
#if CONFIG_DUAL_FILTER
James Zern's avatar
James Zern committed
420
                                     const InterpFilter *interp_filter,
421
#else
James Zern's avatar
James Zern committed
422
                                     const InterpFilter interp_filter,
423
#endif
Yaowu Xu's avatar
Yaowu Xu committed
424
                                     int xs, int ys,
425
#if CONFIG_SUPERTX
Yaowu Xu's avatar
Yaowu Xu committed
426
                                     int wedge_offset_x, int wedge_offset_y,
427
#endif  // CONFIG_SUPERTX
Yaowu Xu's avatar
Yaowu Xu committed
428
                                     const MACROBLOCKD *xd) {
429
  const MODE_INFO *mi = xd->mi[0];
clang-format's avatar
clang-format committed
430 431
// The prediction filter types used here should be those for
// the second reference block.
Geza Lore's avatar
Geza Lore committed
432
#if CONFIG_DUAL_FILTER
James Zern's avatar
James Zern committed
433
  InterpFilter tmp_ipf[4] = {
Geza Lore's avatar
Geza Lore committed
434
    interp_filter[2], interp_filter[3], interp_filter[2], interp_filter[3],
435
  };
Geza Lore's avatar
Geza Lore committed
436
#else
James Zern's avatar
James Zern committed
437
  InterpFilter tmp_ipf = interp_filter;
Geza Lore's avatar
Geza Lore committed
438
#endif  // CONFIG_DUAL_FILTER
Yaowu Xu's avatar
Yaowu Xu committed
439
#if CONFIG_AOM_HIGHBITDEPTH
440
  DECLARE_ALIGNED(16, uint8_t, tmp_dst_[2 * MAX_SB_SQUARE]);
clang-format's avatar
clang-format committed
441 442 443
  uint8_t *tmp_dst = (xd->cur_buf->flags & YV12_FLAG_HIGHBITDEPTH)
                         ? CONVERT_TO_BYTEPTR(tmp_dst_)
                         : tmp_dst_;
Yaowu Xu's avatar
Yaowu Xu committed
444 445
  av1_make_inter_predictor(pre, pre_stride, tmp_dst, MAX_SB_SIZE, subpel_x,
                           subpel_y, sf, w, h, 0, tmp_ipf, xs, ys, xd);
446 447
#if CONFIG_SUPERTX
  if (xd->cur_buf->flags & YV12_FLAG_HIGHBITDEPTH)
448
    build_masked_compound_wedge_extend_highbd(
clang-format's avatar
clang-format committed
449 450 451
        dst, dst_stride, dst, dst_stride, tmp_dst, MAX_SB_SIZE,
        mi->mbmi.interinter_wedge_index, mi->mbmi.interinter_wedge_sign,
        mi->mbmi.sb_type, wedge_offset_x, wedge_offset_y, h, w, xd->bd);
452
  else
453
    build_masked_compound_wedge_extend(
clang-format's avatar
clang-format committed
454 455 456
        dst, dst_stride, dst, dst_stride, tmp_dst, MAX_SB_SIZE,
        mi->mbmi.interinter_wedge_index, mi->mbmi.interinter_wedge_sign,
        mi->mbmi.sb_type, wedge_offset_x, wedge_offset_y, h, w);
457 458
#else
  if (xd->cur_buf->flags & YV12_FLAG_HIGHBITDEPTH)
459
    build_masked_compound_wedge_highbd(
clang-format's avatar
clang-format committed
460 461
        dst, dst_stride, dst, dst_stride, tmp_dst, MAX_SB_SIZE,
        mi->mbmi.interinter_wedge_index, mi->mbmi.interinter_wedge_sign,
462
        mi->mbmi.sb_type, h, w, xd->bd);
463
  else
clang-format's avatar
clang-format committed
464 465 466 467
    build_masked_compound_wedge(dst, dst_stride, dst, dst_stride, tmp_dst,
                                MAX_SB_SIZE, mi->mbmi.interinter_wedge_index,
                                mi->mbmi.interinter_wedge_sign,
                                mi->mbmi.sb_type, h, w);
468
#endif  // CONFIG_SUPERTX
Yaowu Xu's avatar
Yaowu Xu committed
469
#else   // CONFIG_AOM_HIGHBITDEPTH
470
  DECLARE_ALIGNED(16, uint8_t, tmp_dst[MAX_SB_SQUARE]);
Yaowu Xu's avatar
Yaowu Xu committed
471 472
  av1_make_inter_predictor(pre, pre_stride, tmp_dst, MAX_SB_SIZE, subpel_x,
                           subpel_y, sf, w, h, 0, tmp_ipf, xs, ys, xd);
473
#if CONFIG_SUPERTX
474
  build_masked_compound_wedge_extend(
clang-format's avatar
clang-format committed
475 476 477
      dst, dst_stride, dst, dst_stride, tmp_dst, MAX_SB_SIZE,
      mi->mbmi.interinter_wedge_index, mi->mbmi.interinter_wedge_sign,
      mi->mbmi.sb_type, wedge_offset_x, wedge_offset_y, h, w);
478
#else
clang-format's avatar
clang-format committed
479 480 481 482
  build_masked_compound_wedge(dst, dst_stride, dst, dst_stride, tmp_dst,
                              MAX_SB_SIZE, mi->mbmi.interinter_wedge_index,
                              mi->mbmi.interinter_wedge_sign, mi->mbmi.sb_type,
                              h, w);
483
#endif  // CONFIG_SUPERTX
Yaowu Xu's avatar
Yaowu Xu committed
484
#endif  // CONFIG_AOM_HIGHBITDEPTH
485 486
}
#endif  // CONFIG_EXT_INTER
487

Yaowu Xu's avatar
Yaowu Xu committed
488 489
#if CONFIG_AOM_HIGHBITDEPTH
void av1_highbd_build_inter_predictor(
clang-format's avatar
clang-format committed
490 491
    const uint8_t *src, int src_stride, uint8_t *dst, int dst_stride,
    const MV *src_mv, const struct scale_factors *sf, int w, int h, int ref,
492
#if CONFIG_DUAL_FILTER
James Zern's avatar
James Zern committed
493
    const InterpFilter *interp_filter,
494
#else
James Zern's avatar
James Zern committed
495
    const InterpFilter interp_filter,
496
#endif
clang-format's avatar
clang-format committed
497
    enum mv_precision precision, int x, int y, int bd) {
Jingning Han's avatar
Jingning Han committed
498 499 500
  const int is_q4 = precision == MV_PRECISION_Q4;
  const MV mv_q4 = { is_q4 ? src_mv->row : src_mv->row * 2,
                     is_q4 ? src_mv->col : src_mv->col * 2 };
Yaowu Xu's avatar
Yaowu Xu committed
501
  MV32 mv = av1_scale_mv(&mv_q4, x, y, sf);
Jingning Han's avatar
Jingning Han committed
502 503 504 505 506
  const int subpel_x = mv.col & SUBPEL_MASK;
  const int subpel_y = mv.row & SUBPEL_MASK;

  src += (mv.row >> SUBPEL_BITS) * src_stride + (mv.col >> SUBPEL_BITS);

507
  highbd_inter_predictor(src, src_stride, dst, dst_stride, subpel_x, subpel_y,
508 509
                         sf, w, h, ref, interp_filter, sf->x_step_q4,
                         sf->y_step_q4, bd);
Jingning Han's avatar
Jingning Han committed
510
}
Yaowu Xu's avatar
Yaowu Xu committed
511
#endif  // CONFIG_AOM_HIGHBITDEPTH
Jingning Han's avatar
Jingning Han committed
512

Yaowu Xu's avatar
Yaowu Xu committed
513 514 515 516
void av1_build_inter_predictor(const uint8_t *src, int src_stride, uint8_t *dst,
                               int dst_stride, const MV *src_mv,
                               const struct scale_factors *sf, int w, int h,
                               int ref,
517
#if CONFIG_DUAL_FILTER
James Zern's avatar
James Zern committed
518
                               const InterpFilter *interp_filter,
519
#else
James Zern's avatar
James Zern committed
520
                               const InterpFilter interp_filter,
521
#endif
Yaowu Xu's avatar
Yaowu Xu committed
522
                               enum mv_precision precision, int x, int y) {
Jingning Han's avatar
Jingning Han committed
523 524 525
  const int is_q4 = precision == MV_PRECISION_Q4;
  const MV mv_q4 = { is_q4 ? src_mv->row : src_mv->row * 2,
                     is_q4 ? src_mv->col : src_mv->col * 2 };
Yaowu Xu's avatar
Yaowu Xu committed
526
  MV32 mv = av1_scale_mv(&mv_q4, x, y, sf);
Jingning Han's avatar
Jingning Han committed
527 528 529 530 531
  const int subpel_x = mv.col & SUBPEL_MASK;
  const int subpel_y = mv.row & SUBPEL_MASK;

  src += (mv.row >> SUBPEL_BITS) * src_stride + (mv.col >> SUBPEL_BITS);

clang-format's avatar
clang-format committed
532 533
  inter_predictor(src, src_stride, dst, dst_stride, subpel_x, subpel_y, sf, w,
                  h, ref, interp_filter, sf->x_step_q4, sf->y_step_q4);
Jingning Han's avatar
Jingning Han committed
534 535
}

536
void build_inter_predictors(MACROBLOCKD *xd, int plane,
Yue Chen's avatar
Yue Chen committed
537
#if CONFIG_MOTION_VAR
538
                            int mi_col_offset, int mi_row_offset,
Yue Chen's avatar
Yue Chen committed
539
#endif  // CONFIG_MOTION_VAR
clang-format's avatar
clang-format committed
540 541
                            int block, int bw, int bh, int x, int y, int w,
                            int h,
542 543 544
#if CONFIG_SUPERTX && CONFIG_EXT_INTER
                            int wedge_offset_x, int wedge_offset_y,
#endif  // CONFIG_SUPERTX && CONFIG_EXT_INTER
545
                            int mi_x, int mi_y) {
Jingning Han's avatar
Jingning Han committed
546
  struct macroblockd_plane *const pd = &xd->plane[plane];
Yue Chen's avatar
Yue Chen committed
547
#if CONFIG_MOTION_VAR
548
  const MODE_INFO *mi = xd->mi[mi_col_offset + xd->mi_stride * mi_row_offset];
549
  const int build_for_obmc = !(mi_col_offset == 0 && mi_row_offset == 0);
550
#else
Jingning Han's avatar
Jingning Han committed
551
  const MODE_INFO *mi = xd->mi[0];
Yue Chen's avatar
Yue Chen committed
552
#endif  // CONFIG_MOTION_VAR
Jingning Han's avatar
Jingning Han committed
553 554
  const int is_compound = has_second_ref(&mi->mbmi);
  int ref;
555 556 557 558 559
#if CONFIG_GLOBAL_MOTION
  Global_Motion_Params *gm[2];
  int is_global[2];
  for (ref = 0; ref < 1 + is_compound; ++ref) {
    gm[ref] = &xd->global_motion[mi->mbmi.ref_frame[ref]];
clang-format's avatar
clang-format committed
560
    is_global[ref] =
561
        (get_y_mode(mi, block) == ZEROMV && gm[ref]->gmtype > GLOBAL_ZERO);
562 563
  }
  // TODO(sarahparker) remove these once gm works with all experiments
clang-format's avatar
clang-format committed
564 565
  (void)gm;
  (void)is_global;
566
#endif  // CONFIG_GLOBAL_MOTION
Jingning Han's avatar
Jingning Han committed
567

568 569
// TODO(sarahparker) enable the use of DUAL_FILTER in warped motion functions
// in order to allow GLOBAL_MOTION and DUAL_FILTER to work together
570
#if CONFIG_SUB8X8_MC
571 572 573
#if CONFIG_MOTION_VAR
  if (mi->mbmi.sb_type < BLOCK_8X8 && plane > 0 && !build_for_obmc) {
#else
574
  if (mi->mbmi.sb_type < BLOCK_8X8 && plane > 0) {
575
#endif  // CONFIG_MOTION_VAR
576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607
    // block size in log2
    const int b4_wl = b_width_log2_lookup[mi->mbmi.sb_type];
    const int b4_hl = b_height_log2_lookup[mi->mbmi.sb_type];
    const int b8_sl = b_width_log2_lookup[BLOCK_8X8];

    // block size
    const int b4_w = 1 << b4_wl;
    const int b4_h = 1 << b4_hl;
    const int b8_s = 1 << b8_sl;
    int idx, idy;

    const int x_base = x;
    const int y_base = y;

    // processing unit size
    const int x_step = w >> (b8_sl - b4_wl);
    const int y_step = h >> (b8_sl - b4_hl);

    for (idy = 0; idy < b8_s; idy += b4_h) {
      for (idx = 0; idx < b8_s; idx += b4_w) {
        const int chr_idx = (idy * 2) + idx;
        for (ref = 0; ref < 1 + is_compound; ++ref) {
          const struct scale_factors *const sf = &xd->block_refs[ref]->sf;
          struct buf_2d *const pre_buf = &pd->pre[ref];
          struct buf_2d *const dst_buf = &pd->dst;
          uint8_t *dst = dst_buf->buf;
          const MV mv = mi->bmi[chr_idx].as_mv[ref].as_mv;
          const MV mv_q4 = clamp_mv_to_umv_border_sb(
              xd, &mv, bw, bh, pd->subsampling_x, pd->subsampling_y);
          uint8_t *pre;
          MV32 scaled_mv;
          int xs, ys, subpel_x, subpel_y;
Yaowu Xu's avatar
Yaowu Xu committed
608
          const int is_scaled = av1_is_scaled(sf);
609 610 611 612 613 614 615 616 617

          x = x_base + idx * x_step;
          y = y_base + idy * y_step;

          dst += dst_buf->stride * y + x;

          if (is_scaled) {
            pre =
                pre_buf->buf + scaled_buffer_offset(x, y, pre_buf->stride, sf);
Yaowu Xu's avatar
Yaowu Xu committed
618
            scaled_mv = av1_scale_mv(&mv_q4, mi_x + x, mi_y + y, sf);
619 620 621 622 623 624 625 626 627 628 629 630 631
            xs = sf->x_step_q4;
            ys = sf->y_step_q4;
          } else {
            pre = pre_buf->buf + y * pre_buf->stride + x;
            scaled_mv.row = mv_q4.row;
            scaled_mv.col = mv_q4.col;
            xs = ys = 16;
          }

          subpel_x = scaled_mv.col & SUBPEL_MASK;
          subpel_y = scaled_mv.row & SUBPEL_MASK;
          pre += (scaled_mv.row >> SUBPEL_BITS) * pre_buf->stride +
                 (scaled_mv.col >> SUBPEL_BITS);
632

633 634 635
#if CONFIG_EXT_INTER
          if (ref && is_interinter_wedge_used(mi->mbmi.sb_type) &&
              mi->mbmi.use_wedge_interinter)
Yaowu Xu's avatar
Yaowu Xu committed
636
            av1_make_masked_inter_predictor(
637 638 639 640 641 642 643 644
                pre, pre_buf->stride, dst, dst_buf->stride, subpel_x, subpel_y,
                sf, w, h, mi->mbmi.interp_filter, xs, ys,
#if CONFIG_SUPERTX
                wedge_offset_x, wedge_offset_y,
#endif  // CONFIG_SUPERTX
                xd);
          else
#endif  // CONFIG_EXT_INTER
Yaowu Xu's avatar
Yaowu Xu committed
645 646 647
            av1_make_inter_predictor(pre, pre_buf->stride, dst, dst_buf->stride,
                                     subpel_x, subpel_y, sf, x_step, y_step,
                                     ref, mi->mbmi.interp_filter, xs, ys, xd);
648
        }
649 650 651 652 653 654
      }
    }
    return;
  }
#endif

Jingning Han's avatar
Jingning Han committed
655 656 657 658 659 660
  for (ref = 0; ref < 1 + is_compound; ++ref) {
    const struct scale_factors *const sf = &xd->block_refs[ref]->sf;
    struct buf_2d *const pre_buf = &pd->pre[ref];
    struct buf_2d *const dst_buf = &pd->dst;
    uint8_t *const dst = dst_buf->buf + dst_buf->stride * y + x;
    const MV mv = mi->mbmi.sb_type < BLOCK_8X8
661 662 663 664
#if CONFIG_MOTION_VAR
                      ? (build_for_obmc ? mi->bmi[block].as_mv[ref].as_mv
                                        : average_split_mvs(pd, mi, ref, block))
#else
clang-format's avatar
clang-format committed
665
                      ? average_split_mvs(pd, mi, ref, block)
666
#endif  // CONFIG_MOTION_VAR
clang-format's avatar
clang-format committed
667
                      : mi->mbmi.mv[ref].as_mv;
Jingning Han's avatar
Jingning Han committed
668 669 670 671 672 673

    // TODO(jkoleszar): This clamping is done in the incorrect place for the
    // scaling case. It needs to be done on the scaled MV, not the pre-scaling
    // MV. Note however that it performs the subsampling aware scaling so
    // that the result is always q4.
    // mv_precision precision is MV_PRECISION_Q4.
clang-format's avatar
clang-format committed
674 675
    const MV mv_q4 = clamp_mv_to_umv_border_sb(
        xd, &mv, bw, bh, pd->subsampling_x, pd->subsampling_y);
Jingning Han's avatar
Jingning Han committed
676 677 678 679

    uint8_t *pre;
    MV32 scaled_mv;
    int xs, ys, subpel_x, subpel_y;
Yaowu Xu's avatar
Yaowu Xu committed
680
    const int is_scaled = av1_is_scaled(sf);
Jingning Han's avatar
Jingning Han committed
681 682 683

    if (is_scaled) {
      pre = pre_buf->buf + scaled_buffer_offset(x, y, pre_buf->stride, sf);
Yaowu Xu's avatar
Yaowu Xu committed
684
      scaled_mv = av1_scale_mv(&mv_q4, mi_x + x, mi_y + y, sf);
Jingning Han's avatar
Jingning Han committed
685 686 687 688 689 690 691 692
      xs = sf->x_step_q4;
      ys = sf->y_step_q4;
    } else {
      pre = pre_buf->buf + (y * pre_buf->stride + x);
      scaled_mv.row = mv_q4.row;
      scaled_mv.col = mv_q4.col;
      xs = ys = 16;
    }
693

Jingning Han's avatar
Jingning Han committed
694 695
    subpel_x = scaled_mv.col & SUBPEL_MASK;
    subpel_y = scaled_mv.row & SUBPEL_MASK;
clang-format's avatar
clang-format committed
696 697
    pre += (scaled_mv.row >> SUBPEL_BITS) * pre_buf->stride +
           (scaled_mv.col >> SUBPEL_BITS);
Jingning Han's avatar
Jingning Han committed
698

699
#if CONFIG_EXT_INTER
Debargha Mukherjee's avatar
Debargha Mukherjee committed
700
    if (ref && is_interinter_wedge_used(mi->mbmi.sb_type) &&
701
        mi->mbmi.use_wedge_interinter)
Yaowu Xu's avatar
Yaowu Xu committed
702 703 704
      av1_make_masked_inter_predictor(pre, pre_buf->stride, dst,
                                      dst_buf->stride, subpel_x, subpel_y, sf,
                                      w, h, mi->mbmi.interp_filter, xs, ys,
705
#if CONFIG_SUPERTX
Yaowu Xu's avatar
Yaowu Xu committed
706
                                      wedge_offset_x, wedge_offset_y,
707
#endif  // CONFIG_SUPERTX
Yaowu Xu's avatar
Yaowu Xu committed
708
                                      xd);
709
    else
710 711 712
#else  // CONFIG_EXT_INTER
#if CONFIG_GLOBAL_MOTION
    if (is_global[ref])
Yaowu Xu's avatar
Yaowu Xu committed
713 714 715 716 717 718 719
      av1_warp_plane(&(gm[ref]->motion_params),
#if CONFIG_AOM_HIGHBITDEPTH
                     xd->cur_buf->flags & YV12_FLAG_HIGHBITDEPTH, xd->bd,
#endif  // CONFIG_AOM_HIGHBITDEPTH
                     pre_buf->buf0, pre_buf->width, pre_buf->height,
                     pre_buf->stride, dst, (mi_x >> pd->subsampling_x) + x,
                     (mi_y >> pd->subsampling_y) + y, w, h, dst_buf->stride,
720
                     pd->subsampling_x, pd->subsampling_y, xs, ys, ref);
721 722
    else
#endif  // CONFIG_GLOBAL_MOTION
723
#endif  // CONFIG_EXT_INTER
Yaowu Xu's avatar
Yaowu Xu committed
724 725 726
      av1_make_inter_predictor(pre, pre_buf->stride, dst, dst_buf->stride,
                               subpel_x, subpel_y, sf, w, h, ref,
                               mi->mbmi.interp_filter, xs, ys, xd);
Jingning Han's avatar
Jingning Han committed
727 728 729
  }
}

Yaowu Xu's avatar
Yaowu Xu committed
730 731
void av1_build_inter_predictor_sub8x8(MACROBLOCKD *xd, int plane, int i, int ir,
                                      int ic, int mi_row, int mi_col) {
732 733 734 735 736 737 738 739 740 741 742 743 744
  struct macroblockd_plane *const pd = &xd->plane[plane];
  MODE_INFO *const mi = xd->mi[0];
  const BLOCK_SIZE plane_bsize = get_plane_block_size(mi->mbmi.sb_type, pd);
  const int width = 4 * num_4x4_blocks_wide_lookup[plane_bsize];
  const int height = 4 * num_4x4_blocks_high_lookup[plane_bsize];

  uint8_t *const dst = &pd->dst.buf[(ir * pd->dst.stride + ic) << 2];
  int ref;
  const int is_compound = has_second_ref(&mi->mbmi);

  for (ref = 0; ref < 1 + is_compound; ++ref) {
    const uint8_t *pre =
        &pd->pre[ref].buf[(ir * pd->pre[ref].stride + ic) << 2];
Yaowu Xu's avatar
Yaowu Xu committed
745
#if CONFIG_AOM_HIGHBITDEPTH
clang-format's avatar
clang-format committed
746
    if (xd->cur_buf->flags & YV12_FLAG_HIGHBITDEPTH) {
Yaowu Xu's avatar
Yaowu Xu committed
747
      av1_highbd_build_inter_predictor(
clang-format's avatar
clang-format committed
748 749 750 751 752
          pre, pd->pre[ref].stride, dst, pd->dst.stride,
          &mi->bmi[i].as_mv[ref].as_mv, &xd->block_refs[ref]->sf, width, height,
          ref, mi->mbmi.interp_filter, MV_PRECISION_Q3,
          mi_col * MI_SIZE + 4 * ic, mi_row * MI_SIZE + 4 * ir, xd->bd);
    } else {
Yaowu Xu's avatar
Yaowu Xu committed
753
      av1_build_inter_predictor(
clang-format's avatar
clang-format committed
754 755 756 757 758
          pre, pd->pre[ref].stride, dst, pd->dst.stride,
          &mi->bmi[i].as_mv[ref].as_mv, &xd->block_refs[ref]->sf, width, height,
          ref, mi->mbmi.interp_filter, MV_PRECISION_Q3,
          mi_col * MI_SIZE + 4 * ic, mi_row * MI_SIZE + 4 * ir);
    }
759
#else
Yaowu Xu's avatar
Yaowu Xu committed
760
    av1_build_inter_predictor(
clang-format's avatar
clang-format committed
761 762 763 764
        pre, pd->pre[ref].stride, dst, pd->dst.stride,
        &mi->bmi[i].as_mv[ref].as_mv, &xd->block_refs[ref]->sf, width, height,
        ref, mi->mbmi.interp_filter, MV_PRECISION_Q3, mi_col * MI_SIZE + 4 * ic,
        mi_row * MI_SIZE + 4 * ir);
Yaowu Xu's avatar
Yaowu Xu committed
765
#endif  // CONFIG_AOM_HIGHBITDEPTH
766 767 768
  }
}

Jingning Han's avatar
Jingning Han committed
769 770 771 772 773 774 775
static void build_inter_predictors_for_planes(MACROBLOCKD *xd, BLOCK_SIZE bsize,
                                              int mi_row, int mi_col,
                                              int plane_from, int plane_to) {
  int plane;
  const int mi_x = mi_col * MI_SIZE;
  const int mi_y = mi_row * MI_SIZE;
  for (plane = plane_from; plane <= plane_to; ++plane) {
776 777 778
    const struct macroblockd_plane *pd = &xd->plane[plane];
    const int bw = 4 * num_4x4_blocks_wide_lookup[bsize] >> pd->subsampling_x;
    const int bh = 4 * num_4x4_blocks_high_lookup[bsize] >> pd->subsampling_y;
Jingning Han's avatar
Jingning Han committed
779 780

    if (xd->mi[0]->mbmi.sb_type < BLOCK_8X8) {
781 782 783 784 785 786 787
      const PARTITION_TYPE bp = bsize - xd->mi[0]->mbmi.sb_type;
      const int have_vsplit = bp != PARTITION_HORZ;
      const int have_hsplit = bp != PARTITION_VERT;
      const int num_4x4_w = 2 >> ((!have_vsplit) | pd->subsampling_x);
      const int num_4x4_h = 2 >> ((!have_hsplit) | pd->subsampling_y);
      const int pw = 8 >> (have_vsplit | pd->subsampling_x);
      const int ph = 8 >> (have_hsplit | pd->subsampling_y);
788
      int x, y;
789
      assert(bp != PARTITION_NONE && bp < PARTITION_TYPES);
Jingning Han's avatar
Jingning Han committed
790
      assert(bsize == BLOCK_8X8);
791
      assert(pw * num_4x4_w == bw && ph * num_4x4_h == bh);
Jingning Han's avatar
Jingning Han committed
792 793
      for (y = 0; y < num_4x4_h; ++y)
        for (x = 0; x < num_4x4_w; ++x)
clang-format's avatar
clang-format committed
794
          build_inter_predictors(xd, plane,
Yue Chen's avatar
Yue Chen committed
795
#if CONFIG_MOTION_VAR
clang-format's avatar
clang-format committed
796
                                 0, 0,
Yue Chen's avatar
Yue Chen committed
797
#endif  // CONFIG_MOTION_VAR
clang-format's avatar
clang-format committed
798
                                 y * 2 + x, bw, bh, 4 * x, 4 * y, pw, ph,
799
#if CONFIG_SUPERTX && CONFIG_EXT_INTER
clang-format's avatar
clang-format committed
800
                                 0, 0,
801
#endif  // CONFIG_SUPERTX && CONFIG_EXT_INTER
clang-format's avatar
clang-format committed
802
                                 mi_x, mi_y);
Jingning Han's avatar
Jingning Han committed
803
    } else {
804
      build_inter_predictors(xd, plane,
Yue Chen's avatar
Yue Chen committed
805
#if CONFIG_MOTION_VAR
806
                             0, 0,
Yue Chen's avatar
Yue Chen committed
807
#endif  // CONFIG_MOTION_VAR
clang-format's avatar
clang-format committed
808
                             0, bw, bh, 0, 0, bw, bh,
809 810 811 812
#if CONFIG_SUPERTX && CONFIG_EXT_INTER
                             0, 0,
#endif  // CONFIG_SUPERTX && CONFIG_EXT_INTER
                             mi_x, mi_y);
Jingning Han's avatar
Jingning Han committed
813 814 815 816
    }
  }
}

Yaowu Xu's avatar
Yaowu Xu committed
817 818
void av1_build_inter_predictors_sby(MACROBLOCKD *xd, int mi_row, int mi_col,
                                    BLOCK_SIZE bsize) {
Jingning Han's avatar
Jingning Han committed
819
  build_inter_predictors_for_planes(xd, bsize, mi_row, mi_col, 0, 0);
820 821
#if CONFIG_EXT_INTER
  if (is_interintra_pred(&xd->mi[0]->mbmi))
Yaowu Xu's avatar
Yaowu Xu committed
822 823
    av1_build_interintra_predictors_sby(xd, xd->plane[0].dst.buf,
                                        xd->plane[0].dst.stride, bsize);
824
#endif  // CONFIG_EXT_INTER
Jingning Han's avatar
Jingning Han committed
825 826
}

Yaowu Xu's avatar
Yaowu Xu committed
827 828
void av1_build_inter_predictors_sbp(MACROBLOCKD *xd, int mi_row, int mi_col,
                                    BLOCK_SIZE bsize, int plane) {
Jingning Han's avatar
Jingning Han committed
829
  build_inter_predictors_for_planes(xd, bsize, mi_row, mi_col, plane, plane);