filter.c 40 KB
Newer Older
John Koleszar's avatar
John Koleszar committed
1
/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */


#include <stdlib.h>
Johann's avatar
Johann committed
13
14
#include "filter.h"
#include "vpx_ports/mem.h"
John Koleszar's avatar
John Koleszar committed
15

John Koleszar's avatar
John Koleszar committed
16
DECLARE_ALIGNED(16, const short, vp8_bilinear_filters[SUBPEL_SHIFTS][2]) = {
17
#if SUBPEL_SHIFTS==16
John Koleszar's avatar
John Koleszar committed
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
  { 128,   0 },
  { 120,   8 },
  { 112,  16 },
  { 104,  24 },
  {  96,  32 },
  {  88,  40 },
  {  80,  48 },
  {  72,  56 },
  {  64,  64 },
  {  56,  72 },
  {  48,  80 },
  {  40,  88 },
  {  32,  96 },
  {  24, 104 },
  {  16, 112 },
  {   8, 120 }
34
#else
John Koleszar's avatar
John Koleszar committed
35
36
37
38
39
40
41
42
  { 128,   0 },
  { 112,  16 },
  {  96,  32 },
  {  80,  48 },
  {  64,  64 },
  {  48,  80 },
  {  32,  96 },
  {  16, 112 }
43
#endif  /* SUBPEL_SHIFTS==16 */
John Koleszar's avatar
John Koleszar committed
44
45
};

46
#define FILTER_ALPHA       0
47
#define FILTER_ALPHA_SHARP 1
48
DECLARE_ALIGNED(16, const short, vp8_sub_pel_filters_8[SUBPEL_SHIFTS][8]) = {
49
50
#if SUBPEL_SHIFTS==16
#if FILTER_ALPHA == 0
John Koleszar's avatar
John Koleszar committed
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
  /* Lagrangian interpolation filter */
  { 0,   0,   0, 128,   0,   0,   0,  0},
  { 0,   1,  -5, 126,   8,  -3,   1,  0},
  { -1,   3, -10, 122,  18,  -6,   2,  0},
  { -1,   4, -13, 118,  27,  -9,   3, -1},
  { -1,   4, -16, 112,  37, -11,   4, -1},
  { -1,   5, -18, 105,  48, -14,   4, -1},
  { -1,   5, -19,  97,  58, -16,   5, -1},
  { -1,   6, -19,  88,  68, -18,   5, -1},
  { -1,   6, -19,  78,  78, -19,   6, -1},
  { -1,   5, -18,  68,  88, -19,   6, -1},
  { -1,   5, -16,  58,  97, -19,   5, -1},
  { -1,   4, -14,  48, 105, -18,   5, -1},
  { -1,   4, -11,  37, 112, -16,   4, -1},
  { -1,   3,  -9,  27, 118, -13,   4, -1},
  { 0,   2,  -6,  18, 122, -10,   3, -1},
  { 0,   1,  -3,   8, 126,  -5,   1,  0}
68
#elif FILTER_ALPHA == 50
John Koleszar's avatar
John Koleszar committed
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
  /* Generated using MATLAB:
   * alpha = 0.5;
   * b=intfilt(8,4,alpha);
   * bi=round(128*b);
   * ba=flipud(reshape([bi 0], 8, 8));
   * disp(num2str(ba, '%d,'))
   */
  { 0,   0,   0, 128,   0,   0,   0,  0},
  { 0,   1,  -5, 126,   8,  -3,   1,  0},
  { 0,   2, -10, 122,  18,  -6,   2,  0},
  { -1,   3, -13, 118,  27,  -9,   3,  0},
  { -1,   4, -16, 112,  37, -11,   3,  0},
  { -1,   5, -17, 104,  48, -14,   4, -1},
  { -1,   5, -18,  96,  58, -16,   5, -1},
  { -1,   5, -19,  88,  68, -17,   5, -1},
  { -1,   5, -18,  78,  78, -18,   5, -1},
  { -1,   5, -17,  68,  88, -19,   5, -1},
  { -1,   5, -16,  58,  96, -18,   5, -1},
  { -1,   4, -14,  48, 104, -17,   5, -1},
  { 0,   3, -11,  37, 112, -16,   4, -1},
  { 0,   3,  -9,  27, 118, -13,   3, -1},
  { 0,   2,  -6,  18, 122, -10,   2,  0},
  { 0,   1,  -3,   8, 126,  -5,   1,  0}
92
93
94
#endif  /* FILTER_ALPHA */
#else   /* SUBPEL_SHIFTS==16 */
#if FILTER_ALPHA == 0
John Koleszar's avatar
John Koleszar committed
95
96
97
98
99
100
101
102
  { 0,   0,   0, 128,   0,   0,   0,   0},
  { -1,   3, -10, 122,  18,  -6,   2,   0},
  { -1,   4, -16, 112,  37, -11,   4,  -1},
  { -1,   5, -19,  97,  58, -16,   5,  -1},
  { -1,   6, -19,  78,  78, -19,   6,  -1},
  { -1,   5, -16,  58,  97, -19,   5,  -1},
  { -1,   4, -11,  37, 112, -16,   4,  -1},
  { 0,   2,  -6,  18, 122, -10,   3,  -1},
103
#elif FILTER_ALPHA == 50
John Koleszar's avatar
John Koleszar committed
104
105
106
107
108
109
110
111
112
  /* alpha = 0.50 */
  { 0,   0,   0, 128,   0,   0,   0,  0},
  { 0,   2, -10, 122,  18,  -6,   2,  0},
  { -1,   4, -16, 112,  37, -11,   3,  0},
  { -1,   5, -18,  96,  58, -16,   5, -1},
  { -1,   5, -18,  78,  78, -18,   5, -1},
  { -1,   5, -16,  58,  96, -18,   5, -1},
  { 0,   3, -11,  37, 112, -16,   4, -1},
  { 0,   2,  -6,  18, 122, -10,   2,  0}
113
114
115
116
#endif  /* FILTER_ALPHA */
#endif  /* SUBPEL_SHIFTS==16 */
};

117
DECLARE_ALIGNED(16, const short, vp8_sub_pel_filters_8s[SUBPEL_SHIFTS][8]) = {
118
#if SUBPEL_SHIFTS==16
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
#if FILTER_ALPHA_SHARP == 1
  /* dct based filter */
  {0,   0,   0, 128,   0,   0,   0, 0},
  {-1,   3,  -7, 127,   8,  -3,   1, 0},
  {-2,   5, -13, 125,  17,  -6,   3, -1},
  {-3,   7, -17, 121,  27, -10,   5, -2},
  {-4,   9, -20, 115,  37, -13,   6, -2},
  {-4,  10, -23, 108,  48, -16,   8, -3},
  {-4,  10, -24, 100,  59, -19,   9, -3},
  {-4,  11, -24,  90,  70, -21,  10, -4},
  {-4,  11, -23,  80,  80, -23,  11, -4},
  {-4,  10, -21,  70,  90, -24,  11, -4},
  {-3,   9, -19,  59, 100, -24,  10, -4},
  {-3,   8, -16,  48, 108, -23,  10, -4},
  {-2,   6, -13,  37, 115, -20,   9, -4},
  {-2,   5, -10,  27, 121, -17,   7, -3},
  {-1,   3,  -6,  17, 125, -13,   5, -2},
  {0,   1,  -3,   8, 127,  -7,   3, -1}
#elif FILTER_ALPHA_SHARP == 75
138
  /* alpha = 0.75 */
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
  {0,   0,   0, 128,   0,   0,   0, 0},
  {-1,   2,  -6, 126,   9,  -3,   2, -1},
  {-1,   4, -11, 123,  18,  -7,   3, -1},
  {-2,   6, -16, 119,  28, -10,   5, -2},
  {-2,   7, -19, 113,  38, -13,   6, -2},
  {-3,   8, -21, 106,  49, -16,   7, -2},
  {-3,   9, -22,  99,  59, -19,   8, -3},
  {-3,   9, -23,  90,  70, -21,   9, -3},
  {-3,   9, -22,  80,  80, -22,   9, -3},
  {-3,   9, -21,  70,  90, -23,   9, -3},
  {-3,   8, -19,  59,  99, -22,   9, -3},
  {-2,   7, -16,  49, 106, -21,   8, -3},
  {-2,   6, -13,  38, 113, -19,   7, -2},
  {-2,   5, -10,  28, 119, -16,   6, -2},
  {-1,   3,  -7,  18, 123, -11,   4, -1},
  {-1,   2,  -3,   9, 126,  -6,   2, -1}
#elif FILTER_ALPHA_SHARP == 65
John Koleszar's avatar
John Koleszar committed
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
  /* alpha = 0.65 */
  { 0,   0,   0, 128,   0,   0,   0,  0},
  { 0,   2,  -6, 126,   8,  -3,   1,  0},
  { -1,   3, -10, 123,  18,  -6,   2, -1},
  { -1,   5, -14, 118,  27, -10,   4, -1},
  { -1,   5, -17, 112,  38, -13,   5, -1},
  { -2,   6, -19, 106,  48, -15,   5, -1},
  { -2,   7, -21,  98,  59, -17,   6, -2},
  { -2,   7, -21,  89,  69, -19,   7, -2},
  { -2,   7, -20,  79,  79, -20,   7, -2},
  { -2,   7, -19,  69,  89, -21,   7, -2},
  { -2,   6, -17,  59,  98, -21,   7, -2},
  { -1,   5, -15,  48, 106, -19,   6, -2},
  { -1,   5, -13,  38, 112, -17,   5, -1},
  { -1,   4, -10,  27, 118, -14,   5, -1},
  { -1,   2,  -6,  18, 123, -10,   3, -1},
  { 0,   1,  -3,   8, 126,  -6,   2,  0}
173
#endif  /* FILTER_ALPHA_SHARP */
174
#else   /* SUBPEL_SHIFTS==16 */
175
#if FILTER_ALPHA_SHARP == 1
176
  /* dct based filter */
177
178
179
180
181
182
183
184
185
  {0,   0,   0, 128,   0,   0,   0, 0},
  {-2,   5, -13, 125,  17,  -6,   3, -1},
  {-4,   9, -20, 115,  37, -13,   6, -2},
  {-4,  10, -24, 100,  59, -19,   9, -3},
  {-4,  10, -23,  81,  81, -23,  10, -4},
  {-3,   9, -19,  59, 100, -24,  10, -4},
  {-2,   6, -13,  37, 115, -20,   9, -4},
  {-1,   3,  -6,  17, 125, -13,   5, -2}
#elif FILTER_ALPHA_SHARP == 75
186
  /* alpha = 0.75 */
187
188
189
190
191
192
193
194
195
  {0,   0,   0, 128,   0,   0,   0, 0},
  {-1,   4, -11, 123,  18,  -7,   3, -1},
  {-2,   7, -19, 113,  38, -13,   6, -2},
  {-3,   9, -22,  99,  59, -19,   8, -3},
  {-3,   9, -22,  80,  80, -22,   9, -3},
  {-3,   8, -19,  59,  99, -22,   9, -3},
  {-2,   6, -13,  38, 113, -19,   7, -2},
  {-1,   3,  -7,  18, 123, -11,   4, -1}
#elif FILTER_ALPHA_SHARP == 65
John Koleszar's avatar
John Koleszar committed
196
197
198
199
200
201
202
203
204
  /* alpha = 0.65 */
  { 0,   0,   0, 128,   0,   0,   0, 0},
  { -1,   3, -10, 123,  18,  -6,   2, -1},
  { -1,   5, -17, 112,  38, -13,   5, -1},
  { -2,   7, -21,  98,  59, -17,   6, -2},
  { -2,   7, -20,  79,  79, -20,   7, -2},
  { -2,   6, -17,  59,  98, -21,   7, -2},
  { -1,   5, -13,  38, 112, -17,   5, -1},
  { -1,   2,  -6,  18, 123, -10,   3, -1}
205
#endif  /* FILTER_ALPHA_SHARP */
206
#endif  /* SUBPEL_SHIFTS==16 */
207
};
208

John Koleszar's avatar
John Koleszar committed
209
DECLARE_ALIGNED(16, const short, vp8_sub_pel_filters_6[SUBPEL_SHIFTS][6]) = {
210
#if SUBPEL_SHIFTS==16
John Koleszar's avatar
John Koleszar committed
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
  {0,   0, 128,   0,   0, 0},
  {1,  -5, 125,   8,  -2, 1},
  {1,  -8, 122,  17,  -5, 1},
  {2, -11, 116,  27,  -8, 2},
  {3, -14, 110,  37, -10, 2},
  {3, -15, 103,  47, -12, 2},
  {3, -16,  95,  57, -14, 3},
  {3, -16,  86,  67, -15, 3},
  {3, -16,  77,  77, -16, 3},
  {3, -15,  67,  86, -16, 3},
  {3, -14,  57,  95, -16, 3},
  {2, -12,  47, 103, -15, 3},
  {2, -10,  37, 110, -14, 3},
  {2,  -8,  27, 116, -11, 2},
  {1,  -5,  17, 122,  -8, 1},
  {1,  -2,   8, 125,  -5, 1}
227
#else
John Koleszar's avatar
John Koleszar committed
228
229
230
231
232
233
234
235
  { 0,  0,  128,    0,   0,  0 },         /* note that 1/8 pel positions are just as per alpha -0.5 bicubic */
  { 0, -6,  123,   12,  -1,  0 },
  { 2, -11, 108,   36,  -8,  1 },         /* New 1/4 pel 6 tap filter */
  { 0, -9,   93,   50,  -6,  0 },
  { 3, -16,  77,   77, -16,  3 },         /* New 1/2 pel 6 tap filter */
  { 0, -6,   50,   93,  -9,  0 },
  { 1, -8,   36,  108, -11,  2 },         /* New 1/4 pel 6 tap filter */
  { 0, -1,   12,  123,  -6,  0 },
236
#endif  /* SUBPEL_SHIFTS==16 */
John Koleszar's avatar
John Koleszar committed
237
};
238

239
static void filter_block2d_first_pass_6
John Koleszar's avatar
John Koleszar committed
240
(
John Koleszar's avatar
John Koleszar committed
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
  unsigned char *src_ptr,
  int *output_ptr,
  unsigned int src_pixels_per_line,
  unsigned int pixel_step,
  unsigned int output_height,
  unsigned int output_width,
  const short *vp8_filter
) {
  unsigned int i, j;
  int  Temp;

  for (i = 0; i < output_height; i++) {
    for (j = 0; j < output_width; j++) {
      Temp = ((int)src_ptr[-2 * (int)pixel_step] * vp8_filter[0]) +
             ((int)src_ptr[-1 * (int)pixel_step] * vp8_filter[1]) +
             ((int)src_ptr[0]                    * vp8_filter[2]) +
             ((int)src_ptr[pixel_step]           * vp8_filter[3]) +
             ((int)src_ptr[2 * pixel_step]         * vp8_filter[4]) +
             ((int)src_ptr[3 * pixel_step]         * vp8_filter[5]) +
             (VP8_FILTER_WEIGHT >> 1);      /* Rounding */

      /* Normalize back to 0-255 */
      Temp = Temp >> VP8_FILTER_SHIFT;

      if (Temp < 0)
        Temp = 0;
      else if (Temp > 255)
        Temp = 255;

      output_ptr[j] = Temp;
      src_ptr++;
John Koleszar's avatar
John Koleszar committed
272
    }
John Koleszar's avatar
John Koleszar committed
273
274
275
276
277

    /* Next row... */
    src_ptr    += src_pixels_per_line - output_width;
    output_ptr += output_width;
  }
John Koleszar's avatar
John Koleszar committed
278
279
}

280
static void filter_block2d_second_pass_6
John Koleszar's avatar
John Koleszar committed
281
(
John Koleszar's avatar
John Koleszar committed
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
  int *src_ptr,
  unsigned char *output_ptr,
  int output_pitch,
  unsigned int src_pixels_per_line,
  unsigned int pixel_step,
  unsigned int output_height,
  unsigned int output_width,
  const short *vp8_filter
) {
  unsigned int i, j;
  int  Temp;

  for (i = 0; i < output_height; i++) {
    for (j = 0; j < output_width; j++) {
      /* Apply filter */
      Temp = ((int)src_ptr[-2 * (int)pixel_step] * vp8_filter[0]) +
             ((int)src_ptr[-1 * (int)pixel_step] * vp8_filter[1]) +
             ((int)src_ptr[0]                    * vp8_filter[2]) +
             ((int)src_ptr[pixel_step]           * vp8_filter[3]) +
             ((int)src_ptr[2 * pixel_step]         * vp8_filter[4]) +
             ((int)src_ptr[3 * pixel_step]         * vp8_filter[5]) +
             (VP8_FILTER_WEIGHT >> 1);   /* Rounding */

      /* Normalize back to 0-255 */
      Temp = Temp >> VP8_FILTER_SHIFT;

      if (Temp < 0)
        Temp = 0;
      else if (Temp > 255)
        Temp = 255;

      output_ptr[j] = (unsigned char)Temp;
      src_ptr++;
John Koleszar's avatar
John Koleszar committed
315
    }
John Koleszar's avatar
John Koleszar committed
316
317
318
319
320

    /* Start next row */
    src_ptr    += src_pixels_per_line - output_width;
    output_ptr += output_pitch;
  }
John Koleszar's avatar
John Koleszar committed
321
322
}

323
324
325
326
327
328
329
330
/*
 * The only functional difference between filter_block2d_second_pass()
 * and this function is that filter_block2d_second_pass() does a sixtap
 * filter on the input and stores it in the output. This function
 * (filter_block2d_second_pass_avg()) does a sixtap filter on the input,
 * and then averages that with the content already present in the output
 * ((filter_result + dest + 1) >> 1) and stores that in the output.
 */
331
static void filter_block2d_second_pass_avg_6
332
(
John Koleszar's avatar
John Koleszar committed
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
  int *src_ptr,
  unsigned char *output_ptr,
  int output_pitch,
  unsigned int src_pixels_per_line,
  unsigned int pixel_step,
  unsigned int output_height,
  unsigned int output_width,
  const short *vp8_filter
) {
  unsigned int i, j;
  int  Temp;

  for (i = 0; i < output_height; i++) {
    for (j = 0; j < output_width; j++) {
      /* Apply filter */
      Temp = ((int)src_ptr[-2 * (int)pixel_step] * vp8_filter[0]) +
             ((int)src_ptr[-1 * (int)pixel_step] * vp8_filter[1]) +
             ((int)src_ptr[0]                    * vp8_filter[2]) +
             ((int)src_ptr[pixel_step]           * vp8_filter[3]) +
             ((int)src_ptr[2 * pixel_step]         * vp8_filter[4]) +
             ((int)src_ptr[3 * pixel_step]         * vp8_filter[5]) +
             (VP8_FILTER_WEIGHT >> 1);   /* Rounding */

      /* Normalize back to 0-255 */
      Temp = Temp >> VP8_FILTER_SHIFT;

      if (Temp < 0)
        Temp = 0;
      else if (Temp > 255)
        Temp = 255;

      output_ptr[j] = (unsigned char)((output_ptr[j] + Temp + 1) >> 1);
      src_ptr++;
366
    }
John Koleszar's avatar
John Koleszar committed
367
368
369
370
371

    /* Start next row */
    src_ptr    += src_pixels_per_line - output_width;
    output_ptr += output_pitch;
  }
372
}
John Koleszar's avatar
John Koleszar committed
373

374
375
#define Interp_Extend 3
static void filter_block2d_6
John Koleszar's avatar
John Koleszar committed
376
(
John Koleszar's avatar
John Koleszar committed
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
  unsigned char  *src_ptr,
  unsigned char  *output_ptr,
  unsigned int src_pixels_per_line,
  int output_pitch,
  const short  *HFilter,
  const short  *VFilter
) {
  int FData[(3 + Interp_Extend * 2) * 4]; /* Temp data buffer used in filtering */

  /* First filter 1-D horizontally... */
  filter_block2d_first_pass_6(src_ptr - ((Interp_Extend - 1) * src_pixels_per_line), FData, src_pixels_per_line, 1,
                              3 + Interp_Extend * 2, 4, HFilter);

  /* then filter verticaly... */
  filter_block2d_second_pass_6(FData + 4 * (Interp_Extend - 1), output_ptr, output_pitch, 4, 4, 4, 4, VFilter);
John Koleszar's avatar
John Koleszar committed
392
393
394
395
396
}


void vp8_sixtap_predict_c
(
John Koleszar's avatar
John Koleszar committed
397
398
399
400
401
402
403
404
405
406
407
408
409
410
  unsigned char  *src_ptr,
  int   src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;

  HFilter = vp8_sub_pel_filters_6[xoffset];   /* 6 tap */
  VFilter = vp8_sub_pel_filters_6[yoffset];   /* 6 tap */

  filter_block2d_6(src_ptr, dst_ptr, src_pixels_per_line, dst_pitch, HFilter, VFilter);
John Koleszar's avatar
John Koleszar committed
411
}
412
413
414
415
416
417
418
419
420
421

/*
 * The difference between filter_block2d_6() and filter_block2d_avg_6 is
 * that filter_block2d_6() does a 6-tap filter and stores it in the output
 * buffer, whereas filter_block2d_avg_6() does the same 6-tap filter, and
 * then averages that with the content already present in the output
 * ((filter_result + dest + 1) >> 1) and stores that in the output.
 */
static void filter_block2d_avg_6
(
John Koleszar's avatar
John Koleszar committed
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
  unsigned char  *src_ptr,
  unsigned char  *output_ptr,
  unsigned int src_pixels_per_line,
  int output_pitch,
  const short  *HFilter,
  const short  *VFilter
) {
  int FData[(3 + Interp_Extend * 2) * 4]; /* Temp data buffer used in filtering */

  /* First filter 1-D horizontally... */
  filter_block2d_first_pass_6(src_ptr - ((Interp_Extend - 1) * src_pixels_per_line),
                              FData, src_pixels_per_line, 1,
                              3 + Interp_Extend * 2, 4, HFilter);

  /* then filter verticaly... */
  filter_block2d_second_pass_avg_6(FData + 4 * (Interp_Extend - 1), output_ptr,
                                   output_pitch, 4, 4, 4, 4, VFilter);
439
440
441
442
}

void vp8_sixtap_predict_avg_c
(
John Koleszar's avatar
John Koleszar committed
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
  unsigned char  *src_ptr,
  int   src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;

  HFilter = vp8_sub_pel_filters_6[xoffset];   /* 6 tap */
  VFilter = vp8_sub_pel_filters_6[yoffset];   /* 6 tap */

  filter_block2d_avg_6(src_ptr, dst_ptr, src_pixels_per_line,
                       dst_pitch, HFilter, VFilter);
458
459
}

John Koleszar's avatar
John Koleszar committed
460
461
void vp8_sixtap_predict8x8_c
(
John Koleszar's avatar
John Koleszar committed
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;
  // int FData[(7+Interp_Extend*2)*16];   /* Temp data buffer used in filtering */
  int FData[(7 + Interp_Extend * 2) * 8]; /* Temp data buffer used in filtering */

  HFilter = vp8_sub_pel_filters_6[xoffset];   /* 6 tap */
  VFilter = vp8_sub_pel_filters_6[yoffset];   /* 6 tap */

  /* First filter 1-D horizontally... */
  filter_block2d_first_pass_6(src_ptr - ((Interp_Extend - 1) * src_pixels_per_line), FData, src_pixels_per_line, 1,
                              7 + Interp_Extend * 2, 8, HFilter);


  /* then filter verticaly... */
  filter_block2d_second_pass_6(FData + 8 * (Interp_Extend - 1), dst_ptr, dst_pitch, 8, 8, 8, 8, VFilter);
John Koleszar's avatar
John Koleszar committed
484
485
486

}

487
488
void vp8_sixtap_predict_avg8x8_c
(
John Koleszar's avatar
John Koleszar committed
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;
  // int FData[(7+Interp_Extend*2)*16];   /* Temp data buffer used in filtering */
  int FData[(7 + Interp_Extend * 2) * 8]; /* Temp data buffer used in filtering */

  HFilter = vp8_sub_pel_filters_6[xoffset];   /* 6 tap */
  VFilter = vp8_sub_pel_filters_6[yoffset];   /* 6 tap */

  /* First filter 1-D horizontally... */
  filter_block2d_first_pass_6(src_ptr - ((Interp_Extend - 1) * src_pixels_per_line), FData, src_pixels_per_line, 1,
                              7 + Interp_Extend * 2, 8, HFilter);

  /* then filter verticaly... */
  filter_block2d_second_pass_avg_6(FData + 8 * (Interp_Extend - 1), dst_ptr, dst_pitch, 8, 8, 8, 8, VFilter);
510
511
}

John Koleszar's avatar
John Koleszar committed
512
513
void vp8_sixtap_predict8x4_c
(
John Koleszar's avatar
John Koleszar committed
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;
  // int FData[(7+Interp_Extend*2)*16];   /* Temp data buffer used in filtering */
  int FData[(3 + Interp_Extend * 2) * 8]; /* Temp data buffer used in filtering */

  HFilter = vp8_sub_pel_filters_6[xoffset];   /* 6 tap */
  VFilter = vp8_sub_pel_filters_6[yoffset];   /* 6 tap */

  /* First filter 1-D horizontally... */
  filter_block2d_first_pass_6(src_ptr - ((Interp_Extend - 1) * src_pixels_per_line), FData, src_pixels_per_line, 1,
                              3 + Interp_Extend * 2, 8, HFilter);


  /* then filter verticaly... */
  filter_block2d_second_pass_6(FData + 8 * (Interp_Extend - 1), dst_ptr, dst_pitch, 8, 8, 4, 8, VFilter);
John Koleszar's avatar
John Koleszar committed
536
537
538
539
540

}

void vp8_sixtap_predict16x16_c
(
John Koleszar's avatar
John Koleszar committed
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;
  // int FData[(15+Interp_Extend*2)*24];   /* Temp data buffer used in filtering */
  int FData[(15 + Interp_Extend * 2) * 16]; /* Temp data buffer used in filtering */


  HFilter = vp8_sub_pel_filters_6[xoffset];   /* 6 tap */
  VFilter = vp8_sub_pel_filters_6[yoffset];   /* 6 tap */

  /* First filter 1-D horizontally... */
  filter_block2d_first_pass_6(src_ptr - ((Interp_Extend - 1) * src_pixels_per_line), FData, src_pixels_per_line, 1,
                              15 + Interp_Extend * 2, 16, HFilter);

  /* then filter verticaly... */
  filter_block2d_second_pass_6(FData + 16 * (Interp_Extend - 1), dst_ptr, dst_pitch, 16, 16, 16, 16, VFilter);
John Koleszar's avatar
John Koleszar committed
563
564
565

}

566
567
void vp8_sixtap_predict_avg16x16_c
(
John Koleszar's avatar
John Koleszar committed
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;
  // int FData[(15+Interp_Extend*2)*24];   /* Temp data buffer used in filtering */
  int FData[(15 + Interp_Extend * 2) * 16]; /* Temp data buffer used in filtering */

  HFilter = vp8_sub_pel_filters_6[xoffset];   /* 6 tap */
  VFilter = vp8_sub_pel_filters_6[yoffset];   /* 6 tap */

  /* First filter 1-D horizontally... */
  filter_block2d_first_pass_6(src_ptr - ((Interp_Extend - 1) * src_pixels_per_line), FData,
                              src_pixels_per_line, 1, 15 + Interp_Extend * 2, 16, HFilter);

  /* then filter verticaly... */
  filter_block2d_second_pass_avg_6(FData + 16 * (Interp_Extend - 1), dst_ptr, dst_pitch,
589
590
                                   16, 16, 16, 16, VFilter);
}
John Koleszar's avatar
John Koleszar committed
591

592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
typedef enum {
  VPX_FILTER_4x4 = 0,
  VPX_FILTER_8x8 = 1,
  VPX_FILTER_8x4 = 2,
  VPX_FILTER_16x16 = 3,
} filter_size_t;

static const unsigned int filter_size_to_wh[][2] = {
  {4, 4},
  {8, 8},
  {8, 4},
  {16,16},
};

static const unsigned int filter_max_height = 16;
static const unsigned int filter_max_width = 16;
608

609
static void vp8_filter_block2d_8_c
610
(
611
612
613
614
615
616
617
 const unsigned char *src_ptr,
 const unsigned int   src_stride,
 const short *HFilter,
 const short *VFilter,
 const filter_size_t filter_size,
 unsigned char *dst_ptr,
 unsigned int   dst_stride
John Koleszar's avatar
John Koleszar committed
618
) {
619
620
621
622
623
624
625
626
627
628
629
630
  const unsigned int output_width = filter_size_to_wh[filter_size][0];
  const unsigned int output_height = filter_size_to_wh[filter_size][1];

  // Between passes, we use an intermediate buffer whose height is extended to
  // have enough horizontally filtered values as input for the vertical pass.
  // This buffer is allocated to be big enough for the largest block type we
  // support.
  const int kInterp_Extend = 4;
  const unsigned int intermediate_height =
    (kInterp_Extend - 1) +     output_height + kInterp_Extend;
  const unsigned int max_intermediate_height =
    (kInterp_Extend - 1) + filter_max_height + kInterp_Extend;
Yaowu Xu's avatar
Yaowu Xu committed
631
632
633
634
#ifdef _MSC_VER
  // MSVC does not support C99 style declaration
  unsigned char intermediate_buffer[23 * 16];
#else
635
  unsigned char intermediate_buffer[max_intermediate_height * filter_max_width];
Yaowu Xu's avatar
Yaowu Xu committed
636
#endif
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
  const int intermediate_next_stride = 1 - intermediate_height * output_width;

  // Horizontal pass (src -> transposed intermediate).
  {
    unsigned char *output_ptr = intermediate_buffer;
    const int src_next_row_stride = src_stride - output_width;
    unsigned int i, j;
    src_ptr -= (kInterp_Extend - 1) * src_stride + (kInterp_Extend - 1);
    for (i = 0; i < intermediate_height; i++) {
      for (j = 0; j < output_width; j++) {
        // Apply filter...
        int temp = ((int)src_ptr[0] * HFilter[0]) +
                   ((int)src_ptr[1] * HFilter[1]) +
                   ((int)src_ptr[2] * HFilter[2]) +
                   ((int)src_ptr[3] * HFilter[3]) +
                   ((int)src_ptr[4] * HFilter[4]) +
                   ((int)src_ptr[5] * HFilter[5]) +
                   ((int)src_ptr[6] * HFilter[6]) +
                   ((int)src_ptr[7] * HFilter[7]) +
                   (VP8_FILTER_WEIGHT >> 1); // Rounding

        // Normalize back to 0-255...
        temp >>= VP8_FILTER_SHIFT;
        if (temp < 0) {
          temp = 0;
        } else if (temp > 255) {
          temp = 255;
        }
        src_ptr++;
        *output_ptr = temp;
        output_ptr += intermediate_height;
      }
      src_ptr += src_next_row_stride;
      output_ptr += intermediate_next_stride;
671
    }
John Koleszar's avatar
John Koleszar committed
672
673
  }

674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
  // Vertical pass (transposed intermediate -> dst).
  {
    unsigned char *src_ptr = intermediate_buffer;
    const int dst_next_row_stride = dst_stride - output_width;
    unsigned int i, j;
    for (i = 0; i < output_height; i++) {
      for (j = 0; j < output_width; j++) {
        // Apply filter...
        int temp = ((int)src_ptr[0] * VFilter[0]) +
                   ((int)src_ptr[1] * VFilter[1]) +
                   ((int)src_ptr[2] * VFilter[2]) +
                   ((int)src_ptr[3] * VFilter[3]) +
                   ((int)src_ptr[4] * VFilter[4]) +
                   ((int)src_ptr[5] * VFilter[5]) +
                   ((int)src_ptr[6] * VFilter[6]) +
                   ((int)src_ptr[7] * VFilter[7]) +
                   (VP8_FILTER_WEIGHT >> 1); // Rounding

        // Normalize back to 0-255...
        temp >>= VP8_FILTER_SHIFT;
        if (temp < 0) {
          temp = 0;
        } else if (temp > 255) {
          temp = 255;
        }

        src_ptr += intermediate_height;
        *dst_ptr++ = (unsigned char)temp;
      }
      src_ptr += intermediate_next_stride;
      dst_ptr += dst_next_row_stride;
705
    }
John Koleszar's avatar
John Koleszar committed
706
  }
707
708
}

709
static void vp8_block2d_average_c
710
(
711
712
  unsigned char *src,
  unsigned int   src_stride,
John Koleszar's avatar
John Koleszar committed
713
  unsigned char *output_ptr,
714
715
  unsigned int output_stride,
  const filter_size_t filter_size
John Koleszar's avatar
John Koleszar committed
716
) {
717
718
  const unsigned int output_width = filter_size_to_wh[filter_size][0];
  const unsigned int output_height = filter_size_to_wh[filter_size][1];
John Koleszar's avatar
John Koleszar committed
719

720
  unsigned int i, j;
John Koleszar's avatar
John Koleszar committed
721
722
  for (i = 0; i < output_height; i++) {
    for (j = 0; j < output_width; j++) {
723
      output_ptr[j] = (output_ptr[j] + src[i * src_stride + j] + 1) >> 1;
724
    }
725
    output_ptr += output_stride;
John Koleszar's avatar
John Koleszar committed
726
  }
727
728
}

729
730
#define vp8_filter_block2d_8 vp8_filter_block2d_8_c
#define vp8_block2d_average vp8_block2d_average_c
731

732
733
void vp8_eighttap_predict_c
(
John Koleszar's avatar
John Koleszar committed
734
735
736
737
738
739
740
741
742
743
  unsigned char  *src_ptr,
  int   src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;

744
745
  HFilter = vp8_sub_pel_filters_8[xoffset];
  VFilter = vp8_sub_pel_filters_8[yoffset];
John Koleszar's avatar
John Koleszar committed
746

747
748
749
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_4x4,
                       dst_ptr, dst_pitch);
750
751
}

752
753
void vp8_eighttap_predict_avg4x4_c
(
John Koleszar's avatar
John Koleszar committed
754
755
756
757
758
759
760
  unsigned char  *src_ptr,
  int   src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int dst_pitch
) {
761
762
763
764
765
766
767
768
  const short  *HFilter = vp8_sub_pel_filters_8[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8[yoffset];
  unsigned char tmp[4 * 4];

  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_4x4,
                       tmp, 4);
  vp8_block2d_average(tmp, 4, dst_ptr, dst_pitch, VPX_FILTER_4x4);
769
770
}

771
772
void vp8_eighttap_predict_sharp_c
(
John Koleszar's avatar
John Koleszar committed
773
774
775
776
777
778
779
780
781
782
  unsigned char  *src_ptr,
  int   src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int dst_pitch
) {
  const short  *HFilter;
  const short  *VFilter;

783
784
  HFilter = vp8_sub_pel_filters_8s[xoffset];
  VFilter = vp8_sub_pel_filters_8s[yoffset];
John Koleszar's avatar
John Koleszar committed
785

786
787
788
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_4x4,
                       dst_ptr, dst_pitch);
789
790
}

791
792
void vp8_eighttap_predict_avg4x4_sharp_c
(
John Koleszar's avatar
John Koleszar committed
793
794
795
796
797
798
799
  unsigned char  *src_ptr,
  int   src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int dst_pitch
) {
800
801
802
803
804
805
806
807
  const short  *HFilter = vp8_sub_pel_filters_8s[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8s[yoffset];
  unsigned char tmp[4 * 4];

  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_4x4,
                       tmp, 4);
  vp8_block2d_average(tmp, 4, dst_ptr, dst_pitch, VPX_FILTER_4x4);
808
809
}

810
811
void vp8_eighttap_predict8x8_c
(
John Koleszar's avatar
John Koleszar committed
812
813
814
815
816
817
818
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
819
820
  const short  *HFilter = vp8_sub_pel_filters_8[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8[yoffset];
John Koleszar's avatar
John Koleszar committed
821

822
823
824
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_8x8,
                       dst_ptr, dst_pitch);
825
826
827
828
}

void vp8_eighttap_predict8x8_sharp_c
(
John Koleszar's avatar
John Koleszar committed
829
830
831
832
833
834
835
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
836
837
  const short  *HFilter = vp8_sub_pel_filters_8s[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8s[yoffset];
John Koleszar's avatar
John Koleszar committed
838

839
840
841
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_8x8,
                       dst_ptr, dst_pitch);
842
843
844
845
}

void vp8_eighttap_predict_avg8x8_c
(
John Koleszar's avatar
John Koleszar committed
846
847
848
849
850
851
852
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
853
854
855
856
857
858
859
860
  unsigned char tmp[8 * 8];
  const short  *HFilter = vp8_sub_pel_filters_8[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8[yoffset];

  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_8x8,
                       tmp, 8);
  vp8_block2d_average(tmp, 8, dst_ptr, dst_pitch, VPX_FILTER_8x8);
861
862
863
864
}

void vp8_eighttap_predict_avg8x8_sharp_c
(
John Koleszar's avatar
John Koleszar committed
865
866
867
868
869
870
871
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
872
873
874
875
876
877
878
879
  unsigned char tmp[8 * 8];
  const short  *HFilter = vp8_sub_pel_filters_8s[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8s[yoffset];

  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_8x8,
                       tmp, 8);
  vp8_block2d_average(tmp, 8, dst_ptr, dst_pitch, VPX_FILTER_8x8);
880
881
882
883
}

void vp8_eighttap_predict8x4_c
(
John Koleszar's avatar
John Koleszar committed
884
885
886
887
888
889
890
891
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {

892
893
  const short  *HFilter = vp8_sub_pel_filters_8[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8[yoffset];
894

895
896
897
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_8x4,
                       dst_ptr, dst_pitch);
898
899
900
901
}

void vp8_eighttap_predict8x4_sharp_c
(
John Koleszar's avatar
John Koleszar committed
902
903
904
905
906
907
908
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
909
910
  const short  *HFilter = vp8_sub_pel_filters_8s[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8s[yoffset];
911

912
913
914
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_8x4,
                       dst_ptr, dst_pitch);
915
916
917
918
}

void vp8_eighttap_predict16x16_c
(
John Koleszar's avatar
John Koleszar committed
919
920
921
922
923
924
925
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
926
927
  const short  *HFilter = vp8_sub_pel_filters_8[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8[yoffset];
928

929
930
931
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_16x16,
                       dst_ptr, dst_pitch);
932
933
934
935
}

void vp8_eighttap_predict16x16_sharp_c
(
John Koleszar's avatar
John Koleszar committed
936
937
938
939
940
941
942
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
943
944
  const short  *HFilter = vp8_sub_pel_filters_8s[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8s[yoffset];
945

946
947
948
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_16x16,
                       dst_ptr, dst_pitch);
949
950
951
952
}

void vp8_eighttap_predict_avg16x16_c
(
John Koleszar's avatar
John Koleszar committed
953
954
955
956
957
958
959
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
960
  unsigned char tmp[16 * 16];
John Koleszar's avatar
John Koleszar committed
961

962
963
  const short  *HFilter = vp8_sub_pel_filters_8[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8[yoffset];
John Koleszar's avatar
John Koleszar committed
964

965
966
967
968
  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_16x16,
                       tmp, 16);
  vp8_block2d_average(tmp, 16, dst_ptr, dst_pitch, VPX_FILTER_16x16);
969
970
971
972
}

void vp8_eighttap_predict_avg16x16_sharp_c
(
John Koleszar's avatar
John Koleszar committed
973
974
975
976
977
978
979
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
980
981
982
983
984
985
986
987
  unsigned char tmp[16 * 16];
  const short  *HFilter = vp8_sub_pel_filters_8s[xoffset];
  const short  *VFilter = vp8_sub_pel_filters_8s[yoffset];

  vp8_filter_block2d_8(src_ptr, src_pixels_per_line,
                       HFilter, VFilter, VPX_FILTER_16x16,
                       tmp, 16);
  vp8_block2d_average(tmp, 16, dst_ptr, dst_pitch, VPX_FILTER_16x16);
988
989
}

John Koleszar's avatar
John Koleszar committed
990
991
992
993
/****************************************************************************
 *
 *  ROUTINE       : filter_block2d_bil_first_pass
 *
Johann's avatar
Johann committed
994
995
996
997
998
 *  INPUTS        : UINT8  *src_ptr    : Pointer to source block.
 *                  UINT32  src_stride : Stride of source block.
 *                  UINT32  height     : Block height.
 *                  UINT32  width      : Block width.
 *                  INT32  *vp8_filter : Array of 2 bi-linear filter taps.
John Koleszar's avatar
John Koleszar committed
999
 *
Johann's avatar
Johann committed
1000
 *  OUTPUTS       : INT32  *dst_ptr    : Pointer to filtered block.
John Koleszar's avatar
John Koleszar committed
1001
1002
1003
 *
 *  RETURNS       : void
 *
Johann's avatar
Johann committed
1004
1005
1006
 *  FUNCTION      : Applies a 1-D 2-tap bi-linear filter to the source block
 *                  in the horizontal direction to produce the filtered output
 *                  block. Used to implement first-pass of 2-D separable filter.
John Koleszar's avatar
John Koleszar committed
1007
1008
1009
1010
1011
 *
 *  SPECIAL NOTES : Produces INT32 output to retain precision for next pass.
 *                  Two filter taps should sum to VP8_FILTER_WEIGHT.
 *
 ****************************************************************************/
1012
static void filter_block2d_bil_first_pass
John Koleszar's avatar
John Koleszar committed
1013
(
John Koleszar's avatar
John Koleszar committed
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
  unsigned char  *src_ptr,
  unsigned short *dst_ptr,
  unsigned int    src_stride,
  unsigned int    height,
  unsigned int    width,
  const short    *vp8_filter
) {
  unsigned int i, j;

  for (i = 0; i < height; i++) {
    for (j = 0; j < width; j++) {
      /* Apply bilinear filter */
      dst_ptr[j] = (((int)src_ptr[0] * vp8_filter[0]) +
                    ((int)src_ptr[1] * vp8_filter[1]) +
                    (VP8_FILTER_WEIGHT / 2)) >> VP8_FILTER_SHIFT;
      src_ptr++;
John Koleszar's avatar
John Koleszar committed
1030
    }
John Koleszar's avatar
John Koleszar committed
1031
1032
1033
1034
1035

    /* Next row... */
    src_ptr += src_stride - width;
    dst_ptr += width;
  }
John Koleszar's avatar
John Koleszar committed
1036
1037
1038
1039
1040
1041
}

/****************************************************************************
 *
 *  ROUTINE       : filter_block2d_bil_second_pass
 *
Johann's avatar
Johann committed
1042
1043
1044
1045
1046
 *  INPUTS        : INT32  *src_ptr    : Pointer to source block.
 *                  UINT32  dst_pitch  : Destination block pitch.
 *                  UINT32  height     : Block height.
 *                  UINT32  width      : Block width.
 *                  INT32  *vp8_filter : Array of 2 bi-linear filter taps.
John Koleszar's avatar
John Koleszar committed
1047
 *
Johann's avatar
Johann committed
1048
 *  OUTPUTS       : UINT16 *dst_ptr    : Pointer to filtered block.
John Koleszar's avatar
John Koleszar committed
1049
1050
1051
 *
 *  RETURNS       : void
 *
Johann's avatar
Johann committed
1052
1053
1054
 *  FUNCTION      : Applies a 1-D 2-tap bi-linear filter to the source block
 *                  in the vertical direction to produce the filtered output
 *                  block. Used to implement second-pass of 2-D separable filter.
John Koleszar's avatar
John Koleszar committed
1055
1056
1057
1058
1059
 *
 *  SPECIAL NOTES : Requires 32-bit input as produced by filter_block2d_bil_first_pass.
 *                  Two filter taps should sum to VP8_FILTER_WEIGHT.
 *
 ****************************************************************************/
1060
static void filter_block2d_bil_second_pass
John Koleszar's avatar
John Koleszar committed
1061
(
John Koleszar's avatar
John Koleszar committed
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
  unsigned short *src_ptr,
  unsigned char  *dst_ptr,
  int             dst_pitch,
  unsigned int    height,
  unsigned int    width,
  const short    *vp8_filter
) {
  unsigned int  i, j;
  int  Temp;

  for (i = 0; i < height; i++) {
    for (j = 0; j < width; j++) {
      /* Apply filter */
      Temp = ((int)src_ptr[0]     * vp8_filter[0]) +
             ((int)src_ptr[width] * vp8_filter[1]) +
             (VP8_FILTER_WEIGHT / 2);
      dst_ptr[j] = (unsigned int)(Temp >> VP8_FILTER_SHIFT);
      src_ptr++;
John Koleszar's avatar
John Koleszar committed
1080
    }
John Koleszar's avatar
John Koleszar committed
1081
1082
1083
1084

    /* Next row... */
    dst_ptr += dst_pitch;
  }
John Koleszar's avatar
John Koleszar committed
1085
1086
}

1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
/*
 * As before for filter_block2d_second_pass_avg(), the functional difference
 * between filter_block2d_bil_second_pass() and filter_block2d_bil_second_pass_avg()
 * is that filter_block2d_bil_second_pass() does a bilinear filter on input
 * and stores the result in output; filter_block2d_bil_second_pass_avg(),
 * instead, does a bilinear filter on input, averages the resulting value
 * with the values already present in the output and stores the result of
 * that back into the output ((filter_result + dest + 1) >> 1).
 */
static void filter_block2d_bil_second_pass_avg
(
John Koleszar's avatar
John Koleszar committed
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
1115
  unsigned short *src_ptr,
  unsigned char  *dst_ptr,
  int             dst_pitch,
  unsigned int    height,
  unsigned int    width,
  const short    *vp8_filter
) {
  unsigned int  i, j;
  int  Temp;

  for (i = 0; i < height; i++) {
    for (j = 0; j < width; j++) {
      /* Apply filter */
      Temp = ((int)src_ptr[0]     * vp8_filter[0]) +
             ((int)src_ptr[width] * vp8_filter[1]) +
             (VP8_FILTER_WEIGHT / 2);
      dst_ptr[j] = (unsigned int)(((Temp >> VP8_FILTER_SHIFT) + dst_ptr[j] + 1) >> 1);
      src_ptr++;
1116
    }
John Koleszar's avatar
John Koleszar committed
1117
1118
1119
1120

    /* Next row... */
    dst_ptr += dst_pitch;
  }
1121
}
John Koleszar's avatar
John Koleszar committed
1122
1123
1124
1125
1126
1127

/****************************************************************************
 *
 *  ROUTINE       : filter_block2d_bil
 *
 *  INPUTS        : unsigned char *src_ptr   : Pointer to source block.
 *                  unsigned int   src_pitch : Stride of source block.
 *                  unsigned int   dst_pitch : Stride of destination block.
 *                  const short   *HFilter   : Array of 2 horizontal filter
 *                                             taps.
 *                  const short   *VFilter   : Array of 2 vertical filter
 *                                             taps.
 *                  int            Width     : Block width.
 *                  int            Height    : Block height.
 *
 *  OUTPUTS       : unsigned char *dst_ptr   : Pointer to filtered block.
 *
 *  RETURNS       : void
 *
 *  FUNCTION      : 2-D filters an input block by applying a 2-tap
 *                  bi-linear filter horizontally followed by a 2-tap
 *                  bi-linear filter vertically on the result.
 *
 *  SPECIAL NOTES : The intermediate buffer holds 17 * 16 entries and the
 *                  horizontal pass produces Height + 1 rows of Width
 *                  entries, so the largest block that can be handled here
 *                  is 16x16.  Width and Height are not checked.
 *
 ****************************************************************************/
static void filter_block2d_bil(unsigned char *src_ptr,
                               unsigned char *dst_ptr,
                               unsigned int src_pitch,
                               unsigned int dst_pitch,
                               const short *HFilter,
                               const short *VFilter,
                               int Width,
                               int Height) {
  /* Output of the horizontal pass: (Height + 1) packed rows of Width. */
  unsigned short horiz[17 * 16];

  /* Horizontal pass; one extra row feeds the vertical filter's second tap. */
  filter_block2d_bil_first_pass(src_ptr, horiz, src_pitch,
                                Height + 1, Width, HFilter);

  /* Vertical pass writes the final samples into the destination. */
  filter_block2d_bil_second_pass(horiz, dst_ptr, dst_pitch,
                                 Height, Width, VFilter);
}

1167
1168
/*
 * 2-D bilinear filter whose result is averaged into the destination.
 *
 * Runs filter_block2d_bil_first_pass() horizontally over Height + 1 rows
 * into a 17 * 16 entry intermediate buffer, then
 * filter_block2d_bil_second_pass_avg() vertically into dst_ptr.  The buffer
 * size limits blocks to 16x16; Width and Height are not checked.
 */
static void filter_block2d_bil_avg(unsigned char *src_ptr,
                                   unsigned char *dst_ptr,
                                   unsigned int src_pitch,
                                   unsigned int dst_pitch,
                                   const short *HFilter,
                                   const short *VFilter,
                                   int Width,
                                   int Height) {
  /* Output of the horizontal pass: (Height + 1) packed rows of Width. */
  unsigned short horiz[17 * 16];

  /* Horizontal pass; one extra row feeds the vertical filter's second tap. */
  filter_block2d_bil_first_pass(src_ptr, horiz, src_pitch,
                                Height + 1, Width, HFilter);

  /* Vertical pass, averaged with what dst_ptr already holds. */
  filter_block2d_bil_second_pass_avg(horiz, dst_ptr, dst_pitch,
                                     Height, Width, VFilter);
}
John Koleszar's avatar
John Koleszar committed
1186
1187
1188

void vp8_bilinear_predict4x4_c
(
John Koleszar's avatar
John Koleszar committed
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
  unsigned char  *src_ptr,
  int   src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int dst_pitch
) {
  const short *HFilter;
  const short *VFilter;

  HFilter = vp8_bilinear_filters[xoffset];
  VFilter = vp8_bilinear_filters[yoffset];
John Koleszar's avatar
John Koleszar committed
1201
#if 0
John Koleszar's avatar
John Koleszar committed
1202
1203
1204
1205
1206
1207
1208
  {
    int i;
    unsigned char temp1[16];
    unsigned char temp2[16];

    bilinear_predict4x4_mmx(src_ptr, src_pixels_per_line, xoffset, yoffset, temp1, 4);
    filter_block2d_bil(src_ptr, temp2, src_pixels_per_line, 4, HFilter, VFilter, 4, 4);
John Koleszar's avatar
John Koleszar committed
1209

John Koleszar's avatar
John Koleszar committed
1210
1211
    for (i = 0; i < 16; i++) {
      if (temp1[i] != temp2[i]) {
John Koleszar's avatar
John Koleszar committed
1212
        bilinear_predict4x4_mmx(src_ptr, src_pixels_per_line, xoffset, yoffset, temp1, 4);
1213
        filter_block2d_bil(src_ptr, temp2, src_pixels_per_line, 4, HFilter, VFilter, 4, 4);
John Koleszar's avatar
John Koleszar committed
1214
      }
John Koleszar's avatar
John Koleszar committed
1215
    }
John Koleszar's avatar
John Koleszar committed
1216
  }
John Koleszar's avatar
John Koleszar committed
1217
#endif
John Koleszar's avatar
John Koleszar committed
1218
  filter_block2d_bil(src_ptr, dst_ptr, src_pixels_per_line, dst_pitch, HFilter, VFilter, 4, 4);
John Koleszar's avatar
John Koleszar committed
1219
1220
1221

}

1222
1223
void vp8_bilinear_predict_avg4x4_c
(
John Koleszar's avatar
John Koleszar committed
1224
1225
1226
1227
1228
1229
1230
1231
1232
1233
1234
1235
1236
1237
1238
  unsigned char  *src_ptr,
  int   src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int dst_pitch
) {
  const short *HFilter;
  const short *VFilter;

  HFilter = vp8_bilinear_filters[xoffset];
  VFilter = vp8_bilinear_filters[yoffset];

  filter_block2d_bil_avg(src_ptr, dst_ptr, src_pixels_per_line,
                         dst_pitch, HFilter, VFilter, 4, 4);
1239
1240
}

John Koleszar's avatar
John Koleszar committed
1241
1242
void vp8_bilinear_predict8x8_c
(
John Koleszar's avatar
John Koleszar committed
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short *HFilter;
  const short *VFilter;

  HFilter = vp8_bilinear_filters[xoffset];
  VFilter = vp8_bilinear_filters[yoffset];

  filter_block2d_bil(src_ptr, dst_ptr, src_pixels_per_line, dst_pitch, HFilter, VFilter, 8, 8);
John Koleszar's avatar
John Koleszar committed
1257
1258
1259

}

1260
1261
void vp8_bilinear_predict_avg8x8_c
(
John Koleszar's avatar
John Koleszar committed
1262
1263
1264
1265
1266
1267
1268
1269
1270
1271
1272
1273
1274
1275
1276
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short *HFilter;
  const short *VFilter;

  HFilter = vp8_bilinear_filters[xoffset];
  VFilter = vp8_bilinear_filters[yoffset];

  filter_block2d_bil_avg(src_ptr, dst_ptr, src_pixels_per_line,
                         dst_pitch, HFilter, VFilter, 8, 8);
1277
1278
}

John Koleszar's avatar
John Koleszar committed
1279
1280
void vp8_bilinear_predict8x4_c
(
John Koleszar's avatar
John Koleszar committed
1281
1282
1283
1284
1285
1286
1287
1288
1289
1290
1291
1292
1293
1294
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short *HFilter;
  const short *VFilter;

  HFilter = vp8_bilinear_filters[xoffset];
  VFilter = vp8_bilinear_filters[yoffset];

  filter_block2d_bil(src_ptr, dst_ptr, src_pixels_per_line, dst_pitch, HFilter, VFilter, 8, 4);
John Koleszar's avatar
John Koleszar committed
1295
1296
1297
1298
1299

}

void vp8_bilinear_predict16x16_c
(
John Koleszar's avatar
John Koleszar committed
1300
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short *HFilter;
  const short *VFilter;

  HFilter = vp8_bilinear_filters[xoffset];
  VFilter = vp8_bilinear_filters[yoffset];

  filter_block2d_bil(src_ptr, dst_ptr, src_pixels_per_line, dst_pitch, HFilter, VFilter, 16, 16);
John Koleszar's avatar
John Koleszar committed
1314
}
1315
1316
1317

void vp8_bilinear_predict_avg16x16_c
(
John Koleszar's avatar
John Koleszar committed
1318
1319
1320
1321
1322
1323
1324
1325
1326
1327
1328
1329
1330
1331
1332
  unsigned char  *src_ptr,
  int  src_pixels_per_line,
  int  xoffset,
  int  yoffset,
  unsigned char *dst_ptr,
  int  dst_pitch
) {
  const short *HFilter;
  const short *VFilter;

  HFilter = vp8_bilinear_filters[xoffset];
  VFilter = vp8_bilinear_filters[yoffset];

  filter_block2d_bil_avg(src_ptr, dst_ptr, src_pixels_per_line,
                         dst_pitch, HFilter, VFilter, 16, 16);
1333
}