lpf_8_test.cc 27.2 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
/*
 *  Copyright (c) 2014 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

#include <cmath>
#include <cstdlib>
#include <string>

#include "third_party/googletest/src/include/gtest/gtest.h"
16
17
18

#include "./vpx_config.h"
#include "./vpx_dsp_rtcd.h"
19
20
21
22
23
#include "test/acm_random.h"
#include "test/clear_system_state.h"
#include "test/register_state_check.h"
#include "test/util.h"
#include "vp9/common/vp9_entropy.h"
Deb Mukherjee's avatar
Deb Mukherjee committed
24
#include "vp9/common/vp9_loopfilter.h"
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
#include "vpx/vpx_integer.h"

using libvpx_test::ACMRandom;

namespace {
// Horizontal and vertical filters both need a 32x32 block:
//   8  coefficients preceding the filtered section,
//   16 coefficients within the filtered section,
//   8  coefficients following the filtered section.
const int kNumCoeffs = 1024;

// Number of randomized input blocks each test case runs through the filters.
const int number_of_iterations = 10000;

#if CONFIG_VP9_HIGHBITDEPTH
// High-bitdepth loop filter signature: 16-bit samples 's' with pitch 'p',
// one set of blimit/limit/thresh tables, a 'count' and the bit depth 'bd'.
typedef void (*loop_op_t)(uint16_t *s, int p, const uint8_t *blimit,
                          const uint8_t *limit, const uint8_t *thresh,
                          int count, int bd);
// High-bitdepth dual loop filter signature: like loop_op_t but with two sets
// of blimit/limit/thresh tables and no 'count' argument.
typedef void (*dual_loop_op_t)(uint16_t *s, int p, const uint8_t *blimit0,
                               const uint8_t *limit0, const uint8_t *thresh0,
                               const uint8_t *blimit1, const uint8_t *limit1,
                               const uint8_t *thresh1, int bd);
45
46
47
48
49
50
51
52
53
54
55

// wrapper for loopfilter functions without a 'count' param.
typedef void (*loop_op_nc_t)(uint16_t *s, int p, const uint8_t *blimit,
                             const uint8_t *limit, const uint8_t *thresh,
                             int bd);
template <loop_op_nc_t fn>
void wrapper_nc(uint16_t *s, int p, const uint8_t *blimit,
                const uint8_t *limit, const uint8_t *thresh,
                int /*count*/, int bd) {
  fn(s, p, blimit, limit, thresh, bd);
}
56
57
58
59
60
61
62
63
64
#else
// 8-bit loop filter signature: samples 's' with pitch 'p', one set of
// blimit/limit/thresh tables and a 'count'.
typedef void (*loop_op_t)(uint8_t *s, int p, const uint8_t *blimit,
                          const uint8_t *limit, const uint8_t *thresh,
                          int count);
// 8-bit dual loop filter signature: like loop_op_t but with two sets of
// blimit/limit/thresh tables and no 'count' argument.
typedef void (*dual_loop_op_t)(uint8_t *s, int p, const uint8_t *blimit0,
                               const uint8_t *limit0, const uint8_t *thresh0,
                               const uint8_t *blimit1, const uint8_t *limit1,
                               const uint8_t *thresh1);

65
66
67
68
69
70
71
72
// wrapper for loopfilter functions without a 'count' param.
typedef void (*loop_op_nc_t)(uint8_t *s, int p, const uint8_t *blimit,
                             const uint8_t *limit, const uint8_t *thresh);
template <loop_op_nc_t fn>
void wrapper_nc(uint8_t *s, int p, const uint8_t *blimit,
                const uint8_t *limit, const uint8_t *thresh,
                int /*count*/) {
  fn(s, p, blimit, limit, thresh);
73
74
75
}
#endif  // CONFIG_VP9_HIGHBITDEPTH

76
77
// Test parameters for Loop8Test6Param:
//   (function under test, reference function, bit depth, count).
typedef std::tr1::tuple<loop_op_t, loop_op_t, int, int> loop8_param_t;
// Test parameters for Loop8Test9Param:
//   (function under test, reference function, bit depth).
typedef std::tr1::tuple<dual_loop_op_t, dual_loop_op_t, int> dualloop8_param_t;
78

79
80
81
82
83
84
85
// Fixture for loop filters that take a single set of thresholds.
// Parameter tuple layout (see SetUp):
//   0: function under test, 1: reference function, 2: bit depth, 3: count.
class Loop8Test6Param : public ::testing::TestWithParam<loop8_param_t> {
 public:
  virtual ~Loop8Test6Param() {}
  virtual void SetUp() {
    loopfilter_op_ = GET_PARAM(0);
    ref_loopfilter_op_ = GET_PARAM(1);
    bit_depth_ = GET_PARAM(2);
    count_ = GET_PARAM(3);
    // All-ones mask of bit_depth_ bits; the tests AND random samples with it.
    mask_ = (1 << bit_depth_) - 1;
  }

  virtual void TearDown() { libvpx_test::ClearSystemState(); }

 protected:
  int bit_depth_;
  int count_;
  int mask_;
  loop_op_t loopfilter_op_;
  loop_op_t ref_loopfilter_op_;
};

// Fixture for dual loop filters, which take two sets of thresholds.
// Parameter tuple layout (see SetUp):
//   0: function under test, 1: reference function, 2: bit depth.
class Loop8Test9Param : public ::testing::TestWithParam<dualloop8_param_t> {
 public:
  virtual ~Loop8Test9Param() {}

  virtual void SetUp() {
    const int depth = GET_PARAM(2);
    bit_depth_ = depth;
    // All-ones mask of 'depth' bits; the tests AND random samples with it.
    mask_ = (1 << depth) - 1;
    loopfilter_op_ = GET_PARAM(0);
    ref_loopfilter_op_ = GET_PARAM(1);
  }

  virtual void TearDown() { libvpx_test::ClearSystemState(); }

 protected:
  dual_loop_op_t loopfilter_op_;
  dual_loop_op_t ref_loopfilter_op_;
  int bit_depth_;
  int mask_;
};

// Feeds the filter under test and the reference filter identical input made
// of fresh random samples mixed with runs that step by (limit - 1), then
// counts every sample where the two outputs differ.
TEST_P(Loop8Test6Param, OperationCheck) {
  ACMRandom rnd(ACMRandom::DeterministicSeed());
  const int count_test_block = number_of_iterations;
#if CONFIG_VP9_HIGHBITDEPTH
  const int32_t bd = bit_depth_;
  DECLARE_ALIGNED(16, uint16_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(16, uint16_t, ref_s[kNumCoeffs]);
#else
  DECLARE_ALIGNED(8, uint8_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(8, uint8_t, ref_s[kNumCoeffs]);
#endif  // CONFIG_VP9_HIGHBITDEPTH
  int err_count_total = 0;
  int first_failure = -1;
  for (int i = 0; i < count_test_block; ++i) {
    int err_count = 0;
    // Each threshold table holds one random value replicated 16 times.
    uint8_t tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    const int32_t p = kNumCoeffs / 32;

    uint16_t tmp_s[kNumCoeffs];
    int j = 0;
    while (j < kNumCoeffs) {
      const uint8_t val = rnd.Rand8();
      if (val & 0x80) {  // 50% chance to choose a new value.
        tmp_s[j] = rnd.Rand16();
        j++;
      } else {  // 50% chance to repeat previous value in row X times.
        int k = 0;
        while (k++ < ((val & 0x1f) + 1) && j < kNumCoeffs) {
          if (j < 1) {
            tmp_s[j] = rnd.Rand16();
          } else if (val & 0x20) {  // Increment by a value within the limit.
            tmp_s[j] = (tmp_s[j - 1] + (*limit - 1));
          } else {  // Decrement by a value within the limit.
            tmp_s[j] = (tmp_s[j - 1] - (*limit - 1));
          }
          j++;
        }
      }
    }
    // Odd iterations use tmp_s as generated; even iterations read it with
    // row and column indices swapped.
    for (j = 0; j < kNumCoeffs; j++) {
      if (i % 2) {
        s[j] = tmp_s[j] & mask_;
      } else {
        s[j] = tmp_s[p * (j % p) + j / p] & mask_;
      }
      ref_s[j] = s[j];
    }
#if CONFIG_VP9_HIGHBITDEPTH
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit, limit, thresh, count_, bd);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit, limit, thresh, count_, bd));
#else
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit, limit, thresh, count_);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit, limit, thresh, count_));
#endif  // CONFIG_VP9_HIGHBITDEPTH

    for (j = 0; j < kNumCoeffs; ++j) {
      err_count += ref_s[j] != s[j];
    }
    if (err_count && !err_count_total) {
      first_failure = i;
    }
    err_count_total += err_count;
  }
  EXPECT_EQ(0, err_count_total)
      << "Error: Loop8Test6Param, C output doesn't match SSE2 "
         "loopfilter output. "
      << "First failed at test case " << first_failure;
}

// Feeds the filter under test and the reference filter identical, fully
// random input (masked to the bit depth) and counts every sample where the
// two outputs differ.
TEST_P(Loop8Test6Param, ValueCheck) {
  ACMRandom rnd(ACMRandom::DeterministicSeed());
  const int count_test_block = number_of_iterations;
#if CONFIG_VP9_HIGHBITDEPTH
  const int32_t bd = bit_depth_;
  DECLARE_ALIGNED(16, uint16_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(16, uint16_t, ref_s[kNumCoeffs]);
#else
  DECLARE_ALIGNED(8, uint8_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(8, uint8_t, ref_s[kNumCoeffs]);
#endif  // CONFIG_VP9_HIGHBITDEPTH
  int err_count_total = 0;
  int first_failure = -1;

  // NOTE: The code in vp9_loopfilter.c:update_sharpness computes mblim as a
  // function of sharpness_lvl and the loopfilter lvl as:
  // block_inside_limit = lvl >> ((sharpness_lvl > 0) + (sharpness_lvl > 4));
  // ...
  // memset(lfi->lfthr[lvl].mblim, (2 * (lvl + 2) + block_inside_limit),
  //        SIMD_WIDTH);
  // This means that the largest value for mblim will occur when sharpness_lvl
  // is equal to 0, and lvl is equal to its greatest value (MAX_LOOP_FILTER).
  // In this case block_inside_limit will be equal to MAX_LOOP_FILTER and
  // therefore mblim will be equal to (2 * (lvl + 2) + block_inside_limit) =
  // 2 * (MAX_LOOP_FILTER + 2) + MAX_LOOP_FILTER = 3 * MAX_LOOP_FILTER + 4

  for (int i = 0; i < count_test_block; ++i) {
    int err_count = 0;
    // Each threshold table holds one random value replicated 16 times.
    uint8_t tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    const int32_t p = kNumCoeffs / 32;
    for (int j = 0; j < kNumCoeffs; ++j) {
      s[j] = rnd.Rand16() & mask_;
      ref_s[j] = s[j];
    }
#if CONFIG_VP9_HIGHBITDEPTH
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit, limit, thresh, count_, bd);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit, limit, thresh, count_, bd));
#else
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit, limit, thresh, count_);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit, limit, thresh, count_));
#endif  // CONFIG_VP9_HIGHBITDEPTH
    for (int j = 0; j < kNumCoeffs; ++j) {
      err_count += ref_s[j] != s[j];
    }
    if (err_count && !err_count_total) {
      first_failure = i;
    }
    err_count_total += err_count;
  }
  EXPECT_EQ(0, err_count_total)
      << "Error: Loop8Test6Param, C output doesn't match SSE2 "
         "loopfilter output. "
      << "First failed at test case " << first_failure;
}

// Feeds the dual filter under test and the reference dual filter identical
// input made of fresh random samples mixed with runs that step by
// (min(limit0, limit1) - 1), then counts every sample where the two outputs
// differ.
TEST_P(Loop8Test9Param, OperationCheck) {
  ACMRandom rnd(ACMRandom::DeterministicSeed());
  const int count_test_block = number_of_iterations;
#if CONFIG_VP9_HIGHBITDEPTH
  const int32_t bd = bit_depth_;
  DECLARE_ALIGNED(16, uint16_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(16, uint16_t, ref_s[kNumCoeffs]);
#else
  DECLARE_ALIGNED(8, uint8_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(8, uint8_t, ref_s[kNumCoeffs]);
#endif  // CONFIG_VP9_HIGHBITDEPTH
  int err_count_total = 0;
  int first_failure = -1;
  for (int i = 0; i < count_test_block; ++i) {
    int err_count = 0;
    // Each threshold table holds one random value replicated 16 times.
    uint8_t tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    const int32_t p = kNumCoeffs / 32;
    uint16_t tmp_s[kNumCoeffs];
    int j = 0;
    // Step size for the runs is derived from the smaller of the two limits.
    const uint8_t limit = *limit0 < *limit1 ? *limit0 : *limit1;
    while (j < kNumCoeffs) {
      const uint8_t val = rnd.Rand8();
      if (val & 0x80) {  // 50% chance to choose a new value.
        tmp_s[j] = rnd.Rand16();
        j++;
      } else {  // 50% chance to repeat previous value in row X times.
        int k = 0;
        while (k++ < ((val & 0x1f) + 1) && j < kNumCoeffs) {
          if (j < 1) {
            tmp_s[j] = rnd.Rand16();
          } else if (val & 0x20) {  // Increment by a value within the limit.
            tmp_s[j] = (tmp_s[j - 1] + (limit - 1));
          } else {  // Decrement by a value within the limit.
            tmp_s[j] = (tmp_s[j - 1] - (limit - 1));
          }
          j++;
        }
      }
    }
    // Odd iterations use tmp_s as generated; even iterations read it with
    // row and column indices swapped.
    for (j = 0; j < kNumCoeffs; j++) {
      if (i % 2) {
        s[j] = tmp_s[j] & mask_;
      } else {
        s[j] = tmp_s[p * (j % p) + j / p] & mask_;
      }
      ref_s[j] = s[j];
    }
#if CONFIG_VP9_HIGHBITDEPTH
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1, bd);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1, bd));
#else
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1));
#endif  // CONFIG_VP9_HIGHBITDEPTH
    for (j = 0; j < kNumCoeffs; ++j) {
      err_count += ref_s[j] != s[j];
    }
    if (err_count && !err_count_total) {
      first_failure = i;
    }
    err_count_total += err_count;
  }
  EXPECT_EQ(0, err_count_total)
      << "Error: Loop8Test9Param, C output doesn't match SSE2 "
         "loopfilter output. "
      << "First failed at test case " << first_failure;
}

// Feeds the dual filter under test and the reference dual filter identical,
// fully random input (masked to the bit depth) and counts every sample where
// the two outputs differ.
TEST_P(Loop8Test9Param, ValueCheck) {
  ACMRandom rnd(ACMRandom::DeterministicSeed());
  const int count_test_block = number_of_iterations;
#if CONFIG_VP9_HIGHBITDEPTH
  const int32_t bd = bit_depth_;
  DECLARE_ALIGNED(16, uint16_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(16, uint16_t, ref_s[kNumCoeffs]);
#else
  DECLARE_ALIGNED(8, uint8_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(8, uint8_t, ref_s[kNumCoeffs]);
#endif  // CONFIG_VP9_HIGHBITDEPTH
  int err_count_total = 0;
  int first_failure = -1;
  for (int i = 0; i < count_test_block; ++i) {
    int err_count = 0;
    // Each threshold table holds one random value replicated 16 times.
    uint8_t tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    const int32_t p = kNumCoeffs / 32;  // TODO(pdlf) can we have non-square here?
    for (int j = 0; j < kNumCoeffs; ++j) {
      s[j] = rnd.Rand16() & mask_;
      ref_s[j] = s[j];
    }
#if CONFIG_VP9_HIGHBITDEPTH
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1, bd);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1, bd));
#else
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1));
#endif  // CONFIG_VP9_HIGHBITDEPTH
    for (int j = 0; j < kNumCoeffs; ++j) {
      err_count += ref_s[j] != s[j];
    }
    if (err_count && !err_count_total) {
      first_failure = i;
    }
    err_count_total += err_count;
  }
  // The first literal needs its trailing space; without it the adjacent
  // literals concatenate to "SSE2loopfilter".
  EXPECT_EQ(0, err_count_total)
      << "Error: Loop8Test9Param, C output doesn't match SSE2 "
         "loopfilter output. "
      << "First failed at test case " << first_failure;
}

using std::tr1::make_tuple;

457
458
459
460
#if HAVE_MMX && !CONFIG_VP9_HIGHBITDEPTH
// MMX filters paired with their C counterparts.
// Tuple layout: (function under test, reference function, bit depth, count).
INSTANTIATE_TEST_CASE_P(
    MMX, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_mmx, &vpx_lpf_horizontal_4_c, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_4_mmx>,
                   &wrapper_nc<vpx_lpf_vertical_4_c>, 8, 1)));
#endif  // HAVE_MMX && !CONFIG_VP9_HIGHBITDEPTH

466
467
468
#if HAVE_SSE2
// SSE2 filters paired with their C counterparts.
// Tuple layout: (function under test, reference function, bit depth, count).
#if CONFIG_VP9_HIGHBITDEPTH
INSTANTIATE_TEST_CASE_P(
    SSE2, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&vpx_highbd_lpf_horizontal_4_sse2,
                   &vpx_highbd_lpf_horizontal_4_c, 8, 1),
        make_tuple(&vpx_highbd_lpf_vertical_4_sse2,
                   &vpx_highbd_lpf_vertical_4_c, 8, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_8_sse2,
                   &vpx_highbd_lpf_horizontal_8_c, 8, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_16_sse2,
                   &vpx_highbd_lpf_horizontal_16_c, 8, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_16_sse2,
                   &vpx_highbd_lpf_horizontal_16_c, 8, 2),
        make_tuple(&vpx_highbd_lpf_vertical_8_sse2,
                   &vpx_highbd_lpf_vertical_8_c, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_c>, 8, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_4_sse2,
                   &vpx_highbd_lpf_horizontal_4_c, 10, 1),
        make_tuple(&vpx_highbd_lpf_vertical_4_sse2,
                   &vpx_highbd_lpf_vertical_4_c, 10, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_8_sse2,
                   &vpx_highbd_lpf_horizontal_8_c, 10, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_16_sse2,
                   &vpx_highbd_lpf_horizontal_16_c, 10, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_16_sse2,
                   &vpx_highbd_lpf_horizontal_16_c, 10, 2),
        make_tuple(&vpx_highbd_lpf_vertical_8_sse2,
                   &vpx_highbd_lpf_vertical_8_c, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_c>, 10, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_4_sse2,
                   &vpx_highbd_lpf_horizontal_4_c, 12, 1),
        make_tuple(&vpx_highbd_lpf_vertical_4_sse2,
                   &vpx_highbd_lpf_vertical_4_c, 12, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_8_sse2,
                   &vpx_highbd_lpf_horizontal_8_c, 12, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_16_sse2,
                   &vpx_highbd_lpf_horizontal_16_c, 12, 1),
        make_tuple(&vpx_highbd_lpf_horizontal_16_sse2,
                   &vpx_highbd_lpf_horizontal_16_c, 12, 2),
        make_tuple(&vpx_highbd_lpf_vertical_8_sse2,
                   &vpx_highbd_lpf_vertical_8_c, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_c>, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_dual_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_dual_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_dual_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_dual_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_dual_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_dual_c>, 12, 1)));
#else
INSTANTIATE_TEST_CASE_P(
    SSE2, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_8_sse2, &vpx_lpf_horizontal_8_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_16_sse2, &vpx_lpf_horizontal_16_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_16_sse2, &vpx_lpf_horizontal_16_c, 8, 2),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_8_sse2>,
                   &wrapper_nc<vpx_lpf_vertical_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_sse2>,
                   &wrapper_nc<vpx_lpf_vertical_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_dual_sse2>,
                   &wrapper_nc<vpx_lpf_vertical_16_dual_c>, 8, 1)));
#endif  // CONFIG_VP9_HIGHBITDEPTH
#endif  // HAVE_SSE2

levytamar82's avatar
levytamar82 committed
535
536
#if HAVE_AVX2 && (!CONFIG_VP9_HIGHBITDEPTH)
// AVX2 filters paired with their C counterparts.
// Tuple layout: (function under test, reference function, bit depth, count).
INSTANTIATE_TEST_CASE_P(
    AVX2, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_16_avx2, &vpx_lpf_horizontal_16_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_16_avx2, &vpx_lpf_horizontal_16_c, 8,
                   2)));
#endif  // HAVE_AVX2 && (!CONFIG_VP9_HIGHBITDEPTH)

544
545
546
#if HAVE_SSE2
// SSE2 dual filters paired with their C counterparts.
// Tuple layout: (function under test, reference function, bit depth).
#if CONFIG_VP9_HIGHBITDEPTH
INSTANTIATE_TEST_CASE_P(
    SSE2, Loop8Test9Param,
    ::testing::Values(
        make_tuple(&vpx_highbd_lpf_horizontal_4_dual_sse2,
                   &vpx_highbd_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_highbd_lpf_horizontal_8_dual_sse2,
                   &vpx_highbd_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_highbd_lpf_vertical_4_dual_sse2,
                   &vpx_highbd_lpf_vertical_4_dual_c, 8),
        make_tuple(&vpx_highbd_lpf_vertical_8_dual_sse2,
                   &vpx_highbd_lpf_vertical_8_dual_c, 8),
        make_tuple(&vpx_highbd_lpf_horizontal_4_dual_sse2,
                   &vpx_highbd_lpf_horizontal_4_dual_c, 10),
        make_tuple(&vpx_highbd_lpf_horizontal_8_dual_sse2,
                   &vpx_highbd_lpf_horizontal_8_dual_c, 10),
        make_tuple(&vpx_highbd_lpf_vertical_4_dual_sse2,
                   &vpx_highbd_lpf_vertical_4_dual_c, 10),
        make_tuple(&vpx_highbd_lpf_vertical_8_dual_sse2,
                   &vpx_highbd_lpf_vertical_8_dual_c, 10),
        make_tuple(&vpx_highbd_lpf_horizontal_4_dual_sse2,
                   &vpx_highbd_lpf_horizontal_4_dual_c, 12),
        make_tuple(&vpx_highbd_lpf_horizontal_8_dual_sse2,
                   &vpx_highbd_lpf_horizontal_8_dual_c, 12),
        make_tuple(&vpx_highbd_lpf_vertical_4_dual_sse2,
                   &vpx_highbd_lpf_vertical_4_dual_c, 12),
        make_tuple(&vpx_highbd_lpf_vertical_8_dual_sse2,
                   &vpx_highbd_lpf_vertical_8_dual_c, 12)));
#else
INSTANTIATE_TEST_CASE_P(
    SSE2, Loop8Test9Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_dual_sse2,
                   &vpx_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_lpf_horizontal_8_dual_sse2,
                   &vpx_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_4_dual_sse2,
                   &vpx_lpf_vertical_4_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_8_dual_sse2,
                   &vpx_lpf_vertical_8_dual_c, 8)));
#endif  // CONFIG_VP9_HIGHBITDEPTH
#endif  // HAVE_SSE2
levytamar82's avatar
levytamar82 committed
587

588
589
590
591
#if HAVE_NEON
#if CONFIG_VP9_HIGHBITDEPTH
// No neon high bitdepth functions.
#else
// NEON filters paired with their C counterparts.
// Loop8Test6Param tuple layout:
//   (function under test, reference function, bit depth, count).
INSTANTIATE_TEST_CASE_P(
    NEON, Loop8Test6Param,
    ::testing::Values(
#if HAVE_NEON_ASM
// Using #if inside the macro is unsupported on MSVS but the tests are not
// currently built for MSVS with ARM and NEON.
        make_tuple(&vpx_lpf_horizontal_16_neon,
                   &vpx_lpf_horizontal_16_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_16_neon,
                   &vpx_lpf_horizontal_16_c, 8, 2),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_neon>,
                   &wrapper_nc<vpx_lpf_vertical_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_dual_neon>,
                   &wrapper_nc<vpx_lpf_vertical_16_dual_c>, 8, 1),
#endif  // HAVE_NEON_ASM
        make_tuple(&vpx_lpf_horizontal_8_neon,
                   &vpx_lpf_horizontal_8_c, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_8_neon>,
                   &wrapper_nc<vpx_lpf_vertical_8_c>, 8, 1),
        make_tuple(&vpx_lpf_horizontal_4_neon,
                   &vpx_lpf_horizontal_4_c, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_4_neon>,
                   &wrapper_nc<vpx_lpf_vertical_4_c>, 8, 1)));
// Loop8Test9Param tuple layout:
//   (function under test, reference function, bit depth).
INSTANTIATE_TEST_CASE_P(
    NEON, Loop8Test9Param,
    ::testing::Values(
#if HAVE_NEON_ASM
        make_tuple(&vpx_lpf_horizontal_8_dual_neon,
                   &vpx_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_8_dual_neon,
                   &vpx_lpf_vertical_8_dual_c, 8),
#endif  // HAVE_NEON_ASM
        make_tuple(&vpx_lpf_horizontal_4_dual_neon,
                   &vpx_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_4_dual_neon,
                   &vpx_lpf_vertical_4_dual_c, 8)));
#endif  // CONFIG_VP9_HIGHBITDEPTH
#endif  // HAVE_NEON
630

631
632
633
634
635
636
637
638
639
640
#if HAVE_DSPR2 && !CONFIG_VP9_HIGHBITDEPTH
// DSPR2 filters paired with their C counterparts.
// Loop8Test6Param tuple layout:
//   (function under test, reference function, bit depth, count).
INSTANTIATE_TEST_CASE_P(
    DSPR2, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_dspr2, &vpx_lpf_horizontal_4_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_8_dspr2, &vpx_lpf_horizontal_8_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_16_dspr2,
                   &vpx_lpf_horizontal_16_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_16_dspr2,
                   &vpx_lpf_horizontal_16_c, 8, 2),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_4_dspr2>,
                   &wrapper_nc<vpx_lpf_vertical_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_8_dspr2>,
                   &wrapper_nc<vpx_lpf_vertical_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_dspr2>,
                   &wrapper_nc<vpx_lpf_vertical_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_dual_dspr2>,
                   &wrapper_nc<vpx_lpf_vertical_16_dual_c>, 8, 1)));

// Loop8Test9Param tuple layout:
//   (function under test, reference function, bit depth).
INSTANTIATE_TEST_CASE_P(
    DSPR2, Loop8Test9Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_dual_dspr2,
                   &vpx_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_lpf_horizontal_8_dual_dspr2,
                   &vpx_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_4_dual_dspr2,
                   &vpx_lpf_vertical_4_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_8_dual_dspr2,
                   &vpx_lpf_vertical_8_dual_c, 8)));
#endif  // HAVE_DSPR2 && !CONFIG_VP9_HIGHBITDEPTH

663
664
665
666
#if HAVE_MSA && (!CONFIG_VP9_HIGHBITDEPTH)
// MSA filters paired with their C counterparts.
// Loop8Test6Param tuple layout:
//   (function under test, reference function, bit depth, count).
INSTANTIATE_TEST_CASE_P(
    MSA, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_msa, &vpx_lpf_horizontal_4_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_8_msa, &vpx_lpf_horizontal_8_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_16_msa, &vpx_lpf_horizontal_16_c, 8, 1),
        make_tuple(&vpx_lpf_horizontal_16_msa, &vpx_lpf_horizontal_16_c, 8, 2),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_4_msa>,
                   &wrapper_nc<vpx_lpf_vertical_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_8_msa>,
                   &wrapper_nc<vpx_lpf_vertical_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_msa>,
                   &wrapper_nc<vpx_lpf_vertical_16_c>, 8, 1)));

// Loop8Test9Param tuple layout:
//   (function under test, reference function, bit depth).
INSTANTIATE_TEST_CASE_P(
    MSA, Loop8Test9Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_dual_msa,
                   &vpx_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_lpf_horizontal_8_dual_msa,
                   &vpx_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_4_dual_msa,
                   &vpx_lpf_vertical_4_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_8_dual_msa,
                   &vpx_lpf_vertical_8_dual_c, 8)));
#endif  // HAVE_MSA && (!CONFIG_VP9_HIGHBITDEPTH)

691
}  // namespace