/*
 *  Copyright (c) 2014 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

#include <cmath>
#include <cstdlib>
#include <string>

#include "third_party/googletest/src/include/gtest/gtest.h"

#include "./vpx_config.h"
#include "./vpx_dsp_rtcd.h"
#include "test/acm_random.h"
#include "test/clear_system_state.h"
#include "test/register_state_check.h"
#include "test/util.h"
#include "vp9/common/vp9_entropy.h"
#include "vp9/common/vp9_loopfilter.h"
#include "vpx/vpx_integer.h"

using libvpx_test::ACMRandom;

namespace {
// Horizontally and Vertically need 32x32: 8  Coeffs preceding filtered section
//                                         16 Coeffs within filtered section
//                                         8  Coeffs following filtered section
const int kNumCoeffs = 1024;

// Number of randomly generated blocks each test case runs through the filter
// under test and its reference.
const int number_of_iterations = 10000;

#if CONFIG_VP9_HIGHBITDEPTH
typedef void (*loop_op_t)(uint16_t *s, int p, const uint8_t *blimit,
                          const uint8_t *limit, const uint8_t *thresh,
                          int count, int bd);
typedef void (*dual_loop_op_t)(uint16_t *s, int p, const uint8_t *blimit0,
                               const uint8_t *limit0, const uint8_t *thresh0,
                               const uint8_t *blimit1, const uint8_t *limit1,
                               const uint8_t *thresh1, int bd);
45
46
47
48
49
50
51
52
53
54
55

// wrapper for loopfilter functions without a 'count' param.
typedef void (*loop_op_nc_t)(uint16_t *s, int p, const uint8_t *blimit,
                             const uint8_t *limit, const uint8_t *thresh,
                             int bd);
template <loop_op_nc_t fn>
void wrapper_nc(uint16_t *s, int p, const uint8_t *blimit,
                const uint8_t *limit, const uint8_t *thresh,
                int /*count*/, int bd) {
  fn(s, p, blimit, limit, thresh, bd);
}
56
57
58
59
60
61
62
63
64
#else
typedef void (*loop_op_t)(uint8_t *s, int p, const uint8_t *blimit,
                          const uint8_t *limit, const uint8_t *thresh,
                          int count);
typedef void (*dual_loop_op_t)(uint8_t *s, int p, const uint8_t *blimit0,
                               const uint8_t *limit0, const uint8_t *thresh0,
                               const uint8_t *blimit1, const uint8_t *limit1,
                               const uint8_t *thresh1);

65
66
67
68
69
70
71
72
// wrapper for loopfilter functions without a 'count' param.
typedef void (*loop_op_nc_t)(uint8_t *s, int p, const uint8_t *blimit,
                             const uint8_t *limit, const uint8_t *thresh);
template <loop_op_nc_t fn>
void wrapper_nc(uint8_t *s, int p, const uint8_t *blimit,
                const uint8_t *limit, const uint8_t *thresh,
                int /*count*/) {
  fn(s, p, blimit, limit, thresh);
73
74
75
}
#endif  // CONFIG_VP9_HIGHBITDEPTH

76
77
// Loop8Test6Param parameters: (function under test, reference function,
// bit depth, count).
typedef std::tr1::tuple<loop_op_t, loop_op_t, int, int> loop8_param_t;
// Loop8Test9Param parameters: (function under test, reference function,
// bit depth).
typedef std::tr1::tuple<dual_loop_op_t, dual_loop_op_t, int> dualloop8_param_t;

// Fixture for single-edge loop filter tests. Each parameter tuple supplies
// the function under test, the reference function, the bit depth and the
// 'count' argument passed to both functions.
class Loop8Test6Param : public ::testing::TestWithParam<loop8_param_t> {
 public:
  virtual ~Loop8Test6Param() {}
  virtual void SetUp() {
    loopfilter_op_ = GET_PARAM(0);
    ref_loopfilter_op_ = GET_PARAM(1);
    bit_depth_ = GET_PARAM(2);
    count_ = GET_PARAM(3);
    // Keeps only the low |bit_depth_| bits of a random sample.
    mask_ = (1 << bit_depth_) - 1;
  }

  virtual void TearDown() { libvpx_test::ClearSystemState(); }

 protected:
  int bit_depth_;
  int count_;
  int mask_;
  loop_op_t loopfilter_op_;
  loop_op_t ref_loopfilter_op_;
};

// Fixture for dual-edge loop filter tests. Each parameter tuple supplies the
// function under test, the reference function and the bit depth.
class Loop8Test9Param : public ::testing::TestWithParam<dualloop8_param_t> {
 public:
  virtual ~Loop8Test9Param() {}

  virtual void SetUp() {
    const int bit_depth = GET_PARAM(2);
    bit_depth_ = bit_depth;
    // Keeps only the low |bit_depth| bits of a random sample.
    mask_ = (1 << bit_depth) - 1;
    ref_loopfilter_op_ = GET_PARAM(1);
    loopfilter_op_ = GET_PARAM(0);
  }

  virtual void TearDown() {
    libvpx_test::ClearSystemState();
  }

 protected:
  dual_loop_op_t loopfilter_op_;
  dual_loop_op_t ref_loopfilter_op_;
  int bit_depth_;
  int mask_;
};

// Runs the filter under test and the reference filter on identical input
// made of runs of slowly varying samples, and expects identical output over
// the whole buffer.
TEST_P(Loop8Test6Param, OperationCheck) {
  ACMRandom rnd(ACMRandom::DeterministicSeed());
  const int count_test_block = number_of_iterations;
#if CONFIG_VP9_HIGHBITDEPTH
  const int32_t bd = bit_depth_;
  DECLARE_ALIGNED(16, uint16_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(16, uint16_t, ref_s[kNumCoeffs]);
#else
  DECLARE_ALIGNED(8, uint8_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(8, uint8_t, ref_s[kNumCoeffs]);
#endif  // CONFIG_VP9_HIGHBITDEPTH
  int err_count_total = 0;
  int first_failure = -1;
  for (int i = 0; i < count_test_block; ++i) {
    int err_count = 0;
    uint8_t tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit[16])  = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    // Stride of the 32x32 test block.
    int32_t p = kNumCoeffs / 32;

    uint16_t tmp_s[kNumCoeffs];
    int j = 0;
    while (j < kNumCoeffs) {
      uint8_t val = rnd.Rand8();
      if (val & 0x80) {  // 50% chance to choose a new value.
        tmp_s[j] = rnd.Rand16();
        j++;
      } else {  // 50% chance to repeat previous value in row X times
        int k = 0;
        while (k++ < ((val & 0x1f) + 1) && j < kNumCoeffs) {
          if (j < 1) {
            tmp_s[j] = rnd.Rand16();
          } else if (val & 0x20) {  // Increment by a value within the limit
            tmp_s[j] = (tmp_s[j - 1] + (*limit - 1));
          } else {  // Decrement by a value within the limit
            tmp_s[j] = (tmp_s[j - 1] - (*limit - 1));
          }
          j++;
        }
      }
    }
    // Odd iterations copy the generated samples in order; even iterations
    // copy them transposed, so the runs lie along the other axis.
    for (j = 0; j < kNumCoeffs; j++) {
      if (i % 2) {
        s[j] = tmp_s[j] & mask_;
      } else {
        s[j] = tmp_s[p * (j % p) + j / p] & mask_;
      }
      ref_s[j] = s[j];
    }
#if CONFIG_VP9_HIGHBITDEPTH
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit, limit, thresh, count_, bd);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit, limit, thresh, count_, bd));
#else
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit, limit, thresh, count_);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit, limit, thresh, count_));
#endif  // CONFIG_VP9_HIGHBITDEPTH

    for (int j = 0; j < kNumCoeffs; ++j) {
      err_count += ref_s[j] != s[j];
    }
    if (err_count && !err_count_total) {
      first_failure = i;
    }
    err_count_total += err_count;
  }
  EXPECT_EQ(0, err_count_total)
      << "Error: Loop8Test6Param, C output doesn't match SSE2 "
         "loopfilter output. "
      << "First failed at test case " << first_failure;
}

// Runs the filter under test and the reference filter on identical, fully
// random input and expects identical output over the whole buffer.
TEST_P(Loop8Test6Param, ValueCheck) {
  ACMRandom rnd(ACMRandom::DeterministicSeed());
  const int count_test_block = number_of_iterations;
#if CONFIG_VP9_HIGHBITDEPTH
  const int32_t bd = bit_depth_;
  DECLARE_ALIGNED(16, uint16_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(16, uint16_t, ref_s[kNumCoeffs]);
#else
  DECLARE_ALIGNED(8, uint8_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(8, uint8_t, ref_s[kNumCoeffs]);
#endif  // CONFIG_VP9_HIGHBITDEPTH
  int err_count_total = 0;
  int first_failure = -1;

  // NOTE: The code in vp9_loopfilter.c:update_sharpness computes mblim as a
  // function of sharpness_lvl and the loopfilter lvl as:
  // block_inside_limit = lvl >> ((sharpness_lvl > 0) + (sharpness_lvl > 4));
  // ...
  // memset(lfi->lfthr[lvl].mblim, (2 * (lvl + 2) + block_inside_limit),
  //        SIMD_WIDTH);
  // This means that the largest value for mblim will occur when sharpness_lvl
  // is equal to 0, and lvl is equal to its greatest value (MAX_LOOP_FILTER).
  // In this case block_inside_limit will be equal to MAX_LOOP_FILTER and
  // therefore mblim will be equal to (2 * (lvl + 2) + block_inside_limit) =
  // 2 * (MAX_LOOP_FILTER + 2) + MAX_LOOP_FILTER = 3 * MAX_LOOP_FILTER + 4

  for (int i = 0; i < count_test_block; ++i) {
    int err_count = 0;
    uint8_t tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit[16])  = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    // Stride of the 32x32 test block.
    int32_t p = kNumCoeffs / 32;
    for (int j = 0; j < kNumCoeffs; ++j) {
      s[j] = rnd.Rand16() & mask_;
      ref_s[j] = s[j];
    }
#if CONFIG_VP9_HIGHBITDEPTH
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit, limit, thresh, count_, bd);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit, limit, thresh, count_, bd));
#else
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit, limit, thresh, count_);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit, limit, thresh, count_));
#endif  // CONFIG_VP9_HIGHBITDEPTH
    for (int j = 0; j < kNumCoeffs; ++j) {
      err_count += ref_s[j] != s[j];
    }
    if (err_count && !err_count_total) {
      first_failure = i;
    }
    err_count_total += err_count;
  }
  EXPECT_EQ(0, err_count_total)
      << "Error: Loop8Test6Param, C output doesn't match SSE2 "
         "loopfilter output. "
      << "First failed at test case " << first_failure;
}

// Runs the dual-edge filter under test and its reference on identical input
// made of runs of slowly varying samples, and expects identical output over
// the whole buffer.
TEST_P(Loop8Test9Param, OperationCheck) {
  ACMRandom rnd(ACMRandom::DeterministicSeed());
  const int count_test_block = number_of_iterations;
#if CONFIG_VP9_HIGHBITDEPTH
  const int32_t bd = bit_depth_;
  DECLARE_ALIGNED(16, uint16_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(16, uint16_t, ref_s[kNumCoeffs]);
#else
  DECLARE_ALIGNED(8,  uint8_t,  s[kNumCoeffs]);
  DECLARE_ALIGNED(8,  uint8_t,  ref_s[kNumCoeffs]);
#endif  // CONFIG_VP9_HIGHBITDEPTH
  int err_count_total = 0;
  int first_failure = -1;
  for (int i = 0; i < count_test_block; ++i) {
    int err_count = 0;
    uint8_t tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit0[16])  = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit1[16])  = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    // Stride of the 32x32 test block.
    int32_t p = kNumCoeffs / 32;
    uint16_t tmp_s[kNumCoeffs];
    int j = 0;
    // Step the runs by the smaller of the two edge limits.
    const uint8_t limit = *limit0 < *limit1 ? *limit0 : *limit1;
    while (j < kNumCoeffs) {
      uint8_t val = rnd.Rand8();
      if (val & 0x80) {  // 50% chance to choose a new value.
        tmp_s[j] = rnd.Rand16();
        j++;
      } else {  // 50% chance to repeat previous value in row X times.
        int k = 0;
        while (k++ < ((val & 0x1f) + 1) && j < kNumCoeffs) {
          if (j < 1) {
            tmp_s[j] = rnd.Rand16();
          } else if (val & 0x20) {  // Increment by a value within the limit.
            tmp_s[j] = (tmp_s[j - 1] + (limit - 1));
          } else {  // Decrement by a value within the limit.
            tmp_s[j] = (tmp_s[j - 1] - (limit - 1));
          }
          j++;
        }
      }
    }
    // Odd iterations copy the generated samples in order; even iterations
    // copy them transposed, so the runs lie along the other axis.
    for (j = 0; j < kNumCoeffs; j++) {
      if (i % 2) {
        s[j] = tmp_s[j] & mask_;
      } else {
        s[j] = tmp_s[p * (j % p) + j / p] & mask_;
      }
      ref_s[j] = s[j];
    }
#if CONFIG_VP9_HIGHBITDEPTH
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1, bd);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1, bd));
#else
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1));
#endif  // CONFIG_VP9_HIGHBITDEPTH
    for (int j = 0; j < kNumCoeffs; ++j) {
      err_count += ref_s[j] != s[j];
    }
    if (err_count && !err_count_total) {
      first_failure = i;
    }
    err_count_total += err_count;
  }
  EXPECT_EQ(0, err_count_total)
      << "Error: Loop8Test9Param, C output doesn't match SSE2 "
         "loopfilter output. "
      << "First failed at test case " << first_failure;
}

// Runs the dual-edge filter under test and its reference on identical, fully
// random input and expects identical output over the whole buffer.
TEST_P(Loop8Test9Param, ValueCheck) {
  ACMRandom rnd(ACMRandom::DeterministicSeed());
  const int count_test_block = number_of_iterations;
#if CONFIG_VP9_HIGHBITDEPTH
  const int32_t bd = bit_depth_;
  DECLARE_ALIGNED(16, uint16_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(16, uint16_t, ref_s[kNumCoeffs]);
#else
  DECLARE_ALIGNED(8,  uint8_t, s[kNumCoeffs]);
  DECLARE_ALIGNED(8,  uint8_t, ref_s[kNumCoeffs]);
#endif  // CONFIG_VP9_HIGHBITDEPTH
  int err_count_total = 0;
  int first_failure = -1;
  for (int i = 0; i < count_test_block; ++i) {
    int err_count = 0;
    uint8_t tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit0[16])  = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh0[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(3 * MAX_LOOP_FILTER + 4));
    DECLARE_ALIGNED(16, const uint8_t, blimit1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = static_cast<uint8_t>(rnd(MAX_LOOP_FILTER));
    DECLARE_ALIGNED(16, const uint8_t, limit1[16])  = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    tmp = rnd.Rand8();
    DECLARE_ALIGNED(16, const uint8_t, thresh1[16]) = {
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp,
        tmp, tmp, tmp, tmp, tmp, tmp, tmp, tmp
    };
    int32_t p = kNumCoeffs / 32;  // TODO(pdlf) can we have non-square here?
    for (int j = 0; j < kNumCoeffs; ++j) {
      s[j] = rnd.Rand16() & mask_;
      ref_s[j] = s[j];
    }
#if CONFIG_VP9_HIGHBITDEPTH
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1, bd);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit0, limit0,
                       thresh0, blimit1, limit1, thresh1, bd));
#else
    ref_loopfilter_op_(ref_s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1);
    ASM_REGISTER_STATE_CHECK(
        loopfilter_op_(s + 8 + p * 8, p, blimit0, limit0, thresh0,
                       blimit1, limit1, thresh1));
#endif  // CONFIG_VP9_HIGHBITDEPTH
    for (int j = 0; j < kNumCoeffs; ++j) {
      err_count += ref_s[j] != s[j];
    }
    if (err_count && !err_count_total) {
      first_failure = i;
    }
    err_count_total += err_count;
  }
  // The trailing space after "SSE2" keeps the concatenated literals from
  // running together as "SSE2loopfilter".
  EXPECT_EQ(0, err_count_total)
      << "Error: Loop8Test9Param, C output doesn't match SSE2 "
         "loopfilter output. "
      << "First failed at test case " << first_failure;
}

using std::tr1::make_tuple;

// Each Loop8Test6Param tuple below is (function under test, C reference,
// bit depth, count).
#if HAVE_MMX && !CONFIG_VP9_HIGHBITDEPTH
INSTANTIATE_TEST_CASE_P(
    MMX, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_4_mmx>,
                   &wrapper_nc<vpx_lpf_horizontal_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_4_mmx>,
                   &wrapper_nc<vpx_lpf_vertical_4_c>, 8, 1)));
#endif  // HAVE_MMX && !CONFIG_VP9_HIGHBITDEPTH

// SSE2 single-edge filters against their C references. The high bit-depth
// build covers bit depths 8, 10 and 12; the regular build covers 8 only.
#if HAVE_SSE2
#if CONFIG_VP9_HIGHBITDEPTH
INSTANTIATE_TEST_CASE_P(
    SSE2, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_4_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_4_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_edge_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_edge_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_edge_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_edge_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_4_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_4_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_4_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_4_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_8_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_edge_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_edge_8_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_edge_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_edge_16_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_8_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_4_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_4_c>, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_4_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_4_c>, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_8_c>, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_edge_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_edge_8_c>, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_horizontal_edge_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_horizontal_edge_16_c>, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_8_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_8_c>, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_c>, 12, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_dual_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_dual_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_dual_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_dual_c>, 10, 1),
        make_tuple(&wrapper_nc<vpx_highbd_lpf_vertical_16_dual_sse2>,
                   &wrapper_nc<vpx_highbd_lpf_vertical_16_dual_c>, 12, 1)));
#else
INSTANTIATE_TEST_CASE_P(
    SSE2, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_8_sse2>,
                   &wrapper_nc<vpx_lpf_horizontal_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_8_sse2>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_16_sse2>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_8_sse2>,
                   &wrapper_nc<vpx_lpf_vertical_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_sse2>,
                   &wrapper_nc<vpx_lpf_vertical_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_dual_sse2>,
                   &wrapper_nc<vpx_lpf_vertical_16_dual_c>, 8, 1)));
#endif  // CONFIG_VP9_HIGHBITDEPTH
#endif  // HAVE_SSE2

// AVX2 horizontal edge filters against their C references (8-bit build only).
#if HAVE_AVX2 && (!CONFIG_VP9_HIGHBITDEPTH)
INSTANTIATE_TEST_CASE_P(
    AVX2, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_8_avx2>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_16_avx2>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_16_c>, 8, 1)));
#endif  // HAVE_AVX2 && (!CONFIG_VP9_HIGHBITDEPTH)

// SSE2 dual-edge filters against their C references. Each tuple is
// (function under test, C reference, bit depth).
#if HAVE_SSE2
#if CONFIG_VP9_HIGHBITDEPTH
INSTANTIATE_TEST_CASE_P(
    SSE2, Loop8Test9Param,
    ::testing::Values(
        make_tuple(&vpx_highbd_lpf_horizontal_4_dual_sse2,
                   &vpx_highbd_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_highbd_lpf_horizontal_8_dual_sse2,
                   &vpx_highbd_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_highbd_lpf_vertical_4_dual_sse2,
                   &vpx_highbd_lpf_vertical_4_dual_c, 8),
        make_tuple(&vpx_highbd_lpf_vertical_8_dual_sse2,
                   &vpx_highbd_lpf_vertical_8_dual_c, 8),
        make_tuple(&vpx_highbd_lpf_horizontal_4_dual_sse2,
                   &vpx_highbd_lpf_horizontal_4_dual_c, 10),
        make_tuple(&vpx_highbd_lpf_horizontal_8_dual_sse2,
                   &vpx_highbd_lpf_horizontal_8_dual_c, 10),
        make_tuple(&vpx_highbd_lpf_vertical_4_dual_sse2,
                   &vpx_highbd_lpf_vertical_4_dual_c, 10),
        make_tuple(&vpx_highbd_lpf_vertical_8_dual_sse2,
                   &vpx_highbd_lpf_vertical_8_dual_c, 10),
        make_tuple(&vpx_highbd_lpf_horizontal_4_dual_sse2,
                   &vpx_highbd_lpf_horizontal_4_dual_c, 12),
        make_tuple(&vpx_highbd_lpf_horizontal_8_dual_sse2,
                   &vpx_highbd_lpf_horizontal_8_dual_c, 12),
        make_tuple(&vpx_highbd_lpf_vertical_4_dual_sse2,
                   &vpx_highbd_lpf_vertical_4_dual_c, 12),
        make_tuple(&vpx_highbd_lpf_vertical_8_dual_sse2,
                   &vpx_highbd_lpf_vertical_8_dual_c, 12)));
#else
INSTANTIATE_TEST_CASE_P(
    SSE2, Loop8Test9Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_dual_sse2,
                   &vpx_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_lpf_horizontal_8_dual_sse2,
                   &vpx_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_4_dual_sse2,
                   &vpx_lpf_vertical_4_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_8_dual_sse2,
                   &vpx_lpf_vertical_8_dual_c, 8)));
#endif  // CONFIG_VP9_HIGHBITDEPTH
#endif  // HAVE_SSE2

// NEON single- and dual-edge filters against their C references (8-bit build
// only). Entries inside HAVE_NEON_ASM are registered only when that macro is
// set.
#if HAVE_NEON
#if CONFIG_VP9_HIGHBITDEPTH
// No neon high bitdepth functions.
#else
INSTANTIATE_TEST_CASE_P(
    NEON, Loop8Test6Param,
    ::testing::Values(
#if HAVE_NEON_ASM
// Using #if inside the macro is unsupported on MSVS but the tests are not
// currently built for MSVS with ARM and NEON.
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_8_neon>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_16_neon>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_neon>,
                   &wrapper_nc<vpx_lpf_vertical_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_dual_neon>,
                   &wrapper_nc<vpx_lpf_vertical_16_dual_c>, 8, 1),
#endif  // HAVE_NEON_ASM
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_8_neon>,
                   &wrapper_nc<vpx_lpf_horizontal_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_8_neon>,
                   &wrapper_nc<vpx_lpf_vertical_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_4_neon>,
                   &wrapper_nc<vpx_lpf_horizontal_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_4_neon>,
                   &wrapper_nc<vpx_lpf_vertical_4_c>, 8, 1)));
INSTANTIATE_TEST_CASE_P(
    NEON, Loop8Test9Param,
    ::testing::Values(
#if HAVE_NEON_ASM
        make_tuple(&vpx_lpf_horizontal_8_dual_neon,
                   &vpx_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_8_dual_neon,
                   &vpx_lpf_vertical_8_dual_c, 8),
#endif  // HAVE_NEON_ASM
        make_tuple(&vpx_lpf_horizontal_4_dual_neon,
                   &vpx_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_4_dual_neon,
                   &vpx_lpf_vertical_4_dual_c, 8)));
#endif  // CONFIG_VP9_HIGHBITDEPTH
#endif  // HAVE_NEON

// DSPR2 single- and dual-edge filters against their C references (8-bit
// build only).
#if HAVE_DSPR2 && !CONFIG_VP9_HIGHBITDEPTH
INSTANTIATE_TEST_CASE_P(
    DSPR2, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_4_dspr2>,
                   &wrapper_nc<vpx_lpf_horizontal_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_8_dspr2>,
                   &wrapper_nc<vpx_lpf_horizontal_8_c>, 8, 1),
        // NOTE(review): the next two entries pass the same symbol as both the
        // function under test and the reference, so they compare a function
        // with itself. Every other entry pairs a *_dspr2 function with its
        // *_c reference - confirm whether that pairing was intended here.
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_8>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_8>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_16>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_16>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_4_dspr2>,
                   &wrapper_nc<vpx_lpf_vertical_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_8_dspr2>,
                   &wrapper_nc<vpx_lpf_vertical_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_dspr2>,
                   &wrapper_nc<vpx_lpf_vertical_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_dual_dspr2>,
                   &wrapper_nc<vpx_lpf_vertical_16_dual_c>, 8, 1)));

INSTANTIATE_TEST_CASE_P(
    DSPR2, Loop8Test9Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_dual_dspr2,
                   &vpx_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_lpf_horizontal_8_dual_dspr2,
                   &vpx_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_4_dual_dspr2,
                   &vpx_lpf_vertical_4_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_8_dual_dspr2,
                   &vpx_lpf_vertical_8_dual_c, 8)));
#endif  // HAVE_DSPR2 && !CONFIG_VP9_HIGHBITDEPTH

// MSA single- and dual-edge filters against their C references (8-bit build
// only).
#if HAVE_MSA && (!CONFIG_VP9_HIGHBITDEPTH)
INSTANTIATE_TEST_CASE_P(
    MSA, Loop8Test6Param,
    ::testing::Values(
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_4_msa>,
                   &wrapper_nc<vpx_lpf_horizontal_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_8_msa>,
                   &wrapper_nc<vpx_lpf_horizontal_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_8_msa>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_horizontal_edge_16_msa>,
                   &wrapper_nc<vpx_lpf_horizontal_edge_16_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_4_msa>,
                   &wrapper_nc<vpx_lpf_vertical_4_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_8_msa>,
                   &wrapper_nc<vpx_lpf_vertical_8_c>, 8, 1),
        make_tuple(&wrapper_nc<vpx_lpf_vertical_16_msa>,
                   &wrapper_nc<vpx_lpf_vertical_16_c>, 8, 1)));

INSTANTIATE_TEST_CASE_P(
    MSA, Loop8Test9Param,
    ::testing::Values(
        make_tuple(&vpx_lpf_horizontal_4_dual_msa,
                   &vpx_lpf_horizontal_4_dual_c, 8),
        make_tuple(&vpx_lpf_horizontal_8_dual_msa,
                   &vpx_lpf_horizontal_8_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_4_dual_msa,
                   &vpx_lpf_vertical_4_dual_c, 8),
        make_tuple(&vpx_lpf_vertical_8_dual_msa,
                   &vpx_lpf_vertical_8_dual_c, 8)));
#endif  // HAVE_MSA && (!CONFIG_VP9_HIGHBITDEPTH)

}  // namespace