1 /* 2 * Copyright (c) 2010 The WebM project authors. All Rights Reserved. 3 * 4 * Use of this source code is governed by a BSD-style license 5 * that can be found in the LICENSE file in the root of the source 6 * tree. An additional intellectual property rights grant can be found 7 * in the file PATENTS. All contributing project authors may 8 * be found in the AUTHORS file in the root of the source tree. 9 */ 10 11 #include <string.h> 12 #include "test/acm_random.h" 13 #include "test/register_state_check.h" 14 #include "test/util.h" 15 #include "third_party/googletest/src/include/gtest/gtest.h" 16 17 extern "C" { 18 #include "./vpx_config.h" 19 #include "./vp9_rtcd.h" 20 #include "vp9/common/vp9_filter.h" 21 #include "vpx_mem/vpx_mem.h" 22 #include "vpx_ports/mem.h" 23 } 24 25 namespace { 26 typedef void (*convolve_fn_t)(const uint8_t *src, ptrdiff_t src_stride, 27 uint8_t *dst, ptrdiff_t dst_stride, 28 const int16_t *filter_x, int filter_x_stride, 29 const int16_t *filter_y, int filter_y_stride, 30 int w, int h); 31 32 struct ConvolveFunctions { 33 ConvolveFunctions(convolve_fn_t h8, convolve_fn_t h8_avg, 34 convolve_fn_t v8, convolve_fn_t v8_avg, 35 convolve_fn_t hv8, convolve_fn_t hv8_avg) 36 : h8_(h8), v8_(v8), hv8_(hv8), h8_avg_(h8_avg), v8_avg_(v8_avg), 37 hv8_avg_(hv8_avg) {} 38 39 convolve_fn_t h8_; 40 convolve_fn_t v8_; 41 convolve_fn_t hv8_; 42 convolve_fn_t h8_avg_; 43 convolve_fn_t v8_avg_; 44 convolve_fn_t hv8_avg_; 45 }; 46 47 // Reference 8-tap subpixel filter, slightly modified to fit into this test. 48 #define VP9_FILTER_WEIGHT 128 49 #define VP9_FILTER_SHIFT 7 50 uint8_t clip_pixel(int x) { 51 return x < 0 ? 0 : 52 x > 255 ? 255 : 53 x; 54 } 55 56 void filter_block2d_8_c(const uint8_t *src_ptr, 57 const unsigned int src_stride, 58 const int16_t *HFilter, 59 const int16_t *VFilter, 60 uint8_t *dst_ptr, 61 unsigned int dst_stride, 62 unsigned int output_width, 63 unsigned int output_height) { 64 // Between passes, we use an intermediate buffer whose height is extended to 65 // have enough horizontally filtered values as input for the vertical pass. 66 // This buffer is allocated to be big enough for the largest block type we 67 // support. 68 const int kInterp_Extend = 4; 69 const unsigned int intermediate_height = 70 (kInterp_Extend - 1) + output_height + kInterp_Extend; 71 72 /* Size of intermediate_buffer is max_intermediate_height * filter_max_width, 73 * where max_intermediate_height = (kInterp_Extend - 1) + filter_max_height 74 * + kInterp_Extend 75 * = 3 + 16 + 4 76 * = 23 77 * and filter_max_width = 16 78 */ 79 uint8_t intermediate_buffer[71 * 64]; 80 const int intermediate_next_stride = 1 - intermediate_height * output_width; 81 82 // Horizontal pass (src -> transposed intermediate). 83 { 84 uint8_t *output_ptr = intermediate_buffer; 85 const int src_next_row_stride = src_stride - output_width; 86 unsigned int i, j; 87 src_ptr -= (kInterp_Extend - 1) * src_stride + (kInterp_Extend - 1); 88 for (i = 0; i < intermediate_height; ++i) { 89 for (j = 0; j < output_width; ++j) { 90 // Apply filter... 91 const int temp = (src_ptr[0] * HFilter[0]) + 92 (src_ptr[1] * HFilter[1]) + 93 (src_ptr[2] * HFilter[2]) + 94 (src_ptr[3] * HFilter[3]) + 95 (src_ptr[4] * HFilter[4]) + 96 (src_ptr[5] * HFilter[5]) + 97 (src_ptr[6] * HFilter[6]) + 98 (src_ptr[7] * HFilter[7]) + 99 (VP9_FILTER_WEIGHT >> 1); // Rounding 100 101 // Normalize back to 0-255... 102 *output_ptr = clip_pixel(temp >> VP9_FILTER_SHIFT); 103 ++src_ptr; 104 output_ptr += intermediate_height; 105 } 106 src_ptr += src_next_row_stride; 107 output_ptr += intermediate_next_stride; 108 } 109 } 110 111 // Vertical pass (transposed intermediate -> dst). 112 { 113 uint8_t *src_ptr = intermediate_buffer; 114 const int dst_next_row_stride = dst_stride - output_width; 115 unsigned int i, j; 116 for (i = 0; i < output_height; ++i) { 117 for (j = 0; j < output_width; ++j) { 118 // Apply filter... 119 const int temp = (src_ptr[0] * VFilter[0]) + 120 (src_ptr[1] * VFilter[1]) + 121 (src_ptr[2] * VFilter[2]) + 122 (src_ptr[3] * VFilter[3]) + 123 (src_ptr[4] * VFilter[4]) + 124 (src_ptr[5] * VFilter[5]) + 125 (src_ptr[6] * VFilter[6]) + 126 (src_ptr[7] * VFilter[7]) + 127 (VP9_FILTER_WEIGHT >> 1); // Rounding 128 129 // Normalize back to 0-255... 130 *dst_ptr++ = clip_pixel(temp >> VP9_FILTER_SHIFT); 131 src_ptr += intermediate_height; 132 } 133 src_ptr += intermediate_next_stride; 134 dst_ptr += dst_next_row_stride; 135 } 136 } 137 } 138 139 void block2d_average_c(uint8_t *src, 140 unsigned int src_stride, 141 uint8_t *output_ptr, 142 unsigned int output_stride, 143 unsigned int output_width, 144 unsigned int output_height) { 145 unsigned int i, j; 146 for (i = 0; i < output_height; ++i) { 147 for (j = 0; j < output_width; ++j) { 148 output_ptr[j] = (output_ptr[j] + src[i * src_stride + j] + 1) >> 1; 149 } 150 output_ptr += output_stride; 151 } 152 } 153 154 void filter_average_block2d_8_c(const uint8_t *src_ptr, 155 const unsigned int src_stride, 156 const int16_t *HFilter, 157 const int16_t *VFilter, 158 uint8_t *dst_ptr, 159 unsigned int dst_stride, 160 unsigned int output_width, 161 unsigned int output_height) { 162 uint8_t tmp[64 * 64]; 163 164 assert(output_width <= 64); 165 assert(output_height <= 64); 166 filter_block2d_8_c(src_ptr, src_stride, HFilter, VFilter, tmp, 64, 167 output_width, output_height); 168 block2d_average_c(tmp, 64, dst_ptr, dst_stride, 169 output_width, output_height); 170 } 171 172 class ConvolveTest : public PARAMS(int, int, const ConvolveFunctions*) { 173 public: 174 static void SetUpTestCase() { 175 // Force input_ to be unaligned, output to be 16 byte aligned. 176 input_ = reinterpret_cast<uint8_t*>( 177 vpx_memalign(kDataAlignment, kInputBufferSize + 1)) + 1; 178 output_ = reinterpret_cast<uint8_t*>( 179 vpx_memalign(kDataAlignment, kOutputBufferSize)); 180 } 181 182 static void TearDownTestCase() { 183 vpx_free(input_ - 1); 184 input_ = NULL; 185 vpx_free(output_); 186 output_ = NULL; 187 } 188 189 protected: 190 static const int kDataAlignment = 16; 191 static const int kOuterBlockSize = 256; 192 static const int kInputStride = kOuterBlockSize; 193 static const int kOutputStride = kOuterBlockSize; 194 static const int kMaxDimension = 64; 195 static const int kInputBufferSize = kOuterBlockSize * kOuterBlockSize; 196 static const int kOutputBufferSize = kOuterBlockSize * kOuterBlockSize; 197 198 int Width() const { return GET_PARAM(0); } 199 int Height() const { return GET_PARAM(1); } 200 int BorderLeft() const { 201 const int center = (kOuterBlockSize - Width()) / 2; 202 return (center + (kDataAlignment - 1)) & ~(kDataAlignment - 1); 203 } 204 int BorderTop() const { return (kOuterBlockSize - Height()) / 2; } 205 206 bool IsIndexInBorder(int i) { 207 return (i < BorderTop() * kOuterBlockSize || 208 i >= (BorderTop() + Height()) * kOuterBlockSize || 209 i % kOuterBlockSize < BorderLeft() || 210 i % kOuterBlockSize >= (BorderLeft() + Width())); 211 } 212 213 virtual void SetUp() { 214 UUT_ = GET_PARAM(2); 215 /* Set up guard blocks for an inner block centered in the outer block */ 216 for (int i = 0; i < kOutputBufferSize; ++i) { 217 if (IsIndexInBorder(i)) 218 output_[i] = 255; 219 else 220 output_[i] = 0; 221 } 222 223 ::libvpx_test::ACMRandom prng; 224 for (int i = 0; i < kInputBufferSize; ++i) 225 input_[i] = prng.Rand8Extremes(); 226 } 227 228 void SetConstantInput(int value) { 229 memset(input_, value, kInputBufferSize); 230 } 231 232 void CheckGuardBlocks() { 233 for (int i = 0; i < kOutputBufferSize; ++i) { 234 if (IsIndexInBorder(i)) 235 EXPECT_EQ(255, output_[i]); 236 } 237 } 238 239 uint8_t* input() const { 240 return input_ + BorderTop() * kOuterBlockSize + BorderLeft(); 241 } 242 243 uint8_t* output() const { 244 return output_ + BorderTop() * kOuterBlockSize + BorderLeft(); 245 } 246 247 const ConvolveFunctions* UUT_; 248 static uint8_t* input_; 249 static uint8_t* output_; 250 }; 251 uint8_t* ConvolveTest::input_ = NULL; 252 uint8_t* ConvolveTest::output_ = NULL; 253 254 TEST_P(ConvolveTest, GuardBlocks) { 255 CheckGuardBlocks(); 256 } 257 258 TEST_P(ConvolveTest, CopyHoriz) { 259 uint8_t* const in = input(); 260 uint8_t* const out = output(); 261 DECLARE_ALIGNED(256, const int16_t, filter8[8]) = {0, 0, 0, 128, 0, 0, 0, 0}; 262 263 REGISTER_STATE_CHECK( 264 UUT_->h8_(in, kInputStride, out, kOutputStride, filter8, 16, filter8, 16, 265 Width(), Height())); 266 267 CheckGuardBlocks(); 268 269 for (int y = 0; y < Height(); ++y) 270 for (int x = 0; x < Width(); ++x) 271 ASSERT_EQ(out[y * kOutputStride + x], in[y * kInputStride + x]) 272 << "(" << x << "," << y << ")"; 273 } 274 275 TEST_P(ConvolveTest, CopyVert) { 276 uint8_t* const in = input(); 277 uint8_t* const out = output(); 278 DECLARE_ALIGNED(256, const int16_t, filter8[8]) = {0, 0, 0, 128, 0, 0, 0, 0}; 279 280 REGISTER_STATE_CHECK( 281 UUT_->v8_(in, kInputStride, out, kOutputStride, filter8, 16, filter8, 16, 282 Width(), Height())); 283 284 CheckGuardBlocks(); 285 286 for (int y = 0; y < Height(); ++y) 287 for (int x = 0; x < Width(); ++x) 288 ASSERT_EQ(out[y * kOutputStride + x], in[y * kInputStride + x]) 289 << "(" << x << "," << y << ")"; 290 } 291 292 TEST_P(ConvolveTest, Copy2D) { 293 uint8_t* const in = input(); 294 uint8_t* const out = output(); 295 DECLARE_ALIGNED(256, const int16_t, filter8[8]) = {0, 0, 0, 128, 0, 0, 0, 0}; 296 297 REGISTER_STATE_CHECK( 298 UUT_->hv8_(in, kInputStride, out, kOutputStride, filter8, 16, filter8, 16, 299 Width(), Height())); 300 301 CheckGuardBlocks(); 302 303 for (int y = 0; y < Height(); ++y) 304 for (int x = 0; x < Width(); ++x) 305 ASSERT_EQ(out[y * kOutputStride + x], in[y * kInputStride + x]) 306 << "(" << x << "," << y << ")"; 307 } 308 309 const int16_t (*kTestFilterList[])[8] = { 310 vp9_bilinear_filters, 311 vp9_sub_pel_filters_8, 312 vp9_sub_pel_filters_8s, 313 vp9_sub_pel_filters_8lp 314 }; 315 const int kNumFilterBanks = sizeof(kTestFilterList) / 316 sizeof(kTestFilterList[0]); 317 const int kNumFilters = 16; 318 319 TEST(ConvolveTest, FiltersWontSaturateWhenAddedPairwise) { 320 for (int filter_bank = 0; filter_bank < kNumFilterBanks; ++filter_bank) { 321 const int16_t (*filters)[8] = kTestFilterList[filter_bank]; 322 for (int i = 0; i < kNumFilters; i++) { 323 const int p0 = filters[i][0] + filters[i][1]; 324 const int p1 = filters[i][2] + filters[i][3]; 325 const int p2 = filters[i][4] + filters[i][5]; 326 const int p3 = filters[i][6] + filters[i][7]; 327 EXPECT_LE(p0, 128); 328 EXPECT_LE(p1, 128); 329 EXPECT_LE(p2, 128); 330 EXPECT_LE(p3, 128); 331 EXPECT_LE(p0 + p3, 128); 332 EXPECT_LE(p0 + p3 + p1, 128); 333 EXPECT_LE(p0 + p3 + p1 + p2, 128); 334 EXPECT_EQ(p0 + p1 + p2 + p3, 128); 335 } 336 } 337 } 338 339 const int16_t kInvalidFilter[8] = { 0 }; 340 341 TEST_P(ConvolveTest, MatchesReferenceSubpixelFilter) { 342 uint8_t* const in = input(); 343 uint8_t* const out = output(); 344 uint8_t ref[kOutputStride * kMaxDimension]; 345 346 347 for (int filter_bank = 0; filter_bank < kNumFilterBanks; ++filter_bank) { 348 const int16_t (*filters)[8] = kTestFilterList[filter_bank]; 349 350 for (int filter_x = 0; filter_x < kNumFilters; ++filter_x) { 351 for (int filter_y = 0; filter_y < kNumFilters; ++filter_y) { 352 filter_block2d_8_c(in, kInputStride, 353 filters[filter_x], filters[filter_y], 354 ref, kOutputStride, 355 Width(), Height()); 356 357 if (filters == vp9_sub_pel_filters_8lp || (filter_x && filter_y)) 358 REGISTER_STATE_CHECK( 359 UUT_->hv8_(in, kInputStride, out, kOutputStride, 360 filters[filter_x], 16, filters[filter_y], 16, 361 Width(), Height())); 362 else if (filter_y) 363 REGISTER_STATE_CHECK( 364 UUT_->v8_(in, kInputStride, out, kOutputStride, 365 kInvalidFilter, 16, filters[filter_y], 16, 366 Width(), Height())); 367 else 368 REGISTER_STATE_CHECK( 369 UUT_->h8_(in, kInputStride, out, kOutputStride, 370 filters[filter_x], 16, kInvalidFilter, 16, 371 Width(), Height())); 372 373 CheckGuardBlocks(); 374 375 for (int y = 0; y < Height(); ++y) 376 for (int x = 0; x < Width(); ++x) 377 ASSERT_EQ(ref[y * kOutputStride + x], out[y * kOutputStride + x]) 378 << "mismatch at (" << x << "," << y << "), " 379 << "filters (" << filter_bank << "," 380 << filter_x << "," << filter_y << ")"; 381 } 382 } 383 } 384 } 385 386 TEST_P(ConvolveTest, MatchesReferenceAveragingSubpixelFilter) { 387 uint8_t* const in = input(); 388 uint8_t* const out = output(); 389 uint8_t ref[kOutputStride * kMaxDimension]; 390 391 // Populate ref and out with some random data 392 ::libvpx_test::ACMRandom prng; 393 for (int y = 0; y < Height(); ++y) { 394 for (int x = 0; x < Width(); ++x) { 395 const uint8_t r = prng.Rand8Extremes(); 396 397 out[y * kOutputStride + x] = r; 398 ref[y * kOutputStride + x] = r; 399 } 400 } 401 402 const int kNumFilterBanks = sizeof(kTestFilterList) / 403 sizeof(kTestFilterList[0]); 404 405 for (int filter_bank = 0; filter_bank < kNumFilterBanks; ++filter_bank) { 406 const int16_t (*filters)[8] = kTestFilterList[filter_bank]; 407 const int kNumFilters = 16; 408 409 for (int filter_x = 0; filter_x < kNumFilters; ++filter_x) { 410 for (int filter_y = 0; filter_y < kNumFilters; ++filter_y) { 411 filter_average_block2d_8_c(in, kInputStride, 412 filters[filter_x], filters[filter_y], 413 ref, kOutputStride, 414 Width(), Height()); 415 416 if (filters == vp9_sub_pel_filters_8lp || (filter_x && filter_y)) 417 REGISTER_STATE_CHECK( 418 UUT_->hv8_avg_(in, kInputStride, out, kOutputStride, 419 filters[filter_x], 16, filters[filter_y], 16, 420 Width(), Height())); 421 else if (filter_y) 422 REGISTER_STATE_CHECK( 423 UUT_->v8_avg_(in, kInputStride, out, kOutputStride, 424 filters[filter_x], 16, filters[filter_y], 16, 425 Width(), Height())); 426 else 427 REGISTER_STATE_CHECK( 428 UUT_->h8_avg_(in, kInputStride, out, kOutputStride, 429 filters[filter_x], 16, filters[filter_y], 16, 430 Width(), Height())); 431 432 CheckGuardBlocks(); 433 434 for (int y = 0; y < Height(); ++y) 435 for (int x = 0; x < Width(); ++x) 436 ASSERT_EQ(ref[y * kOutputStride + x], out[y * kOutputStride + x]) 437 << "mismatch at (" << x << "," << y << "), " 438 << "filters (" << filter_bank << "," 439 << filter_x << "," << filter_y << ")"; 440 } 441 } 442 } 443 } 444 445 DECLARE_ALIGNED(256, const int16_t, kChangeFilters[16][8]) = { 446 { 0, 0, 0, 0, 0, 0, 0, 128}, 447 { 0, 0, 0, 0, 0, 0, 128}, 448 { 0, 0, 0, 0, 0, 128}, 449 { 0, 0, 0, 0, 128}, 450 { 0, 0, 0, 128}, 451 { 0, 0, 128}, 452 { 0, 128}, 453 { 128}, 454 { 0, 0, 0, 0, 0, 0, 0, 128}, 455 { 0, 0, 0, 0, 0, 0, 128}, 456 { 0, 0, 0, 0, 0, 128}, 457 { 0, 0, 0, 0, 128}, 458 { 0, 0, 0, 128}, 459 { 0, 0, 128}, 460 { 0, 128}, 461 { 128} 462 }; 463 464 /* This test exercises the horizontal and vertical filter functions. */ 465 TEST_P(ConvolveTest, ChangeFilterWorks) { 466 uint8_t* const in = input(); 467 uint8_t* const out = output(); 468 469 /* Assume that the first input sample is at the 8/16th position. */ 470 const int kInitialSubPelOffset = 8; 471 472 /* Filters are 8-tap, so the first filter tap will be applied to the pixel 473 * at position -3 with respect to the current filtering position. Since 474 * kInitialSubPelOffset is set to 8, we first select sub-pixel filter 8, 475 * which is non-zero only in the last tap. So, applying the filter at the 476 * current input position will result in an output equal to the pixel at 477 * offset +4 (-3 + 7) with respect to the current filtering position. 478 */ 479 const int kPixelSelected = 4; 480 481 /* Assume that each output pixel requires us to step on by 17/16th pixels in 482 * the input. 483 */ 484 const int kInputPixelStep = 17; 485 486 /* The filters are setup in such a way that the expected output produces 487 * sets of 8 identical output samples. As the filter position moves to the 488 * next 1/16th pixel position the only active (=128) filter tap moves one 489 * position to the left, resulting in the same input pixel being replicated 490 * in to the output for 8 consecutive samples. After each set of 8 positions 491 * the filters select a different input pixel. kFilterPeriodAdjust below 492 * computes which input pixel is written to the output for a specified 493 * x or y position. 494 */ 495 496 /* Test the horizontal filter. */ 497 REGISTER_STATE_CHECK(UUT_->h8_(in, kInputStride, out, kOutputStride, 498 kChangeFilters[kInitialSubPelOffset], 499 kInputPixelStep, NULL, 0, Width(), Height())); 500 501 for (int x = 0; x < Width(); ++x) { 502 const int kFilterPeriodAdjust = (x >> 3) << 3; 503 const int ref_x = 504 kPixelSelected + ((kInitialSubPelOffset 505 + kFilterPeriodAdjust * kInputPixelStep) 506 >> SUBPEL_BITS); 507 ASSERT_EQ(in[ref_x], out[x]) << "x == " << x << "width = " << Width(); 508 } 509 510 /* Test the vertical filter. */ 511 REGISTER_STATE_CHECK(UUT_->v8_(in, kInputStride, out, kOutputStride, 512 NULL, 0, kChangeFilters[kInitialSubPelOffset], 513 kInputPixelStep, Width(), Height())); 514 515 for (int y = 0; y < Height(); ++y) { 516 const int kFilterPeriodAdjust = (y >> 3) << 3; 517 const int ref_y = 518 kPixelSelected + ((kInitialSubPelOffset 519 + kFilterPeriodAdjust * kInputPixelStep) 520 >> SUBPEL_BITS); 521 ASSERT_EQ(in[ref_y * kInputStride], out[y * kInputStride]) << "y == " << y; 522 } 523 524 /* Test the horizontal and vertical filters in combination. */ 525 REGISTER_STATE_CHECK(UUT_->hv8_(in, kInputStride, out, kOutputStride, 526 kChangeFilters[kInitialSubPelOffset], 527 kInputPixelStep, 528 kChangeFilters[kInitialSubPelOffset], 529 kInputPixelStep, 530 Width(), Height())); 531 532 for (int y = 0; y < Height(); ++y) { 533 const int kFilterPeriodAdjustY = (y >> 3) << 3; 534 const int ref_y = 535 kPixelSelected + ((kInitialSubPelOffset 536 + kFilterPeriodAdjustY * kInputPixelStep) 537 >> SUBPEL_BITS); 538 for (int x = 0; x < Width(); ++x) { 539 const int kFilterPeriodAdjustX = (x >> 3) << 3; 540 const int ref_x = 541 kPixelSelected + ((kInitialSubPelOffset 542 + kFilterPeriodAdjustX * kInputPixelStep) 543 >> SUBPEL_BITS); 544 545 ASSERT_EQ(in[ref_y * kInputStride + ref_x], out[y * kOutputStride + x]) 546 << "x == " << x << ", y == " << y; 547 } 548 } 549 } 550 551 /* This test exercises that enough rows and columns are filtered with every 552 possible initial fractional positions and scaling steps. */ 553 TEST_P(ConvolveTest, CheckScalingFiltering) { 554 uint8_t* const in = input(); 555 uint8_t* const out = output(); 556 557 SetConstantInput(127); 558 559 for (int frac = 0; frac < 16; ++frac) { 560 for (int step = 1; step <= 32; ++step) { 561 /* Test the horizontal and vertical filters in combination. */ 562 REGISTER_STATE_CHECK(UUT_->hv8_(in, kInputStride, out, kOutputStride, 563 vp9_sub_pel_filters_8[frac], step, 564 vp9_sub_pel_filters_8[frac], step, 565 Width(), Height())); 566 567 CheckGuardBlocks(); 568 569 for (int y = 0; y < Height(); ++y) { 570 for (int x = 0; x < Width(); ++x) { 571 ASSERT_EQ(in[y * kInputStride + x], out[y * kOutputStride + x]) 572 << "x == " << x << ", y == " << y 573 << ", frac == " << frac << ", step == " << step; 574 } 575 } 576 } 577 } 578 } 579 580 using std::tr1::make_tuple; 581 582 const ConvolveFunctions convolve8_c( 583 vp9_convolve8_horiz_c, vp9_convolve8_avg_horiz_c, 584 vp9_convolve8_vert_c, vp9_convolve8_avg_vert_c, 585 vp9_convolve8_c, vp9_convolve8_avg_c); 586 587 INSTANTIATE_TEST_CASE_P(C, ConvolveTest, ::testing::Values( 588 make_tuple(4, 4, &convolve8_c), 589 make_tuple(8, 4, &convolve8_c), 590 make_tuple(4, 8, &convolve8_c), 591 make_tuple(8, 8, &convolve8_c), 592 make_tuple(16, 8, &convolve8_c), 593 make_tuple(8, 16, &convolve8_c), 594 make_tuple(16, 16, &convolve8_c), 595 make_tuple(32, 16, &convolve8_c), 596 make_tuple(16, 32, &convolve8_c), 597 make_tuple(32, 32, &convolve8_c), 598 make_tuple(64, 32, &convolve8_c), 599 make_tuple(32, 64, &convolve8_c), 600 make_tuple(64, 64, &convolve8_c))); 601 602 #if HAVE_SSE2 603 const ConvolveFunctions convolve8_sse2( 604 vp9_convolve8_horiz_sse2, vp9_convolve8_avg_horiz_sse2, 605 vp9_convolve8_vert_sse2, vp9_convolve8_avg_vert_sse2, 606 vp9_convolve8_sse2, vp9_convolve8_avg_sse2); 607 608 INSTANTIATE_TEST_CASE_P(SSE2, ConvolveTest, ::testing::Values( 609 make_tuple(4, 4, &convolve8_sse2), 610 make_tuple(8, 4, &convolve8_sse2), 611 make_tuple(4, 8, &convolve8_sse2), 612 make_tuple(8, 8, &convolve8_sse2), 613 make_tuple(16, 8, &convolve8_sse2), 614 make_tuple(8, 16, &convolve8_sse2), 615 make_tuple(16, 16, &convolve8_sse2), 616 make_tuple(32, 16, &convolve8_sse2), 617 make_tuple(16, 32, &convolve8_sse2), 618 make_tuple(32, 32, &convolve8_sse2), 619 make_tuple(64, 32, &convolve8_sse2), 620 make_tuple(32, 64, &convolve8_sse2), 621 make_tuple(64, 64, &convolve8_sse2))); 622 #endif 623 624 #if HAVE_SSSE3 625 const ConvolveFunctions convolve8_ssse3( 626 vp9_convolve8_horiz_ssse3, vp9_convolve8_avg_horiz_ssse3, 627 vp9_convolve8_vert_ssse3, vp9_convolve8_avg_vert_ssse3, 628 vp9_convolve8_ssse3, vp9_convolve8_avg_ssse3); 629 630 INSTANTIATE_TEST_CASE_P(SSSE3, ConvolveTest, ::testing::Values( 631 make_tuple(4, 4, &convolve8_ssse3), 632 make_tuple(8, 4, &convolve8_ssse3), 633 make_tuple(4, 8, &convolve8_ssse3), 634 make_tuple(8, 8, &convolve8_ssse3), 635 make_tuple(16, 8, &convolve8_ssse3), 636 make_tuple(8, 16, &convolve8_ssse3), 637 make_tuple(16, 16, &convolve8_ssse3), 638 make_tuple(32, 16, &convolve8_ssse3), 639 make_tuple(16, 32, &convolve8_ssse3), 640 make_tuple(32, 32, &convolve8_ssse3), 641 make_tuple(64, 32, &convolve8_ssse3), 642 make_tuple(32, 64, &convolve8_ssse3), 643 make_tuple(64, 64, &convolve8_ssse3))); 644 #endif 645 646 #if HAVE_NEON 647 const ConvolveFunctions convolve8_neon( 648 vp9_convolve8_horiz_neon, vp9_convolve8_avg_horiz_neon, 649 vp9_convolve8_vert_neon, vp9_convolve8_avg_vert_neon, 650 vp9_convolve8_neon, vp9_convolve8_avg_neon); 651 652 INSTANTIATE_TEST_CASE_P(NEON, ConvolveTest, ::testing::Values( 653 make_tuple(4, 4, &convolve8_neon), 654 make_tuple(8, 4, &convolve8_neon), 655 make_tuple(4, 8, &convolve8_neon), 656 make_tuple(8, 8, &convolve8_neon), 657 make_tuple(16, 8, &convolve8_neon), 658 make_tuple(8, 16, &convolve8_neon), 659 make_tuple(16, 16, &convolve8_neon), 660 make_tuple(32, 16, &convolve8_neon), 661 make_tuple(16, 32, &convolve8_neon), 662 make_tuple(32, 32, &convolve8_neon), 663 make_tuple(64, 32, &convolve8_neon), 664 make_tuple(32, 64, &convolve8_neon), 665 make_tuple(64, 64, &convolve8_neon))); 666 #endif 667 668 #if HAVE_DSPR2 669 const ConvolveFunctions convolve8_dspr2( 670 vp9_convolve8_horiz_dspr2, vp9_convolve8_avg_horiz_dspr2, 671 vp9_convolve8_vert_dspr2, vp9_convolve8_avg_vert_dspr2, 672 vp9_convolve8_dspr2, vp9_convolve8_avg_dspr2); 673 674 INSTANTIATE_TEST_CASE_P(DSPR2, ConvolveTest, ::testing::Values( 675 make_tuple(4, 4, &convolve8_dspr2), 676 make_tuple(8, 4, &convolve8_dspr2), 677 make_tuple(4, 8, &convolve8_dspr2), 678 make_tuple(8, 8, &convolve8_dspr2), 679 make_tuple(16, 8, &convolve8_dspr2), 680 make_tuple(8, 16, &convolve8_dspr2), 681 make_tuple(16, 16, &convolve8_dspr2), 682 make_tuple(32, 16, &convolve8_dspr2), 683 make_tuple(16, 32, &convolve8_dspr2), 684 make_tuple(32, 32, &convolve8_dspr2), 685 make_tuple(64, 32, &convolve8_dspr2), 686 make_tuple(32, 64, &convolve8_dspr2), 687 make_tuple(64, 64, &convolve8_dspr2))); 688 #endif 689 } // namespace 690