/* * Copyright (c) 2012 The WebM project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include #include #include #include "./vpx_config.h" #include "./vpx_dsp_rtcd.h" #include "vpx_mem/vpx_mem.h" /* Needed for ROUND_POWER_OF_TWO and CONVERT_TO* macros, both of which should be * moved to a more generic location. Alternatively the *avg functions could be * restricted to VP9 builds, but it would be better to avoid that sort of * specificity. * TODO(johannkoenig): move these macros to a common location. */ #if CONFIG_VP9_HIGHBITDEPTH #include "vp9/common/vp9_common.h" #endif // CONFIG_VP9_HIGHBITDEPTH #ifndef ROUND_POWER_OF_TWO #define ROUND_POWER_OF_TWO(value, n) \ (((value) + (1 << ((n) - 1))) >> (n)) #endif // ROUND_POWER_OF_TWO #include "test/acm_random.h" #include "test/clear_system_state.h" #include "test/register_state_check.h" #include "test/util.h" #include "third_party/googletest/src/include/gtest/gtest.h" #include "vpx/vpx_codec.h" typedef unsigned int (*SadMxNFunc)(const uint8_t *src_ptr, int src_stride, const uint8_t *ref_ptr, int ref_stride); typedef std::tr1::tuple SadMxNParam; typedef uint32_t (*SadMxNAvgFunc)(const uint8_t *src_ptr, int src_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred); typedef std::tr1::tuple SadMxNAvgParam; typedef void (*SadMxNx4Func)(const uint8_t *src_ptr, int src_stride, const uint8_t *const ref_ptr[], int ref_stride, uint32_t *sad_array); typedef std::tr1::tuple SadMxNx4Param; using libvpx_test::ACMRandom; namespace { class SADTestBase : public ::testing::Test { public: SADTestBase(int width, int height, int bit_depth) : width_(width), height_(height), bd_(bit_depth) {} static void SetUpTestCase() { source_data8_ = reinterpret_cast( vpx_memalign(kDataAlignment, kDataBlockSize)); reference_data8_ = reinterpret_cast( vpx_memalign(kDataAlignment, kDataBufferSize)); second_pred8_ = reinterpret_cast( vpx_memalign(kDataAlignment, 64*64)); source_data16_ = reinterpret_cast( vpx_memalign(kDataAlignment, kDataBlockSize*sizeof(uint16_t))); reference_data16_ = reinterpret_cast( vpx_memalign(kDataAlignment, kDataBufferSize*sizeof(uint16_t))); second_pred16_ = reinterpret_cast( vpx_memalign(kDataAlignment, 64*64*sizeof(uint16_t))); } static void TearDownTestCase() { vpx_free(source_data8_); source_data8_ = NULL; vpx_free(reference_data8_); reference_data8_ = NULL; vpx_free(second_pred8_); second_pred8_ = NULL; vpx_free(source_data16_); source_data16_ = NULL; vpx_free(reference_data16_); reference_data16_ = NULL; vpx_free(second_pred16_); second_pred16_ = NULL; } virtual void TearDown() { libvpx_test::ClearSystemState(); } protected: // Handle blocks up to 4 blocks 64x64 with stride up to 128 static const int kDataAlignment = 16; static const int kDataBlockSize = 64 * 128; static const int kDataBufferSize = 4 * kDataBlockSize; virtual void SetUp() { if (bd_ == -1) { use_high_bit_depth_ = false; bit_depth_ = VPX_BITS_8; source_data_ = source_data8_; reference_data_ = reference_data8_; second_pred_ = second_pred8_; #if CONFIG_VP9_HIGHBITDEPTH } else { use_high_bit_depth_ = true; bit_depth_ = static_cast(bd_); source_data_ = CONVERT_TO_BYTEPTR(source_data16_); reference_data_ = CONVERT_TO_BYTEPTR(reference_data16_); second_pred_ = CONVERT_TO_BYTEPTR(second_pred16_); #endif // CONFIG_VP9_HIGHBITDEPTH } mask_ = (1 << bit_depth_) - 1; source_stride_ = (width_ + 31) & ~31; reference_stride_ = width_ * 2; rnd_.Reset(ACMRandom::DeterministicSeed()); } virtual uint8_t *GetReference(int block_idx) { #if CONFIG_VP9_HIGHBITDEPTH if (use_high_bit_depth_) return CONVERT_TO_BYTEPTR(CONVERT_TO_SHORTPTR(reference_data_) + block_idx * kDataBlockSize); #endif // CONFIG_VP9_HIGHBITDEPTH return reference_data_ + block_idx * kDataBlockSize; } // Sum of Absolute Differences. Given two blocks, calculate the absolute // difference between two pixels in the same relative location; accumulate. unsigned int ReferenceSAD(int block_idx) { unsigned int sad = 0; const uint8_t *const reference8 = GetReference(block_idx); const uint8_t *const source8 = source_data_; #if CONFIG_VP9_HIGHBITDEPTH const uint16_t *const reference16 = CONVERT_TO_SHORTPTR(GetReference(block_idx)); const uint16_t *const source16 = CONVERT_TO_SHORTPTR(source_data_); #endif // CONFIG_VP9_HIGHBITDEPTH for (int h = 0; h < height_; ++h) { for (int w = 0; w < width_; ++w) { if (!use_high_bit_depth_) { sad += abs(source8[h * source_stride_ + w] - reference8[h * reference_stride_ + w]); #if CONFIG_VP9_HIGHBITDEPTH } else { sad += abs(source16[h * source_stride_ + w] - reference16[h * reference_stride_ + w]); #endif // CONFIG_VP9_HIGHBITDEPTH } } } return sad; } // Sum of Absolute Differences Average. Given two blocks, and a prediction // calculate the absolute difference between one pixel and average of the // corresponding and predicted pixels; accumulate. unsigned int ReferenceSADavg(int block_idx) { unsigned int sad = 0; const uint8_t *const reference8 = GetReference(block_idx); const uint8_t *const source8 = source_data_; const uint8_t *const second_pred8 = second_pred_; #if CONFIG_VP9_HIGHBITDEPTH const uint16_t *const reference16 = CONVERT_TO_SHORTPTR(GetReference(block_idx)); const uint16_t *const source16 = CONVERT_TO_SHORTPTR(source_data_); const uint16_t *const second_pred16 = CONVERT_TO_SHORTPTR(second_pred_); #endif // CONFIG_VP9_HIGHBITDEPTH for (int h = 0; h < height_; ++h) { for (int w = 0; w < width_; ++w) { if (!use_high_bit_depth_) { const int tmp = second_pred8[h * width_ + w] + reference8[h * reference_stride_ + w]; const uint8_t comp_pred = ROUND_POWER_OF_TWO(tmp, 1); sad += abs(source8[h * source_stride_ + w] - comp_pred); #if CONFIG_VP9_HIGHBITDEPTH } else { const int tmp = second_pred16[h * width_ + w] + reference16[h * reference_stride_ + w]; const uint16_t comp_pred = ROUND_POWER_OF_TWO(tmp, 1); sad += abs(source16[h * source_stride_ + w] - comp_pred); #endif // CONFIG_VP9_HIGHBITDEPTH } } } return sad; } void FillConstant(uint8_t *data, int stride, uint16_t fill_constant) { uint8_t *data8 = data; #if CONFIG_VP9_HIGHBITDEPTH uint16_t *data16 = CONVERT_TO_SHORTPTR(data); #endif // CONFIG_VP9_HIGHBITDEPTH for (int h = 0; h < height_; ++h) { for (int w = 0; w < width_; ++w) { if (!use_high_bit_depth_) { data8[h * stride + w] = static_cast(fill_constant); #if CONFIG_VP9_HIGHBITDEPTH } else { data16[h * stride + w] = fill_constant; #endif // CONFIG_VP9_HIGHBITDEPTH } } } } void FillRandom(uint8_t *data, int stride) { uint8_t *data8 = data; #if CONFIG_VP9_HIGHBITDEPTH uint16_t *data16 = CONVERT_TO_SHORTPTR(data); #endif // CONFIG_VP9_HIGHBITDEPTH for (int h = 0; h < height_; ++h) { for (int w = 0; w < width_; ++w) { if (!use_high_bit_depth_) { data8[h * stride + w] = rnd_.Rand8(); #if CONFIG_VP9_HIGHBITDEPTH } else { data16[h * stride + w] = rnd_.Rand16() & mask_; #endif // CONFIG_VP9_HIGHBITDEPTH } } } } int width_, height_, mask_, bd_; vpx_bit_depth_t bit_depth_; static uint8_t *source_data_; static uint8_t *reference_data_; static uint8_t *second_pred_; int source_stride_; bool use_high_bit_depth_; static uint8_t *source_data8_; static uint8_t *reference_data8_; static uint8_t *second_pred8_; static uint16_t *source_data16_; static uint16_t *reference_data16_; static uint16_t *second_pred16_; int reference_stride_; ACMRandom rnd_; }; class SADx4Test : public SADTestBase, public ::testing::WithParamInterface { public: SADx4Test() : SADTestBase(GET_PARAM(0), GET_PARAM(1), GET_PARAM(3)) {} protected: void SADs(unsigned int *results) { const uint8_t *references[] = {GetReference(0), GetReference(1), GetReference(2), GetReference(3)}; ASM_REGISTER_STATE_CHECK(GET_PARAM(2)(source_data_, source_stride_, references, reference_stride_, results)); } void CheckSADs() { unsigned int reference_sad, exp_sad[4]; SADs(exp_sad); for (int block = 0; block < 4; ++block) { reference_sad = ReferenceSAD(block); EXPECT_EQ(reference_sad, exp_sad[block]) << "block " << block; } } }; class SADTest : public SADTestBase, public ::testing::WithParamInterface { public: SADTest() : SADTestBase(GET_PARAM(0), GET_PARAM(1), GET_PARAM(3)) {} protected: unsigned int SAD(int block_idx) { unsigned int ret; const uint8_t *const reference = GetReference(block_idx); ASM_REGISTER_STATE_CHECK(ret = GET_PARAM(2)(source_data_, source_stride_, reference, reference_stride_)); return ret; } void CheckSAD() { const unsigned int reference_sad = ReferenceSAD(0); const unsigned int exp_sad = SAD(0); ASSERT_EQ(reference_sad, exp_sad); } }; class SADavgTest : public SADTestBase, public ::testing::WithParamInterface { public: SADavgTest() : SADTestBase(GET_PARAM(0), GET_PARAM(1), GET_PARAM(3)) {} protected: unsigned int SAD_avg(int block_idx) { unsigned int ret; const uint8_t *const reference = GetReference(block_idx); ASM_REGISTER_STATE_CHECK(ret = GET_PARAM(2)(source_data_, source_stride_, reference, reference_stride_, second_pred_)); return ret; } void CheckSAD() { const unsigned int reference_sad = ReferenceSADavg(0); const unsigned int exp_sad = SAD_avg(0); ASSERT_EQ(reference_sad, exp_sad); } }; uint8_t *SADTestBase::source_data_ = NULL; uint8_t *SADTestBase::reference_data_ = NULL; uint8_t *SADTestBase::second_pred_ = NULL; uint8_t *SADTestBase::source_data8_ = NULL; uint8_t *SADTestBase::reference_data8_ = NULL; uint8_t *SADTestBase::second_pred8_ = NULL; uint16_t *SADTestBase::source_data16_ = NULL; uint16_t *SADTestBase::reference_data16_ = NULL; uint16_t *SADTestBase::second_pred16_ = NULL; TEST_P(SADTest, MaxRef) { FillConstant(source_data_, source_stride_, 0); FillConstant(reference_data_, reference_stride_, mask_); CheckSAD(); } TEST_P(SADTest, MaxSrc) { FillConstant(source_data_, source_stride_, mask_); FillConstant(reference_data_, reference_stride_, 0); CheckSAD(); } TEST_P(SADTest, ShortRef) { const int tmp_stride = reference_stride_; reference_stride_ >>= 1; FillRandom(source_data_, source_stride_); FillRandom(reference_data_, reference_stride_); CheckSAD(); reference_stride_ = tmp_stride; } TEST_P(SADTest, UnalignedRef) { // The reference frame, but not the source frame, may be unaligned for // certain types of searches. const int tmp_stride = reference_stride_; reference_stride_ -= 1; FillRandom(source_data_, source_stride_); FillRandom(reference_data_, reference_stride_); CheckSAD(); reference_stride_ = tmp_stride; } TEST_P(SADTest, ShortSrc) { const int tmp_stride = source_stride_; source_stride_ >>= 1; FillRandom(source_data_, source_stride_); FillRandom(reference_data_, reference_stride_); CheckSAD(); source_stride_ = tmp_stride; } TEST_P(SADavgTest, MaxRef) { FillConstant(source_data_, source_stride_, 0); FillConstant(reference_data_, reference_stride_, mask_); FillConstant(second_pred_, width_, 0); CheckSAD(); } TEST_P(SADavgTest, MaxSrc) { FillConstant(source_data_, source_stride_, mask_); FillConstant(reference_data_, reference_stride_, 0); FillConstant(second_pred_, width_, 0); CheckSAD(); } TEST_P(SADavgTest, ShortRef) { const int tmp_stride = reference_stride_; reference_stride_ >>= 1; FillRandom(source_data_, source_stride_); FillRandom(reference_data_, reference_stride_); FillRandom(second_pred_, width_); CheckSAD(); reference_stride_ = tmp_stride; } TEST_P(SADavgTest, UnalignedRef) { // The reference frame, but not the source frame, may be unaligned for // certain types of searches. const int tmp_stride = reference_stride_; reference_stride_ -= 1; FillRandom(source_data_, source_stride_); FillRandom(reference_data_, reference_stride_); FillRandom(second_pred_, width_); CheckSAD(); reference_stride_ = tmp_stride; } TEST_P(SADavgTest, ShortSrc) { const int tmp_stride = source_stride_; source_stride_ >>= 1; FillRandom(source_data_, source_stride_); FillRandom(reference_data_, reference_stride_); FillRandom(second_pred_, width_); CheckSAD(); source_stride_ = tmp_stride; } TEST_P(SADx4Test, MaxRef) { FillConstant(source_data_, source_stride_, 0); FillConstant(GetReference(0), reference_stride_, mask_); FillConstant(GetReference(1), reference_stride_, mask_); FillConstant(GetReference(2), reference_stride_, mask_); FillConstant(GetReference(3), reference_stride_, mask_); CheckSADs(); } TEST_P(SADx4Test, MaxSrc) { FillConstant(source_data_, source_stride_, mask_); FillConstant(GetReference(0), reference_stride_, 0); FillConstant(GetReference(1), reference_stride_, 0); FillConstant(GetReference(2), reference_stride_, 0); FillConstant(GetReference(3), reference_stride_, 0); CheckSADs(); } TEST_P(SADx4Test, ShortRef) { int tmp_stride = reference_stride_; reference_stride_ >>= 1; FillRandom(source_data_, source_stride_); FillRandom(GetReference(0), reference_stride_); FillRandom(GetReference(1), reference_stride_); FillRandom(GetReference(2), reference_stride_); FillRandom(GetReference(3), reference_stride_); CheckSADs(); reference_stride_ = tmp_stride; } TEST_P(SADx4Test, UnalignedRef) { // The reference frame, but not the source frame, may be unaligned for // certain types of searches. int tmp_stride = reference_stride_; reference_stride_ -= 1; FillRandom(source_data_, source_stride_); FillRandom(GetReference(0), reference_stride_); FillRandom(GetReference(1), reference_stride_); FillRandom(GetReference(2), reference_stride_); FillRandom(GetReference(3), reference_stride_); CheckSADs(); reference_stride_ = tmp_stride; } TEST_P(SADx4Test, ShortSrc) { int tmp_stride = source_stride_; source_stride_ >>= 1; FillRandom(source_data_, source_stride_); FillRandom(GetReference(0), reference_stride_); FillRandom(GetReference(1), reference_stride_); FillRandom(GetReference(2), reference_stride_); FillRandom(GetReference(3), reference_stride_); CheckSADs(); source_stride_ = tmp_stride; } TEST_P(SADx4Test, SrcAlignedByWidth) { uint8_t * tmp_source_data = source_data_; source_data_ += width_; FillRandom(source_data_, source_stride_); FillRandom(GetReference(0), reference_stride_); FillRandom(GetReference(1), reference_stride_); FillRandom(GetReference(2), reference_stride_); FillRandom(GetReference(3), reference_stride_); CheckSADs(); source_data_ = tmp_source_data; } using std::tr1::make_tuple; //------------------------------------------------------------------------------ // C functions const SadMxNFunc sad64x64_c = vpx_sad64x64_c; const SadMxNFunc sad64x32_c = vpx_sad64x32_c; const SadMxNFunc sad32x64_c = vpx_sad32x64_c; const SadMxNFunc sad32x32_c = vpx_sad32x32_c; const SadMxNFunc sad32x16_c = vpx_sad32x16_c; const SadMxNFunc sad16x32_c = vpx_sad16x32_c; const SadMxNFunc sad16x16_c = vpx_sad16x16_c; const SadMxNFunc sad16x8_c = vpx_sad16x8_c; const SadMxNFunc sad8x16_c = vpx_sad8x16_c; const SadMxNFunc sad8x8_c = vpx_sad8x8_c; const SadMxNFunc sad8x4_c = vpx_sad8x4_c; const SadMxNFunc sad4x8_c = vpx_sad4x8_c; const SadMxNFunc sad4x4_c = vpx_sad4x4_c; #if CONFIG_VP9_HIGHBITDEPTH const SadMxNFunc highbd_sad64x64_c = vpx_highbd_sad64x64_c; const SadMxNFunc highbd_sad64x32_c = vpx_highbd_sad64x32_c; const SadMxNFunc highbd_sad32x64_c = vpx_highbd_sad32x64_c; const SadMxNFunc highbd_sad32x32_c = vpx_highbd_sad32x32_c; const SadMxNFunc highbd_sad32x16_c = vpx_highbd_sad32x16_c; const SadMxNFunc highbd_sad16x32_c = vpx_highbd_sad16x32_c; const SadMxNFunc highbd_sad16x16_c = vpx_highbd_sad16x16_c; const SadMxNFunc highbd_sad16x8_c = vpx_highbd_sad16x8_c; const SadMxNFunc highbd_sad8x16_c = vpx_highbd_sad8x16_c; const SadMxNFunc highbd_sad8x8_c = vpx_highbd_sad8x8_c; const SadMxNFunc highbd_sad8x4_c = vpx_highbd_sad8x4_c; const SadMxNFunc highbd_sad4x8_c = vpx_highbd_sad4x8_c; const SadMxNFunc highbd_sad4x4_c = vpx_highbd_sad4x4_c; #endif // CONFIG_VP9_HIGHBITDEPTH const SadMxNParam c_tests[] = { make_tuple(64, 64, sad64x64_c, -1), make_tuple(64, 32, sad64x32_c, -1), make_tuple(32, 64, sad32x64_c, -1), make_tuple(32, 32, sad32x32_c, -1), make_tuple(32, 16, sad32x16_c, -1), make_tuple(16, 32, sad16x32_c, -1), make_tuple(16, 16, sad16x16_c, -1), make_tuple(16, 8, sad16x8_c, -1), make_tuple(8, 16, sad8x16_c, -1), make_tuple(8, 8, sad8x8_c, -1), make_tuple(8, 4, sad8x4_c, -1), make_tuple(4, 8, sad4x8_c, -1), make_tuple(4, 4, sad4x4_c, -1), #if CONFIG_VP9_HIGHBITDEPTH make_tuple(64, 64, highbd_sad64x64_c, 8), make_tuple(64, 32, highbd_sad64x32_c, 8), make_tuple(32, 64, highbd_sad32x64_c, 8), make_tuple(32, 32, highbd_sad32x32_c, 8), make_tuple(32, 16, highbd_sad32x16_c, 8), make_tuple(16, 32, highbd_sad16x32_c, 8), make_tuple(16, 16, highbd_sad16x16_c, 8), make_tuple(16, 8, highbd_sad16x8_c, 8), make_tuple(8, 16, highbd_sad8x16_c, 8), make_tuple(8, 8, highbd_sad8x8_c, 8), make_tuple(8, 4, highbd_sad8x4_c, 8), make_tuple(4, 8, highbd_sad4x8_c, 8), make_tuple(4, 4, highbd_sad4x4_c, 8), make_tuple(64, 64, highbd_sad64x64_c, 10), make_tuple(64, 32, highbd_sad64x32_c, 10), make_tuple(32, 64, highbd_sad32x64_c, 10), make_tuple(32, 32, highbd_sad32x32_c, 10), make_tuple(32, 16, highbd_sad32x16_c, 10), make_tuple(16, 32, highbd_sad16x32_c, 10), make_tuple(16, 16, highbd_sad16x16_c, 10), make_tuple(16, 8, highbd_sad16x8_c, 10), make_tuple(8, 16, highbd_sad8x16_c, 10), make_tuple(8, 8, highbd_sad8x8_c, 10), make_tuple(8, 4, highbd_sad8x4_c, 10), make_tuple(4, 8, highbd_sad4x8_c, 10), make_tuple(4, 4, highbd_sad4x4_c, 10), make_tuple(64, 64, highbd_sad64x64_c, 12), make_tuple(64, 32, highbd_sad64x32_c, 12), make_tuple(32, 64, highbd_sad32x64_c, 12), make_tuple(32, 32, highbd_sad32x32_c, 12), make_tuple(32, 16, highbd_sad32x16_c, 12), make_tuple(16, 32, highbd_sad16x32_c, 12), make_tuple(16, 16, highbd_sad16x16_c, 12), make_tuple(16, 8, highbd_sad16x8_c, 12), make_tuple(8, 16, highbd_sad8x16_c, 12), make_tuple(8, 8, highbd_sad8x8_c, 12), make_tuple(8, 4, highbd_sad8x4_c, 12), make_tuple(4, 8, highbd_sad4x8_c, 12), make_tuple(4, 4, highbd_sad4x4_c, 12), #endif // CONFIG_VP9_HIGHBITDEPTH }; INSTANTIATE_TEST_CASE_P(C, SADTest, ::testing::ValuesIn(c_tests)); const SadMxNAvgFunc sad64x64_avg_c = vpx_sad64x64_avg_c; const SadMxNAvgFunc sad64x32_avg_c = vpx_sad64x32_avg_c; const SadMxNAvgFunc sad32x64_avg_c = vpx_sad32x64_avg_c; const SadMxNAvgFunc sad32x32_avg_c = vpx_sad32x32_avg_c; const SadMxNAvgFunc sad32x16_avg_c = vpx_sad32x16_avg_c; const SadMxNAvgFunc sad16x32_avg_c = vpx_sad16x32_avg_c; const SadMxNAvgFunc sad16x16_avg_c = vpx_sad16x16_avg_c; const SadMxNAvgFunc sad16x8_avg_c = vpx_sad16x8_avg_c; const SadMxNAvgFunc sad8x16_avg_c = vpx_sad8x16_avg_c; const SadMxNAvgFunc sad8x8_avg_c = vpx_sad8x8_avg_c; const SadMxNAvgFunc sad8x4_avg_c = vpx_sad8x4_avg_c; const SadMxNAvgFunc sad4x8_avg_c = vpx_sad4x8_avg_c; const SadMxNAvgFunc sad4x4_avg_c = vpx_sad4x4_avg_c; #if CONFIG_VP9_HIGHBITDEPTH const SadMxNAvgFunc highbd_sad64x64_avg_c = vpx_highbd_sad64x64_avg_c; const SadMxNAvgFunc highbd_sad64x32_avg_c = vpx_highbd_sad64x32_avg_c; const SadMxNAvgFunc highbd_sad32x64_avg_c = vpx_highbd_sad32x64_avg_c; const SadMxNAvgFunc highbd_sad32x32_avg_c = vpx_highbd_sad32x32_avg_c; const SadMxNAvgFunc highbd_sad32x16_avg_c = vpx_highbd_sad32x16_avg_c; const SadMxNAvgFunc highbd_sad16x32_avg_c = vpx_highbd_sad16x32_avg_c; const SadMxNAvgFunc highbd_sad16x16_avg_c = vpx_highbd_sad16x16_avg_c; const SadMxNAvgFunc highbd_sad16x8_avg_c = vpx_highbd_sad16x8_avg_c; const SadMxNAvgFunc highbd_sad8x16_avg_c = vpx_highbd_sad8x16_avg_c; const SadMxNAvgFunc highbd_sad8x8_avg_c = vpx_highbd_sad8x8_avg_c; const SadMxNAvgFunc highbd_sad8x4_avg_c = vpx_highbd_sad8x4_avg_c; const SadMxNAvgFunc highbd_sad4x8_avg_c = vpx_highbd_sad4x8_avg_c; const SadMxNAvgFunc highbd_sad4x4_avg_c = vpx_highbd_sad4x4_avg_c; #endif // CONFIG_VP9_HIGHBITDEPTH const SadMxNAvgParam avg_c_tests[] = { make_tuple(64, 64, sad64x64_avg_c, -1), make_tuple(64, 32, sad64x32_avg_c, -1), make_tuple(32, 64, sad32x64_avg_c, -1), make_tuple(32, 32, sad32x32_avg_c, -1), make_tuple(32, 16, sad32x16_avg_c, -1), make_tuple(16, 32, sad16x32_avg_c, -1), make_tuple(16, 16, sad16x16_avg_c, -1), make_tuple(16, 8, sad16x8_avg_c, -1), make_tuple(8, 16, sad8x16_avg_c, -1), make_tuple(8, 8, sad8x8_avg_c, -1), make_tuple(8, 4, sad8x4_avg_c, -1), make_tuple(4, 8, sad4x8_avg_c, -1), make_tuple(4, 4, sad4x4_avg_c, -1), #if CONFIG_VP9_HIGHBITDEPTH make_tuple(64, 64, highbd_sad64x64_avg_c, 8), make_tuple(64, 32, highbd_sad64x32_avg_c, 8), make_tuple(32, 64, highbd_sad32x64_avg_c, 8), make_tuple(32, 32, highbd_sad32x32_avg_c, 8), make_tuple(32, 16, highbd_sad32x16_avg_c, 8), make_tuple(16, 32, highbd_sad16x32_avg_c, 8), make_tuple(16, 16, highbd_sad16x16_avg_c, 8), make_tuple(16, 8, highbd_sad16x8_avg_c, 8), make_tuple(8, 16, highbd_sad8x16_avg_c, 8), make_tuple(8, 8, highbd_sad8x8_avg_c, 8), make_tuple(8, 4, highbd_sad8x4_avg_c, 8), make_tuple(4, 8, highbd_sad4x8_avg_c, 8), make_tuple(4, 4, highbd_sad4x4_avg_c, 8), make_tuple(64, 64, highbd_sad64x64_avg_c, 10), make_tuple(64, 32, highbd_sad64x32_avg_c, 10), make_tuple(32, 64, highbd_sad32x64_avg_c, 10), make_tuple(32, 32, highbd_sad32x32_avg_c, 10), make_tuple(32, 16, highbd_sad32x16_avg_c, 10), make_tuple(16, 32, highbd_sad16x32_avg_c, 10), make_tuple(16, 16, highbd_sad16x16_avg_c, 10), make_tuple(16, 8, highbd_sad16x8_avg_c, 10), make_tuple(8, 16, highbd_sad8x16_avg_c, 10), make_tuple(8, 8, highbd_sad8x8_avg_c, 10), make_tuple(8, 4, highbd_sad8x4_avg_c, 10), make_tuple(4, 8, highbd_sad4x8_avg_c, 10), make_tuple(4, 4, highbd_sad4x4_avg_c, 10), make_tuple(64, 64, highbd_sad64x64_avg_c, 12), make_tuple(64, 32, highbd_sad64x32_avg_c, 12), make_tuple(32, 64, highbd_sad32x64_avg_c, 12), make_tuple(32, 32, highbd_sad32x32_avg_c, 12), make_tuple(32, 16, highbd_sad32x16_avg_c, 12), make_tuple(16, 32, highbd_sad16x32_avg_c, 12), make_tuple(16, 16, highbd_sad16x16_avg_c, 12), make_tuple(16, 8, highbd_sad16x8_avg_c, 12), make_tuple(8, 16, highbd_sad8x16_avg_c, 12), make_tuple(8, 8, highbd_sad8x8_avg_c, 12), make_tuple(8, 4, highbd_sad8x4_avg_c, 12), make_tuple(4, 8, highbd_sad4x8_avg_c, 12), make_tuple(4, 4, highbd_sad4x4_avg_c, 12), #endif // CONFIG_VP9_HIGHBITDEPTH }; INSTANTIATE_TEST_CASE_P(C, SADavgTest, ::testing::ValuesIn(avg_c_tests)); const SadMxNx4Func sad64x64x4d_c = vpx_sad64x64x4d_c; const SadMxNx4Func sad64x32x4d_c = vpx_sad64x32x4d_c; const SadMxNx4Func sad32x64x4d_c = vpx_sad32x64x4d_c; const SadMxNx4Func sad32x32x4d_c = vpx_sad32x32x4d_c; const SadMxNx4Func sad32x16x4d_c = vpx_sad32x16x4d_c; const SadMxNx4Func sad16x32x4d_c = vpx_sad16x32x4d_c; const SadMxNx4Func sad16x16x4d_c = vpx_sad16x16x4d_c; const SadMxNx4Func sad16x8x4d_c = vpx_sad16x8x4d_c; const SadMxNx4Func sad8x16x4d_c = vpx_sad8x16x4d_c; const SadMxNx4Func sad8x8x4d_c = vpx_sad8x8x4d_c; const SadMxNx4Func sad8x4x4d_c = vpx_sad8x4x4d_c; const SadMxNx4Func sad4x8x4d_c = vpx_sad4x8x4d_c; const SadMxNx4Func sad4x4x4d_c = vpx_sad4x4x4d_c; #if CONFIG_VP9_HIGHBITDEPTH const SadMxNx4Func highbd_sad64x64x4d_c = vpx_highbd_sad64x64x4d_c; const SadMxNx4Func highbd_sad64x32x4d_c = vpx_highbd_sad64x32x4d_c; const SadMxNx4Func highbd_sad32x64x4d_c = vpx_highbd_sad32x64x4d_c; const SadMxNx4Func highbd_sad32x32x4d_c = vpx_highbd_sad32x32x4d_c; const SadMxNx4Func highbd_sad32x16x4d_c = vpx_highbd_sad32x16x4d_c; const SadMxNx4Func highbd_sad16x32x4d_c = vpx_highbd_sad16x32x4d_c; const SadMxNx4Func highbd_sad16x16x4d_c = vpx_highbd_sad16x16x4d_c; const SadMxNx4Func highbd_sad16x8x4d_c = vpx_highbd_sad16x8x4d_c; const SadMxNx4Func highbd_sad8x16x4d_c = vpx_highbd_sad8x16x4d_c; const SadMxNx4Func highbd_sad8x8x4d_c = vpx_highbd_sad8x8x4d_c; const SadMxNx4Func highbd_sad8x4x4d_c = vpx_highbd_sad8x4x4d_c; const SadMxNx4Func highbd_sad4x8x4d_c = vpx_highbd_sad4x8x4d_c; const SadMxNx4Func highbd_sad4x4x4d_c = vpx_highbd_sad4x4x4d_c; #endif // CONFIG_VP9_HIGHBITDEPTH const SadMxNx4Param x4d_c_tests[] = { make_tuple(64, 64, sad64x64x4d_c, -1), make_tuple(64, 32, sad64x32x4d_c, -1), make_tuple(32, 64, sad32x64x4d_c, -1), make_tuple(32, 32, sad32x32x4d_c, -1), make_tuple(32, 16, sad32x16x4d_c, -1), make_tuple(16, 32, sad16x32x4d_c, -1), make_tuple(16, 16, sad16x16x4d_c, -1), make_tuple(16, 8, sad16x8x4d_c, -1), make_tuple(8, 16, sad8x16x4d_c, -1), make_tuple(8, 8, sad8x8x4d_c, -1), make_tuple(8, 4, sad8x4x4d_c, -1), make_tuple(4, 8, sad4x8x4d_c, -1), make_tuple(4, 4, sad4x4x4d_c, -1), #if CONFIG_VP9_HIGHBITDEPTH make_tuple(64, 64, highbd_sad64x64x4d_c, 8), make_tuple(64, 32, highbd_sad64x32x4d_c, 8), make_tuple(32, 64, highbd_sad32x64x4d_c, 8), make_tuple(32, 32, highbd_sad32x32x4d_c, 8), make_tuple(32, 16, highbd_sad32x16x4d_c, 8), make_tuple(16, 32, highbd_sad16x32x4d_c, 8), make_tuple(16, 16, highbd_sad16x16x4d_c, 8), make_tuple(16, 8, highbd_sad16x8x4d_c, 8), make_tuple(8, 16, highbd_sad8x16x4d_c, 8), make_tuple(8, 8, highbd_sad8x8x4d_c, 8), make_tuple(8, 4, highbd_sad8x4x4d_c, 8), make_tuple(4, 8, highbd_sad4x8x4d_c, 8), make_tuple(4, 4, highbd_sad4x4x4d_c, 8), make_tuple(64, 64, highbd_sad64x64x4d_c, 10), make_tuple(64, 32, highbd_sad64x32x4d_c, 10), make_tuple(32, 64, highbd_sad32x64x4d_c, 10), make_tuple(32, 32, highbd_sad32x32x4d_c, 10), make_tuple(32, 16, highbd_sad32x16x4d_c, 10), make_tuple(16, 32, highbd_sad16x32x4d_c, 10), make_tuple(16, 16, highbd_sad16x16x4d_c, 10), make_tuple(16, 8, highbd_sad16x8x4d_c, 10), make_tuple(8, 16, highbd_sad8x16x4d_c, 10), make_tuple(8, 8, highbd_sad8x8x4d_c, 10), make_tuple(8, 4, highbd_sad8x4x4d_c, 10), make_tuple(4, 8, highbd_sad4x8x4d_c, 10), make_tuple(4, 4, highbd_sad4x4x4d_c, 10), make_tuple(64, 64, highbd_sad64x64x4d_c, 12), make_tuple(64, 32, highbd_sad64x32x4d_c, 12), make_tuple(32, 64, highbd_sad32x64x4d_c, 12), make_tuple(32, 32, highbd_sad32x32x4d_c, 12), make_tuple(32, 16, highbd_sad32x16x4d_c, 12), make_tuple(16, 32, highbd_sad16x32x4d_c, 12), make_tuple(16, 16, highbd_sad16x16x4d_c, 12), make_tuple(16, 8, highbd_sad16x8x4d_c, 12), make_tuple(8, 16, highbd_sad8x16x4d_c, 12), make_tuple(8, 8, highbd_sad8x8x4d_c, 12), make_tuple(8, 4, highbd_sad8x4x4d_c, 12), make_tuple(4, 8, highbd_sad4x8x4d_c, 12), make_tuple(4, 4, highbd_sad4x4x4d_c, 12), #endif // CONFIG_VP9_HIGHBITDEPTH }; INSTANTIATE_TEST_CASE_P(C, SADx4Test, ::testing::ValuesIn(x4d_c_tests)); //------------------------------------------------------------------------------ // ARM functions #if HAVE_MEDIA const SadMxNFunc sad16x16_media = vpx_sad16x16_media; const SadMxNParam media_tests[] = { make_tuple(16, 16, sad16x16_media, -1), }; INSTANTIATE_TEST_CASE_P(MEDIA, SADTest, ::testing::ValuesIn(media_tests)); #endif // HAVE_MEDIA #if HAVE_NEON const SadMxNFunc sad64x64_neon = vpx_sad64x64_neon; const SadMxNFunc sad32x32_neon = vpx_sad32x32_neon; const SadMxNFunc sad16x16_neon = vpx_sad16x16_neon; const SadMxNFunc sad16x8_neon = vpx_sad16x8_neon; const SadMxNFunc sad8x16_neon = vpx_sad8x16_neon; const SadMxNFunc sad8x8_neon = vpx_sad8x8_neon; const SadMxNFunc sad4x4_neon = vpx_sad4x4_neon; const SadMxNParam neon_tests[] = { make_tuple(64, 64, sad64x64_neon, -1), make_tuple(32, 32, sad32x32_neon, -1), make_tuple(16, 16, sad16x16_neon, -1), make_tuple(16, 8, sad16x8_neon, -1), make_tuple(8, 16, sad8x16_neon, -1), make_tuple(8, 8, sad8x8_neon, -1), make_tuple(4, 4, sad4x4_neon, -1), }; INSTANTIATE_TEST_CASE_P(NEON, SADTest, ::testing::ValuesIn(neon_tests)); const SadMxNx4Func sad64x64x4d_neon = vpx_sad64x64x4d_neon; const SadMxNx4Func sad32x32x4d_neon = vpx_sad32x32x4d_neon; const SadMxNx4Func sad16x16x4d_neon = vpx_sad16x16x4d_neon; const SadMxNx4Param x4d_neon_tests[] = { make_tuple(64, 64, sad64x64x4d_neon, -1), make_tuple(32, 32, sad32x32x4d_neon, -1), make_tuple(16, 16, sad16x16x4d_neon, -1), }; INSTANTIATE_TEST_CASE_P(NEON, SADx4Test, ::testing::ValuesIn(x4d_neon_tests)); #endif // HAVE_NEON //------------------------------------------------------------------------------ // x86 functions #if HAVE_MMX const SadMxNFunc sad16x16_mmx = vpx_sad16x16_mmx; const SadMxNFunc sad16x8_mmx = vpx_sad16x8_mmx; const SadMxNFunc sad8x16_mmx = vpx_sad8x16_mmx; const SadMxNFunc sad8x8_mmx = vpx_sad8x8_mmx; const SadMxNFunc sad4x4_mmx = vpx_sad4x4_mmx; const SadMxNParam mmx_tests[] = { make_tuple(16, 16, sad16x16_mmx, -1), make_tuple(16, 8, sad16x8_mmx, -1), make_tuple(8, 16, sad8x16_mmx, -1), make_tuple(8, 8, sad8x8_mmx, -1), make_tuple(4, 4, sad4x4_mmx, -1), }; INSTANTIATE_TEST_CASE_P(MMX, SADTest, ::testing::ValuesIn(mmx_tests)); #endif // HAVE_MMX #if HAVE_SSE #if CONFIG_USE_X86INC const SadMxNFunc sad4x8_sse = vpx_sad4x8_sse; const SadMxNFunc sad4x4_sse = vpx_sad4x4_sse; const SadMxNParam sse_tests[] = { make_tuple(4, 8, sad4x8_sse, -1), make_tuple(4, 4, sad4x4_sse, -1), }; INSTANTIATE_TEST_CASE_P(SSE, SADTest, ::testing::ValuesIn(sse_tests)); const SadMxNAvgFunc sad4x8_avg_sse = vpx_sad4x8_avg_sse; const SadMxNAvgFunc sad4x4_avg_sse = vpx_sad4x4_avg_sse; const SadMxNAvgParam avg_sse_tests[] = { make_tuple(4, 8, sad4x8_avg_sse, -1), make_tuple(4, 4, sad4x4_avg_sse, -1), }; INSTANTIATE_TEST_CASE_P(SSE, SADavgTest, ::testing::ValuesIn(avg_sse_tests)); const SadMxNx4Func sad4x8x4d_sse = vpx_sad4x8x4d_sse; const SadMxNx4Func sad4x4x4d_sse = vpx_sad4x4x4d_sse; const SadMxNx4Param x4d_sse_tests[] = { make_tuple(4, 8, sad4x8x4d_sse, -1), make_tuple(4, 4, sad4x4x4d_sse, -1), }; INSTANTIATE_TEST_CASE_P(SSE, SADx4Test, ::testing::ValuesIn(x4d_sse_tests)); #endif // CONFIG_USE_X86INC #endif // HAVE_SSE #if HAVE_SSE2 #if CONFIG_USE_X86INC const SadMxNFunc sad64x64_sse2 = vpx_sad64x64_sse2; const SadMxNFunc sad64x32_sse2 = vpx_sad64x32_sse2; const SadMxNFunc sad32x64_sse2 = vpx_sad32x64_sse2; const SadMxNFunc sad32x32_sse2 = vpx_sad32x32_sse2; const SadMxNFunc sad32x16_sse2 = vpx_sad32x16_sse2; const SadMxNFunc sad16x32_sse2 = vpx_sad16x32_sse2; const SadMxNFunc sad16x16_sse2 = vpx_sad16x16_sse2; const SadMxNFunc sad16x8_sse2 = vpx_sad16x8_sse2; const SadMxNFunc sad8x16_sse2 = vpx_sad8x16_sse2; const SadMxNFunc sad8x8_sse2 = vpx_sad8x8_sse2; const SadMxNFunc sad8x4_sse2 = vpx_sad8x4_sse2; #if CONFIG_VP9_HIGHBITDEPTH const SadMxNFunc highbd_sad64x64_sse2 = vpx_highbd_sad64x64_sse2; const SadMxNFunc highbd_sad64x32_sse2 = vpx_highbd_sad64x32_sse2; const SadMxNFunc highbd_sad32x64_sse2 = vpx_highbd_sad32x64_sse2; const SadMxNFunc highbd_sad32x32_sse2 = vpx_highbd_sad32x32_sse2; const SadMxNFunc highbd_sad32x16_sse2 = vpx_highbd_sad32x16_sse2; const SadMxNFunc highbd_sad16x32_sse2 = vpx_highbd_sad16x32_sse2; const SadMxNFunc highbd_sad16x16_sse2 = vpx_highbd_sad16x16_sse2; const SadMxNFunc highbd_sad16x8_sse2 = vpx_highbd_sad16x8_sse2; const SadMxNFunc highbd_sad8x16_sse2 = vpx_highbd_sad8x16_sse2; const SadMxNFunc highbd_sad8x8_sse2 = vpx_highbd_sad8x8_sse2; const SadMxNFunc highbd_sad8x4_sse2 = vpx_highbd_sad8x4_sse2; #endif // CONFIG_VP9_HIGHBITDEPTH const SadMxNParam sse2_tests[] = { make_tuple(64, 64, sad64x64_sse2, -1), make_tuple(64, 32, sad64x32_sse2, -1), make_tuple(32, 64, sad32x64_sse2, -1), make_tuple(32, 32, sad32x32_sse2, -1), make_tuple(32, 16, sad32x16_sse2, -1), make_tuple(16, 32, sad16x32_sse2, -1), make_tuple(16, 16, sad16x16_sse2, -1), make_tuple(16, 8, sad16x8_sse2, -1), make_tuple(8, 16, sad8x16_sse2, -1), make_tuple(8, 8, sad8x8_sse2, -1), make_tuple(8, 4, sad8x4_sse2, -1), #if CONFIG_VP9_HIGHBITDEPTH make_tuple(64, 64, highbd_sad64x64_sse2, 8), make_tuple(64, 32, highbd_sad64x32_sse2, 8), make_tuple(32, 64, highbd_sad32x64_sse2, 8), make_tuple(32, 32, highbd_sad32x32_sse2, 8), make_tuple(32, 16, highbd_sad32x16_sse2, 8), make_tuple(16, 32, highbd_sad16x32_sse2, 8), make_tuple(16, 16, highbd_sad16x16_sse2, 8), make_tuple(16, 8, highbd_sad16x8_sse2, 8), make_tuple(8, 16, highbd_sad8x16_sse2, 8), make_tuple(8, 8, highbd_sad8x8_sse2, 8), make_tuple(8, 4, highbd_sad8x4_sse2, 8), make_tuple(64, 64, highbd_sad64x64_sse2, 10), make_tuple(64, 32, highbd_sad64x32_sse2, 10), make_tuple(32, 64, highbd_sad32x64_sse2, 10), make_tuple(32, 32, highbd_sad32x32_sse2, 10), make_tuple(32, 16, highbd_sad32x16_sse2, 10), make_tuple(16, 32, highbd_sad16x32_sse2, 10), make_tuple(16, 16, highbd_sad16x16_sse2, 10), make_tuple(16, 8, highbd_sad16x8_sse2, 10), make_tuple(8, 16, highbd_sad8x16_sse2, 10), make_tuple(8, 8, highbd_sad8x8_sse2, 10), make_tuple(8, 4, highbd_sad8x4_sse2, 10), make_tuple(64, 64, highbd_sad64x64_sse2, 12), make_tuple(64, 32, highbd_sad64x32_sse2, 12), make_tuple(32, 64, highbd_sad32x64_sse2, 12), make_tuple(32, 32, highbd_sad32x32_sse2, 12), make_tuple(32, 16, highbd_sad32x16_sse2, 12), make_tuple(16, 32, highbd_sad16x32_sse2, 12), make_tuple(16, 16, highbd_sad16x16_sse2, 12), make_tuple(16, 8, highbd_sad16x8_sse2, 12), make_tuple(8, 16, highbd_sad8x16_sse2, 12), make_tuple(8, 8, highbd_sad8x8_sse2, 12), make_tuple(8, 4, highbd_sad8x4_sse2, 12), #endif // CONFIG_VP9_HIGHBITDEPTH }; INSTANTIATE_TEST_CASE_P(SSE2, SADTest, ::testing::ValuesIn(sse2_tests)); const SadMxNAvgFunc sad64x64_avg_sse2 = vpx_sad64x64_avg_sse2; const SadMxNAvgFunc sad64x32_avg_sse2 = vpx_sad64x32_avg_sse2; const SadMxNAvgFunc sad32x64_avg_sse2 = vpx_sad32x64_avg_sse2; const SadMxNAvgFunc sad32x32_avg_sse2 = vpx_sad32x32_avg_sse2; const SadMxNAvgFunc sad32x16_avg_sse2 = vpx_sad32x16_avg_sse2; const SadMxNAvgFunc sad16x32_avg_sse2 = vpx_sad16x32_avg_sse2; const SadMxNAvgFunc sad16x16_avg_sse2 = vpx_sad16x16_avg_sse2; const SadMxNAvgFunc sad16x8_avg_sse2 = vpx_sad16x8_avg_sse2; const SadMxNAvgFunc sad8x16_avg_sse2 = vpx_sad8x16_avg_sse2; const SadMxNAvgFunc sad8x8_avg_sse2 = vpx_sad8x8_avg_sse2; const SadMxNAvgFunc sad8x4_avg_sse2 = vpx_sad8x4_avg_sse2; #if CONFIG_VP9_HIGHBITDEPTH const SadMxNAvgFunc highbd_sad64x64_avg_sse2 = vpx_highbd_sad64x64_avg_sse2; const SadMxNAvgFunc highbd_sad64x32_avg_sse2 = vpx_highbd_sad64x32_avg_sse2; const SadMxNAvgFunc highbd_sad32x64_avg_sse2 = vpx_highbd_sad32x64_avg_sse2; const SadMxNAvgFunc highbd_sad32x32_avg_sse2 = vpx_highbd_sad32x32_avg_sse2; const SadMxNAvgFunc highbd_sad32x16_avg_sse2 = vpx_highbd_sad32x16_avg_sse2; const SadMxNAvgFunc highbd_sad16x32_avg_sse2 = vpx_highbd_sad16x32_avg_sse2; const SadMxNAvgFunc highbd_sad16x16_avg_sse2 = vpx_highbd_sad16x16_avg_sse2; const SadMxNAvgFunc highbd_sad16x8_avg_sse2 = vpx_highbd_sad16x8_avg_sse2; const SadMxNAvgFunc highbd_sad8x16_avg_sse2 = vpx_highbd_sad8x16_avg_sse2; const SadMxNAvgFunc highbd_sad8x8_avg_sse2 = vpx_highbd_sad8x8_avg_sse2; const SadMxNAvgFunc highbd_sad8x4_avg_sse2 = vpx_highbd_sad8x4_avg_sse2; #endif // CONFIG_VP9_HIGHBITDEPTH const SadMxNAvgParam avg_sse2_tests[] = { make_tuple(64, 64, sad64x64_avg_sse2, -1), make_tuple(64, 32, sad64x32_avg_sse2, -1), make_tuple(32, 64, sad32x64_avg_sse2, -1), make_tuple(32, 32, sad32x32_avg_sse2, -1), make_tuple(32, 16, sad32x16_avg_sse2, -1), make_tuple(16, 32, sad16x32_avg_sse2, -1), make_tuple(16, 16, sad16x16_avg_sse2, -1), make_tuple(16, 8, sad16x8_avg_sse2, -1), make_tuple(8, 16, sad8x16_avg_sse2, -1), make_tuple(8, 8, sad8x8_avg_sse2, -1), make_tuple(8, 4, sad8x4_avg_sse2, -1), #if CONFIG_VP9_HIGHBITDEPTH make_tuple(64, 64, highbd_sad64x64_avg_sse2, 8), make_tuple(64, 32, highbd_sad64x32_avg_sse2, 8), make_tuple(32, 64, highbd_sad32x64_avg_sse2, 8), make_tuple(32, 32, highbd_sad32x32_avg_sse2, 8), make_tuple(32, 16, highbd_sad32x16_avg_sse2, 8), make_tuple(16, 32, highbd_sad16x32_avg_sse2, 8), make_tuple(16, 16, highbd_sad16x16_avg_sse2, 8), make_tuple(16, 8, highbd_sad16x8_avg_sse2, 8), make_tuple(8, 16, highbd_sad8x16_avg_sse2, 8), make_tuple(8, 8, highbd_sad8x8_avg_sse2, 8), make_tuple(8, 4, highbd_sad8x4_avg_sse2, 8), make_tuple(64, 64, highbd_sad64x64_avg_sse2, 10), make_tuple(64, 32, highbd_sad64x32_avg_sse2, 10), make_tuple(32, 64, highbd_sad32x64_avg_sse2, 10), make_tuple(32, 32, highbd_sad32x32_avg_sse2, 10), make_tuple(32, 16, highbd_sad32x16_avg_sse2, 10), make_tuple(16, 32, highbd_sad16x32_avg_sse2, 10), make_tuple(16, 16, highbd_sad16x16_avg_sse2, 10), make_tuple(16, 8, highbd_sad16x8_avg_sse2, 10), make_tuple(8, 16, highbd_sad8x16_avg_sse2, 10), make_tuple(8, 8, highbd_sad8x8_avg_sse2, 10), make_tuple(8, 4, highbd_sad8x4_avg_sse2, 10), make_tuple(64, 64, highbd_sad64x64_avg_sse2, 12), make_tuple(64, 32, highbd_sad64x32_avg_sse2, 12), make_tuple(32, 64, highbd_sad32x64_avg_sse2, 12), make_tuple(32, 32, highbd_sad32x32_avg_sse2, 12), make_tuple(32, 16, highbd_sad32x16_avg_sse2, 12), make_tuple(16, 32, highbd_sad16x32_avg_sse2, 12), make_tuple(16, 16, highbd_sad16x16_avg_sse2, 12), make_tuple(16, 8, highbd_sad16x8_avg_sse2, 12), make_tuple(8, 16, highbd_sad8x16_avg_sse2, 12), make_tuple(8, 8, highbd_sad8x8_avg_sse2, 12), make_tuple(8, 4, highbd_sad8x4_avg_sse2, 12), #endif // CONFIG_VP9_HIGHBITDEPTH }; INSTANTIATE_TEST_CASE_P(SSE2, SADavgTest, ::testing::ValuesIn(avg_sse2_tests)); const SadMxNx4Func sad64x64x4d_sse2 = vpx_sad64x64x4d_sse2; const SadMxNx4Func sad64x32x4d_sse2 = vpx_sad64x32x4d_sse2; const SadMxNx4Func sad32x64x4d_sse2 = vpx_sad32x64x4d_sse2; const SadMxNx4Func sad32x32x4d_sse2 = vpx_sad32x32x4d_sse2; const SadMxNx4Func sad32x16x4d_sse2 = vpx_sad32x16x4d_sse2; const SadMxNx4Func sad16x32x4d_sse2 = vpx_sad16x32x4d_sse2; const SadMxNx4Func sad16x16x4d_sse2 = vpx_sad16x16x4d_sse2; const SadMxNx4Func sad16x8x4d_sse2 = vpx_sad16x8x4d_sse2; const SadMxNx4Func sad8x16x4d_sse2 = vpx_sad8x16x4d_sse2; const SadMxNx4Func sad8x8x4d_sse2 = vpx_sad8x8x4d_sse2; const SadMxNx4Func sad8x4x4d_sse2 = vpx_sad8x4x4d_sse2; #if CONFIG_VP9_HIGHBITDEPTH const SadMxNx4Func highbd_sad64x64x4d_sse2 = vpx_highbd_sad64x64x4d_sse2; const SadMxNx4Func highbd_sad64x32x4d_sse2 = vpx_highbd_sad64x32x4d_sse2; const SadMxNx4Func highbd_sad32x64x4d_sse2 = vpx_highbd_sad32x64x4d_sse2; const SadMxNx4Func highbd_sad32x32x4d_sse2 = vpx_highbd_sad32x32x4d_sse2; const SadMxNx4Func highbd_sad32x16x4d_sse2 = vpx_highbd_sad32x16x4d_sse2; const SadMxNx4Func highbd_sad16x32x4d_sse2 = vpx_highbd_sad16x32x4d_sse2; const SadMxNx4Func highbd_sad16x16x4d_sse2 = vpx_highbd_sad16x16x4d_sse2; const SadMxNx4Func highbd_sad16x8x4d_sse2 = vpx_highbd_sad16x8x4d_sse2; const SadMxNx4Func highbd_sad8x16x4d_sse2 = vpx_highbd_sad8x16x4d_sse2; const SadMxNx4Func highbd_sad8x8x4d_sse2 = vpx_highbd_sad8x8x4d_sse2; const SadMxNx4Func highbd_sad8x4x4d_sse2 = vpx_highbd_sad8x4x4d_sse2; const SadMxNx4Func highbd_sad4x8x4d_sse2 = vpx_highbd_sad4x8x4d_sse2; const SadMxNx4Func highbd_sad4x4x4d_sse2 = vpx_highbd_sad4x4x4d_sse2; #endif // CONFIG_VP9_HIGHBITDEPTH const SadMxNx4Param x4d_sse2_tests[] = { make_tuple(64, 64, sad64x64x4d_sse2, -1), make_tuple(64, 32, sad64x32x4d_sse2, -1), make_tuple(32, 64, sad32x64x4d_sse2, -1), make_tuple(32, 32, sad32x32x4d_sse2, -1), make_tuple(32, 16, sad32x16x4d_sse2, -1), make_tuple(16, 32, sad16x32x4d_sse2, -1), make_tuple(16, 16, sad16x16x4d_sse2, -1), make_tuple(16, 8, sad16x8x4d_sse2, -1), make_tuple(8, 16, sad8x16x4d_sse2, -1), make_tuple(8, 8, sad8x8x4d_sse2, -1), make_tuple(8, 4, sad8x4x4d_sse2, -1), #if CONFIG_VP9_HIGHBITDEPTH make_tuple(64, 64, highbd_sad64x64x4d_sse2, 8), make_tuple(64, 32, highbd_sad64x32x4d_sse2, 8), make_tuple(32, 64, highbd_sad32x64x4d_sse2, 8), make_tuple(32, 32, highbd_sad32x32x4d_sse2, 8), make_tuple(32, 16, highbd_sad32x16x4d_sse2, 8), make_tuple(16, 32, highbd_sad16x32x4d_sse2, 8), make_tuple(16, 16, highbd_sad16x16x4d_sse2, 8), make_tuple(16, 8, highbd_sad16x8x4d_sse2, 8), make_tuple(8, 16, highbd_sad8x16x4d_sse2, 8), make_tuple(8, 8, highbd_sad8x8x4d_sse2, 8), make_tuple(8, 4, highbd_sad8x4x4d_sse2, 8), make_tuple(4, 8, highbd_sad4x8x4d_sse2, 8), make_tuple(4, 4, highbd_sad4x4x4d_sse2, 8), make_tuple(64, 64, highbd_sad64x64x4d_sse2, 10), make_tuple(64, 32, highbd_sad64x32x4d_sse2, 10), make_tuple(32, 64, highbd_sad32x64x4d_sse2, 10), make_tuple(32, 32, highbd_sad32x32x4d_sse2, 10), make_tuple(32, 16, highbd_sad32x16x4d_sse2, 10), make_tuple(16, 32, highbd_sad16x32x4d_sse2, 10), make_tuple(16, 16, highbd_sad16x16x4d_sse2, 10), make_tuple(16, 8, highbd_sad16x8x4d_sse2, 10), make_tuple(8, 16, highbd_sad8x16x4d_sse2, 10), make_tuple(8, 8, highbd_sad8x8x4d_sse2, 10), make_tuple(8, 4, highbd_sad8x4x4d_sse2, 10), make_tuple(4, 8, highbd_sad4x8x4d_sse2, 10), make_tuple(4, 4, highbd_sad4x4x4d_sse2, 10), make_tuple(64, 64, highbd_sad64x64x4d_sse2, 12), make_tuple(64, 32, highbd_sad64x32x4d_sse2, 12), make_tuple(32, 64, highbd_sad32x64x4d_sse2, 12), make_tuple(32, 32, highbd_sad32x32x4d_sse2, 12), make_tuple(32, 16, highbd_sad32x16x4d_sse2, 12), make_tuple(16, 32, highbd_sad16x32x4d_sse2, 12), make_tuple(16, 16, highbd_sad16x16x4d_sse2, 12), make_tuple(16, 8, highbd_sad16x8x4d_sse2, 12), make_tuple(8, 16, highbd_sad8x16x4d_sse2, 12), make_tuple(8, 8, highbd_sad8x8x4d_sse2, 12), make_tuple(8, 4, highbd_sad8x4x4d_sse2, 12), make_tuple(4, 8, highbd_sad4x8x4d_sse2, 12), make_tuple(4, 4, highbd_sad4x4x4d_sse2, 12), #endif // CONFIG_VP9_HIGHBITDEPTH }; INSTANTIATE_TEST_CASE_P(SSE2, SADx4Test, ::testing::ValuesIn(x4d_sse2_tests)); #endif // CONFIG_USE_X86INC #endif // HAVE_SSE2 #if HAVE_SSE3 // Only functions are x3, which do not have tests. #endif // HAVE_SSE3 #if HAVE_SSSE3 // Only functions are x3, which do not have tests. #endif // HAVE_SSSE3 #if HAVE_SSE4_1 // Only functions are x8, which do not have tests. #endif // HAVE_SSE4_1 #if HAVE_AVX2 const SadMxNFunc sad64x64_avx2 = vpx_sad64x64_avx2; const SadMxNFunc sad64x32_avx2 = vpx_sad64x32_avx2; const SadMxNFunc sad32x64_avx2 = vpx_sad32x64_avx2; const SadMxNFunc sad32x32_avx2 = vpx_sad32x32_avx2; const SadMxNFunc sad32x16_avx2 = vpx_sad32x16_avx2; const SadMxNParam avx2_tests[] = { make_tuple(64, 64, sad64x64_avx2, -1), make_tuple(64, 32, sad64x32_avx2, -1), make_tuple(32, 64, sad32x64_avx2, -1), make_tuple(32, 32, sad32x32_avx2, -1), make_tuple(32, 16, sad32x16_avx2, -1), }; INSTANTIATE_TEST_CASE_P(AVX2, SADTest, ::testing::ValuesIn(avx2_tests)); const SadMxNAvgFunc sad64x64_avg_avx2 = vpx_sad64x64_avg_avx2; const SadMxNAvgFunc sad64x32_avg_avx2 = vpx_sad64x32_avg_avx2; const SadMxNAvgFunc sad32x64_avg_avx2 = vpx_sad32x64_avg_avx2; const SadMxNAvgFunc sad32x32_avg_avx2 = vpx_sad32x32_avg_avx2; const SadMxNAvgFunc sad32x16_avg_avx2 = vpx_sad32x16_avg_avx2; const SadMxNAvgParam avg_avx2_tests[] = { make_tuple(64, 64, sad64x64_avg_avx2, -1), make_tuple(64, 32, sad64x32_avg_avx2, -1), make_tuple(32, 64, sad32x64_avg_avx2, -1), make_tuple(32, 32, sad32x32_avg_avx2, -1), make_tuple(32, 16, sad32x16_avg_avx2, -1), }; INSTANTIATE_TEST_CASE_P(AVX2, SADavgTest, ::testing::ValuesIn(avg_avx2_tests)); const SadMxNx4Func sad64x64x4d_avx2 = vpx_sad64x64x4d_avx2; const SadMxNx4Func sad32x32x4d_avx2 = vpx_sad32x32x4d_avx2; const SadMxNx4Param x4d_avx2_tests[] = { make_tuple(64, 64, sad64x64x4d_avx2, -1), make_tuple(32, 32, sad32x32x4d_avx2, -1), }; INSTANTIATE_TEST_CASE_P(AVX2, SADx4Test, ::testing::ValuesIn(x4d_avx2_tests)); #endif // HAVE_AVX2 } // namespace