/* * Copyright (c) 2017, Alliance for Open Media. All rights reserved * * This source code is subject to the terms of the BSD 2 Clause License and * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License * was not distributed with this source code in the LICENSE file, you can * obtain it at www.aomedia.org/license/software. If the Alliance for Open * Media Patent License 1.0 was not distributed with this source code in the * PATENTS file, you can obtain it at www.aomedia.org/license/patent. */ #include #include #include #include "config/aom_config.h" #include "config/av1_rtcd.h" #include "aom_ports/mem.h" #include "av1/common/scan.h" #include "av1/common/txb_common.h" #include "test/acm_random.h" #include "test/clear_system_state.h" #include "test/register_state_check.h" #include "test/util.h" #include "third_party/googletest/src/googletest/include/gtest/gtest.h" namespace { using libaom_test::ACMRandom; typedef void (*buildcompdiffwtdmaskd_func)(uint8_t *mask, DIFFWTD_MASK_TYPE mask_type, const uint8_t *src0, int src0_stride, const uint8_t *src1, int src1_stride, int h, int w); typedef ::testing::tuple BuildCompDiffwtdMaskDParam; #if HAVE_SSE4_1 ::testing::internal::ParamGenerator BuildParams( buildcompdiffwtdmaskd_func filter) { return ::testing::Combine(::testing::Range(BLOCK_4X4, BLOCK_SIZES_ALL), ::testing::Values(filter)); } #endif class BuildCompDiffwtdMaskTest : public ::testing::TestWithParam { public: virtual ~BuildCompDiffwtdMaskTest() {} virtual void TearDown() { libaom_test::ClearSystemState(); } void RunTest(buildcompdiffwtdmaskd_func test_impl, const int is_speed, const DIFFWTD_MASK_TYPE type); private: ACMRandom rnd_; }; typedef void (*buildcompdiffwtdmaskd16_func)( uint8_t *mask, DIFFWTD_MASK_TYPE mask_type, const CONV_BUF_TYPE *src0, int src0_stride, const CONV_BUF_TYPE *src1, int src1_stride, int h, int w, ConvolveParams *conv_params, int bd); typedef ::testing::tuple BuildCompDiffwtdMaskD16Param; #if HAVE_SSE4_1 || HAVE_NEON ::testing::internal::ParamGenerator BuildParams( buildcompdiffwtdmaskd16_func filter) { return ::testing::Combine(::testing::Range(8, 13, 2), ::testing::Values(filter), ::testing::Range(BLOCK_4X4, BLOCK_SIZES_ALL)); } #endif class BuildCompDiffwtdMaskD16Test : public ::testing::TestWithParam { public: ~BuildCompDiffwtdMaskD16Test() {} virtual void TearDown() { libaom_test::ClearSystemState(); } void SetUp() { rnd_.Reset(ACMRandom::DeterministicSeed()); } protected: void RunCheckOutput(buildcompdiffwtdmaskd16_func test_impl); void RunSpeedTest(buildcompdiffwtdmaskd16_func test_impl, DIFFWTD_MASK_TYPE mask_type); libaom_test::ACMRandom rnd_; }; // class BuildCompDiffwtdMaskD16Test void BuildCompDiffwtdMaskD16Test::RunCheckOutput( buildcompdiffwtdmaskd16_func test_impl) { const int block_idx = GET_PARAM(2); const int bd = GET_PARAM(0); const int width = block_size_wide[block_idx]; const int height = block_size_high[block_idx]; DECLARE_ALIGNED(16, uint8_t, mask_ref[2 * MAX_SB_SQUARE]); DECLARE_ALIGNED(16, uint8_t, mask_test[2 * MAX_SB_SQUARE]); DECLARE_ALIGNED(32, uint16_t, src0[MAX_SB_SQUARE]); DECLARE_ALIGNED(32, uint16_t, src1[MAX_SB_SQUARE]); ConvolveParams conv_params = get_conv_params_no_round(0, 0, NULL, 0, 1, bd); int in_precision = bd + 2 * FILTER_BITS - conv_params.round_0 - conv_params.round_1 + 2; for (int i = 0; i < MAX_SB_SQUARE; i++) { src0[i] = rnd_.Rand16() & ((1 << in_precision) - 1); src1[i] = rnd_.Rand16() & ((1 << in_precision) - 1); } for (int mask_type = 0; mask_type < DIFFWTD_MASK_TYPES; mask_type++) { av1_build_compound_diffwtd_mask_d16_c( mask_ref, (DIFFWTD_MASK_TYPE)mask_type, src0, width, src1, width, height, width, &conv_params, bd); test_impl(mask_test, (DIFFWTD_MASK_TYPE)mask_type, src0, width, src1, width, height, width, &conv_params, bd); for (int r = 0; r < height; ++r) { for (int c = 0; c < width; ++c) { ASSERT_EQ(mask_ref[c + r * width], mask_test[c + r * width]) << "Mismatch at unit tests for BuildCompDiffwtdMaskD16Test\n" << " Pixel mismatch at index " << "[" << r << "," << c << "] " << " @ " << width << "x" << height << " inv " << mask_type; } } } } void BuildCompDiffwtdMaskD16Test::RunSpeedTest( buildcompdiffwtdmaskd16_func test_impl, DIFFWTD_MASK_TYPE mask_type) { const int block_idx = GET_PARAM(2); const int bd = GET_PARAM(0); const int width = block_size_wide[block_idx]; const int height = block_size_high[block_idx]; DECLARE_ALIGNED(16, uint8_t, mask[MAX_SB_SQUARE]); DECLARE_ALIGNED(32, uint16_t, src0[MAX_SB_SQUARE]); DECLARE_ALIGNED(32, uint16_t, src1[MAX_SB_SQUARE]); ConvolveParams conv_params = get_conv_params_no_round(0, 0, NULL, 0, 1, bd); int in_precision = bd + 2 * FILTER_BITS - conv_params.round_0 - conv_params.round_1 + 2; for (int i = 0; i < MAX_SB_SQUARE; i++) { src0[i] = rnd_.Rand16() & ((1 << in_precision) - 1); src1[i] = rnd_.Rand16() & ((1 << in_precision) - 1); } const int num_loops = 10000000 / (width + height); aom_usec_timer timer; aom_usec_timer_start(&timer); for (int i = 0; i < num_loops; ++i) av1_build_compound_diffwtd_mask_d16_c(mask, mask_type, src0, width, src1, width, height, width, &conv_params, bd); aom_usec_timer_mark(&timer); const int elapsed_time = static_cast(aom_usec_timer_elapsed(&timer)); aom_usec_timer timer1; aom_usec_timer_start(&timer1); for (int i = 0; i < num_loops; ++i) test_impl(mask, mask_type, src0, width, src1, width, height, width, &conv_params, bd); aom_usec_timer_mark(&timer1); const int elapsed_time1 = static_cast(aom_usec_timer_elapsed(&timer1)); printf("av1_build_compound_diffwtd_mask_d16 %3dx%-3d: %7.2f \n", width, height, elapsed_time / double(elapsed_time1)); } #if HAVE_SSE4_1 void BuildCompDiffwtdMaskTest::RunTest(buildcompdiffwtdmaskd_func test_impl, const int is_speed, const DIFFWTD_MASK_TYPE type) { const int sb_type = GET_PARAM(0); const int width = block_size_wide[sb_type]; const int height = block_size_high[sb_type]; DECLARE_ALIGNED(16, uint8_t, mask_ref[MAX_SB_SQUARE]); DECLARE_ALIGNED(16, uint8_t, mask_test[MAX_SB_SQUARE]); DECLARE_ALIGNED(16, uint8_t, src0[MAX_SB_SQUARE]); DECLARE_ALIGNED(16, uint8_t, src1[MAX_SB_SQUARE]); ACMRandom rnd(ACMRandom::DeterministicSeed()); for (int i = 0; i < width * height; i++) { src0[i] = rnd.Rand8(); src1[i] = rnd.Rand8(); } const int run_times = is_speed ? (10000000 / (width + height)) : 1; aom_usec_timer timer; aom_usec_timer_start(&timer); for (int i = 0; i < run_times; ++i) { av1_build_compound_diffwtd_mask_c(mask_ref, type, src0, width, src1, width, height, width); } const double t1 = get_time_mark(&timer); aom_usec_timer_start(&timer); for (int i = 0; i < run_times; ++i) { test_impl(mask_test, type, src0, width, src1, width, height, width); } const double t2 = get_time_mark(&timer); if (is_speed) { printf("mask %d %3dx%-3d:%7.2f/%7.2fns", type, width, height, t1, t2); printf("(%3.2f)\n", t1 / t2); } for (int r = 0; r < height; ++r) { for (int c = 0; c < width; ++c) { ASSERT_EQ(mask_ref[c + r * width], mask_test[c + r * width]) << "[" << r << "," << c << "] " << run_times << " @ " << width << "x" << height << " inv " << type; } } } TEST_P(BuildCompDiffwtdMaskTest, match) { RunTest(GET_PARAM(1), 0, DIFFWTD_38); RunTest(GET_PARAM(1), 0, DIFFWTD_38_INV); } TEST_P(BuildCompDiffwtdMaskTest, DISABLED_Speed) { RunTest(GET_PARAM(1), 1, DIFFWTD_38); RunTest(GET_PARAM(1), 1, DIFFWTD_38_INV); } #endif TEST_P(BuildCompDiffwtdMaskD16Test, CheckOutput) { RunCheckOutput(GET_PARAM(1)); } TEST_P(BuildCompDiffwtdMaskD16Test, DISABLED_Speed) { RunSpeedTest(GET_PARAM(1), DIFFWTD_38); RunSpeedTest(GET_PARAM(1), DIFFWTD_38_INV); } #if HAVE_SSE4_1 INSTANTIATE_TEST_CASE_P(SSE4_1, BuildCompDiffwtdMaskTest, BuildParams(av1_build_compound_diffwtd_mask_sse4_1)); INSTANTIATE_TEST_CASE_P( SSE4_1, BuildCompDiffwtdMaskD16Test, BuildParams(av1_build_compound_diffwtd_mask_d16_sse4_1)); #endif #if HAVE_AVX2 INSTANTIATE_TEST_CASE_P(AVX2, BuildCompDiffwtdMaskTest, BuildParams(av1_build_compound_diffwtd_mask_avx2)); INSTANTIATE_TEST_CASE_P(AVX2, BuildCompDiffwtdMaskD16Test, BuildParams(av1_build_compound_diffwtd_mask_d16_avx2)); #endif #if HAVE_NEON INSTANTIATE_TEST_CASE_P(NEON, BuildCompDiffwtdMaskD16Test, BuildParams(av1_build_compound_diffwtd_mask_d16_neon)); #endif } // namespace