/* * Copyright (c) 2018, Alliance for Open Media. All rights reserved * * This source code is subject to the terms of the BSD 2 Clause License and * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License * was not distributed with this source code in the LICENSE file, you can * obtain it at www.aomedia.org/license/software. If the Alliance for Open * Media Patent License 1.0 was not distributed with this source code in the * PATENTS file, you can obtain it at www.aomedia.org/license/patent. */ #include "third_party/googletest/src/googletest/include/gtest/gtest.h" #include "config/aom_config.h" #include "config/aom_dsp_rtcd.h" #include "aom_mem/aom_mem.h" #include "aom_ports/aom_timer.h" #include "av1/common/blockd.h" #include "av1/common/pred_common.h" #include "av1/common/reconintra.h" #include "test/acm_random.h" #include "test/clear_system_state.h" #include "test/register_state_check.h" #include "test/util.h" namespace { const int kZ1Start = 0; const int kZ2Start = 90; const int kZ3Start = 180; const TX_SIZE kTxSize[] = { TX_4X4, TX_8X8, TX_16X16, TX_32X32, TX_64X64, TX_4X8, TX_8X4, TX_8X16, TX_16X8, TX_16X32, TX_32X16, TX_32X64, TX_64X32, TX_4X16, TX_16X4, TX_8X32, TX_32X8, TX_16X64, TX_64X16 }; const char *const kTxSizeStrings[] = { "TX_4X4", "TX_8X8", "TX_16X16", "TX_32X32", "TX_64X64", "TX_4X8", "TX_8X4", "TX_8X16", "TX_16X8", "TX_16X32", "TX_32X16", "TX_32X64", "TX_64X32", "TX_4X16", "TX_16X4", "TX_8X32", "TX_32X8", "TX_16X64", "TX_64X16" }; using libaom_test::ACMRandom; typedef void (*DrPred_Hbd)(uint16_t *dst, ptrdiff_t stride, int bw, int bh, const uint16_t *above, const uint16_t *left, int upsample_above, int upsample_left, int dx, int dy, int bd); typedef void (*DrPred)(uint8_t *dst, ptrdiff_t stride, int bw, int bh, const uint8_t *above, const uint8_t *left, int upsample_above, int upsample_left, int dx, int dy, int bd); typedef void (*Z1_Lbd)(uint8_t *dst, ptrdiff_t stride, int bw, int bh, const uint8_t *above, const uint8_t *left, int upsample_above, int dx, int dy); template void z1_wrapper(uint8_t *dst, ptrdiff_t stride, int bw, int bh, const uint8_t *above, const uint8_t *left, int upsample_above, int /*upsample_left*/, int dx, int dy, int /*bd*/) { fn(dst, stride, bw, bh, above, left, upsample_above, dx, dy); } typedef void (*Z2_Lbd)(uint8_t *dst, ptrdiff_t stride, int bw, int bh, const uint8_t *above, const uint8_t *left, int upsample_above, int upsample_left, int dx, int dy); template void z2_wrapper(uint8_t *dst, ptrdiff_t stride, int bw, int bh, const uint8_t *above, const uint8_t *left, int upsample_above, int upsample_left, int dx, int dy, int /*bd*/) { fn(dst, stride, bw, bh, above, left, upsample_above, upsample_left, dx, dy); } typedef void (*Z3_Lbd)(uint8_t *dst, ptrdiff_t stride, int bw, int bh, const uint8_t *above, const uint8_t *left, int upsample_left, int dx, int dy); template void z3_wrapper(uint8_t *dst, ptrdiff_t stride, int bw, int bh, const uint8_t *above, const uint8_t *left, int /*upsample_above*/, int upsample_left, int dx, int dy, int /*bd*/) { fn(dst, stride, bw, bh, above, left, upsample_left, dx, dy); } typedef void (*Z1_Hbd)(uint16_t *dst, ptrdiff_t stride, int bw, int bh, const uint16_t *above, const uint16_t *left, int upsample_above, int dx, int dy, int bd); template void z1_wrapper_hbd(uint16_t *dst, ptrdiff_t stride, int bw, int bh, const uint16_t *above, const uint16_t *left, int upsample_above, int /*upsample_left*/, int dx, int dy, int bd) { fn(dst, stride, bw, bh, above, left, upsample_above, dx, dy, bd); } typedef void (*Z2_Hbd)(uint16_t *dst, ptrdiff_t stride, int bw, int bh, const uint16_t *above, const uint16_t *left, int upsample_above, int upsample_left, int dx, int dy, int bd); template void z2_wrapper_hbd(uint16_t *dst, ptrdiff_t stride, int bw, int bh, const uint16_t *above, const uint16_t *left, int upsample_above, int upsample_left, int dx, int dy, int bd) { fn(dst, stride, bw, bh, above, left, upsample_above, upsample_left, dx, dy, bd); } typedef void (*Z3_Hbd)(uint16_t *dst, ptrdiff_t stride, int bw, int bh, const uint16_t *above, const uint16_t *left, int upsample_left, int dx, int dy, int bd); template void z3_wrapper_hbd(uint16_t *dst, ptrdiff_t stride, int bw, int bh, const uint16_t *above, const uint16_t *left, int /*upsample_above*/, int upsample_left, int dx, int dy, int bd) { fn(dst, stride, bw, bh, above, left, upsample_left, dx, dy, bd); } template struct DrPredFunc { DrPredFunc(FuncType pred = NULL, FuncType tst = NULL, int bit_depth_value = 0, int start_angle_value = 0) : ref_fn(pred), tst_fn(tst), bit_depth(bit_depth_value), start_angle(start_angle_value) {} FuncType ref_fn; FuncType tst_fn; int bit_depth; int start_angle; }; template class DrPredTest : public ::testing::TestWithParam > { protected: static const int kMaxNumTests = 100000; static const int kIterations = 10; static const int kDstStride = 64; static const int kDstSize = kDstStride * kDstStride; static const int kOffset = 16; static const int kBufSize = ((2 * MAX_TX_SIZE) << 1) + 16; DrPredTest() : enable_upsample_(0), upsample_above_(0), upsample_left_(0), bw_(0), bh_(0), dx_(1), dy_(1), bd_(8), txsize_(TX_4X4) { params_ = this->GetParam(); start_angle_ = params_.start_angle; stop_angle_ = start_angle_ + 90; dst_ref_ = &dst_ref_data_[0]; dst_tst_ = &dst_tst_data_[0]; dst_stride_ = kDstStride; above_ = &above_data_[kOffset]; left_ = &left_data_[kOffset]; for (int i = 0; i < kBufSize; ++i) { above_data_[i] = rng_.Rand8(); left_data_[i] = rng_.Rand8(); } for (int i = 0; i < kDstSize; ++i) { dst_ref_[i] = 0; } } virtual ~DrPredTest() {} void Predict(bool speedtest, int tx) { const int kNumTests = speedtest ? kMaxNumTests : 1; aom_usec_timer timer; aom_usec_timer_start(&timer); for (int k = 0; k < kNumTests; ++k) { params_.ref_fn(dst_ref_, dst_stride_, bw_, bh_, above_, left_, upsample_above_, upsample_left_, dx_, dy_, bd_); } aom_usec_timer_mark(&timer); const int ref_time = static_cast(aom_usec_timer_elapsed(&timer)); aom_usec_timer_start(&timer); if (params_.tst_fn) { for (int k = 0; k < kNumTests; ++k) { ASM_REGISTER_STATE_CHECK(params_.tst_fn(dst_tst_, dst_stride_, bw_, bh_, above_, left_, upsample_above_, upsample_left_, dx_, dy_, bd_)); } } aom_usec_timer_mark(&timer); const int tst_time = static_cast(aom_usec_timer_elapsed(&timer)); OutputTimes(kNumTests, ref_time, tst_time, tx); } void RunTest(bool speedtest, int p_angle) { for (int i = 0; i < kBufSize; ++i) { above_data_[i] = left_data_[i] = (1 << bd_) - 1; } for (int tx = 0; tx < TX_SIZES_ALL; ++tx) { if (params_.tst_fn == NULL) { for (int i = 0; i < kDstSize; ++i) { dst_tst_[i] = (1 << bd_) - 1; } } else { for (int i = 0; i < kDstSize; ++i) { dst_tst_[i] = 0; } } bw_ = tx_size_wide[kTxSize[tx]]; bh_ = tx_size_high[kTxSize[tx]]; if (enable_upsample_) { upsample_above_ = av1_use_intra_edge_upsample(bw_, bh_, p_angle - 90, 0); upsample_left_ = av1_use_intra_edge_upsample(bw_, bh_, p_angle - 180, 0); } else { upsample_above_ = upsample_left_ = 0; } Predict(speedtest, tx); for (int r = 0; r < bh_; ++r) { for (int c = 0; c < bw_; ++c) { ASSERT_EQ(dst_ref_[r * dst_stride_ + c], dst_tst_[r * dst_stride_ + c]) << bw_ << "x" << bh_ << " r: " << r << " c: " << c << " dx: " << dx_ << " dy: " << dy_ << " upsample_above: " << upsample_above_ << " upsample_left: " << upsample_left_; } } } } void OutputTimes(int num_tests, int ref_time, int tst_time, int tx) { if (num_tests > 1) { if (params_.tst_fn) { const float x = static_cast(ref_time) / tst_time; printf("\t[%8s] :: ref time %6d, tst time %6d %3.2f\n", kTxSizeStrings[tx], ref_time, tst_time, x); } else { printf("\t[%8s] :: ref time %6d\n", kTxSizeStrings[tx], ref_time); } } } Pixel dst_ref_data_[kDstSize]; Pixel dst_tst_data_[kDstSize]; Pixel left_data_[kBufSize]; Pixel dummy_data_[kBufSize]; Pixel above_data_[kBufSize]; Pixel *dst_ref_; Pixel *dst_tst_; Pixel *above_; Pixel *left_; int dst_stride_; int enable_upsample_; int upsample_above_; int upsample_left_; int bw_; int bh_; int dx_; int dy_; int bd_; TX_SIZE txsize_; int start_angle_; int stop_angle_; ACMRandom rng_; DrPredFunc params_; }; class LowbdDrPredTest : public DrPredTest {}; TEST_P(LowbdDrPredTest, SaturatedValues) { for (int iter = 0; iter < kIterations && !HasFatalFailure(); ++iter) { enable_upsample_ = iter & 1; for (int angle = start_angle_; angle < stop_angle_; ++angle) { dx_ = av1_get_dx(angle); dy_ = av1_get_dy(angle); if (dx_ && dy_) RunTest(false, angle); } } } TEST_P(LowbdDrPredTest, DISABLED_Speed) { const int angles[] = { 3, 45, 87 }; for (enable_upsample_ = 0; enable_upsample_ < 2; ++enable_upsample_) { for (int i = 0; i < 3; ++i) { const int angle = angles[i] + start_angle_; dx_ = av1_get_dx(angle); dy_ = av1_get_dy(angle); printf("enable_upsample: %d angle: %d ~~~~~~~~~~~~~~~\n", enable_upsample_, angle); if (dx_ && dy_) RunTest(true, angle); } } } using ::testing::make_tuple; INSTANTIATE_TEST_CASE_P( C, LowbdDrPredTest, ::testing::Values(DrPredFunc(&z1_wrapper, NULL, AOM_BITS_8, kZ1Start), DrPredFunc(&z2_wrapper, NULL, AOM_BITS_8, kZ2Start), DrPredFunc(&z3_wrapper, NULL, AOM_BITS_8, kZ3Start))); class HighbdDrPredTest : public DrPredTest {}; TEST_P(HighbdDrPredTest, SaturatedValues) { for (int iter = 0; iter < kIterations && !HasFatalFailure(); ++iter) { enable_upsample_ = iter & 1; for (int angle = start_angle_; angle < stop_angle_; ++angle) { dx_ = av1_get_dx(angle); dy_ = av1_get_dy(angle); if (dx_ && dy_) RunTest(false, angle); } } } TEST_P(HighbdDrPredTest, DISABLED_Speed) { const int angles[] = { 3, 45, 87 }; for (enable_upsample_ = 0; enable_upsample_ < 2; ++enable_upsample_) { for (int i = 0; i < 3; ++i) { const int angle = angles[i] + start_angle_; dx_ = av1_get_dx(angle); dy_ = av1_get_dy(angle); printf("enable_upsample: %d angle: %d ~~~~~~~~~~~~~~~\n", enable_upsample_, angle); if (dx_ && dy_) RunTest(true, angle); } } } INSTANTIATE_TEST_CASE_P( C, HighbdDrPredTest, ::testing::Values( DrPredFunc(&z1_wrapper_hbd, NULL, AOM_BITS_8, kZ1Start), DrPredFunc(&z1_wrapper_hbd, NULL, AOM_BITS_10, kZ1Start), DrPredFunc(&z1_wrapper_hbd, NULL, AOM_BITS_12, kZ1Start), DrPredFunc(&z2_wrapper_hbd, NULL, AOM_BITS_8, kZ2Start), DrPredFunc(&z2_wrapper_hbd, NULL, AOM_BITS_10, kZ2Start), DrPredFunc(&z2_wrapper_hbd, NULL, AOM_BITS_12, kZ2Start), DrPredFunc(&z3_wrapper_hbd, NULL, AOM_BITS_8, kZ3Start), DrPredFunc(&z3_wrapper_hbd, NULL, AOM_BITS_10, kZ3Start), DrPredFunc(&z3_wrapper_hbd, NULL, AOM_BITS_12, kZ3Start))); } // namespace