/*
 * Copyright (c) 2017, Alliance for Open Media. All rights reserved.
 *
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */
11*77c1e3ccSAndroid Build Coastguard Worker
12*77c1e3ccSAndroid Build Coastguard Worker #include <stdint.h>
13*77c1e3ccSAndroid Build Coastguard Worker #include <stdio.h>
14*77c1e3ccSAndroid Build Coastguard Worker #include <string.h>
15*77c1e3ccSAndroid Build Coastguard Worker #include <tuple>
16*77c1e3ccSAndroid Build Coastguard Worker
17*77c1e3ccSAndroid Build Coastguard Worker #include "config/aom_config.h"
18*77c1e3ccSAndroid Build Coastguard Worker #include "config/av1_rtcd.h"
19*77c1e3ccSAndroid Build Coastguard Worker
20*77c1e3ccSAndroid Build Coastguard Worker #include "aom_ports/mem.h"
21*77c1e3ccSAndroid Build Coastguard Worker #include "av1/common/scan.h"
22*77c1e3ccSAndroid Build Coastguard Worker #include "av1/common/txb_common.h"
23*77c1e3ccSAndroid Build Coastguard Worker #include "gtest/gtest.h"
24*77c1e3ccSAndroid Build Coastguard Worker #include "test/acm_random.h"
25*77c1e3ccSAndroid Build Coastguard Worker #include "test/register_state_check.h"
26*77c1e3ccSAndroid Build Coastguard Worker #include "test/util.h"
27*77c1e3ccSAndroid Build Coastguard Worker
28*77c1e3ccSAndroid Build Coastguard Worker namespace {
29*77c1e3ccSAndroid Build Coastguard Worker using libaom_test::ACMRandom;
30*77c1e3ccSAndroid Build Coastguard Worker
31*77c1e3ccSAndroid Build Coastguard Worker using BuildCompDiffWtdMaskFunc = void (*)(uint8_t *mask,
32*77c1e3ccSAndroid Build Coastguard Worker DIFFWTD_MASK_TYPE mask_type,
33*77c1e3ccSAndroid Build Coastguard Worker const uint8_t *src0, int src0_stride,
34*77c1e3ccSAndroid Build Coastguard Worker const uint8_t *src1, int src1_stride,
35*77c1e3ccSAndroid Build Coastguard Worker int h, int w);
36*77c1e3ccSAndroid Build Coastguard Worker
37*77c1e3ccSAndroid Build Coastguard Worker using BuildCompDiffwtdMaskDParam =
38*77c1e3ccSAndroid Build Coastguard Worker std::tuple<BLOCK_SIZE, BuildCompDiffWtdMaskFunc>;
39*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_SSE4_1 || HAVE_AVX2 || HAVE_NEON
// Returns the parameter generator for one implementation: every block size in
// the half-open range [BLOCK_4X4, BLOCK_SIZES_ALL) combined with `filter`.
::testing::internal::ParamGenerator<BuildCompDiffwtdMaskDParam> BuildParams(
    BuildCompDiffWtdMaskFunc filter) {
  return ::testing::Combine(::testing::Range(BLOCK_4X4, BLOCK_SIZES_ALL),
                            ::testing::Values(filter));
}
#endif
47*77c1e3ccSAndroid Build Coastguard Worker
48*77c1e3ccSAndroid Build Coastguard Worker class BuildCompDiffwtdMaskTest
49*77c1e3ccSAndroid Build Coastguard Worker : public ::testing::TestWithParam<BuildCompDiffwtdMaskDParam> {
50*77c1e3ccSAndroid Build Coastguard Worker public:
BuildCompDiffwtdMaskTest()51*77c1e3ccSAndroid Build Coastguard Worker BuildCompDiffwtdMaskTest() : rnd_(ACMRandom::DeterministicSeed()) {}
52*77c1e3ccSAndroid Build Coastguard Worker ~BuildCompDiffwtdMaskTest() override = default;
53*77c1e3ccSAndroid Build Coastguard Worker
54*77c1e3ccSAndroid Build Coastguard Worker protected:
RunTest(BuildCompDiffWtdMaskFunc test_impl,bool is_speed,const DIFFWTD_MASK_TYPE type)55*77c1e3ccSAndroid Build Coastguard Worker void RunTest(BuildCompDiffWtdMaskFunc test_impl, bool is_speed,
56*77c1e3ccSAndroid Build Coastguard Worker const DIFFWTD_MASK_TYPE type) {
57*77c1e3ccSAndroid Build Coastguard Worker const int sb_type = GET_PARAM(0);
58*77c1e3ccSAndroid Build Coastguard Worker const int width = block_size_wide[sb_type];
59*77c1e3ccSAndroid Build Coastguard Worker const int height = block_size_high[sb_type];
60*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, mask_ref[MAX_SB_SQUARE]);
61*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, mask_test[MAX_SB_SQUARE]);
62*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, src0[MAX_SB_SQUARE]);
63*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, src1[MAX_SB_SQUARE]);
64*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < width * height; i++) {
65*77c1e3ccSAndroid Build Coastguard Worker src0[i] = rnd_.Rand8();
66*77c1e3ccSAndroid Build Coastguard Worker src1[i] = rnd_.Rand8();
67*77c1e3ccSAndroid Build Coastguard Worker }
68*77c1e3ccSAndroid Build Coastguard Worker const int run_times = is_speed ? (10000000 / (width + height)) : 1;
69*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer;
70*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer);
71*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < run_times; ++i) {
72*77c1e3ccSAndroid Build Coastguard Worker av1_build_compound_diffwtd_mask_c(mask_ref, type, src0, width, src1,
73*77c1e3ccSAndroid Build Coastguard Worker width, height, width);
74*77c1e3ccSAndroid Build Coastguard Worker }
75*77c1e3ccSAndroid Build Coastguard Worker const double t1 = get_time_mark(&timer);
76*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer);
77*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < run_times; ++i) {
78*77c1e3ccSAndroid Build Coastguard Worker test_impl(mask_test, type, src0, width, src1, width, height, width);
79*77c1e3ccSAndroid Build Coastguard Worker }
80*77c1e3ccSAndroid Build Coastguard Worker const double t2 = get_time_mark(&timer);
81*77c1e3ccSAndroid Build Coastguard Worker if (is_speed) {
82*77c1e3ccSAndroid Build Coastguard Worker printf("mask %d %3dx%-3d:%7.2f/%7.2fns", type, width, height, t1, t2);
83*77c1e3ccSAndroid Build Coastguard Worker printf("(%3.2f)\n", t1 / t2);
84*77c1e3ccSAndroid Build Coastguard Worker }
85*77c1e3ccSAndroid Build Coastguard Worker for (int r = 0; r < height; ++r) {
86*77c1e3ccSAndroid Build Coastguard Worker for (int c = 0; c < width; ++c) {
87*77c1e3ccSAndroid Build Coastguard Worker ASSERT_EQ(mask_ref[c + r * width], mask_test[c + r * width])
88*77c1e3ccSAndroid Build Coastguard Worker << "[" << r << "," << c << "] " << run_times << " @ " << width
89*77c1e3ccSAndroid Build Coastguard Worker << "x" << height << " inv " << type;
90*77c1e3ccSAndroid Build Coastguard Worker }
91*77c1e3ccSAndroid Build Coastguard Worker }
92*77c1e3ccSAndroid Build Coastguard Worker }
93*77c1e3ccSAndroid Build Coastguard Worker
94*77c1e3ccSAndroid Build Coastguard Worker private:
95*77c1e3ccSAndroid Build Coastguard Worker ACMRandom rnd_;
96*77c1e3ccSAndroid Build Coastguard Worker };
97*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BuildCompDiffwtdMaskTest);
98*77c1e3ccSAndroid Build Coastguard Worker
// Correctness check (single run, no timing output) for both mask types.
TEST_P(BuildCompDiffwtdMaskTest, match) {
  RunTest(GET_PARAM(1), /*is_speed=*/false, DIFFWTD_38);
  RunTest(GET_PARAM(1), /*is_speed=*/false, DIFFWTD_38_INV);
}
// Timing run for both mask types. The DISABLED_ prefix keeps it out of the
// default test run.
TEST_P(BuildCompDiffwtdMaskTest, DISABLED_Speed) {
  RunTest(GET_PARAM(1), /*is_speed=*/true, DIFFWTD_38);
  RunTest(GET_PARAM(1), /*is_speed=*/true, DIFFWTD_38_INV);
}
107*77c1e3ccSAndroid Build Coastguard Worker
// One instantiation per SIMD variant that the build configuration enables.
#if HAVE_SSE4_1
INSTANTIATE_TEST_SUITE_P(SSE4_1, BuildCompDiffwtdMaskTest,
                         BuildParams(av1_build_compound_diffwtd_mask_sse4_1));
#endif

#if HAVE_AVX2
INSTANTIATE_TEST_SUITE_P(AVX2, BuildCompDiffwtdMaskTest,
                         BuildParams(av1_build_compound_diffwtd_mask_avx2));
#endif

#if HAVE_NEON
INSTANTIATE_TEST_SUITE_P(NEON, BuildCompDiffwtdMaskTest,
                         BuildParams(av1_build_compound_diffwtd_mask_neon));
#endif
122*77c1e3ccSAndroid Build Coastguard Worker
123*77c1e3ccSAndroid Build Coastguard Worker #if CONFIG_AV1_HIGHBITDEPTH
124*77c1e3ccSAndroid Build Coastguard Worker
125*77c1e3ccSAndroid Build Coastguard Worker using BuildCompDiffWtdMaskHighbdFunc =
126*77c1e3ccSAndroid Build Coastguard Worker void (*)(uint8_t *mask, DIFFWTD_MASK_TYPE mask_type, const uint8_t *src0,
127*77c1e3ccSAndroid Build Coastguard Worker int src0_stride, const uint8_t *src1, int src1_stride, int h,
128*77c1e3ccSAndroid Build Coastguard Worker int w, int bd);
129*77c1e3ccSAndroid Build Coastguard Worker
130*77c1e3ccSAndroid Build Coastguard Worker using BuildCompDiffwtdMaskHighbdParam =
131*77c1e3ccSAndroid Build Coastguard Worker std::tuple<BLOCK_SIZE, int, BuildCompDiffWtdMaskHighbdFunc>;
132*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_SSSE3 || HAVE_AVX2 || HAVE_NEON
// Returns the parameter generator for one high-bitdepth implementation: every
// block size in [BLOCK_4X4, BLOCK_SIZES_ALL) x bit depths {8, 10, 12} x
// `filter`.
::testing::internal::ParamGenerator<BuildCompDiffwtdMaskHighbdParam>
BuildParamsHighbd(BuildCompDiffWtdMaskHighbdFunc filter) {
  return ::testing::Combine(::testing::Range(BLOCK_4X4, BLOCK_SIZES_ALL),
                            ::testing::Values(8, 10, 12),
                            ::testing::Values(filter));
}
#endif
141*77c1e3ccSAndroid Build Coastguard Worker
142*77c1e3ccSAndroid Build Coastguard Worker class BuildCompDiffwtdMaskHighbdTest
143*77c1e3ccSAndroid Build Coastguard Worker : public ::testing::TestWithParam<BuildCompDiffwtdMaskHighbdParam> {
144*77c1e3ccSAndroid Build Coastguard Worker public:
BuildCompDiffwtdMaskHighbdTest()145*77c1e3ccSAndroid Build Coastguard Worker BuildCompDiffwtdMaskHighbdTest() : rnd_(ACMRandom::DeterministicSeed()) {}
146*77c1e3ccSAndroid Build Coastguard Worker ~BuildCompDiffwtdMaskHighbdTest() override = default;
147*77c1e3ccSAndroid Build Coastguard Worker
148*77c1e3ccSAndroid Build Coastguard Worker protected:
RunTest(BuildCompDiffWtdMaskHighbdFunc test_impl,bool is_speed,const DIFFWTD_MASK_TYPE type)149*77c1e3ccSAndroid Build Coastguard Worker void RunTest(BuildCompDiffWtdMaskHighbdFunc test_impl, bool is_speed,
150*77c1e3ccSAndroid Build Coastguard Worker const DIFFWTD_MASK_TYPE type) {
151*77c1e3ccSAndroid Build Coastguard Worker const int sb_type = GET_PARAM(0);
152*77c1e3ccSAndroid Build Coastguard Worker const int bd = GET_PARAM(1);
153*77c1e3ccSAndroid Build Coastguard Worker const int width = block_size_wide[sb_type];
154*77c1e3ccSAndroid Build Coastguard Worker const int height = block_size_high[sb_type];
155*77c1e3ccSAndroid Build Coastguard Worker const int mask = (1 << bd) - 1;
156*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, mask_ref[MAX_SB_SQUARE]);
157*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, mask_test[MAX_SB_SQUARE]);
158*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint16_t, src0[MAX_SB_SQUARE]);
159*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint16_t, src1[MAX_SB_SQUARE]);
160*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < width * height; i++) {
161*77c1e3ccSAndroid Build Coastguard Worker src0[i] = rnd_.Rand16() & mask;
162*77c1e3ccSAndroid Build Coastguard Worker src1[i] = rnd_.Rand16() & mask;
163*77c1e3ccSAndroid Build Coastguard Worker }
164*77c1e3ccSAndroid Build Coastguard Worker const int run_times = is_speed ? (10000000 / (width + height)) : 1;
165*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer;
166*77c1e3ccSAndroid Build Coastguard Worker
167*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer);
168*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < run_times; ++i) {
169*77c1e3ccSAndroid Build Coastguard Worker uint8_t *src0_8 = CONVERT_TO_BYTEPTR(src0);
170*77c1e3ccSAndroid Build Coastguard Worker uint8_t *src1_8 = CONVERT_TO_BYTEPTR(src1);
171*77c1e3ccSAndroid Build Coastguard Worker av1_build_compound_diffwtd_mask_highbd_c(
172*77c1e3ccSAndroid Build Coastguard Worker mask_ref, type, src0_8, width, src1_8, width, height, width, bd);
173*77c1e3ccSAndroid Build Coastguard Worker }
174*77c1e3ccSAndroid Build Coastguard Worker const double t1 = get_time_mark(&timer);
175*77c1e3ccSAndroid Build Coastguard Worker
176*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer);
177*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < run_times; ++i) {
178*77c1e3ccSAndroid Build Coastguard Worker uint8_t *src0_8 = CONVERT_TO_BYTEPTR(src0);
179*77c1e3ccSAndroid Build Coastguard Worker uint8_t *src1_8 = CONVERT_TO_BYTEPTR(src1);
180*77c1e3ccSAndroid Build Coastguard Worker test_impl(mask_test, type, src0_8, width, src1_8, width, height, width,
181*77c1e3ccSAndroid Build Coastguard Worker bd);
182*77c1e3ccSAndroid Build Coastguard Worker }
183*77c1e3ccSAndroid Build Coastguard Worker const double t2 = get_time_mark(&timer);
184*77c1e3ccSAndroid Build Coastguard Worker
185*77c1e3ccSAndroid Build Coastguard Worker if (is_speed) {
186*77c1e3ccSAndroid Build Coastguard Worker printf("mask %d %3dx%-3d:%7.2f/%7.2fns", type, width, height, t1, t2);
187*77c1e3ccSAndroid Build Coastguard Worker printf("(%3.2f)\n", t1 / t2);
188*77c1e3ccSAndroid Build Coastguard Worker }
189*77c1e3ccSAndroid Build Coastguard Worker for (int r = 0; r < height; ++r) {
190*77c1e3ccSAndroid Build Coastguard Worker for (int c = 0; c < width; ++c) {
191*77c1e3ccSAndroid Build Coastguard Worker ASSERT_EQ(mask_ref[c + r * width], mask_test[c + r * width])
192*77c1e3ccSAndroid Build Coastguard Worker << "[" << r << "," << c << "] " << run_times << " @ " << width
193*77c1e3ccSAndroid Build Coastguard Worker << "x" << height << " inv " << type;
194*77c1e3ccSAndroid Build Coastguard Worker }
195*77c1e3ccSAndroid Build Coastguard Worker }
196*77c1e3ccSAndroid Build Coastguard Worker }
197*77c1e3ccSAndroid Build Coastguard Worker
198*77c1e3ccSAndroid Build Coastguard Worker private:
199*77c1e3ccSAndroid Build Coastguard Worker ACMRandom rnd_;
200*77c1e3ccSAndroid Build Coastguard Worker };
201*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BuildCompDiffwtdMaskHighbdTest);
202*77c1e3ccSAndroid Build Coastguard Worker
// Correctness check (single run, no timing output) for both mask types.
TEST_P(BuildCompDiffwtdMaskHighbdTest, match) {
  RunTest(GET_PARAM(2), /*is_speed=*/false, DIFFWTD_38);
  RunTest(GET_PARAM(2), /*is_speed=*/false, DIFFWTD_38_INV);
}
// Timing run for both mask types. The DISABLED_ prefix keeps it out of the
// default test run.
TEST_P(BuildCompDiffwtdMaskHighbdTest, DISABLED_Speed) {
  RunTest(GET_PARAM(2), /*is_speed=*/true, DIFFWTD_38);
  RunTest(GET_PARAM(2), /*is_speed=*/true, DIFFWTD_38_INV);
}
211*77c1e3ccSAndroid Build Coastguard Worker
// One instantiation per SIMD variant that the build configuration enables.
#if HAVE_SSSE3
INSTANTIATE_TEST_SUITE_P(
    SSSE3, BuildCompDiffwtdMaskHighbdTest,
    BuildParamsHighbd(av1_build_compound_diffwtd_mask_highbd_ssse3));
#endif

#if HAVE_AVX2
INSTANTIATE_TEST_SUITE_P(
    AVX2, BuildCompDiffwtdMaskHighbdTest,
    BuildParamsHighbd(av1_build_compound_diffwtd_mask_highbd_avx2));
#endif

#if HAVE_NEON
INSTANTIATE_TEST_SUITE_P(
    NEON, BuildCompDiffwtdMaskHighbdTest,
    BuildParamsHighbd(av1_build_compound_diffwtd_mask_highbd_neon));
#endif
229*77c1e3ccSAndroid Build Coastguard Worker #endif // CONFIG_AV1_HIGHBITDEPTH
230*77c1e3ccSAndroid Build Coastguard Worker
231*77c1e3ccSAndroid Build Coastguard Worker using BuildCompDiffWtdMaskD16Func = void (*)(
232*77c1e3ccSAndroid Build Coastguard Worker uint8_t *mask, DIFFWTD_MASK_TYPE mask_type, const CONV_BUF_TYPE *src0,
233*77c1e3ccSAndroid Build Coastguard Worker int src0_stride, const CONV_BUF_TYPE *src1, int src1_stride, int h, int w,
234*77c1e3ccSAndroid Build Coastguard Worker ConvolveParams *conv_params, int bd);
235*77c1e3ccSAndroid Build Coastguard Worker
236*77c1e3ccSAndroid Build Coastguard Worker using BuildCompDiffwtdMaskD16Param =
237*77c1e3ccSAndroid Build Coastguard Worker std::tuple<int, BuildCompDiffWtdMaskD16Func, BLOCK_SIZE>;
238*77c1e3ccSAndroid Build Coastguard Worker
#if HAVE_SSE4_1 || HAVE_AVX2 || HAVE_NEON
// Returns the parameter generator for one d16 implementation: bit depths
// 8, 10 and 12 (Range(8, 13, 2)) x `filter` x every block size in
// [BLOCK_4X4, BLOCK_SIZES_ALL).
::testing::internal::ParamGenerator<BuildCompDiffwtdMaskD16Param> BuildParams(
    BuildCompDiffWtdMaskD16Func filter) {
  return ::testing::Combine(::testing::Range(8, 13, 2),
                            ::testing::Values(filter),
                            ::testing::Range(BLOCK_4X4, BLOCK_SIZES_ALL));
}
#endif
247*77c1e3ccSAndroid Build Coastguard Worker
248*77c1e3ccSAndroid Build Coastguard Worker class BuildCompDiffwtdMaskD16Test
249*77c1e3ccSAndroid Build Coastguard Worker : public ::testing::TestWithParam<BuildCompDiffwtdMaskD16Param> {
250*77c1e3ccSAndroid Build Coastguard Worker public:
BuildCompDiffwtdMaskD16Test()251*77c1e3ccSAndroid Build Coastguard Worker BuildCompDiffwtdMaskD16Test() : rnd_(ACMRandom::DeterministicSeed()) {}
252*77c1e3ccSAndroid Build Coastguard Worker ~BuildCompDiffwtdMaskD16Test() override = default;
253*77c1e3ccSAndroid Build Coastguard Worker
254*77c1e3ccSAndroid Build Coastguard Worker protected:
RunCheckOutput(BuildCompDiffWtdMaskD16Func test_impl)255*77c1e3ccSAndroid Build Coastguard Worker void RunCheckOutput(BuildCompDiffWtdMaskD16Func test_impl) {
256*77c1e3ccSAndroid Build Coastguard Worker const int block_idx = GET_PARAM(2);
257*77c1e3ccSAndroid Build Coastguard Worker const int bd = GET_PARAM(0);
258*77c1e3ccSAndroid Build Coastguard Worker const int width = block_size_wide[block_idx];
259*77c1e3ccSAndroid Build Coastguard Worker const int height = block_size_high[block_idx];
260*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, mask_ref[2 * MAX_SB_SQUARE]);
261*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, mask_test[2 * MAX_SB_SQUARE]);
262*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(32, uint16_t, src0[MAX_SB_SQUARE]);
263*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(32, uint16_t, src1[MAX_SB_SQUARE]);
264*77c1e3ccSAndroid Build Coastguard Worker
265*77c1e3ccSAndroid Build Coastguard Worker ConvolveParams conv_params =
266*77c1e3ccSAndroid Build Coastguard Worker get_conv_params_no_round(0, 0, nullptr, 0, 1, bd);
267*77c1e3ccSAndroid Build Coastguard Worker
268*77c1e3ccSAndroid Build Coastguard Worker const int in_precision =
269*77c1e3ccSAndroid Build Coastguard Worker bd + 2 * FILTER_BITS - conv_params.round_0 - conv_params.round_1 + 2;
270*77c1e3ccSAndroid Build Coastguard Worker
271*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < MAX_SB_SQUARE; i++) {
272*77c1e3ccSAndroid Build Coastguard Worker src0[i] = rnd_.Rand16() & ((1 << in_precision) - 1);
273*77c1e3ccSAndroid Build Coastguard Worker src1[i] = rnd_.Rand16() & ((1 << in_precision) - 1);
274*77c1e3ccSAndroid Build Coastguard Worker }
275*77c1e3ccSAndroid Build Coastguard Worker
276*77c1e3ccSAndroid Build Coastguard Worker for (int mask_type = 0; mask_type < DIFFWTD_MASK_TYPES; mask_type++) {
277*77c1e3ccSAndroid Build Coastguard Worker av1_build_compound_diffwtd_mask_d16_c(
278*77c1e3ccSAndroid Build Coastguard Worker mask_ref, (DIFFWTD_MASK_TYPE)mask_type, src0, width, src1, width,
279*77c1e3ccSAndroid Build Coastguard Worker height, width, &conv_params, bd);
280*77c1e3ccSAndroid Build Coastguard Worker
281*77c1e3ccSAndroid Build Coastguard Worker test_impl(mask_test, (DIFFWTD_MASK_TYPE)mask_type, src0, width, src1,
282*77c1e3ccSAndroid Build Coastguard Worker width, height, width, &conv_params, bd);
283*77c1e3ccSAndroid Build Coastguard Worker
284*77c1e3ccSAndroid Build Coastguard Worker for (int r = 0; r < height; ++r) {
285*77c1e3ccSAndroid Build Coastguard Worker for (int c = 0; c < width; ++c) {
286*77c1e3ccSAndroid Build Coastguard Worker ASSERT_EQ(mask_ref[c + r * width], mask_test[c + r * width])
287*77c1e3ccSAndroid Build Coastguard Worker << "Mismatch at unit tests for BuildCompDiffwtdMaskD16Test\n"
288*77c1e3ccSAndroid Build Coastguard Worker << " Pixel mismatch at index "
289*77c1e3ccSAndroid Build Coastguard Worker << "[" << r << "," << c << "] "
290*77c1e3ccSAndroid Build Coastguard Worker << " @ " << width << "x" << height << " inv " << mask_type;
291*77c1e3ccSAndroid Build Coastguard Worker }
292*77c1e3ccSAndroid Build Coastguard Worker }
293*77c1e3ccSAndroid Build Coastguard Worker }
294*77c1e3ccSAndroid Build Coastguard Worker }
295*77c1e3ccSAndroid Build Coastguard Worker
RunSpeedTest(BuildCompDiffWtdMaskD16Func test_impl,DIFFWTD_MASK_TYPE mask_type)296*77c1e3ccSAndroid Build Coastguard Worker void RunSpeedTest(BuildCompDiffWtdMaskD16Func test_impl,
297*77c1e3ccSAndroid Build Coastguard Worker DIFFWTD_MASK_TYPE mask_type) {
298*77c1e3ccSAndroid Build Coastguard Worker const int block_idx = GET_PARAM(2);
299*77c1e3ccSAndroid Build Coastguard Worker const int bd = GET_PARAM(0);
300*77c1e3ccSAndroid Build Coastguard Worker const int width = block_size_wide[block_idx];
301*77c1e3ccSAndroid Build Coastguard Worker const int height = block_size_high[block_idx];
302*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(16, uint8_t, mask[MAX_SB_SQUARE]);
303*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(32, uint16_t, src0[MAX_SB_SQUARE]);
304*77c1e3ccSAndroid Build Coastguard Worker DECLARE_ALIGNED(32, uint16_t, src1[MAX_SB_SQUARE]);
305*77c1e3ccSAndroid Build Coastguard Worker
306*77c1e3ccSAndroid Build Coastguard Worker ConvolveParams conv_params =
307*77c1e3ccSAndroid Build Coastguard Worker get_conv_params_no_round(0, 0, nullptr, 0, 1, bd);
308*77c1e3ccSAndroid Build Coastguard Worker
309*77c1e3ccSAndroid Build Coastguard Worker const int in_precision =
310*77c1e3ccSAndroid Build Coastguard Worker bd + 2 * FILTER_BITS - conv_params.round_0 - conv_params.round_1 + 2;
311*77c1e3ccSAndroid Build Coastguard Worker
312*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < MAX_SB_SQUARE; i++) {
313*77c1e3ccSAndroid Build Coastguard Worker src0[i] = rnd_.Rand16() & ((1 << in_precision) - 1);
314*77c1e3ccSAndroid Build Coastguard Worker src1[i] = rnd_.Rand16() & ((1 << in_precision) - 1);
315*77c1e3ccSAndroid Build Coastguard Worker }
316*77c1e3ccSAndroid Build Coastguard Worker
317*77c1e3ccSAndroid Build Coastguard Worker const int num_loops = 10000000 / (width + height);
318*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer;
319*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer);
320*77c1e3ccSAndroid Build Coastguard Worker
321*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < num_loops; ++i)
322*77c1e3ccSAndroid Build Coastguard Worker av1_build_compound_diffwtd_mask_d16_c(mask, mask_type, src0, width, src1,
323*77c1e3ccSAndroid Build Coastguard Worker width, height, width, &conv_params,
324*77c1e3ccSAndroid Build Coastguard Worker bd);
325*77c1e3ccSAndroid Build Coastguard Worker
326*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&timer);
327*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time = static_cast<int>(aom_usec_timer_elapsed(&timer));
328*77c1e3ccSAndroid Build Coastguard Worker
329*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer timer1;
330*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_start(&timer1);
331*77c1e3ccSAndroid Build Coastguard Worker
332*77c1e3ccSAndroid Build Coastguard Worker for (int i = 0; i < num_loops; ++i)
333*77c1e3ccSAndroid Build Coastguard Worker test_impl(mask, mask_type, src0, width, src1, width, height, width,
334*77c1e3ccSAndroid Build Coastguard Worker &conv_params, bd);
335*77c1e3ccSAndroid Build Coastguard Worker
336*77c1e3ccSAndroid Build Coastguard Worker aom_usec_timer_mark(&timer1);
337*77c1e3ccSAndroid Build Coastguard Worker const int elapsed_time1 = static_cast<int>(aom_usec_timer_elapsed(&timer1));
338*77c1e3ccSAndroid Build Coastguard Worker printf("av1_build_compound_diffwtd_mask_d16 %3dx%-3d: %7.2f \n", width,
339*77c1e3ccSAndroid Build Coastguard Worker height, elapsed_time / double(elapsed_time1));
340*77c1e3ccSAndroid Build Coastguard Worker }
341*77c1e3ccSAndroid Build Coastguard Worker
342*77c1e3ccSAndroid Build Coastguard Worker private:
343*77c1e3ccSAndroid Build Coastguard Worker ACMRandom rnd_;
344*77c1e3ccSAndroid Build Coastguard Worker }; // class BuildCompDiffwtdMaskD16Test
345*77c1e3ccSAndroid Build Coastguard Worker GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(BuildCompDiffwtdMaskD16Test);
346*77c1e3ccSAndroid Build Coastguard Worker
// Correctness check of the implementation supplied as test parameter 1.
TEST_P(BuildCompDiffwtdMaskD16Test, CheckOutput) {
  RunCheckOutput(GET_PARAM(1));
}
350*77c1e3ccSAndroid Build Coastguard Worker
// Timing run for both mask types. The DISABLED_ prefix keeps it out of the
// default test run.
TEST_P(BuildCompDiffwtdMaskD16Test, DISABLED_Speed) {
  RunSpeedTest(GET_PARAM(1), DIFFWTD_38);
  RunSpeedTest(GET_PARAM(1), DIFFWTD_38_INV);
}
355*77c1e3ccSAndroid Build Coastguard Worker
// One instantiation per SIMD variant that the build configuration enables.
#if HAVE_SSE4_1
INSTANTIATE_TEST_SUITE_P(
    SSE4_1, BuildCompDiffwtdMaskD16Test,
    BuildParams(av1_build_compound_diffwtd_mask_d16_sse4_1));
#endif

#if HAVE_AVX2
INSTANTIATE_TEST_SUITE_P(AVX2, BuildCompDiffwtdMaskD16Test,
                         BuildParams(av1_build_compound_diffwtd_mask_d16_avx2));
#endif

#if HAVE_NEON
INSTANTIATE_TEST_SUITE_P(NEON, BuildCompDiffwtdMaskD16Test,
                         BuildParams(av1_build_compound_diffwtd_mask_d16_neon));
#endif
371*77c1e3ccSAndroid Build Coastguard Worker
372*77c1e3ccSAndroid Build Coastguard Worker } // namespace
373