1*c217d954SCole Faust /*
2*c217d954SCole Faust * Copyright (c) 2019-2022 Arm Limited.
3*c217d954SCole Faust *
4*c217d954SCole Faust * SPDX-License-Identifier: MIT
5*c217d954SCole Faust *
6*c217d954SCole Faust * Permission is hereby granted, free of charge, to any person obtaining a copy
7*c217d954SCole Faust * of this software and associated documentation files (the "Software"), to
8*c217d954SCole Faust * deal in the Software without restriction, including without limitation the
9*c217d954SCole Faust * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10*c217d954SCole Faust * sell copies of the Software, and to permit persons to whom the Software is
11*c217d954SCole Faust * furnished to do so, subject to the following conditions:
12*c217d954SCole Faust *
13*c217d954SCole Faust * The above copyright notice and this permission notice shall be included in all
14*c217d954SCole Faust * copies or substantial portions of the Software.
15*c217d954SCole Faust *
16*c217d954SCole Faust * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17*c217d954SCole Faust * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18*c217d954SCole Faust * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19*c217d954SCole Faust * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20*c217d954SCole Faust * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21*c217d954SCole Faust * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22*c217d954SCole Faust * SOFTWARE.
23*c217d954SCole Faust */
24*c217d954SCole Faust #include "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.h"
25*c217d954SCole Faust #include "tests/NEON/Accessor.h"
26*c217d954SCole Faust #include "tests/NEON/Helper.h"
27*c217d954SCole Faust #include "tests/framework/Macros.h"
28*c217d954SCole Faust #include "tests/framework/datasets/Datasets.h"
29*c217d954SCole Faust #include "tests/validation/Validation.h"
30*c217d954SCole Faust #include "tests/validation/fixtures/DepthwiseConvolutionLayerFixture.h"
31*c217d954SCole Faust
32*c217d954SCole Faust namespace arm_compute
33*c217d954SCole Faust {
34*c217d954SCole Faust namespace test
35*c217d954SCole Faust {
36*c217d954SCole Faust namespace validation
37*c217d954SCole Faust {
38*c217d954SCole Faust using namespace arm_compute::misc::shape_calculator;
39*c217d954SCole Faust
40*c217d954SCole Faust // Create function for CpuDepthwiseConvolutionKernel
41*c217d954SCole Faust using CpuDepthwiseConvolutionNative = NESynthetizeFunctionWithZeroConstantKernelBorder<cpu::kernels::CpuDepthwiseConv2dNativeKernel>;
42*c217d954SCole Faust
43*c217d954SCole Faust // Fixture for NEDepthwiseConvolutionLayerKernel
44*c217d954SCole Faust template <typename T>
45*c217d954SCole Faust using CpuDepthwiseConvolutionNativeFixture = DepthwiseConvolutionLayerNativeValidationFixture<Tensor, Accessor, CpuDepthwiseConvolutionNative, T>;
46*c217d954SCole Faust
47*c217d954SCole Faust namespace
48*c217d954SCole Faust {
49*c217d954SCole Faust // *INDENT-OFF*
50*c217d954SCole Faust // clang-format off
51*c217d954SCole Faust RelativeTolerance<float> rel_tolerance_f32(0.001f);
52*c217d954SCole Faust constexpr float abs_tolerance_f32(0.0001f);
53*c217d954SCole Faust
54*c217d954SCole Faust /** Width values to test - Precommit */
55*c217d954SCole Faust const auto width_values_precommit = framework::dataset::make("width", { 17U } );
56*c217d954SCole Faust
57*c217d954SCole Faust /** Width values to test - Nightly */
58*c217d954SCole Faust const auto width_values_nightly = framework::dataset::make("width", { 53U, 47U } );
59*c217d954SCole Faust
60*c217d954SCole Faust /** Height values to test - Precommit */
61*c217d954SCole Faust const auto height_values_precommit = framework::dataset::make("height", { 19U } );
62*c217d954SCole Faust
63*c217d954SCole Faust /** Height values to test - Nightly */
64*c217d954SCole Faust const auto height_values_nightly = framework::dataset::make("height", { 39U, 43U } );
65*c217d954SCole Faust
66*c217d954SCole Faust /** Channel values to test - Precommit */
67*c217d954SCole Faust const auto channel_values_precommit = framework::dataset::make("channels", { 15U });
68*c217d954SCole Faust
69*c217d954SCole Faust /** Channel values to test - Nightly */
70*c217d954SCole Faust const auto channel_values_nightly = framework::dataset::make("channels", { 33U, 19U });
71*c217d954SCole Faust
72*c217d954SCole Faust /** Batch values to test - Precommit */
73*c217d954SCole Faust const auto batch_values_precommit = framework::dataset::make("batch", { 1U, 2U });
74*c217d954SCole Faust
75*c217d954SCole Faust /** Batch values to test - Nightly */
76*c217d954SCole Faust const auto batch_values_nightly = framework::dataset::make("batch", { 1U, 3U });
77*c217d954SCole Faust
78*c217d954SCole Faust /** Kernel size values to test - Precommit */
79*c217d954SCole Faust const auto kernel_sz_values_precommit = framework::dataset::make("kernel_size", { Size2D(1U, 1U), Size2D(1U, 3U) });
80*c217d954SCole Faust
81*c217d954SCole Faust /** Kernel size values to test - Nightly */
82*c217d954SCole Faust const auto kernel_sz_values_nightly = framework::dataset::make("kernel_size", { Size2D(3U, 5U), Size2D(5U, 1U), Size2D(1U, 7U), Size2D(9U, 7U) });
83*c217d954SCole Faust
84*c217d954SCole Faust /** Depth multiplier values to test - All */
85*c217d954SCole Faust const auto depth_multiplier_values = framework::dataset::make("depth_multiplier", { 1U, 3U });
86*c217d954SCole Faust
87*c217d954SCole Faust /** Dilation values to test - All */
88*c217d954SCole Faust const auto dilation_values = framework::dataset::make("dilation", { Size2D(1U, 1U), Size2D(3U, 3U) });
89*c217d954SCole Faust
90*c217d954SCole Faust /** Stride values to test - All */
91*c217d954SCole Faust const auto stride_values = framework::dataset::make("stride", { Size2D(1U, 1U), Size2D(3U, 2U) });
92*c217d954SCole Faust
93*c217d954SCole Faust /** Padding values to test - All */
94*c217d954SCole Faust const auto padding_valid_values = framework::dataset::make("padding_valid", { true, false });
95*c217d954SCole Faust
96*c217d954SCole Faust /** Data type values to test - All */
97*c217d954SCole Faust const auto data_type_values = framework::dataset::make("data_type", { DataType::F32 });
98*c217d954SCole Faust
99*c217d954SCole Faust /** Data layout values to test - All */
100*c217d954SCole Faust const auto data_layout_values = framework::dataset::make("data_layout", { DataLayout::NHWC });
101*c217d954SCole Faust } // namespace
102*c217d954SCole Faust
103*c217d954SCole Faust TEST_SUITE(NEON)
TEST_SUITE(DepthwiseConvolutionLayerNative)104*c217d954SCole Faust TEST_SUITE(DepthwiseConvolutionLayerNative)
105*c217d954SCole Faust
106*c217d954SCole Faust TEST_CASE(ValidateNoPadding, framework::DatasetMode::ALL)
107*c217d954SCole Faust {
108*c217d954SCole Faust // this test case will ensure that the kernel is not adding implicit padding
109*c217d954SCole Faust constexpr uint32_t vector_size = 8; // Asummed vector size of the current native kernel
110*c217d954SCole Faust constexpr auto depth = vector_size * 2 + 1; // mis-aligned depth to force padding if exists.
111*c217d954SCole Faust constexpr auto data_layout = DataLayout::NHWC;
112*c217d954SCole Faust constexpr auto data_type = DataType::F32;
113*c217d954SCole Faust
114*c217d954SCole Faust const auto input_size = Size2D{ 100, 100 }; // random plane size of the input
115*c217d954SCole Faust const auto kernel_size = Size2D{ 4, 4 }; // random plane size of the kernel
116*c217d954SCole Faust const auto pad_stride_info = PadStrideInfo(3, 3); // random convolution information to
117*c217d954SCole Faust
118*c217d954SCole Faust TensorShape src_shape{ depth, input_size.x(), input_size.y() };
119*c217d954SCole Faust TensorShape weights_shape{ depth, kernel_size.x(), kernel_size.y() };
120*c217d954SCole Faust TensorShape bias_shape{ depth };
121*c217d954SCole Faust
122*c217d954SCole Faust auto src = create_tensor<Tensor>(src_shape, data_type, 1, QuantizationInfo(), data_layout);
123*c217d954SCole Faust auto weights = create_tensor<Tensor>(weights_shape, data_type, 1, QuantizationInfo(), data_layout);
124*c217d954SCole Faust auto biases = create_tensor<Tensor>(bias_shape, data_type, 1, QuantizationInfo(), data_layout);
125*c217d954SCole Faust auto dst = create_tensor<Tensor>(TensorShape(), data_type, 1, QuantizationInfo(), data_layout);
126*c217d954SCole Faust
127*c217d954SCole Faust cpu::kernels::CpuDepthwiseConv2dNativeKernel dwc;
128*c217d954SCole Faust const ConvolutionInfo info{pad_stride_info, 1, ActivationLayerInfo(), Size2D(1, 1)};
129*c217d954SCole Faust dwc.configure(src.info(), weights.info(), biases.info(), dst.info(), info);
130*c217d954SCole Faust
131*c217d954SCole Faust ARM_COMPUTE_EXPECT(src.info()->padding().empty(), framework::LogLevel::ERRORS);
132*c217d954SCole Faust ARM_COMPUTE_EXPECT(weights.info()->padding().empty(), framework::LogLevel::ERRORS);
133*c217d954SCole Faust ARM_COMPUTE_EXPECT(biases.info()->padding().empty(), framework::LogLevel::ERRORS);
134*c217d954SCole Faust ARM_COMPUTE_EXPECT(dst.info()->padding().empty(), framework::LogLevel::ERRORS);
135*c217d954SCole Faust }
136*c217d954SCole Faust
137*c217d954SCole Faust TEST_SUITE(KERNEL_SELECTION)
138*c217d954SCole Faust DATA_TEST_CASE(KernelSelection_mul_and_add, framework::DatasetMode::ALL,
139*c217d954SCole Faust combine(combine(framework::dataset::make("CpuExt", std::string("NEON")),
140*c217d954SCole Faust framework::dataset::make("DataType", { DataType::F32,
141*c217d954SCole Faust DataType::F16,
142*c217d954SCole Faust DataType::QASYMM8_SIGNED,
143*c217d954SCole Faust DataType::QASYMM8,
144*c217d954SCole Faust DataType::QSYMM8_PER_CHANNEL
145*c217d954SCole Faust })),
146*c217d954SCole Faust framework::dataset::make("DataType_per_channel", { DataType::QASYMM8,
147*c217d954SCole Faust DataType::QASYMM8_SIGNED
148*c217d954SCole Faust })),
149*c217d954SCole Faust cpu_ext, data_type, data_type_per_channel)
150*c217d954SCole Faust {
151*c217d954SCole Faust using namespace cpu::kernels;
152*c217d954SCole Faust
153*c217d954SCole Faust cpuinfo::CpuIsaInfo cpu_isa{};
154*c217d954SCole Faust cpu_isa.neon = (cpu_ext == "NEON");
155*c217d954SCole Faust cpu_isa.fp16 = (data_type == DataType::F16);
156*c217d954SCole Faust
157*c217d954SCole Faust const auto *selected_impl = CpuDepthwiseConv2dNativeKernel::get_implementation(
158*c217d954SCole Faust DepthwiseConv2dNativeDataTypeISASelectorData{ data_type, data_type_per_channel,cpu_isa },
159*c217d954SCole Faust cpu::KernelSelectionType::Preferred );
160*c217d954SCole Faust
161*c217d954SCole Faust ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);
162*c217d954SCole Faust
163*c217d954SCole Faust std::string per_channel_str = "_";
164*c217d954SCole Faust if (data_type == DataType::QSYMM8_PER_CHANNEL)
165*c217d954SCole Faust {
166*c217d954SCole Faust per_channel_str = "_" + cpu_impl_dt(data_type_per_channel) + "_" ;
167*c217d954SCole Faust }
168*c217d954SCole Faust std::string expected = lower_string(cpu_ext) + "_" + cpu_impl_dt(data_type) + per_channel_str + "deptwiseconv2dnative";
169*c217d954SCole Faust std::string actual = selected_impl->name;
170*c217d954SCole Faust
171*c217d954SCole Faust ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
172*c217d954SCole Faust }
173*c217d954SCole Faust TEST_SUITE_END() // KERNEL_SELECTION
174*c217d954SCole Faust
TEST_SUITE(Float)
TEST_SUITE(FP32)
177*c217d954SCole Faust FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CpuDepthwiseConvolutionNativeFixture<float>, framework::DatasetMode::ALL,
178*c217d954SCole Faust combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(width_values_precommit,
179*c217d954SCole Faust height_values_precommit),
180*c217d954SCole Faust channel_values_precommit),
181*c217d954SCole Faust batch_values_precommit),
182*c217d954SCole Faust kernel_sz_values_precommit),
183*c217d954SCole Faust depth_multiplier_values),
184*c217d954SCole Faust dilation_values),
185*c217d954SCole Faust stride_values),
186*c217d954SCole Faust padding_valid_values),
187*c217d954SCole Faust data_type_values),
188*c217d954SCole Faust data_layout_values))
189*c217d954SCole Faust {
190*c217d954SCole Faust // Validate output
191*c217d954SCole Faust validate(Accessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
192*c217d954SCole Faust }
193*c217d954SCole Faust
/** Runs the F32 fixture over the nightly datasets (registered for DatasetMode::NIGHTLY).
 *
 * The dataset is the combination of the nightly width/height/channel/batch/kernel-size values
 * with the shared depth multiplier, dilation, stride, padding_valid, data type and data layout values.
 */
FIXTURE_DATA_TEST_CASE_NEW(RunLarge, CpuDepthwiseConvolutionNativeFixture<float>, framework::DatasetMode::NIGHTLY,
                           combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(width_values_nightly,
                                                                                                           height_values_nightly),
                                                                                                   channel_values_nightly),
                                                                                           batch_values_nightly),
                                                                                   kernel_sz_values_nightly),
                                                                           depth_multiplier_values),
                                                                   dilation_values),
                                                           stride_values),
                                                   padding_valid_values),
                                           data_type_values),
                                   data_layout_values))
{
    // Validate output: target vs. reference with the F32 relative and absolute tolerances
    // (0.f is validate()'s fourth argument - presumably the tolerated mismatch ratio; confirm in Validation.h)
    validate(Accessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}
210*c217d954SCole Faust
211*c217d954SCole Faust TEST_SUITE_END() // FP32
212*c217d954SCole Faust TEST_SUITE_END() // Float
213*c217d954SCole Faust TEST_SUITE_END() // DepthwiseConvolutionLayerNative
214*c217d954SCole Faust TEST_SUITE_END() // Neon
215*c217d954SCole Faust } // namespace validation
216*c217d954SCole Faust } // namespace test
217*c217d954SCole Faust } // namespace arm_compute
218