xref: /aosp_15_r20/external/ComputeLibrary/tests/validation/NEON/DepthwiseConvolutionLayerNative.cpp (revision c217d954acce2dbc11938adb493fc0abd69584f3)
1*c217d954SCole Faust /*
2*c217d954SCole Faust  * Copyright (c) 2019-2022 Arm Limited.
3*c217d954SCole Faust  *
4*c217d954SCole Faust  * SPDX-License-Identifier: MIT
5*c217d954SCole Faust  *
6*c217d954SCole Faust  * Permission is hereby granted, free of charge, to any person obtaining a copy
7*c217d954SCole Faust  * of this software and associated documentation files (the "Software"), to
8*c217d954SCole Faust  * deal in the Software without restriction, including without limitation the
9*c217d954SCole Faust  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10*c217d954SCole Faust  * sell copies of the Software, and to permit persons to whom the Software is
11*c217d954SCole Faust  * furnished to do so, subject to the following conditions:
12*c217d954SCole Faust  *
13*c217d954SCole Faust  * The above copyright notice and this permission notice shall be included in all
14*c217d954SCole Faust  * copies or substantial portions of the Software.
15*c217d954SCole Faust  *
16*c217d954SCole Faust  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17*c217d954SCole Faust  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18*c217d954SCole Faust  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19*c217d954SCole Faust  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20*c217d954SCole Faust  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21*c217d954SCole Faust  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22*c217d954SCole Faust  * SOFTWARE.
23*c217d954SCole Faust  */
24*c217d954SCole Faust #include "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.h"
25*c217d954SCole Faust #include "tests/NEON/Accessor.h"
26*c217d954SCole Faust #include "tests/NEON/Helper.h"
27*c217d954SCole Faust #include "tests/framework/Macros.h"
28*c217d954SCole Faust #include "tests/framework/datasets/Datasets.h"
29*c217d954SCole Faust #include "tests/validation/Validation.h"
30*c217d954SCole Faust #include "tests/validation/fixtures/DepthwiseConvolutionLayerFixture.h"
31*c217d954SCole Faust 
32*c217d954SCole Faust namespace arm_compute
33*c217d954SCole Faust {
34*c217d954SCole Faust namespace test
35*c217d954SCole Faust {
36*c217d954SCole Faust namespace validation
37*c217d954SCole Faust {
38*c217d954SCole Faust using namespace arm_compute::misc::shape_calculator;
39*c217d954SCole Faust 
40*c217d954SCole Faust // Create function for CpuDepthwiseConvolutionKernel
41*c217d954SCole Faust using CpuDepthwiseConvolutionNative = NESynthetizeFunctionWithZeroConstantKernelBorder<cpu::kernels::CpuDepthwiseConv2dNativeKernel>;
42*c217d954SCole Faust 
43*c217d954SCole Faust // Fixture for NEDepthwiseConvolutionLayerKernel
44*c217d954SCole Faust template <typename T>
45*c217d954SCole Faust using CpuDepthwiseConvolutionNativeFixture = DepthwiseConvolutionLayerNativeValidationFixture<Tensor, Accessor, CpuDepthwiseConvolutionNative, T>;
46*c217d954SCole Faust 
47*c217d954SCole Faust namespace
48*c217d954SCole Faust {
49*c217d954SCole Faust // *INDENT-OFF*
50*c217d954SCole Faust // clang-format off
51*c217d954SCole Faust RelativeTolerance<float> rel_tolerance_f32(0.001f);
52*c217d954SCole Faust constexpr float          abs_tolerance_f32(0.0001f);
53*c217d954SCole Faust 
54*c217d954SCole Faust /** Width values to test - Precommit */
55*c217d954SCole Faust const auto width_values_precommit = framework::dataset::make("width", { 17U } );
56*c217d954SCole Faust 
57*c217d954SCole Faust /** Width values to test - Nightly */
58*c217d954SCole Faust const auto width_values_nightly = framework::dataset::make("width", { 53U, 47U } );
59*c217d954SCole Faust 
60*c217d954SCole Faust /** Height values to test - Precommit */
61*c217d954SCole Faust const auto height_values_precommit = framework::dataset::make("height", { 19U } );
62*c217d954SCole Faust 
63*c217d954SCole Faust /** Height values to test - Nightly */
64*c217d954SCole Faust const auto height_values_nightly = framework::dataset::make("height", { 39U, 43U } );
65*c217d954SCole Faust 
66*c217d954SCole Faust /** Channel values to test - Precommit */
67*c217d954SCole Faust const auto channel_values_precommit = framework::dataset::make("channels", { 15U });
68*c217d954SCole Faust 
69*c217d954SCole Faust /** Channel values to test - Nightly */
70*c217d954SCole Faust const auto channel_values_nightly = framework::dataset::make("channels", { 33U, 19U });
71*c217d954SCole Faust 
72*c217d954SCole Faust /** Batch values to test - Precommit */
73*c217d954SCole Faust const auto batch_values_precommit = framework::dataset::make("batch", { 1U, 2U });
74*c217d954SCole Faust 
75*c217d954SCole Faust /** Batch values to test - Nightly */
76*c217d954SCole Faust const auto batch_values_nightly = framework::dataset::make("batch", { 1U, 3U });
77*c217d954SCole Faust 
78*c217d954SCole Faust /** Kernel size values to test - Precommit */
79*c217d954SCole Faust const auto kernel_sz_values_precommit = framework::dataset::make("kernel_size", { Size2D(1U, 1U), Size2D(1U, 3U) });
80*c217d954SCole Faust 
81*c217d954SCole Faust /** Kernel size values to test - Nightly */
82*c217d954SCole Faust const auto kernel_sz_values_nightly = framework::dataset::make("kernel_size", { Size2D(3U, 5U), Size2D(5U, 1U), Size2D(1U, 7U), Size2D(9U, 7U) });
83*c217d954SCole Faust 
84*c217d954SCole Faust /** Depth multiplier values to test - All */
85*c217d954SCole Faust const auto depth_multiplier_values = framework::dataset::make("depth_multiplier", { 1U, 3U });
86*c217d954SCole Faust 
87*c217d954SCole Faust /** Dilation values to test - All */
88*c217d954SCole Faust const auto dilation_values = framework::dataset::make("dilation", { Size2D(1U, 1U), Size2D(3U, 3U) });
89*c217d954SCole Faust 
90*c217d954SCole Faust /** Stride values to test - All */
91*c217d954SCole Faust const auto stride_values = framework::dataset::make("stride", { Size2D(1U, 1U), Size2D(3U, 2U) });
92*c217d954SCole Faust 
93*c217d954SCole Faust /** Padding values to test - All */
94*c217d954SCole Faust const auto padding_valid_values = framework::dataset::make("padding_valid", { true, false });
95*c217d954SCole Faust 
96*c217d954SCole Faust /** Data type values to test - All */
97*c217d954SCole Faust const auto data_type_values = framework::dataset::make("data_type", { DataType::F32 });
98*c217d954SCole Faust 
99*c217d954SCole Faust /** Data layout values to test - All */
100*c217d954SCole Faust const auto data_layout_values = framework::dataset::make("data_layout", { DataLayout::NHWC });
101*c217d954SCole Faust } // namespace
102*c217d954SCole Faust 
103*c217d954SCole Faust TEST_SUITE(NEON)
TEST_SUITE(DepthwiseConvolutionLayerNative)104*c217d954SCole Faust TEST_SUITE(DepthwiseConvolutionLayerNative)
105*c217d954SCole Faust 
106*c217d954SCole Faust TEST_CASE(ValidateNoPadding, framework::DatasetMode::ALL)
107*c217d954SCole Faust {
108*c217d954SCole Faust     // this test case will ensure that the kernel is not adding implicit padding
109*c217d954SCole Faust     constexpr uint32_t vector_size = 8; // Asummed vector size of the current native kernel
110*c217d954SCole Faust     constexpr auto     depth = vector_size * 2 + 1; // mis-aligned depth to force padding if exists.
111*c217d954SCole Faust     constexpr auto     data_layout = DataLayout::NHWC;
112*c217d954SCole Faust     constexpr auto     data_type = DataType::F32;
113*c217d954SCole Faust 
114*c217d954SCole Faust     const auto input_size  = Size2D{ 100, 100 }; // random plane size of the input
115*c217d954SCole Faust     const auto kernel_size = Size2D{ 4, 4 }; // random plane size of the kernel
116*c217d954SCole Faust     const auto pad_stride_info = PadStrideInfo(3, 3); // random convolution information to
117*c217d954SCole Faust 
118*c217d954SCole Faust     TensorShape src_shape{ depth, input_size.x(), input_size.y() };
119*c217d954SCole Faust     TensorShape weights_shape{ depth, kernel_size.x(), kernel_size.y() };
120*c217d954SCole Faust     TensorShape bias_shape{ depth };
121*c217d954SCole Faust 
122*c217d954SCole Faust     auto src     = create_tensor<Tensor>(src_shape, data_type, 1, QuantizationInfo(), data_layout);
123*c217d954SCole Faust     auto weights = create_tensor<Tensor>(weights_shape, data_type, 1, QuantizationInfo(), data_layout);
124*c217d954SCole Faust     auto biases  = create_tensor<Tensor>(bias_shape, data_type, 1, QuantizationInfo(), data_layout);
125*c217d954SCole Faust     auto dst     = create_tensor<Tensor>(TensorShape(), data_type, 1, QuantizationInfo(), data_layout);
126*c217d954SCole Faust 
127*c217d954SCole Faust     cpu::kernels::CpuDepthwiseConv2dNativeKernel dwc;
128*c217d954SCole Faust     const ConvolutionInfo info{pad_stride_info, 1, ActivationLayerInfo(), Size2D(1, 1)};
129*c217d954SCole Faust     dwc.configure(src.info(), weights.info(), biases.info(), dst.info(), info);
130*c217d954SCole Faust 
131*c217d954SCole Faust     ARM_COMPUTE_EXPECT(src.info()->padding().empty(), framework::LogLevel::ERRORS);
132*c217d954SCole Faust     ARM_COMPUTE_EXPECT(weights.info()->padding().empty(), framework::LogLevel::ERRORS);
133*c217d954SCole Faust     ARM_COMPUTE_EXPECT(biases.info()->padding().empty(), framework::LogLevel::ERRORS);
134*c217d954SCole Faust     ARM_COMPUTE_EXPECT(dst.info()->padding().empty(), framework::LogLevel::ERRORS);
135*c217d954SCole Faust }
136*c217d954SCole Faust 
137*c217d954SCole Faust TEST_SUITE(KERNEL_SELECTION)
138*c217d954SCole Faust DATA_TEST_CASE(KernelSelection_mul_and_add, framework::DatasetMode::ALL,
139*c217d954SCole Faust                combine(combine(framework::dataset::make("CpuExt", std::string("NEON")),
140*c217d954SCole Faust                        framework::dataset::make("DataType", { DataType::F32,
141*c217d954SCole Faust                                                               DataType::F16,
142*c217d954SCole Faust                                                               DataType::QASYMM8_SIGNED,
143*c217d954SCole Faust                                                               DataType::QASYMM8,
144*c217d954SCole Faust                                                               DataType::QSYMM8_PER_CHANNEL
145*c217d954SCole Faust                                                             })),
146*c217d954SCole Faust                        framework::dataset::make("DataType_per_channel", { DataType::QASYMM8,
147*c217d954SCole Faust                                                                           DataType::QASYMM8_SIGNED
148*c217d954SCole Faust                                                             })),
149*c217d954SCole Faust                 cpu_ext, data_type, data_type_per_channel)
150*c217d954SCole Faust {
151*c217d954SCole Faust     using namespace cpu::kernels;
152*c217d954SCole Faust 
153*c217d954SCole Faust     cpuinfo::CpuIsaInfo cpu_isa{};
154*c217d954SCole Faust     cpu_isa.neon = (cpu_ext == "NEON");
155*c217d954SCole Faust     cpu_isa.fp16 = (data_type == DataType::F16);
156*c217d954SCole Faust 
157*c217d954SCole Faust     const auto *selected_impl = CpuDepthwiseConv2dNativeKernel::get_implementation(
158*c217d954SCole Faust         DepthwiseConv2dNativeDataTypeISASelectorData{ data_type, data_type_per_channel,cpu_isa },
159*c217d954SCole Faust         cpu::KernelSelectionType::Preferred );
160*c217d954SCole Faust 
161*c217d954SCole Faust     ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);
162*c217d954SCole Faust 
163*c217d954SCole Faust     std::string per_channel_str = "_";
164*c217d954SCole Faust     if (data_type == DataType::QSYMM8_PER_CHANNEL)
165*c217d954SCole Faust     {
166*c217d954SCole Faust         per_channel_str = "_" + cpu_impl_dt(data_type_per_channel) + "_" ;
167*c217d954SCole Faust     }
168*c217d954SCole Faust     std::string expected = lower_string(cpu_ext) + "_" + cpu_impl_dt(data_type)  + per_channel_str + "deptwiseconv2dnative";
169*c217d954SCole Faust     std::string actual   = selected_impl->name;
170*c217d954SCole Faust 
171*c217d954SCole Faust     ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
172*c217d954SCole Faust }
173*c217d954SCole Faust TEST_SUITE_END() // KERNEL_SELECTION
174*c217d954SCole Faust 
// Open the nested Float / FP32 suites. Each suite is opened exactly once so that it pairs
// with the single TEST_SUITE_END() that closes it further down.
TEST_SUITE(Float)
TEST_SUITE(FP32)
177*c217d954SCole Faust FIXTURE_DATA_TEST_CASE_NEW(RunSmall, CpuDepthwiseConvolutionNativeFixture<float>, framework::DatasetMode::ALL,
178*c217d954SCole Faust                 combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(width_values_precommit,
179*c217d954SCole Faust                                                                                                 height_values_precommit),
180*c217d954SCole Faust                                                                                                 channel_values_precommit),
181*c217d954SCole Faust                                                                                                 batch_values_precommit),
182*c217d954SCole Faust                                                                                                 kernel_sz_values_precommit),
183*c217d954SCole Faust                                                                                                 depth_multiplier_values),
184*c217d954SCole Faust                                                                                                 dilation_values),
185*c217d954SCole Faust                                                                                                 stride_values),
186*c217d954SCole Faust                                                                                                 padding_valid_values),
187*c217d954SCole Faust                                                                                                 data_type_values),
188*c217d954SCole Faust                                                                                                 data_layout_values))
189*c217d954SCole Faust {
190*c217d954SCole Faust     // Validate output
191*c217d954SCole Faust     validate(Accessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
192*c217d954SCole Faust }
193*c217d954SCole Faust 
// Nightly run (DatasetMode::NIGHTLY): the nightly width/height/channel/batch/kernel-size
// datasets combined with the shared depth multiplier, dilation, stride, padding, data type
// and data layout datasets. The test is declared exactly once; the combination order is the
// order in which the fixture receives its parameters.
FIXTURE_DATA_TEST_CASE_NEW(RunLarge, CpuDepthwiseConvolutionNativeFixture<float>, framework::DatasetMode::NIGHTLY,
                combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(width_values_nightly,
                                                                                                height_values_nightly),
                                                                                                channel_values_nightly),
                                                                                                batch_values_nightly),
                                                                                                kernel_sz_values_nightly),
                                                                                                depth_multiplier_values),
                                                                                                dilation_values),
                                                                                                stride_values),
                                                                                                padding_valid_values),
                                                                                                data_type_values),
                                                                                                data_layout_values))
{
    // Check the fixture's target output against its reference output within the F32 tolerances
    validate(Accessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}
210*c217d954SCole Faust 
211*c217d954SCole Faust TEST_SUITE_END() // FP32
212*c217d954SCole Faust TEST_SUITE_END() // Float
213*c217d954SCole Faust TEST_SUITE_END() // DepthwiseConvolutionLayerNative
214*c217d954SCole Faust TEST_SUITE_END() // Neon
215*c217d954SCole Faust } // namespace validation
216*c217d954SCole Faust } // namespace test
217*c217d954SCole Faust } // namespace arm_compute
218