1*c217d954SCole Faust /*
2*c217d954SCole Faust * Copyright (c) 2019-2022 Arm Limited.
3*c217d954SCole Faust *
4*c217d954SCole Faust * SPDX-License-Identifier: MIT
5*c217d954SCole Faust *
6*c217d954SCole Faust * Permission is hereby granted, free of charge, to any person obtaining a copy
7*c217d954SCole Faust * of this software and associated documentation files (the "Software"), to
8*c217d954SCole Faust * deal in the Software without restriction, including without limitation the
9*c217d954SCole Faust * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10*c217d954SCole Faust * sell copies of the Software, and to permit persons to whom the Software is
11*c217d954SCole Faust * furnished to do so, subject to the following conditions:
12*c217d954SCole Faust *
13*c217d954SCole Faust * The above copyright notice and this permission notice shall be included in all
14*c217d954SCole Faust * copies or substantial portions of the Software.
15*c217d954SCole Faust *
16*c217d954SCole Faust * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17*c217d954SCole Faust * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18*c217d954SCole Faust * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19*c217d954SCole Faust * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20*c217d954SCole Faust * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21*c217d954SCole Faust * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22*c217d954SCole Faust * SOFTWARE.
23*c217d954SCole Faust */
24*c217d954SCole Faust #include "arm_compute/core/Types.h"
25*c217d954SCole Faust #include "arm_compute/runtime/NEON/functions/NECast.h"
26*c217d954SCole Faust #include "arm_compute/runtime/Tensor.h"
27*c217d954SCole Faust #include "arm_compute/runtime/TensorAllocator.h"
28*c217d954SCole Faust #include "src/common/cpuinfo/CpuIsaInfo.h"
29*c217d954SCole Faust #include "src/cpu/kernels/CpuCastKernel.h"
30*c217d954SCole Faust #include "tests/NEON/Accessor.h"
31*c217d954SCole Faust #include "tests/PaddingCalculator.h"
32*c217d954SCole Faust #include "tests/datasets/ConvertPolicyDataset.h"
33*c217d954SCole Faust #include "tests/datasets/ShapeDatasets.h"
34*c217d954SCole Faust #include "tests/framework/Asserts.h"
35*c217d954SCole Faust #include "tests/framework/Macros.h"
36*c217d954SCole Faust #include "tests/framework/datasets/Datasets.h"
37*c217d954SCole Faust #include "tests/validation/Validation.h"
38*c217d954SCole Faust #include "tests/validation/fixtures/CastFixture.h"
39*c217d954SCole Faust namespace arm_compute
40*c217d954SCole Faust {
41*c217d954SCole Faust namespace test
42*c217d954SCole Faust {
43*c217d954SCole Faust namespace validation
44*c217d954SCole Faust {
45*c217d954SCole Faust namespace
46*c217d954SCole Faust {
47*c217d954SCole Faust // Tolerance
48*c217d954SCole Faust constexpr AbsoluteTolerance<float> one_tolerance(1);
49*c217d954SCole Faust constexpr AbsoluteTolerance<float> zero_tolerance(0);
50*c217d954SCole Faust
/*
 * This function ignores the scale and zero point of quantized tensors, so QASYMM8 input is treated as uint8 values.
 */
54*c217d954SCole Faust
55*c217d954SCole Faust /** Input data sets **/
56*c217d954SCole Faust
57*c217d954SCole Faust // QASYMM8_SIGNED
58*c217d954SCole Faust const auto CastQASYMM8_SIGNEDtoS16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::S16));
59*c217d954SCole Faust const auto CastQASYMM8_SIGNEDtoS32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::S32));
60*c217d954SCole Faust const auto CastQASYMM8_SIGNEDtoF32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::F32));
61*c217d954SCole Faust const auto CastQASYMM8_SIGNEDtoF16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::F16));
62*c217d954SCole Faust
63*c217d954SCole Faust // QASYMM8
64*c217d954SCole Faust const auto CastQASYMM8toF16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::F16));
65*c217d954SCole Faust const auto CastQASYMM8toF32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::F32));
66*c217d954SCole Faust const auto CastQASYMM8toS32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::S32));
67*c217d954SCole Faust
68*c217d954SCole Faust // U8
69*c217d954SCole Faust const auto CastU8toU16Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::U16));
70*c217d954SCole Faust const auto CastU8toS16Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::S16));
71*c217d954SCole Faust const auto CastU8toS32Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::S32));
72*c217d954SCole Faust const auto CastU8toF32Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::F32));
73*c217d954SCole Faust
74*c217d954SCole Faust // U16
75*c217d954SCole Faust const auto CastU16toU8Dataset = combine(framework::dataset::make("DataType", DataType::U16), framework::dataset::make("DataType", DataType::U8));
76*c217d954SCole Faust const auto CastU16toU32Dataset = combine(framework::dataset::make("DataType", DataType::U16), framework::dataset::make("DataType", DataType::U32));
77*c217d954SCole Faust
78*c217d954SCole Faust // S16
79*c217d954SCole Faust const auto CastS16toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
80*c217d954SCole Faust const auto CastS16toU8Dataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::U8));
81*c217d954SCole Faust const auto CastS16toS32Dataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::S32));
82*c217d954SCole Faust
83*c217d954SCole Faust //S32
84*c217d954SCole Faust const auto CastS32toF16Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::F16));
85*c217d954SCole Faust const auto CastS32toU8Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::U8));
86*c217d954SCole Faust const auto CastS32toF32Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::F32));
87*c217d954SCole Faust const auto CastS32toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::QASYMM8));
88*c217d954SCole Faust const auto CastS32toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
89*c217d954SCole Faust
90*c217d954SCole Faust // F16
91*c217d954SCole Faust const auto CastF16toF32Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::F32));
92*c217d954SCole Faust const auto CastF16toS32Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::S32));
93*c217d954SCole Faust const auto CastF16toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::QASYMM8));
94*c217d954SCole Faust const auto CastF16toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
95*c217d954SCole Faust
96*c217d954SCole Faust // F32
97*c217d954SCole Faust const auto CastF32toU8Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::U8));
98*c217d954SCole Faust const auto CastF32toF16Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::F16));
99*c217d954SCole Faust const auto CastF32toS32Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::S32));
100*c217d954SCole Faust const auto CastF32toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::QASYMM8));
101*c217d954SCole Faust const auto CastF32toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
102*c217d954SCole Faust
103*c217d954SCole Faust } // namespace
104*c217d954SCole Faust
105*c217d954SCole Faust TEST_SUITE(NEON)
106*c217d954SCole Faust TEST_SUITE(Cast)
107*c217d954SCole Faust template <typename T>
108*c217d954SCole Faust using NECastToU8Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint8_t>;
109*c217d954SCole Faust template <typename T>
110*c217d954SCole Faust using NECastToU16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint16_t>;
111*c217d954SCole Faust template <typename T>
112*c217d954SCole Faust using NECastToS16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, int16_t>;
113*c217d954SCole Faust template <typename T>
114*c217d954SCole Faust using NECastToU32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint32_t>;
115*c217d954SCole Faust template <typename T>
116*c217d954SCole Faust using NECastToS32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, int32_t>;
117*c217d954SCole Faust template <typename T>
118*c217d954SCole Faust using NECastToF16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, half>;
119*c217d954SCole Faust template <typename T>
120*c217d954SCole Faust using NECastToF32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, float>;
121*c217d954SCole Faust template <typename T>
122*c217d954SCole Faust using NECastToQASYMM8Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint8_t>;
123*c217d954SCole Faust template <typename T>
124*c217d954SCole Faust using NECastToQASYMM8_SIGNEDFixture = CastValidationFixture<Tensor, Accessor, NECast, T, int8_t>;
125*c217d954SCole Faust
/* Declares a test suite called `suite_name` that contains one PRECOMMIT fixture test
 * case, RunSmall. The case runs `fixture` over SmallShapes combined with `dt_pairs`
 * and ConvertPolicies, then validates the target against the reference using `tol`.
 *
 * `src_dt` and `dst_dt` are accepted but not referenced by the expansion.
 */
#define CAST_SUITE(suite_name, src_dt, dst_dt, fixture, dt_pairs, tol)                                      \
    TEST_SUITE(suite_name)                                                                                  \
    FIXTURE_DATA_TEST_CASE(RunSmall, fixture, framework::DatasetMode::PRECOMMIT,                            \
                           combine(combine(datasets::SmallShapes(), dt_pairs), datasets::ConvertPolicies())) \
    {                                                                                                       \
        validate(Accessor(_target), _reference, tol);                                                       \
    }                                                                                                       \
    TEST_SUITE_END()
134*c217d954SCole Faust
135*c217d954SCole Faust //QASYMM8_SIGNED
CAST_SUITE(QASYMM8_SIGNED_to_S16,DataType::QASYMM8_SIGNED,DataType::S16,NECastToS16Fixture<int8_t>,CastQASYMM8_SIGNEDtoS16Dataset,one_tolerance)136*c217d954SCole Faust CAST_SUITE(QASYMM8_SIGNED_to_S16, DataType::QASYMM8_SIGNED, DataType::S16, NECastToS16Fixture<int8_t>, CastQASYMM8_SIGNEDtoS16Dataset, one_tolerance)
137*c217d954SCole Faust CAST_SUITE(QASYMM8_SIGNED_to_S32, DataType::QASYMM8_SIGNED, DataType::S32, NECastToS32Fixture<int8_t>, CastQASYMM8_SIGNEDtoS32Dataset, one_tolerance)
138*c217d954SCole Faust CAST_SUITE(QASYMM8_SIGNED_to_F32, DataType::QASYMM8_SIGNED, DataType::F32, NECastToF32Fixture<int8_t>, CastQASYMM8_SIGNEDtoF32Dataset, one_tolerance)
139*c217d954SCole Faust #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
140*c217d954SCole Faust CAST_SUITE(QASYMM8_SIGNED_to_F16, DataType::QASYMM8_SIGNED, DataType::F16, NECastToF16Fixture<int8_t>, CastQASYMM8_SIGNEDtoF16Dataset, one_tolerance)
141*c217d954SCole Faust #endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
142*c217d954SCole Faust
143*c217d954SCole Faust //QASYMM8
144*c217d954SCole Faust #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
145*c217d954SCole Faust CAST_SUITE(QASYMM8_to_F16, DataType::QASYMM8, DataType::F16, NECastToF16Fixture<uint8_t>, CastQASYMM8toF16Dataset, one_tolerance)
146*c217d954SCole Faust #endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
147*c217d954SCole Faust CAST_SUITE(QASYMM8_to_F32, DataType::QASYMM8, DataType::F32, NECastToF32Fixture<uint8_t>, CastQASYMM8toF32Dataset, one_tolerance)
148*c217d954SCole Faust CAST_SUITE(QASYMM8_to_S32, DataType::QASYMM8, DataType::S32, NECastToS32Fixture<uint8_t>, CastQASYMM8toS32Dataset, one_tolerance)
149*c217d954SCole Faust
150*c217d954SCole Faust // U8
151*c217d954SCole Faust CAST_SUITE(U8_to_U16, DataType::U8, DataType::U16, NECastToU16Fixture<uint8_t>, CastU8toU16Dataset, zero_tolerance)
152*c217d954SCole Faust CAST_SUITE(U8_to_S16, DataType::U8, DataType::S16, NECastToS16Fixture<uint8_t>, CastU8toS16Dataset, zero_tolerance)
153*c217d954SCole Faust CAST_SUITE(U8_to_S32, DataType::U8, DataType::S32, NECastToS32Fixture<uint8_t>, CastU8toS32Dataset, zero_tolerance)
154*c217d954SCole Faust CAST_SUITE(U8_to_F32, DataType::U8, DataType::F32, NECastToF32Fixture<uint8_t>, CastU8toF32Dataset, zero_tolerance)
155*c217d954SCole Faust
156*c217d954SCole Faust // U16
157*c217d954SCole Faust CAST_SUITE(U16_to_U8, DataType::U16, DataType::U8, NECastToU8Fixture<uint16_t>, CastU16toU8Dataset, zero_tolerance)
158*c217d954SCole Faust CAST_SUITE(U16_to_U32, DataType::U16, DataType::U32, NECastToU32Fixture<uint16_t>, CastU16toU32Dataset, zero_tolerance)
159*c217d954SCole Faust
160*c217d954SCole Faust // S16
161*c217d954SCole Faust CAST_SUITE(S16_to_QASYMM8_SIGNED, DataType::S16, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<int16_t>, CastS16toQASYMM8_SIGNEDDataset, zero_tolerance)
162*c217d954SCole Faust CAST_SUITE(S16_to_U8, DataType::S16, DataType::U8, NECastToU8Fixture<int16_t>, CastS16toU8Dataset, zero_tolerance)
163*c217d954SCole Faust CAST_SUITE(S16_to_S32, DataType::S16, DataType::S32, NECastToS32Fixture<int16_t>, CastS16toS32Dataset, zero_tolerance)
164*c217d954SCole Faust
165*c217d954SCole Faust // S32
166*c217d954SCole Faust CAST_SUITE(S32_to_QASYMM8_SIGNED, DataType::S32, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<int32_t>, CastS32toQASYMM8_SIGNEDDataset, one_tolerance)
167*c217d954SCole Faust CAST_SUITE(S32_to_QASYMM8, DataType::S32, DataType::QASYMM8, NECastToQASYMM8Fixture<int32_t>, CastS32toQASYMM8Dataset, one_tolerance)
168*c217d954SCole Faust #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
169*c217d954SCole Faust CAST_SUITE(S32_to_F16, DataType::S32, DataType::F16, NECastToF16Fixture<int32_t>, CastS32toF16Dataset, zero_tolerance)
170*c217d954SCole Faust #endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
171*c217d954SCole Faust CAST_SUITE(S32_to_F32, DataType::S32, DataType::F32, NECastToF32Fixture<int32_t>, CastS32toF32Dataset, one_tolerance)
172*c217d954SCole Faust CAST_SUITE(S32_to_U8, DataType::S32, DataType::U8, NECastToU8Fixture<int32_t>, CastS32toU8Dataset, one_tolerance)
173*c217d954SCole Faust
// Casts whose source is F16; the whole group is compiled only when the FP16 vector
// arithmetic feature macro is defined.
#if defined(__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
CAST_SUITE(F16_to_QASYMM8_SIGNED,
           DataType::F16, DataType::QASYMM8_SIGNED,
           NECastToQASYMM8_SIGNEDFixture<half>, CastF16toQASYMM8_SIGNEDDataset,
           one_tolerance)
CAST_SUITE(F16_to_QASYMM8,
           DataType::F16, DataType::QASYMM8,
           NECastToQASYMM8Fixture<half>, CastF16toQASYMM8Dataset,
           one_tolerance)
CAST_SUITE(F16_to_F32,
           DataType::F16, DataType::F32,
           NECastToF32Fixture<half>, CastF16toF32Dataset,
           zero_tolerance)
CAST_SUITE(F16_to_S32,
           DataType::F16, DataType::S32,
           NECastToS32Fixture<half>, CastF16toS32Dataset,
           one_tolerance)
#endif /* defined(__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) */
181*c217d954SCole Faust
182*c217d954SCole Faust // F32
183*c217d954SCole Faust CAST_SUITE(F32_to_QASYMM8_SIGNED, DataType::F32, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<float>, CastF32toQASYMM8_SIGNEDDataset, one_tolerance)
184*c217d954SCole Faust CAST_SUITE(F32_to_QASYMM8, DataType::F32, DataType::QASYMM8, NECastToQASYMM8Fixture<float>, CastF32toQASYMM8Dataset, one_tolerance)
185*c217d954SCole Faust #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
186*c217d954SCole Faust CAST_SUITE(F32_to_F16, DataType::F32, DataType::F16, NECastToF16Fixture<float>, CastF32toF16Dataset, zero_tolerance)
187*c217d954SCole Faust #endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
188*c217d954SCole Faust CAST_SUITE(F32_to_S32, DataType::F32, DataType::S32, NECastToS32Fixture<float>, CastF32toS32Dataset, one_tolerance)
189*c217d954SCole Faust CAST_SUITE(F32_to_U8, DataType::F32, DataType::S32, NECastToS32Fixture<float>, CastF32toS32Dataset, one_tolerance)
190*c217d954SCole Faust
191*c217d954SCole Faust DATA_TEST_CASE(KernelSelectionDstFP16, framework::DatasetMode::ALL,
192*c217d954SCole Faust combine(framework::dataset::make("CpuExt", std::string("NEON")),
193*c217d954SCole Faust framework::dataset::make("DataType",
194*c217d954SCole Faust {
195*c217d954SCole Faust DataType::F16,
196*c217d954SCole Faust DataType::U8,
197*c217d954SCole Faust DataType::S32,
198*c217d954SCole Faust DataType::QASYMM8,
199*c217d954SCole Faust DataType::QASYMM8_SIGNED,
200*c217d954SCole Faust DataType::BFLOAT16,
201*c217d954SCole Faust })),
202*c217d954SCole Faust cpu_ext, data_type)
203*c217d954SCole Faust {
204*c217d954SCole Faust using namespace cpu::kernels;
205*c217d954SCole Faust const CpuCastKernel::CastKernel *selected_impl;
206*c217d954SCole Faust
207*c217d954SCole Faust cpuinfo::CpuIsaInfo cpu_isa{};
208*c217d954SCole Faust cpu_isa.neon = (cpu_ext == "NEON");
209*c217d954SCole Faust
210*c217d954SCole Faust cpu_isa.bf16 = (data_type == DataType::BFLOAT16);
211*c217d954SCole Faust
212*c217d954SCole Faust /* bf16 cast is different from all the others being converted to fp32 and not to fp16 */
213*c217d954SCole Faust if(cpu_isa.bf16)
214*c217d954SCole Faust {
215*c217d954SCole Faust cpu_isa.fp16 = false;
216*c217d954SCole Faust selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ data_type, DataType::F32, cpu_isa }, cpu::KernelSelectionType::Preferred);
217*c217d954SCole Faust }
218*c217d954SCole Faust else
219*c217d954SCole Faust {
220*c217d954SCole Faust cpu_isa.fp16 = true;
221*c217d954SCole Faust selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ data_type, DataType::F16, cpu_isa }, cpu::KernelSelectionType::Preferred);
222*c217d954SCole Faust }
223*c217d954SCole Faust
224*c217d954SCole Faust ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);
225*c217d954SCole Faust
226*c217d954SCole Faust std::string expected = lower_string(cpu_ext) + "_" + cpu_impl_dt(data_type) + "_cast";
227*c217d954SCole Faust std::string actual = selected_impl->name;
228*c217d954SCole Faust
229*c217d954SCole Faust ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
230*c217d954SCole Faust }
231*c217d954SCole Faust
232*c217d954SCole Faust DATA_TEST_CASE(KernelSelectionSrcFP32, framework::DatasetMode::ALL,
233*c217d954SCole Faust combine(framework::dataset::make("CpuExt", std::string("NEON")),
234*c217d954SCole Faust framework::dataset::make("DataType",
235*c217d954SCole Faust {
236*c217d954SCole Faust DataType::F16,
237*c217d954SCole Faust DataType::BFLOAT16,
238*c217d954SCole Faust })),
239*c217d954SCole Faust cpu_ext, data_type)
240*c217d954SCole Faust {
241*c217d954SCole Faust using namespace cpu::kernels;
242*c217d954SCole Faust
243*c217d954SCole Faust cpuinfo::CpuIsaInfo cpu_isa{};
244*c217d954SCole Faust cpu_isa.neon = (cpu_ext == "NEON");
245*c217d954SCole Faust cpu_isa.fp16 = (data_type == DataType::F16);
246*c217d954SCole Faust cpu_isa.bf16 = (data_type == DataType::BFLOAT16);
247*c217d954SCole Faust
248*c217d954SCole Faust const auto *selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ DataType::F32, data_type, cpu_isa }, cpu::KernelSelectionType::Preferred);
249*c217d954SCole Faust
250*c217d954SCole Faust ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);
251*c217d954SCole Faust
252*c217d954SCole Faust std::string expected = lower_string(cpu_ext) + "_fp32_to_" + cpu_impl_dt(data_type) + "_cast";
253*c217d954SCole Faust std::string actual = selected_impl->name;
254*c217d954SCole Faust
255*c217d954SCole Faust ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
256*c217d954SCole Faust }
257*c217d954SCole Faust
258*c217d954SCole Faust TEST_SUITE_END() // Cast
259*c217d954SCole Faust TEST_SUITE_END() // Neon
260*c217d954SCole Faust } // namespace validation
261*c217d954SCole Faust } // namespace test
262*c217d954SCole Faust } // namespace arm_compute
263