xref: /aosp_15_r20/external/armnn/src/backends/neon/workloads/NeonDepthToSpaceWorkload.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1 //
2 // Copyright © 2019 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "NeonDepthToSpaceWorkload.hpp"
7 
8 #include "NeonWorkloadUtils.hpp"
9 
10 #include <aclCommon/ArmComputeTensorUtils.hpp>
11 #include <armnn/utility/NumericCast.hpp>
12 #include <armnn/utility/PolymorphicDowncast.hpp>
13 
14 namespace armnn
15 {
16 
17 using namespace armcomputetensorutils;
18 
NeonDepthToSpaceWorkloadValidate(const TensorInfo & input,const TensorInfo & output,const DepthToSpaceDescriptor & descriptor)19 arm_compute::Status NeonDepthToSpaceWorkloadValidate(const TensorInfo& input,
20                                                      const TensorInfo& output,
21                                                      const DepthToSpaceDescriptor& descriptor)
22 {
23     DataLayout dataLayout = descriptor.m_DataLayout;
24     const arm_compute::TensorInfo aclInput = BuildArmComputeTensorInfo(input, dataLayout);
25     const arm_compute::TensorInfo aclOutput = BuildArmComputeTensorInfo(output, dataLayout);
26 
27     int32_t blockSize = armnn::numeric_cast<int32_t>(descriptor.m_BlockSize);
28 
29     return arm_compute::NEDepthToSpaceLayer::validate(&aclInput, &aclOutput, blockSize);
30 }
31 
NeonDepthToSpaceWorkload(const DepthToSpaceQueueDescriptor & descriptor,const WorkloadInfo & info)32 NeonDepthToSpaceWorkload::NeonDepthToSpaceWorkload(const DepthToSpaceQueueDescriptor& descriptor,
33                                                    const WorkloadInfo& info)
34     : NeonBaseWorkload<DepthToSpaceQueueDescriptor>(descriptor, info)
35 {
36     // Report Profiling Details
37     ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonDepthToSpaceWorkload_Construct",
38                                          descriptor.m_Parameters,
39                                          info,
40                                          this->GetGuid());
41 
42     m_Data.ValidateInputsOutputs("NeonDepthToSpaceWorkload", 1, 1);
43 
44     arm_compute::DataLayout aclDataLayout = ConvertDataLayout(m_Data.m_Parameters.m_DataLayout);
45 
46     arm_compute::ITensor& input =
47             PolymorphicPointerDowncast<IAclTensorHandle>(m_Data.m_Inputs[0])->GetTensor();
48     input.info()->set_data_layout(aclDataLayout);
49 
50     int32_t blockSize = armnn::numeric_cast<int32_t>(descriptor.m_Parameters.m_BlockSize);
51 
52     arm_compute::ITensor& output =
53             PolymorphicPointerDowncast<IAclTensorHandle>(m_Data.m_Outputs[0])->GetTensor();
54     output.info()->set_data_layout(aclDataLayout);
55 
56     m_Layer.configure(&input, &output, blockSize);
57     m_Layer.prepare();
58 }
59 
Execute() const60 void NeonDepthToSpaceWorkload::Execute() const
61 {
62     ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonDepthToSpaceWorkload_Execute", this->GetGuid());
63     m_Layer.run();
64 }
65 
66 } // namespace armnn
67