xref: /aosp_15_r20/external/armnn/src/backends/cl/workloads/ClDepthToSpaceWorkload.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1 //
2 // Copyright © 2019 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "ClDepthToSpaceWorkload.hpp"
7 
8 #include "ClWorkloadUtils.hpp"
9 
10 #include <aclCommon/ArmComputeTensorUtils.hpp>
11 
12 #include <armnn/utility/NumericCast.hpp>
13 #include <armnn/utility/PolymorphicDowncast.hpp>
14 
15 #include <cl/ClTensorHandle.hpp>
16 
17 namespace armnn
18 {
19 
20 using namespace armcomputetensorutils;
21 
ClDepthToSpaceWorkloadValidate(const TensorInfo & input,const TensorInfo & output,const DepthToSpaceDescriptor & descriptor)22 arm_compute::Status ClDepthToSpaceWorkloadValidate(const TensorInfo& input,
23                                                    const TensorInfo& output,
24                                                    const DepthToSpaceDescriptor& descriptor)
25 {
26     DataLayout dataLayout = descriptor.m_DataLayout;
27     const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input, dataLayout);
28 
29     int32_t blockSize = armnn::numeric_cast<int32_t>(descriptor.m_BlockSize);
30 
31     const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output, dataLayout);
32 
33     const arm_compute::Status aclStatus = arm_compute::CLDepthToSpaceLayer::validate(&aclInputInfo,
34                                                                                      &aclOutputInfo,
35                                                                                      blockSize);
36     return aclStatus;
37 }
38 
ClDepthToSpaceWorkload(const DepthToSpaceQueueDescriptor & descriptor,const WorkloadInfo & info,const arm_compute::CLCompileContext & clCompileContext)39 ClDepthToSpaceWorkload::ClDepthToSpaceWorkload(const DepthToSpaceQueueDescriptor& descriptor,
40                                                const WorkloadInfo& info,
41                                                const arm_compute::CLCompileContext& clCompileContext)
42     : ClBaseWorkload<DepthToSpaceQueueDescriptor>(descriptor, info)
43 {
44     // Report Profiling Details
45     ARMNN_REPORT_PROFILING_WORKLOAD_DESC("ClDepthToSpaceWorkload_Construct",
46                                          descriptor.m_Parameters,
47                                          info,
48                                          this->GetGuid());
49 
50     m_Data.ValidateInputsOutputs("ClDepthToSpaceWorkload", 1, 1);
51 
52     arm_compute::DataLayout aclDataLayout = ConvertDataLayout(m_Data.m_Parameters.m_DataLayout);
53 
54     arm_compute::ICLTensor& input =
55         PolymorphicPointerDowncast<IClTensorHandle>(m_Data.m_Inputs[0])->GetTensor();
56     input.info()->set_data_layout(aclDataLayout);
57 
58     int32_t blockSize = armnn::numeric_cast<int32_t>(descriptor.m_Parameters.m_BlockSize);
59 
60     arm_compute::ICLTensor& output =
61         PolymorphicPointerDowncast<IClTensorHandle>(m_Data.m_Outputs[0])->GetTensor();
62     output.info()->set_data_layout(aclDataLayout);
63 
64     {
65         ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "ClDepthToSpaceWorkload_configure");
66         m_Layer.configure(clCompileContext, &input, &output, blockSize);
67     }
68 }
69 
Execute() const70 void ClDepthToSpaceWorkload::Execute() const
71 {
72     ARMNN_SCOPED_PROFILING_EVENT_CL_GUID("ClDepthToSpaceWorkload_Execute", this->GetGuid());
73     RunClFunction(m_Layer, CHECK_LOCATION());
74 }
75 
76 } // namespace armnn
77