xref: /aosp_15_r20/external/armnn/src/backends/cl/workloads/ClArgMinMaxWorkload.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1 //
2 // Copyright © 2019 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "ClArgMinMaxWorkload.hpp"
7 #include "ClWorkloadUtils.hpp"
8 
9 #include <aclCommon/ArmComputeTensorUtils.hpp>
10 
11 #include <armnn/backends/TensorHandle.hpp>
12 
13 #include <armnnUtils/TensorUtils.hpp>
14 #include <armnn/utility/NumericCast.hpp>
15 
16 #include <cl/ClTensorHandle.hpp>
17 #include <cl/ClLayerSupport.hpp>
18 
19 namespace
20 {
CalcAclAxis(unsigned int numDimensions,unsigned int axisIndex)21 unsigned int CalcAclAxis(unsigned int numDimensions, unsigned int axisIndex)
22 {
23     return (numDimensions - axisIndex) - 1;
24 }
25 
26 } //namespace
27 
28 namespace armnn
29 {
30 
ClArgMinMaxWorkloadValidate(const TensorInfo & input,const TensorInfo & output,const ArgMinMaxDescriptor & descriptor)31 arm_compute::Status ClArgMinMaxWorkloadValidate(const TensorInfo& input,
32                                                 const TensorInfo& output,
33                                                 const ArgMinMaxDescriptor& descriptor)
34 {
35     const arm_compute::TensorInfo aclInput = armcomputetensorutils::BuildArmComputeTensorInfo(input);
36     const arm_compute::TensorInfo aclOutput = armcomputetensorutils::BuildArmComputeTensorInfo(output);
37 
38     auto numDims = input.GetNumDimensions();
39     auto unsignedAxis = armnnUtils::GetUnsignedAxis(numDims, descriptor.m_Axis);
40     int aclAxis = armnn::numeric_cast<int>(CalcAclAxis(numDims, unsignedAxis));
41 
42     if (descriptor.m_Function == ArgMinMaxFunction::Max)
43     {
44         return arm_compute::CLArgMinMaxLayer::validate(&aclInput, aclAxis, &aclOutput,
45                                                        arm_compute::ReductionOperation::ARG_IDX_MAX);
46     }
47     else
48     {
49         return arm_compute::CLArgMinMaxLayer::validate(&aclInput, aclAxis, &aclOutput,
50                                                        arm_compute::ReductionOperation::ARG_IDX_MIN);
51     }
52 }
53 
54 
ClArgMinMaxWorkload(const ArgMinMaxQueueDescriptor & descriptor,const WorkloadInfo & info,const arm_compute::CLCompileContext & clCompileContext)55 ClArgMinMaxWorkload::ClArgMinMaxWorkload(const ArgMinMaxQueueDescriptor& descriptor,
56                                          const WorkloadInfo& info,
57                                          const arm_compute::CLCompileContext& clCompileContext)
58         : ClBaseWorkload<ArgMinMaxQueueDescriptor>(descriptor, info)
59 {
60     // Report Profiling Details
61     ARMNN_REPORT_PROFILING_WORKLOAD_DESC("ClArgMinMaxWorkload_Construct",
62                                          descriptor.m_Parameters,
63                                          info,
64                                          this->GetGuid());
65 
66     arm_compute::ICLTensor& input = static_cast<IClTensorHandle*>(this->m_Data.m_Inputs[0])->GetTensor();
67     arm_compute::ICLTensor& output = static_cast<IClTensorHandle*>(this->m_Data.m_Outputs[0])->GetTensor();
68 
69     auto numDims = info.m_InputTensorInfos[0].GetNumDimensions();
70     auto unsignedAxis = armnnUtils::GetUnsignedAxis(numDims, m_Data.m_Parameters.m_Axis);
71     int aclAxis = armnn::numeric_cast<int>(CalcAclAxis(numDims, unsignedAxis));
72 
73     {
74         ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "ClArgMinMaxWorkload_configure");
75         if (m_Data.m_Parameters.m_Function == ArgMinMaxFunction::Max)
76         {
77             m_ArgMinMaxLayer.configure(clCompileContext,
78                                        &input,
79                                        aclAxis,
80                                        &output,
81                                        arm_compute::ReductionOperation::ARG_IDX_MAX);
82         }
83         else
84         {
85             m_ArgMinMaxLayer.configure(clCompileContext,
86                                        &input,
87                                        aclAxis,
88                                        &output,
89                                        arm_compute::ReductionOperation::ARG_IDX_MIN);
90         }
91     }
92 }
93 
Execute() const94 void ClArgMinMaxWorkload::Execute() const
95 {
96     ARMNN_SCOPED_PROFILING_EVENT_CL_GUID("ClArgMinMaxWorkload_Execute", this->GetGuid());
97     RunClFunction(m_ArgMinMaxLayer, CHECK_LOCATION());
98 }
99 
100 } //namespace armnn
101 
102