xref: /aosp_15_r20/external/armnn/src/backends/neon/workloads/NeonMinimumWorkload.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1 //
2 // Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "NeonMinimumWorkload.hpp"
7 
8 #include <aclCommon/ArmComputeTensorUtils.hpp>
9 #include <armnn/utility/PolymorphicDowncast.hpp>
10 #include <armnn/backends/TensorHandle.hpp>
11 
12 namespace armnn
13 {
14 
NeonMinimumWorkloadValidate(const TensorInfo & input0,const TensorInfo & input1,const TensorInfo & output)15 arm_compute::Status NeonMinimumWorkloadValidate(const TensorInfo& input0,
16                                                 const TensorInfo& input1,
17                                                 const TensorInfo& output)
18 {
19     const arm_compute::TensorInfo aclInput0 = armcomputetensorutils::BuildArmComputeTensorInfo(input0);
20     const arm_compute::TensorInfo aclInput1 = armcomputetensorutils::BuildArmComputeTensorInfo(input1);
21     const arm_compute::TensorInfo aclOutput = armcomputetensorutils::BuildArmComputeTensorInfo(output);
22 
23     return arm_compute::NEElementwiseMin::validate(&aclInput0,
24                                                    &aclInput1,
25                                                    &aclOutput);
26 }
27 
NeonMinimumWorkload(const MinimumQueueDescriptor & descriptor,const WorkloadInfo & info)28 NeonMinimumWorkload::NeonMinimumWorkload(const MinimumQueueDescriptor& descriptor,
29                                          const WorkloadInfo& info)
30     : NeonBaseWorkload<MinimumQueueDescriptor>(descriptor, info)
31 {
32     m_Data.ValidateInputsOutputs("NeonMinimumWorkload", 2, 1);
33 
34     arm_compute::ITensor& input0 = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
35     arm_compute::ITensor& input1 = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
36     arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
37 
38     m_MinLayer.configure(&input0, &input1, &output);
39 }
40 
Execute() const41 void NeonMinimumWorkload::Execute() const
42 {
43     ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonMinimumWorkload_Execute", this->GetGuid());
44     m_MinLayer.run();
45 }
46 
47 } //namespace armnn
48