xref: /aosp_15_r20/external/armnn/src/backends/neon/workloads/NeonMaximumWorkload.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1 //
2 // Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "NeonMaximumWorkload.hpp"
7 #include <aclCommon/ArmComputeTensorUtils.hpp>
8 #include <armnn/utility/PolymorphicDowncast.hpp>
9 #include <armnn/backends/TensorHandle.hpp>
10 
11 namespace armnn
12 {
13 
NeonMaximumWorkloadValidate(const TensorInfo & input0,const TensorInfo & input1,const TensorInfo & output)14 arm_compute::Status NeonMaximumWorkloadValidate(const TensorInfo& input0,
15                                                 const TensorInfo& input1,
16                                                 const TensorInfo& output)
17 {
18     const arm_compute::TensorInfo aclInput0 = armcomputetensorutils::BuildArmComputeTensorInfo(input0);
19     const arm_compute::TensorInfo aclInput1 = armcomputetensorutils::BuildArmComputeTensorInfo(input1);
20     const arm_compute::TensorInfo aclOutput = armcomputetensorutils::BuildArmComputeTensorInfo(output);
21 
22     return arm_compute::NEElementwiseMax::validate(&aclInput0,
23                                                    &aclInput1,
24                                                    &aclOutput);
25 }
26 
NeonMaximumWorkload(const MaximumQueueDescriptor & descriptor,const WorkloadInfo & info)27 NeonMaximumWorkload::NeonMaximumWorkload(const MaximumQueueDescriptor& descriptor,
28                                          const WorkloadInfo& info)
29     : NeonBaseWorkload<MaximumQueueDescriptor>(descriptor, info)
30 {
31     m_Data.ValidateInputsOutputs("NeonMaximumWorkload", 2, 1);
32 
33     arm_compute::ITensor& input0 = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
34     arm_compute::ITensor& input1 = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
35     arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
36 
37     m_MaxLayer.configure(&input0, &input1, &output);
38 }
39 
Execute() const40 void NeonMaximumWorkload::Execute() const
41 {
42     ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonMaximumWorkload_Execute", this->GetGuid());
43     m_MaxLayer.run();
44 }
45 
46 } //namespace armnn
47