1 //
2 // Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5
6 #include "NeonMaximumWorkload.hpp"
7 #include <aclCommon/ArmComputeTensorUtils.hpp>
8 #include <armnn/utility/PolymorphicDowncast.hpp>
9 #include <armnn/backends/TensorHandle.hpp>
10
11 namespace armnn
12 {
13
NeonMaximumWorkloadValidate(const TensorInfo & input0,const TensorInfo & input1,const TensorInfo & output)14 arm_compute::Status NeonMaximumWorkloadValidate(const TensorInfo& input0,
15 const TensorInfo& input1,
16 const TensorInfo& output)
17 {
18 const arm_compute::TensorInfo aclInput0 = armcomputetensorutils::BuildArmComputeTensorInfo(input0);
19 const arm_compute::TensorInfo aclInput1 = armcomputetensorutils::BuildArmComputeTensorInfo(input1);
20 const arm_compute::TensorInfo aclOutput = armcomputetensorutils::BuildArmComputeTensorInfo(output);
21
22 return arm_compute::NEElementwiseMax::validate(&aclInput0,
23 &aclInput1,
24 &aclOutput);
25 }
26
NeonMaximumWorkload(const MaximumQueueDescriptor & descriptor,const WorkloadInfo & info)27 NeonMaximumWorkload::NeonMaximumWorkload(const MaximumQueueDescriptor& descriptor,
28 const WorkloadInfo& info)
29 : NeonBaseWorkload<MaximumQueueDescriptor>(descriptor, info)
30 {
31 m_Data.ValidateInputsOutputs("NeonMaximumWorkload", 2, 1);
32
33 arm_compute::ITensor& input0 = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
34 arm_compute::ITensor& input1 = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
35 arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
36
37 m_MaxLayer.configure(&input0, &input1, &output);
38 }
39
Execute() const40 void NeonMaximumWorkload::Execute() const
41 {
42 ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonMaximumWorkload_Execute", this->GetGuid());
43 m_MaxLayer.run();
44 }
45
46 } //namespace armnn
47