xref: /aosp_15_r20/external/armnn/src/backends/neon/workloads/NeonDivisionWorkload.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1 //
2 // Copyright © 2020 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "NeonDivisionWorkload.hpp"
7 
8 #include <aclCommon/ArmComputeTensorUtils.hpp>
9 #include <aclCommon/ArmComputeUtils.hpp>
10 
11 #include <armnn/utility/PolymorphicDowncast.hpp>
12 
13 #include <armnn/backends/TensorHandle.hpp>
14 
15 namespace armnn
16 {
17 
NeonDivisionWorkloadValidate(const TensorInfo & input0,const TensorInfo & input1,const TensorInfo & output,const ActivationDescriptor * activationDescriptor)18 arm_compute::Status NeonDivisionWorkloadValidate(const TensorInfo& input0,
19                                                  const TensorInfo& input1,
20                                                  const TensorInfo& output,
21                                                  const ActivationDescriptor* activationDescriptor)
22 {
23     const arm_compute::TensorInfo aclInput0 = armcomputetensorutils::BuildArmComputeTensorInfo(input0);
24     const arm_compute::TensorInfo aclInput1 = armcomputetensorutils::BuildArmComputeTensorInfo(input1);
25     const arm_compute::TensorInfo aclOutput = armcomputetensorutils::BuildArmComputeTensorInfo(output);
26 
27     const arm_compute::ActivationLayerInfo activationInfo = ConvertActivationDescriptorToAclActivationLayerInfo(
28             activationDescriptor);
29 
30     return arm_compute::NEElementwiseDivision::validate(&aclInput0,
31                                                         &aclInput1,
32                                                         &aclOutput,
33                                                         activationInfo);
34 }
35 
NeonDivisionWorkload(const DivisionQueueDescriptor & descriptor,const WorkloadInfo & info)36 NeonDivisionWorkload::NeonDivisionWorkload(const DivisionQueueDescriptor& descriptor,
37                                          const WorkloadInfo& info)
38     : NeonBaseWorkload<DivisionQueueDescriptor>(descriptor, info)
39 {
40     m_Data.ValidateInputsOutputs("NeonDivisionWorkload", 2, 1);
41 
42     arm_compute::ITensor& input0 = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
43     arm_compute::ITensor& input1 = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
44     arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
45 
46     const arm_compute::ActivationLayerInfo activationInfo = ConvertAdditionalInfoToAclActivationLayerInfo(descriptor);
47 
48     m_DivLayer.configure(&input0, &input1, &output, activationInfo);
49 }
50 
Execute() const51 void NeonDivisionWorkload::Execute() const
52 {
53     ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonDivisionWorkload_Execute", this->GetGuid());
54     m_DivLayer.run();
55 }
56 
57 } //namespace armnn
58