xref: /aosp_15_r20/external/armnn/src/backends/reference/workloads/RefTransposeWorkload.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1 //
2 // Copyright © 2022 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "RefTransposeWorkload.hpp"
7 #include "RefWorkloadUtils.hpp"
8 
9 #include <armnnUtils/Transpose.hpp>
10 
11 #include <ResolveType.hpp>
12 
13 namespace armnn
14 {
15 
16 template <armnn::DataType DataType>
Execute() const17 void RefTransposeWorkload<DataType>::Execute() const
18 {
19     Execute(m_Data.m_Inputs, m_Data.m_Outputs);
20 }
21 
22 template <armnn::DataType DataType>
ExecuteAsync(ExecutionData & executionData)23 void RefTransposeWorkload<DataType>::ExecuteAsync(ExecutionData& executionData)
24 {
25     WorkingMemDescriptor* workingMemDescriptor = static_cast<WorkingMemDescriptor*>(executionData.m_Data);
26     Execute(workingMemDescriptor->m_Inputs, workingMemDescriptor->m_Outputs);
27 }
28 
29 template <armnn::DataType DataType>
Execute(std::vector<ITensorHandle * > inputs,std::vector<ITensorHandle * > outputs) const30 void RefTransposeWorkload<DataType>::Execute(std::vector<ITensorHandle*> inputs,
31                                              std::vector<ITensorHandle*> outputs) const
32 {
33     using T = ResolveType<DataType>;
34 
35     ARMNN_SCOPED_PROFILING_EVENT(Compute::CpuRef, GetName() + "_Execute");
36 
37     const ITensorHandle*     src      = inputs[0];
38     ITensorHandle*           dst      = outputs[0];
39     const PermutationVector& mappings = m_Data.m_Parameters.m_DimMappings;
40 
41     armnnUtils::Transpose(GetTensorInfo(src).GetShape(), mappings, src->Map(), dst->Map(), sizeof(T));
42 }
43 
44 template class RefTransposeWorkload<DataType::BFloat16>;
45 template class RefTransposeWorkload<DataType::Float16>;
46 template class RefTransposeWorkload<DataType::Float32>;
47 template class RefTransposeWorkload<DataType::QAsymmS8>;
48 template class RefTransposeWorkload<DataType::QAsymmU8>;
49 template class RefTransposeWorkload<DataType::QSymmS16>;
50 
51 } //namespace armnn
52