xref: /aosp_15_r20/external/armnn/src/backends/cl/OpenClTimer.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1*89c4ff92SAndroid Build Coastguard Worker //
2*89c4ff92SAndroid Build Coastguard Worker // Copyright © 2017 Arm Ltd. All rights reserved.
3*89c4ff92SAndroid Build Coastguard Worker // SPDX-License-Identifier: MIT
4*89c4ff92SAndroid Build Coastguard Worker //
5*89c4ff92SAndroid Build Coastguard Worker 
6*89c4ff92SAndroid Build Coastguard Worker #include "OpenClTimer.hpp"
7*89c4ff92SAndroid Build Coastguard Worker 
8*89c4ff92SAndroid Build Coastguard Worker #include <armnn/utility/IgnoreUnused.hpp>
9*89c4ff92SAndroid Build Coastguard Worker 
10*89c4ff92SAndroid Build Coastguard Worker #include <string>
11*89c4ff92SAndroid Build Coastguard Worker #include <sstream>
12*89c4ff92SAndroid Build Coastguard Worker 
13*89c4ff92SAndroid Build Coastguard Worker 
14*89c4ff92SAndroid Build Coastguard Worker namespace armnn
15*89c4ff92SAndroid Build Coastguard Worker {
16*89c4ff92SAndroid Build Coastguard Worker 
OpenClTimer()17*89c4ff92SAndroid Build Coastguard Worker OpenClTimer::OpenClTimer()
18*89c4ff92SAndroid Build Coastguard Worker {
19*89c4ff92SAndroid Build Coastguard Worker }
20*89c4ff92SAndroid Build Coastguard Worker 
Start()21*89c4ff92SAndroid Build Coastguard Worker void OpenClTimer::Start()
22*89c4ff92SAndroid Build Coastguard Worker {
23*89c4ff92SAndroid Build Coastguard Worker     m_Kernels.clear();
24*89c4ff92SAndroid Build Coastguard Worker 
25*89c4ff92SAndroid Build Coastguard Worker     auto interceptor = [this](  cl_command_queue command_queue,
26*89c4ff92SAndroid Build Coastguard Worker                                 cl_kernel        kernel,
27*89c4ff92SAndroid Build Coastguard Worker                                 cl_uint          work_dim,
28*89c4ff92SAndroid Build Coastguard Worker                                 const size_t    *gwo,
29*89c4ff92SAndroid Build Coastguard Worker                                 const size_t    *gws,
30*89c4ff92SAndroid Build Coastguard Worker                                 const size_t    *lws,
31*89c4ff92SAndroid Build Coastguard Worker                                 cl_uint          num_events_in_wait_list,
32*89c4ff92SAndroid Build Coastguard Worker                                 const cl_event * event_wait_list,
33*89c4ff92SAndroid Build Coastguard Worker                                 cl_event *       event)
34*89c4ff92SAndroid Build Coastguard Worker         {
35*89c4ff92SAndroid Build Coastguard Worker             IgnoreUnused(event);
36*89c4ff92SAndroid Build Coastguard Worker             cl_int retVal = 0;
37*89c4ff92SAndroid Build Coastguard Worker 
38*89c4ff92SAndroid Build Coastguard Worker             // Get the name of the kernel
39*89c4ff92SAndroid Build Coastguard Worker             cl::Kernel retainedKernel(kernel, true);
40*89c4ff92SAndroid Build Coastguard Worker             std::stringstream ss;
41*89c4ff92SAndroid Build Coastguard Worker             ss << retainedKernel.getInfo<CL_KERNEL_FUNCTION_NAME>();
42*89c4ff92SAndroid Build Coastguard Worker 
43*89c4ff92SAndroid Build Coastguard Worker             // Embed workgroup sizes into the name
44*89c4ff92SAndroid Build Coastguard Worker             if(gws != nullptr)
45*89c4ff92SAndroid Build Coastguard Worker             {
46*89c4ff92SAndroid Build Coastguard Worker                 ss << " GWS[" << gws[0] << "," << gws[1] << "," << gws[2] << "]";
47*89c4ff92SAndroid Build Coastguard Worker             }
48*89c4ff92SAndroid Build Coastguard Worker             if(lws != nullptr)
49*89c4ff92SAndroid Build Coastguard Worker             {
50*89c4ff92SAndroid Build Coastguard Worker                 ss << " LWS[" << lws[0] << "," << lws[1] << "," << lws[2] << "]";
51*89c4ff92SAndroid Build Coastguard Worker             }
52*89c4ff92SAndroid Build Coastguard Worker 
53*89c4ff92SAndroid Build Coastguard Worker             cl_event customEvent;
54*89c4ff92SAndroid Build Coastguard Worker 
55*89c4ff92SAndroid Build Coastguard Worker             // Forward to original OpenCl function
56*89c4ff92SAndroid Build Coastguard Worker             retVal = m_OriginalEnqueueFunction( command_queue,
57*89c4ff92SAndroid Build Coastguard Worker                                                 kernel,
58*89c4ff92SAndroid Build Coastguard Worker                                                 work_dim,
59*89c4ff92SAndroid Build Coastguard Worker                                                 gwo,
60*89c4ff92SAndroid Build Coastguard Worker                                                 gws,
61*89c4ff92SAndroid Build Coastguard Worker                                                 lws,
62*89c4ff92SAndroid Build Coastguard Worker                                                 num_events_in_wait_list,
63*89c4ff92SAndroid Build Coastguard Worker                                                 event_wait_list,
64*89c4ff92SAndroid Build Coastguard Worker                                                 &customEvent);
65*89c4ff92SAndroid Build Coastguard Worker 
66*89c4ff92SAndroid Build Coastguard Worker             // Store the Kernel info for later GetMeasurements() call
67*89c4ff92SAndroid Build Coastguard Worker             m_Kernels.emplace_back(ss.str(), customEvent);
68*89c4ff92SAndroid Build Coastguard Worker 
69*89c4ff92SAndroid Build Coastguard Worker             if(event != nullptr)
70*89c4ff92SAndroid Build Coastguard Worker             {
71*89c4ff92SAndroid Build Coastguard Worker                 //return cl_event from the intercepted call
72*89c4ff92SAndroid Build Coastguard Worker                 clRetainEvent(customEvent);
73*89c4ff92SAndroid Build Coastguard Worker                 *event = customEvent;
74*89c4ff92SAndroid Build Coastguard Worker             }
75*89c4ff92SAndroid Build Coastguard Worker 
76*89c4ff92SAndroid Build Coastguard Worker             return retVal;
77*89c4ff92SAndroid Build Coastguard Worker         };
78*89c4ff92SAndroid Build Coastguard Worker 
79*89c4ff92SAndroid Build Coastguard Worker     m_OriginalEnqueueFunction = CLSymbols::get().clEnqueueNDRangeKernel_ptr;
80*89c4ff92SAndroid Build Coastguard Worker     CLSymbols::get().clEnqueueNDRangeKernel_ptr = interceptor;
81*89c4ff92SAndroid Build Coastguard Worker }
82*89c4ff92SAndroid Build Coastguard Worker 
Stop()83*89c4ff92SAndroid Build Coastguard Worker void OpenClTimer::Stop()
84*89c4ff92SAndroid Build Coastguard Worker {
85*89c4ff92SAndroid Build Coastguard Worker     CLSymbols::get().clEnqueueNDRangeKernel_ptr = m_OriginalEnqueueFunction;
86*89c4ff92SAndroid Build Coastguard Worker }
87*89c4ff92SAndroid Build Coastguard Worker 
HasKernelMeasurements() const88*89c4ff92SAndroid Build Coastguard Worker bool OpenClTimer::HasKernelMeasurements() const
89*89c4ff92SAndroid Build Coastguard Worker {
90*89c4ff92SAndroid Build Coastguard Worker     return m_Kernels.size() > 0;
91*89c4ff92SAndroid Build Coastguard Worker }
92*89c4ff92SAndroid Build Coastguard Worker 
GetMeasurements() const93*89c4ff92SAndroid Build Coastguard Worker std::vector<Measurement> OpenClTimer::GetMeasurements() const
94*89c4ff92SAndroid Build Coastguard Worker {
95*89c4ff92SAndroid Build Coastguard Worker     std::vector<Measurement> measurements;
96*89c4ff92SAndroid Build Coastguard Worker 
97*89c4ff92SAndroid Build Coastguard Worker     cl_command_queue_properties clQueueProperties = CLScheduler::get().queue().getInfo<CL_QUEUE_PROPERTIES>();
98*89c4ff92SAndroid Build Coastguard Worker 
99*89c4ff92SAndroid Build Coastguard Worker     int idx = 0;
100*89c4ff92SAndroid Build Coastguard Worker     for (auto& kernel : m_Kernels)
101*89c4ff92SAndroid Build Coastguard Worker     {
102*89c4ff92SAndroid Build Coastguard Worker         std::string name = std::string(this->GetName()) + "/" + std::to_string(idx++) + ": " + kernel.m_Name;
103*89c4ff92SAndroid Build Coastguard Worker 
104*89c4ff92SAndroid Build Coastguard Worker         double timeUs = 0.0;
105*89c4ff92SAndroid Build Coastguard Worker         if((clQueueProperties & CL_QUEUE_PROFILING_ENABLE) != 0)
106*89c4ff92SAndroid Build Coastguard Worker         {
107*89c4ff92SAndroid Build Coastguard Worker             // Wait for the event to finish before accessing profile results.
108*89c4ff92SAndroid Build Coastguard Worker             kernel.m_Event.wait();
109*89c4ff92SAndroid Build Coastguard Worker 
110*89c4ff92SAndroid Build Coastguard Worker             cl_ulong start = kernel.m_Event.getProfilingInfo<CL_PROFILING_COMMAND_START>();
111*89c4ff92SAndroid Build Coastguard Worker             cl_ulong end   = kernel.m_Event.getProfilingInfo<CL_PROFILING_COMMAND_END>();
112*89c4ff92SAndroid Build Coastguard Worker             timeUs = static_cast<double>(end - start) / 1000.0;
113*89c4ff92SAndroid Build Coastguard Worker         }
114*89c4ff92SAndroid Build Coastguard Worker 
115*89c4ff92SAndroid Build Coastguard Worker         measurements.emplace_back(name, timeUs, Measurement::Unit::TIME_US);
116*89c4ff92SAndroid Build Coastguard Worker     }
117*89c4ff92SAndroid Build Coastguard Worker 
118*89c4ff92SAndroid Build Coastguard Worker     return measurements;
119*89c4ff92SAndroid Build Coastguard Worker }
120*89c4ff92SAndroid Build Coastguard Worker 
121*89c4ff92SAndroid Build Coastguard Worker } //namespace armnn
122