1*89c4ff92SAndroid Build Coastguard Worker //
2*89c4ff92SAndroid Build Coastguard Worker // Copyright © 2017 Arm Ltd. All rights reserved.
3*89c4ff92SAndroid Build Coastguard Worker // SPDX-License-Identifier: MIT
4*89c4ff92SAndroid Build Coastguard Worker //
5*89c4ff92SAndroid Build Coastguard Worker
6*89c4ff92SAndroid Build Coastguard Worker #include "OpenClTimer.hpp"
7*89c4ff92SAndroid Build Coastguard Worker
8*89c4ff92SAndroid Build Coastguard Worker #include <armnn/utility/IgnoreUnused.hpp>
9*89c4ff92SAndroid Build Coastguard Worker
10*89c4ff92SAndroid Build Coastguard Worker #include <string>
11*89c4ff92SAndroid Build Coastguard Worker #include <sstream>
12*89c4ff92SAndroid Build Coastguard Worker
13*89c4ff92SAndroid Build Coastguard Worker
14*89c4ff92SAndroid Build Coastguard Worker namespace armnn
15*89c4ff92SAndroid Build Coastguard Worker {
16*89c4ff92SAndroid Build Coastguard Worker
OpenClTimer()17*89c4ff92SAndroid Build Coastguard Worker OpenClTimer::OpenClTimer()
18*89c4ff92SAndroid Build Coastguard Worker {
19*89c4ff92SAndroid Build Coastguard Worker }
20*89c4ff92SAndroid Build Coastguard Worker
Start()21*89c4ff92SAndroid Build Coastguard Worker void OpenClTimer::Start()
22*89c4ff92SAndroid Build Coastguard Worker {
23*89c4ff92SAndroid Build Coastguard Worker m_Kernels.clear();
24*89c4ff92SAndroid Build Coastguard Worker
25*89c4ff92SAndroid Build Coastguard Worker auto interceptor = [this]( cl_command_queue command_queue,
26*89c4ff92SAndroid Build Coastguard Worker cl_kernel kernel,
27*89c4ff92SAndroid Build Coastguard Worker cl_uint work_dim,
28*89c4ff92SAndroid Build Coastguard Worker const size_t *gwo,
29*89c4ff92SAndroid Build Coastguard Worker const size_t *gws,
30*89c4ff92SAndroid Build Coastguard Worker const size_t *lws,
31*89c4ff92SAndroid Build Coastguard Worker cl_uint num_events_in_wait_list,
32*89c4ff92SAndroid Build Coastguard Worker const cl_event * event_wait_list,
33*89c4ff92SAndroid Build Coastguard Worker cl_event * event)
34*89c4ff92SAndroid Build Coastguard Worker {
35*89c4ff92SAndroid Build Coastguard Worker IgnoreUnused(event);
36*89c4ff92SAndroid Build Coastguard Worker cl_int retVal = 0;
37*89c4ff92SAndroid Build Coastguard Worker
38*89c4ff92SAndroid Build Coastguard Worker // Get the name of the kernel
39*89c4ff92SAndroid Build Coastguard Worker cl::Kernel retainedKernel(kernel, true);
40*89c4ff92SAndroid Build Coastguard Worker std::stringstream ss;
41*89c4ff92SAndroid Build Coastguard Worker ss << retainedKernel.getInfo<CL_KERNEL_FUNCTION_NAME>();
42*89c4ff92SAndroid Build Coastguard Worker
43*89c4ff92SAndroid Build Coastguard Worker // Embed workgroup sizes into the name
44*89c4ff92SAndroid Build Coastguard Worker if(gws != nullptr)
45*89c4ff92SAndroid Build Coastguard Worker {
46*89c4ff92SAndroid Build Coastguard Worker ss << " GWS[" << gws[0] << "," << gws[1] << "," << gws[2] << "]";
47*89c4ff92SAndroid Build Coastguard Worker }
48*89c4ff92SAndroid Build Coastguard Worker if(lws != nullptr)
49*89c4ff92SAndroid Build Coastguard Worker {
50*89c4ff92SAndroid Build Coastguard Worker ss << " LWS[" << lws[0] << "," << lws[1] << "," << lws[2] << "]";
51*89c4ff92SAndroid Build Coastguard Worker }
52*89c4ff92SAndroid Build Coastguard Worker
53*89c4ff92SAndroid Build Coastguard Worker cl_event customEvent;
54*89c4ff92SAndroid Build Coastguard Worker
55*89c4ff92SAndroid Build Coastguard Worker // Forward to original OpenCl function
56*89c4ff92SAndroid Build Coastguard Worker retVal = m_OriginalEnqueueFunction( command_queue,
57*89c4ff92SAndroid Build Coastguard Worker kernel,
58*89c4ff92SAndroid Build Coastguard Worker work_dim,
59*89c4ff92SAndroid Build Coastguard Worker gwo,
60*89c4ff92SAndroid Build Coastguard Worker gws,
61*89c4ff92SAndroid Build Coastguard Worker lws,
62*89c4ff92SAndroid Build Coastguard Worker num_events_in_wait_list,
63*89c4ff92SAndroid Build Coastguard Worker event_wait_list,
64*89c4ff92SAndroid Build Coastguard Worker &customEvent);
65*89c4ff92SAndroid Build Coastguard Worker
66*89c4ff92SAndroid Build Coastguard Worker // Store the Kernel info for later GetMeasurements() call
67*89c4ff92SAndroid Build Coastguard Worker m_Kernels.emplace_back(ss.str(), customEvent);
68*89c4ff92SAndroid Build Coastguard Worker
69*89c4ff92SAndroid Build Coastguard Worker if(event != nullptr)
70*89c4ff92SAndroid Build Coastguard Worker {
71*89c4ff92SAndroid Build Coastguard Worker //return cl_event from the intercepted call
72*89c4ff92SAndroid Build Coastguard Worker clRetainEvent(customEvent);
73*89c4ff92SAndroid Build Coastguard Worker *event = customEvent;
74*89c4ff92SAndroid Build Coastguard Worker }
75*89c4ff92SAndroid Build Coastguard Worker
76*89c4ff92SAndroid Build Coastguard Worker return retVal;
77*89c4ff92SAndroid Build Coastguard Worker };
78*89c4ff92SAndroid Build Coastguard Worker
79*89c4ff92SAndroid Build Coastguard Worker m_OriginalEnqueueFunction = CLSymbols::get().clEnqueueNDRangeKernel_ptr;
80*89c4ff92SAndroid Build Coastguard Worker CLSymbols::get().clEnqueueNDRangeKernel_ptr = interceptor;
81*89c4ff92SAndroid Build Coastguard Worker }
82*89c4ff92SAndroid Build Coastguard Worker
Stop()83*89c4ff92SAndroid Build Coastguard Worker void OpenClTimer::Stop()
84*89c4ff92SAndroid Build Coastguard Worker {
85*89c4ff92SAndroid Build Coastguard Worker CLSymbols::get().clEnqueueNDRangeKernel_ptr = m_OriginalEnqueueFunction;
86*89c4ff92SAndroid Build Coastguard Worker }
87*89c4ff92SAndroid Build Coastguard Worker
HasKernelMeasurements() const88*89c4ff92SAndroid Build Coastguard Worker bool OpenClTimer::HasKernelMeasurements() const
89*89c4ff92SAndroid Build Coastguard Worker {
90*89c4ff92SAndroid Build Coastguard Worker return m_Kernels.size() > 0;
91*89c4ff92SAndroid Build Coastguard Worker }
92*89c4ff92SAndroid Build Coastguard Worker
GetMeasurements() const93*89c4ff92SAndroid Build Coastguard Worker std::vector<Measurement> OpenClTimer::GetMeasurements() const
94*89c4ff92SAndroid Build Coastguard Worker {
95*89c4ff92SAndroid Build Coastguard Worker std::vector<Measurement> measurements;
96*89c4ff92SAndroid Build Coastguard Worker
97*89c4ff92SAndroid Build Coastguard Worker cl_command_queue_properties clQueueProperties = CLScheduler::get().queue().getInfo<CL_QUEUE_PROPERTIES>();
98*89c4ff92SAndroid Build Coastguard Worker
99*89c4ff92SAndroid Build Coastguard Worker int idx = 0;
100*89c4ff92SAndroid Build Coastguard Worker for (auto& kernel : m_Kernels)
101*89c4ff92SAndroid Build Coastguard Worker {
102*89c4ff92SAndroid Build Coastguard Worker std::string name = std::string(this->GetName()) + "/" + std::to_string(idx++) + ": " + kernel.m_Name;
103*89c4ff92SAndroid Build Coastguard Worker
104*89c4ff92SAndroid Build Coastguard Worker double timeUs = 0.0;
105*89c4ff92SAndroid Build Coastguard Worker if((clQueueProperties & CL_QUEUE_PROFILING_ENABLE) != 0)
106*89c4ff92SAndroid Build Coastguard Worker {
107*89c4ff92SAndroid Build Coastguard Worker // Wait for the event to finish before accessing profile results.
108*89c4ff92SAndroid Build Coastguard Worker kernel.m_Event.wait();
109*89c4ff92SAndroid Build Coastguard Worker
110*89c4ff92SAndroid Build Coastguard Worker cl_ulong start = kernel.m_Event.getProfilingInfo<CL_PROFILING_COMMAND_START>();
111*89c4ff92SAndroid Build Coastguard Worker cl_ulong end = kernel.m_Event.getProfilingInfo<CL_PROFILING_COMMAND_END>();
112*89c4ff92SAndroid Build Coastguard Worker timeUs = static_cast<double>(end - start) / 1000.0;
113*89c4ff92SAndroid Build Coastguard Worker }
114*89c4ff92SAndroid Build Coastguard Worker
115*89c4ff92SAndroid Build Coastguard Worker measurements.emplace_back(name, timeUs, Measurement::Unit::TIME_US);
116*89c4ff92SAndroid Build Coastguard Worker }
117*89c4ff92SAndroid Build Coastguard Worker
118*89c4ff92SAndroid Build Coastguard Worker return measurements;
119*89c4ff92SAndroid Build Coastguard Worker }
120*89c4ff92SAndroid Build Coastguard Worker
121*89c4ff92SAndroid Build Coastguard Worker } //namespace armnn
122