xref: /aosp_15_r20/external/OpenCL-CTS/test_conformance/device_execution/host_queue_order.cpp (revision 6467f958c7de8070b317fc65bcb0f6472e388d82)
1 //
2 // Copyright (c) 2017 The Khronos Group Inc.
3 //
4 // Licensed under the Apache License, Version 2.0 (the "License");
5 // you may not use this file except in compliance with the License.
6 // You may obtain a copy of the License at
7 //
8 //    http://www.apache.org/licenses/LICENSE-2.0
9 //
10 // Unless required by applicable law or agreed to in writing, software
11 // distributed under the License is distributed on an "AS IS" BASIS,
12 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 // See the License for the specific language governing permissions and
14 // limitations under the License.
15 //
16 #include <stdio.h>
17 #include <string.h>
18 #include "harness/testHarness.h"
19 #include "harness/typeWrappers.h"
20 
21 #include <algorithm>
22 #include <vector>
23 
24 #include "procs.h"
25 #include "utils.h"
26 #include <time.h>
27 
28 extern int gWimpyMode;
29 
30 #ifdef CL_VERSION_2_0
31 
32 static const char* enqueue_block_first_kernel[] =
33 {
34     NL, "void block_fn(uint num, __global int* res)"
35     NL, "{"
36     NL, "    size_t tid = get_global_id(0);"
37     NL, ""
38     NL, "    for(int i = 1 ; i < tid ; i++)"
39     NL, "    {"
40     NL, "      for(int j = 0 ; j < num ; j++)"
41     NL, "        atomic_add(res+tid, 1);"
42     NL, "    }"
43     NL, "}"
44     NL, ""
45     NL, "kernel void enqueue_block_first_kernel(uint num, __global int* res)"
46     NL, "{"
47     NL, "  void (^kernelBlock)(void) = ^{ block_fn(num, res); };"
48     NL, ""
49     NL, "  ndrange_t ndrange = ndrange_1D(num, 1);"
50     NL, ""
51     NL, "  int enq_res = enqueue_kernel(get_default_queue(), CLK_ENQUEUE_FLAGS_NO_WAIT, ndrange, kernelBlock);"
52     NL, "  if(enq_res != CLK_SUCCESS) { res[0] = -1; return; }"
53     NL, ""
54     NL, "}"
55     NL
56 };
57 
58 static const char* enqueue_block_second_kernel[] =
59 {
60     NL, "void block_fn(uint num, __global int* res)"
61     NL, "{"
62     NL, "    for(int i = 2 ; i < num ; i++)"
63     NL, "    {"
64     NL, "      res[i] = res[i]/num - (i-1);"
65     NL, "    }"
66     NL, "}"
67     NL, ""
68     NL, "kernel void enqueue_block_second_kernel(uint num, __global int* res)"
69     NL, "{"
70     NL, "  void (^kernelBlock)(void) = ^{ block_fn(num, res); };"
71     NL, ""
72     NL, "  ndrange_t ndrange = ndrange_1D(1);"
73     NL, ""
74     NL, "  int enq_res = enqueue_kernel(get_default_queue(), CLK_ENQUEUE_FLAGS_WAIT_KERNEL, ndrange, kernelBlock);"
75     NL, "  if(enq_res != CLK_SUCCESS) { res[0] = -1; return; }"
76     NL, ""
77     NL, "}"
78     NL
79 };
80 
check_kernel_results(cl_int * results,cl_int len)81 static int check_kernel_results(cl_int* results, cl_int len)
82 {
83     for(cl_int i = 0; i < len; ++i)
84     {
85         if(results[i] != 0) return i;
86     }
87     return -1;
88 }
89 
90 /*
91     Test checks kernel block execution order in case of two different kernels with enqueue block submitted to one ordered host queue.
92 */
test_host_queue_order(cl_device_id device,cl_context context,cl_command_queue queue,int num_elements)93 int test_host_queue_order(cl_device_id device, cl_context context, cl_command_queue queue, int num_elements)
94 {
95     cl_int k, err_ret, res = 0;
96     clCommandQueueWrapper dev_queue;
97     cl_int kernel_results[MAX_GWS] = {0};
98 
99     size_t ret_len;
100     cl_uint max_queues = 1;
101     cl_uint maxQueueSize = 0;
102     err_ret = clGetDeviceInfo(device, CL_DEVICE_QUEUE_ON_DEVICE_MAX_SIZE, sizeof(maxQueueSize), &maxQueueSize, 0);
103     test_error(err_ret, "clGetDeviceInfo(CL_DEVICE_QUEUE_ON_DEVICE_MAX_SIZE) failed");
104 
105     err_ret = clGetDeviceInfo(device, CL_DEVICE_MAX_ON_DEVICE_QUEUES, sizeof(max_queues), &max_queues, &ret_len);
106     test_error(err_ret, "clGetDeviceInfo(CL_DEVICE_MAX_ON_DEVICE_QUEUES) failed");
107 
108     size_t max_local_size = 1;
109     err_ret = clGetDeviceInfo(device, CL_DEVICE_MAX_WORK_GROUP_SIZE, sizeof(max_local_size), &max_local_size, &ret_len);
110     test_error(err_ret, "clGetDeviceInfo(CL_DEVICE_MAX_WORK_GROUP_SIZE) failed");
111 
112     cl_queue_properties queue_prop_def[] =
113     {
114         CL_QUEUE_PROPERTIES, CL_QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE|CL_QUEUE_ON_DEVICE|CL_QUEUE_ON_DEVICE_DEFAULT,
115         CL_QUEUE_SIZE, maxQueueSize,
116         0
117     };
118 
119     dev_queue = clCreateCommandQueueWithProperties(context, device, queue_prop_def, &err_ret);
120     test_error(err_ret, "clCreateCommandQueueWithProperties(CL_QUEUE_DEVICE|CL_QUEUE_DEFAULT) failed");
121 
122     cl_int status;
123     size_t size = 1;
124     cl_int result[MAX_GWS] = { 0 };
125     cl_uint num = arr_size(result);
126     if( gWimpyMode )
127     {
128         num = std::max(num / 16, 4U);
129     }
130 
131     clMemWrapper res_mem;
132     clProgramWrapper program1, program2;
133     clKernelWrapper kernel1, kernel2;
134 
135     cl_event kernel_event;
136 
137     err_ret = create_single_kernel_helper(
138         context, &program1, &kernel1, arr_size(enqueue_block_first_kernel),
139         enqueue_block_first_kernel, "enqueue_block_first_kernel");
140     if(check_error(err_ret, "Create single kernel failed")) return -1;
141 
142     err_ret = create_single_kernel_helper(
143         context, &program2, &kernel2, arr_size(enqueue_block_second_kernel),
144         enqueue_block_second_kernel, "enqueue_block_second_kernel");
145     if(check_error(err_ret, "Create single kernel failed")) return -1;
146 
147     res_mem = clCreateBuffer(context, CL_MEM_READ_WRITE|CL_MEM_COPY_HOST_PTR, sizeof(kernel_results), kernel_results, &err_ret);
148     test_error(err_ret, "clCreateBuffer() failed");
149 
150     // Enqueue first kernel
151     err_ret = clSetKernelArg(kernel1, 0, sizeof(num), &num);
152     test_error(err_ret, "clSetKernelArg(0) failed");
153     err_ret = clSetKernelArg(kernel1, 1, sizeof(cl_mem), &res_mem);
154     test_error(err_ret, "clSetKernelArg(1) failed");
155 
156     cl_event event1 = clCreateUserEvent(context, &err_ret);
157     if(check_error(err_ret, "Create user event failed")) return -1;
158 
159     err_ret = clEnqueueNDRangeKernel(queue, kernel1, 1, NULL, &size, &size, 1, &event1, NULL);
160     test_error(err_ret, "clEnqueueNDRangeKernel('enqueue_block_first_kernel') failed");
161 
162     // Enqueue second kernel
163     err_ret = clSetKernelArg(kernel2, 0, sizeof(num), &num);
164     test_error(err_ret, "clSetKernelArg(0) failed");
165     err_ret = clSetKernelArg(kernel2, 1, sizeof(cl_mem), &res_mem);
166     test_error(err_ret, "clSetKernelArg(1) failed");
167 
168     err_ret = clEnqueueNDRangeKernel(queue, kernel2, 1, NULL, &size, &size, 0, NULL, &kernel_event);
169     test_error(err_ret, "clEnqueueNDRangeKernel('enqueue_block_second_kernel') failed");
170 
171     //Triger execution of first kernel
172     err_ret = clSetUserEventStatus(event1, CL_COMPLETE);
173     test_error(err_ret, "clSetUserEventStatus() failed");
174 
175     // Collect resulsts
176     err_ret = clEnqueueReadBuffer(queue, res_mem, CL_TRUE, 0, sizeof(result), result, 0, NULL, NULL);
177     test_error(err_ret, "clEnqueueReadBuffer() failed");
178 
179     err_ret = clGetEventInfo(kernel_event, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(status), &status, &ret_len);
180     test_error(err_ret, "clGetEventInfo() failed");
181 
182     if(check_error(status, "Kernel execution status %d", status)) return status;
183 
184     if((k = check_kernel_results(result, num)) >= 0 && check_error(-1, "'%s' results validation failed: [%d] returned %d expected 0", "test_host_queue_order", k, result[k])) res = -1;
185 
186     clReleaseEvent(kernel_event);
187     clReleaseEvent(event1);
188 
189     return res;
190 }
191 
192 #endif
193 
194