1 /*
2 * Copyright © 2016 Red Hat.
3 * Copyright © 2016 Bas Nieuwenhuizen
4 *
5 * based in part on anv driver which is:
6 * Copyright © 2015 Intel Corporation
7 *
8 * SPDX-License-Identifier: MIT
9 */
10
11 #ifdef HAVE_VALGRIND
12 #include <memcheck.h>
13 #include <valgrind.h>
14 #define VG(x) x
15 #else
16 #define VG(x) ((void)0)
17 #endif
18
19 #include "radv_instance.h"
20 #include "radv_debug.h"
21 #include "radv_entrypoints.h"
22 #include "radv_wsi.h"
23
24 #include "util/driconf.h"
25
26 #include "vk_instance.h"
27 #include "vk_log.h"
28 #include "vk_util.h"
29
30 static const struct debug_control radv_debug_options[] = {{"nofastclears", RADV_DEBUG_NO_FAST_CLEARS},
31 {"nodcc", RADV_DEBUG_NO_DCC},
32 {"shaders", RADV_DEBUG_DUMP_SHADERS},
33 {"nocache", RADV_DEBUG_NO_CACHE},
34 {"shaderstats", RADV_DEBUG_DUMP_SHADER_STATS},
35 {"nohiz", RADV_DEBUG_NO_HIZ},
36 {"nocompute", RADV_DEBUG_NO_COMPUTE_QUEUE},
37 {"allbos", RADV_DEBUG_ALL_BOS},
38 {"noibs", RADV_DEBUG_NO_IBS},
39 {"spirv", RADV_DEBUG_DUMP_SPIRV},
40 {"zerovram", RADV_DEBUG_ZERO_VRAM},
41 {"syncshaders", RADV_DEBUG_SYNC_SHADERS},
42 {"preoptir", RADV_DEBUG_PREOPTIR},
43 {"nodynamicbounds", RADV_DEBUG_NO_DYNAMIC_BOUNDS},
44 {"info", RADV_DEBUG_INFO},
45 {"startup", RADV_DEBUG_STARTUP},
46 {"checkir", RADV_DEBUG_CHECKIR},
47 {"nobinning", RADV_DEBUG_NOBINNING},
48 {"nongg", RADV_DEBUG_NO_NGG},
49 {"metashaders", RADV_DEBUG_DUMP_META_SHADERS},
50 {"llvm", RADV_DEBUG_LLVM},
51 {"forcecompress", RADV_DEBUG_FORCE_COMPRESS},
52 {"hang", RADV_DEBUG_HANG},
53 {"img", RADV_DEBUG_IMG},
54 {"noumr", RADV_DEBUG_NO_UMR},
55 {"invariantgeom", RADV_DEBUG_INVARIANT_GEOM},
56 {"splitfma", RADV_DEBUG_SPLIT_FMA},
57 {"nodisplaydcc", RADV_DEBUG_NO_DISPLAY_DCC},
58 {"notccompatcmask", RADV_DEBUG_NO_TC_COMPAT_CMASK},
59 {"novrsflatshading", RADV_DEBUG_NO_VRS_FLAT_SHADING},
60 {"noatocdithering", RADV_DEBUG_NO_ATOC_DITHERING},
61 {"nonggc", RADV_DEBUG_NO_NGGC},
62 {"prologs", RADV_DEBUG_DUMP_PROLOGS},
63 {"nodma", RADV_DEBUG_NO_DMA_BLIT},
64 {"epilogs", RADV_DEBUG_DUMP_EPILOGS},
65 {"nofmask", RADV_DEBUG_NO_FMASK},
66 {"shadowregs", RADV_DEBUG_SHADOW_REGS},
67 {"extra_md", RADV_DEBUG_EXTRA_MD},
68 {"nogpl", RADV_DEBUG_NO_GPL},
69 {"videoarraypath", RADV_DEBUG_VIDEO_ARRAY_PATH},
70 {"nort", RADV_DEBUG_NO_RT},
71 {"nomeshshader", RADV_DEBUG_NO_MESH_SHADER},
72 {"nongg_gs", RADV_DEBUG_NO_NGG_GS},
73 {"noeso", RADV_DEBUG_NO_ESO},
74 {"psocachestats", RADV_DEBUG_PSO_CACHE_STATS},
75 {NULL, 0}};
76
77 const char *
radv_get_debug_option_name(int id)78 radv_get_debug_option_name(int id)
79 {
80 assert(id < ARRAY_SIZE(radv_debug_options) - 1);
81 return radv_debug_options[id].string;
82 }
83
84 static const struct debug_control radv_perftest_options[] = {{"localbos", RADV_PERFTEST_LOCAL_BOS},
85 {"dccmsaa", RADV_PERFTEST_DCC_MSAA},
86 {"bolist", RADV_PERFTEST_BO_LIST},
87 {"cswave32", RADV_PERFTEST_CS_WAVE_32},
88 {"pswave32", RADV_PERFTEST_PS_WAVE_32},
89 {"gewave32", RADV_PERFTEST_GE_WAVE_32},
90 {"nosam", RADV_PERFTEST_NO_SAM},
91 {"sam", RADV_PERFTEST_SAM},
92 {"nggc", RADV_PERFTEST_NGGC},
93 {"emulate_rt", RADV_PERFTEST_EMULATE_RT},
94 {"rtwave64", RADV_PERFTEST_RT_WAVE_64},
95 {"video_decode", RADV_PERFTEST_VIDEO_DECODE},
96 {"dmashaders", RADV_PERFTEST_DMA_SHADERS},
97 {"transfer_queue", RADV_PERFTEST_TRANSFER_QUEUE},
98 {"nircache", RADV_PERFTEST_NIR_CACHE},
99 {"rtwave32", RADV_PERFTEST_RT_WAVE_32},
100 {"video_encode", RADV_PERFTEST_VIDEO_ENCODE},
101 {NULL, 0}};
102
103 const char *
radv_get_perftest_option_name(int id)104 radv_get_perftest_option_name(int id)
105 {
106 assert(id < ARRAY_SIZE(radv_perftest_options) - 1);
107 return radv_perftest_options[id].string;
108 }
109
110 static const struct debug_control trace_options[] = {
111 {"rgp", RADV_TRACE_MODE_RGP},
112 {"rra", RADV_TRACE_MODE_RRA},
113 {"ctxroll", RADV_TRACE_MODE_CTX_ROLLS},
114 {NULL, 0},
115 };
116
117 // clang-format off
118 static const driOptionDescription radv_dri_options[] = {
119 DRI_CONF_SECTION_PERFORMANCE
120 DRI_CONF_ADAPTIVE_SYNC(true)
121 DRI_CONF_VK_X11_OVERRIDE_MIN_IMAGE_COUNT(0)
122 DRI_CONF_VK_X11_STRICT_IMAGE_COUNT(false)
123 DRI_CONF_VK_X11_ENSURE_MIN_IMAGE_COUNT(false)
124 DRI_CONF_VK_KHR_PRESENT_WAIT(false)
125 DRI_CONF_VK_XWAYLAND_WAIT_READY(false)
126 DRI_CONF_RADV_REPORT_LLVM9_VERSION_STRING(false)
127 DRI_CONF_RADV_ENABLE_MRT_OUTPUT_NAN_FIXUP(false)
128 DRI_CONF_RADV_DISABLE_SHRINK_IMAGE_STORE(false)
129 DRI_CONF_RADV_NO_DYNAMIC_BOUNDS(false)
130 DRI_CONF_RADV_OVERRIDE_UNIFORM_OFFSET_ALIGNMENT(0)
131 DRI_CONF_RADV_CLEAR_LDS(false)
132 DRI_CONF_RADV_DISABLE_NGG_GS(false)
133 DRI_CONF_SECTION_END
134
135 DRI_CONF_SECTION_DEBUG
136 DRI_CONF_OVERRIDE_VRAM_SIZE()
137 DRI_CONF_VK_WSI_FORCE_BGRA8_UNORM_FIRST(false)
138 DRI_CONF_VK_WSI_FORCE_SWAPCHAIN_TO_CURRENT_EXTENT(false)
139 DRI_CONF_VK_X11_IGNORE_SUBOPTIMAL(false)
140 DRI_CONF_VK_REQUIRE_ETC2(false)
141 DRI_CONF_VK_REQUIRE_ASTC(false)
142 DRI_CONF_RADV_ZERO_VRAM(false)
143 DRI_CONF_RADV_INVARIANT_GEOM(false)
144 DRI_CONF_RADV_SPLIT_FMA(false)
145 DRI_CONF_RADV_DISABLE_TC_COMPAT_HTILE_GENERAL(false)
146 DRI_CONF_RADV_DISABLE_DCC(false)
147 DRI_CONF_RADV_DISABLE_ANISO_SINGLE_LEVEL(false)
148 DRI_CONF_RADV_DISABLE_TRUNC_COORD(false)
149 DRI_CONF_RADV_DISABLE_SINKING_LOAD_INPUT_FS(false)
150 DRI_CONF_RADV_DISABLE_DEPTH_STORAGE(false)
151 DRI_CONF_RADV_DGC(false)
152 DRI_CONF_RADV_FLUSH_BEFORE_QUERY_COPY(false)
153 DRI_CONF_RADV_ENABLE_UNIFIED_HEAP_ON_APU(false)
154 DRI_CONF_RADV_TEX_NON_UNIFORM(false)
155 DRI_CONF_RADV_FLUSH_BEFORE_TIMESTAMP_WRITE(false)
156 DRI_CONF_RADV_RT_WAVE64(false)
157 DRI_CONF_RADV_LEGACY_SPARSE_BINDING(false)
158 DRI_CONF_RADV_FORCE_PSTATE_PEAK_GFX11_DGPU(false)
159 DRI_CONF_DUAL_COLOR_BLEND_BY_LOCATION(false)
160 DRI_CONF_RADV_OVERRIDE_GRAPHICS_SHADER_VERSION(0)
161 DRI_CONF_RADV_OVERRIDE_COMPUTE_SHADER_VERSION(0)
162 DRI_CONF_RADV_OVERRIDE_RAY_TRACING_SHADER_VERSION(0)
163 DRI_CONF_RADV_SSBO_NON_UNIFORM(false)
164 DRI_CONF_RADV_APP_LAYER()
165 DRI_CONF_SECTION_END
166 };
167 // clang-format on
168
169 static void
radv_init_dri_options(struct radv_instance * instance)170 radv_init_dri_options(struct radv_instance *instance)
171 {
172 driParseOptionInfo(&instance->drirc.available_options, radv_dri_options, ARRAY_SIZE(radv_dri_options));
173 driParseConfigFiles(&instance->drirc.options, &instance->drirc.available_options, 0, "radv", NULL, NULL,
174 instance->vk.app_info.app_name, instance->vk.app_info.app_version,
175 instance->vk.app_info.engine_name, instance->vk.app_info.engine_version);
176
177 instance->drirc.enable_mrt_output_nan_fixup =
178 driQueryOptionb(&instance->drirc.options, "radv_enable_mrt_output_nan_fixup");
179
180 instance->drirc.disable_shrink_image_store =
181 driQueryOptionb(&instance->drirc.options, "radv_disable_shrink_image_store");
182
183 instance->drirc.disable_tc_compat_htile_in_general =
184 driQueryOptionb(&instance->drirc.options, "radv_disable_tc_compat_htile_general");
185
186 if (driQueryOptionb(&instance->drirc.options, "radv_no_dynamic_bounds"))
187 instance->debug_flags |= RADV_DEBUG_NO_DYNAMIC_BOUNDS;
188
189 if (driQueryOptionb(&instance->drirc.options, "radv_invariant_geom"))
190 instance->debug_flags |= RADV_DEBUG_INVARIANT_GEOM;
191
192 if (driQueryOptionb(&instance->drirc.options, "radv_split_fma"))
193 instance->debug_flags |= RADV_DEBUG_SPLIT_FMA;
194
195 if (driQueryOptionb(&instance->drirc.options, "radv_disable_dcc"))
196 instance->debug_flags |= RADV_DEBUG_NO_DCC;
197
198 if (driQueryOptionb(&instance->drirc.options, "radv_disable_ngg_gs"))
199 instance->debug_flags |= RADV_DEBUG_NO_NGG_GS;
200
201 instance->drirc.clear_lds = driQueryOptionb(&instance->drirc.options, "radv_clear_lds");
202
203 instance->drirc.zero_vram = driQueryOptionb(&instance->drirc.options, "radv_zero_vram");
204
205 instance->drirc.disable_aniso_single_level =
206 driQueryOptionb(&instance->drirc.options, "radv_disable_aniso_single_level");
207
208 instance->drirc.disable_trunc_coord = driQueryOptionb(&instance->drirc.options, "radv_disable_trunc_coord");
209
210 instance->drirc.disable_sinking_load_input_fs =
211 driQueryOptionb(&instance->drirc.options, "radv_disable_sinking_load_input_fs");
212
213 instance->drirc.disable_depth_storage = driQueryOptionb(&instance->drirc.options, "radv_disable_depth_storage");
214
215 instance->drirc.flush_before_query_copy = driQueryOptionb(&instance->drirc.options, "radv_flush_before_query_copy");
216
217 instance->drirc.enable_unified_heap_on_apu =
218 driQueryOptionb(&instance->drirc.options, "radv_enable_unified_heap_on_apu");
219
220 instance->drirc.tex_non_uniform = driQueryOptionb(&instance->drirc.options, "radv_tex_non_uniform");
221
222 instance->drirc.ssbo_non_uniform = driQueryOptionb(&instance->drirc.options, "radv_ssbo_non_uniform");
223
224 instance->drirc.app_layer = driQueryOptionstr(&instance->drirc.options, "radv_app_layer");
225
226 instance->drirc.flush_before_timestamp_write =
227 driQueryOptionb(&instance->drirc.options, "radv_flush_before_timestamp_write");
228
229 instance->drirc.force_rt_wave64 = driQueryOptionb(&instance->drirc.options, "radv_rt_wave64");
230
231 instance->drirc.dual_color_blend_by_location =
232 driQueryOptionb(&instance->drirc.options, "dual_color_blend_by_location");
233
234 instance->drirc.legacy_sparse_binding = driQueryOptionb(&instance->drirc.options, "radv_legacy_sparse_binding");
235
236 instance->drirc.force_pstate_peak_gfx11_dgpu =
237 driQueryOptionb(&instance->drirc.options, "radv_force_pstate_peak_gfx11_dgpu");
238
239 instance->drirc.override_graphics_shader_version =
240 driQueryOptioni(&instance->drirc.options, "radv_override_graphics_shader_version");
241 instance->drirc.override_compute_shader_version =
242 driQueryOptioni(&instance->drirc.options, "radv_override_compute_shader_version");
243 instance->drirc.override_ray_tracing_shader_version =
244 driQueryOptioni(&instance->drirc.options, "radv_override_ray_tracing_shader_version");
245
246 instance->drirc.enable_dgc = driQueryOptionb(&instance->drirc.options, "radv_dgc");
247
248 instance->drirc.override_vram_size = driQueryOptioni(&instance->drirc.options, "override_vram_size");
249
250 instance->drirc.enable_khr_present_wait = driQueryOptionb(&instance->drirc.options, "vk_khr_present_wait");
251
252 instance->drirc.override_uniform_offset_alignment =
253 driQueryOptioni(&instance->drirc.options, "radv_override_uniform_offset_alignment");
254
255 instance->drirc.report_llvm9_version_string =
256 driQueryOptionb(&instance->drirc.options, "radv_report_llvm9_version_string");
257
258 instance->drirc.vk_require_etc2 = driQueryOptionb(&instance->drirc.options, "vk_require_etc2");
259 instance->drirc.vk_require_astc = driQueryOptionb(&instance->drirc.options, "vk_require_astc");
260 }
261
262 static const struct vk_instance_extension_table radv_instance_extensions_supported = {
263 .KHR_device_group_creation = true,
264 .KHR_external_fence_capabilities = true,
265 .KHR_external_memory_capabilities = true,
266 .KHR_external_semaphore_capabilities = true,
267 .KHR_get_physical_device_properties2 = true,
268 .EXT_debug_report = true,
269 .EXT_debug_utils = true,
270
271 #ifdef RADV_USE_WSI_PLATFORM
272 .KHR_get_surface_capabilities2 = true,
273 .KHR_surface = true,
274 .KHR_surface_protected_capabilities = true,
275 .EXT_surface_maintenance1 = true,
276 .EXT_swapchain_colorspace = true,
277 #endif
278 #ifdef VK_USE_PLATFORM_WAYLAND_KHR
279 .KHR_wayland_surface = true,
280 #endif
281 #ifdef VK_USE_PLATFORM_XCB_KHR
282 .KHR_xcb_surface = true,
283 #endif
284 #ifdef VK_USE_PLATFORM_XLIB_KHR
285 .KHR_xlib_surface = true,
286 #endif
287 #ifdef VK_USE_PLATFORM_XLIB_XRANDR_EXT
288 .EXT_acquire_xlib_display = true,
289 #endif
290 #ifdef VK_USE_PLATFORM_DISPLAY_KHR
291 .KHR_display = true,
292 .KHR_get_display_properties2 = true,
293 .EXT_direct_mode_display = true,
294 .EXT_display_surface_counter = true,
295 .EXT_acquire_drm_display = true,
296 #endif
297 #ifndef VK_USE_PLATFORM_WIN32_KHR
298 .EXT_headless_surface = true,
299 #endif
300 };
301
302 static void
radv_handle_legacy_sqtt_trigger(struct vk_instance * instance)303 radv_handle_legacy_sqtt_trigger(struct vk_instance *instance)
304 {
305 char *trigger_file = secure_getenv("RADV_THREAD_TRACE_TRIGGER");
306 if (trigger_file) {
307 instance->trace_trigger_file = trigger_file;
308 instance->trace_mode |= RADV_TRACE_MODE_RGP;
309 fprintf(stderr, "WARNING: RADV_THREAD_TRACE_TRIGGER is deprecated, please use MESA_VK_TRACE_TRIGGER instead.\n");
310 }
311 }
312
313 static enum radeon_ctx_pstate
radv_parse_pstate(const char * str)314 radv_parse_pstate(const char* str)
315 {
316 if (!strcmp(str, "peak")) {
317 return RADEON_CTX_PSTATE_PEAK;
318 } else if (!strcmp(str, "standard")) {
319 return RADEON_CTX_PSTATE_STANDARD;
320 } else if (!strcmp(str, "min_sclk")) {
321 return RADEON_CTX_PSTATE_MIN_SCLK;
322 } else if (!strcmp(str, "min_mclk")) {
323 return RADEON_CTX_PSTATE_MIN_MCLK;
324 } else {
325 return RADEON_CTX_PSTATE_NONE;
326 }
327 }
328
329 VKAPI_ATTR VkResult VKAPI_CALL
radv_CreateInstance(const VkInstanceCreateInfo * pCreateInfo,const VkAllocationCallbacks * pAllocator,VkInstance * pInstance)330 radv_CreateInstance(const VkInstanceCreateInfo *pCreateInfo, const VkAllocationCallbacks *pAllocator,
331 VkInstance *pInstance)
332 {
333 struct radv_instance *instance;
334 VkResult result;
335
336 if (!pAllocator)
337 pAllocator = vk_default_allocator();
338
339 instance = vk_zalloc(pAllocator, sizeof(*instance), 8, VK_SYSTEM_ALLOCATION_SCOPE_INSTANCE);
340 if (!instance)
341 return vk_error(NULL, VK_ERROR_OUT_OF_HOST_MEMORY);
342
343 struct vk_instance_dispatch_table dispatch_table;
344 vk_instance_dispatch_table_from_entrypoints(&dispatch_table, &radv_instance_entrypoints, true);
345 vk_instance_dispatch_table_from_entrypoints(&dispatch_table, &wsi_instance_entrypoints, false);
346
347 result =
348 vk_instance_init(&instance->vk, &radv_instance_extensions_supported, &dispatch_table, pCreateInfo, pAllocator);
349 if (result != VK_SUCCESS) {
350 vk_free(pAllocator, instance);
351 return vk_error(NULL, result);
352 }
353
354 vk_instance_add_driver_trace_modes(&instance->vk, trace_options);
355 radv_handle_legacy_sqtt_trigger(&instance->vk);
356
357 simple_mtx_init(&instance->shader_dump_mtx, mtx_plain);
358
359 instance->debug_flags = parse_debug_string(getenv("RADV_DEBUG"), radv_debug_options);
360 instance->perftest_flags = parse_debug_string(getenv("RADV_PERFTEST"), radv_perftest_options);
361 instance->profile_pstate = radv_parse_pstate(debug_get_option("RADV_PROFILE_PSTATE", "peak"));
362
363 /* When RADV_FORCE_FAMILY is set, the driver creates a null
364 * device that allows to test the compiler without having an
365 * AMDGPU instance.
366 */
367 if (getenv("RADV_FORCE_FAMILY"))
368 instance->vk.physical_devices.enumerate = create_null_physical_device;
369 else
370 instance->vk.physical_devices.try_create_for_drm = create_drm_physical_device;
371
372 instance->vk.physical_devices.destroy = radv_physical_device_destroy;
373
374 if (instance->debug_flags & RADV_DEBUG_STARTUP)
375 fprintf(stderr, "radv: info: Created an instance.\n");
376
377 VG(VALGRIND_CREATE_MEMPOOL(instance, 0, false));
378
379 radv_init_dri_options(instance);
380
381 *pInstance = radv_instance_to_handle(instance);
382
383 return VK_SUCCESS;
384 }
385
386 VKAPI_ATTR void VKAPI_CALL
radv_DestroyInstance(VkInstance _instance,const VkAllocationCallbacks * pAllocator)387 radv_DestroyInstance(VkInstance _instance, const VkAllocationCallbacks *pAllocator)
388 {
389 VK_FROM_HANDLE(radv_instance, instance, _instance);
390
391 if (!instance)
392 return;
393
394 VG(VALGRIND_DESTROY_MEMPOOL(instance));
395
396 simple_mtx_destroy(&instance->shader_dump_mtx);
397
398 driDestroyOptionCache(&instance->drirc.options);
399 driDestroyOptionInfo(&instance->drirc.available_options);
400
401 vk_instance_finish(&instance->vk);
402 vk_free(&instance->vk.alloc, instance);
403 }
404
405 VKAPI_ATTR VkResult VKAPI_CALL
radv_EnumerateInstanceExtensionProperties(const char * pLayerName,uint32_t * pPropertyCount,VkExtensionProperties * pProperties)406 radv_EnumerateInstanceExtensionProperties(const char *pLayerName, uint32_t *pPropertyCount,
407 VkExtensionProperties *pProperties)
408 {
409 if (pLayerName)
410 return vk_error(NULL, VK_ERROR_LAYER_NOT_PRESENT);
411
412 return vk_enumerate_instance_extension_properties(&radv_instance_extensions_supported, pPropertyCount, pProperties);
413 }
414
415 VKAPI_ATTR VkResult VKAPI_CALL
radv_EnumerateInstanceVersion(uint32_t * pApiVersion)416 radv_EnumerateInstanceVersion(uint32_t *pApiVersion)
417 {
418 *pApiVersion = RADV_API_VERSION;
419 return VK_SUCCESS;
420 }
421
422 VKAPI_ATTR VkResult VKAPI_CALL
radv_EnumerateInstanceLayerProperties(uint32_t * pPropertyCount,VkLayerProperties * pProperties)423 radv_EnumerateInstanceLayerProperties(uint32_t *pPropertyCount, VkLayerProperties *pProperties)
424 {
425 if (pProperties == NULL) {
426 *pPropertyCount = 0;
427 return VK_SUCCESS;
428 }
429
430 /* None supported at this time */
431 return vk_error(NULL, VK_ERROR_LAYER_NOT_PRESENT);
432 }
433
434 VKAPI_ATTR PFN_vkVoidFunction VKAPI_CALL
radv_GetInstanceProcAddr(VkInstance _instance,const char * pName)435 radv_GetInstanceProcAddr(VkInstance _instance, const char *pName)
436 {
437 VK_FROM_HANDLE(vk_instance, instance, _instance);
438 return vk_instance_get_proc_addr(instance, &radv_instance_entrypoints, pName);
439 }
440
441 /* Windows will use a dll definition file to avoid build errors. */
442 #ifdef _WIN32
443 #undef PUBLIC
444 #define PUBLIC
445 #endif
446
447 /* The loader wants us to expose a second GetInstanceProcAddr function
448 * to work around certain LD_PRELOAD issues seen in apps.
449 */
450 PUBLIC
451 VKAPI_ATTR PFN_vkVoidFunction VKAPI_CALL
vk_icdGetInstanceProcAddr(VkInstance instance,const char * pName)452 vk_icdGetInstanceProcAddr(VkInstance instance, const char *pName)
453 {
454 return radv_GetInstanceProcAddr(instance, pName);
455 }
456