2 * Copyright 2018 Collabora Ltd.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
24 #include "zink_screen.h"
26 #include "zink_kopper.h"
27 #include "zink_compiler.h"
28 #include "zink_context.h"
29 #include "zink_descriptors.h"
30 #include "zink_fence.h"
31 #include "zink_format.h"
32 #include "zink_framebuffer.h"
33 #include "zink_program.h"
34 #include "zink_public.h"
35 #include "zink_query.h"
36 #include "zink_resource.h"
37 #include "zink_state.h"
38 #include "nir_to_spirv/nir_to_spirv.h" // for SPIRV_VERSION
40 #include "os/os_process.h"
41 #include "util/u_debug.h"
42 #include "util/u_dl.h"
43 #include "util/os_file.h"
44 #include "util/u_memory.h"
45 #include "util/u_screen.h"
46 #include "util/u_string.h"
47 #include "util/u_transfer_helper.h"
48 #include "util/xmlconfig.h"
50 #include "util/u_cpu_detect.h"
54 #define VK_LIBNAME "vulkan-1.dll"
58 #define VK_LIBNAME "libvulkan.1.dylib"
59 #elif DETECT_OS_ANDROID
60 #define VK_LIBNAME "libvulkan.so"
62 #define VK_LIBNAME "libvulkan.so.1"
66 #if defined(__APPLE__)
67 // Source of MVK_VERSION
68 #include "MoltenVK/vk_mvk_moltenvk.h"
/* Names accepted by the ZINK_DEBUG option. Each entry pairs an option name
 * with its ZINK_DEBUG_* flag and a human-readable description.
 */
71 static const struct debug_named_value
72 zink_debug_options[] = {
73 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
74 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
75 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
76 { "validation", ZINK_DEBUG_VALIDATION, "Dump Validation layer output" },
77 { "sync", ZINK_DEBUG_SYNC, "Force synchronization before draws/dispatches" },
78 { "compact", ZINK_DEBUG_COMPACT, "Use only 4 descriptor sets" },
79 { "noreorder", ZINK_DEBUG_NOREORDER, "Do not reorder command streams" },
80 { "gpl", ZINK_DEBUG_GPL, "Force using Graphics Pipeline Library for all shaders" },
81 { "shaderdb", ZINK_DEBUG_SHADERDB, "Do stuff to make shader-db work" },
/* Ties the "ZINK_DEBUG" option name to the table above; the default value is 0. */
85 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", zink_debug_options, 0)
/* Names accepted by the ZINK_DESCRIPTORS option, each mapped to a
 * ZINK_DESCRIPTOR_MODE_* value and a description.
 */
91 static const struct debug_named_value
92 zink_descriptor_options[] = {
93 { "auto", ZINK_DESCRIPTOR_MODE_AUTO, "Automatically detect best mode" },
94 { "lazy", ZINK_DESCRIPTOR_MODE_LAZY, "Don't cache, do least amount of updates" },
/* Ties the "ZINK_DESCRIPTORS" option name to the table above; the default is ZINK_DESCRIPTOR_MODE_AUTO. */
98 DEBUG_GET_ONCE_FLAGS_OPTION(zink_descriptor_mode, "ZINK_DESCRIPTORS", zink_descriptor_options, ZINK_DESCRIPTOR_MODE_AUTO)
/* File-scope variable holding the descriptor mode (it is not assigned anywhere in this part of the file). */
100 enum zink_descriptor_mode zink_descriptor_mode;
/* Returns the fixed driver vendor string; pscreen is not consulted. */
103 zink_get_vendor(struct pipe_screen *pscreen)
105 return "Collabora Ltd";
/* Formats a device-vendor description from the Vulkan vendor ID of the screen.
 *
 * The text is written into a function-static 1000-byte buffer, so each call
 * overwrites what the previous call produced.
 */
109 zink_get_device_vendor(struct pipe_screen *pscreen)
111 struct zink_screen *screen = zink_screen(pscreen);
112 static char buf[1000];
/* vendor ID is printed as at least four zero-padded hex digits */
113 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->info.props.vendorID);
/* Formats the renderer name as "zink (<Vulkan deviceName>)".
 *
 * The text is written into a function-static 1000-byte buffer, so each call
 * overwrites what the previous call produced.
 */
118 zink_get_name(struct pipe_screen *pscreen)
120 struct zink_screen *screen = zink_screen(pscreen);
121 static char buf[1000];
122 snprintf(buf, sizeof(buf), "zink (%s)", screen->info.props.deviceName);
/* Copies VK_UUID_SIZE bytes of the Vulkan driver UUID into uuid.
 *
 * uuid must have room for VK_UUID_SIZE bytes. The props11 copy is used when
 * vk_version is at least 1.2.0.
 * NOTE(review): the deviceid_props copy is presumably the fallback branch for
 * older versions - confirm.
 */
127 zink_get_driver_uuid(struct pipe_screen *pscreen, char *uuid)
129 struct zink_screen *screen = zink_screen(pscreen);
130 if (screen->vk_version >= VK_MAKE_VERSION(1,2,0)) {
131 memcpy(uuid, screen->info.props11.driverUUID, VK_UUID_SIZE);
133 memcpy(uuid, screen->info.deviceid_props.driverUUID, VK_UUID_SIZE);
/* Copies VK_UUID_SIZE bytes of the Vulkan device UUID into uuid.
 *
 * uuid must have room for VK_UUID_SIZE bytes. The props11 copy is used when
 * vk_version is at least 1.2.0.
 * NOTE(review): the deviceid_props copy is presumably the fallback branch for
 * older versions - confirm.
 */
138 zink_get_device_uuid(struct pipe_screen *pscreen, char *uuid)
140 struct zink_screen *screen = zink_screen(pscreen);
141 if (screen->vk_version >= VK_MAKE_VERSION(1,2,0)) {
142 memcpy(uuid, screen->info.props11.deviceUUID, VK_UUID_SIZE);
144 memcpy(uuid, screen->info.deviceid_props.deviceUUID, VK_UUID_SIZE);
/* Copies VK_LUID_SIZE bytes of the Vulkan device LUID into luid.
 *
 * luid must have room for VK_LUID_SIZE bytes. The props11 copy is used when
 * info.have_vulkan12 is set.
 * NOTE(review): the deviceid_props copy is presumably the fallback branch -
 * confirm. The UUID getters test vk_version instead of have_vulkan12.
 */
149 zink_get_device_luid(struct pipe_screen *pscreen, char *luid)
151 struct zink_screen *screen = zink_screen(pscreen);
152 if (screen->info.have_vulkan12) {
153 memcpy(luid, screen->info.props11.deviceLUID, VK_LUID_SIZE);
155 memcpy(luid, screen->info.deviceid_props.deviceLUID, VK_LUID_SIZE);
/* Returns the Vulkan device node mask of the screen.
 *
 * The value comes from props11 when info.have_vulkan12 is set.
 * NOTE(review): the deviceid_props return is presumably the fallback branch -
 * confirm.
 */
160 zink_get_device_node_mask(struct pipe_screen *pscreen)
162 struct zink_screen *screen = zink_screen(pscreen);
163 if (screen->info.have_vulkan12) {
164 return screen->info.props11.deviceNodeMask;
166 return screen->info.deviceid_props.deviceNodeMask;
/* Forwards max_threads to util_queue_adjust_num_threads() for the screen's
 * cache_get_thread queue.
 */
171 zink_set_max_shader_compiler_threads(struct pipe_screen *pscreen, unsigned max_threads)
173 struct zink_screen *screen = zink_screen(pscreen);
174 util_queue_adjust_num_threads(&screen->cache_get_thread, max_threads);
/* Reports whether background work for a shader has completed.
 *
 * shader is an opaque pointer whose type depends on shader_type:
 *  - MESA_SHADER_COMPUTE: read as a struct zink_program; the result is true
 *    when the program cannot be precompiled or its cache_fence is signalled.
 *  - otherwise: read as a struct zink_shader; every entry of zs->programs is
 *    visited and the signalled state of each program's base.cache_fence is
 *    AND-ed into `finished`.
 */
178 zink_is_parallel_shader_compilation_finished(struct pipe_screen *screen, void *shader, enum pipe_shader_type shader_type)
180 if (shader_type == MESA_SHADER_COMPUTE) {
181 struct zink_program *pg = shader;
182 return !pg->can_precompile || util_queue_fence_is_signalled(&pg->cache_fence);
185 struct zink_shader *zs = shader;
186 bool finished = true;
187 set_foreach(zs->programs, entry) {
/* set keys are the gfx programs that use this shader */
188 struct zink_gfx_program *prog = (void*)entry->key;
189 finished &= util_queue_fence_is_signalled(&prog->base.cache_fence);
/* Accumulates the sizes of all Vulkan memory heaps that carry
 * VK_MEMORY_HEAP_DEVICE_LOCAL_BIT. The total is kept in a VkDeviceSize.
 */
195 get_video_mem(struct zink_screen *screen)
197 VkDeviceSize size = 0;
198 for (uint32_t i = 0; i < screen->info.mem_props.memoryHeapCount; ++i) {
/* heaps without the device-local flag do not contribute */
199 if (screen->info.mem_props.memoryHeaps[i].flags &
200 VK_MEMORY_HEAP_DEVICE_LOCAL_BIT)
201 size += screen->info.mem_props.memoryHeaps[i].size;
/* Creates the on-disk shader cache for the screen and the queue used to
 * write to it.
 *
 * The ZINK_DEBUG_SHADERDB flag is tested first, before any cache setup.
 * When ENABLE_SHADER_CACHE is defined, the cache is created under a name
 * built from the Vulkan vendor ID, with the device name as the second
 * argument to disk_cache_create(). If the cache_put_thread queue cannot be
 * initialised, the failure is logged and the cache is destroyed again, with
 * screen->disk_cache reset to NULL.
 */
207 disk_cache_init(struct zink_screen *screen)
209 if (zink_debug & ZINK_DEBUG_SHADERDB)
211 #ifdef ENABLE_SHADER_CACHE
212 static char buf[1000];
/* Cache name is "zink_" plus the vendor ID as at least four zero-padded hex
 * digits. The previous format "%x04x" printed the ID followed by the literal
 * text "04x".
 */
213 snprintf(buf, sizeof(buf), "zink_%04x", screen->info.props.vendorID);
215 screen->disk_cache = disk_cache_create(buf, screen->info.props.deviceName, 0);
216 if (!screen->disk_cache)
219 if (!util_queue_init(&screen->cache_put_thread, "zcq", 8, 1, UTIL_QUEUE_INIT_RESIZE_IF_FULL, screen)) {
220 mesa_loge("zink: Failed to create disk cache queue\n");
/* undo the cache creation so no half-initialised cache is left on the screen */
222 disk_cache_destroy(screen->disk_cache);
223 screen->disk_cache = NULL;
225 util_queue_destroy(&screen->cache_put_thread);
/* Queue job that stores a program's Vulkan pipeline cache data in the disk cache.
 *
 * data is the struct zink_program and gdata is the struct zink_screen;
 * thread_index is not used in the visible code.
 *
 * vkGetPipelineCacheData is called twice: first with a NULL buffer to obtain
 * the size, then with a malloc'ed buffer of that size. A failure of either
 * call is logged with mesa_loge().
 */
236 cache_put_job(void *data, void *gdata, int thread_index)
238 struct zink_program *pg = data;
239 struct zink_screen *screen = gdata;
/* size query only: no destination buffer is passed */
241 VkResult result = VKSCR(GetPipelineCacheData)(screen->dev, pg->pipeline_cache, &size, NULL);
242 if (result != VK_SUCCESS) {
243 mesa_loge("ZINK: vkGetPipelineCacheData failed (%s)", vk_Result_to_str(result));
/* NOTE(review): an unchanged size presumably means there is nothing new to store - confirm */
246 if (pg->pipeline_cache_size == size)
248 void *pipeline_data = malloc(size);
251 result = VKSCR(GetPipelineCacheData)(screen->dev, pg->pipeline_cache, &size, pipeline_data);
252 if (result == VK_SUCCESS) {
/* remember the stored size for the comparison above on later runs */
253 pg->pipeline_cache_size = size;
/* the disk cache key is derived from the program's sha1 */
256 disk_cache_compute_key(screen->disk_cache, pg->sha1, sizeof(pg->sha1), key);
/* NOTE(review): the _nocopy variant presumably takes ownership of pipeline_data - confirm */
257 disk_cache_put_nocopy(screen->disk_cache, key, pipeline_data, size, NULL);
259 mesa_loge("ZINK: vkGetPipelineCacheData failed (%s)", vk_Result_to_str(result));
/* Requests that the pipeline cache data of pg be written to the disk cache.
 *
 * screen->disk_cache is tested first. The work is done by cache_put_job(),
 * either called directly with thread index 0 or queued on cache_put_thread
 * with pg->cache_fence as the job fence.
 * NOTE(review): the choice between the two is presumably made by in_thread -
 * confirm.
 */
264 zink_screen_update_pipeline_cache(struct zink_screen *screen, struct zink_program *pg, bool in_thread)
266 if (!screen->disk_cache)
270 cache_put_job(pg, screen, 0);
272 util_queue_add_job(&screen->cache_put_thread, pg, &pg->cache_fence, cache_put_job, NULL, 0);
/* Queue job that creates the Vulkan pipeline cache of a program, seeded with
 * data from the disk cache.
 *
 * data is the struct zink_program and gdata is the struct zink_screen;
 * thread_index is not used in the visible code.
 */
276 cache_get_job(void *data, void *gdata, int thread_index)
278 struct zink_program *pg = data;
279 struct zink_screen *screen = gdata;
281 VkPipelineCacheCreateInfo pcci;
282 pcci.sType = VK_STRUCTURE_TYPE_PIPELINE_CACHE_CREATE_INFO;
/* the externally-synchronized flag is set only when the extension or the 1.3 feature is available */
284 pcci.flags = screen->info.have_EXT_pipeline_creation_cache_control || screen->info.feats13.pipelineCreationCacheControl ?
285 VK_PIPELINE_CACHE_CREATE_EXTERNALLY_SYNCHRONIZED_BIT : 0;
286 pcci.initialDataSize = 0;
287 pcci.pInitialData = NULL;
/* look up previously stored data under the key derived from the program's sha1;
 * the size reported by disk_cache_get() is kept in pg->pipeline_cache_size
 */
290 disk_cache_compute_key(screen->disk_cache, pg->sha1, sizeof(pg->sha1), key);
291 pcci.pInitialData = disk_cache_get(screen->disk_cache, key, &pg->pipeline_cache_size);
292 pcci.initialDataSize = pg->pipeline_cache_size;
294 VkResult res = VKSCR(CreatePipelineCache)(screen->dev, &pcci, NULL, &pg->pipeline_cache);
295 if (res != VK_SUCCESS) {
296 mesa_loge("ZINK: vkCreatePipelineCache failed (%s)", vk_Result_to_str(res));
/* the buffer from disk_cache_get() is released here; the cast drops the const of pInitialData */
298 free((void*)pcci.pInitialData);
/* Requests creation of the pipeline cache of pg from disk cache contents.
 *
 * screen->disk_cache is tested first. The work is done by cache_get_job(),
 * either called directly with thread index 0 or queued on cache_get_thread
 * with pg->cache_fence as the job fence.
 * NOTE(review): the choice between the two is presumably made by in_thread -
 * confirm.
 */
302 zink_screen_get_pipeline_cache(struct zink_screen *screen, struct zink_program *pg, bool in_thread)
304 if (!screen->disk_cache)
308 cache_get_job(pg, screen, 0);
310 util_queue_add_job(&screen->cache_get_thread, pg, &pg->cache_fence, cache_get_job, NULL, 0);
/* Answers a compute capability query.
 *
 * Each handled case passes an array compound literal to the local RET macro,
 * which memcpy's sizeof(x) bytes of it into ret. The element type
 * (uint32_t or uint64_t) therefore fixes how many bytes are written for each
 * capability. Most values come straight from the Vulkan device limits.
 */
314 zink_get_compute_param(struct pipe_screen *pscreen, enum pipe_shader_ir ir_type,
315 enum pipe_compute_cap param, void *ret)
317 struct zink_screen *screen = zink_screen(pscreen);
318 #define RET(x) do { \
320 memcpy(ret, x, sizeof(x)); \
325 case PIPE_COMPUTE_CAP_ADDRESS_BITS:
326 RET((uint32_t []){ 32 });
328 case PIPE_COMPUTE_CAP_IR_TARGET:
333 case PIPE_COMPUTE_CAP_GRID_DIMENSION:
334 RET((uint64_t []) { 3 });
/* three values, one per dimension */
336 case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
337 RET(((uint64_t []) { screen->info.props.limits.maxComputeWorkGroupCount[0],
338 screen->info.props.limits.maxComputeWorkGroupCount[1],
339 screen->info.props.limits.maxComputeWorkGroupCount[2] }));
341 case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
342 /* MaxComputeWorkGroupSize[0..2] */
343 RET(((uint64_t []) {screen->info.props.limits.maxComputeWorkGroupSize[0],
344 screen->info.props.limits.maxComputeWorkGroupSize[1],
345 screen->info.props.limits.maxComputeWorkGroupSize[2]}));
/* both thread-count caps report the same Vulkan limit */
347 case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
348 case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:
349 RET((uint64_t []) { screen->info.props.limits.maxComputeWorkGroupInvocations });
351 case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
352 RET((uint64_t []) { screen->info.props.limits.maxComputeSharedMemorySize });
354 case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:
355 RET((uint32_t []) { 1 });
357 case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:
358 RET((uint32_t []) { screen->info.props11.subgroupSize });
360 case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE:
361 case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:
362 case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:
363 case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
364 case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
365 case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
366 // XXX: I think these are for Clover...
370 unreachable("unknown compute param");
/* Computes the smallest heap size among a fixed set of memory types, capped
 * at UINT32_MAX.
 *
 * For each index i below ARRAY_SIZE(heaps), screen->heap_map[i] selects a
 * Vulkan memory type; the size of that type's heap is folded into `size`
 * with MIN2.
 *
 * NOTE(review): only the length of heaps[] is used - the loop indexes
 * heap_map with i, not heaps[i] - and ZINK_HEAP_HOST_VISIBLE_COHERENT is
 * listed twice. Confirm whether the last entry and the indexing are intended.
 */
375 get_smallest_buffer_heap(struct zink_screen *screen)
377 enum zink_heap heaps[] = {
378 ZINK_HEAP_DEVICE_LOCAL,
379 ZINK_HEAP_DEVICE_LOCAL_VISIBLE,
380 ZINK_HEAP_HOST_VISIBLE_COHERENT,
381 ZINK_HEAP_HOST_VISIBLE_COHERENT
/* start at the cap so the first heap examined always lowers or keeps it */
383 unsigned size = UINT32_MAX;
384 for (unsigned i = 0; i < ARRAY_SIZE(heaps); i++) {
385 unsigned heap_idx = screen->info.mem_props.memoryTypes[screen->heap_map[i]].heapIndex;
386 size = MIN2(screen->info.mem_props.memoryHeaps[heap_idx].size, size);
/* Checks linear-filtering support across the 32-bit float formats listed in
 * fp32_formats.
 *
 * Format properties are queried per format. The condition at the end of the
 * loop body holds when a format can be sampled (SAMPLED_IMAGE_BIT in either
 * tiling's features) but SAMPLED_IMAGE_FILTER_LINEAR_BIT is absent from both.
 * NOTE(review): such a format presumably makes the overall answer false -
 * confirm.
 */
392 have_fp32_filter_linear(struct zink_screen *screen)
394 const VkFormat fp32_formats[] = {
395 VK_FORMAT_R32_SFLOAT,
396 VK_FORMAT_R32G32_SFLOAT,
397 VK_FORMAT_R32G32B32_SFLOAT,
398 VK_FORMAT_R32G32B32A32_SFLOAT,
399 VK_FORMAT_D32_SFLOAT,
401 for (int i = 0; i < ARRAY_SIZE(fp32_formats); ++i) {
402 VkFormatProperties props;
403 VKSCR(GetPhysicalDeviceFormatProperties)(screen->pdev,
406 if (((props.linearTilingFeatures | props.optimalTilingFeatures) &
407 (VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT |
408 VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_LINEAR_BIT)) ==
409 VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT) {
/* Answers an integer/boolean gallium capability query (enum pipe_cap).
 *
 * Most answers are read directly from the Vulkan state cached on the screen:
 * core feature bits (info.feats*), device limits (info.props.limits),
 * extension availability flags (info.have_*, instance_info.have_*) and a few
 * screen-level fields. Capabilities without a case of their own are passed
 * to u_pipe_screen_get_param_defaults().
 */
417 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
419 struct zink_screen *screen = zink_screen(pscreen);
422 case PIPE_CAP_TEXRECT:
423 case PIPE_CAP_MULTI_DRAW_INDIRECT_PARTIAL_STRIDE:
425 case PIPE_CAP_ANISOTROPIC_FILTER:
426 return screen->info.feats.features.samplerAnisotropy;
427 case PIPE_CAP_EMULATE_NONFIXED_PRIMITIVE_RESTART:
/* Bitmask of primitive types usable with primitive restart: strip types
 * always, fans when the screen has them, list types only with
 * EXT_primitive_topology_list_restart (patches need its extra feature bit).
 */
429 case PIPE_CAP_SUPPORTED_PRIM_MODES_WITH_RESTART: {
430 uint32_t modes = BITFIELD_BIT(PIPE_PRIM_LINE_STRIP) |
431 BITFIELD_BIT(PIPE_PRIM_TRIANGLE_STRIP) |
432 BITFIELD_BIT(PIPE_PRIM_LINE_STRIP_ADJACENCY) |
433 BITFIELD_BIT(PIPE_PRIM_TRIANGLE_STRIP_ADJACENCY);
434 if (screen->have_triangle_fans)
435 modes |= BITFIELD_BIT(PIPE_PRIM_TRIANGLE_FAN);
436 if (screen->info.have_EXT_primitive_topology_list_restart) {
437 modes |= BITFIELD_BIT(PIPE_PRIM_POINTS) |
438 BITFIELD_BIT(PIPE_PRIM_LINES) |
439 BITFIELD_BIT(PIPE_PRIM_LINES_ADJACENCY) |
440 BITFIELD_BIT(PIPE_PRIM_TRIANGLES) |
441 BITFIELD_BIT(PIPE_PRIM_TRIANGLES_ADJACENCY);
442 if (screen->info.list_restart_feats.primitiveTopologyPatchListRestart)
443 modes |= BITFIELD_BIT(PIPE_PRIM_PATCHES);
/* Starts from every primitive type and clears quads, quad strips, polygons
 * and line loops, plus triangle fans when the screen lacks them.
 */
447 case PIPE_CAP_SUPPORTED_PRIM_MODES: {
448 uint32_t modes = BITFIELD_MASK(PIPE_PRIM_MAX);
449 modes &= ~BITFIELD_BIT(PIPE_PRIM_QUADS);
450 modes &= ~BITFIELD_BIT(PIPE_PRIM_QUAD_STRIP);
451 modes &= ~BITFIELD_BIT(PIPE_PRIM_POLYGON);
452 modes &= ~BITFIELD_BIT(PIPE_PRIM_LINE_LOOP);
453 if (!screen->have_triangle_fans)
454 modes &= ~BITFIELD_BIT(PIPE_PRIM_TRIANGLE_FAN);
458 case PIPE_CAP_FBFETCH:
460 case PIPE_CAP_FBFETCH_COHERENT:
461 return screen->info.have_EXT_rasterization_order_attachment_access;
/* external memory / semaphore caps need the fd or win32 flavour of the extension */
463 case PIPE_CAP_MEMOBJ:
464 return screen->instance_info.have_KHR_external_memory_capabilities && (screen->info.have_KHR_external_memory_fd || screen->info.have_KHR_external_memory_win32);
465 case PIPE_CAP_FENCE_SIGNAL:
466 return screen->info.have_KHR_external_semaphore_fd || screen->info.have_KHR_external_semaphore_win32;
467 case PIPE_CAP_NATIVE_FENCE_FD:
468 return screen->instance_info.have_KHR_external_semaphore_capabilities && screen->info.have_KHR_external_semaphore_fd;
/* the following capabilities all share one answer */
470 case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:
471 case PIPE_CAP_MAP_UNSYNCHRONIZED_THREAD_SAFE:
472 case PIPE_CAP_SHAREABLE_SHADERS:
473 case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:
474 case PIPE_CAP_QUERY_MEMORY_INFO:
475 case PIPE_CAP_NPOT_TEXTURES:
476 case PIPE_CAP_TGSI_TEXCOORD:
477 case PIPE_CAP_DRAW_INDIRECT:
478 case PIPE_CAP_TEXTURE_QUERY_LOD:
479 case PIPE_CAP_GLSL_TESS_LEVELS_AS_INPUTS:
480 case PIPE_CAP_CLEAR_TEXTURE:
481 case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
482 case PIPE_CAP_FORCE_PERSAMPLE_INTERP:
483 case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
484 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
485 case PIPE_CAP_SHADER_ARRAY_COMPONENTS:
486 case PIPE_CAP_QUERY_BUFFER_OBJECT:
487 case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
488 case PIPE_CAP_CLIP_HALFZ:
489 case PIPE_CAP_TEXTURE_QUERY_SAMPLES:
490 case PIPE_CAP_TEXTURE_BARRIER:
491 case PIPE_CAP_QUERY_SO_OVERFLOW:
492 case PIPE_CAP_GL_SPIRV:
493 case PIPE_CAP_CLEAR_SCISSORED:
494 case PIPE_CAP_INVALIDATE_BUFFER:
495 case PIPE_CAP_PREFER_REAL_BUFFER_IN_CONSTBUF0:
496 case PIPE_CAP_PACKED_UNIFORMS:
497 case PIPE_CAP_SHADER_PACK_HALF_FLOAT:
498 case PIPE_CAP_CULL_DISTANCE_NOCOMBINE:
499 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
500 case PIPE_CAP_LOAD_CONSTBUF:
501 case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:
502 case PIPE_CAP_RGB_OVERRIDE_DST_ALPHA_BLEND:
505 case PIPE_CAP_DRAW_VERTEX_STATE:
506 return screen->info.have_EXT_vertex_input_dynamic_state;
508 case PIPE_CAP_SURFACE_SAMPLE_COUNT:
509 return screen->vk_version >= VK_MAKE_VERSION(1,2,0);
/* subgroup vote: Vulkan 1.1 subgroup support for compute, or the EXT extension */
511 case PIPE_CAP_SHADER_GROUP_VOTE:
512 if (screen->info.have_vulkan11 &&
513 (screen->info.subgroup.supportedOperations & VK_SUBGROUP_FEATURE_VOTE_BIT) &&
514 (screen->info.subgroup.supportedStages & VK_SHADER_STAGE_COMPUTE_BIT))
516 if (screen->info.have_EXT_shader_subgroup_vote)
519 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
520 return screen->info.have_EXT_provoking_vertex;
522 case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:
523 return screen->info.have_KHR_sampler_mirror_clamp_to_edge;
525 case PIPE_CAP_POLYGON_OFFSET_UNITS_UNSCALED:
528 case PIPE_CAP_POLYGON_OFFSET_CLAMP:
529 return screen->info.feats.features.depthBiasClamp;
531 case PIPE_CAP_QUERY_PIPELINE_STATISTICS_SINGLE:
532 return screen->info.feats.features.pipelineStatisticsQuery;
534 case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:
535 return screen->info.feats.features.robustBufferAccess;
537 case PIPE_CAP_MULTI_DRAW_INDIRECT:
538 return screen->info.feats.features.multiDrawIndirect;
540 case PIPE_CAP_IMAGE_ATOMIC_FLOAT_ADD:
541 return screen->info.have_EXT_shader_atomic_float;
542 case PIPE_CAP_SHADER_ATOMIC_INT64:
543 return screen->info.have_KHR_shader_atomic_int64;
545 case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:
546 return screen->info.have_KHR_draw_indirect_count;
/* draw parameters: core 1.2 feature bit or the KHR extension */
548 case PIPE_CAP_START_INSTANCE:
549 case PIPE_CAP_DRAW_PARAMETERS:
550 return (screen->info.have_vulkan12 && screen->info.feats11.shaderDrawParameters) ||
551 screen->info.have_KHR_shader_draw_parameters;
553 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
554 return screen->info.have_EXT_vertex_attribute_divisor;
556 case PIPE_CAP_MAX_VERTEX_STREAMS:
557 return screen->info.tf_props.maxTransformFeedbackStreams;
560 case PIPE_CAP_INT64_DIVMOD:
561 case PIPE_CAP_DOUBLES:
564 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
565 if (!screen->info.feats.features.dualSrcBlend)
567 return screen->info.props.limits.maxFragmentDualSrcAttachments;
569 case PIPE_CAP_MAX_RENDER_TARGETS:
570 return screen->info.props.limits.maxColorAttachments;
572 case PIPE_CAP_OCCLUSION_QUERY:
573 return screen->info.feats.features.occlusionQueryPrecise;
575 case PIPE_CAP_PROGRAMMABLE_SAMPLE_LOCATIONS:
576 return screen->info.have_EXT_sample_locations && screen->info.have_EXT_extended_dynamic_state;
578 case PIPE_CAP_QUERY_TIME_ELAPSED:
579 return screen->timestamp_valid_bits > 0;
581 case PIPE_CAP_TEXTURE_MULTISAMPLE:
584 case PIPE_CAP_FRAGMENT_SHADER_INTERLOCK:
585 return screen->info.have_EXT_fragment_shader_interlock;
587 case PIPE_CAP_SHADER_CLOCK:
588 return screen->info.have_KHR_shader_clock;
590 case PIPE_CAP_POINT_SPRITE:
/* ballot: subgroup sizes above 64 are special-cased first, then the Vulkan 1.1
 * ballot bit or the EXT extension is checked
 */
593 case PIPE_CAP_SHADER_BALLOT:
594 if (screen->info.props11.subgroupSize > 64)
596 if (screen->info.have_vulkan11 &&
597 screen->info.subgroup.supportedOperations & VK_SUBGROUP_FEATURE_BALLOT_BIT)
599 if (screen->info.have_EXT_shader_subgroup_ballot)
603 case PIPE_CAP_DEMOTE_TO_HELPER_INVOCATION:
604 return screen->info.have_EXT_shader_demote_to_helper_invocation;
606 case PIPE_CAP_SAMPLE_SHADING:
607 return screen->info.feats.features.sampleRateShading;
609 case PIPE_CAP_TEXTURE_SWIZZLE:
612 case PIPE_CAP_VERTEX_ATTRIB_ELEMENT_ALIGNED_ONLY:
615 case PIPE_CAP_GL_CLAMP:
618 case PIPE_CAP_PREFER_IMM_ARRAYS_AS_CONSTBUF:
619 return 0; /* Assume that the vk driver is capable of moving imm arrays to some sort of constant storage on its own. */
/* border color quirk: ALPHA_NOT_W is always part of the answer; further quirk
 * bits depend on the custom-border-color and border-color-swizzle features
 */
621 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK: {
622 enum pipe_quirk_texture_border_color_swizzle quirk = PIPE_QUIRK_TEXTURE_BORDER_COLOR_SWIZZLE_ALPHA_NOT_W;
623 if (!screen->info.border_color_feats.customBorderColorWithoutFormat)
624 return quirk | PIPE_QUIRK_TEXTURE_BORDER_COLOR_SWIZZLE_FREEDRENO;
625 /* assume that if drivers don't implement this extension they either:
626 * - don't support custom border colors
627 * - handle things correctly
628 * - hate border color accuracy
630 if (screen->info.have_EXT_border_color_swizzle &&
631 !screen->info.border_swizzle_feats.borderColorSwizzleFromImage)
632 return quirk | PIPE_QUIRK_TEXTURE_BORDER_COLOR_SWIZZLE_NV50;
636 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
637 return screen->info.props.limits.maxImageDimension2D;
638 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
639 return 1 + util_logbase2(screen->info.props.limits.maxImageDimension3D);
640 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
641 return 1 + util_logbase2(screen->info.props.limits.maxImageDimensionCube);
643 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
644 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
647 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
648 case PIPE_CAP_INDEP_BLEND_ENABLE:
649 case PIPE_CAP_INDEP_BLEND_FUNC:
650 return screen->info.feats.features.independentBlend;
652 case PIPE_CAP_DITHERING:
655 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
656 return screen->info.have_EXT_transform_feedback ? screen->info.tf_props.maxTransformFeedbackBuffers : 0;
657 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
658 case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
659 return screen->info.have_EXT_transform_feedback;
661 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
662 return screen->info.props.limits.maxImageArrayLayers;
664 case PIPE_CAP_DEPTH_CLIP_DISABLE:
665 return !screen->driver_workarounds.depth_clip_control_missing;
667 case PIPE_CAP_SHADER_STENCIL_EXPORT:
668 return screen->info.have_EXT_shader_stencil_export;
670 case PIPE_CAP_VS_INSTANCEID:
671 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
672 case PIPE_CAP_SEAMLESS_CUBE_MAP:
675 case PIPE_CAP_MIN_TEXEL_OFFSET:
676 return screen->info.props.limits.minTexelOffset;
677 case PIPE_CAP_MAX_TEXEL_OFFSET:
678 return screen->info.props.limits.maxTexelOffset;
680 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
683 case PIPE_CAP_CONDITIONAL_RENDER:
686 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
687 case PIPE_CAP_GLSL_FEATURE_LEVEL:
690 case PIPE_CAP_COMPUTE:
693 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
694 return screen->info.props.limits.minUniformBufferOffsetAlignment;
696 case PIPE_CAP_QUERY_TIMESTAMP:
697 return screen->timestamp_valid_bits > 0;
699 case PIPE_CAP_QUERY_TIMESTAMP_BITS:
700 return screen->timestamp_valid_bits;
702 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
703 return 1 << MIN_SLAB_ORDER;
705 case PIPE_CAP_CUBE_MAP_ARRAY:
706 return screen->info.feats.features.imageCubeArray;
708 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
709 case PIPE_CAP_PRIMITIVE_RESTART:
712 case PIPE_CAP_BINDLESS_TEXTURE:
713 return screen->info.have_EXT_descriptor_indexing;
715 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
716 return screen->info.props.limits.minTexelBufferOffsetAlignment;
718 case PIPE_CAP_TEXTURE_TRANSFER_MODES: {
719 enum pipe_texture_transfer_mode mode = PIPE_TEXTURE_TRANSFER_BLIT;
720 if (!screen->is_cpu &&
721 /* this needs substantial perf tuning */
722 screen->info.driver_props.driverID != VK_DRIVER_ID_MESA_TURNIP &&
723 screen->info.have_KHR_8bit_storage &&
724 screen->info.have_KHR_16bit_storage &&
725 screen->info.have_KHR_shader_float16_int8)
726 mode |= PIPE_TEXTURE_TRANSFER_COMPUTE;
/* bounded by both the smallest buffer heap and the Vulkan texel-buffer limit */
730 case PIPE_CAP_MAX_TEXEL_BUFFER_ELEMENTS_UINT:
731 return MIN2(get_smallest_buffer_heap(screen),
732 screen->info.props.limits.maxTexelBufferElements);
734 case PIPE_CAP_ENDIANNESS:
735 return PIPE_ENDIAN_NATIVE; /* unsure */
737 case PIPE_CAP_MAX_VIEWPORTS:
738 return MIN2(screen->info.props.limits.maxViewports, PIPE_MAX_VIEWPORTS);
740 case PIPE_CAP_IMAGE_LOAD_FORMATTED:
741 return screen->info.feats.features.shaderStorageImageReadWithoutFormat;
743 case PIPE_CAP_IMAGE_STORE_FORMATTED:
744 return screen->info.feats.features.shaderStorageImageWriteWithoutFormat;
746 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
749 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
750 return screen->info.props.limits.maxGeometryOutputVertices;
751 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
752 return screen->info.props.limits.maxGeometryTotalOutputComponents;
754 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
757 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
758 return screen->info.props.limits.minTexelGatherOffset;
759 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
760 return screen->info.props.limits.maxTexelGatherOffset;
762 case PIPE_CAP_SAMPLER_REDUCTION_MINMAX_ARB:
763 return screen->info.feats12.samplerFilterMinmax || screen->info.have_EXT_sampler_filter_minmax;
765 case PIPE_CAP_FS_FINE_DERIVATIVE:
768 case PIPE_CAP_VENDOR_ID:
769 return screen->info.props.vendorID;
770 case PIPE_CAP_DEVICE_ID:
771 return screen->info.props.deviceID;
773 case PIPE_CAP_ACCELERATED:
774 return !screen->is_cpu;
/* device-local heap total, shifted right by 20 bits (bytes to MiB) */
775 case PIPE_CAP_VIDEO_MEMORY:
776 return get_video_mem(screen) >> 20;
778 return screen->info.props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
780 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
781 return screen->info.props.limits.maxVertexInputBindingStride;
783 case PIPE_CAP_SAMPLER_VIEW_TARGET:
/* layer/viewport output outside geometry shaders: the EXT extension, or
 * SPIR-V 1.5 together with both Vulkan 1.2 feature bits
 */
786 case PIPE_CAP_VS_LAYER_VIEWPORT:
787 case PIPE_CAP_TES_LAYER_VIEWPORT:
788 return screen->info.have_EXT_shader_viewport_index_layer ||
789 (screen->spirv_version >= SPIRV_VERSION(1, 5) &&
790 screen->info.feats12.shaderOutputLayer &&
791 screen->info.feats12.shaderOutputViewportIndex);
793 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
794 return have_fp32_filter_linear(screen);
796 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
799 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
800 return screen->info.props.limits.minStorageBufferOffsetAlignment;
802 case PIPE_CAP_PCI_GROUP:
803 case PIPE_CAP_PCI_BUS:
804 case PIPE_CAP_PCI_DEVICE:
805 case PIPE_CAP_PCI_FUNCTION:
806 return 0; /* TODO: figure these out */
808 case PIPE_CAP_CULL_DISTANCE:
809 return screen->info.feats.features.shaderCullDistance;
/* sparse caps: each is gated on the matching sparse feature bit and otherwise 0;
 * several reuse the answer of another capability by calling zink_get_param() again
 */
811 case PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE:
812 return screen->info.feats.features.sparseBinding ? ZINK_SPARSE_BUFFER_PAGE_SIZE : 0;
815 case PIPE_CAP_MAX_SPARSE_TEXTURE_SIZE:
816 return screen->info.feats.features.sparseResidencyImage2D ?
817 zink_get_param(pscreen, PIPE_CAP_MAX_TEXTURE_2D_SIZE) : 0;
818 case PIPE_CAP_MAX_SPARSE_3D_TEXTURE_SIZE:
819 return screen->info.feats.features.sparseResidencyImage3D ?
820 (1 << (zink_get_param(pscreen, PIPE_CAP_MAX_TEXTURE_3D_LEVELS) - 1)) : 0;
821 case PIPE_CAP_MAX_SPARSE_ARRAY_TEXTURE_LAYERS:
822 return screen->info.feats.features.sparseResidencyImage2D ?
823 zink_get_param(pscreen, PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS) : 0;
824 case PIPE_CAP_SPARSE_TEXTURE_FULL_ARRAY_CUBE_MIPMAPS:
825 return screen->info.feats.features.sparseResidencyImage2D ? 1 : 0;
826 case PIPE_CAP_QUERY_SPARSE_TEXTURE_RESIDENCY:
827 case PIPE_CAP_CLAMP_SPARSE_TEXTURE_LOD:
828 return screen->info.feats.features.sparseResidency2Samples ? 1 : 0;
830 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
831 return screen->info.props.limits.viewportSubPixelBits;
833 case PIPE_CAP_MAX_GS_INVOCATIONS:
834 return screen->info.props.limits.maxGeometryShaderInvocations;
836 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
837 /* gallium handles this automatically */
/* NOTE(review): the value returned below is the smaller of the smallest buffer
 * heap and maxStorageBufferRange - confirm that matches the "clamp" remark
 */
840 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE_UINT:
841 /* 1<<27 is required by VK spec */
842 assert(screen->info.props.limits.maxStorageBufferRange >= 1 << 27);
843 /* clamp to VK spec minimum */
844 return MIN2(get_smallest_buffer_heap(screen), screen->info.props.limits.maxStorageBufferRange);
846 case PIPE_CAP_FS_COORD_ORIGIN_UPPER_LEFT:
847 case PIPE_CAP_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
850 case PIPE_CAP_FS_COORD_ORIGIN_LOWER_LEFT:
851 case PIPE_CAP_FS_COORD_PIXEL_CENTER_INTEGER:
854 case PIPE_CAP_NIR_COMPACT_ARRAYS:
857 case PIPE_CAP_FS_FACE_IS_INTEGER_SYSVAL:
860 case PIPE_CAP_VIEWPORT_TRANSFORM_LOWERED:
863 case PIPE_CAP_FLATSHADE:
864 case PIPE_CAP_ALPHA_TEST:
865 case PIPE_CAP_CLIP_PLANES:
866 case PIPE_CAP_POINT_SIZE_FIXED:
867 case PIPE_CAP_TWO_SIDED_COLOR:
/* component limits are divided by 4 to express them as vec4 slots */
870 case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:
871 return screen->info.props.limits.maxTessellationControlPerVertexOutputComponents / 4;
872 case PIPE_CAP_MAX_VARYINGS:
873 /* need to reserve up to 60 of our varying components and 16 slots for streamout */
874 return MIN2(screen->info.props.limits.maxVertexOutputComponents / 4 / 2, 16);
/* dma-buf sharing needs all three extensions */
876 case PIPE_CAP_DMABUF:
877 return screen->info.have_KHR_external_memory_fd &&
878 screen->info.have_EXT_external_memory_dma_buf &&
879 screen->info.have_EXT_queue_family_foreign;
881 case PIPE_CAP_DEPTH_BOUNDS_TEST:
882 return screen->info.feats.features.depthBounds;
884 case PIPE_CAP_POST_DEPTH_COVERAGE:
885 return screen->info.have_EXT_post_depth_coverage;
887 case PIPE_CAP_STRING_MARKER:
888 return screen->instance_info.have_EXT_debug_utils;
/* anything not handled above gets the shared gallium default */
891 return u_pipe_screen_get_param_defaults(pscreen, param);
/* Answers a floating-point gallium capability query (enum pipe_capf).
 *
 * Line-width caps are gated on the wideLines feature, point-size caps on
 * largePoints and the anisotropy cap on samplerAnisotropy; when the feature
 * is present the matching Vulkan device limit is reported.
 */
896 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
898 struct zink_screen *screen = zink_screen(pscreen);
/* minimum line width: the device's lower bound, but never below 0.01 */
901 case PIPE_CAPF_MIN_LINE_WIDTH:
902 case PIPE_CAPF_MIN_LINE_WIDTH_AA:
903 if (!screen->info.feats.features.wideLines)
905 return MAX2(screen->info.props.limits.lineWidthRange[0], 0.01);
/* minimum point size: the device's lower bound, but never below 0.01 */
907 case PIPE_CAPF_MIN_POINT_SIZE:
908 case PIPE_CAPF_MIN_POINT_SIZE_AA:
909 if (!screen->info.feats.features.largePoints)
911 return MAX2(screen->info.props.limits.pointSizeRange[0], 0.01);
914 case PIPE_CAPF_LINE_WIDTH_GRANULARITY:
915 if (!screen->info.feats.features.wideLines)
917 return screen->info.props.limits.lineWidthGranularity;
919 case PIPE_CAPF_POINT_SIZE_GRANULARITY:
920 if (!screen->info.feats.features.largePoints)
922 return screen->info.props.limits.pointSizeGranularity;
/* maxima come from the upper end of the corresponding Vulkan range */
925 case PIPE_CAPF_MAX_LINE_WIDTH:
926 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
927 if (!screen->info.feats.features.wideLines)
929 return screen->info.props.limits.lineWidthRange[1];
931 case PIPE_CAPF_MAX_POINT_SIZE:
932 case PIPE_CAPF_MAX_POINT_SIZE_AA:
933 if (!screen->info.feats.features.largePoints)
935 return screen->info.props.limits.pointSizeRange[1];
937 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
938 if (!screen->info.feats.features.samplerAnisotropy)
940 return screen->info.props.limits.maxSamplerAnisotropy;
942 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
943 return screen->info.props.limits.maxSamplerLodBias;
945 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
946 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
947 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
948 return 0.0f; /* not implemented */
951 /* should only get here on unhandled cases */
956 zink_get_shader_param(struct pipe_screen *pscreen,
957 gl_shader_stage shader,
958 enum pipe_shader_cap param)
960 struct zink_screen *screen = zink_screen(pscreen);
963 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
965 case MESA_SHADER_FRAGMENT:
966 case MESA_SHADER_VERTEX:
968 case MESA_SHADER_TESS_CTRL:
969 case MESA_SHADER_TESS_EVAL:
970 if (screen->info.feats.features.tessellationShader &&
971 screen->info.have_KHR_maintenance2)
975 case MESA_SHADER_GEOMETRY:
976 if (screen->info.feats.features.geometryShader)
980 case MESA_SHADER_COMPUTE:
986 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
987 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
988 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
989 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
992 case PIPE_SHADER_CAP_MAX_INPUTS: {
995 case MESA_SHADER_VERTEX:
996 max = MIN2(screen->info.props.limits.maxVertexInputAttributes, PIPE_MAX_ATTRIBS);
998 case MESA_SHADER_TESS_CTRL:
999 max = screen->info.props.limits.maxTessellationControlPerVertexInputComponents / 4;
1001 case MESA_SHADER_TESS_EVAL:
1002 max = screen->info.props.limits.maxTessellationEvaluationInputComponents / 4;
1004 case MESA_SHADER_GEOMETRY:
1005 max = screen->info.props.limits.maxGeometryInputComponents / 4;
1007 case MESA_SHADER_FRAGMENT:
1008 /* intel drivers report fewer components, but it's a value that's compatible
1009 * with what we need for GL, so we can still force a conformant value here
1011 if (screen->info.driver_props.driverID == VK_DRIVER_ID_INTEL_OPEN_SOURCE_MESA ||
1012 screen->info.driver_props.driverID == VK_DRIVER_ID_INTEL_PROPRIETARY_WINDOWS)
1014 max = screen->info.props.limits.maxFragmentInputComponents / 4;
1017 return 0; /* unsupported stage */
1020 case MESA_SHADER_VERTEX:
1021 case MESA_SHADER_TESS_EVAL:
1022 case MESA_SHADER_GEOMETRY:
1023 /* last vertex stage must support streamout, and this is capped in glsl compiler */
1024 return MIN2(max, MAX_VARYING);
1027 return MIN2(max, 64); // prevent overflowing struct shader_info::inputs_read
1030 case PIPE_SHADER_CAP_MAX_OUTPUTS: {
1033 case MESA_SHADER_VERTEX:
1034 max = screen->info.props.limits.maxVertexOutputComponents / 4;
1036 case MESA_SHADER_TESS_CTRL:
1037 max = screen->info.props.limits.maxTessellationControlPerVertexOutputComponents / 4;
1039 case MESA_SHADER_TESS_EVAL:
1040 max = screen->info.props.limits.maxTessellationEvaluationOutputComponents / 4;
1042 case MESA_SHADER_GEOMETRY:
1043 max = screen->info.props.limits.maxGeometryOutputComponents / 4;
1045 case MESA_SHADER_FRAGMENT:
1046 max = screen->info.props.limits.maxColorAttachments;
1049 return 0; /* unsupported stage */
1051 return MIN2(max, 64); // prevent overflowing struct shader_info::outputs_read/written
1054 case PIPE_SHADER_CAP_MAX_CONST_BUFFER0_SIZE:
1055 /* At least 16384 is guaranteed by VK spec */
1056 assert(screen->info.props.limits.maxUniformBufferRange >= 16384);
1057 /* but Gallium can't handle values that are too big */
1058 return MIN3(get_smallest_buffer_heap(screen),
1059 screen->info.props.limits.maxUniformBufferRange, BITFIELD_BIT(31));
1061 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
1062 return MIN2(screen->info.props.limits.maxPerStageDescriptorUniformBuffers,
1063 PIPE_MAX_CONSTANT_BUFFERS);
1065 case PIPE_SHADER_CAP_MAX_TEMPS:
1068 case PIPE_SHADER_CAP_INTEGERS:
1071 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
1072 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
1073 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
1074 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
1077 case PIPE_SHADER_CAP_SUBROUTINES:
1078 case PIPE_SHADER_CAP_INT64_ATOMICS:
1079 case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
1080 return 0; /* not implemented */
1082 case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:
1083 //enabling this breaks GTF-GL46.gtf21.GL2Tests.glGetUniform.glGetUniform
1084 //return screen->info.feats11.uniformAndStorageBuffer16BitAccess ||
1085 //(screen->info.have_KHR_16bit_storage && screen->info.storage_16bit_feats.uniformAndStorageBuffer16BitAccess);
1087 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
1088 return 0; //spirv requires 32bit derivative srcs and dests
1089 case PIPE_SHADER_CAP_FP16:
1090 return screen->info.feats12.shaderFloat16 ||
1091 (screen->info.have_KHR_shader_float16_int8 &&
1092 screen->info.shader_float16_int8_feats.shaderFloat16);
1094 case PIPE_SHADER_CAP_INT16:
1095 return screen->info.feats.features.shaderInt16;
1097 case PIPE_SHADER_CAP_PREFERRED_IR:
1098 return PIPE_SHADER_IR_NIR;
1100 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
1101 return 0; /* not implemented */
1103 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
1104 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
1105 return MIN2(MIN2(screen->info.props.limits.maxPerStageDescriptorSamplers,
1106 screen->info.props.limits.maxPerStageDescriptorSampledImages),
1109 case PIPE_SHADER_CAP_DROUND_SUPPORTED:
1110 case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
1111 return 0; /* not implemented */
1113 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
1114 return 0; /* no idea */
1116 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
1118 case MESA_SHADER_VERTEX:
1119 case MESA_SHADER_TESS_CTRL:
1120 case MESA_SHADER_TESS_EVAL:
1121 case MESA_SHADER_GEOMETRY:
1122 if (!screen->info.feats.features.vertexPipelineStoresAndAtomics)
1126 case MESA_SHADER_FRAGMENT:
1127 if (!screen->info.feats.features.fragmentStoresAndAtomics)
1135 /* TODO: this limitation is dumb, and will need some fixes in mesa */
1136 return MIN2(screen->info.props.limits.maxPerStageDescriptorStorageBuffers, PIPE_MAX_SHADER_BUFFERS);
1138 case PIPE_SHADER_CAP_SUPPORTED_IRS:
1139 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
1141 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
1142 if (screen->info.feats.features.shaderStorageImageExtendedFormats &&
1143 screen->info.feats.features.shaderStorageImageWriteWithoutFormat)
1144 return MIN2(screen->info.props.limits.maxPerStageDescriptorStorageImages,
1145 ZINK_MAX_SHADER_IMAGES);
1148 case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
1149 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
1150 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
1151 return 0; /* not implemented */
1152 case PIPE_SHADER_CAP_CONT_SUPPORTED:
1156 /* should only get here on unhandled cases */
// Translate a numeric sample count into the matching single-bit
// VK_SAMPLE_COUNT_n_BIT flag. The visible cases cover the power-of-two
// counts 1 through 64.
// NOTE(review): the handling of any other count (the switch's fall-through
// path) is not visible in this excerpt; confirm what it returns.
1160 static VkSampleCountFlagBits
1161 vk_sample_count_flags(uint32_t sample_count)
1163 switch (sample_count) {
1164 case 1: return VK_SAMPLE_COUNT_1_BIT;
1165 case 2: return VK_SAMPLE_COUNT_2_BIT;
1166 case 4: return VK_SAMPLE_COUNT_4_BIT;
1167 case 8: return VK_SAMPLE_COUNT_8_BIT;
1168 case 16: return VK_SAMPLE_COUNT_16_BIT;
1169 case 32: return VK_SAMPLE_COUNT_32_BIT;
1170 case 64: return VK_SAMPLE_COUNT_64_BIT;
// Size heuristic answering the "is a compute copy faster" query: the visible
// return statement yields true when width * height * depth exceeds 64 * 64.
// The source and destination formats are not consulted by any visible line.
// NOTE(review): the remaining parameters (including width/height/depth) and
// the return type are declared on lines not visible in this excerpt.
1177 zink_is_compute_copy_faster(struct pipe_screen *pscreen,
1178 enum pipe_format src_format,
1179 enum pipe_format dst_format,
1186 /* very basic for now, probably even worse for some cases,
1187 * but fixes lots of others
1189 return width * height * depth > 64 * 64;
// Decide whether `format` can be used with the requested target, sample
// counts and bind flags on this screen. The checks consult the device limits
// in screen->info.props.limits and the per-format features cached in
// screen->format_props.
// NOTE(review): most of the statements guarded by the conditions below
// (presumably early returns), the last parameter declaration (`bind`) and the
// return type are on lines not visible in this excerpt, so the comments here
// describe the conditions only.
1194 zink_is_format_supported(struct pipe_screen *pscreen,
1195 enum pipe_format format,
1196 enum pipe_texture_target target,
1197 unsigned sample_count,
1198 unsigned storage_sample_count,
1201 struct zink_screen *screen = zink_screen(pscreen);
// multisampled shader images depend on the shaderStorageImageMultisample feature
1203 if (storage_sample_count && !screen->info.feats.features.shaderStorageImageMultisample && bind & PIPE_BIND_SHADER_IMAGE)
// no format at all: only the sample count is tested, against the
// attachment-less framebuffer limit
1206 if (format == PIPE_FORMAT_NONE)
1207 return screen->info.props.limits.framebufferNoAttachmentsSampleCounts &
1208 vk_sample_count_flags(sample_count);
// index buffers: 8-bit indices depend on EXT_index_type_uint8, and the second
// test singles out anything other than R8/R16/R32_UINT
1210 if (bind & PIPE_BIND_INDEX_BUFFER) {
1211 if (format == PIPE_FORMAT_R8_UINT &&
1212 !screen->info.have_EXT_index_type_uint8)
1214 if (format != PIPE_FORMAT_R8_UINT &&
1215 format != PIPE_FORMAT_R16_UINT &&
1216 format != PIPE_FORMAT_R32_UINT)
1220 VkFormat vkformat = zink_get_format(screen, format);
1221 if (vkformat == VK_FORMAT_UNDEFINED)
// sample-count checks: the flag bit for the requested count is compared
// against the per-usage sample-count limits, chosen by format class
// (depth/stencil, pure integer, other color)
1224 if (sample_count >= 1) {
1225 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
1228 const struct util_format_description *desc = util_format_description(format);
1229 if (util_format_is_depth_or_stencil(format)) {
1230 if (util_format_has_depth(desc)) {
1231 if (bind & PIPE_BIND_DEPTH_STENCIL &&
1232 (screen->info.props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
1234 if (bind & PIPE_BIND_SAMPLER_VIEW &&
1235 (screen->info.props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
1238 if (util_format_has_stencil(desc)) {
1239 if (bind & PIPE_BIND_DEPTH_STENCIL &&
1240 (screen->info.props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
1242 if (bind & PIPE_BIND_SAMPLER_VIEW &&
1243 (screen->info.props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
1246 } else if (util_format_is_pure_integer(format)) {
1247 if (bind & PIPE_BIND_RENDER_TARGET &&
1248 !(screen->info.props.limits.framebufferColorSampleCounts & sample_mask))
1250 if (bind & PIPE_BIND_SAMPLER_VIEW &&
1251 !(screen->info.props.limits.sampledImageIntegerSampleCounts & sample_mask))
1254 if (bind & PIPE_BIND_RENDER_TARGET &&
1255 !(screen->info.props.limits.framebufferColorSampleCounts & sample_mask))
1257 if (bind & PIPE_BIND_SAMPLER_VIEW &&
1258 !(screen->info.props.limits.sampledImageColorSampleCounts & sample_mask))
1261 if (bind & PIPE_BIND_SHADER_IMAGE) {
1262 if (!(screen->info.props.limits.storageImageSampleCounts & sample_mask))
// from here on the checks use the format features cached per pipe format
1267 VkFormatProperties props = screen->format_props[format];
// buffer targets are tested against bufferFeatures
1269 if (target == PIPE_BUFFER) {
1270 if (bind & PIPE_BIND_VERTEX_BUFFER) {
1271 if (!(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT)) {
// not usable directly as a vertex format: test the decomposed format instead
1272 enum pipe_format new_format = zink_decompose_vertex_format(format);
1275 if (!(screen->format_props[new_format].bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
1280 if (bind & PIPE_BIND_SAMPLER_VIEW &&
1281 !(props.bufferFeatures & VK_FORMAT_FEATURE_UNIFORM_TEXEL_BUFFER_BIT))
1284 if (bind & PIPE_BIND_SHADER_IMAGE &&
1285 !(props.bufferFeatures & VK_FORMAT_FEATURE_STORAGE_TEXEL_BUFFER_BIT))
1288 /* all other targets are texture-targets */
1289 if (bind & PIPE_BIND_RENDER_TARGET &&
1290 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
1293 if (bind & PIPE_BIND_BLENDABLE &&
1294 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
1297 if (bind & PIPE_BIND_SAMPLER_VIEW &&
1298 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
1301 if (bind & PIPE_BIND_SAMPLER_REDUCTION_MINMAX &&
1302 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_MINMAX_BIT))
1305 if ((bind & PIPE_BIND_SAMPLER_VIEW) || (bind & PIPE_BIND_RENDER_TARGET)) {
1306 /* if this is a 3-component texture, force gallium to give us 4 components by rejecting this one */
1307 const struct util_format_description *desc = util_format_description(format);
1308 if (desc->nr_channels == 3 &&
1309 (desc->block.bits == 24 || desc->block.bits == 48 || desc->block.bits == 96))
1313 if (bind & PIPE_BIND_DEPTH_STENCIL &&
1314 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
1317 if (bind & PIPE_BIND_SHADER_IMAGE &&
1318 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_STORAGE_IMAGE_BIT))
// Tear down a zink_screen. In the order visible below: display targets and
// their lock, the copy context, the debug-utils messenger, the vertex-state
// cache, the transfer helper, the cache worker queues and disk cache, the BO
// allocator, the live shader cache, descriptor layouts, the Vulkan
// semaphore/fence, the flush queue, the Vulkan device and instance, the
// buffer id allocator, the loader library handle, the DRM fd, the transfer
// slab pool, and finally the screen allocation itself.
// NOTE(review): several guards (around the semaphore/fence destruction) and
// the end of the ENABLE_SHADER_CACHE conditional are on lines not visible in
// this excerpt.
1326 zink_destroy_screen(struct pipe_screen *pscreen)
1328 struct zink_screen *screen = zink_screen(pscreen);
// release every display target still registered in screen->dts
1330 hash_table_foreach(&screen->dts, entry)
1331 zink_kopper_deinit_displaytarget(screen, entry->data);
1332 simple_mtx_destroy(&screen->dt_lock);
1334 if (screen->copy_context)
1335 screen->copy_context->base.destroy(&screen->copy_context->base);
1337 if (VK_NULL_HANDLE != screen->debugUtilsCallbackHandle) {
1338 VKSCR(DestroyDebugUtilsMessengerEXT)(screen->instance, screen->debugUtilsCallbackHandle, NULL);
1341 util_vertex_state_cache_deinit(&screen->vertex_state_cache);
1343 u_transfer_helper_destroy(pscreen->transfer_helper);
// drain the cache-get worker before destroying it
1344 util_queue_finish(&screen->cache_get_thread);
1345 util_queue_destroy(&screen->cache_get_thread);
1346 #ifdef ENABLE_SHADER_CACHE
1347 if (screen->disk_cache) {
// drain pending cache writes before the put queue goes away
1348 util_queue_finish(&screen->cache_put_thread);
1349 disk_cache_wait_for_idle(screen->disk_cache);
1350 util_queue_destroy(&screen->cache_put_thread);
1353 disk_cache_destroy(screen->disk_cache);
1354 zink_bo_deinit(screen);
1355 util_live_shader_cache_deinit(&screen->shaders);
1357 zink_descriptor_layouts_deinit(screen);
1360 VKSCR(DestroySemaphore)(screen->dev, screen->sem, NULL);
1363 VKSCR(DestroyFence)(screen->dev, screen->fence, NULL);
1365 if (screen->threaded)
1366 util_queue_destroy(&screen->flush_queue);
1368 simple_mtx_destroy(&screen->queue_lock);
// device-level objects above are destroyed before the device and instance
1369 VKSCR(DestroyDevice)(screen->dev, NULL);
1370 VKSCR(DestroyInstance)(screen->instance, NULL);
1371 util_idalloc_mt_fini(&screen->buffer_ids);
1373 util_dl_close(screen->loader_lib);
1374 if (screen->drm_fd != -1)
1375 close(screen->drm_fd);
1377 slab_destroy_parent(&screen->transfer_pool);
1378 ralloc_free(screen);
1379 glsl_type_singleton_decref();
// Enumerate the instance's physical devices, pick one into screen->pdev, and
// derive version information from it: screen->info.props and device_version,
// screen->vk_version (the lesser of device and loader version) and
// screen->spirv_version.
// Selection: when LIBGL_ALWAYS_SOFTWARE or D3D_ALWAYS_SOFTWARE is set, the
// loop looks for a CPU-type device; otherwise it keeps the device whose type
// has the highest prio_map value.
// NOTE(review): the malloc result is passed to vkEnumeratePhysicalDevices
// without a visible NULL check, and prio_map is indexed by props.deviceType
// guarded only by an assert. The declarations of idx/cur_prio, the branch
// structure inside the loop, what happens when cpu and is_cpu disagree, and
// the release of pdevs are on lines not visible in this excerpt.
1383 choose_pdev(struct zink_screen *screen)
1385 uint32_t i, pdev_count;
1386 VkPhysicalDevice *pdevs;
1387 bool is_cpu = false;
// first call only retrieves the device count
1388 VkResult result = VKSCR(EnumeratePhysicalDevices)(screen->instance, &pdev_count, NULL);
1389 if (result != VK_SUCCESS) {
1390 mesa_loge("ZINK: vkEnumeratePhysicalDevices failed (%s)", vk_Result_to_str(result));
1394 assert(pdev_count > 0);
// second call fills the freshly allocated handle array
1396 pdevs = malloc(sizeof(*pdevs) * pdev_count);
1397 result = VKSCR(EnumeratePhysicalDevices)(screen->instance, &pdev_count, pdevs);
1398 assert(result == VK_SUCCESS);
1399 assert(pdev_count > 0);
1401 VkPhysicalDeviceProperties props;
1402 bool cpu = debug_get_bool_option("LIBGL_ALWAYS_SOFTWARE", false) ||
1403 debug_get_bool_option("D3D_ALWAYS_SOFTWARE", false);
1404 /* priority when multiple drivers are available (highest to lowest):
1405 VK_PHYSICAL_DEVICE_TYPE_VIRTUAL_GPU
1406 VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU
1407 VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU
1408 VK_PHYSICAL_DEVICE_TYPE_CPU
1409 VK_PHYSICAL_DEVICE_TYPE_OTHER
1411 * users should specify VK_ICD_FILENAMES since this is a standardized variable
1412 * used by all vulkan applications
1414 unsigned prio_map[] = {
1415 [VK_PHYSICAL_DEVICE_TYPE_OTHER] = 0,
1416 [VK_PHYSICAL_DEVICE_TYPE_CPU] = 1,
1417 [VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU] = 2,
1418 [VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU] = 3,
1419 [VK_PHYSICAL_DEVICE_TYPE_VIRTUAL_GPU] = 4,
1423 for (i = 0; i < pdev_count; ++i) {
1424 VKSCR(GetPhysicalDeviceProperties)(pdevs[i], &props);
1427 /* if user wants cpu, only give them cpu */
1428 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_CPU) {
1430 cur_prio = prio_map[props.deviceType];
1434 assert(props.deviceType <= VK_PHYSICAL_DEVICE_TYPE_CPU);
1435 if (prio_map[props.deviceType] > cur_prio) {
1437 cur_prio = prio_map[props.deviceType];
// records whether the winning priority is the CPU one
1441 is_cpu = cur_prio == prio_map[VK_PHYSICAL_DEVICE_TYPE_CPU];
1445 screen->pdev = pdevs[idx];
1446 VKSCR(GetPhysicalDeviceProperties)(screen->pdev, &screen->info.props);
1447 screen->info.device_version = screen->info.props.apiVersion;
1449 /* runtime version is the lesser of the instance version and device version */
1450 screen->vk_version = MIN2(screen->info.device_version, screen->instance_info.loader_version);
1452 /* calculate SPIR-V version based on VK version */
1453 if (screen->vk_version >= VK_MAKE_VERSION(1, 2, 0))
1454 screen->spirv_version = SPIRV_VERSION(1, 5);
1455 else if (screen->vk_version >= VK_MAKE_VERSION(1, 1, 0))
1456 screen->spirv_version = SPIRV_VERSION(1, 3);
1458 screen->spirv_version = SPIRV_VERSION(1, 0);
// Query the queue family properties of screen->pdev and record queue family
// choices on the screen: a family with VK_QUEUE_GRAPHICS_BIT supplies
// gfx_queue (and the initial sparse_queue), max_queues and
// timestamp_valid_bits; if sparse_only ends up set, it replaces sparse_queue.
// NOTE(review): the malloc result is used without a visible NULL check. The
// statements that update found_gfx and sparse_only, and the release of
// props, are on lines not visible in this excerpt.
1465 update_queue_props(struct zink_screen *screen)
1467 uint32_t num_queues;
// first call only retrieves the family count
1468 VKSCR(GetPhysicalDeviceQueueFamilyProperties)(screen->pdev, &num_queues, NULL);
1469 assert(num_queues > 0);
1471 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
1472 VKSCR(GetPhysicalDeviceQueueFamilyProperties)(screen->pdev, &num_queues, props);
1474 bool found_gfx = false;
// UINT32_MAX marks "no such family found"
1475 uint32_t sparse_only = UINT32_MAX;
1476 screen->sparse_queue = UINT32_MAX;
1477 for (uint32_t i = 0; i < num_queues; i++) {
1478 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
1481 screen->sparse_queue = screen->gfx_queue = i;
1482 screen->max_queues = props[i].queueCount;
1483 screen->timestamp_valid_bits = props[i].timestampValidBits;
// only reached for families without the graphics bit
1485 } else if (props[i].queueFlags & VK_QUEUE_SPARSE_BINDING_BIT)
1488 if (sparse_only != UINT32_MAX)
1489 screen->sparse_queue = sparse_only;
// Initialise screen->queue_lock and fetch the device queue handles: queue
// index 0 of the graphics family into screen->queue, and, when the sparse
// family differs, queue index 0 of that family into screen->queue_sparse.
// NOTE(review): the final assignment aliases queue_sparse to the graphics
// queue; it is presumably the else branch of the comparison above, but the
// `else` line is not visible in this excerpt.
1494 init_queue(struct zink_screen *screen)
1496 simple_mtx_init(&screen->queue_lock, mtx_plain);
1497 VKSCR(GetDeviceQueue)(screen->dev, screen->gfx_queue, 0, &screen->queue);
1498 if (screen->sparse_queue != screen->gfx_queue)
1499 VKSCR(GetDeviceQueue)(screen->dev, screen->sparse_queue, 0, &screen->queue_sparse);
1501 screen->queue_sparse = screen->queue;
// Present a swapchain-backed resource. If the resource's swapchain image has
// not been acquired yet, it is acquired and prepared for presentation first;
// any pending acquire/present work is then flushed with
// PIPE_FLUSH_END_OF_FRAME (waiting for the flush to complete when the screen
// is threaded), and the resource is queued for presentation.
// level, layer, winsys_drawable_handle and sub_box are not read by any
// visible line.
// NOTE(review): the statement taken when the resource is not a swapchain
// (presumably an early return) and the return type are on lines not visible
// in this excerpt.
1505 zink_flush_frontbuffer(struct pipe_screen *pscreen,
1506 struct pipe_context *pctx,
1507 struct pipe_resource *pres,
1508 unsigned level, unsigned layer,
1509 void *winsys_drawable_handle,
1510 struct pipe_box *sub_box)
1512 struct zink_screen *screen = zink_screen(pscreen);
1513 struct zink_resource *res = zink_resource(pres);
1514 struct zink_context *ctx = zink_context(pctx);
1516 /* if the surface is no longer a swapchain, this is a no-op */
1517 if (!zink_is_swapchain(res))
// replace ctx with the unwrapped context (pctx may be a threaded-context wrapper)
1520 ctx = zink_tc_context_unwrap(pctx, screen->threaded);
1522 if (!zink_kopper_acquired(res->obj->dt, res->obj->dt_idx)) {
1523 /* swapbuffers to an undefined surface: acquire and present garbage */
1524 zink_kopper_acquire(ctx, res, UINT64_MAX);
1525 ctx->needs_present = res;
1526 /* set batch usage to submit acquire semaphore */
1527 zink_batch_resource_usage_set(&ctx->batch, res, true, false);
1528 /* ensure the resource is set up to present garbage */
1529 ctx->base.flush_resource(&ctx->base, pres);
1532 /* handle any outstanding acquire submits (not just from above) */
1533 if (ctx->batch.swapchain || ctx->needs_present) {
// mark the batch as having work so the flush below is not skipped
1534 ctx->batch.has_work = true;
1535 pctx->flush(pctx, NULL, PIPE_FLUSH_END_OF_FRAME);
1536 if (ctx->last_fence && screen->threaded) {
1537 struct zink_batch_state *bs = zink_batch_state(ctx->last_fence);
1538 util_queue_fence_wait(&bs->flush_completed);
1542 /* always verify that this was acquired */
1543 assert(zink_kopper_acquired(res->obj->dt, res->obj->dt_idx));
1544 zink_kopper_present_queue(screen, res);
// Query the physical device's format properties for `format` and return
// whether either the linear or the optimal tiling features include
// VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT.
// This queries the device directly rather than reading screen->format_props.
1548 zink_is_depth_format_supported(struct zink_screen *screen, VkFormat format)
1550 VkFormatProperties props;
1551 VKSCR(GetPhysicalDeviceFormatProperties)(screen->pdev, format, &props);
1552 return (props.linearTilingFeatures | props.optimalTilingFeatures) &
1553 VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT;
// Map pipe formats whose fourth channel is unused padding (X) onto the
// equivalent format with a real alpha channel (A), for the 8-, 16- and
// 32-bit-per-channel variants listed below.
// NOTE(review): the switch header and the handling of formats not listed
// here are on lines not visible in this excerpt.
1556 static enum pipe_format
1557 emulate_x8(enum pipe_format format)
1559 /* convert missing Xn variants to An */
1561 case PIPE_FORMAT_B8G8R8X8_UNORM:
1562 return PIPE_FORMAT_B8G8R8A8_UNORM;
1564 case PIPE_FORMAT_B8G8R8X8_SRGB:
1565 return PIPE_FORMAT_B8G8R8A8_SRGB;
1566 case PIPE_FORMAT_R8G8B8X8_SRGB:
1567 return PIPE_FORMAT_R8G8B8A8_SRGB;
1569 case PIPE_FORMAT_R8G8B8X8_SINT:
1570 return PIPE_FORMAT_R8G8B8A8_SINT;
1571 case PIPE_FORMAT_R8G8B8X8_SNORM:
1572 return PIPE_FORMAT_R8G8B8A8_SNORM;
1573 case PIPE_FORMAT_R8G8B8X8_UNORM:
1574 return PIPE_FORMAT_R8G8B8A8_UNORM;
1576 case PIPE_FORMAT_R16G16B16X16_FLOAT:
1577 return PIPE_FORMAT_R16G16B16A16_FLOAT;
1578 case PIPE_FORMAT_R16G16B16X16_SINT:
1579 return PIPE_FORMAT_R16G16B16A16_SINT;
1580 case PIPE_FORMAT_R16G16B16X16_SNORM:
1581 return PIPE_FORMAT_R16G16B16A16_SNORM;
1582 case PIPE_FORMAT_R16G16B16X16_UNORM:
1583 return PIPE_FORMAT_R16G16B16A16_UNORM;
1585 case PIPE_FORMAT_R32G32B32X32_FLOAT:
1586 return PIPE_FORMAT_R32G32B32A32_FLOAT;
1587 case PIPE_FORMAT_R32G32B32X32_SINT:
1588 return PIPE_FORMAT_R32G32B32A32_SINT;
// Translate a pipe_format into the VkFormat zink uses for it on this screen.
// The pipe format is first passed through the emulated-alpha mapping (except
// L4A4_UNORM when the broken_l4a4 workaround is set) and through emulate_x8,
// then a series of special cases substitutes other depth/stencil formats or
// rejects 4444 formats whose feature bit is missing.
// NOTE(review): the return type and the final return of `ret` are on lines
// not visible in this excerpt.
1596 zink_get_format(struct zink_screen *screen, enum pipe_format format)
1598 if (!screen->driver_workarounds.broken_l4a4 || format != PIPE_FORMAT_L4A4_UNORM)
1599 format = zink_format_get_emulated_alpha(format);
1601 VkFormat ret = zink_pipe_format_to_vk_format(emulate_x8(format));
1603 if (format == PIPE_FORMAT_X32_S8X24_UINT &&
1604 screen->have_D32_SFLOAT_S8_UINT)
1605 return VK_FORMAT_D32_SFLOAT_S8_UINT;
1607 if (format == PIPE_FORMAT_X24S8_UINT)
1608 /* valid when using aspects to extract stencil,
1609 * fails format test because it's emulated */
1610 ret = VK_FORMAT_D24_UNORM_S8_UINT;
// 24-bit depth formats fall back to 32-bit float depth when the screen
// does not have them; the asserts document the expected fallback support
1612 if (ret == VK_FORMAT_X8_D24_UNORM_PACK32 &&
1613 !screen->have_X8_D24_UNORM_PACK32) {
1614 assert(zink_is_depth_format_supported(screen, VK_FORMAT_D32_SFLOAT));
1615 return VK_FORMAT_D32_SFLOAT;
1618 if (ret == VK_FORMAT_D24_UNORM_S8_UINT &&
1619 !screen->have_D24_UNORM_S8_UINT) {
1620 assert(screen->have_D32_SFLOAT_S8_UINT);
1621 return VK_FORMAT_D32_SFLOAT_S8_UINT;
// 4444 formats are reported as undefined unless the matching
// format_4444_feats bit is set
1624 if ((ret == VK_FORMAT_A4B4G4R4_UNORM_PACK16 &&
1625 !screen->info.format_4444_feats.formatA4B4G4R4) ||
1626 (ret == VK_FORMAT_A4R4G4B4_UNORM_PACK16 &&
1627 !screen->info.format_4444_feats.formatA4R4G4B4))
1628 return VK_FORMAT_UNDEFINED;
1630 if (format == PIPE_FORMAT_R4A4_UNORM)
1631 return VK_FORMAT_R4G4_UNORM_PACK8;
// Query the calibrateable time domains of screen->pdev and look for
// VK_TIME_DOMAIN_DEVICE_EXT among them. Failures of either query are logged
// with mesa_loge.
// NOTE(review): the domains array holds 8 entries and the count returned by
// the first query is bounded only by an assert before the second query
// writes into it. The return type, the statements following the error logs
// and the result of the search are on lines not visible in this excerpt.
1637 check_have_device_time(struct zink_screen *screen)
1639 uint32_t num_domains = 0;
1640 VkTimeDomainEXT domains[8]; //current max is 4
// first call only retrieves the number of domains
1641 VkResult result = VKSCR(GetPhysicalDeviceCalibrateableTimeDomainsEXT)(screen->pdev, &num_domains, NULL);
1642 if (result != VK_SUCCESS) {
1643 mesa_loge("ZINK: vkGetPhysicalDeviceCalibrateableTimeDomainsEXT failed (%s)", vk_Result_to_str(result));
1645 assert(num_domains > 0);
1646 assert(num_domains < ARRAY_SIZE(domains));
1648 result = VKSCR(GetPhysicalDeviceCalibrateableTimeDomainsEXT)(screen->pdev, &num_domains, domains);
1649 if (result != VK_SUCCESS) {
1650 mesa_loge("ZINK: vkGetPhysicalDeviceCalibrateableTimeDomainsEXT failed (%s)", vk_Result_to_str(result));
1653 /* VK_TIME_DOMAIN_DEVICE_EXT is used for the ctx->get_timestamp hook and is the only one we really need */
1654 for (unsigned i = 0; i < num_domains; i++) {
1655 if (domains[i] == VK_TIME_DOMAIN_DEVICE_EXT) {
// Message sink used by zink_debug_util_callback for error-severity messages.
// NOTE(review): the body is not visible in this excerpt.
1664 zink_error(const char *msg)
// Message sink used by zink_debug_util_callback for warning-severity messages.
// NOTE(review): the body is not visible in this excerpt.
1669 zink_warn(const char *msg)
// Message sink used by zink_debug_util_callback for info-severity messages.
// NOTE(review): the body is not visible in this excerpt.
1674 zink_info(const char *msg)
// Message sink used by zink_debug_util_callback for messages that match none
// of the error, warning or info severities.
// NOTE(review): the body is not visible in this excerpt.
1679 zink_msg(const char *msg)
// Debug-utils messenger callback (installed by create_debug). Routes the
// message text to zink_error, zink_warn, zink_info or zink_msg depending on
// which severity bit is set, tested in that order. messageType is not read
// by any visible line.
// NOTE(review): the last parameter, the final `else`, and the value returned
// to the Vulkan layer are on lines not visible in this excerpt.
1683 static VKAPI_ATTR VkBool32 VKAPI_CALL
1684 zink_debug_util_callback(
1685 VkDebugUtilsMessageSeverityFlagBitsEXT messageSeverity,
1686 VkDebugUtilsMessageTypeFlagsEXT messageType,
1687 const VkDebugUtilsMessengerCallbackDataEXT *pCallbackData,
1690 // Pick message prefix and color to use.
1691 // Only MacOS and Linux have been tested for color support
1692 if (messageSeverity & VK_DEBUG_UTILS_MESSAGE_SEVERITY_ERROR_BIT_EXT) {
1693 zink_error(pCallbackData->pMessage);
1694 } else if (messageSeverity & VK_DEBUG_UTILS_MESSAGE_SEVERITY_WARNING_BIT_EXT) {
1695 zink_warn(pCallbackData->pMessage);
1696 } else if (messageSeverity & VK_DEBUG_UTILS_MESSAGE_SEVERITY_INFO_BIT_EXT) {
1697 zink_info(pCallbackData->pMessage);
1699 zink_msg(pCallbackData->pMessage);
// Create a debug-utils messenger that delivers messages of every severity
// (verbose, info, warning, error) and every type (general, validation,
// performance) to zink_debug_util_callback, and store its handle in
// screen->debugUtilsCallbackHandle. A creation failure is logged with
// mesa_loge; the handle then keeps its VK_NULL_HANDLE initial value unless
// the call wrote to it.
// NOTE(review): several initializer fields, two call arguments, the return
// type and the return value are on lines not visible in this excerpt.
1705 create_debug(struct zink_screen *screen)
// positional initializer: field order follows the Vulkan struct definition
1707 VkDebugUtilsMessengerCreateInfoEXT vkDebugUtilsMessengerCreateInfoEXT = {
1708 VK_STRUCTURE_TYPE_DEBUG_UTILS_MESSENGER_CREATE_INFO_EXT,
1711 VK_DEBUG_UTILS_MESSAGE_SEVERITY_VERBOSE_BIT_EXT |
1712 VK_DEBUG_UTILS_MESSAGE_SEVERITY_INFO_BIT_EXT |
1713 VK_DEBUG_UTILS_MESSAGE_SEVERITY_WARNING_BIT_EXT |
1714 VK_DEBUG_UTILS_MESSAGE_SEVERITY_ERROR_BIT_EXT,
1715 VK_DEBUG_UTILS_MESSAGE_TYPE_GENERAL_BIT_EXT |
1716 VK_DEBUG_UTILS_MESSAGE_TYPE_VALIDATION_BIT_EXT |
1717 VK_DEBUG_UTILS_MESSAGE_TYPE_PERFORMANCE_BIT_EXT,
1718 zink_debug_util_callback,
1722 VkDebugUtilsMessengerEXT vkDebugUtilsCallbackEXT = VK_NULL_HANDLE;
1724 VkResult result = VKSCR(CreateDebugUtilsMessengerEXT)(
1726 &vkDebugUtilsMessengerCreateInfoEXT,
1728 &vkDebugUtilsCallbackEXT);
1729 if (result != VK_SUCCESS) {
1730 mesa_loge("ZINK: vkCreateDebugUtilsMessengerEXT failed (%s)", vk_Result_to_str(result));
1733 screen->debugUtilsCallbackHandle = vkDebugUtilsCallbackEXT;
// MoltenVK-specific setup, compiled only when MVK_VERSION is defined.
// Looks up the MoltenVK entry points on the instance, prints the MoltenVK
// and Vulkan version strings when available, and enables
// fullImageViewSwizzle in the MoltenVK configuration (read-modify-write via
// the Get/Set configuration calls).
// NOTE(review): the statement taken when the MVK_moltenvk instance extension
// is absent, the return type and the return value are on lines not visible
// in this excerpt. The result of the Set call is not checked by any visible
// line.
1739 zink_internal_setup_moltenvk(struct zink_screen *screen)
1741 #if defined(MVK_VERSION)
1742 if (!screen->instance_info.have_MVK_moltenvk)
1745 GET_PROC_ADDR_INSTANCE_LOCAL(screen, screen->instance, GetMoltenVKConfigurationMVK);
1746 GET_PROC_ADDR_INSTANCE_LOCAL(screen, screen->instance, SetMoltenVKConfigurationMVK);
1747 GET_PROC_ADDR_INSTANCE_LOCAL(screen, screen->instance, GetVersionStringsMVK);
1749 if (vk_GetVersionStringsMVK) {
// buffers are zero-filled and one byte is held back from the size passed
// down, so the strings stay NUL-terminated
1750 char molten_version[64] = {0};
1751 char vulkan_version[64] = {0};
1753 vk_GetVersionStringsMVK(molten_version, sizeof(molten_version) - 1, vulkan_version, sizeof(vulkan_version) - 1);
1755 printf("zink: MoltenVK %s Vulkan %s \n", molten_version, vulkan_version);
1758 if (vk_GetMoltenVKConfigurationMVK && vk_SetMoltenVKConfigurationMVK) {
1759 MVKConfiguration molten_config = {0};
1760 size_t molten_config_size = sizeof(molten_config);
1762 VkResult res = vk_GetMoltenVKConfigurationMVK(screen->instance, &molten_config, &molten_config_size);
// VK_INCOMPLETE is accepted as well as VK_SUCCESS
1763 if (res == VK_SUCCESS || res == VK_INCOMPLETE) {
1764 // Needed to allow MoltenVK to accept VkImageView swizzles.
1765 // Encountered when using VK_FORMAT_R8G8_UNORM
1766 molten_config.fullImageViewSwizzle = VK_TRUE;
1767 vk_SetMoltenVKConfigurationMVK(screen->instance, &molten_config, &molten_config_size);
1770 #endif // MVK_VERSION
// Probe a fixed list of vertex formats with zink_is_format_supported
// (PIPE_BUFFER target, PIPE_BIND_VERTEX_BUFFER). For a format that reaches
// the decomposition step and whose decomposed form is supported,
// screen->need_decompose_attrs is set and a warning naming the device and
// the format is logged.
// NOTE(review): the statements taken when a format is already supported or
// has a single component (presumably `continue`), the terminators of the two
// "not supported by vk" block comments inside the list, and the end of the
// initializer are on lines not visible in this excerpt.
1776 check_vertex_formats(struct zink_screen *screen)
1779 enum pipe_format format_list[] = {
1780 /* not supported by vk
1781 PIPE_FORMAT_R32_FIXED,
1782 PIPE_FORMAT_R32G32_FIXED,
1783 PIPE_FORMAT_R32G32B32_FIXED,
1784 PIPE_FORMAT_R32G32B32A32_FIXED,
1786 PIPE_FORMAT_R16_FLOAT,
1787 PIPE_FORMAT_R16G16_FLOAT,
1788 PIPE_FORMAT_R16G16B16_FLOAT,
1789 PIPE_FORMAT_R16G16B16A16_FLOAT,
1790 /* not supported by vk
1791 PIPE_FORMAT_R64_FLOAT,
1792 PIPE_FORMAT_R64G64_FLOAT,
1793 PIPE_FORMAT_R64G64B64_FLOAT,
1794 PIPE_FORMAT_R64G64B64A64_FLOAT,
1795 PIPE_FORMAT_R32_UNORM,
1796 PIPE_FORMAT_R32G32_UNORM,
1797 PIPE_FORMAT_R32G32B32_UNORM,
1798 PIPE_FORMAT_R32G32B32A32_UNORM,
1799 PIPE_FORMAT_R32_SNORM,
1800 PIPE_FORMAT_R32G32_SNORM,
1801 PIPE_FORMAT_R32G32B32_SNORM,
1802 PIPE_FORMAT_R32G32B32A32_SNORM,
1803 PIPE_FORMAT_R32_USCALED,
1804 PIPE_FORMAT_R32G32_USCALED,
1805 PIPE_FORMAT_R32G32B32_USCALED,
1806 PIPE_FORMAT_R32G32B32A32_USCALED,
1807 PIPE_FORMAT_R32_SSCALED,
1808 PIPE_FORMAT_R32G32_SSCALED,
1809 PIPE_FORMAT_R32G32B32_SSCALED,
1810 PIPE_FORMAT_R32G32B32A32_SSCALED,
1812 PIPE_FORMAT_R16_UNORM,
1813 PIPE_FORMAT_R16G16_UNORM,
1814 PIPE_FORMAT_R16G16B16_UNORM,
1815 PIPE_FORMAT_R16G16B16A16_UNORM,
1816 PIPE_FORMAT_R16_SNORM,
1817 PIPE_FORMAT_R16G16_SNORM,
1818 PIPE_FORMAT_R16G16B16_SNORM,
1819 PIPE_FORMAT_R16G16B16_SINT,
1820 PIPE_FORMAT_R16G16B16_UINT,
1821 PIPE_FORMAT_R16G16B16A16_SNORM,
1822 PIPE_FORMAT_R16_USCALED,
1823 PIPE_FORMAT_R16G16_USCALED,
1824 PIPE_FORMAT_R16G16B16_USCALED,
1825 PIPE_FORMAT_R16G16B16A16_USCALED,
1826 PIPE_FORMAT_R16_SSCALED,
1827 PIPE_FORMAT_R16G16_SSCALED,
1828 PIPE_FORMAT_R16G16B16_SSCALED,
1829 PIPE_FORMAT_R16G16B16A16_SSCALED,
1830 PIPE_FORMAT_R8_UNORM,
1831 PIPE_FORMAT_R8G8_UNORM,
1832 PIPE_FORMAT_R8G8B8_UNORM,
1833 PIPE_FORMAT_R8G8B8A8_UNORM,
1834 PIPE_FORMAT_R8_SNORM,
1835 PIPE_FORMAT_R8G8_SNORM,
1836 PIPE_FORMAT_R8G8B8_SNORM,
1837 PIPE_FORMAT_R8G8B8A8_SNORM,
1838 PIPE_FORMAT_R8_USCALED,
1839 PIPE_FORMAT_R8G8_USCALED,
1840 PIPE_FORMAT_R8G8B8_USCALED,
1841 PIPE_FORMAT_R8G8B8A8_USCALED,
1842 PIPE_FORMAT_R8_SSCALED,
1843 PIPE_FORMAT_R8G8_SSCALED,
1844 PIPE_FORMAT_R8G8B8_SSCALED,
1845 PIPE_FORMAT_R8G8B8A8_SSCALED,
1847 for (unsigned i = 0; i < ARRAY_SIZE(format_list); i++) {
1848 if (zink_is_format_supported(&screen->base, format_list[i], PIPE_BUFFER, 0, 0, PIPE_BIND_VERTEX_BUFFER))
// single-component formats are singled out before the decomposition test
1850 if (util_format_get_nr_components(format_list[i]) == 1)
1852 enum pipe_format decomposed = zink_decompose_vertex_format(format_list[i]);
1853 if (zink_is_format_supported(&screen->base, decomposed, PIPE_BUFFER, 0, 0, PIPE_BIND_VERTEX_BUFFER)) {
1854 screen->need_decompose_attrs = true;
1855 mesa_logw("zink: this application would be much faster if %s supported vertex format %s", screen->info.props.deviceName, util_format_name(format_list[i]));
// Fill screen->format_props (and, with EXT_image_drm_format_modifier,
// screen->modifier_props) for every pipe format, then derive a few
// screen-wide flags:
//  - per format: query VkFormatProperties, via the "2" entry point with
//    chained FORMAT_PROPERTIES_3 and DRM modifier list structs when that
//    entry point is available, otherwise via the plain query;
//  - emulated-alpha formats lose the color-attachment and storage-image
//    bits and all buffer features;
//  - check_vertex_formats() is run once all formats are populated;
//  - need_2D_zs is set when the D32_SFLOAT image-format query does not
//    return VK_SUCCESS;
//  - need_2D_sparse is set from the sparse page-size query for 1D textures.
// NOTE(review): the NULL test after ralloc_array checks
// mod_props.pDrmFormatModifierProperties (the local `mods` array) rather
// than the freshly allocated destination; confirm whether the destination
// was meant. Some statements (handling of an undefined VkFormat, the `else`
// before the plain query, two arguments of the image-format query) are on
// lines not visible in this excerpt.
1861 populate_format_props(struct zink_screen *screen)
1863 for (unsigned i = 0; i < PIPE_FORMAT_COUNT; i++) {
1864 VkFormat format = zink_get_format(screen, i);
1867 if (VKSCR(GetPhysicalDeviceFormatProperties2)) {
1868 VkFormatProperties2 props = {0};
1869 props.sType = VK_STRUCTURE_TYPE_FORMAT_PROPERTIES_2;
// modifier list is written into a fixed 128-entry stack array
1871 VkDrmFormatModifierPropertiesListEXT mod_props;
1872 VkDrmFormatModifierPropertiesEXT mods[128];
1873 if (screen->info.have_EXT_image_drm_format_modifier) {
1874 mod_props.sType = VK_STRUCTURE_TYPE_DRM_FORMAT_MODIFIER_PROPERTIES_LIST_EXT;
1875 mod_props.pNext = NULL;
1876 mod_props.drmFormatModifierCount = ARRAY_SIZE(mods);
1877 mod_props.pDrmFormatModifierProperties = mods;
1878 props.pNext = &mod_props;
// props3 is pushed onto the front of the pNext chain
1880 VkFormatProperties3 props3 = {0};
1881 props3.sType = VK_STRUCTURE_TYPE_FORMAT_PROPERTIES_3;
1882 props3.pNext = props.pNext;
1883 props.pNext = &props3;
1884 VKSCR(GetPhysicalDeviceFormatProperties2)(screen->pdev, format, &props);
1885 screen->format_props[i] = props.formatProperties;
// the NV linear-color-attachment bit is folded into the regular
// color-attachment bit for linear tiling
1886 if (props3.linearTilingFeatures & VK_FORMAT_FEATURE_2_LINEAR_COLOR_ATTACHMENT_BIT_NV)
1887 screen->format_props[i].linearTilingFeatures |= VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT;
1888 if (screen->info.have_EXT_image_drm_format_modifier && mod_props.drmFormatModifierCount) {
// copy the modifier list into storage owned by the screen's ralloc context
1889 screen->modifier_props[i].drmFormatModifierCount = mod_props.drmFormatModifierCount;
1890 screen->modifier_props[i].pDrmFormatModifierProperties = ralloc_array(screen, VkDrmFormatModifierPropertiesEXT, mod_props.drmFormatModifierCount);
1891 if (mod_props.pDrmFormatModifierProperties) {
1892 for (unsigned j = 0; j < mod_props.drmFormatModifierCount; j++)
1893 screen->modifier_props[i].pDrmFormatModifierProperties[j] = mod_props.pDrmFormatModifierProperties[j];
1897 VKSCR(GetPhysicalDeviceFormatProperties)(screen->pdev, format, &screen->format_props[i]);
1898 if (zink_format_is_emulated_alpha(i)) {
1899 VkFormatFeatureFlags blocked = VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT | VK_FORMAT_FEATURE_STORAGE_IMAGE_BIT;
1900 screen->format_props[i].linearTilingFeatures &= ~blocked;
1901 screen->format_props[i].optimalTilingFeatures &= ~blocked;
1902 screen->format_props[i].bufferFeatures = 0;
1905 check_vertex_formats(screen);
1906 VkImageFormatProperties image_props;
1907 VkResult ret = VKSCR(GetPhysicalDeviceImageFormatProperties)(screen->pdev, VK_FORMAT_D32_SFLOAT,
1909 VK_IMAGE_TILING_OPTIMAL,
1910 VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT | VK_IMAGE_USAGE_SAMPLED_BIT,
// VK_ERROR_FORMAT_NOT_SUPPORTED is an expected answer and is not logged
1912 if (ret != VK_SUCCESS && ret != VK_ERROR_FORMAT_NOT_SUPPORTED) {
1913 mesa_loge("ZINK: vkGetPhysicalDeviceImageFormatProperties failed (%s)", vk_Result_to_str(ret));
1915 screen->need_2D_zs = ret != VK_SUCCESS;
1917 if (screen->info.feats.features.sparseResidencyImage2D)
1918 screen->need_2D_sparse = !screen->base.get_sparse_texture_virtual_page_size(&screen->base, PIPE_TEXTURE_1D, false, PIPE_FORMAT_R32_FLOAT, 0, 16, NULL, NULL, NULL);
// Create the screen's semaphore (screen->sem) and report whether
// vkCreateSemaphore returned VK_SUCCESS. A VkSemaphoreTypeCreateInfo is
// prepared requesting a timeline semaphore.
// NOTE(review): no visible line chains `tci` into `sci.pNext`; one line is
// elided between the declarations and the sType assignments and presumably
// does this. Confirm, since without it the type info would be ignored.
1922 zink_screen_init_semaphore(struct zink_screen *screen)
1924 VkSemaphoreCreateInfo sci = {0};
1925 VkSemaphoreTypeCreateInfo tci = {0};
1927 sci.sType = VK_STRUCTURE_TYPE_SEMAPHORE_CREATE_INFO;
1928 tci.sType = VK_STRUCTURE_TYPE_SEMAPHORE_TYPE_CREATE_INFO;
1929 tci.semaphoreType = VK_SEMAPHORE_TYPE_TIMELINE;
1931 return VKSCR(CreateSemaphore)(screen->dev, &sci, NULL, &screen->sem) == VK_SUCCESS;
// Wait, for at most `timeout`, until the screen's semaphore reaches
// `batch_id`. The wait is skipped when zink_screen_check_last_finished
// already reports the batch as finished; the vkWaitSemaphores result is
// passed through zink_screen_handle_vkresult, and
// zink_screen_update_last_finished records the batch id afterwards.
// NOTE(review): the return type, the returned value, the statement taken
// when the device is lost, and the guard (if any) around the final update
// are on lines not visible in this excerpt.
1935 zink_screen_timeline_wait(struct zink_screen *screen, uint64_t batch_id, uint64_t timeout)
1937 VkSemaphoreWaitInfo wi = {0};
1939 if (zink_screen_check_last_finished(screen, batch_id))
// wait on a single semaphore/value pair
1942 wi.sType = VK_STRUCTURE_TYPE_SEMAPHORE_WAIT_INFO;
1943 wi.semaphoreCount = 1;
1944 wi.pSemaphores = &screen->sem;
1945 wi.pValues = &batch_id;
1946 bool success = false;
1947 if (screen->device_lost)
1949 VkResult ret = VKSCR(WaitSemaphores)(screen->dev, &wi, timeout);
1950 success = zink_screen_handle_vkresult(screen, ret);
1953 zink_screen_update_last_finished(screen, batch_id);
// Return the Vulkan instance (loader) version. The result defaults to
// VK_API_VERSION_1_0 and is replaced by the value reported by
// vkEnumerateInstanceVersion when that entry point can be resolved and the
// call succeeds. A failing call is logged with mesa_loge and leaves the
// default in place.
// NOTE(review): the return type and the `else` introducing the error log
// are on lines not visible in this excerpt.
1959 zink_get_loader_version(struct zink_screen *screen)
1962 uint32_t loader_version = VK_API_VERSION_1_0;
1964 // Get the Loader version
// looked up with a NULL instance
1965 GET_PROC_ADDR_INSTANCE_LOCAL(screen, NULL, EnumerateInstanceVersion);
1966 if (vk_EnumerateInstanceVersion) {
1967 uint32_t loader_version_temp = VK_API_VERSION_1_0;
1968 VkResult result = (*vk_EnumerateInstanceVersion)(&loader_version_temp);
1969 if (VK_SUCCESS == result) {
1970 loader_version = loader_version_temp;
1972 mesa_loge("ZINK: vkEnumerateInstanceVersion failed (%s)", vk_Result_to_str(result));
1976 return loader_version;
1980 zink_query_memory_info(struct pipe_screen *pscreen, struct pipe_memory_info *info)
1982 struct zink_screen *screen = zink_screen(pscreen);
1983 memset(info, 0, sizeof(struct pipe_memory_info));
1984 if (screen->info.have_EXT_memory_budget && VKSCR(GetPhysicalDeviceMemoryProperties2)) {
1985 VkPhysicalDeviceMemoryProperties2 mem = {0};
1986 mem.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_MEMORY_PROPERTIES_2;
1988 VkPhysicalDeviceMemoryBudgetPropertiesEXT budget = {0};
1989 budget.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_MEMORY_BUDGET_PROPERTIES_EXT;
1990 mem.pNext = &budget;
1991 VKSCR(GetPhysicalDeviceMemoryProperties2)(screen->pdev, &mem);
1993 for (unsigned i = 0; i < mem.memoryProperties.memoryHeapCount; i++) {
1994 if (mem.memoryProperties.memoryHeaps[i].flags & VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT) {
1996 info->total_device_memory += mem.memoryProperties.memoryHeaps[i].size / 1024;
1997 info->avail_device_memory += (mem.memoryProperties.memoryHeaps[i].size - budget.heapUsage[i]) / 1024;
2000 info->total_staging_memory += mem.memoryProperties.memoryHeaps[i].size / 1024;
2001 info->avail_staging_memory += (mem.memoryProperties.memoryHeaps[i].size - budget.heapUsage[i]) / 1024;
2004 /* evictions not yet supported in vulkan */
2006 for (unsigned i = 0; i < screen->info.mem_props.memoryHeapCount; i++) {
2007 if (screen->info.mem_props.memoryHeaps[i].flags & VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT) {
2009 info->total_device_memory += screen->info.mem_props.memoryHeaps[i].size / 1024;
2010 /* free real estate! */
2011 info->avail_device_memory += info->total_device_memory;
2014 info->total_staging_memory += screen->info.mem_props.memoryHeaps[i].size / 1024;
2015 /* free real estate! */
2016 info->avail_staging_memory += info->total_staging_memory;
// Report the DRM format modifiers cached for `format`: *count receives the
// cached modifier count, and the first min(max, *count) modifiers are copied
// into `modifiers`.
// NOTE(review): `external_only` is not written by any visible line, and
// `modifiers` is dereferenced whenever both max and the cached count are
// positive. The return type is on a line not visible in this excerpt.
2023 zink_query_dmabuf_modifiers(struct pipe_screen *pscreen, enum pipe_format format, int max, uint64_t *modifiers, unsigned int *external_only, int *count)
2025 struct zink_screen *screen = zink_screen(pscreen);
2026 *count = screen->modifier_props[format].drmFormatModifierCount;
2027 for (int i = 0; i < MIN2(max, *count); i++)
2028 modifiers[i] = screen->modifier_props[format].pDrmFormatModifierProperties[i].drmFormatModifier;
2032 zink_is_dmabuf_modifier_supported(struct pipe_screen *pscreen, uint64_t modifier, enum pipe_format format, bool *external_only)
2034 struct zink_screen *screen = zink_screen(pscreen);
2035 for (unsigned i = 0; i < screen->modifier_props[format].drmFormatModifierCount; i++)
2036 if (screen->modifier_props[format].pDrmFormatModifierProperties[i].drmFormatModifier == modifier)
2042 zink_get_dmabuf_modifier_planes(struct pipe_screen *pscreen, uint64_t modifier, enum pipe_format format)
2044 struct zink_screen *screen = zink_screen(pscreen);
2045 for (unsigned i = 0; i < screen->modifier_props[format].drmFormatModifierCount; i++)
2046 if (screen->modifier_props[format].pDrmFormatModifierProperties[i].drmFormatModifier == modifier)
2047 return screen->modifier_props[format].pDrmFormatModifierProperties[i].drmFormatModifierPlaneCount;
/*
 * zink_get_sparse_texture_virtual_page_size: report sparse-texture page
 * dimensions for a texture target / format through the x, y and z
 * out-pointers.
 *
 * Visible pieces: two static tables of page dimensions, a query through
 * GetPhysicalDeviceSparseImageFormatProperties whose first result's
 * imageGranularity is written to x/y/z, and a table lookup indexed by
 * util_logbase2() of the format block size.
 *
 * NOTE(review): this listing omits short lines (braces, returns, break,
 * some arguments and conditions), so how the visible statements are linked
 * and what the function returns cannot be confirmed here.
 */
2052 zink_get_sparse_texture_virtual_page_size(struct pipe_screen *pscreen,
2053 enum pipe_texture_target target,
2055 enum pipe_format pformat,
2056 unsigned offset, unsigned size,
2057 int *x, int *y, int *z)
2059 struct zink_screen *screen = zink_screen(pscreen);
/* page dimensions { x, y, z } used when target is not PIPE_TEXTURE_3D */
2060 static const int page_size_2d[][3] = {
2061 { 256, 256, 1 }, /* 8bpp */
2062 { 256, 128, 1 }, /* 16bpp */
2063 { 128, 128, 1 }, /* 32bpp */
2064 { 128, 64, 1 }, /* 64bpp */
2065 { 64, 64, 1 }, /* 128bpp */
/* page dimensions { x, y, z } used when target is PIPE_TEXTURE_3D */
2067 static const int page_size_3d[][3] = {
2068 { 64, 32, 32 }, /* 8bpp */
2069 { 32, 32, 32 }, /* 16bpp */
2070 { 32, 32, 16 }, /* 32bpp */
2071 { 32, 16, 16 }, /* 64bpp */
2072 { 16, 16, 16 }, /* 128bpp */
2074 /* Only support one type of page size. */
2078 /* reject multisample if 2x isn't supported; assume none are */
2079 if (multi_sample && !screen->info.feats.features.sparseResidency2Samples)
2082 VkFormat format = zink_get_format(screen, pformat);
2083 bool is_zs = util_format_is_depth_or_stencil(pformat);
/* map the gallium texture target onto a Vulkan image type */
2086 case PIPE_TEXTURE_1D:
2087 case PIPE_TEXTURE_1D_ARRAY:
/* 1D targets become 2D images when need_2D_sparse is set, or when
 * need_2D_zs is set and the format is depth/stencil */
2088 type = (screen->need_2D_sparse || (screen->need_2D_zs && is_zs)) ? VK_IMAGE_TYPE_2D : VK_IMAGE_TYPE_1D;
2091 case PIPE_TEXTURE_2D:
2092 case PIPE_TEXTURE_CUBE:
2093 case PIPE_TEXTURE_RECT:
2094 case PIPE_TEXTURE_2D_ARRAY:
2095 case PIPE_TEXTURE_CUBE_ARRAY:
2096 type = VK_IMAGE_TYPE_2D;
2099 case PIPE_TEXTURE_3D:
2100 type = VK_IMAGE_TYPE_3D;
/* NOTE(review): flags is presumably the usage argument of the query below;
 * that argument line is not visible in this listing -- confirm.
 * VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT is already set by the first
 * statement, so the is_zs ternary only ever adds the depth/stencil bit. */
2109 VkImageUsageFlags flags = VK_IMAGE_USAGE_SAMPLED_BIT | VK_IMAGE_USAGE_TRANSFER_DST_BIT | VK_IMAGE_USAGE_TRANSFER_SRC_BIT |
2110 VK_IMAGE_USAGE_STORAGE_BIT | VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT;
2111 flags |= is_zs ? VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT : VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT;
2112 VkSparseImageFormatProperties props[4]; //planar?
/* in: capacity of props[]; the query takes it by address */
2113 unsigned prop_count = ARRAY_SIZE(props);
/* multisampled requests are queried at 2 samples, everything else at 1 */
2114 VKSCR(GetPhysicalDeviceSparseImageFormatProperties)(screen->pdev, format, type,
2115 multi_sample ? VK_SAMPLE_COUNT_2_BIT : VK_SAMPLE_COUNT_1_BIT,
2117 VK_IMAGE_TILING_OPTIMAL,
2118 &prop_count, props);
/* R9G9B9E5 special case: records on the screen that sparse support for this
 * format is faked.  NOTE(review): the condition enclosing this check is not
 * visible here. */
2120 if (pformat == PIPE_FORMAT_R9G9B9E5_FLOAT) {
2121 screen->faked_e5sparse = true;
/* report the granularity of the first returned property entry.
 * NOTE(review): any NULL checks guarding these stores are not visible. */
2129 *x = props[0].imageGranularity.width;
2131 *y = props[0].imageGranularity.height;
2133 *z = props[0].imageGranularity.depth;
/* table path: pick the 3D or 2D table, then index it by log2 of the
 * format block size (row 0 is the entry labelled 8bpp) */
2139 const int (*page_sizes)[3] = target == PIPE_TEXTURE_3D ? page_size_3d : page_size_2d;
2140 int blk_size = util_format_get_blocksize(pformat);
2143 unsigned index = util_logbase2(blk_size);
/* each out-pointer is optional on this path */
2144 if (x) *x = page_sizes[index][0];
2145 if (y) *y = page_sizes[index][1];
2146 if (z) *z = page_sizes[index][2];
/*
 * zink_create_logical_device: fill a VkDeviceCreateInfo from the screen's
 * queue family indices, feature structs and extension list, then call
 * CreateDevice on screen->pdev.  A failing VkResult is logged with
 * mesa_loge.
 *
 * One queue is requested from each listed family with the shared priority
 * value `dummy`; num_queues starts at 1.
 * NOTE(review): the statement under the sparse_queue != gfx_queue test is
 * not visible in this listing; presumably it requests the second queue.
 *
 * Features are passed either as a pNext chain (when feats.sType marks a
 * VkPhysicalDeviceFeatures2) or through pEnabledFeatures.
 *
 * NOTE(review): the listing omits short lines, including the declaration
 * of `dummy`, the first entry of queues[], and the return statement.
 */
2153 zink_create_logical_device(struct zink_screen *screen)
2155 VkDevice dev = VK_NULL_HANDLE;
2157 VkDeviceQueueCreateInfo qci[2] = {0};
2158 uint32_t queues[3] = {
2160 screen->sparse_queue,
2163 for (unsigned i = 0; i < ARRAY_SIZE(qci); i++) {
2164 qci[i].sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
2165 qci[i].queueFamilyIndex = queues[i];
2166 qci[i].queueCount = 1;
2167 qci[i].pQueuePriorities = &dummy;
2170 unsigned num_queues = 1;
2171 if (screen->sparse_queue != screen->gfx_queue)
2174 VkDeviceCreateInfo dci = {0};
2175 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
2176 dci.queueCreateInfoCount = num_queues;
2177 dci.pQueueCreateInfos = qci;
2178 /* extensions don't have bool members in pEnabledFeatures.
2179 * this requires us to pass the whole VkPhysicalDeviceFeatures2 struct
2181 if (screen->info.feats.sType == VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FEATURES_2) {
2182 dci.pNext = &screen->info.feats;
2184 dci.pEnabledFeatures = &screen->info.feats.features;
2187 dci.ppEnabledExtensionNames = screen->info.extensions;
2188 dci.enabledExtensionCount = screen->info.num_extensions;
2190 VkResult result = VKSCR(CreateDevice)(screen->pdev, &dci, NULL, &dev);
2191 if (result != VK_SUCCESS)
2192 mesa_loge("ZINK: vkCreateDevice failed (%s)", vk_Result_to_str(result));
2198 check_base_requirements(struct zink_screen *screen)
2200 if (!screen->info.feats.features.logicOp ||
2201 !screen->info.feats.features.fillModeNonSolid ||
2202 !screen->info.feats.features.shaderClipDistance ||
2203 !(screen->info.feats12.scalarBlockLayout ||
2204 screen->info.have_EXT_scalar_block_layout) ||
2205 !screen->info.have_KHR_maintenance1 ||
2206 !screen->info.have_EXT_custom_border_color ||
2207 !screen->info.have_EXT_line_rasterization) {
2208 fprintf(stderr, "WARNING: Some incorrect rendering "
2209 "might occur because the selected Vulkan device (%s) doesn't support "
2210 "base Zink requirements: ", screen->info.props.deviceName);
2211 #define CHECK_OR_PRINT(X) \
2212 if (!screen->info.X) \
2213 fprintf(stderr, "%s ", #X)
2214 CHECK_OR_PRINT(feats.features.logicOp);
2215 CHECK_OR_PRINT(feats.features.fillModeNonSolid);
2216 CHECK_OR_PRINT(feats.features.shaderClipDistance);
2217 if (!screen->info.feats12.scalarBlockLayout && !screen->info.have_EXT_scalar_block_layout)
2218 printf("scalarBlockLayout OR EXT_scalar_block_layout ");
2219 CHECK_OR_PRINT(have_KHR_maintenance1);
2220 CHECK_OR_PRINT(have_EXT_custom_border_color);
2221 CHECK_OR_PRINT(have_EXT_line_rasterization);
2222 fprintf(stderr, "\n");
2227 zink_get_sample_pixel_grid(struct pipe_screen *pscreen, unsigned sample_count,
2228 unsigned *width, unsigned *height)
2230 struct zink_screen *screen = zink_screen(pscreen);
2231 unsigned idx = util_logbase2_ceil(MAX2(sample_count, 1));
2232 assert(idx < ARRAY_SIZE(screen->maxSampleLocationGridSize));
2233 *width = screen->maxSampleLocationGridSize[idx].width;
2234 *height = screen->maxSampleLocationGridSize[idx].height;
/*
 * init_driver_workarounds: derive per-driver quirks and feature downgrades
 * from the physical-device info already stored on the screen.  It writes
 * screen->driver_workarounds, screen->have_full_ds3 and clears several
 * screen->info.have_* / feature flags.
 *
 * NOTE(review): this listing omits short lines (break, default, else,
 * braces and one operand of the graphics-pipeline-library expression), so
 * fallthrough and else pairing cannot be confirmed from here.
 */
2238 init_driver_workarounds(struct zink_screen *screen)
2240 /* enable implicit sync for all non-mesa drivers */
2241 screen->driver_workarounds.implicit_sync = true;
/* ...and switch it back off for the Mesa drivers listed here */
2242 switch (screen->info.driver_props.driverID) {
2243 case VK_DRIVER_ID_MESA_RADV:
2244 case VK_DRIVER_ID_INTEL_OPEN_SOURCE_MESA:
2245 case VK_DRIVER_ID_MESA_LLVMPIPE:
2246 case VK_DRIVER_ID_MESA_TURNIP:
2247 case VK_DRIVER_ID_MESA_V3DV:
2248 case VK_DRIVER_ID_MESA_PANVK:
2249 case VK_DRIVER_ID_MESA_VENUS:
2250 screen->driver_workarounds.implicit_sync = false;
/* all three stippled line modes are supported but the stipple enable is
 * not dynamic state: drop EXT_extended_dynamic_state3 */
2255 if (screen->info.line_rast_feats.stippledRectangularLines &&
2256 screen->info.line_rast_feats.stippledBresenhamLines &&
2257 screen->info.line_rast_feats.stippledSmoothLines &&
2258 !screen->info.dynamic_state3_feats.extendedDynamicState3LineStippleEnable)
2259 screen->info.have_EXT_extended_dynamic_state3 = false;
/* these five dynamic states are mandatory for using the extension at all */
2260 if (!screen->info.dynamic_state3_feats.extendedDynamicState3PolygonMode ||
2261 !screen->info.dynamic_state3_feats.extendedDynamicState3DepthClampEnable ||
2262 !screen->info.dynamic_state3_feats.extendedDynamicState3DepthClipEnable ||
2263 !screen->info.dynamic_state3_feats.extendedDynamicState3ProvokingVertexMode ||
2264 !screen->info.dynamic_state3_feats.extendedDynamicState3LineRasterizationMode)
2265 screen->info.have_EXT_extended_dynamic_state3 = false;
/* otherwise, the additional states below (alpha-to-one only if the device
 * has alphaToOne) plus dynamic logic op from EDS2 mark "full" ds3 support */
2266 else if (screen->info.dynamic_state3_feats.extendedDynamicState3SampleMask &&
2267 screen->info.dynamic_state3_feats.extendedDynamicState3AlphaToCoverageEnable &&
2268 (!screen->info.feats.features.alphaToOne || screen->info.dynamic_state3_feats.extendedDynamicState3AlphaToOneEnable) &&
2269 screen->info.dynamic_state3_feats.extendedDynamicState3ColorBlendEnable &&
2270 screen->info.dynamic_state3_feats.extendedDynamicState3RasterizationSamples &&
2271 screen->info.dynamic_state3_feats.extendedDynamicState3ColorWriteMask &&
2272 screen->info.dynamic_state3_feats.extendedDynamicState3LogicOpEnable &&
2273 screen->info.dynamic_state2_feats.extendedDynamicState2LogicOp)
2274 screen->have_full_ds3 = true;
/* keep graphics pipeline library only when its prerequisites are present.
 * NOTE(review): the final operand of this expression is not visible. */
2275 if (screen->info.have_EXT_graphics_pipeline_library)
2276 screen->info.have_EXT_graphics_pipeline_library = screen->info.have_EXT_extended_dynamic_state &&
2277 screen->info.have_EXT_extended_dynamic_state2 &&
2278 ((zink_debug & ZINK_DEBUG_GPL) ||
2279 screen->info.dynamic_state2_feats.extendedDynamicState2PatchControlPoints) &&
2280 screen->info.have_EXT_extended_dynamic_state3 &&
2281 screen->info.have_KHR_dynamic_rendering &&
2282 screen->info.have_EXT_non_seamless_cube_map &&
2283 (!(zink_debug & ZINK_DEBUG_GPL) ||
2284 screen->info.gpl_props.graphicsPipelineLibraryFastLinking ||
/* broken_l4a4 is set only for the NVIDIA proprietary driver */
2286 screen->driver_workarounds.broken_l4a4 = screen->info.driver_props.driverID == VK_DRIVER_ID_NVIDIA_PROPRIETARY;
2287 screen->driver_workarounds.depth_clip_control_missing = !screen->info.have_EXT_depth_clip_control;
2288 if (screen->info.driver_props.driverID == VK_DRIVER_ID_AMD_PROPRIETARY)
2289 /* this completely breaks xfb somehow */
2290 screen->info.have_EXT_extended_dynamic_state2 = false;
/* turnip: stop using customBorderColorWithoutFormat */
2291 if (screen->info.driver_props.driverID == VK_DRIVER_ID_MESA_TURNIP) {
2293 screen->info.border_color_feats.customBorderColorWithoutFormat = VK_FALSE;
/* unscaled depth-bias constants per driver: 1<<23 for Z24 on the AMD,
 * NVIDIA and RADV drivers, 1<<15 for Z16 on NVIDIA.
 * NOTE(review): the 1<<24 and 1<<16 stores are presumably the else
 * branches; the else lines are not visible. */
2295 if (screen->info.driver_props.driverID == VK_DRIVER_ID_AMD_OPEN_SOURCE ||
2296 screen->info.driver_props.driverID == VK_DRIVER_ID_AMD_PROPRIETARY ||
2297 screen->info.driver_props.driverID == VK_DRIVER_ID_NVIDIA_PROPRIETARY ||
2298 screen->info.driver_props.driverID == VK_DRIVER_ID_MESA_RADV)
2299 screen->driver_workarounds.z24_unscaled_bias = 1<<23;
2301 screen->driver_workarounds.z24_unscaled_bias = 1<<24;
2302 if (screen->info.driver_props.driverID == VK_DRIVER_ID_NVIDIA_PROPRIETARY)
2303 screen->driver_workarounds.z16_unscaled_bias = 1<<15;
2305 screen->driver_workarounds.z16_unscaled_bias = 1<<16;
2306 /* these drivers don't use VK_PIPELINE_CREATE_COLOR_ATTACHMENT_FEEDBACK_LOOP_BIT_EXT, so it can always be set */
2307 switch (screen->info.driver_props.driverID) {
2308 case VK_DRIVER_ID_MESA_RADV:
2309 case VK_DRIVER_ID_INTEL_OPEN_SOURCE_MESA:
2310 case VK_DRIVER_ID_MESA_LLVMPIPE:
2311 case VK_DRIVER_ID_MESA_VENUS:
2312 case VK_DRIVER_ID_NVIDIA_PROPRIETARY:
2313 case VK_DRIVER_ID_INTEL_PROPRIETARY_WINDOWS:
2314 case VK_DRIVER_ID_IMAGINATION_PROPRIETARY:
/* only meaningful when the feedback-loop layout extension is present */
2315 screen->driver_workarounds.always_feedback_loop = screen->info.have_EXT_attachment_feedback_loop_layout;
2320 /* these drivers don't use VK_PIPELINE_CREATE_DEPTH_STENCIL_ATTACHMENT_FEEDBACK_LOOP_BIT_EXT, so it can always be set */
2321 switch (screen->info.driver_props.driverID) {
2322 case VK_DRIVER_ID_MESA_RADV:
2323 case VK_DRIVER_ID_MESA_LLVMPIPE:
2324 case VK_DRIVER_ID_MESA_VENUS:
2325 case VK_DRIVER_ID_NVIDIA_PROPRIETARY:
2326 case VK_DRIVER_ID_IMAGINATION_PROPRIETARY:
2327 screen->driver_workarounds.always_feedback_loop_zs = screen->info.have_EXT_attachment_feedback_loop_layout;
/*
 * zink_internal_create_screen: allocate a zink_screen and bring it up.
 * Visible order: load the Vulkan loader, create the instance, choose a
 * physical device, create the logical device, install the pipe_screen
 * callbacks, then initialise the resource, compiler, cache and memory-heap
 * state.  Shared by zink_create_screen() and zink_drm_create_screen().
 *
 * The trailing statements (closing the loader library, destroying the
 * flush queue, freeing the screen) undo that setup.
 *
 * NOTE(review): this listing omits short lines, which covers every visible
 * failure check's consequent (presumably jumps to the trailing cleanup)
 * and the return statements.  Confirm against the full file before relying
 * on the error-path behaviour described here.
 */
2334 static struct zink_screen *
2335 zink_internal_create_screen(const struct pipe_screen_config *config)
/* the old environment switch is only reported as obsolete here */
2337 if (getenv("ZINK_USE_LAVAPIPE")) {
2338 mesa_loge("ZINK_USE_LAVAPIPE is obsolete. Use LIBGL_ALWAYS_SOFTWARE\n");
2342 struct zink_screen *screen = rzalloc(NULL, struct zink_screen);
/* threaded needs more than one CPU and the GALLIUM_THREAD option, whose
 * default is also "more than one CPU" */
2346 screen->threaded = util_get_cpu_caps()->nr_cpus > 1 && debug_get_bool_option("GALLIUM_THREAD", util_get_cpu_caps()->nr_cpus > 1);
2347 screen->abort_on_hang = debug_get_bool_option("ZINK_HANG_ABORT", false);
2349 zink_debug = debug_get_option_zink_debug();
2350 zink_descriptor_mode = debug_get_option_zink_descriptor_mode();
/* open the Vulkan loader and resolve the two bootstrap entry points */
2352 screen->loader_lib = util_dl_open(VK_LIBNAME);
2353 if (!screen->loader_lib)
2356 screen->vk_GetInstanceProcAddr = (PFN_vkGetInstanceProcAddr)util_dl_get_proc_address(screen->loader_lib, "vkGetInstanceProcAddr");
2357 screen->vk_GetDeviceProcAddr = (PFN_vkGetDeviceProcAddr)util_dl_get_proc_address(screen->loader_lib, "vkGetDeviceProcAddr");
2358 if (!screen->vk_GetInstanceProcAddr ||
2359 !screen->vk_GetDeviceProcAddr)
2362 screen->instance_info.loader_version = zink_get_loader_version(screen);
/* driconf: parse the option files for "zink" and cache the queried options */
2365 driParseConfigFiles(config->options, config->options_info, 0, "zink",
2366 NULL, NULL, NULL, 0, NULL, 0);
2367 screen->driconf.dual_color_blend_by_location = driQueryOptionb(config->options, "dual_color_blend_by_location");
2368 screen->driconf.glsl_correct_derivatives_after_discard = driQueryOptionb(config->options, "glsl_correct_derivatives_after_discard");
2369 //screen->driconf.inline_uniforms = driQueryOptionb(config->options, "radeonsi_inline_uniforms");
2370 screen->instance_info.disable_xcb_surface = driQueryOptionb(config->options, "disable_xcb_surface");
/* instance creation, then instance-level and physical-device-level dispatch */
2374 if (!zink_create_instance(screen))
2377 vk_instance_dispatch_table_load(&screen->vk.instance,
2378 screen->vk_GetInstanceProcAddr,
2380 vk_physical_device_dispatch_table_load(&screen->vk.physical_device,
2381 screen->vk_GetInstanceProcAddr,
2384 zink_verify_instance_extensions(screen);
/* debug utils are set up only when validation is requested; a failure is
 * only printed */
2386 if (screen->instance_info.have_EXT_debug_utils &&
2387 (zink_debug & ZINK_DEBUG_VALIDATION) && !create_debug(screen))
2388 debug_printf("ZINK: failed to setup debug utils\n");
/* choose_pdev()'s result is stored as is_cpu; pdev is checked afterwards */
2390 screen->is_cpu = choose_pdev(screen);
2391 if (screen->pdev == VK_NULL_HANDLE)
2394 update_queue_props(screen);
/* probe which packed depth/stencil formats the device supports */
2396 screen->have_X8_D24_UNORM_PACK32 = zink_is_depth_format_supported(screen,
2397 VK_FORMAT_X8_D24_UNORM_PACK32);
2398 screen->have_D24_UNORM_S8_UINT = zink_is_depth_format_supported(screen,
2399 VK_FORMAT_D24_UNORM_S8_UINT);
2400 screen->have_D32_SFLOAT_S8_UINT = zink_is_depth_format_supported(screen,
2401 VK_FORMAT_D32_SFLOAT_S8_UINT);
2403 if (!zink_get_physical_device_info(screen)) {
2404 debug_printf("ZINK: failed to detect features\n");
/* the flush queue exists only in threaded mode */
2408 if (screen->threaded && !util_queue_init(&screen->flush_queue, "zfq", 8, 1, UTIL_QUEUE_INIT_RESIZE_IF_FULL, screen)) {
2409 mesa_loge("zink: Failed to create flush queue.\n");
2413 zink_internal_setup_moltenvk(screen);
/* timeline semaphores are a hard requirement */
2414 if (!screen->info.have_KHR_timeline_semaphore) {
2415 mesa_loge("zink: KHR_timeline_semaphore is required");
/* workarounds run before device creation, which reads the screen->info
 * flags they may clear */
2419 init_driver_workarounds(screen);
2421 screen->dev = zink_create_logical_device(screen);
2425 vk_device_dispatch_table_load(&screen->vk.device,
2426 screen->vk_GetDeviceProcAddr,
2430 if (screen->info.driver_props.driverID == VK_DRIVER_ID_MESA_RADV ||
2431 screen->info.driver_props.driverID == VK_DRIVER_ID_AMD_OPEN_SOURCE ||
2432 screen->info.driver_props.driverID == VK_DRIVER_ID_AMD_PROPRIETARY)
2433 /* this has bad perf on AMD */
2434 screen->info.have_KHR_push_descriptor = false;
2436 zink_verify_device_extensions(screen);
/* descriptor set numbering.  Compact mode (forced by ZINK_DEBUG_COMPACT or
 * used when the device binds fewer than ZINK_MAX_DESCRIPTOR_SETS sets)
 * shares a set between UBO/SSBO and between sampler view/image.
 * NOTE(review): the second group of stores is presumably the else branch. */
2438 if ((zink_debug & ZINK_DEBUG_COMPACT) ||
2439 screen->info.props.limits.maxBoundDescriptorSets < ZINK_MAX_DESCRIPTOR_SETS) {
2440 screen->desc_set_id[ZINK_DESCRIPTOR_TYPES] = 0;
2441 screen->desc_set_id[ZINK_DESCRIPTOR_TYPE_UBO] = 1;
2442 screen->desc_set_id[ZINK_DESCRIPTOR_TYPE_SSBO] = 1;
2443 screen->desc_set_id[ZINK_DESCRIPTOR_TYPE_SAMPLER_VIEW] = 2;
2444 screen->desc_set_id[ZINK_DESCRIPTOR_TYPE_IMAGE] = 2;
2445 screen->desc_set_id[ZINK_DESCRIPTOR_BINDLESS] = 3;
2446 screen->compact_descriptors = true;
2448 screen->desc_set_id[ZINK_DESCRIPTOR_TYPES] = 0;
2449 screen->desc_set_id[ZINK_DESCRIPTOR_TYPE_UBO] = 1;
2450 screen->desc_set_id[ZINK_DESCRIPTOR_TYPE_SAMPLER_VIEW] = 2;
2451 screen->desc_set_id[ZINK_DESCRIPTOR_TYPE_SSBO] = 3;
2452 screen->desc_set_id[ZINK_DESCRIPTOR_TYPE_IMAGE] = 4;
2453 screen->desc_set_id[ZINK_DESCRIPTOR_BINDLESS] = 5;
/* AUTO descriptor mode resolves to LAZY */
2455 if (zink_descriptor_mode == ZINK_DESCRIPTOR_MODE_AUTO) {
2456 zink_descriptor_mode = ZINK_DESCRIPTOR_MODE_LAZY;
2459 if (screen->info.have_EXT_calibrated_timestamps && !check_have_device_time(screen))
/* triangle fans are assumed available unless the portability subset says
 * otherwise */
2462 screen->have_triangle_fans = true;
2463 #if defined(VK_KHR_PORTABILITY_SUBSET_EXTENSION_NAME)
2464 if (screen->info.have_KHR_portability_subset) {
2465 screen->have_triangle_fans = (VK_TRUE == screen->info.portability_subset_feats.triangleFans);
2467 #endif // VK_KHR_PORTABILITY_SUBSET_EXTENSION_NAME
2469 check_base_requirements(screen);
2470 util_live_shader_cache_init(&screen->shaders, zink_create_gfx_shader_state, zink_delete_shader_state);
/* install the pipe_screen callbacks; several are conditional on extensions */
2472 screen->base.get_name = zink_get_name;
2473 if (screen->instance_info.have_KHR_external_memory_capabilities) {
2474 screen->base.get_device_uuid = zink_get_device_uuid;
2475 screen->base.get_driver_uuid = zink_get_driver_uuid;
2477 if (screen->info.have_KHR_external_memory_win32) {
2478 screen->base.get_device_luid = zink_get_device_luid;
2479 screen->base.get_device_node_mask = zink_get_device_node_mask;
2481 screen->base.set_max_shader_compiler_threads = zink_set_max_shader_compiler_threads;
2482 screen->base.is_parallel_shader_compilation_finished = zink_is_parallel_shader_compilation_finished;
2483 screen->base.get_vendor = zink_get_vendor;
2484 screen->base.get_device_vendor = zink_get_device_vendor;
2485 screen->base.get_compute_param = zink_get_compute_param;
2486 screen->base.get_timestamp = zink_get_timestamp;
2487 screen->base.query_memory_info = zink_query_memory_info;
2488 screen->base.get_param = zink_get_param;
2489 screen->base.get_paramf = zink_get_paramf;
2490 screen->base.get_shader_param = zink_get_shader_param;
2491 screen->base.get_compiler_options = zink_get_compiler_options;
2492 screen->base.get_sample_pixel_grid = zink_get_sample_pixel_grid;
2493 screen->base.is_compute_copy_faster = zink_is_compute_copy_faster;
2494 screen->base.is_format_supported = zink_is_format_supported;
2495 screen->base.driver_thread_add_job = zink_driver_thread_add_job;
/* dmabuf modifier hooks need both the modifier and the dma_buf extension */
2496 if (screen->info.have_EXT_image_drm_format_modifier && screen->info.have_EXT_external_memory_dma_buf) {
2497 screen->base.query_dmabuf_modifiers = zink_query_dmabuf_modifiers;
2498 screen->base.is_dmabuf_modifier_supported = zink_is_dmabuf_modifier_supported;
2499 screen->base.get_dmabuf_modifier_planes = zink_get_dmabuf_modifier_planes;
2502 if (screen->info.have_KHR_external_memory_win32)
2503 screen->base.create_fence_win32 = zink_create_fence_win32;
2505 screen->base.context_create = zink_context_create;
2506 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
2507 screen->base.destroy = zink_destroy_screen;
2508 screen->base.finalize_nir = zink_shader_finalize;
2509 screen->base.get_sparse_texture_virtual_page_size = zink_get_sparse_texture_virtual_page_size;
/* cache the sample-location grid size for each supported sample count;
 * slot i holds the result for a sample count of 1 << i */
2511 if (screen->info.have_EXT_sample_locations) {
2512 VkMultisamplePropertiesEXT prop;
2513 prop.sType = VK_STRUCTURE_TYPE_MULTISAMPLE_PROPERTIES_EXT;
2515 for (unsigned i = 0; i < ARRAY_SIZE(screen->maxSampleLocationGridSize); i++) {
2516 if (screen->info.sample_locations_props.sampleLocationSampleCounts & (1 << i)) {
2517 VKSCR(GetPhysicalDeviceMultisamplePropertiesEXT)(screen->pdev, 1 << i, &prop);
2518 screen->maxSampleLocationGridSize[i] = prop.maxSampleLocationGridSize;
/* subsystem initialisation */
2523 if (!zink_screen_resource_init(&screen->base))
2525 zink_bo_init(screen);
2526 zink_screen_fence_init(&screen->base);
2528 zink_screen_init_compiler(screen);
2529 if (!disk_cache_init(screen))
2531 if (!util_queue_init(&screen->cache_get_thread, "zcfq", 8, 4,
2532 UTIL_QUEUE_INIT_RESIZE_IF_FULL | UTIL_QUEUE_INIT_SCALE_THREADS, screen))
2534 populate_format_props(screen);
2536 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
/* ZINK_INLINE_UNIFORMS defaults to the is_cpu value */
2538 screen->driconf.inline_uniforms = debug_get_bool_option("ZINK_INLINE_UNIFORMS", screen->is_cpu);
/* clamp_video_mem is 80% of the reported video memory */
2540 screen->total_video_mem = get_video_mem(screen);
2541 screen->clamp_video_mem = screen->total_video_mem * 0.8;
2542 if (!os_get_total_physical_memory(&screen->total_mem))
2545 if (!zink_screen_init_semaphore(screen)) {
2546 mesa_loge("zink: failed to create timeline semaphore");
/* map each zink heap to a memory type index whose property flags contain
 * all of the heap's required flags; UINT8_MAX marks "not found yet" */
2550 memset(&screen->heap_map, UINT8_MAX, sizeof(screen->heap_map));
2551 for (enum zink_heap i = 0; i < ZINK_HEAP_MAX; i++) {
2552 for (unsigned j = 0; j < screen->info.mem_props.memoryTypeCount; j++) {
2553 VkMemoryPropertyFlags domains = vk_domain_from_heap(i);
2554 if ((screen->info.mem_props.memoryTypes[j].propertyFlags & domains) == domains) {
2555 assert(screen->heap_map[i] == UINT8_MAX);
2556 screen->heap_map[i] = j;
2561 /* not found: use compatible heap */
2562 if (screen->heap_map[i] == UINT8_MAX) {
2563 /* only cached mem has a failure case for now */
2564 assert(i == ZINK_HEAP_HOST_VISIBLE_CACHED || i == ZINK_HEAP_DEVICE_LOCAL_LAZY ||
2565 i == ZINK_HEAP_DEVICE_LOCAL_VISIBLE);
2566 if (i == ZINK_HEAP_HOST_VISIBLE_CACHED)
2567 screen->heap_map[i] = screen->heap_map[ZINK_HEAP_HOST_VISIBLE_COHERENT];
2569 screen->heap_map[i] = screen->heap_map[ZINK_HEAP_DEVICE_LOCAL];
2571 screen->heap_flags[i] = screen->info.mem_props.memoryTypes[screen->heap_map[i]].propertyFlags;
2574 unsigned vis_vram = screen->heap_map[ZINK_HEAP_DEVICE_LOCAL_VISIBLE];
2575 unsigned vram = screen->heap_map[ZINK_HEAP_DEVICE_LOCAL];
2576 /* determine if vis vram is roughly equal to total vram */
2577 if (screen->info.mem_props.memoryHeaps[screen->info.mem_props.memoryTypes[vis_vram].heapIndex].size >
2578 screen->info.mem_props.memoryHeaps[screen->info.mem_props.memoryTypes[vram].heapIndex].size * 0.9)
2579 screen->resizable_bar = true;
2582 simple_mtx_init(&screen->dt_lock, mtx_plain);
2584 util_idalloc_mt_init_tc(&screen->buffer_ids);
2586 util_vertex_state_cache_init(&screen->vertex_state_cache,
2587 zink_create_vertex_state, zink_vertex_state_destroy);
2588 screen->base.create_vertex_state = zink_cache_create_vertex_state;
2589 screen->base.vertex_state_destroy = zink_cache_vertex_state_destroy;
2590 glsl_type_singleton_init_or_ref();
/* use the *2 barrier helpers when Vulkan 1.3 or KHR_synchronization2 is
 * available.  NOTE(review): the second pair is presumably the else branch. */
2592 if (screen->info.have_vulkan13 || screen->info.have_KHR_synchronization2) {
2593 screen->image_barrier = zink_resource_image_barrier2;
2594 screen->buffer_barrier = zink_resource_buffer_barrier2;
2596 screen->image_barrier = zink_resource_image_barrier;
2597 screen->buffer_barrier = zink_resource_buffer_barrier;
2600 if (!zink_descriptor_layouts_init(screen))
/* internal context created through the screen's own context_create hook
 * with the ZINK_CONTEXT_COPY_ONLY flag */
2604 screen->copy_context = zink_context(screen->base.context_create(&screen->base, NULL, ZINK_CONTEXT_COPY_ONLY));
2605 if (!screen->copy_context) {
2606 mesa_loge("zink: failed to create copy context");
/* graphics pipeline library is switched off unless optimal_keys holds */
2610 screen->optimal_keys = !screen->need_decompose_attrs && screen->info.have_EXT_non_seamless_cube_map && !screen->driconf.inline_uniforms;
2611 if (!screen->optimal_keys)
2612 screen->info.have_EXT_graphics_pipeline_library = false;
/* cleanup: release what was acquired above.  NOTE(review): presumably
 * reached only on failure, after a success return that is not visible. */
2617 if (screen->loader_lib)
2618 util_dl_close(screen->loader_lib);
2619 if (screen->threaded)
2620 util_queue_destroy(&screen->flush_queue);
2622 ralloc_free(screen);
/*
 * zink_create_screen: public entry point taking a software winsys.  The
 * screen is built by zink_internal_create_screen(); `winsys` is not used by
 * the visible statement.
 *
 * NOTE(review): the rest of the body, including the return, is not visible
 * in this listing.
 */
2626 struct pipe_screen *
2627 zink_create_screen(struct sw_winsys *winsys, const struct pipe_screen_config *config)
2629 struct zink_screen *ret = zink_internal_create_screen(config);
/*
 * zink_drm_create_screen: public entry point for a DRM file descriptor.
 * Builds the screen with zink_internal_create_screen(), stores a
 * close-on-exec duplicate of `fd` in drm_fd, and destroys the screen again
 * when KHR_external_memory_fd is unavailable.
 *
 * NOTE(review): the lines between the create call and the drm_fd store are
 * not visible; presumably a NULL check guards the store, since the next
 * condition tests `ret` -- confirm.  The return statements are likewise
 * not visible.
 */
2637 struct pipe_screen *
2638 zink_drm_create_screen(int fd, const struct pipe_screen_config *config)
2640 struct zink_screen *ret = zink_internal_create_screen(config);
/* the screen keeps its own duplicate rather than the caller's descriptor */
2643 ret->drm_fd = os_dupfd_cloexec(fd);
2644 if (ret && !ret->info.have_KHR_external_memory_fd) {
2645 debug_printf("ZINK: KHR_external_memory_fd required!\n");
2646 zink_destroy_screen(&ret->base);
2653 void zink_stub_function_not_loaded()
2655 /* this will be used by the zink_verify_*_extensions() functions on a
2658 mesa_loge("ZINK: a Vulkan function was called without being loaded");