17ec681f3Smrg/* 27ec681f3Smrg * Copyright 2018 Collabora Ltd. 37ec681f3Smrg * 47ec681f3Smrg * Permission is hereby granted, free of charge, to any person obtaining a 57ec681f3Smrg * copy of this software and associated documentation files (the "Software"), 67ec681f3Smrg * to deal in the Software without restriction, including without limitation 77ec681f3Smrg * on the rights to use, copy, modify, merge, publish, distribute, sub 87ec681f3Smrg * license, and/or sell copies of the Software, and to permit persons to whom 97ec681f3Smrg * the Software is furnished to do so, subject to the following conditions: 107ec681f3Smrg * 117ec681f3Smrg * The above copyright notice and this permission notice (including the next 127ec681f3Smrg * paragraph) shall be included in all copies or substantial portions of the 137ec681f3Smrg * Software. 147ec681f3Smrg * 157ec681f3Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 167ec681f3Smrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 177ec681f3Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 187ec681f3Smrg * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, 197ec681f3Smrg * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 207ec681f3Smrg * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 217ec681f3Smrg * USE OR OTHER DEALINGS IN THE SOFTWARE. 227ec681f3Smrg */ 237ec681f3Smrg 247ec681f3Smrg#include "zink_program.h" 257ec681f3Smrg 267ec681f3Smrg#include "zink_compiler.h" 277ec681f3Smrg#include "zink_context.h" 287ec681f3Smrg#include "zink_descriptors.h" 297ec681f3Smrg#include "zink_helpers.h" 307ec681f3Smrg#include "zink_render_pass.h" 317ec681f3Smrg#include "zink_resource.h" 327ec681f3Smrg#include "zink_screen.h" 337ec681f3Smrg#include "zink_state.h" 347ec681f3Smrg#include "zink_inlines.h" 357ec681f3Smrg 367ec681f3Smrg#include "util/hash_table.h" 377ec681f3Smrg#include "util/set.h" 387ec681f3Smrg#include "util/u_debug.h" 397ec681f3Smrg#include "util/u_memory.h" 407ec681f3Smrg#include "util/u_prim.h" 417ec681f3Smrg#include "tgsi/tgsi_from_mesa.h" 427ec681f3Smrg 437ec681f3Smrg/* for pipeline cache */ 447ec681f3Smrg#define XXH_INLINE_ALL 457ec681f3Smrg#include "util/xxhash.h" 467ec681f3Smrg 477ec681f3Smrgstruct gfx_pipeline_cache_entry { 487ec681f3Smrg struct zink_gfx_pipeline_state state; 497ec681f3Smrg VkPipeline pipeline; 507ec681f3Smrg}; 517ec681f3Smrg 527ec681f3Smrgstruct compute_pipeline_cache_entry { 537ec681f3Smrg struct zink_compute_pipeline_state state; 547ec681f3Smrg VkPipeline pipeline; 557ec681f3Smrg}; 567ec681f3Smrg 577ec681f3Smrgvoid 587ec681f3Smrgdebug_describe_zink_gfx_program(char *buf, const struct zink_gfx_program *ptr) 597ec681f3Smrg{ 607ec681f3Smrg sprintf(buf, "zink_gfx_program"); 617ec681f3Smrg} 627ec681f3Smrg 637ec681f3Smrgvoid 647ec681f3Smrgdebug_describe_zink_compute_program(char *buf, const struct zink_compute_program *ptr) 657ec681f3Smrg{ 667ec681f3Smrg sprintf(buf, "zink_compute_program"); 677ec681f3Smrg} 687ec681f3Smrg 697ec681f3Smrgstatic bool 707ec681f3Smrgshader_key_matches(const struct zink_shader_module *zm, const struct zink_shader_key *key, unsigned num_uniforms) 717ec681f3Smrg{ 727ec681f3Smrg if (zm->key_size != key->size || zm->num_uniforms != num_uniforms) 737ec681f3Smrg return false; 747ec681f3Smrg return !memcmp(zm->key, key, zm->key_size) && 757ec681f3Smrg (!num_uniforms || !memcmp(zm->key + zm->key_size, key->base.inlined_uniform_values, zm->num_uniforms * sizeof(uint32_t))); 767ec681f3Smrg} 777ec681f3Smrg 787ec681f3Smrgstatic uint32_t 797ec681f3Smrgshader_module_hash(const struct zink_shader_module *zm) 807ec681f3Smrg{ 817ec681f3Smrg unsigned key_size = zm->key_size + zm->num_uniforms * sizeof(uint32_t); 827ec681f3Smrg return _mesa_hash_data(zm->key, key_size); 837ec681f3Smrg} 847ec681f3Smrg 857ec681f3Smrgstatic struct zink_shader_module * 867ec681f3Smrgget_shader_module_for_stage(struct zink_context *ctx, struct zink_screen *screen, 877ec681f3Smrg struct zink_shader *zs, struct zink_gfx_program *prog, 887ec681f3Smrg struct zink_gfx_pipeline_state *state) 897ec681f3Smrg{ 907ec681f3Smrg gl_shader_stage stage = zs->nir->info.stage; 917ec681f3Smrg enum pipe_shader_type pstage = pipe_shader_type_from_mesa(stage); 927ec681f3Smrg VkShaderModule mod; 937ec681f3Smrg struct zink_shader_module *zm = NULL; 947ec681f3Smrg unsigned base_size = 0; 957ec681f3Smrg struct zink_shader_key *key = &state->shader_keys.key[pstage]; 967ec681f3Smrg 977ec681f3Smrg if (ctx && zs->nir->info.num_inlinable_uniforms && 987ec681f3Smrg ctx->inlinable_uniforms_valid_mask & BITFIELD64_BIT(pstage)) { 997ec681f3Smrg if (prog->inlined_variant_count[pstage] < ZINK_MAX_INLINED_VARIANTS) 1007ec681f3Smrg base_size = zs->nir->info.num_inlinable_uniforms; 1017ec681f3Smrg else 1027ec681f3Smrg key->inline_uniforms = false; 1037ec681f3Smrg } 1047ec681f3Smrg 1057ec681f3Smrg struct zink_shader_module *iter, *next; 1067ec681f3Smrg LIST_FOR_EACH_ENTRY_SAFE(iter, next, &prog->shader_cache[pstage][!!base_size], list) { 1077ec681f3Smrg if (!shader_key_matches(iter, key, base_size)) 1087ec681f3Smrg continue; 1097ec681f3Smrg list_delinit(&iter->list); 1107ec681f3Smrg zm = iter; 1117ec681f3Smrg break; 1127ec681f3Smrg } 1137ec681f3Smrg 1147ec681f3Smrg if (!zm) { 1157ec681f3Smrg zm = malloc(sizeof(struct zink_shader_module) + key->size + base_size * sizeof(uint32_t)); 1167ec681f3Smrg if (!zm) { 1177ec681f3Smrg return NULL; 1187ec681f3Smrg } 1197ec681f3Smrg mod = zink_shader_compile(screen, zs, prog->nir[stage], key); 1207ec681f3Smrg if (!mod) { 1217ec681f3Smrg FREE(zm); 1227ec681f3Smrg return NULL; 1237ec681f3Smrg } 1247ec681f3Smrg zm->shader = mod; 1257ec681f3Smrg list_inithead(&zm->list); 1267ec681f3Smrg zm->num_uniforms = base_size; 1277ec681f3Smrg zm->key_size = key->size; 1287ec681f3Smrg memcpy(zm->key, key, key->size); 1297ec681f3Smrg if (base_size) 1307ec681f3Smrg memcpy(zm->key + key->size, &key->base, base_size * sizeof(uint32_t)); 1317ec681f3Smrg zm->hash = shader_module_hash(zm); 1327ec681f3Smrg zm->default_variant = !base_size && list_is_empty(&prog->shader_cache[pstage][0]); 1337ec681f3Smrg if (base_size) 1347ec681f3Smrg prog->inlined_variant_count[pstage]++; 1357ec681f3Smrg } 1367ec681f3Smrg list_add(&zm->list, &prog->shader_cache[pstage][!!base_size]); 1377ec681f3Smrg return zm; 1387ec681f3Smrg} 1397ec681f3Smrg 1407ec681f3Smrgstatic void 1417ec681f3Smrgzink_destroy_shader_module(struct zink_screen *screen, struct zink_shader_module *zm) 1427ec681f3Smrg{ 1437ec681f3Smrg VKSCR(DestroyShaderModule)(screen->dev, zm->shader, NULL); 1447ec681f3Smrg free(zm); 1457ec681f3Smrg} 1467ec681f3Smrg 1477ec681f3Smrgstatic void 1487ec681f3Smrgdestroy_shader_cache(struct zink_screen *screen, struct list_head *sc) 1497ec681f3Smrg{ 1507ec681f3Smrg struct zink_shader_module *zm, *next; 1517ec681f3Smrg LIST_FOR_EACH_ENTRY_SAFE(zm, next, sc, list) { 1527ec681f3Smrg list_delinit(&zm->list); 1537ec681f3Smrg zink_destroy_shader_module(screen, zm); 1547ec681f3Smrg } 1557ec681f3Smrg} 1567ec681f3Smrg 1577ec681f3Smrgstatic void 1587ec681f3Smrgupdate_shader_modules(struct zink_context *ctx, 1597ec681f3Smrg struct zink_screen *screen, 1607ec681f3Smrg struct zink_gfx_program *prog, uint32_t mask, 1617ec681f3Smrg struct zink_gfx_pipeline_state *state) 1627ec681f3Smrg{ 1637ec681f3Smrg bool hash_changed = false; 1647ec681f3Smrg bool default_variants = true; 1657ec681f3Smrg bool first = !prog->modules[PIPE_SHADER_VERTEX]; 1667ec681f3Smrg uint32_t variant_hash = prog->last_variant_hash; 1677ec681f3Smrg u_foreach_bit(pstage, mask) { 1687ec681f3Smrg assert(prog->shaders[pstage]); 1697ec681f3Smrg struct zink_shader_module *zm = get_shader_module_for_stage(ctx, screen, prog->shaders[pstage], prog, state); 1707ec681f3Smrg state->modules[pstage] = zm->shader; 1717ec681f3Smrg if (prog->modules[pstage] == zm) 1727ec681f3Smrg continue; 1737ec681f3Smrg if (prog->modules[pstage]) 1747ec681f3Smrg variant_hash ^= prog->modules[pstage]->hash; 1757ec681f3Smrg hash_changed = true; 1767ec681f3Smrg default_variants &= zm->default_variant; 1777ec681f3Smrg prog->modules[pstage] = zm; 1787ec681f3Smrg variant_hash ^= prog->modules[pstage]->hash; 1797ec681f3Smrg } 1807ec681f3Smrg 1817ec681f3Smrg if (hash_changed && state) { 1827ec681f3Smrg if (default_variants && !first) 1837ec681f3Smrg prog->last_variant_hash = prog->default_variant_hash; 1847ec681f3Smrg else { 1857ec681f3Smrg prog->last_variant_hash = variant_hash; 1867ec681f3Smrg if (first) { 1877ec681f3Smrg p_atomic_dec(&prog->base.reference.count); 1887ec681f3Smrg prog->default_variant_hash = prog->last_variant_hash; 1897ec681f3Smrg } 1907ec681f3Smrg } 1917ec681f3Smrg 1927ec681f3Smrg state->modules_changed = true; 1937ec681f3Smrg } 1947ec681f3Smrg} 1957ec681f3Smrg 1967ec681f3Smrgstatic uint32_t 1977ec681f3Smrghash_gfx_pipeline_state(const void *key) 1987ec681f3Smrg{ 1997ec681f3Smrg const struct zink_gfx_pipeline_state *state = key; 2007ec681f3Smrg uint32_t hash = _mesa_hash_data(key, offsetof(struct zink_gfx_pipeline_state, hash)); 2017ec681f3Smrg if (!state->have_EXT_extended_dynamic_state2) 2027ec681f3Smrg hash = XXH32(&state->primitive_restart, 1, hash); 2037ec681f3Smrg if (state->have_EXT_extended_dynamic_state) 2047ec681f3Smrg return hash; 2057ec681f3Smrg return XXH32(&state->dyn_state1, sizeof(state->dyn_state1), hash); 2067ec681f3Smrg} 2077ec681f3Smrg 2087ec681f3Smrgstatic bool 2097ec681f3Smrgequals_gfx_pipeline_state(const void *a, const void *b) 2107ec681f3Smrg{ 2117ec681f3Smrg const struct zink_gfx_pipeline_state *sa = a; 2127ec681f3Smrg const struct zink_gfx_pipeline_state *sb = b; 2137ec681f3Smrg if (!sa->have_EXT_extended_dynamic_state) { 2147ec681f3Smrg if (sa->vertex_buffers_enabled_mask != sb->vertex_buffers_enabled_mask) 2157ec681f3Smrg return false; 2167ec681f3Smrg /* if we don't have dynamic states, we have to hash the enabled vertex buffer bindings */ 2177ec681f3Smrg uint32_t mask_a = sa->vertex_buffers_enabled_mask; 2187ec681f3Smrg uint32_t mask_b = sb->vertex_buffers_enabled_mask; 2197ec681f3Smrg while (mask_a || mask_b) { 2207ec681f3Smrg unsigned idx_a = u_bit_scan(&mask_a); 2217ec681f3Smrg unsigned idx_b = u_bit_scan(&mask_b); 2227ec681f3Smrg if (sa->vertex_strides[idx_a] != sb->vertex_strides[idx_b]) 2237ec681f3Smrg return false; 2247ec681f3Smrg } 2257ec681f3Smrg if (sa->dyn_state1.front_face != sb->dyn_state1.front_face) 2267ec681f3Smrg return false; 2277ec681f3Smrg if (!!sa->dyn_state1.depth_stencil_alpha_state != !!sb->dyn_state1.depth_stencil_alpha_state || 2287ec681f3Smrg (sa->dyn_state1.depth_stencil_alpha_state && 2297ec681f3Smrg memcmp(sa->dyn_state1.depth_stencil_alpha_state, sb->dyn_state1.depth_stencil_alpha_state, 2307ec681f3Smrg sizeof(struct zink_depth_stencil_alpha_hw_state)))) 2317ec681f3Smrg return false; 2327ec681f3Smrg } 2337ec681f3Smrg if (!sa->have_EXT_extended_dynamic_state2) { 2347ec681f3Smrg if (sa->primitive_restart != sb->primitive_restart) 2357ec681f3Smrg return false; 2367ec681f3Smrg } 2377ec681f3Smrg return !memcmp(sa->modules, sb->modules, sizeof(sa->modules)) && 2387ec681f3Smrg !memcmp(a, b, offsetof(struct zink_gfx_pipeline_state, hash)); 2397ec681f3Smrg} 2407ec681f3Smrg 2417ec681f3Smrgvoid 2427ec681f3Smrgzink_update_gfx_program(struct zink_context *ctx, struct zink_gfx_program *prog) 2437ec681f3Smrg{ 2447ec681f3Smrg update_shader_modules(ctx, zink_screen(ctx->base.screen), prog, ctx->dirty_shader_stages & prog->stages_present, &ctx->gfx_pipeline_state); 2457ec681f3Smrg} 2467ec681f3Smrg 2477ec681f3SmrgVkPipelineLayout 2487ec681f3Smrgzink_pipeline_layout_create(struct zink_screen *screen, struct zink_program *pg, uint32_t *compat) 2497ec681f3Smrg{ 2507ec681f3Smrg VkPipelineLayoutCreateInfo plci = {0}; 2517ec681f3Smrg plci.sType = VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO; 2527ec681f3Smrg 2537ec681f3Smrg plci.pSetLayouts = pg->dsl; 2547ec681f3Smrg plci.setLayoutCount = pg->num_dsl; 2557ec681f3Smrg 2567ec681f3Smrg VkPushConstantRange pcr[2] = {0}; 2577ec681f3Smrg if (pg->is_compute) { 2587ec681f3Smrg if (((struct zink_compute_program*)pg)->shader->nir->info.stage == MESA_SHADER_KERNEL) { 2597ec681f3Smrg pcr[0].stageFlags = VK_SHADER_STAGE_COMPUTE_BIT; 2607ec681f3Smrg pcr[0].offset = 0; 2617ec681f3Smrg pcr[0].size = sizeof(struct zink_cs_push_constant); 2627ec681f3Smrg plci.pushConstantRangeCount = 1; 2637ec681f3Smrg } 2647ec681f3Smrg } else { 2657ec681f3Smrg pcr[0].stageFlags = VK_SHADER_STAGE_VERTEX_BIT; 2667ec681f3Smrg pcr[0].offset = offsetof(struct zink_gfx_push_constant, draw_mode_is_indexed); 2677ec681f3Smrg pcr[0].size = 2 * sizeof(unsigned); 2687ec681f3Smrg pcr[1].stageFlags = VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT; 2697ec681f3Smrg pcr[1].offset = offsetof(struct zink_gfx_push_constant, default_inner_level); 2707ec681f3Smrg pcr[1].size = sizeof(float) * 6; 2717ec681f3Smrg plci.pushConstantRangeCount = 2; 2727ec681f3Smrg } 2737ec681f3Smrg plci.pPushConstantRanges = &pcr[0]; 2747ec681f3Smrg 2757ec681f3Smrg VkPipelineLayout layout; 2767ec681f3Smrg if (VKSCR(CreatePipelineLayout)(screen->dev, &plci, NULL, &layout) != VK_SUCCESS) { 2777ec681f3Smrg debug_printf("vkCreatePipelineLayout failed!\n"); 2787ec681f3Smrg return VK_NULL_HANDLE; 2797ec681f3Smrg } 2807ec681f3Smrg 2817ec681f3Smrg *compat = _mesa_hash_data(pg->dsl, pg->num_dsl * sizeof(pg->dsl[0])); 2827ec681f3Smrg 2837ec681f3Smrg return layout; 2847ec681f3Smrg} 2857ec681f3Smrg 2867ec681f3Smrgstatic void 2877ec681f3Smrgassign_io(struct zink_gfx_program *prog, struct zink_shader *stages[ZINK_SHADER_COUNT]) 2887ec681f3Smrg{ 2897ec681f3Smrg struct zink_shader *shaders[PIPE_SHADER_TYPES]; 2907ec681f3Smrg 2917ec681f3Smrg /* build array in pipeline order */ 2927ec681f3Smrg for (unsigned i = 0; i < ZINK_SHADER_COUNT; i++) 2937ec681f3Smrg shaders[tgsi_processor_to_shader_stage(i)] = stages[i]; 2947ec681f3Smrg 2957ec681f3Smrg for (unsigned i = 0; i < MESA_SHADER_FRAGMENT;) { 2967ec681f3Smrg nir_shader *producer = shaders[i]->nir; 2977ec681f3Smrg for (unsigned j = i + 1; j < ZINK_SHADER_COUNT; i++, j++) { 2987ec681f3Smrg struct zink_shader *consumer = shaders[j]; 2997ec681f3Smrg if (!consumer) 3007ec681f3Smrg continue; 3017ec681f3Smrg if (!prog->nir[producer->info.stage]) 3027ec681f3Smrg prog->nir[producer->info.stage] = nir_shader_clone(prog, producer); 3037ec681f3Smrg if (!prog->nir[j]) 3047ec681f3Smrg prog->nir[j] = nir_shader_clone(prog, consumer->nir); 3057ec681f3Smrg zink_compiler_assign_io(prog->nir[producer->info.stage], prog->nir[j]); 3067ec681f3Smrg i = j; 3077ec681f3Smrg break; 3087ec681f3Smrg } 3097ec681f3Smrg } 3107ec681f3Smrg} 3117ec681f3Smrg 3127ec681f3Smrgstruct zink_gfx_program * 3137ec681f3Smrgzink_create_gfx_program(struct zink_context *ctx, 3147ec681f3Smrg struct zink_shader *stages[ZINK_SHADER_COUNT], 3157ec681f3Smrg unsigned vertices_per_patch) 3167ec681f3Smrg{ 3177ec681f3Smrg struct zink_screen *screen = zink_screen(ctx->base.screen); 3187ec681f3Smrg struct zink_gfx_program *prog = rzalloc(NULL, struct zink_gfx_program); 3197ec681f3Smrg if (!prog) 3207ec681f3Smrg goto fail; 3217ec681f3Smrg 3227ec681f3Smrg pipe_reference_init(&prog->base.reference, 1); 3237ec681f3Smrg 3247ec681f3Smrg for (int i = 0; i < ZINK_SHADER_COUNT; ++i) { 3257ec681f3Smrg list_inithead(&prog->shader_cache[i][0]); 3267ec681f3Smrg list_inithead(&prog->shader_cache[i][1]); 3277ec681f3Smrg if (stages[i]) { 3287ec681f3Smrg prog->shaders[i] = stages[i]; 3297ec681f3Smrg prog->stages_present |= BITFIELD_BIT(i); 3307ec681f3Smrg } 3317ec681f3Smrg } 3327ec681f3Smrg if (stages[PIPE_SHADER_TESS_EVAL] && !stages[PIPE_SHADER_TESS_CTRL]) { 3337ec681f3Smrg prog->shaders[PIPE_SHADER_TESS_EVAL]->generated = 3347ec681f3Smrg prog->shaders[PIPE_SHADER_TESS_CTRL] = 3357ec681f3Smrg zink_shader_tcs_create(screen, stages[PIPE_SHADER_VERTEX], vertices_per_patch); 3367ec681f3Smrg prog->stages_present |= BITFIELD_BIT(PIPE_SHADER_TESS_CTRL); 3377ec681f3Smrg } 3387ec681f3Smrg 3397ec681f3Smrg assign_io(prog, prog->shaders); 3407ec681f3Smrg 3417ec681f3Smrg if (stages[PIPE_SHADER_GEOMETRY]) 3427ec681f3Smrg prog->last_vertex_stage = stages[PIPE_SHADER_GEOMETRY]; 3437ec681f3Smrg else if (stages[PIPE_SHADER_TESS_EVAL]) 3447ec681f3Smrg prog->last_vertex_stage = stages[PIPE_SHADER_TESS_EVAL]; 3457ec681f3Smrg else 3467ec681f3Smrg prog->last_vertex_stage = stages[PIPE_SHADER_VERTEX]; 3477ec681f3Smrg 3487ec681f3Smrg for (int i = 0; i < ARRAY_SIZE(prog->pipelines); ++i) { 3497ec681f3Smrg _mesa_hash_table_init(&prog->pipelines[i], prog, NULL, equals_gfx_pipeline_state); 3507ec681f3Smrg /* only need first 3/4 for point/line/tri/patch */ 3517ec681f3Smrg if (screen->info.have_EXT_extended_dynamic_state && 3527ec681f3Smrg i == (prog->last_vertex_stage->nir->info.stage == MESA_SHADER_TESS_EVAL ? 4 : 3)) 3537ec681f3Smrg break; 3547ec681f3Smrg } 3557ec681f3Smrg 3567ec681f3Smrg struct mesa_sha1 sctx; 3577ec681f3Smrg _mesa_sha1_init(&sctx); 3587ec681f3Smrg for (int i = 0; i < ZINK_SHADER_COUNT; ++i) { 3597ec681f3Smrg if (prog->shaders[i]) { 3607ec681f3Smrg simple_mtx_lock(&prog->shaders[i]->lock); 3617ec681f3Smrg _mesa_set_add(prog->shaders[i]->programs, prog); 3627ec681f3Smrg simple_mtx_unlock(&prog->shaders[i]->lock); 3637ec681f3Smrg zink_gfx_program_reference(screen, NULL, prog); 3647ec681f3Smrg _mesa_sha1_update(&sctx, prog->shaders[i]->base.sha1, sizeof(prog->shaders[i]->base.sha1)); 3657ec681f3Smrg } 3667ec681f3Smrg } 3677ec681f3Smrg _mesa_sha1_final(&sctx, prog->base.sha1); 3687ec681f3Smrg 3697ec681f3Smrg if (!screen->descriptor_program_init(ctx, &prog->base)) 3707ec681f3Smrg goto fail; 3717ec681f3Smrg 3727ec681f3Smrg zink_screen_get_pipeline_cache(screen, &prog->base); 3737ec681f3Smrg return prog; 3747ec681f3Smrg 3757ec681f3Smrgfail: 3767ec681f3Smrg if (prog) 3777ec681f3Smrg zink_destroy_gfx_program(screen, prog); 3787ec681f3Smrg return NULL; 3797ec681f3Smrg} 3807ec681f3Smrg 3817ec681f3Smrgstatic uint32_t 3827ec681f3Smrghash_compute_pipeline_state(const void *key) 3837ec681f3Smrg{ 3847ec681f3Smrg const struct zink_compute_pipeline_state *state = key; 3857ec681f3Smrg uint32_t hash = _mesa_hash_data(state, offsetof(struct zink_compute_pipeline_state, hash)); 3867ec681f3Smrg if (state->use_local_size) 3877ec681f3Smrg hash = XXH32(&state->local_size[0], sizeof(state->local_size), hash); 3887ec681f3Smrg return hash; 3897ec681f3Smrg} 3907ec681f3Smrg 3917ec681f3Smrgvoid 3927ec681f3Smrgzink_program_update_compute_pipeline_state(struct zink_context *ctx, struct zink_compute_program *comp, const uint block[3]) 3937ec681f3Smrg{ 3947ec681f3Smrg struct zink_shader *zs = comp->shader; 3957ec681f3Smrg bool use_local_size = !(zs->nir->info.workgroup_size[0] || 3967ec681f3Smrg zs->nir->info.workgroup_size[1] || 3977ec681f3Smrg zs->nir->info.workgroup_size[2]); 3987ec681f3Smrg if (ctx->compute_pipeline_state.use_local_size != use_local_size) 3997ec681f3Smrg ctx->compute_pipeline_state.dirty = true; 4007ec681f3Smrg ctx->compute_pipeline_state.use_local_size = use_local_size; 4017ec681f3Smrg 4027ec681f3Smrg if (ctx->compute_pipeline_state.use_local_size) { 4037ec681f3Smrg for (int i = 0; i < ARRAY_SIZE(ctx->compute_pipeline_state.local_size); i++) { 4047ec681f3Smrg if (ctx->compute_pipeline_state.local_size[i] != block[i]) 4057ec681f3Smrg ctx->compute_pipeline_state.dirty = true; 4067ec681f3Smrg ctx->compute_pipeline_state.local_size[i] = block[i]; 4077ec681f3Smrg } 4087ec681f3Smrg } else 4097ec681f3Smrg ctx->compute_pipeline_state.local_size[0] = 4107ec681f3Smrg ctx->compute_pipeline_state.local_size[1] = 4117ec681f3Smrg ctx->compute_pipeline_state.local_size[2] = 0; 4127ec681f3Smrg} 4137ec681f3Smrg 4147ec681f3Smrgstatic bool 4157ec681f3Smrgequals_compute_pipeline_state(const void *a, const void *b) 4167ec681f3Smrg{ 4177ec681f3Smrg return memcmp(a, b, offsetof(struct zink_compute_pipeline_state, hash)) == 0; 4187ec681f3Smrg} 4197ec681f3Smrg 4207ec681f3Smrgstruct zink_compute_program * 4217ec681f3Smrgzink_create_compute_program(struct zink_context *ctx, struct zink_shader *shader) 4227ec681f3Smrg{ 4237ec681f3Smrg struct zink_screen *screen = zink_screen(ctx->base.screen); 4247ec681f3Smrg struct zink_compute_program *comp = rzalloc(NULL, struct zink_compute_program); 4257ec681f3Smrg if (!comp) 4267ec681f3Smrg goto fail; 4277ec681f3Smrg 4287ec681f3Smrg pipe_reference_init(&comp->base.reference, 1); 4297ec681f3Smrg comp->base.is_compute = true; 4307ec681f3Smrg 4317ec681f3Smrg comp->module = CALLOC_STRUCT(zink_shader_module); 4327ec681f3Smrg assert(comp->module); 4337ec681f3Smrg comp->module->shader = zink_shader_compile(screen, shader, shader->nir, NULL); 4347ec681f3Smrg assert(comp->module->shader); 4357ec681f3Smrg 4367ec681f3Smrg comp->pipelines = _mesa_hash_table_create(NULL, hash_compute_pipeline_state, 4377ec681f3Smrg equals_compute_pipeline_state); 4387ec681f3Smrg 4397ec681f3Smrg _mesa_set_add(shader->programs, comp); 4407ec681f3Smrg comp->shader = shader; 4417ec681f3Smrg memcpy(comp->base.sha1, shader->base.sha1, sizeof(shader->base.sha1)); 4427ec681f3Smrg 4437ec681f3Smrg if (!screen->descriptor_program_init(ctx, &comp->base)) 4447ec681f3Smrg goto fail; 4457ec681f3Smrg 4467ec681f3Smrg zink_screen_get_pipeline_cache(screen, &comp->base); 4477ec681f3Smrg return comp; 4487ec681f3Smrg 4497ec681f3Smrgfail: 4507ec681f3Smrg if (comp) 4517ec681f3Smrg zink_destroy_compute_program(screen, comp); 4527ec681f3Smrg return NULL; 4537ec681f3Smrg} 4547ec681f3Smrg 4557ec681f3Smrguint32_t 4567ec681f3Smrgzink_program_get_descriptor_usage(struct zink_context *ctx, enum pipe_shader_type stage, enum zink_descriptor_type type) 4577ec681f3Smrg{ 4587ec681f3Smrg struct zink_shader *zs = NULL; 4597ec681f3Smrg switch (stage) { 4607ec681f3Smrg case PIPE_SHADER_VERTEX: 4617ec681f3Smrg case PIPE_SHADER_TESS_CTRL: 4627ec681f3Smrg case PIPE_SHADER_TESS_EVAL: 4637ec681f3Smrg case PIPE_SHADER_GEOMETRY: 4647ec681f3Smrg case PIPE_SHADER_FRAGMENT: 4657ec681f3Smrg zs = ctx->gfx_stages[stage]; 4667ec681f3Smrg break; 4677ec681f3Smrg case PIPE_SHADER_COMPUTE: { 4687ec681f3Smrg zs = ctx->compute_stage; 4697ec681f3Smrg break; 4707ec681f3Smrg } 4717ec681f3Smrg default: 4727ec681f3Smrg unreachable("unknown shader type"); 4737ec681f3Smrg } 4747ec681f3Smrg if (!zs) 4757ec681f3Smrg return 0; 4767ec681f3Smrg switch (type) { 4777ec681f3Smrg case ZINK_DESCRIPTOR_TYPE_UBO: 4787ec681f3Smrg return zs->ubos_used; 4797ec681f3Smrg case ZINK_DESCRIPTOR_TYPE_SSBO: 4807ec681f3Smrg return zs->ssbos_used; 4817ec681f3Smrg case ZINK_DESCRIPTOR_TYPE_SAMPLER_VIEW: 4827ec681f3Smrg return BITSET_TEST_RANGE(zs->nir->info.textures_used, 0, PIPE_MAX_SAMPLERS - 1); 4837ec681f3Smrg case ZINK_DESCRIPTOR_TYPE_IMAGE: 4847ec681f3Smrg return zs->nir->info.images_used; 4857ec681f3Smrg default: 4867ec681f3Smrg unreachable("unknown descriptor type!"); 4877ec681f3Smrg } 4887ec681f3Smrg return 0; 4897ec681f3Smrg} 4907ec681f3Smrg 4917ec681f3Smrgbool 4927ec681f3Smrgzink_program_descriptor_is_buffer(struct zink_context *ctx, enum pipe_shader_type stage, enum zink_descriptor_type type, unsigned i) 4937ec681f3Smrg{ 4947ec681f3Smrg struct zink_shader *zs = NULL; 4957ec681f3Smrg switch (stage) { 4967ec681f3Smrg case PIPE_SHADER_VERTEX: 4977ec681f3Smrg case PIPE_SHADER_TESS_CTRL: 4987ec681f3Smrg case PIPE_SHADER_TESS_EVAL: 4997ec681f3Smrg case PIPE_SHADER_GEOMETRY: 5007ec681f3Smrg case PIPE_SHADER_FRAGMENT: 5017ec681f3Smrg zs = ctx->gfx_stages[stage]; 5027ec681f3Smrg break; 5037ec681f3Smrg case PIPE_SHADER_COMPUTE: { 5047ec681f3Smrg zs = ctx->compute_stage; 5057ec681f3Smrg break; 5067ec681f3Smrg } 5077ec681f3Smrg default: 5087ec681f3Smrg unreachable("unknown shader type"); 5097ec681f3Smrg } 5107ec681f3Smrg if (!zs) 5117ec681f3Smrg return false; 5127ec681f3Smrg return zink_shader_descriptor_is_buffer(zs, type, i); 5137ec681f3Smrg} 5147ec681f3Smrg 5157ec681f3Smrgstatic unsigned 5167ec681f3Smrgget_num_bindings(struct zink_shader *zs, enum zink_descriptor_type type) 5177ec681f3Smrg{ 5187ec681f3Smrg switch (type) { 5197ec681f3Smrg case ZINK_DESCRIPTOR_TYPE_UBO: 5207ec681f3Smrg case ZINK_DESCRIPTOR_TYPE_SSBO: 5217ec681f3Smrg return zs->num_bindings[type]; 5227ec681f3Smrg default: 5237ec681f3Smrg break; 5247ec681f3Smrg } 5257ec681f3Smrg unsigned num_bindings = 0; 5267ec681f3Smrg for (int i = 0; i < zs->num_bindings[type]; i++) 5277ec681f3Smrg num_bindings += zs->bindings[type][i].size; 5287ec681f3Smrg return num_bindings; 5297ec681f3Smrg} 5307ec681f3Smrg 5317ec681f3Smrgunsigned 5327ec681f3Smrgzink_program_num_bindings_typed(const struct zink_program *pg, enum zink_descriptor_type type, bool is_compute) 5337ec681f3Smrg{ 5347ec681f3Smrg unsigned num_bindings = 0; 5357ec681f3Smrg if (is_compute) { 5367ec681f3Smrg struct zink_compute_program *comp = (void*)pg; 5377ec681f3Smrg return get_num_bindings(comp->shader, type); 5387ec681f3Smrg } 5397ec681f3Smrg struct zink_gfx_program *prog = (void*)pg; 5407ec681f3Smrg for (unsigned i = 0; i < ZINK_SHADER_COUNT; i++) { 5417ec681f3Smrg if (prog->shaders[i]) 5427ec681f3Smrg num_bindings += get_num_bindings(prog->shaders[i], type); 5437ec681f3Smrg } 5447ec681f3Smrg return num_bindings; 5457ec681f3Smrg} 5467ec681f3Smrg 5477ec681f3Smrgunsigned 5487ec681f3Smrgzink_program_num_bindings(const struct zink_program *pg, bool is_compute) 5497ec681f3Smrg{ 5507ec681f3Smrg unsigned num_bindings = 0; 5517ec681f3Smrg for (unsigned i = 0; i < ZINK_DESCRIPTOR_TYPES; i++) 5527ec681f3Smrg num_bindings += zink_program_num_bindings_typed(pg, i, is_compute); 5537ec681f3Smrg return num_bindings; 5547ec681f3Smrg} 5557ec681f3Smrg 5567ec681f3Smrgvoid 5577ec681f3Smrgzink_destroy_gfx_program(struct zink_screen *screen, 5587ec681f3Smrg struct zink_gfx_program *prog) 5597ec681f3Smrg{ 5607ec681f3Smrg if (prog->base.layout) 5617ec681f3Smrg VKSCR(DestroyPipelineLayout)(screen->dev, prog->base.layout, NULL); 5627ec681f3Smrg 5637ec681f3Smrg for (int i = 0; i < ZINK_SHADER_COUNT; ++i) { 5647ec681f3Smrg if (prog->shaders[i]) { 5657ec681f3Smrg _mesa_set_remove_key(prog->shaders[i]->programs, prog); 5667ec681f3Smrg prog->shaders[i] = NULL; 5677ec681f3Smrg } 5687ec681f3Smrg destroy_shader_cache(screen, &prog->shader_cache[i][0]); 5697ec681f3Smrg destroy_shader_cache(screen, &prog->shader_cache[i][1]); 5707ec681f3Smrg ralloc_free(prog->nir[i]); 5717ec681f3Smrg } 5727ec681f3Smrg 5737ec681f3Smrg unsigned max_idx = ARRAY_SIZE(prog->pipelines); 5747ec681f3Smrg if (screen->info.have_EXT_extended_dynamic_state) { 5757ec681f3Smrg /* only need first 3/4 for point/line/tri/patch */ 5767ec681f3Smrg if ((prog->stages_present & 5777ec681f3Smrg (BITFIELD_BIT(PIPE_SHADER_TESS_EVAL) | BITFIELD_BIT(PIPE_SHADER_GEOMETRY))) == 5787ec681f3Smrg BITFIELD_BIT(PIPE_SHADER_TESS_EVAL)) 5797ec681f3Smrg max_idx = 4; 5807ec681f3Smrg else 5817ec681f3Smrg max_idx = 3; 5827ec681f3Smrg max_idx++; 5837ec681f3Smrg } 5847ec681f3Smrg 5857ec681f3Smrg for (int i = 0; i < max_idx; ++i) { 5867ec681f3Smrg hash_table_foreach(&prog->pipelines[i], entry) { 5877ec681f3Smrg struct gfx_pipeline_cache_entry *pc_entry = entry->data; 5887ec681f3Smrg 5897ec681f3Smrg VKSCR(DestroyPipeline)(screen->dev, pc_entry->pipeline, NULL); 5907ec681f3Smrg free(pc_entry); 5917ec681f3Smrg } 5927ec681f3Smrg } 5937ec681f3Smrg if (prog->base.pipeline_cache) 5947ec681f3Smrg VKSCR(DestroyPipelineCache)(screen->dev, prog->base.pipeline_cache, NULL); 5957ec681f3Smrg screen->descriptor_program_deinit(screen, &prog->base); 5967ec681f3Smrg 5977ec681f3Smrg ralloc_free(prog); 5987ec681f3Smrg} 5997ec681f3Smrg 6007ec681f3Smrgvoid 6017ec681f3Smrgzink_destroy_compute_program(struct zink_screen *screen, 6027ec681f3Smrg struct zink_compute_program *comp) 6037ec681f3Smrg{ 6047ec681f3Smrg if (comp->base.layout) 6057ec681f3Smrg VKSCR(DestroyPipelineLayout)(screen->dev, comp->base.layout, NULL); 6067ec681f3Smrg 6077ec681f3Smrg if (comp->shader) 6087ec681f3Smrg _mesa_set_remove_key(comp->shader->programs, comp); 6097ec681f3Smrg 6107ec681f3Smrg hash_table_foreach(comp->pipelines, entry) { 6117ec681f3Smrg struct compute_pipeline_cache_entry *pc_entry = entry->data; 6127ec681f3Smrg 6137ec681f3Smrg VKSCR(DestroyPipeline)(screen->dev, pc_entry->pipeline, NULL); 6147ec681f3Smrg free(pc_entry); 6157ec681f3Smrg } 6167ec681f3Smrg _mesa_hash_table_destroy(comp->pipelines, NULL); 6177ec681f3Smrg VKSCR(DestroyShaderModule)(screen->dev, comp->module->shader, NULL); 6187ec681f3Smrg free(comp->module); 6197ec681f3Smrg if (comp->base.pipeline_cache) 6207ec681f3Smrg VKSCR(DestroyPipelineCache)(screen->dev, comp->base.pipeline_cache, NULL); 6217ec681f3Smrg screen->descriptor_program_deinit(screen, &comp->base); 6227ec681f3Smrg 6237ec681f3Smrg ralloc_free(comp); 6247ec681f3Smrg} 6257ec681f3Smrg 6267ec681f3Smrgstatic unsigned 6277ec681f3Smrgget_pipeline_idx(bool have_EXT_extended_dynamic_state, enum pipe_prim_type mode, VkPrimitiveTopology vkmode) 6287ec681f3Smrg{ 6297ec681f3Smrg /* VK_DYNAMIC_STATE_PRIMITIVE_TOPOLOGY_EXT specifies that the topology state in 6307ec681f3Smrg * VkPipelineInputAssemblyStateCreateInfo only specifies the topology class, 6317ec681f3Smrg * and the specific topology order and adjacency must be set dynamically 6327ec681f3Smrg * with vkCmdSetPrimitiveTopologyEXT before any drawing commands. 6337ec681f3Smrg */ 6347ec681f3Smrg if (have_EXT_extended_dynamic_state) { 6357ec681f3Smrg if (mode == PIPE_PRIM_PATCHES) 6367ec681f3Smrg return 3; 6377ec681f3Smrg switch (u_reduced_prim(mode)) { 6387ec681f3Smrg case PIPE_PRIM_POINTS: 6397ec681f3Smrg return 0; 6407ec681f3Smrg case PIPE_PRIM_LINES: 6417ec681f3Smrg return 1; 6427ec681f3Smrg default: 6437ec681f3Smrg return 2; 6447ec681f3Smrg } 6457ec681f3Smrg } 6467ec681f3Smrg return vkmode; 6477ec681f3Smrg} 6487ec681f3Smrg 6497ec681f3Smrg 6507ec681f3SmrgVkPipeline 6517ec681f3Smrgzink_get_gfx_pipeline(struct zink_context *ctx, 6527ec681f3Smrg struct zink_gfx_program *prog, 6537ec681f3Smrg struct zink_gfx_pipeline_state *state, 6547ec681f3Smrg enum pipe_prim_type mode) 6557ec681f3Smrg{ 6567ec681f3Smrg struct zink_screen *screen = zink_screen(ctx->base.screen); 6577ec681f3Smrg const bool have_EXT_vertex_input_dynamic_state = screen->info.have_EXT_vertex_input_dynamic_state; 6587ec681f3Smrg const bool have_EXT_extended_dynamic_state = screen->info.have_EXT_extended_dynamic_state; 6597ec681f3Smrg 6607ec681f3Smrg VkPrimitiveTopology vkmode = zink_primitive_topology(mode); 6617ec681f3Smrg const unsigned idx = get_pipeline_idx(screen->info.have_EXT_extended_dynamic_state, mode, vkmode); 6627ec681f3Smrg assert(idx <= ARRAY_SIZE(prog->pipelines)); 6637ec681f3Smrg if (!state->dirty && !state->modules_changed && 6647ec681f3Smrg (have_EXT_vertex_input_dynamic_state || !ctx->vertex_state_changed) && 6657ec681f3Smrg idx == state->idx) 6667ec681f3Smrg return state->pipeline; 6677ec681f3Smrg 6687ec681f3Smrg struct hash_entry *entry = NULL; 6697ec681f3Smrg 6707ec681f3Smrg if (state->dirty) { 6717ec681f3Smrg if (state->pipeline) //avoid on first hash 6727ec681f3Smrg state->final_hash ^= state->hash; 6737ec681f3Smrg state->hash = hash_gfx_pipeline_state(state); 6747ec681f3Smrg state->final_hash ^= state->hash; 6757ec681f3Smrg state->dirty = false; 6767ec681f3Smrg } 6777ec681f3Smrg if (!have_EXT_vertex_input_dynamic_state && ctx->vertex_state_changed) { 6787ec681f3Smrg if (state->pipeline) 6797ec681f3Smrg state->final_hash ^= state->vertex_hash; 6807ec681f3Smrg if (!have_EXT_extended_dynamic_state) { 6817ec681f3Smrg uint32_t hash = 0; 6827ec681f3Smrg /* if we don't have dynamic states, we have to hash the enabled vertex buffer bindings */ 6837ec681f3Smrg uint32_t vertex_buffers_enabled_mask = state->vertex_buffers_enabled_mask; 6847ec681f3Smrg hash = XXH32(&vertex_buffers_enabled_mask, sizeof(uint32_t), hash); 6857ec681f3Smrg 6867ec681f3Smrg for (unsigned i = 0; i < state->element_state->num_bindings; i++) { 6877ec681f3Smrg struct pipe_vertex_buffer *vb = ctx->vertex_buffers + ctx->element_state->binding_map[i]; 6887ec681f3Smrg state->vertex_strides[i] = vb->buffer.resource ? vb->stride : 0; 6897ec681f3Smrg hash = XXH32(&state->vertex_strides[i], sizeof(uint32_t), hash); 6907ec681f3Smrg } 6917ec681f3Smrg state->vertex_hash = hash ^ state->element_state->hash; 6927ec681f3Smrg } else 6937ec681f3Smrg state->vertex_hash = state->element_state->hash; 6947ec681f3Smrg state->final_hash ^= state->vertex_hash; 6957ec681f3Smrg } 6967ec681f3Smrg state->modules_changed = false; 6977ec681f3Smrg ctx->vertex_state_changed = false; 6987ec681f3Smrg 6997ec681f3Smrg entry = _mesa_hash_table_search_pre_hashed(&prog->pipelines[idx], state->final_hash, state); 7007ec681f3Smrg 7017ec681f3Smrg if (!entry) { 7027ec681f3Smrg util_queue_fence_wait(&prog->base.cache_fence); 7037ec681f3Smrg VkPipeline pipeline = zink_create_gfx_pipeline(screen, prog, 7047ec681f3Smrg state, vkmode); 7057ec681f3Smrg if (pipeline == VK_NULL_HANDLE) 7067ec681f3Smrg return VK_NULL_HANDLE; 7077ec681f3Smrg 7087ec681f3Smrg zink_screen_update_pipeline_cache(screen, &prog->base); 7097ec681f3Smrg struct gfx_pipeline_cache_entry *pc_entry = CALLOC_STRUCT(gfx_pipeline_cache_entry); 7107ec681f3Smrg if (!pc_entry) 7117ec681f3Smrg return VK_NULL_HANDLE; 7127ec681f3Smrg 7137ec681f3Smrg memcpy(&pc_entry->state, state, sizeof(*state)); 7147ec681f3Smrg pc_entry->pipeline = pipeline; 7157ec681f3Smrg 7167ec681f3Smrg entry = _mesa_hash_table_insert_pre_hashed(&prog->pipelines[idx], state->final_hash, pc_entry, pc_entry); 7177ec681f3Smrg assert(entry); 7187ec681f3Smrg } 7197ec681f3Smrg 7207ec681f3Smrg struct gfx_pipeline_cache_entry *cache_entry = entry->data; 7217ec681f3Smrg state->pipeline = cache_entry->pipeline; 7227ec681f3Smrg state->idx = idx; 7237ec681f3Smrg return state->pipeline; 7247ec681f3Smrg} 7257ec681f3Smrg 7267ec681f3SmrgVkPipeline 7277ec681f3Smrgzink_get_compute_pipeline(struct zink_screen *screen, 7287ec681f3Smrg struct zink_compute_program *comp, 7297ec681f3Smrg struct zink_compute_pipeline_state *state) 7307ec681f3Smrg{ 7317ec681f3Smrg struct hash_entry *entry = NULL; 7327ec681f3Smrg 7337ec681f3Smrg if (!state->dirty) 7347ec681f3Smrg return state->pipeline; 7357ec681f3Smrg if (state->dirty) { 7367ec681f3Smrg state->hash = hash_compute_pipeline_state(state); 7377ec681f3Smrg state->dirty = false; 7387ec681f3Smrg } 7397ec681f3Smrg entry = _mesa_hash_table_search_pre_hashed(comp->pipelines, state->hash, state); 7407ec681f3Smrg 7417ec681f3Smrg if (!entry) { 7427ec681f3Smrg util_queue_fence_wait(&comp->base.cache_fence); 7437ec681f3Smrg VkPipeline pipeline = zink_create_compute_pipeline(screen, comp, state); 7447ec681f3Smrg 7457ec681f3Smrg if (pipeline == VK_NULL_HANDLE) 7467ec681f3Smrg return VK_NULL_HANDLE; 7477ec681f3Smrg 7487ec681f3Smrg struct compute_pipeline_cache_entry *pc_entry = CALLOC_STRUCT(compute_pipeline_cache_entry); 7497ec681f3Smrg if (!pc_entry) 7507ec681f3Smrg return VK_NULL_HANDLE; 7517ec681f3Smrg 7527ec681f3Smrg memcpy(&pc_entry->state, state, sizeof(*state)); 7537ec681f3Smrg pc_entry->pipeline = pipeline; 7547ec681f3Smrg 7557ec681f3Smrg entry = _mesa_hash_table_insert_pre_hashed(comp->pipelines, state->hash, pc_entry, pc_entry); 7567ec681f3Smrg assert(entry); 7577ec681f3Smrg } 7587ec681f3Smrg 7597ec681f3Smrg struct compute_pipeline_cache_entry *cache_entry = entry->data; 7607ec681f3Smrg state->pipeline = cache_entry->pipeline; 7617ec681f3Smrg return state->pipeline; 7627ec681f3Smrg} 7637ec681f3Smrg 7647ec681f3Smrgstatic inline void 7657ec681f3Smrgbind_stage(struct zink_context *ctx, enum pipe_shader_type stage, 7667ec681f3Smrg struct zink_shader *shader) 7677ec681f3Smrg{ 7687ec681f3Smrg if (shader && shader->nir->info.num_inlinable_uniforms) 7697ec681f3Smrg ctx->shader_has_inlinable_uniforms_mask |= 1 << stage; 7707ec681f3Smrg else 7717ec681f3Smrg ctx->shader_has_inlinable_uniforms_mask &= ~(1 << stage); 7727ec681f3Smrg 7737ec681f3Smrg if (stage == PIPE_SHADER_COMPUTE) { 7747ec681f3Smrg if (shader && shader != ctx->compute_stage) { 7757ec681f3Smrg struct hash_entry *entry = _mesa_hash_table_search(&ctx->compute_program_cache, shader); 7767ec681f3Smrg if (entry) { 7777ec681f3Smrg ctx->compute_pipeline_state.dirty = true; 7787ec681f3Smrg ctx->curr_compute = entry->data; 7797ec681f3Smrg } else { 7807ec681f3Smrg struct zink_compute_program *comp = zink_create_compute_program(ctx, shader); 7817ec681f3Smrg _mesa_hash_table_insert(&ctx->compute_program_cache, comp->shader, comp); 7827ec681f3Smrg ctx->compute_pipeline_state.dirty = true; 7837ec681f3Smrg ctx->curr_compute = comp; 7847ec681f3Smrg zink_batch_reference_program(&ctx->batch, &ctx->curr_compute->base); 7857ec681f3Smrg } 7867ec681f3Smrg } else if (!shader) 7877ec681f3Smrg ctx->curr_compute = NULL; 7887ec681f3Smrg ctx->compute_stage = shader; 7897ec681f3Smrg zink_select_launch_grid(ctx); 7907ec681f3Smrg } else { 7917ec681f3Smrg if (ctx->gfx_stages[stage]) 7927ec681f3Smrg ctx->gfx_hash ^= ctx->gfx_stages[stage]->hash; 7937ec681f3Smrg ctx->gfx_stages[stage] = shader; 7947ec681f3Smrg ctx->gfx_dirty = ctx->gfx_stages[PIPE_SHADER_FRAGMENT] && ctx->gfx_stages[PIPE_SHADER_VERTEX]; 7957ec681f3Smrg ctx->gfx_pipeline_state.modules_changed = true; 7967ec681f3Smrg if (shader) { 7977ec681f3Smrg ctx->shader_stages |= BITFIELD_BIT(stage); 7987ec681f3Smrg ctx->gfx_hash ^= ctx->gfx_stages[stage]->hash; 7997ec681f3Smrg } else { 8007ec681f3Smrg ctx->gfx_pipeline_state.modules[stage] = VK_NULL_HANDLE; 8017ec681f3Smrg if (ctx->curr_program) 8027ec681f3Smrg ctx->gfx_pipeline_state.final_hash ^= ctx->curr_program->last_variant_hash; 8037ec681f3Smrg ctx->curr_program = NULL; 8047ec681f3Smrg ctx->shader_stages &= ~BITFIELD_BIT(stage); 8057ec681f3Smrg } 8067ec681f3Smrg } 8077ec681f3Smrg} 8087ec681f3Smrg 8097ec681f3Smrgstatic void 8107ec681f3Smrgbind_last_vertex_stage(struct zink_context *ctx) 8117ec681f3Smrg{ 8127ec681f3Smrg enum pipe_shader_type old = ctx->last_vertex_stage ? pipe_shader_type_from_mesa(ctx->last_vertex_stage->nir->info.stage) : PIPE_SHADER_TYPES; 8137ec681f3Smrg if (ctx->gfx_stages[PIPE_SHADER_GEOMETRY]) 8147ec681f3Smrg ctx->last_vertex_stage = ctx->gfx_stages[PIPE_SHADER_GEOMETRY]; 8157ec681f3Smrg else if (ctx->gfx_stages[PIPE_SHADER_TESS_EVAL]) 8167ec681f3Smrg ctx->last_vertex_stage = ctx->gfx_stages[PIPE_SHADER_TESS_EVAL]; 8177ec681f3Smrg else 8187ec681f3Smrg ctx->last_vertex_stage = ctx->gfx_stages[PIPE_SHADER_VERTEX]; 8197ec681f3Smrg enum pipe_shader_type current = ctx->last_vertex_stage ? pipe_shader_type_from_mesa(ctx->last_vertex_stage->nir->info.stage) : PIPE_SHADER_VERTEX; 8207ec681f3Smrg if (old != current) { 8217ec681f3Smrg if (old != PIPE_SHADER_TYPES) { 8227ec681f3Smrg memset(&ctx->gfx_pipeline_state.shader_keys.key[old].key.vs_base, 0, sizeof(struct zink_vs_key_base)); 8237ec681f3Smrg ctx->dirty_shader_stages |= BITFIELD_BIT(old); 8247ec681f3Smrg } else { 8257ec681f3Smrg /* always unset vertex shader values when changing to a non-vs last stage */ 8267ec681f3Smrg memset(&ctx->gfx_pipeline_state.shader_keys.key[PIPE_SHADER_VERTEX].key.vs_base, 0, sizeof(struct zink_vs_key_base)); 8277ec681f3Smrg } 8287ec681f3Smrg ctx->last_vertex_stage_dirty = true; 8297ec681f3Smrg } 8307ec681f3Smrg} 8317ec681f3Smrg 8327ec681f3Smrgstatic void 8337ec681f3Smrgzink_bind_vs_state(struct pipe_context *pctx, 8347ec681f3Smrg void *cso) 8357ec681f3Smrg{ 8367ec681f3Smrg struct zink_context *ctx = zink_context(pctx); 8377ec681f3Smrg if (!cso && !ctx->gfx_stages[PIPE_SHADER_VERTEX]) 8387ec681f3Smrg return; 8397ec681f3Smrg void *prev = ctx->gfx_stages[PIPE_SHADER_VERTEX]; 8407ec681f3Smrg bind_stage(ctx, PIPE_SHADER_VERTEX, cso); 8417ec681f3Smrg if (cso) { 8427ec681f3Smrg struct zink_shader *zs = cso; 8437ec681f3Smrg ctx->shader_reads_drawid = BITSET_TEST(zs->nir->info.system_values_read, SYSTEM_VALUE_DRAW_ID); 8447ec681f3Smrg ctx->shader_reads_basevertex = BITSET_TEST(zs->nir->info.system_values_read, SYSTEM_VALUE_BASE_VERTEX); 8457ec681f3Smrg } else { 8467ec681f3Smrg ctx->shader_reads_drawid = false; 8477ec681f3Smrg ctx->shader_reads_basevertex = false; 8487ec681f3Smrg } 8497ec681f3Smrg if (ctx->last_vertex_stage == prev) 8507ec681f3Smrg ctx->last_vertex_stage = cso; 8517ec681f3Smrg 8527ec681f3Smrg} 8537ec681f3Smrg 8547ec681f3Smrg/* if gl_SampleMask[] is written to, we have to ensure that we get a shader with the same sample count: 8557ec681f3Smrg * in GL, samples==1 means ignore gl_SampleMask[] 8567ec681f3Smrg * in VK, gl_SampleMask[] is never ignored 8577ec681f3Smrg */ 8587ec681f3Smrgvoid 8597ec681f3Smrgzink_update_fs_key_samples(struct zink_context *ctx) 8607ec681f3Smrg{ 8617ec681f3Smrg if (!ctx->gfx_stages[PIPE_SHADER_FRAGMENT]) 8627ec681f3Smrg return; 8637ec681f3Smrg nir_shader *nir = ctx->gfx_stages[PIPE_SHADER_FRAGMENT]->nir; 8647ec681f3Smrg if (nir->info.outputs_written & (1 << FRAG_RESULT_SAMPLE_MASK)) { 8657ec681f3Smrg bool samples = zink_get_fs_key(ctx)->samples; 8667ec681f3Smrg if (samples != (ctx->fb_state.samples > 1)) 8677ec681f3Smrg zink_set_fs_key(ctx)->samples = ctx->fb_state.samples > 1; 8687ec681f3Smrg } 8697ec681f3Smrg} 8707ec681f3Smrg 8717ec681f3Smrgstatic void 8727ec681f3Smrgzink_bind_fs_state(struct pipe_context *pctx, 8737ec681f3Smrg void *cso) 8747ec681f3Smrg{ 8757ec681f3Smrg struct zink_context *ctx = zink_context(pctx); 8767ec681f3Smrg if (!cso && !ctx->gfx_stages[PIPE_SHADER_FRAGMENT]) 8777ec681f3Smrg return; 8787ec681f3Smrg bind_stage(ctx, PIPE_SHADER_FRAGMENT, cso); 8797ec681f3Smrg ctx->fbfetch_outputs = 0; 8807ec681f3Smrg if (cso) { 8817ec681f3Smrg nir_shader *nir = ctx->gfx_stages[PIPE_SHADER_FRAGMENT]->nir; 8827ec681f3Smrg if (nir->info.fs.uses_fbfetch_output) { 8837ec681f3Smrg nir_foreach_shader_out_variable(var, ctx->gfx_stages[PIPE_SHADER_FRAGMENT]->nir) { 8847ec681f3Smrg if (var->data.fb_fetch_output) 8857ec681f3Smrg ctx->fbfetch_outputs |= BITFIELD_BIT(var->data.location - FRAG_RESULT_DATA0); 8867ec681f3Smrg } 8877ec681f3Smrg } 8887ec681f3Smrg zink_update_fs_key_samples(ctx); 8897ec681f3Smrg } 8907ec681f3Smrg zink_update_fbfetch(ctx); 8917ec681f3Smrg} 8927ec681f3Smrg 8937ec681f3Smrgstatic void 8947ec681f3Smrgzink_bind_gs_state(struct pipe_context *pctx, 8957ec681f3Smrg void *cso) 8967ec681f3Smrg{ 8977ec681f3Smrg struct zink_context *ctx = zink_context(pctx); 8987ec681f3Smrg if (!cso && !ctx->gfx_stages[PIPE_SHADER_GEOMETRY]) 8997ec681f3Smrg return; 9007ec681f3Smrg bool had_points = ctx->gfx_stages[PIPE_SHADER_GEOMETRY] ? ctx->gfx_stages[PIPE_SHADER_GEOMETRY]->nir->info.gs.output_primitive == GL_POINTS : false; 9017ec681f3Smrg bind_stage(ctx, PIPE_SHADER_GEOMETRY, cso); 9027ec681f3Smrg bind_last_vertex_stage(ctx); 9037ec681f3Smrg if (cso) { 9047ec681f3Smrg if (!had_points && ctx->last_vertex_stage->nir->info.gs.output_primitive == GL_POINTS) 9057ec681f3Smrg ctx->gfx_pipeline_state.has_points++; 9067ec681f3Smrg } else { 9077ec681f3Smrg if (had_points) 9087ec681f3Smrg ctx->gfx_pipeline_state.has_points--; 9097ec681f3Smrg } 9107ec681f3Smrg} 9117ec681f3Smrg 9127ec681f3Smrgstatic void 9137ec681f3Smrgzink_bind_tcs_state(struct pipe_context *pctx, 9147ec681f3Smrg void *cso) 9157ec681f3Smrg{ 9167ec681f3Smrg bind_stage(zink_context(pctx), PIPE_SHADER_TESS_CTRL, cso); 9177ec681f3Smrg} 9187ec681f3Smrg 9197ec681f3Smrgstatic void 9207ec681f3Smrgzink_bind_tes_state(struct pipe_context *pctx, 9217ec681f3Smrg void *cso) 9227ec681f3Smrg{ 9237ec681f3Smrg struct zink_context *ctx = zink_context(pctx); 9247ec681f3Smrg if (!cso && !ctx->gfx_stages[PIPE_SHADER_TESS_EVAL]) 9257ec681f3Smrg return; 9267ec681f3Smrg if (!!ctx->gfx_stages[PIPE_SHADER_TESS_EVAL] != !!cso) { 9277ec681f3Smrg if (!cso) { 9287ec681f3Smrg /* if unsetting a TESS that uses a generated TCS, ensure the TCS is unset */ 9297ec681f3Smrg if (ctx->gfx_stages[PIPE_SHADER_TESS_EVAL]->generated) 9307ec681f3Smrg ctx->gfx_stages[PIPE_SHADER_TESS_CTRL] = NULL; 9317ec681f3Smrg } 9327ec681f3Smrg } 9337ec681f3Smrg bind_stage(ctx, PIPE_SHADER_TESS_EVAL, cso); 9347ec681f3Smrg bind_last_vertex_stage(ctx); 9357ec681f3Smrg} 9367ec681f3Smrg 9377ec681f3Smrgstatic void * 9387ec681f3Smrgzink_create_cs_state(struct pipe_context *pctx, 9397ec681f3Smrg const struct pipe_compute_state *shader) 9407ec681f3Smrg{ 9417ec681f3Smrg struct nir_shader *nir; 9427ec681f3Smrg if (shader->ir_type != PIPE_SHADER_IR_NIR) 9437ec681f3Smrg nir = zink_tgsi_to_nir(pctx->screen, shader->prog); 9447ec681f3Smrg else 9457ec681f3Smrg nir = (struct nir_shader *)shader->prog; 9467ec681f3Smrg 9477ec681f3Smrg return zink_shader_create(zink_screen(pctx->screen), nir, NULL); 9487ec681f3Smrg} 9497ec681f3Smrg 9507ec681f3Smrgstatic void 9517ec681f3Smrgzink_bind_cs_state(struct pipe_context *pctx, 9527ec681f3Smrg void *cso) 9537ec681f3Smrg{ 9547ec681f3Smrg bind_stage(zink_context(pctx), PIPE_SHADER_COMPUTE, cso); 9557ec681f3Smrg} 9567ec681f3Smrg 9577ec681f3Smrgvoid 9587ec681f3Smrgzink_delete_shader_state(struct pipe_context *pctx, void *cso) 9597ec681f3Smrg{ 9607ec681f3Smrg zink_shader_free(zink_context(pctx), cso); 9617ec681f3Smrg} 9627ec681f3Smrg 9637ec681f3Smrgvoid * 9647ec681f3Smrgzink_create_gfx_shader_state(struct pipe_context *pctx, const struct pipe_shader_state *shader) 9657ec681f3Smrg{ 9667ec681f3Smrg nir_shader *nir; 9677ec681f3Smrg if (shader->type != PIPE_SHADER_IR_NIR) 9687ec681f3Smrg nir = zink_tgsi_to_nir(pctx->screen, shader->tokens); 9697ec681f3Smrg else 9707ec681f3Smrg nir = (struct nir_shader *)shader->ir.nir; 9717ec681f3Smrg 9727ec681f3Smrg return zink_shader_create(zink_screen(pctx->screen), nir, &shader->stream_output); 9737ec681f3Smrg} 9747ec681f3Smrg 9757ec681f3Smrgstatic void 9767ec681f3Smrgzink_delete_cached_shader_state(struct pipe_context *pctx, void *cso) 9777ec681f3Smrg{ 9787ec681f3Smrg struct zink_screen *screen = zink_screen(pctx->screen); 9797ec681f3Smrg util_shader_reference(pctx, &screen->shaders, &cso, NULL); 9807ec681f3Smrg} 9817ec681f3Smrg 9827ec681f3Smrgstatic void * 9837ec681f3Smrgzink_create_cached_shader_state(struct pipe_context *pctx, const struct pipe_shader_state *shader) 9847ec681f3Smrg{ 9857ec681f3Smrg bool cache_hit; 9867ec681f3Smrg struct zink_screen *screen = zink_screen(pctx->screen); 9877ec681f3Smrg return util_live_shader_cache_get(pctx, &screen->shaders, shader, &cache_hit); 9887ec681f3Smrg} 9897ec681f3Smrg 9907ec681f3Smrgvoid 9917ec681f3Smrgzink_program_init(struct zink_context *ctx) 9927ec681f3Smrg{ 9937ec681f3Smrg ctx->base.create_vs_state = zink_create_cached_shader_state; 9947ec681f3Smrg ctx->base.bind_vs_state = zink_bind_vs_state; 9957ec681f3Smrg ctx->base.delete_vs_state = zink_delete_cached_shader_state; 9967ec681f3Smrg 9977ec681f3Smrg ctx->base.create_fs_state = zink_create_cached_shader_state; 9987ec681f3Smrg ctx->base.bind_fs_state = zink_bind_fs_state; 9997ec681f3Smrg ctx->base.delete_fs_state = zink_delete_cached_shader_state; 10007ec681f3Smrg 10017ec681f3Smrg ctx->base.create_gs_state = zink_create_cached_shader_state; 10027ec681f3Smrg ctx->base.bind_gs_state = zink_bind_gs_state; 10037ec681f3Smrg ctx->base.delete_gs_state = zink_delete_cached_shader_state; 10047ec681f3Smrg 10057ec681f3Smrg ctx->base.create_tcs_state = zink_create_cached_shader_state; 10067ec681f3Smrg ctx->base.bind_tcs_state = zink_bind_tcs_state; 10077ec681f3Smrg ctx->base.delete_tcs_state = zink_delete_cached_shader_state; 10087ec681f3Smrg 10097ec681f3Smrg ctx->base.create_tes_state = zink_create_cached_shader_state; 10107ec681f3Smrg ctx->base.bind_tes_state = zink_bind_tes_state; 10117ec681f3Smrg ctx->base.delete_tes_state = zink_delete_cached_shader_state; 10127ec681f3Smrg 10137ec681f3Smrg ctx->base.create_compute_state = zink_create_cs_state; 10147ec681f3Smrg ctx->base.bind_compute_state = zink_bind_cs_state; 10157ec681f3Smrg ctx->base.delete_compute_state = zink_delete_shader_state; 10167ec681f3Smrg} 1017