/*
 * Copyright 2018 Collabora Ltd.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * on the rights to use, copy, modify, merge, publish, distribute, sub
 * license, and/or sell copies of the Software, and to permit persons to whom
 * the Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 */

#include "zink_program.h"

#include "zink_compiler.h"
#include "zink_context.h"
#include "zink_descriptors.h"
#include "zink_helpers.h"
#include "zink_render_pass.h"
#include "zink_resource.h"
#include "zink_screen.h"
#include "zink_state.h"
#include "zink_inlines.h"

#include "util/hash_table.h"
#include "util/set.h"
#include "util/u_debug.h"
#include "util/u_memory.h"
#include "util/u_prim.h"
#include "tgsi/tgsi_from_mesa.h"

/* for pipeline cache */
#define XXH_INLINE_ALL
#include "util/xxhash.h"

struct gfx_pipeline_cache_entry {
   struct zink_gfx_pipeline_state state;
   VkPipeline pipeline;
};

struct compute_pipeline_cache_entry {
   struct zink_compute_pipeline_state state;
   VkPipeline pipeline;
};

void
debug_describe_zink_gfx_program(char *buf, const struct zink_gfx_program *ptr)
{
   sprintf(buf, "zink_gfx_program");
}

void
debug_describe_zink_compute_program(char *buf, const struct zink_compute_program *ptr)
{
   sprintf(buf, "zink_compute_program");
}

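/* a shader module's key blob is the packed zink_shader_key immediately followed by any
 * inlined uniform values, so both the comparison and the hash cover the whole blob
 */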
static bool
shader_key_matches(const struct zink_shader_module *zm, const struct zink_shader_key *key, unsigned num_uniforms)
{
   if (zm->key_size != key->size || zm->num_uniforms != num_uniforms)
      return false;
   return !memcmp(zm->key, key, zm->key_size) &&
          (!num_uniforms || !memcmp(zm->key + zm->key_size, key->base.inlined_uniform_values, zm->num_uniforms * sizeof(uint32_t)));
}

static uint32_t
shader_module_hash(const struct zink_shader_module *zm)
{
   unsigned key_size = zm->key_size + zm->num_uniforms * sizeof(uint32_t);
   return _mesa_hash_data(zm->key, key_size);
}

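/* find (or compile) the shader module variant matching this stage's current shader key;
 * variants with inlined uniforms live in a separate cache list and are capped at
 * ZINK_MAX_INLINED_VARIANTS, after which inlining is disabled for the key
 */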
static struct zink_shader_module *
get_shader_module_for_stage(struct zink_context *ctx, struct zink_screen *screen,
                            struct zink_shader *zs, struct zink_gfx_program *prog,
                            struct zink_gfx_pipeline_state *state)
{
   gl_shader_stage stage = zs->nir->info.stage;
   enum pipe_shader_type pstage = pipe_shader_type_from_mesa(stage);
   VkShaderModule mod;
   struct zink_shader_module *zm = NULL;
   unsigned base_size = 0;
   struct zink_shader_key *key = &state->shader_keys.key[pstage];

   if (ctx && zs->nir->info.num_inlinable_uniforms &&
       ctx->inlinable_uniforms_valid_mask & BITFIELD64_BIT(pstage)) {
      if (prog->inlined_variant_count[pstage] < ZINK_MAX_INLINED_VARIANTS)
         base_size = zs->nir->info.num_inlinable_uniforms;
      else
         key->inline_uniforms = false;
   }

   struct zink_shader_module *iter, *next;
   LIST_FOR_EACH_ENTRY_SAFE(iter, next, &prog->shader_cache[pstage][!!base_size], list) {
      if (!shader_key_matches(iter, key, base_size))
         continue;
      list_delinit(&iter->list);
      zm = iter;
      break;
   }

   if (!zm) {
      zm = malloc(sizeof(struct zink_shader_module) + key->size + base_size * sizeof(uint32_t));
      if (!zm) {
         return NULL;
      }
      mod = zink_shader_compile(screen, zs, prog->nir[stage], key);
      if (!mod) {
         FREE(zm);
         return NULL;
      }
      zm->shader = mod;
      list_inithead(&zm->list);
      zm->num_uniforms = base_size;
      zm->key_size = key->size;
      memcpy(zm->key, key, key->size);
      if (base_size)
         memcpy(zm->key + key->size, &key->base, base_size * sizeof(uint32_t));
      zm->hash = shader_module_hash(zm);
      zm->default_variant = !base_size && list_is_empty(&prog->shader_cache[pstage][0]);
      if (base_size)
         prog->inlined_variant_count[pstage]++;
   }
   list_add(&zm->list, &prog->shader_cache[pstage][!!base_size]);
   return zm;
}

static void
zink_destroy_shader_module(struct zink_screen *screen, struct zink_shader_module *zm)
{
   VKSCR(DestroyShaderModule)(screen->dev, zm->shader, NULL);
   free(zm);
}

static void
destroy_shader_cache(struct zink_screen *screen, struct list_head *sc)
{
   struct zink_shader_module *zm, *next;
   LIST_FOR_EACH_ENTRY_SAFE(zm, next, sc, list) {
      list_delinit(&zm->list);
      zink_destroy_shader_module(screen, zm);
   }
}

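/* swap in the shader modules for every dirty stage; the program's variant hash is maintained
 * incrementally by XORing out each replaced module's hash and XORing in the new one
 */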
static void
update_shader_modules(struct zink_context *ctx,
                      struct zink_screen *screen,
                      struct zink_gfx_program *prog, uint32_t mask,
                      struct zink_gfx_pipeline_state *state)
{
   bool hash_changed = false;
   bool default_variants = true;
   bool first = !prog->modules[PIPE_SHADER_VERTEX];
   uint32_t variant_hash = prog->last_variant_hash;
   u_foreach_bit(pstage, mask) {
      assert(prog->shaders[pstage]);
      struct zink_shader_module *zm = get_shader_module_for_stage(ctx, screen, prog->shaders[pstage], prog, state);
      state->modules[pstage] = zm->shader;
      if (prog->modules[pstage] == zm)
         continue;
      if (prog->modules[pstage])
         variant_hash ^= prog->modules[pstage]->hash;
      hash_changed = true;
      default_variants &= zm->default_variant;
      prog->modules[pstage] = zm;
      variant_hash ^= prog->modules[pstage]->hash;
   }

   if (hash_changed && state) {
      if (default_variants && !first)
         prog->last_variant_hash = prog->default_variant_hash;
      else {
         prog->last_variant_hash = variant_hash;
         if (first) {
            p_atomic_dec(&prog->base.reference.count);
            prog->default_variant_hash = prog->last_variant_hash;
         }
      }

      state->modules_changed = true;
   }
}

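/* the base pipeline hash covers the state struct up to the 'hash' member; state that can be
 * set dynamically is only mixed in when the corresponding extension is unavailable
 */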
static uint32_t
hash_gfx_pipeline_state(const void *key)
{
   const struct zink_gfx_pipeline_state *state = key;
   uint32_t hash = _mesa_hash_data(key, offsetof(struct zink_gfx_pipeline_state, hash));
   if (!state->have_EXT_extended_dynamic_state2)
      hash = XXH32(&state->primitive_restart, 1, hash);
   if (state->have_EXT_extended_dynamic_state)
      return hash;
   return XXH32(&state->dyn_state1, sizeof(state->dyn_state1), hash);
}

static bool
equals_gfx_pipeline_state(const void *a, const void *b)
{
   const struct zink_gfx_pipeline_state *sa = a;
   const struct zink_gfx_pipeline_state *sb = b;
   if (!sa->have_EXT_extended_dynamic_state) {
      if (sa->vertex_buffers_enabled_mask != sb->vertex_buffers_enabled_mask)
         return false;
      /* if we don't have dynamic states, we have to hash the enabled vertex buffer bindings */
      uint32_t mask_a = sa->vertex_buffers_enabled_mask;
      uint32_t mask_b = sb->vertex_buffers_enabled_mask;
      while (mask_a || mask_b) {
         unsigned idx_a = u_bit_scan(&mask_a);
         unsigned idx_b = u_bit_scan(&mask_b);
         if (sa->vertex_strides[idx_a] != sb->vertex_strides[idx_b])
            return false;
      }
      if (sa->dyn_state1.front_face != sb->dyn_state1.front_face)
         return false;
      if (!!sa->dyn_state1.depth_stencil_alpha_state != !!sb->dyn_state1.depth_stencil_alpha_state ||
          (sa->dyn_state1.depth_stencil_alpha_state &&
           memcmp(sa->dyn_state1.depth_stencil_alpha_state, sb->dyn_state1.depth_stencil_alpha_state,
                  sizeof(struct zink_depth_stencil_alpha_hw_state))))
         return false;
   }
   if (!sa->have_EXT_extended_dynamic_state2) {
      if (sa->primitive_restart != sb->primitive_restart)
         return false;
   }
   return !memcmp(sa->modules, sb->modules, sizeof(sa->modules)) &&
          !memcmp(a, b, offsetof(struct zink_gfx_pipeline_state, hash));
}

void
zink_update_gfx_program(struct zink_context *ctx, struct zink_gfx_program *prog)
{
   update_shader_modules(ctx, zink_screen(ctx->base.screen), prog, ctx->dirty_shader_stages & prog->stages_present, &ctx->gfx_pipeline_state);
}

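/* graphics layouts always declare two push constant ranges (vertex-stage draw parameters and
 * the TCS default tessellation levels); compute only needs one, and only for OpenCL-style kernels
 */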
VkPipelineLayout
zink_pipeline_layout_create(struct zink_screen *screen, struct zink_program *pg, uint32_t *compat)
{
   VkPipelineLayoutCreateInfo plci = {0};
   plci.sType = VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO;

   plci.pSetLayouts = pg->dsl;
   plci.setLayoutCount = pg->num_dsl;

   VkPushConstantRange pcr[2] = {0};
   if (pg->is_compute) {
      if (((struct zink_compute_program*)pg)->shader->nir->info.stage == MESA_SHADER_KERNEL) {
         pcr[0].stageFlags = VK_SHADER_STAGE_COMPUTE_BIT;
         pcr[0].offset = 0;
         pcr[0].size = sizeof(struct zink_cs_push_constant);
         plci.pushConstantRangeCount = 1;
      }
   } else {
      pcr[0].stageFlags = VK_SHADER_STAGE_VERTEX_BIT;
      pcr[0].offset = offsetof(struct zink_gfx_push_constant, draw_mode_is_indexed);
      pcr[0].size = 2 * sizeof(unsigned);
      pcr[1].stageFlags = VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT;
      pcr[1].offset = offsetof(struct zink_gfx_push_constant, default_inner_level);
      pcr[1].size = sizeof(float) * 6;
      plci.pushConstantRangeCount = 2;
   }
   plci.pPushConstantRanges = &pcr[0];

   VkPipelineLayout layout;
   if (VKSCR(CreatePipelineLayout)(screen->dev, &plci, NULL, &layout) != VK_SUCCESS) {
      debug_printf("vkCreatePipelineLayout failed!\n");
      return VK_NULL_HANDLE;
   }

   *compat = _mesa_hash_data(pg->dsl, pg->num_dsl * sizeof(pg->dsl[0]));

   return layout;
}

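/* walk the stages in pipeline order and assign IO between each producer/consumer pair;
 * the nir shaders are cloned into the program first so the context's copies stay untouched
 */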
static void
assign_io(struct zink_gfx_program *prog, struct zink_shader *stages[ZINK_SHADER_COUNT])
{
   struct zink_shader *shaders[PIPE_SHADER_TYPES];

   /* build array in pipeline order */
   for (unsigned i = 0; i < ZINK_SHADER_COUNT; i++)
      shaders[tgsi_processor_to_shader_stage(i)] = stages[i];

   for (unsigned i = 0; i < MESA_SHADER_FRAGMENT;) {
      nir_shader *producer = shaders[i]->nir;
      for (unsigned j = i + 1; j < ZINK_SHADER_COUNT; i++, j++) {
         struct zink_shader *consumer = shaders[j];
         if (!consumer)
            continue;
         if (!prog->nir[producer->info.stage])
            prog->nir[producer->info.stage] = nir_shader_clone(prog, producer);
         if (!prog->nir[j])
            prog->nir[j] = nir_shader_clone(prog, consumer->nir);
         zink_compiler_assign_io(prog->nir[producer->info.stage], prog->nir[j]);
         i = j;
         break;
      }
   }
}

struct zink_gfx_program *
zink_create_gfx_program(struct zink_context *ctx,
                        struct zink_shader *stages[ZINK_SHADER_COUNT],
                        unsigned vertices_per_patch)
{
   struct zink_screen *screen = zink_screen(ctx->base.screen);
   struct zink_gfx_program *prog = rzalloc(NULL, struct zink_gfx_program);
   if (!prog)
      goto fail;

   pipe_reference_init(&prog->base.reference, 1);

   for (int i = 0; i < ZINK_SHADER_COUNT; ++i) {
      list_inithead(&prog->shader_cache[i][0]);
      list_inithead(&prog->shader_cache[i][1]);
      if (stages[i]) {
         prog->shaders[i] = stages[i];
         prog->stages_present |= BITFIELD_BIT(i);
      }
   }
   if (stages[PIPE_SHADER_TESS_EVAL] && !stages[PIPE_SHADER_TESS_CTRL]) {
      prog->shaders[PIPE_SHADER_TESS_EVAL]->generated =
      prog->shaders[PIPE_SHADER_TESS_CTRL] =
        zink_shader_tcs_create(screen, stages[PIPE_SHADER_VERTEX], vertices_per_patch);
      prog->stages_present |= BITFIELD_BIT(PIPE_SHADER_TESS_CTRL);
   }

   assign_io(prog, prog->shaders);

   if (stages[PIPE_SHADER_GEOMETRY])
      prog->last_vertex_stage = stages[PIPE_SHADER_GEOMETRY];
   else if (stages[PIPE_SHADER_TESS_EVAL])
      prog->last_vertex_stage = stages[PIPE_SHADER_TESS_EVAL];
   else
      prog->last_vertex_stage = stages[PIPE_SHADER_VERTEX];

   for (int i = 0; i < ARRAY_SIZE(prog->pipelines); ++i) {
      _mesa_hash_table_init(&prog->pipelines[i], prog, NULL, equals_gfx_pipeline_state);
      /* only need first 3/4 for point/line/tri/patch */
      if (screen->info.have_EXT_extended_dynamic_state &&
          i == (prog->last_vertex_stage->nir->info.stage == MESA_SHADER_TESS_EVAL ? 4 : 3))
         break;
   }

   struct mesa_sha1 sctx;
   _mesa_sha1_init(&sctx);
   for (int i = 0; i < ZINK_SHADER_COUNT; ++i) {
      if (prog->shaders[i]) {
         simple_mtx_lock(&prog->shaders[i]->lock);
         _mesa_set_add(prog->shaders[i]->programs, prog);
         simple_mtx_unlock(&prog->shaders[i]->lock);
         zink_gfx_program_reference(screen, NULL, prog);
         _mesa_sha1_update(&sctx, prog->shaders[i]->base.sha1, sizeof(prog->shaders[i]->base.sha1));
      }
   }
   _mesa_sha1_final(&sctx, prog->base.sha1);

   if (!screen->descriptor_program_init(ctx, &prog->base))
      goto fail;

   zink_screen_get_pipeline_cache(screen, &prog->base);
   return prog;

fail:
   if (prog)
      zink_destroy_gfx_program(screen, prog);
   return NULL;
}

static uint32_t
hash_compute_pipeline_state(const void *key)
{
   const struct zink_compute_pipeline_state *state = key;
   uint32_t hash = _mesa_hash_data(state, offsetof(struct zink_compute_pipeline_state, hash));
   if (state->use_local_size)
      hash = XXH32(&state->local_size[0], sizeof(state->local_size), hash);
   return hash;
}

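/* a compute shader with no compile-time workgroup size takes its local size from the launch
 * grid's block dimensions, which then become part of the pipeline state and its hash
 */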
void
zink_program_update_compute_pipeline_state(struct zink_context *ctx, struct zink_compute_program *comp, const uint block[3])
{
   struct zink_shader *zs = comp->shader;
   bool use_local_size = !(zs->nir->info.workgroup_size[0] ||
                           zs->nir->info.workgroup_size[1] ||
                           zs->nir->info.workgroup_size[2]);
   if (ctx->compute_pipeline_state.use_local_size != use_local_size)
      ctx->compute_pipeline_state.dirty = true;
   ctx->compute_pipeline_state.use_local_size = use_local_size;

   if (ctx->compute_pipeline_state.use_local_size) {
      for (int i = 0; i < ARRAY_SIZE(ctx->compute_pipeline_state.local_size); i++) {
         if (ctx->compute_pipeline_state.local_size[i] != block[i])
            ctx->compute_pipeline_state.dirty = true;
         ctx->compute_pipeline_state.local_size[i] = block[i];
      }
   } else
      ctx->compute_pipeline_state.local_size[0] =
      ctx->compute_pipeline_state.local_size[1] =
      ctx->compute_pipeline_state.local_size[2] = 0;
}

static bool
equals_compute_pipeline_state(const void *a, const void *b)
{
   return memcmp(a, b, offsetof(struct zink_compute_pipeline_state, hash)) == 0;
}

struct zink_compute_program *
zink_create_compute_program(struct zink_context *ctx, struct zink_shader *shader)
{
   struct zink_screen *screen = zink_screen(ctx->base.screen);
   struct zink_compute_program *comp = rzalloc(NULL, struct zink_compute_program);
   if (!comp)
      goto fail;

   pipe_reference_init(&comp->base.reference, 1);
   comp->base.is_compute = true;

   comp->module = CALLOC_STRUCT(zink_shader_module);
   assert(comp->module);
   comp->module->shader = zink_shader_compile(screen, shader, shader->nir, NULL);
   assert(comp->module->shader);

   comp->pipelines = _mesa_hash_table_create(NULL, hash_compute_pipeline_state,
                                             equals_compute_pipeline_state);

   _mesa_set_add(shader->programs, comp);
   comp->shader = shader;
   memcpy(comp->base.sha1, shader->base.sha1, sizeof(shader->base.sha1));

   if (!screen->descriptor_program_init(ctx, &comp->base))
      goto fail;

   zink_screen_get_pipeline_cache(screen, &comp->base);
   return comp;

fail:
   if (comp)
      zink_destroy_compute_program(screen, comp);
   return NULL;
}

uint32_t
zink_program_get_descriptor_usage(struct zink_context *ctx, enum pipe_shader_type stage, enum zink_descriptor_type type)
{
   struct zink_shader *zs = NULL;
   switch (stage) {
   case PIPE_SHADER_VERTEX:
   case PIPE_SHADER_TESS_CTRL:
   case PIPE_SHADER_TESS_EVAL:
   case PIPE_SHADER_GEOMETRY:
   case PIPE_SHADER_FRAGMENT:
      zs = ctx->gfx_stages[stage];
      break;
   case PIPE_SHADER_COMPUTE: {
      zs = ctx->compute_stage;
      break;
   }
   default:
      unreachable("unknown shader type");
   }
   if (!zs)
      return 0;
   switch (type) {
   case ZINK_DESCRIPTOR_TYPE_UBO:
      return zs->ubos_used;
   case ZINK_DESCRIPTOR_TYPE_SSBO:
      return zs->ssbos_used;
   case ZINK_DESCRIPTOR_TYPE_SAMPLER_VIEW:
      return BITSET_TEST_RANGE(zs->nir->info.textures_used, 0, PIPE_MAX_SAMPLERS - 1);
   case ZINK_DESCRIPTOR_TYPE_IMAGE:
      return zs->nir->info.images_used;
   default:
      unreachable("unknown descriptor type!");
   }
   return 0;
}

bool
zink_program_descriptor_is_buffer(struct zink_context *ctx, enum pipe_shader_type stage, enum zink_descriptor_type type, unsigned i)
{
   struct zink_shader *zs = NULL;
   switch (stage) {
   case PIPE_SHADER_VERTEX:
   case PIPE_SHADER_TESS_CTRL:
   case PIPE_SHADER_TESS_EVAL:
   case PIPE_SHADER_GEOMETRY:
   case PIPE_SHADER_FRAGMENT:
      zs = ctx->gfx_stages[stage];
      break;
   case PIPE_SHADER_COMPUTE: {
      zs = ctx->compute_stage;
      break;
   }
   default:
      unreachable("unknown shader type");
   }
   if (!zs)
      return false;
   return zink_shader_descriptor_is_buffer(zs, type, i);
}

static unsigned
get_num_bindings(struct zink_shader *zs, enum zink_descriptor_type type)
{
   switch (type) {
   case ZINK_DESCRIPTOR_TYPE_UBO:
   case ZINK_DESCRIPTOR_TYPE_SSBO:
      return zs->num_bindings[type];
   default:
      break;
   }
   unsigned num_bindings = 0;
   for (int i = 0; i < zs->num_bindings[type]; i++)
      num_bindings += zs->bindings[type][i].size;
   return num_bindings;
}

unsigned
zink_program_num_bindings_typed(const struct zink_program *pg, enum zink_descriptor_type type, bool is_compute)
{
   unsigned num_bindings = 0;
   if (is_compute) {
      struct zink_compute_program *comp = (void*)pg;
      return get_num_bindings(comp->shader, type);
   }
   struct zink_gfx_program *prog = (void*)pg;
   for (unsigned i = 0; i < ZINK_SHADER_COUNT; i++) {
      if (prog->shaders[i])
         num_bindings += get_num_bindings(prog->shaders[i], type);
   }
   return num_bindings;
}

unsigned
zink_program_num_bindings(const struct zink_program *pg, bool is_compute)
{
   unsigned num_bindings = 0;
   for (unsigned i = 0; i < ZINK_DESCRIPTOR_TYPES; i++)
      num_bindings += zink_program_num_bindings_typed(pg, i, is_compute);
   return num_bindings;
}

void
zink_destroy_gfx_program(struct zink_screen *screen,
                         struct zink_gfx_program *prog)
{
   if (prog->base.layout)
      VKSCR(DestroyPipelineLayout)(screen->dev, prog->base.layout, NULL);

   for (int i = 0; i < ZINK_SHADER_COUNT; ++i) {
      if (prog->shaders[i]) {
         _mesa_set_remove_key(prog->shaders[i]->programs, prog);
         prog->shaders[i] = NULL;
      }
      destroy_shader_cache(screen, &prog->shader_cache[i][0]);
      destroy_shader_cache(screen, &prog->shader_cache[i][1]);
      ralloc_free(prog->nir[i]);
   }

   unsigned max_idx = ARRAY_SIZE(prog->pipelines);
   if (screen->info.have_EXT_extended_dynamic_state) {
      /* only need first 3/4 for point/line/tri/patch */
      if ((prog->stages_present &
          (BITFIELD_BIT(PIPE_SHADER_TESS_EVAL) | BITFIELD_BIT(PIPE_SHADER_GEOMETRY))) ==
          BITFIELD_BIT(PIPE_SHADER_TESS_EVAL))
         max_idx = 4;
      else
         max_idx = 3;
      max_idx++;
   }

   for (int i = 0; i < max_idx; ++i) {
      hash_table_foreach(&prog->pipelines[i], entry) {
         struct gfx_pipeline_cache_entry *pc_entry = entry->data;

         VKSCR(DestroyPipeline)(screen->dev, pc_entry->pipeline, NULL);
         free(pc_entry);
      }
   }
   if (prog->base.pipeline_cache)
      VKSCR(DestroyPipelineCache)(screen->dev, prog->base.pipeline_cache, NULL);
   screen->descriptor_program_deinit(screen, &prog->base);

   ralloc_free(prog);
}

void
zink_destroy_compute_program(struct zink_screen *screen,
                         struct zink_compute_program *comp)
{
   if (comp->base.layout)
      VKSCR(DestroyPipelineLayout)(screen->dev, comp->base.layout, NULL);

   if (comp->shader)
      _mesa_set_remove_key(comp->shader->programs, comp);

   hash_table_foreach(comp->pipelines, entry) {
      struct compute_pipeline_cache_entry *pc_entry = entry->data;

      VKSCR(DestroyPipeline)(screen->dev, pc_entry->pipeline, NULL);
      free(pc_entry);
   }
   _mesa_hash_table_destroy(comp->pipelines, NULL);
   VKSCR(DestroyShaderModule)(screen->dev, comp->module->shader, NULL);
   free(comp->module);
   if (comp->base.pipeline_cache)
      VKSCR(DestroyPipelineCache)(screen->dev, comp->base.pipeline_cache, NULL);
   screen->descriptor_program_deinit(screen, &comp->base);

   ralloc_free(comp);
}

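/* with dynamic topology, pipelines are bucketed by topology class (point/line/tri/patch);
 * otherwise every VkPrimitiveTopology gets its own bucket
 */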
static unsigned
get_pipeline_idx(bool have_EXT_extended_dynamic_state, enum pipe_prim_type mode, VkPrimitiveTopology vkmode)
{
   /* VK_DYNAMIC_STATE_PRIMITIVE_TOPOLOGY_EXT specifies that the topology state in
    * VkPipelineInputAssemblyStateCreateInfo only specifies the topology class,
    * and the specific topology order and adjacency must be set dynamically
    * with vkCmdSetPrimitiveTopologyEXT before any drawing commands.
    */
   if (have_EXT_extended_dynamic_state) {
      if (mode == PIPE_PRIM_PATCHES)
         return 3;
      switch (u_reduced_prim(mode)) {
      case PIPE_PRIM_POINTS:
         return 0;
      case PIPE_PRIM_LINES:
         return 1;
      default:
         return 2;
      }
   }
   return vkmode;
}


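/* the cached pipeline lookup key is state->final_hash: the XOR of the base state hash, the
 * vertex state hash, and the shader variant hash; each piece is recomputed lazily and XORed
 * out/in only when its inputs change
 */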
VkPipeline
zink_get_gfx_pipeline(struct zink_context *ctx,
                      struct zink_gfx_program *prog,
                      struct zink_gfx_pipeline_state *state,
                      enum pipe_prim_type mode)
{
   struct zink_screen *screen = zink_screen(ctx->base.screen);
   const bool have_EXT_vertex_input_dynamic_state = screen->info.have_EXT_vertex_input_dynamic_state;
   const bool have_EXT_extended_dynamic_state = screen->info.have_EXT_extended_dynamic_state;

   VkPrimitiveTopology vkmode = zink_primitive_topology(mode);
   const unsigned idx = get_pipeline_idx(screen->info.have_EXT_extended_dynamic_state, mode, vkmode);
   assert(idx <= ARRAY_SIZE(prog->pipelines));
   if (!state->dirty && !state->modules_changed &&
       (have_EXT_vertex_input_dynamic_state || !ctx->vertex_state_changed) &&
       idx == state->idx)
      return state->pipeline;

   struct hash_entry *entry = NULL;

   if (state->dirty) {
      if (state->pipeline) //avoid on first hash
         state->final_hash ^= state->hash;
      state->hash = hash_gfx_pipeline_state(state);
      state->final_hash ^= state->hash;
      state->dirty = false;
   }
   if (!have_EXT_vertex_input_dynamic_state && ctx->vertex_state_changed) {
      if (state->pipeline)
         state->final_hash ^= state->vertex_hash;
      if (!have_EXT_extended_dynamic_state) {
         uint32_t hash = 0;
         /* if we don't have dynamic states, we have to hash the enabled vertex buffer bindings */
         uint32_t vertex_buffers_enabled_mask = state->vertex_buffers_enabled_mask;
         hash = XXH32(&vertex_buffers_enabled_mask, sizeof(uint32_t), hash);

         for (unsigned i = 0; i < state->element_state->num_bindings; i++) {
            struct pipe_vertex_buffer *vb = ctx->vertex_buffers + ctx->element_state->binding_map[i];
            state->vertex_strides[i] = vb->buffer.resource ? vb->stride : 0;
            hash = XXH32(&state->vertex_strides[i], sizeof(uint32_t), hash);
         }
         state->vertex_hash = hash ^ state->element_state->hash;
      } else
         state->vertex_hash = state->element_state->hash;
      state->final_hash ^= state->vertex_hash;
   }
   state->modules_changed = false;
   ctx->vertex_state_changed = false;

   entry = _mesa_hash_table_search_pre_hashed(&prog->pipelines[idx], state->final_hash, state);

   if (!entry) {
      util_queue_fence_wait(&prog->base.cache_fence);
      VkPipeline pipeline = zink_create_gfx_pipeline(screen, prog,
                                                     state, vkmode);
      if (pipeline == VK_NULL_HANDLE)
         return VK_NULL_HANDLE;

      zink_screen_update_pipeline_cache(screen, &prog->base);
      struct gfx_pipeline_cache_entry *pc_entry = CALLOC_STRUCT(gfx_pipeline_cache_entry);
      if (!pc_entry)
         return VK_NULL_HANDLE;

      memcpy(&pc_entry->state, state, sizeof(*state));
      pc_entry->pipeline = pipeline;

      entry = _mesa_hash_table_insert_pre_hashed(&prog->pipelines[idx], state->final_hash, pc_entry, pc_entry);
      assert(entry);
   }

   struct gfx_pipeline_cache_entry *cache_entry = entry->data;
   state->pipeline = cache_entry->pipeline;
   state->idx = idx;
   return state->pipeline;
}

VkPipeline
zink_get_compute_pipeline(struct zink_screen *screen,
                      struct zink_compute_program *comp,
                      struct zink_compute_pipeline_state *state)
{
   struct hash_entry *entry = NULL;

   if (!state->dirty)
      return state->pipeline;
   if (state->dirty) {
      state->hash = hash_compute_pipeline_state(state);
      state->dirty = false;
   }
   entry = _mesa_hash_table_search_pre_hashed(comp->pipelines, state->hash, state);

   if (!entry) {
      util_queue_fence_wait(&comp->base.cache_fence);
      VkPipeline pipeline = zink_create_compute_pipeline(screen, comp, state);

      if (pipeline == VK_NULL_HANDLE)
         return VK_NULL_HANDLE;

      struct compute_pipeline_cache_entry *pc_entry = CALLOC_STRUCT(compute_pipeline_cache_entry);
      if (!pc_entry)
         return VK_NULL_HANDLE;

      memcpy(&pc_entry->state, state, sizeof(*state));
      pc_entry->pipeline = pipeline;

      entry = _mesa_hash_table_insert_pre_hashed(comp->pipelines, state->hash, pc_entry, pc_entry);
      assert(entry);
   }

   struct compute_pipeline_cache_entry *cache_entry = entry->data;
   state->pipeline = cache_entry->pipeline;
   return state->pipeline;
}

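/* binding a compute shader creates or looks up its program immediately; binding a gfx shader
 * only updates the stage bits and gfx hash, and gfx program selection happens later at draw time
 */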
static inline void
bind_stage(struct zink_context *ctx, enum pipe_shader_type stage,
           struct zink_shader *shader)
{
   if (shader && shader->nir->info.num_inlinable_uniforms)
      ctx->shader_has_inlinable_uniforms_mask |= 1 << stage;
   else
      ctx->shader_has_inlinable_uniforms_mask &= ~(1 << stage);

   if (stage == PIPE_SHADER_COMPUTE) {
      if (shader && shader != ctx->compute_stage) {
         struct hash_entry *entry = _mesa_hash_table_search(&ctx->compute_program_cache, shader);
         if (entry) {
            ctx->compute_pipeline_state.dirty = true;
            ctx->curr_compute = entry->data;
         } else {
            struct zink_compute_program *comp = zink_create_compute_program(ctx, shader);
            _mesa_hash_table_insert(&ctx->compute_program_cache, comp->shader, comp);
            ctx->compute_pipeline_state.dirty = true;
            ctx->curr_compute = comp;
            zink_batch_reference_program(&ctx->batch, &ctx->curr_compute->base);
         }
      } else if (!shader)
         ctx->curr_compute = NULL;
      ctx->compute_stage = shader;
      zink_select_launch_grid(ctx);
   } else {
      if (ctx->gfx_stages[stage])
         ctx->gfx_hash ^= ctx->gfx_stages[stage]->hash;
      ctx->gfx_stages[stage] = shader;
      ctx->gfx_dirty = ctx->gfx_stages[PIPE_SHADER_FRAGMENT] && ctx->gfx_stages[PIPE_SHADER_VERTEX];
      ctx->gfx_pipeline_state.modules_changed = true;
      if (shader) {
         ctx->shader_stages |= BITFIELD_BIT(stage);
         ctx->gfx_hash ^= ctx->gfx_stages[stage]->hash;
      } else {
         ctx->gfx_pipeline_state.modules[stage] = VK_NULL_HANDLE;
         if (ctx->curr_program)
            ctx->gfx_pipeline_state.final_hash ^= ctx->curr_program->last_variant_hash;
         ctx->curr_program = NULL;
         ctx->shader_stages &= ~BITFIELD_BIT(stage);
      }
   }
}

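/* the last vertex-processing stage is GS if present, else TES, else VS; when it changes,
 * the previous stage's vs_base key is reset and last_vertex_stage_dirty forces a key update
 */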
static void
bind_last_vertex_stage(struct zink_context *ctx)
{
   enum pipe_shader_type old = ctx->last_vertex_stage ? pipe_shader_type_from_mesa(ctx->last_vertex_stage->nir->info.stage) : PIPE_SHADER_TYPES;
   if (ctx->gfx_stages[PIPE_SHADER_GEOMETRY])
      ctx->last_vertex_stage = ctx->gfx_stages[PIPE_SHADER_GEOMETRY];
   else if (ctx->gfx_stages[PIPE_SHADER_TESS_EVAL])
      ctx->last_vertex_stage = ctx->gfx_stages[PIPE_SHADER_TESS_EVAL];
   else
      ctx->last_vertex_stage = ctx->gfx_stages[PIPE_SHADER_VERTEX];
   enum pipe_shader_type current = ctx->last_vertex_stage ? pipe_shader_type_from_mesa(ctx->last_vertex_stage->nir->info.stage) : PIPE_SHADER_VERTEX;
   if (old != current) {
      if (old != PIPE_SHADER_TYPES) {
         memset(&ctx->gfx_pipeline_state.shader_keys.key[old].key.vs_base, 0, sizeof(struct zink_vs_key_base));
         ctx->dirty_shader_stages |= BITFIELD_BIT(old);
      } else {
         /* always unset vertex shader values when changing to a non-vs last stage */
         memset(&ctx->gfx_pipeline_state.shader_keys.key[PIPE_SHADER_VERTEX].key.vs_base, 0, sizeof(struct zink_vs_key_base));
      }
      ctx->last_vertex_stage_dirty = true;
   }
}

static void
zink_bind_vs_state(struct pipe_context *pctx,
                   void *cso)
{
   struct zink_context *ctx = zink_context(pctx);
   if (!cso && !ctx->gfx_stages[PIPE_SHADER_VERTEX])
      return;
   void *prev = ctx->gfx_stages[PIPE_SHADER_VERTEX];
   bind_stage(ctx, PIPE_SHADER_VERTEX, cso);
   if (cso) {
      struct zink_shader *zs = cso;
      ctx->shader_reads_drawid = BITSET_TEST(zs->nir->info.system_values_read, SYSTEM_VALUE_DRAW_ID);
      ctx->shader_reads_basevertex = BITSET_TEST(zs->nir->info.system_values_read, SYSTEM_VALUE_BASE_VERTEX);
   } else {
      ctx->shader_reads_drawid = false;
      ctx->shader_reads_basevertex = false;
   }
   if (ctx->last_vertex_stage == prev)
      ctx->last_vertex_stage = cso;

}

/* if gl_SampleMask[] is written to, we have to ensure that we get a shader with the same sample count:
 * in GL, samples==1 means ignore gl_SampleMask[]
 * in VK, gl_SampleMask[] is never ignored
 */
void
zink_update_fs_key_samples(struct zink_context *ctx)
{
   if (!ctx->gfx_stages[PIPE_SHADER_FRAGMENT])
      return;
   nir_shader *nir = ctx->gfx_stages[PIPE_SHADER_FRAGMENT]->nir;
   if (nir->info.outputs_written & (1 << FRAG_RESULT_SAMPLE_MASK)) {
      bool samples = zink_get_fs_key(ctx)->samples;
      if (samples != (ctx->fb_state.samples > 1))
         zink_set_fs_key(ctx)->samples = ctx->fb_state.samples > 1;
   }
}

static void
zink_bind_fs_state(struct pipe_context *pctx,
                   void *cso)
{
   struct zink_context *ctx = zink_context(pctx);
   if (!cso && !ctx->gfx_stages[PIPE_SHADER_FRAGMENT])
      return;
   bind_stage(ctx, PIPE_SHADER_FRAGMENT, cso);
   ctx->fbfetch_outputs = 0;
   if (cso) {
      nir_shader *nir = ctx->gfx_stages[PIPE_SHADER_FRAGMENT]->nir;
      if (nir->info.fs.uses_fbfetch_output) {
         nir_foreach_shader_out_variable(var, ctx->gfx_stages[PIPE_SHADER_FRAGMENT]->nir) {
            if (var->data.fb_fetch_output)
               ctx->fbfetch_outputs |= BITFIELD_BIT(var->data.location - FRAG_RESULT_DATA0);
         }
      }
      zink_update_fs_key_samples(ctx);
   }
   zink_update_fbfetch(ctx);
}

static void
zink_bind_gs_state(struct pipe_context *pctx,
                   void *cso)
{
   struct zink_context *ctx = zink_context(pctx);
   if (!cso && !ctx->gfx_stages[PIPE_SHADER_GEOMETRY])
      return;
   bool had_points = ctx->gfx_stages[PIPE_SHADER_GEOMETRY] ? ctx->gfx_stages[PIPE_SHADER_GEOMETRY]->nir->info.gs.output_primitive == GL_POINTS : false;
   bind_stage(ctx, PIPE_SHADER_GEOMETRY, cso);
   bind_last_vertex_stage(ctx);
   if (cso) {
      if (!had_points && ctx->last_vertex_stage->nir->info.gs.output_primitive == GL_POINTS)
         ctx->gfx_pipeline_state.has_points++;
   } else {
      if (had_points)
         ctx->gfx_pipeline_state.has_points--;
   }
}

static void
zink_bind_tcs_state(struct pipe_context *pctx,
                   void *cso)
{
   bind_stage(zink_context(pctx), PIPE_SHADER_TESS_CTRL, cso);
}

static void
zink_bind_tes_state(struct pipe_context *pctx,
                   void *cso)
{
   struct zink_context *ctx = zink_context(pctx);
   if (!cso && !ctx->gfx_stages[PIPE_SHADER_TESS_EVAL])
      return;
   if (!!ctx->gfx_stages[PIPE_SHADER_TESS_EVAL] != !!cso) {
      if (!cso) {
         /* if unsetting a TESS that uses a generated TCS, ensure the TCS is unset */
         if (ctx->gfx_stages[PIPE_SHADER_TESS_EVAL]->generated)
            ctx->gfx_stages[PIPE_SHADER_TESS_CTRL] = NULL;
      }
   }
   bind_stage(ctx, PIPE_SHADER_TESS_EVAL, cso);
   bind_last_vertex_stage(ctx);
}

static void *
zink_create_cs_state(struct pipe_context *pctx,
                     const struct pipe_compute_state *shader)
{
   struct nir_shader *nir;
   if (shader->ir_type != PIPE_SHADER_IR_NIR)
      nir = zink_tgsi_to_nir(pctx->screen, shader->prog);
   else
      nir = (struct nir_shader *)shader->prog;

   return zink_shader_create(zink_screen(pctx->screen), nir, NULL);
}

static void
zink_bind_cs_state(struct pipe_context *pctx,
                   void *cso)
{
   bind_stage(zink_context(pctx), PIPE_SHADER_COMPUTE, cso);
}

void
zink_delete_shader_state(struct pipe_context *pctx, void *cso)
{
   zink_shader_free(zink_context(pctx), cso);
}

void *
zink_create_gfx_shader_state(struct pipe_context *pctx, const struct pipe_shader_state *shader)
{
   nir_shader *nir;
   if (shader->type != PIPE_SHADER_IR_NIR)
      nir = zink_tgsi_to_nir(pctx->screen, shader->tokens);
   else
      nir = (struct nir_shader *)shader->ir.nir;

   return zink_shader_create(zink_screen(pctx->screen), nir, &shader->stream_output);
}

static void
zink_delete_cached_shader_state(struct pipe_context *pctx, void *cso)
{
   struct zink_screen *screen = zink_screen(pctx->screen);
   util_shader_reference(pctx, &screen->shaders, &cso, NULL);
}

static void *
zink_create_cached_shader_state(struct pipe_context *pctx, const struct pipe_shader_state *shader)
{
   bool cache_hit;
   struct zink_screen *screen = zink_screen(pctx->screen);
   return util_live_shader_cache_get(pctx, &screen->shaders, shader, &cache_hit);
}

void
zink_program_init(struct zink_context *ctx)
{
   ctx->base.create_vs_state = zink_create_cached_shader_state;
   ctx->base.bind_vs_state = zink_bind_vs_state;
   ctx->base.delete_vs_state = zink_delete_cached_shader_state;

   ctx->base.create_fs_state = zink_create_cached_shader_state;
   ctx->base.bind_fs_state = zink_bind_fs_state;
   ctx->base.delete_fs_state = zink_delete_cached_shader_state;

   ctx->base.create_gs_state = zink_create_cached_shader_state;
   ctx->base.bind_gs_state = zink_bind_gs_state;
   ctx->base.delete_gs_state = zink_delete_cached_shader_state;

   ctx->base.create_tcs_state = zink_create_cached_shader_state;
   ctx->base.bind_tcs_state = zink_bind_tcs_state;
   ctx->base.delete_tcs_state = zink_delete_cached_shader_state;

   ctx->base.create_tes_state = zink_create_cached_shader_state;
   ctx->base.bind_tes_state = zink_bind_tes_state;
   ctx->base.delete_tes_state = zink_delete_cached_shader_state;

   ctx->base.create_compute_state = zink_create_cs_state;
   ctx->base.bind_compute_state = zink_bind_cs_state;
   ctx->base.delete_compute_state = zink_delete_shader_state;
}