1/*
2 * Copyright (c) 2017-2019 Lima Project
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
13 * of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 *
23 */
24
25#include "util/u_memory.h"
26#include "util/ralloc.h"
27#include "util/u_debug.h"
28
29#include "tgsi/tgsi_dump.h"
30#include "compiler/nir/nir.h"
31#include "compiler/nir/nir_serialize.h"
32#include "nir/tgsi_to_nir.h"
33
34#include "pipe/p_state.h"
35
36#include "lima_screen.h"
37#include "lima_context.h"
38#include "lima_job.h"
39#include "lima_program.h"
40#include "lima_bo.h"
41#include "lima_disk_cache.h"
42
43#include "ir/lima_ir.h"
44
45static const nir_shader_compiler_options vs_nir_options = {
46   .lower_ffma16 = true,
47   .lower_ffma32 = true,
48   .lower_ffma64 = true,
49   .lower_fpow = true,
50   .lower_ffract = true,
51   .lower_fdiv = true,
52   .lower_fmod = true,
53   .lower_fsqrt = true,
54   .lower_flrp32 = true,
55   .lower_flrp64 = true,
56   /* could be implemented by clamp */
57   .lower_fsat = true,
58   .lower_bitops = true,
59   .lower_rotate = true,
60   .lower_sincos = true,
61   .lower_fceil = true,
62   .lower_insert_byte = true,
63   .lower_insert_word = true,
64   .force_indirect_unrolling = (nir_var_shader_in | nir_var_shader_out | nir_var_function_temp),
65};
66
67static const nir_shader_compiler_options fs_nir_options = {
68   .lower_ffma16 = true,
69   .lower_ffma32 = true,
70   .lower_ffma64 = true,
71   .lower_fpow = true,
72   .lower_fdiv = true,
73   .lower_fmod = true,
74   .lower_flrp32 = true,
75   .lower_flrp64 = true,
76   .lower_fsign = true,
77   .lower_rotate = true,
78   .lower_fdot = true,
79   .lower_fdph = true,
80   .lower_insert_byte = true,
81   .lower_insert_word = true,
82   .lower_bitops = true,
83   .lower_vector_cmp = true,
84   .force_indirect_unrolling = (nir_var_shader_in | nir_var_shader_out | nir_var_function_temp),
85};
86
87const void *
88lima_program_get_compiler_options(enum pipe_shader_type shader)
89{
90   switch (shader) {
91   case PIPE_SHADER_VERTEX:
92      return &vs_nir_options;
93   case PIPE_SHADER_FRAGMENT:
94      return &fs_nir_options;
95   default:
96      return NULL;
97   }
98}
99
/* Size callback handed to nir_lower_io: reports the attribute-slot count
 * of a GLSL type.  The bindless argument is part of the callback signature
 * but is not consulted here.
 */
static int
type_size(const struct glsl_type *type, bool bindless)
{
   (void)bindless;

   int slots = glsl_count_attribute_slots(type, false);
   return slots;
}
105
106void
107lima_program_optimize_vs_nir(struct nir_shader *s)
108{
109   bool progress;
110
111   NIR_PASS_V(s, nir_lower_viewport_transform);
112   NIR_PASS_V(s, nir_lower_point_size, 1.0f, 100.0f);
113   NIR_PASS_V(s, nir_lower_io,
114	      nir_var_shader_in | nir_var_shader_out, type_size, 0);
115   NIR_PASS_V(s, nir_lower_load_const_to_scalar);
116   NIR_PASS_V(s, lima_nir_lower_uniform_to_scalar);
117   NIR_PASS_V(s, nir_lower_io_to_scalar,
118              nir_var_shader_in|nir_var_shader_out);
119
120   do {
121      progress = false;
122
123      NIR_PASS_V(s, nir_lower_vars_to_ssa);
124      NIR_PASS(progress, s, nir_lower_alu_to_scalar, NULL, NULL);
125      NIR_PASS(progress, s, nir_lower_phis_to_scalar, false);
126      NIR_PASS(progress, s, nir_copy_prop);
127      NIR_PASS(progress, s, nir_opt_remove_phis);
128      NIR_PASS(progress, s, nir_opt_dce);
129      NIR_PASS(progress, s, nir_opt_dead_cf);
130      NIR_PASS(progress, s, nir_opt_cse);
131      NIR_PASS(progress, s, nir_opt_peephole_select, 8, true, true);
132      NIR_PASS(progress, s, nir_opt_algebraic);
133      NIR_PASS(progress, s, lima_nir_lower_ftrunc);
134      NIR_PASS(progress, s, nir_opt_constant_folding);
135      NIR_PASS(progress, s, nir_opt_undef);
136      NIR_PASS(progress, s, nir_opt_loop_unroll);
137   } while (progress);
138
139   NIR_PASS_V(s, nir_lower_int_to_float);
140   /* int_to_float pass generates ftrunc, so lower it */
141   NIR_PASS(progress, s, lima_nir_lower_ftrunc);
142   NIR_PASS_V(s, nir_lower_bool_to_float);
143
144   NIR_PASS_V(s, nir_copy_prop);
145   NIR_PASS_V(s, nir_opt_dce);
146   NIR_PASS_V(s, lima_nir_split_loads);
147   NIR_PASS_V(s, nir_lower_locals_to_regs);
148   NIR_PASS_V(s, nir_convert_from_ssa, true);
149   NIR_PASS_V(s, nir_remove_dead_variables, nir_var_function_temp, NULL);
150   nir_sweep(s);
151}
152
153static bool
154lima_alu_to_scalar_filter_cb(const nir_instr *instr, const void *data)
155{
156   if (instr->type != nir_instr_type_alu)
157      return false;
158
159   nir_alu_instr *alu = nir_instr_as_alu(instr);
160   switch (alu->op) {
161   case nir_op_frcp:
162   case nir_op_frsq:
163   case nir_op_flog2:
164   case nir_op_fexp2:
165   case nir_op_fsqrt:
166   case nir_op_fsin:
167   case nir_op_fcos:
168      return true;
169   default:
170      break;
171   }
172
173   /* nir vec4 fcsel assumes that each component of the condition will be
174    * used to select the same component from the two options, but Utgard PP
175    * has only 1 component condition. If all condition components are not the
176    * same we need to lower it to scalar.
177    */
178   switch (alu->op) {
179   case nir_op_bcsel:
180   case nir_op_fcsel:
181      break;
182   default:
183      return false;
184   }
185
186   int num_components = nir_dest_num_components(alu->dest.dest);
187
188   uint8_t swizzle = alu->src[0].swizzle[0];
189
190   for (int i = 1; i < num_components; i++)
191      if (alu->src[0].swizzle[i] != swizzle)
192         return true;
193
194   return false;
195}
196
197static bool
198lima_vec_to_movs_filter_cb(const nir_instr *instr, unsigned writemask,
199                           const void *data)
200{
201   assert(writemask > 0);
202   if (util_bitcount(writemask) == 1)
203      return true;
204
205   return !lima_alu_to_scalar_filter_cb(instr, data);
206}
207
208void
209lima_program_optimize_fs_nir(struct nir_shader *s,
210                             struct nir_lower_tex_options *tex_options)
211{
212   bool progress;
213
214   NIR_PASS_V(s, nir_lower_fragcoord_wtrans);
215   NIR_PASS_V(s, nir_lower_io,
216	      nir_var_shader_in | nir_var_shader_out, type_size, 0);
217   NIR_PASS_V(s, nir_lower_regs_to_ssa);
218   NIR_PASS_V(s, nir_lower_tex, tex_options);
219
220   do {
221      progress = false;
222      NIR_PASS(progress, s, nir_opt_vectorize, NULL, NULL);
223   } while (progress);
224
225   do {
226      progress = false;
227
228      NIR_PASS_V(s, nir_lower_vars_to_ssa);
229      NIR_PASS(progress, s, nir_lower_alu_to_scalar, lima_alu_to_scalar_filter_cb, NULL);
230      NIR_PASS(progress, s, nir_copy_prop);
231      NIR_PASS(progress, s, nir_opt_remove_phis);
232      NIR_PASS(progress, s, nir_opt_dce);
233      NIR_PASS(progress, s, nir_opt_dead_cf);
234      NIR_PASS(progress, s, nir_opt_cse);
235      NIR_PASS(progress, s, nir_opt_peephole_select, 8, true, true);
236      NIR_PASS(progress, s, nir_opt_algebraic);
237      NIR_PASS(progress, s, nir_opt_constant_folding);
238      NIR_PASS(progress, s, nir_opt_undef);
239      NIR_PASS(progress, s, nir_opt_loop_unroll);
240      NIR_PASS(progress, s, lima_nir_split_load_input);
241   } while (progress);
242
243   NIR_PASS_V(s, nir_lower_int_to_float);
244   NIR_PASS_V(s, nir_lower_bool_to_float);
245
246   /* Some ops must be lowered after being converted from int ops,
247    * so re-run nir_opt_algebraic after int lowering. */
248   do {
249      progress = false;
250      NIR_PASS(progress, s, nir_opt_algebraic);
251   } while (progress);
252
253   /* Must be run after optimization loop */
254   NIR_PASS_V(s, lima_nir_scale_trig);
255
256   /* Lower modifiers */
257   NIR_PASS_V(s, nir_lower_to_source_mods, nir_lower_all_source_mods);
258   NIR_PASS_V(s, nir_copy_prop);
259   NIR_PASS_V(s, nir_opt_dce);
260
261   NIR_PASS_V(s, nir_lower_locals_to_regs);
262   NIR_PASS_V(s, nir_convert_from_ssa, true);
263   NIR_PASS_V(s, nir_remove_dead_variables, nir_var_function_temp, NULL);
264
265   NIR_PASS_V(s, nir_move_vec_src_uses_to_dest);
266   NIR_PASS_V(s, nir_lower_vec_to_movs, lima_vec_to_movs_filter_cb, NULL);
267   NIR_PASS_V(s, nir_opt_dce); /* clean up any new dead code from vec to movs */
268
269   NIR_PASS_V(s, lima_nir_duplicate_load_uniforms);
270   NIR_PASS_V(s, lima_nir_duplicate_load_inputs);
271   NIR_PASS_V(s, lima_nir_duplicate_load_consts);
272
273   nir_sweep(s);
274}
275
276static bool
277lima_fs_compile_shader(struct lima_context *ctx,
278                       struct lima_fs_key *key,
279                       struct lima_fs_uncompiled_shader *ufs,
280                       struct lima_fs_compiled_shader *fs)
281{
282   struct lima_screen *screen = lima_screen(ctx->base.screen);
283   nir_shader *nir = nir_shader_clone(fs, ufs->base.ir.nir);
284
285   struct nir_lower_tex_options tex_options = {
286      .lower_txp = ~0u,
287      .swizzle_result = ~0u,
288   };
289
290   for (int i = 0; i < ARRAY_SIZE(key->tex); i++) {
291      for (int j = 0; j < 4; j++)
292         tex_options.swizzles[i][j] = key->tex[i].swizzle[j];
293   }
294
295   lima_program_optimize_fs_nir(nir, &tex_options);
296
297   if (lima_debug & LIMA_DEBUG_PP)
298      nir_print_shader(nir, stdout);
299
300   if (!ppir_compile_nir(fs, nir, screen->pp_ra, &ctx->debug)) {
301      ralloc_free(nir);
302      return false;
303   }
304
305   fs->state.uses_discard = nir->info.fs.uses_discard;
306   ralloc_free(nir);
307
308   return true;
309}
310
311static bool
312lima_fs_upload_shader(struct lima_context *ctx,
313                      struct lima_fs_compiled_shader *fs)
314{
315   struct lima_screen *screen = lima_screen(ctx->base.screen);
316
317   fs->bo = lima_bo_create(screen, fs->state.shader_size, 0);
318   if (!fs->bo) {
319      fprintf(stderr, "lima: create fs shader bo fail\n");
320      return false;
321   }
322
323   memcpy(lima_bo_map(fs->bo), fs->shader, fs->state.shader_size);
324
325   return true;
326}
327
328static struct lima_fs_compiled_shader *
329lima_get_compiled_fs(struct lima_context *ctx,
330                     struct lima_fs_uncompiled_shader *ufs,
331                     struct lima_fs_key *key)
332{
333   struct lima_screen *screen = lima_screen(ctx->base.screen);
334   struct hash_table *ht;
335   uint32_t key_size;
336
337   ht = ctx->fs_cache;
338   key_size = sizeof(struct lima_fs_key);
339
340   struct hash_entry *entry = _mesa_hash_table_search(ht, key);
341   if (entry)
342      return entry->data;
343
344   /* Not on memory cache, try disk cache */
345   struct lima_fs_compiled_shader *fs =
346      lima_fs_disk_cache_retrieve(screen->disk_cache, key);
347
348   if (!fs) {
349      /* Not on disk cache, compile and insert into disk cache*/
350      fs = rzalloc(NULL, struct lima_fs_compiled_shader);
351      if (!fs)
352         return NULL;
353
354      if (!lima_fs_compile_shader(ctx, key, ufs, fs))
355         goto err;
356
357      lima_fs_disk_cache_store(screen->disk_cache, key, fs);
358   }
359
360   if (!lima_fs_upload_shader(ctx, fs))
361      goto err;
362
363   ralloc_free(fs->shader);
364   fs->shader = NULL;
365
366   /* Insert into memory cache */
367   struct lima_key *dup_key;
368   dup_key = rzalloc_size(fs, key_size);
369   memcpy(dup_key, key, key_size);
370   _mesa_hash_table_insert(ht, dup_key, fs);
371
372   return fs;
373
374err:
375   ralloc_free(fs);
376   return NULL;
377}
378
379static void *
380lima_create_fs_state(struct pipe_context *pctx,
381                     const struct pipe_shader_state *cso)
382{
383   struct lima_context *ctx = lima_context(pctx);
384   struct lima_fs_uncompiled_shader *so = rzalloc(NULL, struct lima_fs_uncompiled_shader);
385
386   if (!so)
387      return NULL;
388
389   nir_shader *nir;
390   if (cso->type == PIPE_SHADER_IR_NIR)
391      /* The backend takes ownership of the NIR shader on state
392       * creation. */
393      nir = cso->ir.nir;
394   else {
395      assert(cso->type == PIPE_SHADER_IR_TGSI);
396
397      nir = tgsi_to_nir(cso->tokens, pctx->screen, false);
398   }
399
400   so->base.type = PIPE_SHADER_IR_NIR;
401   so->base.ir.nir = nir;
402
403   /* Serialize the NIR to a binary blob that we can hash for the disk
404    * cache.  Drop unnecessary information (like variable names)
405    * so the serialized NIR is smaller, and also to let us detect more
406    * isomorphic shaders when hashing, increasing cache hits.
407    */
408   struct blob blob;
409   blob_init(&blob);
410   nir_serialize(&blob, nir, true);
411   _mesa_sha1_compute(blob.data, blob.size, so->nir_sha1);
412   blob_finish(&blob);
413
414   if (lima_debug & LIMA_DEBUG_PRECOMPILE) {
415      /* Trigger initial compilation with default settings */
416      struct lima_fs_key key;
417      memset(&key, 0, sizeof(key));
418      memcpy(key.nir_sha1, so->nir_sha1, sizeof(so->nir_sha1));
419      for (int i = 0; i < ARRAY_SIZE(key.tex); i++) {
420         for (int j = 0; j < 4; j++)
421            key.tex[i].swizzle[j] = j;
422      }
423      lima_get_compiled_fs(ctx, so, &key);
424   }
425
426   return so;
427}
428
429static void
430lima_bind_fs_state(struct pipe_context *pctx, void *hwcso)
431{
432   struct lima_context *ctx = lima_context(pctx);
433
434   ctx->uncomp_fs = hwcso;
435   ctx->dirty |= LIMA_CONTEXT_DIRTY_UNCOMPILED_FS;
436}
437
438static void
439lima_delete_fs_state(struct pipe_context *pctx, void *hwcso)
440{
441   struct lima_context *ctx = lima_context(pctx);
442   struct lima_fs_uncompiled_shader *so = hwcso;
443
444   hash_table_foreach(ctx->fs_cache, entry) {
445      const struct lima_fs_key *key = entry->key;
446      if (!memcmp(key->nir_sha1, so->nir_sha1, sizeof(so->nir_sha1))) {
447         struct lima_fs_compiled_shader *fs = entry->data;
448         _mesa_hash_table_remove(ctx->fs_cache, entry);
449         if (fs->bo)
450            lima_bo_unreference(fs->bo);
451
452         if (fs == ctx->fs)
453            ctx->fs = NULL;
454
455         ralloc_free(fs);
456      }
457   }
458
459   ralloc_free(so->base.ir.nir);
460   ralloc_free(so);
461}
462
463static bool
464lima_vs_compile_shader(struct lima_context *ctx,
465                       struct lima_vs_key *key,
466                       struct lima_vs_uncompiled_shader *uvs,
467                       struct lima_vs_compiled_shader *vs)
468{
469   nir_shader *nir = nir_shader_clone(vs, uvs->base.ir.nir);
470
471   lima_program_optimize_vs_nir(nir);
472
473   if (lima_debug & LIMA_DEBUG_GP)
474      nir_print_shader(nir, stdout);
475
476   if (!gpir_compile_nir(vs, nir, &ctx->debug)) {
477      ralloc_free(nir);
478      return false;
479   }
480
481   ralloc_free(nir);
482
483   return true;
484}
485
486static bool
487lima_vs_upload_shader(struct lima_context *ctx,
488                      struct lima_vs_compiled_shader *vs)
489{
490   struct lima_screen *screen = lima_screen(ctx->base.screen);
491   vs->bo = lima_bo_create(screen, vs->state.shader_size, 0);
492   if (!vs->bo) {
493      fprintf(stderr, "lima: create vs shader bo fail\n");
494      return false;
495   }
496
497   memcpy(lima_bo_map(vs->bo), vs->shader, vs->state.shader_size);
498
499   return true;
500}
501
502static struct lima_vs_compiled_shader *
503lima_get_compiled_vs(struct lima_context *ctx,
504                     struct lima_vs_uncompiled_shader *uvs,
505                     struct lima_vs_key *key)
506{
507   struct lima_screen *screen = lima_screen(ctx->base.screen);
508   struct hash_table *ht;
509   uint32_t key_size;
510
511   ht = ctx->vs_cache;
512   key_size = sizeof(struct lima_vs_key);
513
514   struct hash_entry *entry = _mesa_hash_table_search(ht, key);
515   if (entry)
516      return entry->data;
517
518   /* Not on memory cache, try disk cache */
519   struct lima_vs_compiled_shader *vs =
520      lima_vs_disk_cache_retrieve(screen->disk_cache, key);
521
522   if (!vs) {
523      /* Not on disk cache, compile and insert into disk cache */
524      vs = rzalloc(NULL, struct lima_vs_compiled_shader);
525      if (!vs)
526         return NULL;
527      if (!lima_vs_compile_shader(ctx, key, uvs, vs))
528         goto err;
529
530      lima_vs_disk_cache_store(screen->disk_cache, key, vs);
531   }
532
533   if (!lima_vs_upload_shader(ctx, vs))
534      goto err;
535
536   ralloc_free(vs->shader);
537   vs->shader = NULL;
538
539   struct lima_key *dup_key;
540   dup_key = rzalloc_size(vs, key_size);
541   memcpy(dup_key, key, key_size);
542   _mesa_hash_table_insert(ht, dup_key, vs);
543
544   return vs;
545
546err:
547   ralloc_free(vs);
548   return NULL;
549}
550
551bool
552lima_update_vs_state(struct lima_context *ctx)
553{
554   if (!(ctx->dirty & LIMA_CONTEXT_DIRTY_UNCOMPILED_VS)) {
555      return true;
556   }
557
558   struct lima_vs_key local_key;
559   struct lima_vs_key *key = &local_key;
560   memset(key, 0, sizeof(*key));
561   memcpy(key->nir_sha1, ctx->uncomp_vs->nir_sha1,
562          sizeof(ctx->uncomp_vs->nir_sha1));
563
564   struct lima_vs_compiled_shader *old_vs = ctx->vs;
565   struct lima_vs_compiled_shader *vs = lima_get_compiled_vs(ctx,
566                                                             ctx->uncomp_vs,
567                                                             key);
568   if (!vs)
569      return false;
570
571   ctx->vs = vs;
572
573   if (ctx->vs != old_vs)
574      ctx->dirty |= LIMA_CONTEXT_DIRTY_COMPILED_VS;
575
576   return true;
577}
578
579bool
580lima_update_fs_state(struct lima_context *ctx)
581{
582   if (!(ctx->dirty & (LIMA_CONTEXT_DIRTY_UNCOMPILED_FS |
583                       LIMA_CONTEXT_DIRTY_TEXTURES))) {
584      return true;
585   }
586
587   struct lima_texture_stateobj *lima_tex = &ctx->tex_stateobj;
588   struct lima_fs_key local_key;
589   struct lima_fs_key *key = &local_key;
590   memset(key, 0, sizeof(*key));
591   memcpy(key->nir_sha1, ctx->uncomp_fs->nir_sha1,
592          sizeof(ctx->uncomp_fs->nir_sha1));
593
594   for (int i = 0; i < lima_tex->num_textures; i++) {
595      struct lima_sampler_view *sampler = lima_sampler_view(lima_tex->textures[i]);
596      for (int j = 0; j < 4; j++)
597         key->tex[i].swizzle[j] = sampler->swizzle[j];
598   }
599
600   /* Fill rest with identity swizzle */
601   uint8_t identity[4] = { PIPE_SWIZZLE_X, PIPE_SWIZZLE_Y,
602                           PIPE_SWIZZLE_Z, PIPE_SWIZZLE_W };
603   for (int i = lima_tex->num_textures; i < ARRAY_SIZE(key->tex); i++)
604      memcpy(key->tex[i].swizzle, identity, 4);
605
606   struct lima_fs_compiled_shader *old_fs = ctx->fs;
607
608   struct lima_fs_compiled_shader *fs = lima_get_compiled_fs(ctx,
609                                                             ctx->uncomp_fs,
610                                                             key);
611   if (!fs)
612      return false;
613
614   ctx->fs = fs;
615
616   if (ctx->fs != old_fs)
617      ctx->dirty |= LIMA_CONTEXT_DIRTY_COMPILED_FS;
618
619   return true;
620}
621
622static void *
623lima_create_vs_state(struct pipe_context *pctx,
624                     const struct pipe_shader_state *cso)
625{
626   struct lima_context *ctx = lima_context(pctx);
627   struct lima_vs_uncompiled_shader *so = rzalloc(NULL, struct lima_vs_uncompiled_shader);
628
629   if (!so)
630      return NULL;
631
632   nir_shader *nir;
633   if (cso->type == PIPE_SHADER_IR_NIR)
634      /* The backend takes ownership of the NIR shader on state
635       * creation. */
636      nir = cso->ir.nir;
637   else {
638      assert(cso->type == PIPE_SHADER_IR_TGSI);
639
640      nir = tgsi_to_nir(cso->tokens, pctx->screen, false);
641   }
642
643   so->base.type = PIPE_SHADER_IR_NIR;
644   so->base.ir.nir = nir;
645
646   /* Serialize the NIR to a binary blob that we can hash for the disk
647    * cache.  Drop unnecessary information (like variable names)
648    * so the serialized NIR is smaller, and also to let us detect more
649    * isomorphic shaders when hashing, increasing cache hits.
650    */
651   struct blob blob;
652   blob_init(&blob);
653   nir_serialize(&blob, nir, true);
654   _mesa_sha1_compute(blob.data, blob.size, so->nir_sha1);
655   blob_finish(&blob);
656
657   if (lima_debug & LIMA_DEBUG_PRECOMPILE) {
658      /* Trigger initial compilation with default settings */
659      struct lima_vs_key key;
660      memset(&key, 0, sizeof(key));
661      memcpy(key.nir_sha1, so->nir_sha1, sizeof(so->nir_sha1));
662      lima_get_compiled_vs(ctx, so, &key);
663   }
664
665   return so;
666}
667
668static void
669lima_bind_vs_state(struct pipe_context *pctx, void *hwcso)
670{
671   struct lima_context *ctx = lima_context(pctx);
672
673   ctx->uncomp_vs = hwcso;
674   ctx->dirty |= LIMA_CONTEXT_DIRTY_UNCOMPILED_VS;
675}
676
677static void
678lima_delete_vs_state(struct pipe_context *pctx, void *hwcso)
679{
680   struct lima_context *ctx = lima_context(pctx);
681   struct lima_vs_uncompiled_shader *so = hwcso;
682
683   hash_table_foreach(ctx->vs_cache, entry) {
684      const struct lima_vs_key *key = entry->key;
685      if (!memcmp(key->nir_sha1, so->nir_sha1, sizeof(so->nir_sha1))) {
686         struct lima_vs_compiled_shader *vs = entry->data;
687         _mesa_hash_table_remove(ctx->vs_cache, entry);
688         if (vs->bo)
689            lima_bo_unreference(vs->bo);
690
691         if (vs == ctx->vs)
692            ctx->vs = NULL;
693
694         ralloc_free(vs);
695      }
696   }
697
698   ralloc_free(so->base.ir.nir);
699   ralloc_free(so);
700}
701
702static uint32_t
703lima_fs_cache_hash(const void *key)
704{
705   return _mesa_hash_data(key, sizeof(struct lima_fs_key));
706}
707
708static uint32_t
709lima_vs_cache_hash(const void *key)
710{
711   return _mesa_hash_data(key, sizeof(struct lima_vs_key));
712}
713
714static bool
715lima_fs_cache_compare(const void *key1, const void *key2)
716{
717   return memcmp(key1, key2, sizeof(struct lima_fs_key)) == 0;
718}
719
720static bool
721lima_vs_cache_compare(const void *key1, const void *key2)
722{
723   return memcmp(key1, key2, sizeof(struct lima_vs_key)) == 0;
724}
725
726void
727lima_program_init(struct lima_context *ctx)
728{
729   ctx->base.create_fs_state = lima_create_fs_state;
730   ctx->base.bind_fs_state = lima_bind_fs_state;
731   ctx->base.delete_fs_state = lima_delete_fs_state;
732
733   ctx->base.create_vs_state = lima_create_vs_state;
734   ctx->base.bind_vs_state = lima_bind_vs_state;
735   ctx->base.delete_vs_state = lima_delete_vs_state;
736
737   ctx->fs_cache = _mesa_hash_table_create(ctx, lima_fs_cache_hash,
738                                           lima_fs_cache_compare);
739   ctx->vs_cache = _mesa_hash_table_create(ctx, lima_vs_cache_hash,
740                                           lima_vs_cache_compare);
741}
742
743void
744lima_program_fini(struct lima_context *ctx)
745{
746   hash_table_foreach(ctx->vs_cache, entry) {
747      struct lima_vs_compiled_shader *vs = entry->data;
748      if (vs->bo)
749         lima_bo_unreference(vs->bo);
750      ralloc_free(vs);
751      _mesa_hash_table_remove(ctx->vs_cache, entry);
752   }
753
754   hash_table_foreach(ctx->fs_cache, entry) {
755      struct lima_fs_compiled_shader *fs = entry->data;
756      if (fs->bo)
757         lima_bo_unreference(fs->bo);
758      ralloc_free(fs);
759      _mesa_hash_table_remove(ctx->fs_cache, entry);
760   }
761}
762