1/*
2 * Copyright © 2012 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 */
23
24#include "ir.h"
25#include "linker.h"
26#include "ir_uniform.h"
27#include "link_uniform_block_active_visitor.h"
28#include "util/hash_table.h"
29#include "program.h"
30#include "main/errors.h"
31#include "main/mtypes.h"
32
33namespace {
34
35class ubo_visitor : public program_resource_visitor {
36public:
37   ubo_visitor(void *mem_ctx, gl_uniform_buffer_variable *variables,
38               unsigned num_variables, struct gl_shader_program *prog,
39               bool use_std430_as_default)
40      : index(0), offset(0), buffer_size(0), variables(variables),
41        num_variables(num_variables), mem_ctx(mem_ctx),
42        is_array_instance(false), prog(prog),
43        use_std430_as_default(use_std430_as_default)
44   {
45      /* empty */
46   }
47
48   void process(const glsl_type *type, const char *name)
49   {
50      this->offset = 0;
51      this->buffer_size = 0;
52      this->is_array_instance = strchr(name, ']') != NULL;
53      this->program_resource_visitor::process(type, name,
54                                              use_std430_as_default);
55   }
56
57   unsigned index;
58   unsigned offset;
59   unsigned buffer_size;
60   gl_uniform_buffer_variable *variables;
61   unsigned num_variables;
62   void *mem_ctx;
63   bool is_array_instance;
64   struct gl_shader_program *prog;
65
66private:
67   virtual void enter_record(const glsl_type *type, const char *,
68                             bool row_major,
69                             const enum glsl_interface_packing packing)
70   {
71      assert(type->is_struct());
72      if (packing == GLSL_INTERFACE_PACKING_STD430)
73         this->offset = glsl_align(
74            this->offset, type->std430_base_alignment(row_major));
75      else
76         this->offset = glsl_align(
77            this->offset, type->std140_base_alignment(row_major));
78   }
79
80   virtual void leave_record(const glsl_type *type, const char *,
81                             bool row_major,
82                             const enum glsl_interface_packing packing)
83   {
84      assert(type->is_struct());
85
86      /* If this is the last field of a structure, apply rule #9.  The
87       * ARB_uniform_buffer_object spec says:
88       *
89       *    The structure may have padding at the end; the base offset of the
90       *    member following the sub-structure is rounded up to the next
91       *    multiple of the base alignment of the structure.
92       */
93      if (packing == GLSL_INTERFACE_PACKING_STD430)
94         this->offset = glsl_align(
95            this->offset, type->std430_base_alignment(row_major));
96      else
97         this->offset = glsl_align(
98            this->offset, type->std140_base_alignment(row_major));
99   }
100
101   virtual void set_buffer_offset(unsigned offset)
102   {
103      this->offset = offset;
104   }
105
106   virtual void visit_field(const glsl_type *type, const char *name,
107                            bool row_major, const glsl_type *,
108                            const enum glsl_interface_packing packing,
109                            bool last_field)
110   {
111      assert(this->index < this->num_variables);
112
113      gl_uniform_buffer_variable *v = &this->variables[this->index++];
114
115      v->Name = ralloc_strdup(mem_ctx, name);
116      v->Type = type;
117      v->RowMajor = type->without_array()->is_matrix() && row_major;
118
119      if (this->is_array_instance) {
120         v->IndexName = ralloc_strdup(mem_ctx, name);
121
122         char *open_bracket = strchr(v->IndexName, '[');
123         assert(open_bracket != NULL);
124
125         char *close_bracket = strchr(open_bracket, '.') - 1;
126         assert(close_bracket != NULL);
127
128         /* Length of the tail without the ']' but with the NUL.
129          */
130         unsigned len = strlen(close_bracket + 1) + 1;
131
132         memmove(open_bracket, close_bracket + 1, len);
133      } else {
134         v->IndexName = v->Name;
135      }
136
137      unsigned alignment = 0;
138      unsigned size = 0;
139
140      /* The ARB_program_interface_query spec says:
141       *
142       *    If the final member of an active shader storage block is array
143       *    with no declared size, the minimum buffer size is computed
144       *    assuming the array was declared as an array with one element.
145       *
146       * For that reason, we use the base type of the unsized array to
147       * calculate its size. We don't need to check if the unsized array is
148       * the last member of a shader storage block (that check was already
149       * done by the parser).
150       */
151      const glsl_type *type_for_size = type;
152      if (type->is_unsized_array()) {
153         if (!last_field) {
154            linker_error(prog, "unsized array `%s' definition: "
155                         "only last member of a shader storage block "
156                         "can be defined as unsized array",
157                         name);
158         }
159
160         type_for_size = type->without_array();
161      }
162
163      if (packing == GLSL_INTERFACE_PACKING_STD430) {
164         alignment = type->std430_base_alignment(v->RowMajor);
165         size = type_for_size->std430_size(v->RowMajor);
166      } else {
167         alignment = type->std140_base_alignment(v->RowMajor);
168         size = type_for_size->std140_size(v->RowMajor);
169      }
170
171      this->offset = glsl_align(this->offset, alignment);
172      v->Offset = this->offset;
173
174      this->offset += size;
175
176      /* The ARB_uniform_buffer_object spec says:
177       *
178       *    For uniform blocks laid out according to [std140] rules, the
179       *    minimum buffer object size returned by the UNIFORM_BLOCK_DATA_SIZE
180       *    query is derived by taking the offset of the last basic machine
181       *    unit consumed by the last uniform of the uniform block (including
182       *    any end-of-array or end-of-structure padding), adding one, and
183       *    rounding up to the next multiple of the base alignment required
184       *    for a vec4.
185       */
186      this->buffer_size = glsl_align(this->offset, 16);
187   }
188
189   bool use_std430_as_default;
190};
191
192class count_block_size : public program_resource_visitor {
193public:
194   count_block_size() : num_active_uniforms(0)
195   {
196      /* empty */
197   }
198
199   unsigned num_active_uniforms;
200
201private:
202   virtual void visit_field(const glsl_type * /* type */,
203                            const char * /* name */,
204                            bool /* row_major */,
205                            const glsl_type * /* record_type */,
206                            const enum glsl_interface_packing,
207                            bool /* last_field */)
208   {
209      this->num_active_uniforms++;
210   }
211};
212
213} /* anonymous namespace */
214
215struct block {
216   const glsl_type *type;
217   bool has_instance_name;
218};
219
220static void process_block_array_leaf(const char *name, gl_uniform_block *blocks,
221                                     ubo_visitor *parcel,
222                                     gl_uniform_buffer_variable *variables,
223                                     const struct link_uniform_block_active *const b,
224                                     unsigned *block_index,
225                                     unsigned binding_offset,
226                                     unsigned linearized_index,
227                                     struct gl_context *ctx,
228                                     struct gl_shader_program *prog);
229
230/**
231 *
232 * \param first_index Value of \c block_index for the first element of the
233 *                    array.
234 */
235static void
236process_block_array(struct uniform_block_array_elements *ub_array, char **name,
237                    size_t name_length, gl_uniform_block *blocks,
238                    ubo_visitor *parcel, gl_uniform_buffer_variable *variables,
239                    const struct link_uniform_block_active *const b,
240                    unsigned *block_index, unsigned binding_offset,
241                    struct gl_context *ctx, struct gl_shader_program *prog,
242                    unsigned first_index)
243{
244   for (unsigned j = 0; j < ub_array->num_array_elements; j++) {
245      size_t new_length = name_length;
246
247      unsigned int element_idx = ub_array->array_elements[j];
248      /* Append the subscript to the current variable name */
249      ralloc_asprintf_rewrite_tail(name, &new_length, "[%u]", element_idx);
250
251      if (ub_array->array) {
252         unsigned binding_stride = binding_offset + (element_idx *
253                                   ub_array->array->aoa_size);
254         process_block_array(ub_array->array, name, new_length, blocks,
255                             parcel, variables, b, block_index,
256                             binding_stride, ctx, prog, first_index);
257      } else {
258         process_block_array_leaf(*name, blocks,
259                                  parcel, variables, b, block_index,
260                                  binding_offset + element_idx,
261                                  *block_index - first_index, ctx, prog);
262      }
263   }
264}
265
266static void
267process_block_array_leaf(const char *name,
268                         gl_uniform_block *blocks,
269                         ubo_visitor *parcel, gl_uniform_buffer_variable *variables,
270                         const struct link_uniform_block_active *const b,
271                         unsigned *block_index, unsigned binding_offset,
272                         unsigned linearized_index,
273                         struct gl_context *ctx, struct gl_shader_program *prog)
274{
275   unsigned i = *block_index;
276   const glsl_type *type =  b->type->without_array();
277
278   blocks[i].Name = ralloc_strdup(blocks, name);
279   blocks[i].Uniforms = &variables[(*parcel).index];
280
281   /* The ARB_shading_language_420pack spec says:
282    *
283    *    If the binding identifier is used with a uniform block instanced as
284    *    an array then the first element of the array takes the specified
285    *    block binding and each subsequent element takes the next consecutive
286    *    uniform block binding point.
287    */
288   blocks[i].Binding = (b->has_binding) ? b->binding + binding_offset : 0;
289
290   blocks[i].UniformBufferSize = 0;
291   blocks[i]._Packing = glsl_interface_packing(type->interface_packing);
292   blocks[i]._RowMajor = type->get_interface_row_major();
293   blocks[i].linearized_array_index = linearized_index;
294
295   parcel->process(type, b->has_instance_name ? blocks[i].Name : "");
296
297   blocks[i].UniformBufferSize = parcel->buffer_size;
298
299   /* Check SSBO size is lower than maximum supported size for SSBO */
300   if (b->is_shader_storage &&
301       parcel->buffer_size > ctx->Const.MaxShaderStorageBlockSize) {
302      linker_error(prog, "shader storage block `%s' has size %d, "
303                   "which is larger than the maximum allowed (%d)",
304                   b->type->name,
305                   parcel->buffer_size,
306                   ctx->Const.MaxShaderStorageBlockSize);
307   }
308   blocks[i].NumUniforms =
309      (unsigned)(ptrdiff_t)(&variables[parcel->index] - blocks[i].Uniforms);
310
311   *block_index = *block_index + 1;
312}
313
314/* This function resizes the array types of the block so that later we can use
315 * this new size to correctly calculate the offest for indirect indexing.
316 */
317static const glsl_type *
318resize_block_array(const glsl_type *type,
319                   struct uniform_block_array_elements *ub_array)
320{
321   if (type->is_array()) {
322      struct uniform_block_array_elements *child_array =
323         type->fields.array->is_array() ? ub_array->array : NULL;
324      const glsl_type *new_child_type =
325         resize_block_array(type->fields.array, child_array);
326
327      const glsl_type *new_type =
328         glsl_type::get_array_instance(new_child_type,
329                                       ub_array->num_array_elements);
330      ub_array->ir->array->type = new_type;
331      return new_type;
332   } else {
333      return type;
334   }
335}
336
337static void
338create_buffer_blocks(void *mem_ctx, struct gl_context *ctx,
339                     struct gl_shader_program *prog,
340                     struct gl_uniform_block **out_blks, unsigned num_blocks,
341                     struct hash_table *block_hash, unsigned num_variables,
342                     bool create_ubo_blocks)
343{
344   if (num_blocks == 0) {
345      assert(num_variables == 0);
346      return;
347   }
348
349   assert(num_variables != 0);
350
351   /* Allocate storage to hold all of the information related to uniform
352    * blocks that can be queried through the API.
353    */
354   struct gl_uniform_block *blocks =
355      rzalloc_array(mem_ctx, gl_uniform_block, num_blocks);
356   gl_uniform_buffer_variable *variables =
357      ralloc_array(blocks, gl_uniform_buffer_variable, num_variables);
358
359   /* Add each variable from each uniform block to the API tracking
360    * structures.
361    */
362   ubo_visitor parcel(blocks, variables, num_variables, prog,
363                      ctx->Const.UseSTD430AsDefaultPacking);
364
365   unsigned i = 0;
366   hash_table_foreach (block_hash, entry) {
367      const struct link_uniform_block_active *const b =
368         (const struct link_uniform_block_active *) entry->data;
369      const glsl_type *block_type = b->type;
370
371      if ((create_ubo_blocks && !b->is_shader_storage) ||
372          (!create_ubo_blocks && b->is_shader_storage)) {
373
374         if (b->array != NULL) {
375            char *name = ralloc_strdup(NULL,
376                                       block_type->without_array()->name);
377            size_t name_length = strlen(name);
378
379            assert(b->has_instance_name);
380            process_block_array(b->array, &name, name_length, blocks, &parcel,
381                                variables, b, &i, 0, ctx, prog,
382                                i);
383            ralloc_free(name);
384         } else {
385            process_block_array_leaf(block_type->name, blocks, &parcel,
386                                     variables, b, &i, 0,
387                                     0, ctx, prog);
388         }
389      }
390   }
391
392   *out_blks = blocks;
393
394   assert(parcel.index == num_variables);
395}
396
397void
398link_uniform_blocks(void *mem_ctx,
399                    struct gl_context *ctx,
400                    struct gl_shader_program *prog,
401                    struct gl_linked_shader *shader,
402                    struct gl_uniform_block **ubo_blocks,
403                    unsigned *num_ubo_blocks,
404                    struct gl_uniform_block **ssbo_blocks,
405                    unsigned *num_ssbo_blocks)
406{
407   /* This hash table will track all of the uniform blocks that have been
408    * encountered.  Since blocks with the same block-name must be the same,
409    * the hash is organized by block-name.
410    */
411   struct hash_table *block_hash =
412      _mesa_hash_table_create(mem_ctx, _mesa_hash_string,
413                              _mesa_key_string_equal);
414
415   if (block_hash == NULL) {
416      _mesa_error_no_memory(__func__);
417      linker_error(prog, "out of memory\n");
418      return;
419   }
420
421   /* Determine which uniform blocks are active. */
422   link_uniform_block_active_visitor v(mem_ctx, block_hash, prog);
423   visit_list_elements(&v, shader->ir);
424
425   /* Count the number of active uniform blocks.  Count the total number of
426    * active slots in those uniform blocks.
427    */
428   unsigned num_ubo_variables = 0;
429   unsigned num_ssbo_variables = 0;
430   count_block_size block_size;
431
432   hash_table_foreach (block_hash, entry) {
433      struct link_uniform_block_active *const b =
434         (struct link_uniform_block_active *) entry->data;
435
436      assert((b->array != NULL) == b->type->is_array());
437
438      if (b->array != NULL &&
439          (b->type->without_array()->interface_packing ==
440           GLSL_INTERFACE_PACKING_PACKED)) {
441         b->type = resize_block_array(b->type, b->array);
442         b->var->type = b->type;
443         b->var->data.max_array_access = b->type->length - 1;
444      }
445
446      block_size.num_active_uniforms = 0;
447      block_size.process(b->type->without_array(), "",
448                         ctx->Const.UseSTD430AsDefaultPacking);
449
450      if (b->array != NULL) {
451         unsigned aoa_size = b->type->arrays_of_arrays_size();
452         if (b->is_shader_storage) {
453            *num_ssbo_blocks += aoa_size;
454            num_ssbo_variables += aoa_size * block_size.num_active_uniforms;
455         } else {
456            *num_ubo_blocks += aoa_size;
457            num_ubo_variables += aoa_size * block_size.num_active_uniforms;
458         }
459      } else {
460         if (b->is_shader_storage) {
461            (*num_ssbo_blocks)++;
462            num_ssbo_variables += block_size.num_active_uniforms;
463         } else {
464            (*num_ubo_blocks)++;
465            num_ubo_variables += block_size.num_active_uniforms;
466         }
467      }
468
469   }
470
471   create_buffer_blocks(mem_ctx, ctx, prog, ubo_blocks, *num_ubo_blocks,
472                        block_hash, num_ubo_variables, true);
473   create_buffer_blocks(mem_ctx, ctx, prog, ssbo_blocks, *num_ssbo_blocks,
474                        block_hash, num_ssbo_variables, false);
475
476   _mesa_hash_table_destroy(block_hash, NULL);
477}
478
479static bool
480link_uniform_blocks_are_compatible(const gl_uniform_block *a,
481                                   const gl_uniform_block *b)
482{
483   assert(strcmp(a->Name, b->Name) == 0);
484
485   /* Page 35 (page 42 of the PDF) in section 4.3.7 of the GLSL 1.50 spec says:
486    *
487    *    Matched block names within an interface (as defined above) must match
488    *    in terms of having the same number of declarations with the same
489    *    sequence of types and the same sequence of member names, as well as
490    *    having the same member-wise layout qualification....if a matching
491    *    block is declared as an array, then the array sizes must also
492    *    match... Any mismatch will generate a link error.
493    *
494    * Arrays are not yet supported, so there is no check for that.
495    */
496   if (a->NumUniforms != b->NumUniforms)
497      return false;
498
499   if (a->_Packing != b->_Packing)
500      return false;
501
502   if (a->_RowMajor != b->_RowMajor)
503      return false;
504
505   if (a->Binding != b->Binding)
506      return false;
507
508   for (unsigned i = 0; i < a->NumUniforms; i++) {
509      if (strcmp(a->Uniforms[i].Name, b->Uniforms[i].Name) != 0)
510         return false;
511
512      if (a->Uniforms[i].Type != b->Uniforms[i].Type)
513         return false;
514
515      if (a->Uniforms[i].RowMajor != b->Uniforms[i].RowMajor)
516         return false;
517   }
518
519   return true;
520}
521
522/**
523 * Merges a uniform block into an array of uniform blocks that may or
524 * may not already contain a copy of it.
525 *
526 * Returns the index of the new block in the array.
527 */
528int
529link_cross_validate_uniform_block(void *mem_ctx,
530                                  struct gl_uniform_block **linked_blocks,
531                                  unsigned int *num_linked_blocks,
532                                  struct gl_uniform_block *new_block)
533{
534   for (unsigned int i = 0; i < *num_linked_blocks; i++) {
535      struct gl_uniform_block *old_block = &(*linked_blocks)[i];
536
537      if (strcmp(old_block->Name, new_block->Name) == 0)
538         return link_uniform_blocks_are_compatible(old_block, new_block)
539            ? i : -1;
540   }
541
542   *linked_blocks = reralloc(mem_ctx, *linked_blocks,
543                             struct gl_uniform_block,
544                             *num_linked_blocks + 1);
545   int linked_block_index = (*num_linked_blocks)++;
546   struct gl_uniform_block *linked_block = &(*linked_blocks)[linked_block_index];
547
548   memcpy(linked_block, new_block, sizeof(*new_block));
549   linked_block->Uniforms = ralloc_array(*linked_blocks,
550                                         struct gl_uniform_buffer_variable,
551                                         linked_block->NumUniforms);
552
553   memcpy(linked_block->Uniforms,
554          new_block->Uniforms,
555          sizeof(*linked_block->Uniforms) * linked_block->NumUniforms);
556
557   linked_block->Name = ralloc_strdup(*linked_blocks, linked_block->Name);
558
559   for (unsigned int i = 0; i < linked_block->NumUniforms; i++) {
560      struct gl_uniform_buffer_variable *ubo_var =
561         &linked_block->Uniforms[i];
562
563      if (ubo_var->Name == ubo_var->IndexName) {
564         ubo_var->Name = ralloc_strdup(*linked_blocks, ubo_var->Name);
565         ubo_var->IndexName = ubo_var->Name;
566      } else {
567         ubo_var->Name = ralloc_strdup(*linked_blocks, ubo_var->Name);
568         ubo_var->IndexName = ralloc_strdup(*linked_blocks, ubo_var->IndexName);
569      }
570   }
571
572   return linked_block_index;
573}
574