compiler/glsl/ir_expression_operation.py

01e04c3fSmrg#
01e04c3fSmrg# Copyright (C) 2015 Intel Corporation
01e04c3fSmrg#
01e04c3fSmrg# Permission is hereby granted, free of charge, to any person obtaining a
01e04c3fSmrg# copy of this software and associated documentation files (the "Software"),
01e04c3fSmrg# to deal in the Software without restriction, including without limitation
01e04c3fSmrg# the rights to use, copy, modify, merge, publish, distribute, sublicense,
01e04c3fSmrg# and/or sell copies of the Software, and to permit persons to whom the
01e04c3fSmrg# Software is furnished to do so, subject to the following conditions:
01e04c3fSmrg#
01e04c3fSmrg# The above copyright notice and this permission notice (including the next
01e04c3fSmrg# paragraph) shall be included in all copies or substantial portions of the
01e04c3fSmrg# Software.
01e04c3fSmrg#
01e04c3fSmrg# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
01e04c3fSmrg# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
01e04c3fSmrg# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
01e04c3fSmrg# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
01e04c3fSmrg# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
01e04c3fSmrg# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
01e04c3fSmrg# IN THE SOFTWARE.
01e04c3fSmrg
01e04c3fSmrgimport mako.template
01e04c3fSmrgimport sys
01e04c3fSmrg
class type(object):
   """Description of one base type handled by the constant-expression
   generator.

   The class keeps the name ``type`` (shadowing the builtin within this
   module) because the module-level type constants are constructed through
   that name.
   """

   def __init__(self, c_type, union_field, glsl_type):
      """Record the three spellings of a type.

      c_type      -- C spelling of the type, e.g. "float".
      union_field -- field name emitted after "data." / "value." in the
                     generated C, e.g. "f".
      glsl_type   -- name emitted as the "case" label in the generated C,
                     e.g. "GLSL_TYPE_FLOAT".
      """
      self.c_type = c_type
      self.union_field = union_field
      self.glsl_type = glsl_type

   def __repr__(self):
      # Purely a debugging aid; nothing in the generator depends on it.
      return "type({0!r}, {1!r}, {2!r})".format(self.c_type,
                                                self.union_field,
                                                self.glsl_type)
01e04c3fSmrg
01e04c3fSmrg
class type_signature_iter(object):
   """Basic iterator for a set of type signatures.  A sequence of source types
   comes in, and one ``(dest_type, operand_types)`` pair per source type comes
   out, where ``operand_types`` is a tuple holding the source type repeated
   ``num_operands`` times.

   The object is its own iterator, so it can be consumed only once.
   """

   def __init__(self, dest_type, source_types, num_operands):
      """Initialize an iterator from a result type, a sequence of input types
      and a number of operands.

      dest_type    -- result type used for every signature, or None when the
                      result type of each signature is the same as its input
                      type.
      source_types -- sequence of input types; every operand of a signature
                      has the same type.
      num_operands -- number of operands in each signature.

      Python has no constructor overloading, so the "result type equals
      input type" case is selected by passing None as dest_type rather than
      by a separate two-argument __init__.
      """
      self.dest_type = dest_type
      self.source_types = source_types
      self.num_operands = num_operands
      self.i = 0

   def __iter__(self):
      return self

   def __next__(self):
      if self.i >= len(self.source_types):
         raise StopIteration()

      src_type = self.source_types[self.i]
      self.i += 1

      # Without an explicit result type, the result matches the operands.
      dest_type = src_type if self.dest_type is None else self.dest_type

      return (dest_type, self.num_operands * (src_type,))

   # Python 2 spelling of the iterator protocol.
   next = __next__
01e04c3fSmrg
01e04c3fSmrg
# One descriptor per base type: (C type, union field, GLSL_TYPE_* name).
uint_type = type("unsigned", "u", "GLSL_TYPE_UINT")
int_type = type("int", "i", "GLSL_TYPE_INT")
uint64_type = type("uint64_t", "u64", "GLSL_TYPE_UINT64")
int64_type = type("int64_t", "i64", "GLSL_TYPE_INT64")
float_type = type("float", "f", "GLSL_TYPE_FLOAT")
double_type = type("double", "d", "GLSL_TYPE_DOUBLE")
bool_type = type("bool", "b", "GLSL_TYPE_BOOL")

# Groups of descriptors used as the source_types of operations.
all_types = (uint_type, int_type, float_type, double_type, uint64_type, int64_type, bool_type)
numeric_types = (uint_type, int_type, float_type, double_type, uint64_type, int64_type)
signed_numeric_types = (int_type, float_type, double_type, int64_type)
integer_types = (uint_type, int_type, uint64_type, int64_type)
real_types = (float_type, double_type)
01e04c3fSmrg
# This template is for operations that can have operands of several
# different types, where each type may or may not have a different C
# expression.  This is used by most operations.
#
# It is rendered with "op" bound to an operation object and emits one
# "case" per signature, keyed on the base type of the first operand.
constant_template_common = mako.template.Template("""\
   case ${op.get_enum_name()}:
      for (unsigned c = 0; c < op[0]->type->components(); c++) {
         switch (op[0]->type->base_type) {
    % for dst_type, src_types in op.signatures():
         case ${src_types[0].glsl_type}:
            data.${dst_type.union_field}[c] = ${op.get_c_expression(src_types)};
            break;
    % endfor
         default:
            unreachable("invalid type");
         }
      }
      break;""")
01e04c3fSmrg
# This template is for binary operations that can operate on some combination
# of scalar and vector operands.
#
# Operations carrying the "mixed" flag get an assertion that each operand's
# base type is one of the operation's source types; all others get an
# assertion that the operand types match or one of them is a scalar.
constant_template_vector_scalar = mako.template.Template("""\
   case ${op.get_enum_name()}:
    % if "mixed" in op.flags:
        % for i in range(op.num_operands):
      assert(op[${i}]->type->base_type == ${op.source_types[0].glsl_type} ||
            % for src_type in op.source_types[1:-1]:
             op[${i}]->type->base_type == ${src_type.glsl_type} ||
            % endfor
             op[${i}]->type->base_type == ${op.source_types[-1].glsl_type});
        % endfor
    % else:
      assert(op[0]->type == op[1]->type || op0_scalar || op1_scalar);
    % endif
      for (unsigned c = 0, c0 = 0, c1 = 0;
           c < components;
           c0 += c0_inc, c1 += c1_inc, c++) {

         switch (op[0]->type->base_type) {
    % for dst_type, src_types in op.signatures():
         case ${src_types[0].glsl_type}:
            data.${dst_type.union_field}[c] = ${op.get_c_expression(src_types, ("c0", "c1", "c2"))};
            break;
    % endfor
         default:
            unreachable("invalid type");
         }
      }
      break;""")
01e04c3fSmrg
# This template is for multiplication.  It is unique because it has to support
# matrix * vector and matrix * matrix operations, and those are just different.
#
# The first branch handles component-wise multiplication (equal non-matrix
# types, or a scalar operand); the second branch accumulates a matrix product
# into data.d or data.f depending on whether the first operand is double.
constant_template_mul = mako.template.Template("""\
   case ${op.get_enum_name()}:
      /* Check for equal types, or unequal types involving scalars */
      if ((op[0]->type == op[1]->type && !op[0]->type->is_matrix())
          || op0_scalar || op1_scalar) {
         for (unsigned c = 0, c0 = 0, c1 = 0;
              c < components;
              c0 += c0_inc, c1 += c1_inc, c++) {

            switch (op[0]->type->base_type) {
    % for dst_type, src_types in op.signatures():
            case ${src_types[0].glsl_type}:
               data.${dst_type.union_field}[c] = ${op.get_c_expression(src_types, ("c0", "c1", "c2"))};
               break;
    % endfor
            default:
               unreachable("invalid type");
            }
         }
      } else {
         assert(op[0]->type->is_matrix() || op[1]->type->is_matrix());

         /* Multiply an N-by-M matrix with an M-by-P matrix.  Since either
          * matrix can be a GLSL vector, either N or P can be 1.
          *
          * For vec*mat, the vector is treated as a row vector.  This
          * means the vector is a 1-row x M-column matrix.
          *
          * For mat*vec, the vector is treated as a column vector.  Since
          * matrix_columns is 1 for vectors, this just works.
          */
         const unsigned n = op[0]->type->is_vector()
            ? 1 : op[0]->type->vector_elements;
         const unsigned m = op[1]->type->vector_elements;
         const unsigned p = op[1]->type->matrix_columns;
         for (unsigned j = 0; j < p; j++) {
            for (unsigned i = 0; i < n; i++) {
               for (unsigned k = 0; k < m; k++) {
                  if (op[0]->type->is_double())
                     data.d[i+n*j] += op[0]->value.d[i+n*k]*op[1]->value.d[k+m*j];
                  else
                     data.f[i+n*j] += op[0]->value.f[i+n*k]*op[1]->value.f[k+m*j];
               }
            }
         }
      }
      break;""")
01e04c3fSmrg
# This template is for operations that are horizontal and either have only a
# single type or the implementation for all types is identical.  That is, the
# operation consumes a vector and produces a scalar.
#
# The operation's 'default' C expression is emitted verbatim and assigned to
# component 0 of the destination type's union field.
constant_template_horizontal_single_implementation = mako.template.Template("""\
   case ${op.get_enum_name()}:
      data.${op.dest_type.union_field}[0] = ${op.c_expression['default']};
      break;""")
01e04c3fSmrg
# This template is for operations that are horizontal and do not assign the
# result.  The various unpack operations are examples.
#
# The operation's 'default' C expression is emitted verbatim as a statement;
# it is expected to store its own results.
constant_template_horizontal_nonassignment = mako.template.Template("""\
   case ${op.get_enum_name()}:
      ${op.c_expression['default']};
      break;""")
01e04c3fSmrg
# This template is for binary operations that are horizontal.  That is, the
# operation consumes a vector and produces a scalar.
#
# One "case" is emitted per signature, and the result is stored in component
# 0 of the destination type's union field.
constant_template_horizontal = mako.template.Template("""\
   case ${op.get_enum_name()}:
      switch (op[0]->type->base_type) {
    % for dst_type, src_types in op.signatures():
      case ${src_types[0].glsl_type}:
         data.${dst_type.union_field}[0] = ${op.get_c_expression(src_types)};
         break;
    % endfor
      default:
         unreachable("invalid type");
      }
      break;""")
01e04c3fSmrg
# This template is for ir_binop_vector_extract.
#
# The generated C clamps the index taken from the second operand to the
# valid component range of the first operand before reading from it.
constant_template_vector_extract = mako.template.Template("""\
   case ${op.get_enum_name()}: {
      const int c = CLAMP(op[1]->value.i[0], 0,
                          (int) op[0]->type->vector_elements - 1);

      switch (op[0]->type->base_type) {
    % for dst_type, src_types in op.signatures():
      case ${src_types[0].glsl_type}:
         data.${dst_type.union_field}[0] = op[0]->value.${src_types[0].union_field}[c];
         break;
    % endfor
      default:
         unreachable("invalid type");
      }
      break;
   }""")
01e04c3fSmrg
# This template is for ir_triop_vector_insert.
#
# The generated C copies the first operand into the result and then
# overwrites the component selected by the third operand with the scalar
# from the second operand.
constant_template_vector_insert = mako.template.Template("""\
   case ${op.get_enum_name()}: {
      const unsigned idx = op[2]->value.u[0];

      memcpy(&data, &op[0]->value, sizeof(data));

      switch (return_type->base_type) {
    % for dst_type, src_types in op.signatures():
      case ${src_types[0].glsl_type}:
         data.${dst_type.union_field}[idx] = op[1]->value.${src_types[0].union_field}[0];
         break;
    % endfor
      default:
         unreachable("invalid type");
      }
      break;
   }""")
01e04c3fSmrg
# This template is for ir_quadop_vector.
#
# The generated C builds the result by taking component 0 of operand "c" for
# each component "c" of the return type.
constant_template_vector = mako.template.Template("""\
   case ${op.get_enum_name()}:
      for (unsigned c = 0; c < return_type->vector_elements; c++) {
         switch (return_type->base_type) {
    % for dst_type, src_types in op.signatures():
         case ${src_types[0].glsl_type}:
            data.${dst_type.union_field}[c] = op[c]->value.${src_types[0].union_field}[0];
            break;
    % endfor
         default:
            unreachable("invalid type");
         }
      }
      break;""")
01e04c3fSmrg
# This template is for ir_triop_lrp.
#
# The third operand may be a scalar, so it gets its own component counter
# (c2) that only advances when that operand is not a scalar.
constant_template_lrp = mako.template.Template("""\
   case ${op.get_enum_name()}: {
      assert(op[0]->type->is_float() || op[0]->type->is_double());
      assert(op[1]->type->is_float() || op[1]->type->is_double());
      assert(op[2]->type->is_float() || op[2]->type->is_double());

      unsigned c2_inc = op[2]->type->is_scalar() ? 0 : 1;
      for (unsigned c = 0, c2 = 0; c < components; c2 += c2_inc, c++) {
         switch (return_type->base_type) {
    % for dst_type, src_types in op.signatures():
         case ${src_types[0].glsl_type}:
            data.${dst_type.union_field}[c] = ${op.get_c_expression(src_types, ("c", "c", "c2"))};
            break;
    % endfor
         default:
            unreachable("invalid type");
         }
      }
      break;
   }""")
01e04c3fSmrg
# This template is for ir_triop_csel.  This expression is really unique
# because not all of the operands are the same type, and the second operand
# determines the type of the expression (instead of the first).
#
# For that reason the "case" labels are taken from src_types[1] rather than
# src_types[0].
constant_template_csel = mako.template.Template("""\
   case ${op.get_enum_name()}:
      for (unsigned c = 0; c < components; c++) {
         switch (return_type->base_type) {
    % for dst_type, src_types in op.signatures():
         case ${src_types[1].glsl_type}:
            data.${dst_type.union_field}[c] = ${op.get_c_expression(src_types)};
            break;
    % endfor
         default:
            unreachable("invalid type");
         }
      }
      break;""")
01e04c3fSmrg
01e04c3fSmrg
# Flag strings accepted in the "flags" argument of an operation.  They
# influence which constant-expression template is chosen for the operation.
vector_scalar_operation = "vector-scalar"
horizontal_operation = "horizontal"
types_identical_operation = "identical"
non_assign_operation = "nonassign"
mixed_type_operation = "mixed"
01e04c3fSmrg
class operation(object):
   """One expression operation and everything needed to generate the C code
   that evaluates it on constant operands.
   """

   def __init__(self, name, num_operands, printable_name = None, source_types = None, dest_type = None, c_expression = None, flags = None, all_signatures = None):
      """Describe an operation.

      name           -- suffix of the enum name (see get_enum_name).
      num_operands   -- number of operands, 1 through 4.
      printable_name -- display name; defaults to name.
      source_types   -- sequence of operand types; defaults to an empty tuple.
      dest_type      -- result type, or None when the result type matches
                        the operand type.
      c_expression   -- None, a single format string, or a dictionary of
                        format strings keyed by union field name with an
                        optional 'default' entry.  A single string is stored
                        as {'default': string}.
      flags          -- None, a single flag string, or an iterable of flag
                        strings; always stored as a frozenset.
      all_signatures -- explicit signature sequence that, when given, is
                        returned by signatures() as-is.
      """
      self.name = name
      self.num_operands = num_operands
      self.printable_name = name if printable_name is None else printable_name
      self.all_signatures = all_signatures
      self.source_types = tuple() if source_types is None else source_types
      self.dest_type = dest_type

      if isinstance(c_expression, str):
         self.c_expression = {'default': c_expression}
      else:
         # Either None (no constant expression) or already a dictionary.
         self.c_expression = c_expression

      if flags is None:
         self.flags = frozenset()
      elif isinstance(flags, str):
         # A bare string must not be split into its characters.
         self.flags = frozenset([flags])
      else:
         self.flags = frozenset(flags)


   def get_enum_name(self):
      """Return the enum name, e.g. "ir_binop_add" for a two-operand "add".

      Raises IndexError when num_operands is outside 1..4.
      """
      prefixes = ("un", "bin", "tri", "quad")

      # Without this check an operand count of 0 (or a negative count) would
      # wrap around through negative indexing and silently yield a name.
      if not 1 <= self.num_operands <= len(prefixes):
         raise IndexError("operation {0!r} has unsupported operand count {1}".format(self.name, self.num_operands))

      return "ir_{0}op_{1}".format(prefixes[self.num_operands - 1], self.name)


   def get_template(self):
      """Return the rendered constant-expression template for this
      operation, or None when the operation has no C expression.
      """
      if self.c_expression is None:
         return None

      # Horizontal operations are selected purely by their flags.
      if horizontal_operation in self.flags:
         if non_assign_operation in self.flags:
            template = constant_template_horizontal_nonassignment
         elif types_identical_operation in self.flags:
            template = constant_template_horizontal_single_implementation
         else:
            template = constant_template_horizontal
         return template.render(op=self)

      # Operations that need a dedicated template, keyed by operand count
      # and name.
      special_templates = {
         (2, "mul"): constant_template_mul,
         (2, "vector_extract"): constant_template_vector_extract,
         (3, "vector_insert"): constant_template_vector_insert,
         (3, "lrp"): constant_template_lrp,
         (3, "csel"): constant_template_csel,
         (4, "vector"): constant_template_vector,
      }

      template = special_templates.get((self.num_operands, self.name))
      if template is None:
         if self.num_operands == 2 and vector_scalar_operation in self.flags:
            template = constant_template_vector_scalar
         else:
            template = constant_template_common

      return template.render(op=self)


   def get_c_expression(self, types, indices=("c", "c", "c")):
      """Return the C expression for one signature.

      types   -- sequence of operand types; the union field of the first one
                 selects the expression, falling back to 'default'.
      indices -- component index text for operands 0, 1 and 2.  A fourth
                 operand is always indexed with "c".

      Placeholders for operands that the signature does not have are filled
      with the text "ERROR".
      """
      def operand(n):
         if n >= len(types):
            return "ERROR"
         # indices is only consulted for operands that actually exist.
         index = indices[n] if n < 3 else "c"
         return "op[{0}]->value.{1}[{2}]".format(n, types[n].union_field, index)

      key = types[0].union_field

      # Not dict.get(): the 'default' entry may be absent when every type
      # has its own expression, so it must only be looked up on a miss.
      expr = self.c_expression[key] if key in self.c_expression else self.c_expression['default']

      return expr.format(src0=operand(0),
                         src1=operand(1),
                         src2=operand(2),
                         src3=operand(3))


   def signatures(self):
      """Return an iterable of (dest_type, source_types) signatures: the
      explicit all_signatures when present, otherwise one signature per
      source type.
      """
      if self.all_signatures is not None:
         return self.all_signatures

      return type_signature_iter(self.dest_type, self.source_types, self.num_operands)
01e04c3fSmrg
01e04c3fSmrg
01e04c3fSmrgir_expression_operation = [
01e04c3fSmrg   operation("bit_not", 1, printable_name="~", source_types=integer_types, c_expression="~ {src0}"),
01e04c3fSmrg   operation("logic_not", 1, printable_name="!", source_types=(bool_type,), c_expression="!{src0}"),
7ec681f3Smrg   operation("neg", 1, source_types=numeric_types, c_expression={'u': "-((int) {src0})", 'u64': "-((int64_t) {src0})", 'default': "-{src0}"}),
01e04c3fSmrg   operation("abs", 1, source_types=signed_numeric_types, c_expression={'i': "{src0} < 0 ? -{src0} : {src0}", 'f': "fabsf({src0})", 'd': "fabs({src0})", 'i64': "{src0} < 0 ? -{src0} : {src0}"}),
01e04c3fSmrg   operation("sign", 1, source_types=signed_numeric_types, c_expression={'i': "({src0} > 0) - ({src0} < 0)", 'f': "float(({src0} > 0.0F) - ({src0} < 0.0F))", 'd': "double(({src0} > 0.0) - ({src0} < 0.0))", 'i64': "({src0} > 0) - ({src0} < 0)"}),
01e04c3fSmrg   operation("rcp", 1, source_types=real_types, c_expression={'f': "1.0F / {src0}", 'd': "1.0 / {src0}"}),
01e04c3fSmrg   operation("rsq", 1, source_types=real_types, c_expression={'f': "1.0F / sqrtf({src0})", 'd': "1.0 / sqrt({src0})"}),
01e04c3fSmrg   operation("sqrt", 1, source_types=real_types, c_expression={'f': "sqrtf({src0})", 'd': "sqrt({src0})"}),
01e04c3fSmrg   operation("exp", 1, source_types=(float_type,), c_expression="expf({src0})"),         # Log base e on gentype
01e04c3fSmrg   operation("log", 1, source_types=(float_type,), c_expression="logf({src0})"),         # Natural log on gentype
01e04c3fSmrg   operation("exp2", 1, source_types=(float_type,), c_expression="exp2f({src0})"),
01e04c3fSmrg   operation("log2", 1, source_types=(float_type,), c_expression="log2f({src0})"),
01e04c3fSmrg
01e04c3fSmrg   # Float-to-integer conversion.
01e04c3fSmrg   operation("f2i", 1, source_types=(float_type,), dest_type=int_type, c_expression="(int) {src0}"),
01e04c3fSmrg   # Float-to-unsigned conversion.
01e04c3fSmrg   operation("f2u", 1, source_types=(float_type,), dest_type=uint_type, c_expression="(unsigned) {src0}"),
01e04c3fSmrg   # Integer-to-float conversion.
01e04c3fSmrg   operation("i2f", 1, source_types=(int_type,), dest_type=float_type, c_expression="(float) {src0}"),
01e04c3fSmrg   # Float-to-boolean conversion
01e04c3fSmrg   operation("f2b", 1, source_types=(float_type,), dest_type=bool_type, c_expression="{src0} != 0.0F ? true : false"),
01e04c3fSmrg   # Boolean-to-float conversion
01e04c3fSmrg   operation("b2f", 1, source_types=(bool_type,), dest_type=float_type, c_expression="{src0} ? 1.0F : 0.0F"),
7ec681f3Smrg   # Boolean-to-float16 conversion
7ec681f3Smrg   operation("b2f16", 1, source_types=(bool_type,), dest_type=float_type, c_expression="{src0} ? 1.0F : 0.0F"),
01e04c3fSmrg   # int-to-boolean conversion
01e04c3fSmrg   operation("i2b", 1, source_types=(uint_type, int_type), dest_type=bool_type, c_expression="{src0} ? true : false"),
01e04c3fSmrg   # Boolean-to-int conversion
01e04c3fSmrg   operation("b2i", 1, source_types=(bool_type,), dest_type=int_type, c_expression="{src0} ? 1 : 0"),
01e04c3fSmrg   # Unsigned-to-float conversion.
01e04c3fSmrg   operation("u2f", 1, source_types=(uint_type,), dest_type=float_type, c_expression="(float) {src0}"),
01e04c3fSmrg   # Integer-to-unsigned conversion.
01e04c3fSmrg   operation("i2u", 1, source_types=(int_type,), dest_type=uint_type, c_expression="{src0}"),
01e04c3fSmrg   # Unsigned-to-integer conversion.
01e04c3fSmrg   operation("u2i", 1, source_types=(uint_type,), dest_type=int_type, c_expression="{src0}"),
01e04c3fSmrg   # Double-to-float conversion.
01e04c3fSmrg   operation("d2f", 1, source_types=(double_type,), dest_type=float_type, c_expression="{src0}"),
01e04c3fSmrg   # Float-to-double conversion.
01e04c3fSmrg   operation("f2d", 1, source_types=(float_type,), dest_type=double_type, c_expression="{src0}"),
7ec681f3Smrg   # Half-float conversions. These all operate on and return float types,
7ec681f3Smrg   # since the framework expands half to full float before calling in.  We
7ec681f3Smrg   # still have to handle them here so that we can constant propagate through
7ec681f3Smrg   # them, but they are no-ops.
7ec681f3Smrg   operation("f2f16", 1, source_types=(float_type,), dest_type=float_type, c_expression="{src0}"),
7ec681f3Smrg   operation("f2fmp", 1, source_types=(float_type,), dest_type=float_type, c_expression="{src0}"),
7ec681f3Smrg   operation("f162f", 1, source_types=(float_type,), dest_type=float_type, c_expression="{src0}"),
7ec681f3Smrg   # int16<->int32 conversion.
7ec681f3Smrg   operation("i2i", 1, source_types=(int_type,), dest_type=int_type, c_expression="{src0}"),
7ec681f3Smrg   operation("i2imp", 1, source_types=(int_type,), dest_type=int_type, c_expression="{src0}"),
7ec681f3Smrg   operation("u2u", 1, source_types=(uint_type,), dest_type=uint_type, c_expression="{src0}"),
7ec681f3Smrg   operation("u2ump", 1, source_types=(uint_type,), dest_type=uint_type, c_expression="{src0}"),
01e04c3fSmrg   # Double-to-integer conversion.
01e04c3fSmrg   operation("d2i", 1, source_types=(double_type,), dest_type=int_type, c_expression="{src0}"),
01e04c3fSmrg   # Integer-to-double conversion.
01e04c3fSmrg   operation("i2d", 1, source_types=(int_type,), dest_type=double_type, c_expression="{src0}"),
01e04c3fSmrg   # Double-to-unsigned conversion.
01e04c3fSmrg   operation("d2u", 1, source_types=(double_type,), dest_type=uint_type, c_expression="{src0}"),
01e04c3fSmrg   # Unsigned-to-double conversion.
01e04c3fSmrg   operation("u2d", 1, source_types=(uint_type,), dest_type=double_type, c_expression="{src0}"),
01e04c3fSmrg   # Double-to-boolean conversion.
01e04c3fSmrg   operation("d2b", 1, source_types=(double_type,), dest_type=bool_type, c_expression="{src0} != 0.0"),
7ec681f3Smrg   # Float16-to-boolean conversion.
7ec681f3Smrg   operation("f162b", 1, source_types=(float_type,), dest_type=bool_type, c_expression="{src0} != 0.0"),
   # Bit-identical int-to-float "conversion"
01e04c3fSmrg   operation("bitcast_i2f", 1, source_types=(int_type,), dest_type=float_type, c_expression="bitcast_u2f({src0})"),
   # Bit-identical float-to-int "conversion"
01e04c3fSmrg   operation("bitcast_f2i", 1, source_types=(float_type,), dest_type=int_type, c_expression="bitcast_f2u({src0})"),
   # Bit-identical uint-to-float "conversion"
01e04c3fSmrg   operation("bitcast_u2f", 1, source_types=(uint_type,), dest_type=float_type, c_expression="bitcast_u2f({src0})"),
   # Bit-identical float-to-uint "conversion"
01e04c3fSmrg   operation("bitcast_f2u", 1, source_types=(float_type,), dest_type=uint_type, c_expression="bitcast_f2u({src0})"),
01e04c3fSmrg   # Bit-identical u64-to-double "conversion"
01e04c3fSmrg   operation("bitcast_u642d", 1, source_types=(uint64_type,), dest_type=double_type, c_expression="bitcast_u642d({src0})"),
01e04c3fSmrg   # Bit-identical i64-to-double "conversion"
01e04c3fSmrg   operation("bitcast_i642d", 1, source_types=(int64_type,), dest_type=double_type, c_expression="bitcast_i642d({src0})"),
   # Bit-identical double-to-u64 "conversion"
01e04c3fSmrg   operation("bitcast_d2u64", 1, source_types=(double_type,), dest_type=uint64_type, c_expression="bitcast_d2u64({src0})"),
01e04c3fSmrg   # Bit-identical double-to-i64 "conversion"
01e04c3fSmrg   operation("bitcast_d2i64", 1, source_types=(double_type,), dest_type=int64_type, c_expression="bitcast_d2i64({src0})"),
01e04c3fSmrg   # i64-to-i32 conversion
01e04c3fSmrg   operation("i642i", 1, source_types=(int64_type,), dest_type=int_type, c_expression="{src0}"),
   # u64-to-i32 conversion
01e04c3fSmrg   operation("u642i", 1, source_types=(uint64_type,), dest_type=int_type, c_expression="{src0}"),
01e04c3fSmrg   operation("i642u", 1, source_types=(int64_type,), dest_type=uint_type, c_expression="{src0}"),
01e04c3fSmrg   operation("u642u", 1, source_types=(uint64_type,), dest_type=uint_type, c_expression="{src0}"),
01e04c3fSmrg   operation("i642b", 1, source_types=(int64_type,), dest_type=bool_type, c_expression="{src0} != 0"),
01e04c3fSmrg   operation("i642f", 1, source_types=(int64_type,), dest_type=float_type, c_expression="{src0}"),
01e04c3fSmrg   operation("u642f", 1, source_types=(uint64_type,), dest_type=float_type, c_expression="{src0}"),
01e04c3fSmrg   operation("i642d", 1, source_types=(int64_type,), dest_type=double_type, c_expression="{src0}"),
01e04c3fSmrg   operation("u642d", 1, source_types=(uint64_type,), dest_type=double_type, c_expression="{src0}"),
01e04c3fSmrg   operation("i2i64", 1, source_types=(int_type,), dest_type=int64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("u2i64", 1, source_types=(uint_type,), dest_type=int64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("b2i64", 1, source_types=(bool_type,), dest_type=int64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("f2i64", 1, source_types=(float_type,), dest_type=int64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("d2i64", 1, source_types=(double_type,), dest_type=int64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("i2u64", 1, source_types=(int_type,), dest_type=uint64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("u2u64", 1, source_types=(uint_type,), dest_type=uint64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("f2u64", 1, source_types=(float_type,), dest_type=uint64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("d2u64", 1, source_types=(double_type,), dest_type=uint64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("u642i64", 1, source_types=(uint64_type,), dest_type=int64_type, c_expression="{src0}"),
01e04c3fSmrg   operation("i642u64", 1, source_types=(int64_type,), dest_type=uint64_type, c_expression="{src0}"),
01e04c3fSmrg
01e04c3fSmrg
01e04c3fSmrg   # Unary floating-point rounding operations.
01e04c3fSmrg   operation("trunc", 1, source_types=real_types, c_expression={'f': "truncf({src0})", 'd': "trunc({src0})"}),
01e04c3fSmrg   operation("ceil", 1, source_types=real_types, c_expression={'f': "ceilf({src0})", 'd': "ceil({src0})"}),
01e04c3fSmrg   operation("floor", 1, source_types=real_types, c_expression={'f': "floorf({src0})", 'd': "floor({src0})"}),
01e04c3fSmrg   operation("fract", 1, source_types=real_types, c_expression={'f': "{src0} - floorf({src0})", 'd': "{src0} - floor({src0})"}),
01e04c3fSmrg   operation("round_even", 1, source_types=real_types, c_expression={'f': "_mesa_roundevenf({src0})", 'd': "_mesa_roundeven({src0})"}),
01e04c3fSmrg
01e04c3fSmrg   # Trigonometric operations.
01e04c3fSmrg   operation("sin", 1, source_types=(float_type,), c_expression="sinf({src0})"),
01e04c3fSmrg   operation("cos", 1, source_types=(float_type,), c_expression="cosf({src0})"),
7ec681f3Smrg   operation("atan", 1, source_types=(float_type,), c_expression="atan({src0})"),
01e04c3fSmrg
01e04c3fSmrg   # Partial derivatives.
01e04c3fSmrg   operation("dFdx", 1, source_types=(float_type,), c_expression="0.0f"),
01e04c3fSmrg   operation("dFdx_coarse", 1, printable_name="dFdxCoarse", source_types=(float_type,), c_expression="0.0f"),
01e04c3fSmrg   operation("dFdx_fine", 1, printable_name="dFdxFine", source_types=(float_type,), c_expression="0.0f"),
01e04c3fSmrg   operation("dFdy", 1, source_types=(float_type,), c_expression="0.0f"),
01e04c3fSmrg   operation("dFdy_coarse", 1, printable_name="dFdyCoarse", source_types=(float_type,), c_expression="0.0f"),
01e04c3fSmrg   operation("dFdy_fine", 1, printable_name="dFdyFine", source_types=(float_type,), c_expression="0.0f"),
01e04c3fSmrg
01e04c3fSmrg   # Floating point pack and unpack operations.
01e04c3fSmrg   operation("pack_snorm_2x16", 1, printable_name="packSnorm2x16", source_types=(float_type,), dest_type=uint_type, c_expression="pack_2x16(pack_snorm_1x16, op[0]->value.f[0], op[0]->value.f[1])", flags=horizontal_operation),
01e04c3fSmrg   operation("pack_snorm_4x8", 1, printable_name="packSnorm4x8", source_types=(float_type,), dest_type=uint_type, c_expression="pack_4x8(pack_snorm_1x8, op[0]->value.f[0], op[0]->value.f[1], op[0]->value.f[2], op[0]->value.f[3])", flags=horizontal_operation),
01e04c3fSmrg   operation("pack_unorm_2x16", 1, printable_name="packUnorm2x16", source_types=(float_type,), dest_type=uint_type, c_expression="pack_2x16(pack_unorm_1x16, op[0]->value.f[0], op[0]->value.f[1])", flags=horizontal_operation),
01e04c3fSmrg   operation("pack_unorm_4x8", 1, printable_name="packUnorm4x8", source_types=(float_type,), dest_type=uint_type, c_expression="pack_4x8(pack_unorm_1x8, op[0]->value.f[0], op[0]->value.f[1], op[0]->value.f[2], op[0]->value.f[3])", flags=horizontal_operation),
01e04c3fSmrg   operation("pack_half_2x16", 1, printable_name="packHalf2x16", source_types=(float_type,), dest_type=uint_type, c_expression="pack_2x16(pack_half_1x16, op[0]->value.f[0], op[0]->value.f[1])", flags=horizontal_operation),
01e04c3fSmrg   operation("unpack_snorm_2x16", 1, printable_name="unpackSnorm2x16", source_types=(uint_type,), dest_type=float_type, c_expression="unpack_2x16(unpack_snorm_1x16, op[0]->value.u[0], &data.f[0], &data.f[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
01e04c3fSmrg   operation("unpack_snorm_4x8", 1, printable_name="unpackSnorm4x8", source_types=(uint_type,), dest_type=float_type, c_expression="unpack_4x8(unpack_snorm_1x8, op[0]->value.u[0], &data.f[0], &data.f[1], &data.f[2], &data.f[3])", flags=frozenset((horizontal_operation, non_assign_operation))),
01e04c3fSmrg   operation("unpack_unorm_2x16", 1, printable_name="unpackUnorm2x16", source_types=(uint_type,), dest_type=float_type, c_expression="unpack_2x16(unpack_unorm_1x16, op[0]->value.u[0], &data.f[0], &data.f[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
01e04c3fSmrg   operation("unpack_unorm_4x8", 1, printable_name="unpackUnorm4x8", source_types=(uint_type,), dest_type=float_type, c_expression="unpack_4x8(unpack_unorm_1x8, op[0]->value.u[0], &data.f[0], &data.f[1], &data.f[2], &data.f[3])", flags=frozenset((horizontal_operation, non_assign_operation))),
01e04c3fSmrg   operation("unpack_half_2x16", 1, printable_name="unpackHalf2x16", source_types=(uint_type,), dest_type=float_type, c_expression="unpack_2x16(unpack_half_1x16, op[0]->value.u[0], &data.f[0], &data.f[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
01e04c3fSmrg
01e04c3fSmrg   # Bit operations, part of ARB_gpu_shader5.
01e04c3fSmrg   operation("bitfield_reverse", 1, source_types=(uint_type, int_type), c_expression="bitfield_reverse({src0})"),
01e04c3fSmrg   operation("bit_count", 1, source_types=(uint_type, int_type), dest_type=int_type, c_expression="util_bitcount({src0})"),
01e04c3fSmrg   operation("find_msb", 1, source_types=(uint_type, int_type), dest_type=int_type, c_expression={'u': "find_msb_uint({src0})", 'i': "find_msb_int({src0})"}),
01e04c3fSmrg   operation("find_lsb", 1, source_types=(uint_type, int_type), dest_type=int_type, c_expression="find_msb_uint({src0} & -{src0})"),
7ec681f3Smrg   operation("clz", 1, source_types=(uint_type,), dest_type=uint_type, c_expression="(unsigned)(31 - find_msb_uint({src0}))"),
01e04c3fSmrg
01e04c3fSmrg   operation("saturate", 1, printable_name="sat", source_types=(float_type,), c_expression="CLAMP({src0}, 0.0f, 1.0f)"),
01e04c3fSmrg
01e04c3fSmrg   # Double packing, part of ARB_gpu_shader_fp64.
7ec681f3Smrg   operation("pack_double_2x32", 1, printable_name="packDouble2x32", source_types=(uint_type,), dest_type=double_type, c_expression="data.u64[0] = pack_2x32(op[0]->value.u[0], op[0]->value.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
7ec681f3Smrg   operation("unpack_double_2x32", 1, printable_name="unpackDouble2x32", source_types=(double_type,), dest_type=uint_type, c_expression="unpack_2x32(op[0]->value.u64[0], &data.u[0], &data.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
01e04c3fSmrg
01e04c3fSmrg   # Sampler/Image packing, part of ARB_bindless_texture.
7ec681f3Smrg   operation("pack_sampler_2x32", 1, printable_name="packSampler2x32", source_types=(uint_type,), dest_type=uint64_type, c_expression="data.u64[0] = pack_2x32(op[0]->value.u[0], op[0]->value.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
7ec681f3Smrg   operation("pack_image_2x32", 1, printable_name="packImage2x32", source_types=(uint_type,), dest_type=uint64_type, c_expression="data.u64[0] = pack_2x32(op[0]->value.u[0], op[0]->value.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
7ec681f3Smrg   operation("unpack_sampler_2x32", 1, printable_name="unpackSampler2x32", source_types=(uint64_type,), dest_type=uint_type, c_expression="unpack_2x32(op[0]->value.u64[0], &data.u[0], &data.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
7ec681f3Smrg   operation("unpack_image_2x32", 1, printable_name="unpackImage2x32", source_types=(uint64_type,), dest_type=uint_type, c_expression="unpack_2x32(op[0]->value.u64[0], &data.u[0], &data.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
01e04c3fSmrg
01e04c3fSmrg   operation("frexp_sig", 1),
01e04c3fSmrg   operation("frexp_exp", 1),
01e04c3fSmrg
01e04c3fSmrg   operation("subroutine_to_int", 1),
01e04c3fSmrg
01e04c3fSmrg   # Interpolate fs input at centroid
01e04c3fSmrg   #
01e04c3fSmrg   # operand0 is the fs input.
01e04c3fSmrg   operation("interpolate_at_centroid", 1),
01e04c3fSmrg
01e04c3fSmrg   # Ask the driver for the total size of a buffer block.
01e04c3fSmrg   # operand0 is the ir_constant buffer block index in the linked shader.
01e04c3fSmrg   operation("get_buffer_size", 1),
01e04c3fSmrg
01e04c3fSmrg   # Calculate length of an unsized array inside a buffer block.
01e04c3fSmrg   # This opcode is going to be replaced in a lowering pass inside
01e04c3fSmrg   # the linker.
01e04c3fSmrg   #
01e04c3fSmrg   # operand0 is the unsized array's ir_value for the calculation
01e04c3fSmrg   # of its length.
01e04c3fSmrg   operation("ssbo_unsized_array_length", 1),
01e04c3fSmrg
7ec681f3Smrg   # Calculate length of an implicitly sized array.
7ec681f3Smrg   # This opcode is going to be replaced with a constant expression at link
7ec681f3Smrg   # time.
7ec681f3Smrg   operation("implicitly_sized_array_length", 1),
7ec681f3Smrg
01e04c3fSmrg   # 64-bit integer packing ops.
7ec681f3Smrg   operation("pack_int_2x32", 1, printable_name="packInt2x32", source_types=(int_type,), dest_type=int64_type, c_expression="data.u64[0] = pack_2x32(op[0]->value.u[0], op[0]->value.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
7ec681f3Smrg   operation("pack_uint_2x32", 1, printable_name="packUint2x32", source_types=(uint_type,), dest_type=uint64_type, c_expression="data.u64[0] = pack_2x32(op[0]->value.u[0], op[0]->value.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
7ec681f3Smrg   operation("unpack_int_2x32", 1, printable_name="unpackInt2x32", source_types=(int64_type,), dest_type=int_type, c_expression="unpack_2x32(op[0]->value.u64[0], &data.u[0], &data.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
7ec681f3Smrg   operation("unpack_uint_2x32", 1, printable_name="unpackUint2x32", source_types=(uint64_type,), dest_type=uint_type, c_expression="unpack_2x32(op[0]->value.u64[0], &data.u[0], &data.u[1])", flags=frozenset((horizontal_operation, non_assign_operation))),
01e04c3fSmrg
01e04c3fSmrg   operation("add", 2, printable_name="+", source_types=numeric_types, c_expression="{src0} + {src1}", flags=vector_scalar_operation),
01e04c3fSmrg   operation("sub", 2, printable_name="-", source_types=numeric_types, c_expression="{src0} - {src1}", flags=vector_scalar_operation),
7ec681f3Smrg   operation("add_sat", 2, printable_name="add_sat", source_types=integer_types, c_expression={
7ec681f3Smrg      'u': "({src0} + {src1}) < {src0} ? UINT32_MAX : ({src0} + {src1})",
7ec681f3Smrg      'i': "iadd_saturate({src0}, {src1})",
7ec681f3Smrg      'u64': "({src0} + {src1}) < {src0} ? UINT64_MAX : ({src0} + {src1})",
7ec681f3Smrg      'i64': "iadd64_saturate({src0}, {src1})"
7ec681f3Smrg   }),
7ec681f3Smrg   operation("sub_sat", 2, printable_name="sub_sat", source_types=integer_types, c_expression={
7ec681f3Smrg      'u': "({src1} > {src0}) ? 0 : {src0} - {src1}",
7ec681f3Smrg      'i': "isub_saturate({src0}, {src1})",
7ec681f3Smrg      'u64': "({src1} > {src0}) ? 0 : {src0} - {src1}",
7ec681f3Smrg      'i64': "isub64_saturate({src0}, {src1})"
7ec681f3Smrg   }),
7ec681f3Smrg   operation("abs_sub", 2, printable_name="abs_sub", source_types=integer_types, c_expression={
7ec681f3Smrg      'u': "({src1} > {src0}) ? {src1} - {src0} : {src0} - {src1}",
7ec681f3Smrg      'i': "({src1} > {src0}) ? (unsigned){src1} - (unsigned){src0} : (unsigned){src0} - (unsigned){src1}",
7ec681f3Smrg      'u64': "({src1} > {src0}) ? {src1} - {src0} : {src0} - {src1}",
7ec681f3Smrg      'i64': "({src1} > {src0}) ? (uint64_t){src1} - (uint64_t){src0} : (uint64_t){src0} - (uint64_t){src1}",
7ec681f3Smrg   }),
7ec681f3Smrg   operation("avg", 2, printable_name="average", source_types=integer_types, c_expression="({src0} >> 1) + ({src1} >> 1) + (({src0} & {src1}) & 1)"),
7ec681f3Smrg   operation("avg_round", 2, printable_name="average_rounded", source_types=integer_types, c_expression="({src0} >> 1) + ({src1} >> 1) + (({src0} | {src1}) & 1)"),
7ec681f3Smrg
01e04c3fSmrg   # "Floating-point or low 32-bit integer multiply."
01e04c3fSmrg   operation("mul", 2, printable_name="*", source_types=numeric_types, c_expression="{src0} * {src1}"),
7ec681f3Smrg   operation("mul_32x16", 2, printable_name="*", source_types=(uint_type, int_type), c_expression={
7ec681f3Smrg      'u': "{src0} * (uint16_t){src1}",
7ec681f3Smrg      'i': "{src0} * (int16_t){src0}"
7ec681f3Smrg   }),
01e04c3fSmrg   operation("imul_high", 2),       # Calculates the high 32-bits of a 64-bit multiply.
01e04c3fSmrg   operation("div", 2, printable_name="/", source_types=numeric_types, c_expression={'u': "{src1} == 0 ? 0 : {src0} / {src1}", 'i': "{src1} == 0 ? 0 : {src0} / {src1}", 'u64': "{src1} == 0 ? 0 : {src0} / {src1}", 'i64': "{src1} == 0 ? 0 : {src0} / {src1}", 'default': "{src0} / {src1}"}, flags=vector_scalar_operation),
01e04c3fSmrg
01e04c3fSmrg   # Returns the carry resulting from the addition of the two arguments.
01e04c3fSmrg   operation("carry", 2),
01e04c3fSmrg
01e04c3fSmrg   # Returns the borrow resulting from the subtraction of the second argument
01e04c3fSmrg   # from the first argument.
01e04c3fSmrg   operation("borrow", 2),
01e04c3fSmrg
01e04c3fSmrg   # Either (vector % vector) or (vector % scalar)
01e04c3fSmrg   #
01e04c3fSmrg   # We don't use fmod because it rounds toward zero; GLSL specifies the use
01e04c3fSmrg   # of floor.
01e04c3fSmrg   operation("mod", 2, printable_name="%", source_types=numeric_types, c_expression={'u': "{src1} == 0 ? 0 : {src0} % {src1}", 'i': "{src1} == 0 ? 0 : {src0} % {src1}", 'f': "{src0} - {src1} * floorf({src0} / {src1})", 'd': "{src0} - {src1} * floor({src0} / {src1})", 'u64': "{src1} == 0 ? 0 : {src0} % {src1}", 'i64': "{src1} == 0 ? 0 : {src0} % {src1}"}, flags=vector_scalar_operation),
01e04c3fSmrg
01e04c3fSmrg   # Binary comparison operators which return a boolean vector.
01e04c3fSmrg   # The type of both operands must be equal.
01e04c3fSmrg   operation("less", 2, printable_name="<", source_types=numeric_types, dest_type=bool_type, c_expression="{src0} < {src1}"),
01e04c3fSmrg   operation("gequal", 2, printable_name=">=", source_types=numeric_types, dest_type=bool_type, c_expression="{src0} >= {src1}"),
01e04c3fSmrg   operation("equal", 2, printable_name="==", source_types=all_types, dest_type=bool_type, c_expression="{src0} == {src1}"),
01e04c3fSmrg   operation("nequal", 2, printable_name="!=", source_types=all_types, dest_type=bool_type, c_expression="{src0} != {src1}"),
01e04c3fSmrg
01e04c3fSmrg   # Returns single boolean for whether all components of operands[0]
01e04c3fSmrg   # equal the components of operands[1].
01e04c3fSmrg   operation("all_equal", 2, source_types=all_types, dest_type=bool_type, c_expression="op[0]->has_value(op[1])", flags=frozenset((horizontal_operation, types_identical_operation))),
01e04c3fSmrg
01e04c3fSmrg   # Returns single boolean for whether any component of operands[0]
01e04c3fSmrg   # is not equal to the corresponding component of operands[1].
01e04c3fSmrg   operation("any_nequal", 2, source_types=all_types, dest_type=bool_type, c_expression="!op[0]->has_value(op[1])", flags=frozenset((horizontal_operation, types_identical_operation))),
01e04c3fSmrg
01e04c3fSmrg   # Bit-wise binary operations.
01e04c3fSmrg   operation("lshift", 2, printable_name="<<", source_types=integer_types, c_expression="{src0} << {src1}", flags=frozenset((vector_scalar_operation, mixed_type_operation))),
01e04c3fSmrg   operation("rshift", 2, printable_name=">>", source_types=integer_types, c_expression="{src0} >> {src1}", flags=frozenset((vector_scalar_operation, mixed_type_operation))),
01e04c3fSmrg   operation("bit_and", 2, printable_name="&", source_types=integer_types, c_expression="{src0} & {src1}", flags=vector_scalar_operation),
01e04c3fSmrg   operation("bit_xor", 2, printable_name="^", source_types=integer_types, c_expression="{src0} ^ {src1}", flags=vector_scalar_operation),
01e04c3fSmrg   operation("bit_or", 2, printable_name="|", source_types=integer_types, c_expression="{src0} | {src1}", flags=vector_scalar_operation),
01e04c3fSmrg
01e04c3fSmrg   operation("logic_and", 2, printable_name="&&", source_types=(bool_type,), c_expression="{src0} && {src1}"),
01e04c3fSmrg   operation("logic_xor", 2, printable_name="^^", source_types=(bool_type,), c_expression="{src0} != {src1}"),
01e04c3fSmrg   operation("logic_or", 2, printable_name="||", source_types=(bool_type,), c_expression="{src0} || {src1}"),
01e04c3fSmrg
01e04c3fSmrg   operation("dot", 2, source_types=real_types, c_expression={'f': "dot_f(op[0], op[1])", 'd': "dot_d(op[0], op[1])"}, flags=horizontal_operation),
01e04c3fSmrg   operation("min", 2, source_types=numeric_types, c_expression="MIN2({src0}, {src1})", flags=vector_scalar_operation),
01e04c3fSmrg   operation("max", 2, source_types=numeric_types, c_expression="MAX2({src0}, {src1})", flags=vector_scalar_operation),
01e04c3fSmrg
01e04c3fSmrg   operation("pow", 2, source_types=(float_type,), c_expression="powf({src0}, {src1})"),
01e04c3fSmrg
01e04c3fSmrg   # Load a value the size of a given GLSL type from a uniform block.
01e04c3fSmrg   #
01e04c3fSmrg   # operand0 is the ir_constant uniform block index in the linked shader.
01e04c3fSmrg   # operand1 is a byte offset within the uniform block.
01e04c3fSmrg   operation("ubo_load", 2),
01e04c3fSmrg
01e04c3fSmrg   # Multiplies a number by two to a power, part of ARB_gpu_shader5.
01e04c3fSmrg   operation("ldexp", 2,
01e04c3fSmrg             all_signatures=((float_type, (float_type, int_type)),
01e04c3fSmrg                             (double_type, (double_type, int_type))),
01e04c3fSmrg             c_expression={'f': "ldexpf_flush_subnormal({src0}, {src1})",
01e04c3fSmrg                           'd': "ldexp_flush_subnormal({src0}, {src1})"}),
01e04c3fSmrg
01e04c3fSmrg   # Extract a scalar from a vector
01e04c3fSmrg   #
01e04c3fSmrg   # operand0 is the vector
01e04c3fSmrg   # operand1 is the index of the field to read from operand0
01e04c3fSmrg   operation("vector_extract", 2, source_types=all_types, c_expression="anything-except-None"),
01e04c3fSmrg
01e04c3fSmrg   # Interpolate fs input at offset
01e04c3fSmrg   #
01e04c3fSmrg   # operand0 is the fs input
01e04c3fSmrg   # operand1 is the offset from the pixel center
01e04c3fSmrg   operation("interpolate_at_offset", 2),
01e04c3fSmrg
01e04c3fSmrg   # Interpolate fs input at sample position
01e04c3fSmrg   #
01e04c3fSmrg   # operand0 is the fs input
01e04c3fSmrg   # operand1 is the sample ID
01e04c3fSmrg   operation("interpolate_at_sample", 2),
01e04c3fSmrg
7ec681f3Smrg   operation("atan2", 2, source_types=(float_type,), c_expression="atan2({src0}, {src1})"),
7ec681f3Smrg
01e04c3fSmrg   # Fused floating-point multiply-add, part of ARB_gpu_shader5.
01e04c3fSmrg   operation("fma", 3, source_types=real_types, c_expression="{src0} * {src1} + {src2}"),
01e04c3fSmrg
01e04c3fSmrg   operation("lrp", 3, source_types=real_types, c_expression={'f': "{src0} * (1.0f - {src2}) + ({src1} * {src2})", 'd': "{src0} * (1.0 - {src2}) + ({src1} * {src2})"}),
01e04c3fSmrg
01e04c3fSmrg   # Conditional Select
01e04c3fSmrg   #
01e04c3fSmrg   # A vector conditional select instruction (like ?:, but operating per-
01e04c3fSmrg   # component on vectors).
01e04c3fSmrg   #
01e04c3fSmrg   # See also lower_instructions_visitor::ldexp_to_arith
01e04c3fSmrg   operation("csel", 3,
01e04c3fSmrg             all_signatures=zip(all_types, zip(len(all_types) * (bool_type,), all_types, all_types)),
01e04c3fSmrg             c_expression="{src0} ? {src1} : {src2}"),
01e04c3fSmrg
01e04c3fSmrg   operation("bitfield_extract", 3,
01e04c3fSmrg             all_signatures=((int_type, (uint_type, int_type, int_type)),
01e04c3fSmrg                             (int_type, (int_type, int_type, int_type))),
01e04c3fSmrg             c_expression={'u': "bitfield_extract_uint({src0}, {src1}, {src2})",
01e04c3fSmrg                           'i': "bitfield_extract_int({src0}, {src1}, {src2})"}),
01e04c3fSmrg
01e04c3fSmrg   # Generate a value with one field of a vector changed
01e04c3fSmrg   #
01e04c3fSmrg   # operand0 is the vector
01e04c3fSmrg   # operand1 is the value to write into the vector result
01e04c3fSmrg   # operand2 is the index in operand0 to be modified
01e04c3fSmrg   operation("vector_insert", 3, source_types=all_types, c_expression="anything-except-None"),
01e04c3fSmrg
01e04c3fSmrg   operation("bitfield_insert", 4,
01e04c3fSmrg             all_signatures=((uint_type, (uint_type, uint_type, int_type, int_type)),
01e04c3fSmrg                             (int_type, (int_type, int_type, int_type, int_type))),
01e04c3fSmrg             c_expression="bitfield_insert({src0}, {src1}, {src2}, {src3})"),
01e04c3fSmrg
01e04c3fSmrg   operation("vector", 4, source_types=all_types, c_expression="anything-except-None"),
01e04c3fSmrg]
01e04c3fSmrg
01e04c3fSmrg
def last_operations_by_arity(operations):
   """Return the last operation of each operand count found in `operations`.

   The result is a four-element list indexed by ``num_operands - 1``.  A slot
   stays ``None`` when `operations` holds no entry with that operand count.
   The enum template uses these entries to emit the ``ir_last_*op``
   sentinels.
   """
   lasts = [None, None, None, None]
   # Walk the list backwards so that the first hit for each operand count is
   # the final entry of that kind in declaration order.
   for item in reversed(operations):
      i = item.num_operands - 1
      if lasts[i] is None:
         lasts[i] = item
   return lasts


if __name__ == "__main__":
   # The single command-line argument selects which generated text is
   # printed to stdout.  Validate it before doing any work: a missing
   # argument used to raise IndexError, and an unknown one silently printed
   # nothing while still exiting successfully.
   modes = ("enum", "strings", "constant")
   if len(sys.argv) < 2 or sys.argv[1] not in modes:
      sys.stderr.write("usage: %s {%s}\n" % (sys.argv[0], "|".join(modes)))
      sys.exit(1)
   mode = sys.argv[1]

   # License header prepended to the enum and strings outputs.
   copyright = """/*
 * Copyright (C) 2010 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */
"""

   # "enum": the ir_expression_operation enum, one enumerator per operation,
   # followed by the sentinels naming the last operation of each arity.
   enum_template = mako.template.Template(copyright + """
enum ir_expression_operation {
% for item in values:
   ${item.get_enum_name()},
% endfor

   /* Sentinels marking the last of each kind of operation. */
% for item in lasts:
   ir_last_${("un", "bin", "tri", "quad")[item.num_operands - 1]}op = ${item.get_enum_name()},
% endfor
   ir_last_opcode = ir_quadop_${lasts[3].name}
};""")

   # "strings": two parallel string tables, printable names and raw names.
   strings_template = mako.template.Template(copyright + """
const char *const ir_expression_operation_strings[] = {
% for item in values:
   "${item.printable_name}",
% endfor
};

const char *const ir_expression_operation_enum_strings[] = {
% for item in values:
   "${item.name}",
% endfor
};""")

   # "constant": a switch over this->operation containing the rendered
   # template of every operation that has a c_expression.
   constant_template = mako.template.Template("""\
   switch (this->operation) {
% for op in values:
    % if op.c_expression is not None:
${op.get_template()}

    % endif
% endfor
   default:
      /* FINISHME: Should handle all expression types. */
      return NULL;
   }
""")

   if mode == "enum":
      print(enum_template.render(values=ir_expression_operation,
                                 lasts=last_operations_by_arity(ir_expression_operation)))
   elif mode == "strings":
      print(strings_template.render(values=ir_expression_operation))
   elif mode == "constant":
      print(constant_template.render(values=ir_expression_operation))