1b8e80941Smrg/*
2b8e80941Smrg * Copyright © 2010 Intel Corporation
3b8e80941Smrg *
4b8e80941Smrg * Permission is hereby granted, free of charge, to any person obtaining a
5b8e80941Smrg * copy of this software and associated documentation files (the "Software"),
6b8e80941Smrg * to deal in the Software without restriction, including without limitation
7b8e80941Smrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8b8e80941Smrg * and/or sell copies of the Software, and to permit persons to whom the
9b8e80941Smrg * Software is furnished to do so, subject to the following conditions:
10b8e80941Smrg *
11b8e80941Smrg * The above copyright notice and this permission notice (including the next
12b8e80941Smrg * paragraph) shall be included in all copies or substantial portions of the
13b8e80941Smrg * Software.
14b8e80941Smrg *
15b8e80941Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16b8e80941Smrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17b8e80941Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18b8e80941Smrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19b8e80941Smrg * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20b8e80941Smrg * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21b8e80941Smrg * DEALINGS IN THE SOFTWARE.
22b8e80941Smrg */
23b8e80941Smrg
24b8e80941Smrg/**
25b8e80941Smrg * \file opt_swizzle.cpp
26b8e80941Smrg * Optimize swizzle operations.
27b8e80941Smrg *
28b8e80941Smrg * First, compact a sequence of swizzled swizzles into a single swizzle.
29b8e80941Smrg *
30b8e80941Smrg * If the final resulting swizzle doesn't change the order or count of
31b8e80941Smrg * components, then remove the swizzle so that other optimization passes see
32b8e80941Smrg * the value behind it.
33b8e80941Smrg */
34b8e80941Smrg
35b8e80941Smrg#include "ir.h"
36b8e80941Smrg#include "ir_visitor.h"
37b8e80941Smrg#include "ir_rvalue_visitor.h"
38b8e80941Smrg#include "compiler/glsl_types.h"
39b8e80941Smrg
40b8e80941Smrgnamespace {
41b8e80941Smrg
42b8e80941Smrgclass ir_opt_swizzle_visitor : public ir_rvalue_visitor {
43b8e80941Smrgpublic:
44b8e80941Smrg   ir_opt_swizzle_visitor()
45b8e80941Smrg   {
46b8e80941Smrg      this->progress = false;
47b8e80941Smrg   }
48b8e80941Smrg
49b8e80941Smrg   void handle_rvalue(ir_rvalue **rvalue);
50b8e80941Smrg   bool progress;
51b8e80941Smrg};
52b8e80941Smrg
53b8e80941Smrg} /* unnamed namespace */
54b8e80941Smrg
55b8e80941Smrgvoid
56b8e80941Smrgir_opt_swizzle_visitor::handle_rvalue(ir_rvalue **rvalue)
57b8e80941Smrg{
58b8e80941Smrg   if (!*rvalue)
59b8e80941Smrg      return;
60b8e80941Smrg
61b8e80941Smrg   ir_swizzle *swiz = (*rvalue)->as_swizzle();
62b8e80941Smrg
63b8e80941Smrg   if (!swiz)
64b8e80941Smrg      return;
65b8e80941Smrg
66b8e80941Smrg   ir_swizzle *swiz2;
67b8e80941Smrg
68b8e80941Smrg   while ((swiz2 = swiz->val->as_swizzle()) != NULL) {
69b8e80941Smrg      int mask2[4];
70b8e80941Smrg
71b8e80941Smrg      memset(&mask2, 0, sizeof(mask2));
72b8e80941Smrg      if (swiz2->mask.num_components >= 1)
73b8e80941Smrg         mask2[0] = swiz2->mask.x;
74b8e80941Smrg      if (swiz2->mask.num_components >= 2)
75b8e80941Smrg         mask2[1] = swiz2->mask.y;
76b8e80941Smrg      if (swiz2->mask.num_components >= 3)
77b8e80941Smrg         mask2[2] = swiz2->mask.z;
78b8e80941Smrg      if (swiz2->mask.num_components >= 4)
79b8e80941Smrg         mask2[3] = swiz2->mask.w;
80b8e80941Smrg
81b8e80941Smrg      if (swiz->mask.num_components >= 1)
82b8e80941Smrg         swiz->mask.x = mask2[swiz->mask.x];
83b8e80941Smrg      if (swiz->mask.num_components >= 2)
84b8e80941Smrg         swiz->mask.y = mask2[swiz->mask.y];
85b8e80941Smrg      if (swiz->mask.num_components >= 3)
86b8e80941Smrg         swiz->mask.z = mask2[swiz->mask.z];
87b8e80941Smrg      if (swiz->mask.num_components >= 4)
88b8e80941Smrg         swiz->mask.w = mask2[swiz->mask.w];
89b8e80941Smrg
90b8e80941Smrg      swiz->val = swiz2->val;
91b8e80941Smrg
92b8e80941Smrg      this->progress = true;
93b8e80941Smrg   }
94b8e80941Smrg
95b8e80941Smrg   if (swiz->type != swiz->val->type)
96b8e80941Smrg      return;
97b8e80941Smrg
98b8e80941Smrg   int elems = swiz->val->type->vector_elements;
99b8e80941Smrg   if (swiz->mask.x != 0)
100b8e80941Smrg      return;
101b8e80941Smrg   if (elems >= 2 && swiz->mask.y != 1)
102b8e80941Smrg      return;
103b8e80941Smrg   if (elems >= 3 && swiz->mask.z != 2)
104b8e80941Smrg      return;
105b8e80941Smrg   if (elems >= 4 && swiz->mask.w != 3)
106b8e80941Smrg      return;
107b8e80941Smrg
108b8e80941Smrg   this->progress = true;
109b8e80941Smrg   *rvalue = swiz->val;
110b8e80941Smrg}
111b8e80941Smrg
112b8e80941Smrgbool
113b8e80941Smrgoptimize_swizzles(exec_list *instructions)
114b8e80941Smrg{
115b8e80941Smrg   ir_opt_swizzle_visitor v;
116b8e80941Smrg   visit_list_elements(&v, instructions);
117b8e80941Smrg
118b8e80941Smrg   return v.progress;
119b8e80941Smrg}
120