1b8e80941Smrg/*
2b8e80941Smrg * Copyright © 2015 Red Hat
3b8e80941Smrg *
4b8e80941Smrg * Permission is hereby granted, free of charge, to any person obtaining a
5b8e80941Smrg * copy of this software and associated documentation files (the "Software"),
6b8e80941Smrg * to deal in the Software without restriction, including without limitation
7b8e80941Smrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8b8e80941Smrg * and/or sell copies of the Software, and to permit persons to whom the
9b8e80941Smrg * Software is furnished to do so, subject to the following conditions:
10b8e80941Smrg *
11b8e80941Smrg * The above copyright notice and this permission notice (including the next
12b8e80941Smrg * paragraph) shall be included in all copies or substantial portions of the
13b8e80941Smrg * Software.
14b8e80941Smrg *
15b8e80941Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16b8e80941Smrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17b8e80941Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18b8e80941Smrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19b8e80941Smrg * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20b8e80941Smrg * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21b8e80941Smrg * SOFTWARE.
22b8e80941Smrg */
23b8e80941Smrg
24b8e80941Smrg#include "nir.h"
25b8e80941Smrg#include "nir_builder.h"
26b8e80941Smrg
27b8e80941Smrg/* Lower glDrawPixels().
28b8e80941Smrg *
29b8e80941Smrg * This is based on the logic in st_get_drawpix_shader() in TGSI compiler.
30b8e80941Smrg *
31b8e80941Smrg * Run before nir_lower_io.
32b8e80941Smrg */
33b8e80941Smrg
34b8e80941Smrgtypedef struct {
35b8e80941Smrg   const nir_lower_drawpixels_options *options;
36b8e80941Smrg   nir_shader   *shader;
37b8e80941Smrg   nir_builder   b;
38b8e80941Smrg   nir_variable *texcoord, *scale, *bias, *tex, *pixelmap;
39b8e80941Smrg} lower_drawpixels_state;
40b8e80941Smrg
41b8e80941Smrgstatic nir_ssa_def *
42b8e80941Smrgget_texcoord(lower_drawpixels_state *state)
43b8e80941Smrg{
44b8e80941Smrg   if (state->texcoord == NULL) {
45b8e80941Smrg      nir_variable *texcoord = NULL;
46b8e80941Smrg
47b8e80941Smrg      /* find gl_TexCoord, if it exists: */
48b8e80941Smrg      nir_foreach_variable(var, &state->shader->inputs) {
49b8e80941Smrg         if (var->data.location == VARYING_SLOT_TEX0) {
50b8e80941Smrg            texcoord = var;
51b8e80941Smrg            break;
52b8e80941Smrg         }
53b8e80941Smrg      }
54b8e80941Smrg
55b8e80941Smrg      /* otherwise create it: */
56b8e80941Smrg      if (texcoord == NULL) {
57b8e80941Smrg         texcoord = nir_variable_create(state->shader,
58b8e80941Smrg                                        nir_var_shader_in,
59b8e80941Smrg                                        glsl_vec4_type(),
60b8e80941Smrg                                        "gl_TexCoord");
61b8e80941Smrg         texcoord->data.location = VARYING_SLOT_TEX0;
62b8e80941Smrg      }
63b8e80941Smrg
64b8e80941Smrg      state->texcoord = texcoord;
65b8e80941Smrg   }
66b8e80941Smrg   return nir_load_var(&state->b, state->texcoord);
67b8e80941Smrg}
68b8e80941Smrg
69b8e80941Smrgstatic nir_variable *
70b8e80941Smrgcreate_uniform(nir_shader *shader, const char *name,
71b8e80941Smrg               const gl_state_index16 state_tokens[STATE_LENGTH])
72b8e80941Smrg{
73b8e80941Smrg   nir_variable *var = nir_variable_create(shader,
74b8e80941Smrg                                           nir_var_uniform,
75b8e80941Smrg                                           glsl_vec4_type(),
76b8e80941Smrg                                           name);
77b8e80941Smrg   var->num_state_slots = 1;
78b8e80941Smrg   var->state_slots = ralloc_array(var, nir_state_slot, 1);
79b8e80941Smrg   memcpy(var->state_slots[0].tokens, state_tokens,
80b8e80941Smrg          sizeof(var->state_slots[0].tokens));
81b8e80941Smrg   return var;
82b8e80941Smrg}
83b8e80941Smrg
84b8e80941Smrgstatic nir_ssa_def *
85b8e80941Smrgget_scale(lower_drawpixels_state *state)
86b8e80941Smrg{
87b8e80941Smrg   if (state->scale == NULL) {
88b8e80941Smrg      state->scale = create_uniform(state->shader, "gl_PTscale",
89b8e80941Smrg                                    state->options->scale_state_tokens);
90b8e80941Smrg   }
91b8e80941Smrg   return nir_load_var(&state->b, state->scale);
92b8e80941Smrg}
93b8e80941Smrg
94b8e80941Smrgstatic nir_ssa_def *
95b8e80941Smrgget_bias(lower_drawpixels_state *state)
96b8e80941Smrg{
97b8e80941Smrg   if (state->bias == NULL) {
98b8e80941Smrg      state->bias = create_uniform(state->shader, "gl_PTbias",
99b8e80941Smrg                                   state->options->bias_state_tokens);
100b8e80941Smrg   }
101b8e80941Smrg   return nir_load_var(&state->b, state->bias);
102b8e80941Smrg}
103b8e80941Smrg
104b8e80941Smrgstatic nir_ssa_def *
105b8e80941Smrgget_texcoord_const(lower_drawpixels_state *state)
106b8e80941Smrg{
107b8e80941Smrg   if (state->bias == NULL) {
108b8e80941Smrg      state->bias = create_uniform(state->shader, "gl_MultiTexCoord0",
109b8e80941Smrg                                   state->options->texcoord_state_tokens);
110b8e80941Smrg   }
111b8e80941Smrg   return nir_load_var(&state->b, state->bias);
112b8e80941Smrg}
113b8e80941Smrg
114b8e80941Smrgstatic void
115b8e80941Smrglower_color(lower_drawpixels_state *state, nir_intrinsic_instr *intr)
116b8e80941Smrg{
117b8e80941Smrg   nir_builder *b = &state->b;
118b8e80941Smrg   nir_ssa_def *texcoord;
119b8e80941Smrg   nir_tex_instr *tex;
120b8e80941Smrg   nir_ssa_def *def;
121b8e80941Smrg
122b8e80941Smrg   assert(intr->dest.is_ssa);
123b8e80941Smrg
124b8e80941Smrg   b->cursor = nir_before_instr(&intr->instr);
125b8e80941Smrg
126b8e80941Smrg   texcoord = get_texcoord(state);
127b8e80941Smrg
128b8e80941Smrg   const struct glsl_type *sampler2D =
129b8e80941Smrg      glsl_sampler_type(GLSL_SAMPLER_DIM_2D, false, false, GLSL_TYPE_FLOAT);
130b8e80941Smrg
131b8e80941Smrg   if (!state->tex) {
132b8e80941Smrg      state->tex =
133b8e80941Smrg         nir_variable_create(b->shader, nir_var_uniform, sampler2D, "drawpix");
134b8e80941Smrg      state->tex->data.binding = state->options->drawpix_sampler;
135b8e80941Smrg      state->tex->data.explicit_binding = true;
136b8e80941Smrg      state->tex->data.how_declared = nir_var_hidden;
137b8e80941Smrg   }
138b8e80941Smrg
139b8e80941Smrg   nir_deref_instr *tex_deref = nir_build_deref_var(b, state->tex);
140b8e80941Smrg
141b8e80941Smrg   /* replace load_var(gl_Color) w/ texture sample:
142b8e80941Smrg    *   TEX def, texcoord, drawpix_sampler, 2D
143b8e80941Smrg    */
144b8e80941Smrg   tex = nir_tex_instr_create(state->shader, 3);
145b8e80941Smrg   tex->op = nir_texop_tex;
146b8e80941Smrg   tex->sampler_dim = GLSL_SAMPLER_DIM_2D;
147b8e80941Smrg   tex->coord_components = 2;
148b8e80941Smrg   tex->dest_type = nir_type_float;
149b8e80941Smrg   tex->src[0].src_type = nir_tex_src_texture_deref;
150b8e80941Smrg   tex->src[0].src = nir_src_for_ssa(&tex_deref->dest.ssa);
151b8e80941Smrg   tex->src[1].src_type = nir_tex_src_sampler_deref;
152b8e80941Smrg   tex->src[1].src = nir_src_for_ssa(&tex_deref->dest.ssa);
153b8e80941Smrg   tex->src[2].src_type = nir_tex_src_coord;
154b8e80941Smrg   tex->src[2].src =
155b8e80941Smrg      nir_src_for_ssa(nir_channels(b, texcoord,
156b8e80941Smrg                                   (1 << tex->coord_components) - 1));
157b8e80941Smrg
158b8e80941Smrg   nir_ssa_dest_init(&tex->instr, &tex->dest, 4, 32, NULL);
159b8e80941Smrg   nir_builder_instr_insert(b, &tex->instr);
160b8e80941Smrg   def = &tex->dest.ssa;
161b8e80941Smrg
162b8e80941Smrg   /* Apply the scale and bias. */
163b8e80941Smrg   if (state->options->scale_and_bias) {
164b8e80941Smrg      /* MAD def, def, scale, bias; */
165b8e80941Smrg      def = nir_ffma(b, def, get_scale(state), get_bias(state));
166b8e80941Smrg   }
167b8e80941Smrg
168b8e80941Smrg   if (state->options->pixel_maps) {
169b8e80941Smrg      if (!state->pixelmap) {
170b8e80941Smrg         state->pixelmap = nir_variable_create(b->shader, nir_var_uniform,
171b8e80941Smrg                                               sampler2D, "pixelmap");
172b8e80941Smrg         state->pixelmap->data.binding = state->options->pixelmap_sampler;
173b8e80941Smrg         state->pixelmap->data.explicit_binding = true;
174b8e80941Smrg         state->pixelmap->data.how_declared = nir_var_hidden;
175b8e80941Smrg      }
176b8e80941Smrg
177b8e80941Smrg      nir_deref_instr *pixelmap_deref =
178b8e80941Smrg         nir_build_deref_var(b, state->pixelmap);
179b8e80941Smrg
180b8e80941Smrg      /* do four pixel map look-ups with two TEX instructions: */
181b8e80941Smrg      nir_ssa_def *def_xy, *def_zw;
182b8e80941Smrg
183b8e80941Smrg      /* TEX def.xy, def.xyyy, pixelmap_sampler, 2D; */
184b8e80941Smrg      tex = nir_tex_instr_create(state->shader, 3);
185b8e80941Smrg      tex->op = nir_texop_tex;
186b8e80941Smrg      tex->sampler_dim = GLSL_SAMPLER_DIM_2D;
187b8e80941Smrg      tex->coord_components = 2;
188b8e80941Smrg      tex->sampler_index = state->options->pixelmap_sampler;
189b8e80941Smrg      tex->texture_index = state->options->pixelmap_sampler;
190b8e80941Smrg      tex->dest_type = nir_type_float;
191b8e80941Smrg      tex->src[0].src_type = nir_tex_src_texture_deref;
192b8e80941Smrg      tex->src[0].src = nir_src_for_ssa(&pixelmap_deref->dest.ssa);
193b8e80941Smrg      tex->src[1].src_type = nir_tex_src_sampler_deref;
194b8e80941Smrg      tex->src[1].src = nir_src_for_ssa(&pixelmap_deref->dest.ssa);
195b8e80941Smrg      tex->src[2].src_type = nir_tex_src_coord;
196b8e80941Smrg      tex->src[2].src = nir_src_for_ssa(nir_channels(b, def, 0x3));
197b8e80941Smrg
198b8e80941Smrg      nir_ssa_dest_init(&tex->instr, &tex->dest, 4, 32, NULL);
199b8e80941Smrg      nir_builder_instr_insert(b, &tex->instr);
200b8e80941Smrg      def_xy = &tex->dest.ssa;
201b8e80941Smrg
202b8e80941Smrg      /* TEX def.zw, def.zwww, pixelmap_sampler, 2D; */
203b8e80941Smrg      tex = nir_tex_instr_create(state->shader, 1);
204b8e80941Smrg      tex->op = nir_texop_tex;
205b8e80941Smrg      tex->sampler_dim = GLSL_SAMPLER_DIM_2D;
206b8e80941Smrg      tex->coord_components = 2;
207b8e80941Smrg      tex->sampler_index = state->options->pixelmap_sampler;
208b8e80941Smrg      tex->dest_type = nir_type_float;
209b8e80941Smrg      tex->src[0].src_type = nir_tex_src_coord;
210b8e80941Smrg      tex->src[0].src = nir_src_for_ssa(nir_channels(b, def, 0xc));
211b8e80941Smrg
212b8e80941Smrg      nir_ssa_dest_init(&tex->instr, &tex->dest, 4, 32, NULL);
213b8e80941Smrg      nir_builder_instr_insert(b, &tex->instr);
214b8e80941Smrg      def_zw = &tex->dest.ssa;
215b8e80941Smrg
216b8e80941Smrg      /* def = vec4(def.xy, def.zw); */
217b8e80941Smrg      def = nir_vec4(b,
218b8e80941Smrg                     nir_channel(b, def_xy, 0),
219b8e80941Smrg                     nir_channel(b, def_xy, 1),
220b8e80941Smrg                     nir_channel(b, def_zw, 0),
221b8e80941Smrg                     nir_channel(b, def_zw, 1));
222b8e80941Smrg   }
223b8e80941Smrg
224b8e80941Smrg   nir_ssa_def_rewrite_uses(&intr->dest.ssa, nir_src_for_ssa(def));
225b8e80941Smrg}
226b8e80941Smrg
227b8e80941Smrgstatic void
228b8e80941Smrglower_texcoord(lower_drawpixels_state *state, nir_intrinsic_instr *intr)
229b8e80941Smrg{
230b8e80941Smrg   state->b.cursor = nir_before_instr(&intr->instr);
231b8e80941Smrg
232b8e80941Smrg   nir_ssa_def *texcoord_const = get_texcoord_const(state);
233b8e80941Smrg   nir_ssa_def_rewrite_uses(&intr->dest.ssa, nir_src_for_ssa(texcoord_const));
234b8e80941Smrg}
235b8e80941Smrg
236b8e80941Smrgstatic bool
237b8e80941Smrglower_drawpixels_block(lower_drawpixels_state *state, nir_block *block)
238b8e80941Smrg{
239b8e80941Smrg   nir_foreach_instr_safe(instr, block) {
240b8e80941Smrg      if (instr->type == nir_instr_type_intrinsic) {
241b8e80941Smrg         nir_intrinsic_instr *intr = nir_instr_as_intrinsic(instr);
242b8e80941Smrg         if (intr->intrinsic == nir_intrinsic_load_deref) {
243b8e80941Smrg            nir_deref_instr *deref = nir_src_as_deref(intr->src[0]);
244b8e80941Smrg            nir_variable *var = nir_deref_instr_get_variable(deref);
245b8e80941Smrg
246b8e80941Smrg            if (var->data.location == VARYING_SLOT_COL0) {
247b8e80941Smrg               /* gl_Color should not have array/struct derefs: */
248b8e80941Smrg               assert(deref->deref_type == nir_deref_type_var);
249b8e80941Smrg               lower_color(state, intr);
250b8e80941Smrg            } else if (var->data.location == VARYING_SLOT_TEX0) {
251b8e80941Smrg               /* gl_TexCoord should not have array/struct derefs: */
252b8e80941Smrg               assert(deref->deref_type == nir_deref_type_var);
253b8e80941Smrg               lower_texcoord(state, intr);
254b8e80941Smrg            }
255b8e80941Smrg         }
256b8e80941Smrg      }
257b8e80941Smrg   }
258b8e80941Smrg
259b8e80941Smrg   return true;
260b8e80941Smrg}
261b8e80941Smrg
262b8e80941Smrgstatic void
263b8e80941Smrglower_drawpixels_impl(lower_drawpixels_state *state, nir_function_impl *impl)
264b8e80941Smrg{
265b8e80941Smrg   nir_builder_init(&state->b, impl);
266b8e80941Smrg
267b8e80941Smrg   nir_foreach_block(block, impl) {
268b8e80941Smrg      lower_drawpixels_block(state, block);
269b8e80941Smrg   }
270b8e80941Smrg   nir_metadata_preserve(impl, nir_metadata_block_index |
271b8e80941Smrg                               nir_metadata_dominance);
272b8e80941Smrg}
273b8e80941Smrg
274b8e80941Smrgvoid
275b8e80941Smrgnir_lower_drawpixels(nir_shader *shader,
276b8e80941Smrg                     const nir_lower_drawpixels_options *options)
277b8e80941Smrg{
278b8e80941Smrg   lower_drawpixels_state state = {
279b8e80941Smrg      .options = options,
280b8e80941Smrg      .shader = shader,
281b8e80941Smrg   };
282b8e80941Smrg
283b8e80941Smrg   assert(shader->info.stage == MESA_SHADER_FRAGMENT);
284b8e80941Smrg
285b8e80941Smrg   nir_foreach_function(function, shader) {
286b8e80941Smrg      if (function->impl)
287b8e80941Smrg         lower_drawpixels_impl(&state, function->impl);
288b8e80941Smrg   }
289b8e80941Smrg}
290