1b8e80941Smrg/* 2b8e80941Smrg * Copyright © 2015 Red Hat 3b8e80941Smrg * 4b8e80941Smrg * Permission is hereby granted, free of charge, to any person obtaining a 5b8e80941Smrg * copy of this software and associated documentation files (the "Software"), 6b8e80941Smrg * to deal in the Software without restriction, including without limitation 7b8e80941Smrg * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8b8e80941Smrg * and/or sell copies of the Software, and to permit persons to whom the 9b8e80941Smrg * Software is furnished to do so, subject to the following conditions: 10b8e80941Smrg * 11b8e80941Smrg * The above copyright notice and this permission notice (including the next 12b8e80941Smrg * paragraph) shall be included in all copies or substantial portions of the 13b8e80941Smrg * Software. 14b8e80941Smrg * 15b8e80941Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16b8e80941Smrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17b8e80941Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18b8e80941Smrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19b8e80941Smrg * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20b8e80941Smrg * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21b8e80941Smrg * SOFTWARE. 22b8e80941Smrg */ 23b8e80941Smrg 24b8e80941Smrg#include "nir.h" 25b8e80941Smrg#include "nir_builder.h" 26b8e80941Smrg 27b8e80941Smrg/* Lower glDrawPixels(). 28b8e80941Smrg * 29b8e80941Smrg * This is based on the logic in st_get_drawpix_shader() in TGSI compiler. 30b8e80941Smrg * 31b8e80941Smrg * Run before nir_lower_io. 32b8e80941Smrg */ 33b8e80941Smrg 34b8e80941Smrgtypedef struct { 35b8e80941Smrg const nir_lower_drawpixels_options *options; 36b8e80941Smrg nir_shader *shader; 37b8e80941Smrg nir_builder b; 38b8e80941Smrg nir_variable *texcoord, *scale, *bias, *tex, *pixelmap; 39b8e80941Smrg} lower_drawpixels_state; 40b8e80941Smrg 41b8e80941Smrgstatic nir_ssa_def * 42b8e80941Smrgget_texcoord(lower_drawpixels_state *state) 43b8e80941Smrg{ 44b8e80941Smrg if (state->texcoord == NULL) { 45b8e80941Smrg nir_variable *texcoord = NULL; 46b8e80941Smrg 47b8e80941Smrg /* find gl_TexCoord, if it exists: */ 48b8e80941Smrg nir_foreach_variable(var, &state->shader->inputs) { 49b8e80941Smrg if (var->data.location == VARYING_SLOT_TEX0) { 50b8e80941Smrg texcoord = var; 51b8e80941Smrg break; 52b8e80941Smrg } 53b8e80941Smrg } 54b8e80941Smrg 55b8e80941Smrg /* otherwise create it: */ 56b8e80941Smrg if (texcoord == NULL) { 57b8e80941Smrg texcoord = nir_variable_create(state->shader, 58b8e80941Smrg nir_var_shader_in, 59b8e80941Smrg glsl_vec4_type(), 60b8e80941Smrg "gl_TexCoord"); 61b8e80941Smrg texcoord->data.location = VARYING_SLOT_TEX0; 62b8e80941Smrg } 63b8e80941Smrg 64b8e80941Smrg state->texcoord = texcoord; 65b8e80941Smrg } 66b8e80941Smrg return nir_load_var(&state->b, state->texcoord); 67b8e80941Smrg} 68b8e80941Smrg 69b8e80941Smrgstatic nir_variable * 70b8e80941Smrgcreate_uniform(nir_shader *shader, const char *name, 71b8e80941Smrg const gl_state_index16 state_tokens[STATE_LENGTH]) 72b8e80941Smrg{ 73b8e80941Smrg nir_variable *var = nir_variable_create(shader, 74b8e80941Smrg nir_var_uniform, 75b8e80941Smrg glsl_vec4_type(), 76b8e80941Smrg name); 77b8e80941Smrg var->num_state_slots = 1; 78b8e80941Smrg var->state_slots = ralloc_array(var, nir_state_slot, 1); 79b8e80941Smrg memcpy(var->state_slots[0].tokens, state_tokens, 80b8e80941Smrg sizeof(var->state_slots[0].tokens)); 81b8e80941Smrg return var; 82b8e80941Smrg} 83b8e80941Smrg 84b8e80941Smrgstatic nir_ssa_def * 85b8e80941Smrgget_scale(lower_drawpixels_state *state) 86b8e80941Smrg{ 87b8e80941Smrg if (state->scale == NULL) { 88b8e80941Smrg state->scale = create_uniform(state->shader, "gl_PTscale", 89b8e80941Smrg state->options->scale_state_tokens); 90b8e80941Smrg } 91b8e80941Smrg return nir_load_var(&state->b, state->scale); 92b8e80941Smrg} 93b8e80941Smrg 94b8e80941Smrgstatic nir_ssa_def * 95b8e80941Smrgget_bias(lower_drawpixels_state *state) 96b8e80941Smrg{ 97b8e80941Smrg if (state->bias == NULL) { 98b8e80941Smrg state->bias = create_uniform(state->shader, "gl_PTbias", 99b8e80941Smrg state->options->bias_state_tokens); 100b8e80941Smrg } 101b8e80941Smrg return nir_load_var(&state->b, state->bias); 102b8e80941Smrg} 103b8e80941Smrg 104b8e80941Smrgstatic nir_ssa_def * 105b8e80941Smrgget_texcoord_const(lower_drawpixels_state *state) 106b8e80941Smrg{ 107b8e80941Smrg if (state->bias == NULL) { 108b8e80941Smrg state->bias = create_uniform(state->shader, "gl_MultiTexCoord0", 109b8e80941Smrg state->options->texcoord_state_tokens); 110b8e80941Smrg } 111b8e80941Smrg return nir_load_var(&state->b, state->bias); 112b8e80941Smrg} 113b8e80941Smrg 114b8e80941Smrgstatic void 115b8e80941Smrglower_color(lower_drawpixels_state *state, nir_intrinsic_instr *intr) 116b8e80941Smrg{ 117b8e80941Smrg nir_builder *b = &state->b; 118b8e80941Smrg nir_ssa_def *texcoord; 119b8e80941Smrg nir_tex_instr *tex; 120b8e80941Smrg nir_ssa_def *def; 121b8e80941Smrg 122b8e80941Smrg assert(intr->dest.is_ssa); 123b8e80941Smrg 124b8e80941Smrg b->cursor = nir_before_instr(&intr->instr); 125b8e80941Smrg 126b8e80941Smrg texcoord = get_texcoord(state); 127b8e80941Smrg 128b8e80941Smrg const struct glsl_type *sampler2D = 129b8e80941Smrg glsl_sampler_type(GLSL_SAMPLER_DIM_2D, false, false, GLSL_TYPE_FLOAT); 130b8e80941Smrg 131b8e80941Smrg if (!state->tex) { 132b8e80941Smrg state->tex = 133b8e80941Smrg nir_variable_create(b->shader, nir_var_uniform, sampler2D, "drawpix"); 134b8e80941Smrg state->tex->data.binding = state->options->drawpix_sampler; 135b8e80941Smrg state->tex->data.explicit_binding = true; 136b8e80941Smrg state->tex->data.how_declared = nir_var_hidden; 137b8e80941Smrg } 138b8e80941Smrg 139b8e80941Smrg nir_deref_instr *tex_deref = nir_build_deref_var(b, state->tex); 140b8e80941Smrg 141b8e80941Smrg /* replace load_var(gl_Color) w/ texture sample: 142b8e80941Smrg * TEX def, texcoord, drawpix_sampler, 2D 143b8e80941Smrg */ 144b8e80941Smrg tex = nir_tex_instr_create(state->shader, 3); 145b8e80941Smrg tex->op = nir_texop_tex; 146b8e80941Smrg tex->sampler_dim = GLSL_SAMPLER_DIM_2D; 147b8e80941Smrg tex->coord_components = 2; 148b8e80941Smrg tex->dest_type = nir_type_float; 149b8e80941Smrg tex->src[0].src_type = nir_tex_src_texture_deref; 150b8e80941Smrg tex->src[0].src = nir_src_for_ssa(&tex_deref->dest.ssa); 151b8e80941Smrg tex->src[1].src_type = nir_tex_src_sampler_deref; 152b8e80941Smrg tex->src[1].src = nir_src_for_ssa(&tex_deref->dest.ssa); 153b8e80941Smrg tex->src[2].src_type = nir_tex_src_coord; 154b8e80941Smrg tex->src[2].src = 155b8e80941Smrg nir_src_for_ssa(nir_channels(b, texcoord, 156b8e80941Smrg (1 << tex->coord_components) - 1)); 157b8e80941Smrg 158b8e80941Smrg nir_ssa_dest_init(&tex->instr, &tex->dest, 4, 32, NULL); 159b8e80941Smrg nir_builder_instr_insert(b, &tex->instr); 160b8e80941Smrg def = &tex->dest.ssa; 161b8e80941Smrg 162b8e80941Smrg /* Apply the scale and bias. */ 163b8e80941Smrg if (state->options->scale_and_bias) { 164b8e80941Smrg /* MAD def, def, scale, bias; */ 165b8e80941Smrg def = nir_ffma(b, def, get_scale(state), get_bias(state)); 166b8e80941Smrg } 167b8e80941Smrg 168b8e80941Smrg if (state->options->pixel_maps) { 169b8e80941Smrg if (!state->pixelmap) { 170b8e80941Smrg state->pixelmap = nir_variable_create(b->shader, nir_var_uniform, 171b8e80941Smrg sampler2D, "pixelmap"); 172b8e80941Smrg state->pixelmap->data.binding = state->options->pixelmap_sampler; 173b8e80941Smrg state->pixelmap->data.explicit_binding = true; 174b8e80941Smrg state->pixelmap->data.how_declared = nir_var_hidden; 175b8e80941Smrg } 176b8e80941Smrg 177b8e80941Smrg nir_deref_instr *pixelmap_deref = 178b8e80941Smrg nir_build_deref_var(b, state->pixelmap); 179b8e80941Smrg 180b8e80941Smrg /* do four pixel map look-ups with two TEX instructions: */ 181b8e80941Smrg nir_ssa_def *def_xy, *def_zw; 182b8e80941Smrg 183b8e80941Smrg /* TEX def.xy, def.xyyy, pixelmap_sampler, 2D; */ 184b8e80941Smrg tex = nir_tex_instr_create(state->shader, 3); 185b8e80941Smrg tex->op = nir_texop_tex; 186b8e80941Smrg tex->sampler_dim = GLSL_SAMPLER_DIM_2D; 187b8e80941Smrg tex->coord_components = 2; 188b8e80941Smrg tex->sampler_index = state->options->pixelmap_sampler; 189b8e80941Smrg tex->texture_index = state->options->pixelmap_sampler; 190b8e80941Smrg tex->dest_type = nir_type_float; 191b8e80941Smrg tex->src[0].src_type = nir_tex_src_texture_deref; 192b8e80941Smrg tex->src[0].src = nir_src_for_ssa(&pixelmap_deref->dest.ssa); 193b8e80941Smrg tex->src[1].src_type = nir_tex_src_sampler_deref; 194b8e80941Smrg tex->src[1].src = nir_src_for_ssa(&pixelmap_deref->dest.ssa); 195b8e80941Smrg tex->src[2].src_type = nir_tex_src_coord; 196b8e80941Smrg tex->src[2].src = nir_src_for_ssa(nir_channels(b, def, 0x3)); 197b8e80941Smrg 198b8e80941Smrg nir_ssa_dest_init(&tex->instr, &tex->dest, 4, 32, NULL); 199b8e80941Smrg nir_builder_instr_insert(b, &tex->instr); 200b8e80941Smrg def_xy = &tex->dest.ssa; 201b8e80941Smrg 202b8e80941Smrg /* TEX def.zw, def.zwww, pixelmap_sampler, 2D; */ 203b8e80941Smrg tex = nir_tex_instr_create(state->shader, 1); 204b8e80941Smrg tex->op = nir_texop_tex; 205b8e80941Smrg tex->sampler_dim = GLSL_SAMPLER_DIM_2D; 206b8e80941Smrg tex->coord_components = 2; 207b8e80941Smrg tex->sampler_index = state->options->pixelmap_sampler; 208b8e80941Smrg tex->dest_type = nir_type_float; 209b8e80941Smrg tex->src[0].src_type = nir_tex_src_coord; 210b8e80941Smrg tex->src[0].src = nir_src_for_ssa(nir_channels(b, def, 0xc)); 211b8e80941Smrg 212b8e80941Smrg nir_ssa_dest_init(&tex->instr, &tex->dest, 4, 32, NULL); 213b8e80941Smrg nir_builder_instr_insert(b, &tex->instr); 214b8e80941Smrg def_zw = &tex->dest.ssa; 215b8e80941Smrg 216b8e80941Smrg /* def = vec4(def.xy, def.zw); */ 217b8e80941Smrg def = nir_vec4(b, 218b8e80941Smrg nir_channel(b, def_xy, 0), 219b8e80941Smrg nir_channel(b, def_xy, 1), 220b8e80941Smrg nir_channel(b, def_zw, 0), 221b8e80941Smrg nir_channel(b, def_zw, 1)); 222b8e80941Smrg } 223b8e80941Smrg 224b8e80941Smrg nir_ssa_def_rewrite_uses(&intr->dest.ssa, nir_src_for_ssa(def)); 225b8e80941Smrg} 226b8e80941Smrg 227b8e80941Smrgstatic void 228b8e80941Smrglower_texcoord(lower_drawpixels_state *state, nir_intrinsic_instr *intr) 229b8e80941Smrg{ 230b8e80941Smrg state->b.cursor = nir_before_instr(&intr->instr); 231b8e80941Smrg 232b8e80941Smrg nir_ssa_def *texcoord_const = get_texcoord_const(state); 233b8e80941Smrg nir_ssa_def_rewrite_uses(&intr->dest.ssa, nir_src_for_ssa(texcoord_const)); 234b8e80941Smrg} 235b8e80941Smrg 236b8e80941Smrgstatic bool 237b8e80941Smrglower_drawpixels_block(lower_drawpixels_state *state, nir_block *block) 238b8e80941Smrg{ 239b8e80941Smrg nir_foreach_instr_safe(instr, block) { 240b8e80941Smrg if (instr->type == nir_instr_type_intrinsic) { 241b8e80941Smrg nir_intrinsic_instr *intr = nir_instr_as_intrinsic(instr); 242b8e80941Smrg if (intr->intrinsic == nir_intrinsic_load_deref) { 243b8e80941Smrg nir_deref_instr *deref = nir_src_as_deref(intr->src[0]); 244b8e80941Smrg nir_variable *var = nir_deref_instr_get_variable(deref); 245b8e80941Smrg 246b8e80941Smrg if (var->data.location == VARYING_SLOT_COL0) { 247b8e80941Smrg /* gl_Color should not have array/struct derefs: */ 248b8e80941Smrg assert(deref->deref_type == nir_deref_type_var); 249b8e80941Smrg lower_color(state, intr); 250b8e80941Smrg } else if (var->data.location == VARYING_SLOT_TEX0) { 251b8e80941Smrg /* gl_TexCoord should not have array/struct derefs: */ 252b8e80941Smrg assert(deref->deref_type == nir_deref_type_var); 253b8e80941Smrg lower_texcoord(state, intr); 254b8e80941Smrg } 255b8e80941Smrg } 256b8e80941Smrg } 257b8e80941Smrg } 258b8e80941Smrg 259b8e80941Smrg return true; 260b8e80941Smrg} 261b8e80941Smrg 262b8e80941Smrgstatic void 263b8e80941Smrglower_drawpixels_impl(lower_drawpixels_state *state, nir_function_impl *impl) 264b8e80941Smrg{ 265b8e80941Smrg nir_builder_init(&state->b, impl); 266b8e80941Smrg 267b8e80941Smrg nir_foreach_block(block, impl) { 268b8e80941Smrg lower_drawpixels_block(state, block); 269b8e80941Smrg } 270b8e80941Smrg nir_metadata_preserve(impl, nir_metadata_block_index | 271b8e80941Smrg nir_metadata_dominance); 272b8e80941Smrg} 273b8e80941Smrg 274b8e80941Smrgvoid 275b8e80941Smrgnir_lower_drawpixels(nir_shader *shader, 276b8e80941Smrg const nir_lower_drawpixels_options *options) 277b8e80941Smrg{ 278b8e80941Smrg lower_drawpixels_state state = { 279b8e80941Smrg .options = options, 280b8e80941Smrg .shader = shader, 281b8e80941Smrg }; 282b8e80941Smrg 283b8e80941Smrg assert(shader->info.stage == MESA_SHADER_FRAGMENT); 284b8e80941Smrg 285b8e80941Smrg nir_foreach_function(function, shader) { 286b8e80941Smrg if (function->impl) 287b8e80941Smrg lower_drawpixels_impl(&state, function->impl); 288b8e80941Smrg } 289b8e80941Smrg} 290