brw_clip_line.c revision 01e04c3f
1/*
2 Copyright (C) Intel Corp.  2006.  All Rights Reserved.
3 Intel funded Tungsten Graphics to
4 develop this 3D driver.
5
6 Permission is hereby granted, free of charge, to any person obtaining
7 a copy of this software and associated documentation files (the
8 "Software"), to deal in the Software without restriction, including
9 without limitation the rights to use, copy, modify, merge, publish,
10 distribute, sublicense, and/or sell copies of the Software, and to
11 permit persons to whom the Software is furnished to do so, subject to
12 the following conditions:
13
14 The above copyright notice and this permission notice (including the
15 next paragraph) shall be included in all copies or substantial
16 portions of the Software.
17
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
26 **********************************************************************/
27 /*
28  * Authors:
29  *   Keith Whitwell <keithw@vmware.com>
30  */
31
32#include "main/macros.h"
33#include "main/enums.h"
34#include "program/program.h"
35
36#include "brw_clip.h"
37
38static void brw_clip_line_alloc_regs( struct brw_clip_compile *c )
39{
40   const struct gen_device_info *devinfo = c->func.devinfo;
41   GLuint i = 0,j;
42
43   /* Register usage is static, precompute here:
44    */
45   c->reg.R0 = retype(brw_vec8_grf(i, 0), BRW_REGISTER_TYPE_UD); i++;
46
47   if (c->key.nr_userclip) {
48      c->reg.fixed_planes = brw_vec4_grf(i, 0);
49      i += (6 + c->key.nr_userclip + 1) / 2;
50
51      c->prog_data.curb_read_length = (6 + c->key.nr_userclip + 1) / 2;
52   }
53   else
54      c->prog_data.curb_read_length = 0;
55
56
57   /* Payload vertices plus space for more generated vertices:
58    */
59   for (j = 0; j < 4; j++) {
60      c->reg.vertex[j] = brw_vec4_grf(i, 0);
61      i += c->nr_regs;
62   }
63
64   c->reg.t           = brw_vec1_grf(i, 0);
65   c->reg.t0          = brw_vec1_grf(i, 1);
66   c->reg.t1          = brw_vec1_grf(i, 2);
67   c->reg.planemask   = retype(brw_vec1_grf(i, 3), BRW_REGISTER_TYPE_UD);
68   c->reg.plane_equation = brw_vec4_grf(i, 4);
69   i++;
70
71   c->reg.dp0         = brw_vec1_grf(i, 0); /* fixme - dp4 will clobber r.1,2,3 */
72   c->reg.dp1         = brw_vec1_grf(i, 4);
73   i++;
74
75   if (!c->key.nr_userclip) {
76      c->reg.fixed_planes = brw_vec8_grf(i, 0);
77      i++;
78   }
79
80   c->reg.vertex_src_mask = retype(brw_vec1_grf(i, 0), BRW_REGISTER_TYPE_UD);
81   c->reg.clipdistance_offset = retype(brw_vec1_grf(i, 1), BRW_REGISTER_TYPE_W);
82   i++;
83
84   if (devinfo->gen == 5) {
85      c->reg.ff_sync = retype(brw_vec1_grf(i, 0), BRW_REGISTER_TYPE_UD);
86      i++;
87   }
88
89   c->first_tmp = i;
90   c->last_tmp = i;
91
92   c->prog_data.urb_read_length = c->nr_regs; /* ? */
93   c->prog_data.total_grf = i;
94}
95
96
97/* Line clipping, more or less following the following algorithm:
98 *
99 *  for (p=0;p<MAX_PLANES;p++) {
100 *     if (clipmask & (1 << p)) {
101 *        GLfloat dp0 = DOTPROD( vtx0, plane[p] );
102 *        GLfloat dp1 = DOTPROD( vtx1, plane[p] );
103 *
104 *        if (dp1 < 0.0f) {
105 *           GLfloat t = dp1 / (dp1 - dp0);
106 *           if (t > t1) t1 = t;
107 *        } else {
108 *           GLfloat t = dp0 / (dp0 - dp1);
109 *           if (t > t0) t0 = t;
110 *        }
111 *
112 *        if (t0 + t1 >= 1.0)
113 *           return;
114 *     }
115 *  }
116 *
117 *  interp( ctx, newvtx0, vtx0, vtx1, t0 );
118 *  interp( ctx, newvtx1, vtx1, vtx0, t1 );
119 *
120 */
121static void clip_and_emit_line( struct brw_clip_compile *c )
122{
123   struct brw_codegen *p = &c->func;
124   struct brw_indirect vtx0     = brw_indirect(0, 0);
125   struct brw_indirect vtx1      = brw_indirect(1, 0);
126   struct brw_indirect newvtx0   = brw_indirect(2, 0);
127   struct brw_indirect newvtx1   = brw_indirect(3, 0);
128   struct brw_indirect plane_ptr = brw_indirect(4, 0);
129   struct brw_reg v1_null_ud = retype(vec1(brw_null_reg()), BRW_REGISTER_TYPE_UD);
130   GLuint hpos_offset = brw_varying_to_offset(&c->vue_map, VARYING_SLOT_POS);
131   GLint clipdist0_offset = c->key.nr_userclip
132      ? brw_varying_to_offset(&c->vue_map, VARYING_SLOT_CLIP_DIST0)
133      : 0;
134
135   brw_MOV(p, get_addr_reg(vtx0),      brw_address(c->reg.vertex[0]));
136   brw_MOV(p, get_addr_reg(vtx1),      brw_address(c->reg.vertex[1]));
137   brw_MOV(p, get_addr_reg(newvtx0),   brw_address(c->reg.vertex[2]));
138   brw_MOV(p, get_addr_reg(newvtx1),   brw_address(c->reg.vertex[3]));
139   brw_MOV(p, get_addr_reg(plane_ptr), brw_clip_plane0_address(c));
140
141   /* Note: init t0, t1 together:
142    */
143   brw_MOV(p, vec2(c->reg.t0), brw_imm_f(0));
144
145   brw_clip_init_planes(c);
146   brw_clip_init_clipmask(c);
147
148   /* -ve rhw workaround */
149   if (p->devinfo->has_negative_rhw_bug) {
150      brw_AND(p, brw_null_reg(), get_element_ud(c->reg.R0, 2),
151              brw_imm_ud(1<<20));
152      brw_inst_set_cond_modifier(p->devinfo, brw_last_inst, BRW_CONDITIONAL_NZ);
153      brw_OR(p, c->reg.planemask, c->reg.planemask, brw_imm_ud(0x3f));
154      brw_inst_set_pred_control(p->devinfo, brw_last_inst, BRW_PREDICATE_NORMAL);
155   }
156
157   /* Set the initial vertex source mask: The first 6 planes are the bounds
158    * of the view volume; the next 8 planes are the user clipping planes.
159    */
160   brw_MOV(p, c->reg.vertex_src_mask, brw_imm_ud(0x3fc0));
161
162   /* Set the initial clipdistance offset to be 6 floats before gl_ClipDistance[0].
163    * We'll increment 6 times before we start hitting actual user clipping. */
164   brw_MOV(p, c->reg.clipdistance_offset, brw_imm_d(clipdist0_offset - 6*sizeof(float)));
165
166   brw_DO(p, BRW_EXECUTE_1);
167   {
168      /* if (planemask & 1)
169       */
170      brw_AND(p, v1_null_ud, c->reg.planemask, brw_imm_ud(1));
171      brw_inst_set_cond_modifier(p->devinfo, brw_last_inst, BRW_CONDITIONAL_NZ);
172
173      brw_IF(p, BRW_EXECUTE_1);
174      {
175         brw_AND(p, v1_null_ud, c->reg.vertex_src_mask, brw_imm_ud(1));
176         brw_inst_set_cond_modifier(p->devinfo, brw_last_inst, BRW_CONDITIONAL_NZ);
177         brw_IF(p, BRW_EXECUTE_1);
178         {
179            /* user clip distance: just fetch the correct float from each vertex */
180            struct brw_indirect temp_ptr = brw_indirect(7, 0);
181            brw_ADD(p, get_addr_reg(temp_ptr), get_addr_reg(vtx0), c->reg.clipdistance_offset);
182            brw_MOV(p, c->reg.dp0, deref_1f(temp_ptr, 0));
183            brw_ADD(p, get_addr_reg(temp_ptr), get_addr_reg(vtx1), c->reg.clipdistance_offset);
184            brw_MOV(p, c->reg.dp1, deref_1f(temp_ptr, 0));
185         }
186         brw_ELSE(p);
187         {
188            /* fixed plane: fetch the hpos, dp4 against the plane. */
189            if (c->key.nr_userclip)
190               brw_MOV(p, c->reg.plane_equation, deref_4f(plane_ptr, 0));
191            else
192               brw_MOV(p, c->reg.plane_equation, deref_4b(plane_ptr, 0));
193
194            brw_DP4(p, vec4(c->reg.dp0), deref_4f(vtx0, hpos_offset), c->reg.plane_equation);
195            brw_DP4(p, vec4(c->reg.dp1), deref_4f(vtx1, hpos_offset), c->reg.plane_equation);
196         }
197         brw_ENDIF(p);
198
199         brw_CMP(p, brw_null_reg(), BRW_CONDITIONAL_L, vec1(c->reg.dp1), brw_imm_f(0.0f));
200
201         brw_IF(p, BRW_EXECUTE_1);
202         {
203             /*
204              * Both can be negative on GM965/G965 due to RHW workaround
205              * if so, this object should be rejected.
206              */
207             if (p->devinfo->has_negative_rhw_bug) {
208                 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_LE, c->reg.dp0, brw_imm_f(0.0));
209                 brw_IF(p, BRW_EXECUTE_1);
210                 {
211                     brw_clip_kill_thread(c);
212                 }
213                 brw_ENDIF(p);
214             }
215
216             brw_ADD(p, c->reg.t, c->reg.dp1, negate(c->reg.dp0));
217             brw_math_invert(p, c->reg.t, c->reg.t);
218             brw_MUL(p, c->reg.t, c->reg.t, c->reg.dp1);
219
220             brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_G, c->reg.t, c->reg.t1 );
221             brw_MOV(p, c->reg.t1, c->reg.t);
222             brw_inst_set_pred_control(p->devinfo, brw_last_inst,
223                                       BRW_PREDICATE_NORMAL);
224	 }
225	 brw_ELSE(p);
226	 {
227             /* Coming back in.  We know that both cannot be negative
228              * because the line would have been culled in that case.
229              */
230
231             /* If both are positive, do nothing */
232             /* Only on GM965/G965 */
233             if (p->devinfo->has_negative_rhw_bug) {
234                 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_L, c->reg.dp0, brw_imm_f(0.0));
235                 brw_IF(p, BRW_EXECUTE_1);
236             }
237
238             {
239                 brw_ADD(p, c->reg.t, c->reg.dp0, negate(c->reg.dp1));
240                 brw_math_invert(p, c->reg.t, c->reg.t);
241                 brw_MUL(p, c->reg.t, c->reg.t, c->reg.dp0);
242
243                 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_G, c->reg.t, c->reg.t0 );
244                 brw_MOV(p, c->reg.t0, c->reg.t);
245                 brw_inst_set_pred_control(p->devinfo, brw_last_inst,
246                                           BRW_PREDICATE_NORMAL);
247             }
248
249             if (p->devinfo->has_negative_rhw_bug) {
250                 brw_ENDIF(p);
251             }
252         }
253	 brw_ENDIF(p);
254      }
255      brw_ENDIF(p);
256
257      /* plane_ptr++;
258       */
259      brw_ADD(p, get_addr_reg(plane_ptr), get_addr_reg(plane_ptr), brw_clip_plane_stride(c));
260
261      /* while (planemask>>=1) != 0
262       */
263      brw_SHR(p, c->reg.planemask, c->reg.planemask, brw_imm_ud(1));
264      brw_inst_set_cond_modifier(p->devinfo, brw_last_inst, BRW_CONDITIONAL_NZ);
265      brw_SHR(p, c->reg.vertex_src_mask, c->reg.vertex_src_mask, brw_imm_ud(1));
266      brw_inst_set_pred_control(p->devinfo, brw_last_inst, BRW_PREDICATE_NORMAL);
267      brw_ADD(p, c->reg.clipdistance_offset, c->reg.clipdistance_offset, brw_imm_w(sizeof(float)));
268      brw_inst_set_pred_control(p->devinfo, brw_last_inst, BRW_PREDICATE_NORMAL);
269   }
270   brw_WHILE(p);
271   brw_inst_set_pred_control(p->devinfo, brw_last_inst, BRW_PREDICATE_NORMAL);
272
273   brw_ADD(p, c->reg.t, c->reg.t0, c->reg.t1);
274   brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_L, c->reg.t, brw_imm_f(1.0));
275   brw_IF(p, BRW_EXECUTE_1);
276   {
277      brw_clip_interp_vertex(c, newvtx0, vtx0, vtx1, c->reg.t0, false);
278      brw_clip_interp_vertex(c, newvtx1, vtx1, vtx0, c->reg.t1, false);
279
280      brw_clip_emit_vue(c, newvtx0, BRW_URB_WRITE_ALLOCATE_COMPLETE,
281                        (_3DPRIM_LINESTRIP << URB_WRITE_PRIM_TYPE_SHIFT)
282                        | URB_WRITE_PRIM_START);
283      brw_clip_emit_vue(c, newvtx1, BRW_URB_WRITE_EOT_COMPLETE,
284                        (_3DPRIM_LINESTRIP << URB_WRITE_PRIM_TYPE_SHIFT)
285                        | URB_WRITE_PRIM_END);
286   }
287   brw_ENDIF(p);
288   brw_clip_kill_thread(c);
289}
290
291
292
293void brw_emit_line_clip( struct brw_clip_compile *c )
294{
295   brw_clip_line_alloc_regs(c);
296   brw_clip_init_ff_sync(c);
297
298   if (c->key.contains_flat_varying) {
299      if (c->key.pv_first)
300         brw_clip_copy_flatshaded_attributes(c, 1, 0);
301      else
302         brw_clip_copy_flatshaded_attributes(c, 0, 1);
303   }
304
305   clip_and_emit_line(c);
306}
307