1/**************************************************************************
2 *
3 * Copyright 2008 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28/**
29 * AA point stage:  AA points are converted to quads and rendered with a
30 * special fragment shader.  Another approach would be to use a texture
31 * map image of a point, but experiments indicate the quality isn't nearly
32 * as good as this approach.
33 *
34 * Note: this looks a lot like draw_aaline.c but there's actually little
35 * if any code that can be shared.
36 *
37 * Authors:  Brian Paul
38 */
39
40
41#include "pipe/p_context.h"
42#include "pipe/p_defines.h"
43#include "pipe/p_shader_tokens.h"
44
45#include "tgsi/tgsi_transform.h"
46#include "tgsi/tgsi_dump.h"
47
48#include "util/u_math.h"
49#include "util/u_memory.h"
50
51#include "draw_context.h"
52#include "draw_vs.h"
53#include "draw_pipe.h"
54
55
56/** Approx number of new tokens for instructions in aa_transform_inst() */
57#define NUM_NEW_TOKENS 200
58
59
60/*
61 * Enabling NORMALIZE might give _slightly_ better results.
62 * Basically, it controls whether we compute distance as d=sqrt(x*x+y*y) or
63 * d=x*x+y*y.  Since we're working with a unit circle, the later seems
64 * close enough and saves some costly instructions.
65 */
66#define NORMALIZE 0
67
68
69/**
70 * Subclass of pipe_shader_state to carry extra fragment shader info.
71 */
72struct aapoint_fragment_shader
73{
74   struct pipe_shader_state state;
75   void *driver_fs;   /**< the regular shader */
76   void *aapoint_fs;  /**< the aa point-augmented shader */
77   int generic_attrib; /**< The generic input attrib/texcoord we'll use */
78};
79
80
81/**
82 * Subclass of draw_stage
83 */
84struct aapoint_stage
85{
86   struct draw_stage stage;
87
88   /** half of pipe_rasterizer_state::point_size */
89   float radius;
90
91   /** vertex attrib slot containing point size */
92   int psize_slot;
93
94   /** this is the vertex attrib slot for the new texcoords */
95   uint tex_slot;
96
97   /** vertex attrib slot containing position */
98   uint pos_slot;
99
100   /** Currently bound fragment shader */
101   struct aapoint_fragment_shader *fs;
102
103   /*
104    * Driver interface/override functions
105    */
106   void * (*driver_create_fs_state)(struct pipe_context *,
107                                    const struct pipe_shader_state *);
108   void (*driver_bind_fs_state)(struct pipe_context *, void *);
109   void (*driver_delete_fs_state)(struct pipe_context *, void *);
110};
111
112
113
114/**
115 * Subclass of tgsi_transform_context, used for transforming the
116 * user's fragment shader to add the special AA instructions.
117 */
118struct aa_transform_context {
119   struct tgsi_transform_context base;
120   uint tempsUsed;  /**< bitmask */
121   int colorOutput; /**< which output is the primary color */
122   int maxInput, maxGeneric;  /**< max input index found */
123   int tmp0, colorTemp;  /**< temp registers */
124};
125
126
127/**
128 * TGSI declaration transform callback.
129 * Look for two free temp regs and available input reg for new texcoords.
130 */
131static void
132aa_transform_decl(struct tgsi_transform_context *ctx,
133                  struct tgsi_full_declaration *decl)
134{
135   struct aa_transform_context *aactx = (struct aa_transform_context *) ctx;
136
137   if (decl->Declaration.File == TGSI_FILE_OUTPUT &&
138       decl->Semantic.Name == TGSI_SEMANTIC_COLOR &&
139       decl->Semantic.Index == 0) {
140      aactx->colorOutput = decl->Range.First;
141   }
142   else if (decl->Declaration.File == TGSI_FILE_INPUT) {
143      if ((int) decl->Range.Last > aactx->maxInput)
144         aactx->maxInput = decl->Range.Last;
145      if (decl->Semantic.Name == TGSI_SEMANTIC_GENERIC &&
146           (int) decl->Semantic.Index > aactx->maxGeneric) {
147         aactx->maxGeneric = decl->Semantic.Index;
148      }
149   }
150   else if (decl->Declaration.File == TGSI_FILE_TEMPORARY) {
151      uint i;
152      for (i = decl->Range.First;
153           i <= decl->Range.Last; i++) {
154         aactx->tempsUsed |= (1 << i);
155      }
156   }
157
158   ctx->emit_declaration(ctx, decl);
159}
160
161
162/**
163 * TGSI transform callback.
164 * Insert new declarations and instructions before first instruction.
165 */
166static void
167aa_transform_prolog(struct tgsi_transform_context *ctx)
168{
169   /* emit our new declarations before the first instruction */
170   struct aa_transform_context *aactx = (struct aa_transform_context *) ctx;
171   struct tgsi_full_instruction newInst;
172   const int texInput = aactx->maxInput + 1;
173   int tmp0;
174   uint i;
175
176   /* find two free temp regs */
177   for (i = 0; i < 32; i++) {
178      if ((aactx->tempsUsed & (1u << i)) == 0) {
179         /* found a free temp */
180         if (aactx->tmp0 < 0)
181            aactx->tmp0 = i;
182         else if (aactx->colorTemp < 0)
183            aactx->colorTemp = i;
184         else
185            break;
186      }
187   }
188
189   assert(aactx->colorTemp != aactx->tmp0);
190
191   tmp0 = aactx->tmp0;
192
193   /* declare new generic input/texcoord */
194   tgsi_transform_input_decl(ctx, texInput,
195                             TGSI_SEMANTIC_GENERIC, aactx->maxGeneric + 1,
196                             TGSI_INTERPOLATE_LINEAR);
197
198   /* declare new temp regs */
199   tgsi_transform_temp_decl(ctx, tmp0);
200   tgsi_transform_temp_decl(ctx, aactx->colorTemp);
201
202   /*
203    * Emit code to compute fragment coverage, kill if outside point radius
204    *
205    * Temp reg0 usage:
206    *  t0.x = distance of fragment from center point
207    *  t0.y = boolean, is t0.x > 1.0, also misc temp usage
208    *  t0.z = temporary for computing 1/(1-k) value
209    *  t0.w = final coverage value
210    */
211
212   /* MUL t0.xy, tex, tex;  # compute x^2, y^2 */
213   tgsi_transform_op2_inst(ctx, TGSI_OPCODE_MUL,
214                           TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_XY,
215                           TGSI_FILE_INPUT, texInput,
216                           TGSI_FILE_INPUT, texInput, false);
217
218   /* ADD t0.x, t0.x, t0.y;  # x^2 + y^2 */
219   tgsi_transform_op2_swz_inst(ctx, TGSI_OPCODE_ADD,
220                               TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_X,
221                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_X,
222                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_Y, false);
223
224#if NORMALIZE  /* OPTIONAL normalization of length */
225   /* RSQ t0.x, t0.x; */
226   tgsi_transform_op1_inst(ctx, TGSI_OPCODE_RSQ,
227                           TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_X,
228                           TGSI_FILE_TEMPORARY, tmp0);
229
230   /* RCP t0.x, t0.x; */
231   tgsi_transform_op1_inst(ctx, TGSI_OPCODE_RCP,
232                           TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_X,
233                           TGSI_FILE_TEMPORARY, tmp0);
234#endif
235
236   /* SGT t0.y, t0.xxxx, tex.wwww;  # bool b = d > 1 (NOTE tex.w == 1) */
237   tgsi_transform_op2_swz_inst(ctx, TGSI_OPCODE_SGT,
238                               TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_Y,
239                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_X,
240                               TGSI_FILE_INPUT, texInput, TGSI_SWIZZLE_W, false);
241
242   /* KILL_IF -tmp0.yyyy;   # if -tmp0.y < 0, KILL */
243   tgsi_transform_kill_inst(ctx, TGSI_FILE_TEMPORARY, tmp0,
244                            TGSI_SWIZZLE_Y, TRUE);
245
246   /* compute coverage factor = (1-d)/(1-k) */
247
248   /* SUB t0.z, tex.w, tex.z;  # m = 1 - k */
249   tgsi_transform_op2_swz_inst(ctx, TGSI_OPCODE_ADD,
250                               TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_Z,
251                               TGSI_FILE_INPUT, texInput, TGSI_SWIZZLE_W,
252                               TGSI_FILE_INPUT, texInput, TGSI_SWIZZLE_Z, true);
253
254   /* RCP t0.z, t0.z;  # t0.z = 1 / m */
255   newInst = tgsi_default_full_instruction();
256   newInst.Instruction.Opcode = TGSI_OPCODE_RCP;
257   newInst.Instruction.NumDstRegs = 1;
258   newInst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
259   newInst.Dst[0].Register.Index = tmp0;
260   newInst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_Z;
261   newInst.Instruction.NumSrcRegs = 1;
262   newInst.Src[0].Register.File = TGSI_FILE_TEMPORARY;
263   newInst.Src[0].Register.Index = tmp0;
264   newInst.Src[0].Register.SwizzleX = TGSI_SWIZZLE_Z;
265   ctx->emit_instruction(ctx, &newInst);
266
267   /* SUB t0.y, 1, t0.x;  # d = 1 - d */
268   tgsi_transform_op2_swz_inst(ctx, TGSI_OPCODE_ADD,
269                               TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_Y,
270                               TGSI_FILE_INPUT, texInput, TGSI_SWIZZLE_W,
271                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_X, true);
272
273   /* MUL t0.w, t0.y, t0.z;   # coverage = d * m */
274   tgsi_transform_op2_swz_inst(ctx, TGSI_OPCODE_MUL,
275                               TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_W,
276                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_Y,
277                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_Z, false);
278
279   /* SLE t0.y, t0.x, tex.z;  # bool b = distance <= k */
280   tgsi_transform_op2_swz_inst(ctx, TGSI_OPCODE_SLE,
281                               TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_Y,
282                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_X,
283                               TGSI_FILE_INPUT, texInput, TGSI_SWIZZLE_Z, false);
284
285   /* CMP t0.w, -t0.y, tex.w, t0.w;
286    *  # if -t0.y < 0 then
287    *       t0.w = 1
288    *    else
289    *       t0.w = t0.w
290    */
291   tgsi_transform_op3_swz_inst(ctx, TGSI_OPCODE_CMP,
292                               TGSI_FILE_TEMPORARY, tmp0, TGSI_WRITEMASK_W,
293                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_Y, 1,
294                               TGSI_FILE_INPUT, texInput, TGSI_SWIZZLE_W,
295                               TGSI_FILE_TEMPORARY, tmp0, TGSI_SWIZZLE_W);
296}
297
298
299/**
300 * TGSI transform callback.
301 * Insert new instructions before the END instruction.
302 */
303static void
304aa_transform_epilog(struct tgsi_transform_context *ctx)
305{
306   struct aa_transform_context *aactx = (struct aa_transform_context *) ctx;
307
308   /* add alpha modulation code at tail of program */
309
310   /* MOV result.color.xyz, colorTemp; */
311   tgsi_transform_op1_inst(ctx, TGSI_OPCODE_MOV,
312                           TGSI_FILE_OUTPUT, aactx->colorOutput,
313                           TGSI_WRITEMASK_XYZ,
314                           TGSI_FILE_TEMPORARY, aactx->colorTemp);
315
316   /* MUL result.color.w, colorTemp, tmp0.w; */
317   tgsi_transform_op2_inst(ctx, TGSI_OPCODE_MUL,
318                           TGSI_FILE_OUTPUT, aactx->colorOutput,
319                           TGSI_WRITEMASK_W,
320                           TGSI_FILE_TEMPORARY, aactx->colorTemp,
321                           TGSI_FILE_TEMPORARY, aactx->tmp0, false);
322}
323
324
325/**
326 * TGSI transform callback.
327 * Called per instruction.
328 * Replace writes to result.color w/ a temp reg.
329 */
330static void
331aa_transform_inst(struct tgsi_transform_context *ctx,
332                  struct tgsi_full_instruction *inst)
333{
334   struct aa_transform_context *aactx = (struct aa_transform_context *) ctx;
335   unsigned i;
336
337   /* Not an END instruction.
338    * Look for writes to result.color and replace with colorTemp reg.
339    */
340   for (i = 0; i < inst->Instruction.NumDstRegs; i++) {
341      struct tgsi_full_dst_register *dst = &inst->Dst[i];
342      if (dst->Register.File == TGSI_FILE_OUTPUT &&
343          dst->Register.Index == aactx->colorOutput) {
344         dst->Register.File = TGSI_FILE_TEMPORARY;
345         dst->Register.Index = aactx->colorTemp;
346      }
347   }
348
349   ctx->emit_instruction(ctx, inst);
350}
351
352
353/**
354 * Generate the frag shader we'll use for drawing AA points.
355 * This will be the user's shader plus some texture/modulate instructions.
356 */
357static boolean
358generate_aapoint_fs(struct aapoint_stage *aapoint)
359{
360   const struct pipe_shader_state *orig_fs = &aapoint->fs->state;
361   struct pipe_shader_state aapoint_fs;
362   struct aa_transform_context transform;
363   const uint newLen = tgsi_num_tokens(orig_fs->tokens) + NUM_NEW_TOKENS;
364   struct pipe_context *pipe = aapoint->stage.draw->pipe;
365
366   aapoint_fs = *orig_fs; /* copy to init */
367   aapoint_fs.tokens = tgsi_alloc_tokens(newLen);
368   if (aapoint_fs.tokens == NULL)
369      return FALSE;
370
371   memset(&transform, 0, sizeof(transform));
372   transform.colorOutput = -1;
373   transform.maxInput = -1;
374   transform.maxGeneric = -1;
375   transform.colorTemp = -1;
376   transform.tmp0 = -1;
377   transform.base.prolog = aa_transform_prolog;
378   transform.base.epilog = aa_transform_epilog;
379   transform.base.transform_instruction = aa_transform_inst;
380   transform.base.transform_declaration = aa_transform_decl;
381
382   tgsi_transform_shader(orig_fs->tokens,
383                         (struct tgsi_token *) aapoint_fs.tokens,
384                         newLen, &transform.base);
385
386#if 0 /* DEBUG */
387   debug_printf("draw_aapoint, orig shader:\n");
388   tgsi_dump(orig_fs->tokens, 0);
389   debug_printf("draw_aapoint, new shader:\n");
390   tgsi_dump(aapoint_fs.tokens, 0);
391#endif
392
393   aapoint->fs->aapoint_fs
394      = aapoint->driver_create_fs_state(pipe, &aapoint_fs);
395   if (aapoint->fs->aapoint_fs == NULL)
396      goto fail;
397
398   aapoint->fs->generic_attrib = transform.maxGeneric + 1;
399   FREE((void *)aapoint_fs.tokens);
400   return TRUE;
401
402fail:
403   FREE((void *)aapoint_fs.tokens);
404   return FALSE;
405}
406
407
408/**
409 * When we're about to draw our first AA point in a batch, this function is
410 * called to tell the driver to bind our modified fragment shader.
411 */
412static boolean
413bind_aapoint_fragment_shader(struct aapoint_stage *aapoint)
414{
415   struct draw_context *draw = aapoint->stage.draw;
416   struct pipe_context *pipe = draw->pipe;
417
418   if (!aapoint->fs->aapoint_fs &&
419       !generate_aapoint_fs(aapoint))
420      return FALSE;
421
422   draw->suspend_flushing = TRUE;
423   aapoint->driver_bind_fs_state(pipe, aapoint->fs->aapoint_fs);
424   draw->suspend_flushing = FALSE;
425
426   return TRUE;
427}
428
429
430
431static inline struct aapoint_stage *
432aapoint_stage( struct draw_stage *stage )
433{
434   return (struct aapoint_stage *) stage;
435}
436
437
438
439
440/**
441 * Draw an AA point by drawing a quad.
442 */
443static void
444aapoint_point(struct draw_stage *stage, struct prim_header *header)
445{
446   const struct aapoint_stage *aapoint = aapoint_stage(stage);
447   struct prim_header tri;
448   struct vertex_header *v[4];
449   const uint tex_slot = aapoint->tex_slot;
450   const uint pos_slot = aapoint->pos_slot;
451   float radius, *pos, *tex;
452   uint i;
453   float k;
454
455   if (aapoint->psize_slot >= 0) {
456      radius = 0.5f * header->v[0]->data[aapoint->psize_slot][0];
457   }
458   else {
459      radius = aapoint->radius;
460   }
461
462   /*
463    * Note: the texcoords (generic attrib, really) we use are special:
464    * The S and T components simply vary from -1 to +1.
465    * The R component is k, below.
466    * The Q component is 1.0 and will used as a handy constant in the
467    * fragment shader.
468    */
469
470   /*
471    * k is the threshold distance from the point's center at which
472    * we begin alpha attenuation (the coverage value).
473    * Operating within a unit circle, we'll compute the fragment's
474    * distance 'd' from the center point using the texcoords.
475    * IF d > 1.0 THEN
476    *    KILL fragment
477    * ELSE IF d > k THEN
478    *    compute coverage in [0,1] proportional to d in [k, 1].
479    * ELSE
480    *    coverage = 1.0;  // full coverage
481    * ENDIF
482    *
483    * Note: the ELSEIF and ELSE clauses are actually implemented with CMP to
484    * avoid using IF/ELSE/ENDIF TGSI opcodes.
485    */
486
487#if !NORMALIZE
488   k = 1.0f / radius;
489   k = 1.0f - 2.0f * k + k * k;
490#else
491   k = 1.0f - 1.0f / radius;
492#endif
493
494   /* allocate/dup new verts */
495   for (i = 0; i < 4; i++) {
496      v[i] = dup_vert(stage, header->v[0], i);
497   }
498
499   /* new verts */
500   pos = v[0]->data[pos_slot];
501   pos[0] -= radius;
502   pos[1] -= radius;
503
504   pos = v[1]->data[pos_slot];
505   pos[0] += radius;
506   pos[1] -= radius;
507
508   pos = v[2]->data[pos_slot];
509   pos[0] += radius;
510   pos[1] += radius;
511
512   pos = v[3]->data[pos_slot];
513   pos[0] -= radius;
514   pos[1] += radius;
515
516   /* new texcoords */
517   tex = v[0]->data[tex_slot];
518   ASSIGN_4V(tex, -1, -1, k, 1);
519
520   tex = v[1]->data[tex_slot];
521   ASSIGN_4V(tex,  1, -1, k, 1);
522
523   tex = v[2]->data[tex_slot];
524   ASSIGN_4V(tex,  1,  1, k, 1);
525
526   tex = v[3]->data[tex_slot];
527   ASSIGN_4V(tex, -1,  1, k, 1);
528
529   /* emit 2 tris for the quad strip */
530   tri.v[0] = v[0];
531   tri.v[1] = v[1];
532   tri.v[2] = v[2];
533   stage->next->tri( stage->next, &tri );
534
535   tri.v[0] = v[0];
536   tri.v[1] = v[2];
537   tri.v[2] = v[3];
538   stage->next->tri( stage->next, &tri );
539}
540
541
542static void
543aapoint_first_point(struct draw_stage *stage, struct prim_header *header)
544{
545   auto struct aapoint_stage *aapoint = aapoint_stage(stage);
546   struct draw_context *draw = stage->draw;
547   struct pipe_context *pipe = draw->pipe;
548   const struct pipe_rasterizer_state *rast = draw->rasterizer;
549   void *r;
550
551   assert(draw->rasterizer->point_smooth);
552
553   if (draw->rasterizer->point_size <= 2.0)
554      aapoint->radius = 1.0;
555   else
556      aapoint->radius = 0.5f * draw->rasterizer->point_size;
557
558   /*
559    * Bind (generate) our fragprog.
560    */
561   bind_aapoint_fragment_shader(aapoint);
562
563   draw_aapoint_prepare_outputs(draw, draw->pipeline.aapoint);
564
565   draw->suspend_flushing = TRUE;
566
567   /* Disable triangle culling, stippling, unfilled mode etc. */
568   r = draw_get_rasterizer_no_cull(draw, rast->scissor, rast->flatshade);
569   pipe->bind_rasterizer_state(pipe, r);
570
571   draw->suspend_flushing = FALSE;
572
573   /* now really draw first point */
574   stage->point = aapoint_point;
575   stage->point(stage, header);
576}
577
578
579static void
580aapoint_flush(struct draw_stage *stage, unsigned flags)
581{
582   struct draw_context *draw = stage->draw;
583   struct aapoint_stage *aapoint = aapoint_stage(stage);
584   struct pipe_context *pipe = draw->pipe;
585
586   stage->point = aapoint_first_point;
587   stage->next->flush( stage->next, flags );
588
589   /* restore original frag shader */
590   draw->suspend_flushing = TRUE;
591   aapoint->driver_bind_fs_state(pipe, aapoint->fs ? aapoint->fs->driver_fs : NULL);
592
593   /* restore original rasterizer state */
594   if (draw->rast_handle) {
595      pipe->bind_rasterizer_state(pipe, draw->rast_handle);
596   }
597
598   draw->suspend_flushing = FALSE;
599
600   draw_remove_extra_vertex_attribs(draw);
601}
602
603
604static void
605aapoint_reset_stipple_counter(struct draw_stage *stage)
606{
607   stage->next->reset_stipple_counter( stage->next );
608}
609
610
611static void
612aapoint_destroy(struct draw_stage *stage)
613{
614   struct aapoint_stage* aapoint = aapoint_stage(stage);
615   struct pipe_context *pipe = stage->draw->pipe;
616
617   draw_free_temp_verts( stage );
618
619   /* restore the old entry points */
620   pipe->create_fs_state = aapoint->driver_create_fs_state;
621   pipe->bind_fs_state = aapoint->driver_bind_fs_state;
622   pipe->delete_fs_state = aapoint->driver_delete_fs_state;
623
624   FREE( stage );
625}
626
627void
628draw_aapoint_prepare_outputs(struct draw_context *draw,
629                             struct draw_stage *stage)
630{
631   struct aapoint_stage *aapoint = aapoint_stage(stage);
632   const struct pipe_rasterizer_state *rast = draw->rasterizer;
633
634   /* update vertex attrib info */
635   aapoint->pos_slot = draw_current_shader_position_output(draw);
636
637   if (!rast->point_smooth)
638      return;
639
640   /* allocate the extra post-transformed vertex attribute */
641   aapoint->tex_slot = draw_alloc_extra_vertex_attrib(draw,
642                                                      TGSI_SEMANTIC_GENERIC,
643                                                      aapoint->fs->generic_attrib);
644   assert(aapoint->tex_slot > 0); /* output[0] is vertex pos */
645
646   /* find psize slot in post-transform vertex */
647   aapoint->psize_slot = -1;
648   if (draw->rasterizer->point_size_per_vertex) {
649      const struct tgsi_shader_info *info = draw_get_shader_info(draw);
650      uint i;
651      /* find PSIZ vertex output */
652      for (i = 0; i < info->num_outputs; i++) {
653         if (info->output_semantic_name[i] == TGSI_SEMANTIC_PSIZE) {
654            aapoint->psize_slot = i;
655            break;
656         }
657      }
658   }
659}
660
661static struct aapoint_stage *
662draw_aapoint_stage(struct draw_context *draw)
663{
664   struct aapoint_stage *aapoint = CALLOC_STRUCT(aapoint_stage);
665   if (!aapoint)
666      goto fail;
667
668   aapoint->stage.draw = draw;
669   aapoint->stage.name = "aapoint";
670   aapoint->stage.next = NULL;
671   aapoint->stage.point = aapoint_first_point;
672   aapoint->stage.line = draw_pipe_passthrough_line;
673   aapoint->stage.tri = draw_pipe_passthrough_tri;
674   aapoint->stage.flush = aapoint_flush;
675   aapoint->stage.reset_stipple_counter = aapoint_reset_stipple_counter;
676   aapoint->stage.destroy = aapoint_destroy;
677
678   if (!draw_alloc_temp_verts( &aapoint->stage, 4 ))
679      goto fail;
680
681   return aapoint;
682
683 fail:
684   if (aapoint)
685      aapoint->stage.destroy(&aapoint->stage);
686
687   return NULL;
688
689}
690
691
692static struct aapoint_stage *
693aapoint_stage_from_pipe(struct pipe_context *pipe)
694{
695   struct draw_context *draw = (struct draw_context *) pipe->draw;
696   return aapoint_stage(draw->pipeline.aapoint);
697}
698
699
700/**
701 * This function overrides the driver's create_fs_state() function and
702 * will typically be called by the state tracker.
703 */
704static void *
705aapoint_create_fs_state(struct pipe_context *pipe,
706                       const struct pipe_shader_state *fs)
707{
708   struct aapoint_stage *aapoint = aapoint_stage_from_pipe(pipe);
709   struct aapoint_fragment_shader *aafs = CALLOC_STRUCT(aapoint_fragment_shader);
710   if (!aafs)
711      return NULL;
712
713   aafs->state.tokens = tgsi_dup_tokens(fs->tokens);
714
715   /* pass-through */
716   aafs->driver_fs = aapoint->driver_create_fs_state(pipe, fs);
717
718   return aafs;
719}
720
721
722static void
723aapoint_bind_fs_state(struct pipe_context *pipe, void *fs)
724{
725   struct aapoint_stage *aapoint = aapoint_stage_from_pipe(pipe);
726   struct aapoint_fragment_shader *aafs = (struct aapoint_fragment_shader *) fs;
727   /* save current */
728   aapoint->fs = aafs;
729   /* pass-through */
730   aapoint->driver_bind_fs_state(pipe,
731                                 (aafs ? aafs->driver_fs : NULL));
732}
733
734
735static void
736aapoint_delete_fs_state(struct pipe_context *pipe, void *fs)
737{
738   struct aapoint_stage *aapoint = aapoint_stage_from_pipe(pipe);
739   struct aapoint_fragment_shader *aafs = (struct aapoint_fragment_shader *) fs;
740
741   /* pass-through */
742   aapoint->driver_delete_fs_state(pipe, aafs->driver_fs);
743
744   if (aafs->aapoint_fs)
745      aapoint->driver_delete_fs_state(pipe, aafs->aapoint_fs);
746
747   FREE((void*)aafs->state.tokens);
748
749   FREE(aafs);
750}
751
752
753/**
754 * Called by drivers that want to install this AA point prim stage
755 * into the draw module's pipeline.  This will not be used if the
756 * hardware has native support for AA points.
757 */
758boolean
759draw_install_aapoint_stage(struct draw_context *draw,
760                           struct pipe_context *pipe)
761{
762   struct aapoint_stage *aapoint;
763
764   pipe->draw = (void *) draw;
765
766   /*
767    * Create / install AA point drawing / prim stage
768    */
769   aapoint = draw_aapoint_stage( draw );
770   if (!aapoint)
771      return FALSE;
772
773   /* save original driver functions */
774   aapoint->driver_create_fs_state = pipe->create_fs_state;
775   aapoint->driver_bind_fs_state = pipe->bind_fs_state;
776   aapoint->driver_delete_fs_state = pipe->delete_fs_state;
777
778   /* override the driver's functions */
779   pipe->create_fs_state = aapoint_create_fs_state;
780   pipe->bind_fs_state = aapoint_bind_fs_state;
781   pipe->delete_fs_state = aapoint_delete_fs_state;
782
783   draw->pipeline.aapoint = &aapoint->stage;
784
785   return TRUE;
786}
787