lp_setup.c revision 7ec681f3
1/**************************************************************************
2 *
3 * Copyright 2007 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28/**
29 * Tiling engine.
30 *
31 * Builds per-tile display lists and executes them on calls to
32 * lp_setup_flush().
33 */
34
35#include <limits.h>
36
37#include "pipe/p_defines.h"
38#include "util/u_framebuffer.h"
39#include "util/u_inlines.h"
40#include "util/u_memory.h"
41#include "util/u_pack_color.h"
42#include "util/u_cpu_detect.h"
43#include "util/u_viewport.h"
44#include "draw/draw_pipe.h"
45#include "util/os_time.h"
46#include "lp_context.h"
47#include "lp_memory.h"
48#include "lp_scene.h"
49#include "lp_texture.h"
50#include "lp_debug.h"
51#include "lp_fence.h"
52#include "lp_query.h"
53#include "lp_rast.h"
54#include "lp_setup_context.h"
55#include "lp_screen.h"
56#include "lp_state.h"
57#include "lp_jit.h"
58#include "frontend/sw_winsys.h"
59
60#include "draw/draw_context.h"
61#include "draw/draw_vbuf.h"
62
63
64static boolean set_scene_state( struct lp_setup_context *, enum setup_state,
65                             const char *reason);
66static boolean try_update_scene_state( struct lp_setup_context *setup );
67
68
69static void
70lp_setup_get_empty_scene(struct lp_setup_context *setup)
71{
72   assert(setup->scene == NULL);
73
74   setup->scene_idx++;
75   setup->scene_idx %= ARRAY_SIZE(setup->scenes);
76
77   setup->scene = setup->scenes[setup->scene_idx];
78
79   if (setup->scene->fence) {
80      if (LP_DEBUG & DEBUG_SETUP)
81         debug_printf("%s: wait for scene %d\n",
82                      __FUNCTION__, setup->scene->fence->id);
83
84      lp_fence_wait(setup->scene->fence);
85   }
86
87   lp_scene_begin_binning(setup->scene, &setup->fb);
88
89   setup->scene->permit_linear_rasterizer = setup->permit_linear_rasterizer;
90}
91
92
93static void
94first_triangle( struct lp_setup_context *setup,
95                const float (*v0)[4],
96                const float (*v1)[4],
97                const float (*v2)[4])
98{
99   assert(setup->state == SETUP_ACTIVE);
100   lp_setup_choose_triangle( setup );
101   setup->triangle( setup, v0, v1, v2 );
102}
103
104static boolean
105first_rectangle( struct lp_setup_context *setup,
106                 const float (*v0)[4],
107                 const float (*v1)[4],
108                 const float (*v2)[4],
109                 const float (*v3)[4],
110                 const float (*v4)[4],
111                 const float (*v5)[4])
112{
113   assert(setup->state == SETUP_ACTIVE);
114   lp_setup_choose_rect( setup );
115   return setup->rect( setup, v0, v1, v2, v3, v4, v5 );
116}
117
118static void
119first_line( struct lp_setup_context *setup,
120	    const float (*v0)[4],
121	    const float (*v1)[4])
122{
123   assert(setup->state == SETUP_ACTIVE);
124   lp_setup_choose_line( setup );
125   setup->line( setup, v0, v1 );
126}
127
128static void
129first_point( struct lp_setup_context *setup,
130	     const float (*v0)[4])
131{
132   assert(setup->state == SETUP_ACTIVE);
133   lp_setup_choose_point( setup );
134   setup->point( setup, v0 );
135}
136
137void
138lp_setup_reset( struct lp_setup_context *setup )
139{
140   unsigned i;
141
142   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
143
144   /* Reset derived state */
145   for (i = 0; i < ARRAY_SIZE(setup->constants); ++i) {
146      setup->constants[i].stored_size = 0;
147      setup->constants[i].stored_data = NULL;
148   }
149
150   setup->fs.stored = NULL;
151   setup->dirty = ~0;
152
153   /* no current bin */
154   setup->scene = NULL;
155
156   /* Reset some state:
157    */
158   memset(&setup->clear, 0, sizeof setup->clear);
159
160   /* Have an explicit "start-binning" call and get rid of this
161    * pointer twiddling?
162    */
163   setup->line = first_line;
164   setup->point = first_point;
165   setup->triangle = first_triangle;
166   setup->rect = first_rectangle;
167}
168
169
170/** Rasterize all scene's bins */
171static void
172lp_setup_rasterize_scene( struct lp_setup_context *setup )
173{
174   struct lp_scene *scene = setup->scene;
175   struct llvmpipe_screen *screen = llvmpipe_screen(scene->pipe->screen);
176
177   scene->num_active_queries = setup->active_binned_queries;
178   memcpy(scene->active_queries, setup->active_queries,
179          scene->num_active_queries * sizeof(scene->active_queries[0]));
180
181   lp_scene_end_binning(scene);
182
183   lp_fence_reference(&setup->last_fence, scene->fence);
184
185   if (setup->last_fence)
186      setup->last_fence->issued = TRUE;
187
188   mtx_lock(&screen->rast_mutex);
189
190   /* FIXME: We enqueue the scene then wait on the rasterizer to finish.
191    * This means we never actually run any vertex stuff in parallel to
192    * rasterization (not in the same context at least) which is what the
193    * multiple scenes per setup is about - when we get a new empty scene
194    * any old one is already empty again because we waited here for
195    * raster tasks to be finished. Ideally, we shouldn't need to wait here
196    * and rely on fences elsewhere when waiting is necessary.
197    * Certainly, lp_scene_end_rasterization() would need to be deferred too
198    * and there's probably other bits why this doesn't actually work.
199    */
200   lp_rast_queue_scene(screen->rast, scene);
201   lp_rast_finish(screen->rast);
202   mtx_unlock(&screen->rast_mutex);
203
204   lp_scene_end_rasterization(setup->scene);
205   lp_setup_reset( setup );
206
207   LP_DBG(DEBUG_SETUP, "%s done \n", __FUNCTION__);
208}
209
210
211
212static boolean
213begin_binning( struct lp_setup_context *setup )
214{
215   struct lp_scene *scene = setup->scene;
216   boolean need_zsload = FALSE;
217   boolean ok;
218
219   assert(scene);
220   assert(scene->fence == NULL);
221
222   /* Always create a fence:
223    */
224   scene->fence = lp_fence_create(MAX2(1, setup->num_threads));
225   if (!scene->fence)
226      return FALSE;
227
228   ok = try_update_scene_state(setup);
229   if (!ok)
230      return FALSE;
231
232   if (setup->fb.zsbuf &&
233       ((setup->clear.flags & PIPE_CLEAR_DEPTHSTENCIL) != PIPE_CLEAR_DEPTHSTENCIL) &&
234        util_format_is_depth_and_stencil(setup->fb.zsbuf->format))
235      need_zsload = TRUE;
236
237   LP_DBG(DEBUG_SETUP, "%s color clear bufs: %x depth: %s\n", __FUNCTION__,
238          setup->clear.flags >> 2,
239          need_zsload ? "clear": "load");
240
241   if (setup->clear.flags & PIPE_CLEAR_COLOR) {
242      unsigned cbuf;
243      for (cbuf = 0; cbuf < setup->fb.nr_cbufs; cbuf++) {
244         assert(PIPE_CLEAR_COLOR0 == 1 << 2);
245         if (setup->clear.flags & (1 << (2 + cbuf))) {
246            union lp_rast_cmd_arg clearrb_arg;
247            struct lp_rast_clear_rb *cc_scene =
248               (struct lp_rast_clear_rb *)
249                  lp_scene_alloc(scene, sizeof(struct lp_rast_clear_rb));
250
251            if (!cc_scene) {
252               return FALSE;
253            }
254
255            cc_scene->cbuf = cbuf;
256            cc_scene->color_val = setup->clear.color_val[cbuf];
257            clearrb_arg.clear_rb = cc_scene;
258
259            if (!lp_scene_bin_everywhere(scene,
260                                         LP_RAST_OP_CLEAR_COLOR,
261                                         clearrb_arg))
262               return FALSE;
263         }
264      }
265   }
266
267   if (setup->fb.zsbuf) {
268      if (setup->clear.flags & PIPE_CLEAR_DEPTHSTENCIL) {
269         ok = lp_scene_bin_everywhere( scene,
270                                       LP_RAST_OP_CLEAR_ZSTENCIL,
271                                       lp_rast_arg_clearzs(
272                                          setup->clear.zsvalue,
273                                          setup->clear.zsmask));
274         if (!ok)
275            return FALSE;
276      }
277   }
278
279   setup->clear.flags = 0;
280   setup->clear.zsmask = 0;
281   setup->clear.zsvalue = 0;
282
283   scene->had_queries = !!setup->active_binned_queries;
284
285   LP_DBG(DEBUG_SETUP, "%s done\n", __FUNCTION__);
286   return TRUE;
287}
288
289
290/* This basically bins and then flushes any outstanding full-screen
291 * clears.
292 *
293 * TODO: fast path for fullscreen clears and no triangles.
294 */
295static boolean
296execute_clears( struct lp_setup_context *setup )
297{
298   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
299
300   return begin_binning( setup );
301}
302
/* Printable names for enum setup_state, indexed by the state value in the
 * debug output of set_scene_state().  Kept file-local and read-only so the
 * generic name does not leak into the global namespace.
 * NOTE(review): assumes the enum order is FLUSHED, CLEARED, ACTIVE - confirm
 * against the enum setup_state declaration.
 */
static const char *const states[] = {
   "FLUSHED",
   "CLEARED",
   "ACTIVE "
};
308
309
310static boolean
311set_scene_state( struct lp_setup_context *setup,
312                 enum setup_state new_state,
313                 const char *reason)
314{
315   unsigned old_state = setup->state;
316
317   if (old_state == new_state)
318      return TRUE;
319
320   if (LP_DEBUG & DEBUG_SCENE) {
321      debug_printf("%s old %s new %s%s%s\n",
322                   __FUNCTION__,
323                   states[old_state],
324                   states[new_state],
325                   (new_state == SETUP_FLUSHED) ? ": " : "",
326                   (new_state == SETUP_FLUSHED) ? reason : "");
327
328      if (new_state == SETUP_FLUSHED && setup->scene)
329         lp_debug_draw_bins_by_cmd_length(setup->scene);
330   }
331
332   /* wait for a free/empty scene
333    */
334   if (old_state == SETUP_FLUSHED)
335      lp_setup_get_empty_scene(setup);
336
337   switch (new_state) {
338   case SETUP_CLEARED:
339      break;
340
341   case SETUP_ACTIVE:
342      if (!begin_binning( setup ))
343         goto fail;
344      break;
345
346   case SETUP_FLUSHED:
347      if (old_state == SETUP_CLEARED)
348         if (!execute_clears( setup ))
349            goto fail;
350
351      lp_setup_rasterize_scene( setup );
352      assert(setup->scene == NULL);
353      break;
354
355   default:
356      assert(0 && "invalid setup state mode");
357      goto fail;
358   }
359
360   setup->state = new_state;
361   return TRUE;
362
363fail:
364   if (setup->scene) {
365      lp_scene_end_rasterization(setup->scene);
366      setup->scene = NULL;
367   }
368
369   setup->state = SETUP_FLUSHED;
370   lp_setup_reset( setup );
371   return FALSE;
372}
373
374
375void
376lp_setup_flush( struct lp_setup_context *setup,
377                struct pipe_fence_handle **fence,
378                const char *reason)
379{
380   set_scene_state( setup, SETUP_FLUSHED, reason );
381
382   if (fence) {
383      lp_fence_reference((struct lp_fence **)fence, setup->last_fence);
384      if (!*fence)
385         *fence = (struct pipe_fence_handle *)lp_fence_create(0);
386   }
387}
388
389
390void
391lp_setup_bind_framebuffer( struct lp_setup_context *setup,
392                           const struct pipe_framebuffer_state *fb )
393{
394   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
395
396   /* Flush any old scene.
397    */
398   set_scene_state( setup, SETUP_FLUSHED, __FUNCTION__ );
399
400   /*
401    * Ensure the old scene is not reused.
402    */
403   assert(!setup->scene);
404
405   /* Set new state.  This will be picked up later when we next need a
406    * scene.
407    */
408   util_copy_framebuffer_state(&setup->fb, fb);
409   setup->framebuffer.x0 = 0;
410   setup->framebuffer.y0 = 0;
411   setup->framebuffer.x1 = fb->width-1;
412   setup->framebuffer.y1 = fb->height-1;
413   setup->dirty |= LP_SETUP_NEW_SCISSOR;
414}
415
416
417/*
418 * Try to clear one color buffer of the attached fb, either by binning a clear
419 * command or queuing up the clear for later (when binning is started).
420 */
421static boolean
422lp_setup_try_clear_color_buffer(struct lp_setup_context *setup,
423                                const union pipe_color_union *color,
424                                unsigned cbuf)
425{
426   union lp_rast_cmd_arg clearrb_arg;
427   union util_color uc;
428   enum pipe_format format = setup->fb.cbufs[cbuf]->format;
429
430   LP_DBG(DEBUG_SETUP, "%s state %d\n", __FUNCTION__, setup->state);
431
432   util_pack_color_union(format, &uc, color);
433
434   if (setup->state == SETUP_ACTIVE) {
435      struct lp_scene *scene = setup->scene;
436
437      /* Add the clear to existing scene.  In the unusual case where
438       * both color and depth-stencil are being cleared when there's
439       * already been some rendering, we could discard the currently
440       * binned scene and start again, but I don't see that as being
441       * a common usage.
442       */
443      struct lp_rast_clear_rb *cc_scene =
444         (struct lp_rast_clear_rb *)
445            lp_scene_alloc_aligned(scene, sizeof(struct lp_rast_clear_rb), 8);
446
447      if (!cc_scene) {
448         return FALSE;
449      }
450
451      cc_scene->cbuf = cbuf;
452      cc_scene->color_val = uc;
453      clearrb_arg.clear_rb = cc_scene;
454
455      if (!lp_scene_bin_everywhere(scene,
456                                   LP_RAST_OP_CLEAR_COLOR,
457                                   clearrb_arg))
458         return FALSE;
459   }
460   else {
461      /* Put ourselves into the 'pre-clear' state, specifically to try
462       * and accumulate multiple clears to color and depth_stencil
463       * buffers which the app or gallium frontend might issue
464       * separately.
465       */
466      set_scene_state( setup, SETUP_CLEARED, __FUNCTION__ );
467
468      assert(PIPE_CLEAR_COLOR0 == (1 << 2));
469      setup->clear.flags |= 1 << (cbuf + 2);
470      setup->clear.color_val[cbuf] = uc;
471   }
472
473   return TRUE;
474}
475
476static boolean
477lp_setup_try_clear_zs(struct lp_setup_context *setup,
478                      double depth,
479                      unsigned stencil,
480                      unsigned flags)
481{
482   uint64_t zsmask = 0;
483   uint64_t zsvalue = 0;
484   uint32_t zmask32;
485   uint8_t smask8;
486   enum pipe_format format = setup->fb.zsbuf->format;
487
488   LP_DBG(DEBUG_SETUP, "%s state %d\n", __FUNCTION__, setup->state);
489
490   zmask32 = (flags & PIPE_CLEAR_DEPTH) ? ~0 : 0;
491   smask8 = (flags & PIPE_CLEAR_STENCIL) ? ~0 : 0;
492
493   zsvalue = util_pack64_z_stencil(format, depth, stencil);
494
495   zsmask = util_pack64_mask_z_stencil(format, zmask32, smask8);
496
497   zsvalue &= zsmask;
498
499   if (format == PIPE_FORMAT_Z24X8_UNORM ||
500       format == PIPE_FORMAT_X8Z24_UNORM) {
501      /*
502       * Make full mask if there's "X" bits so we can do full
503       * clear (without rmw).
504       */
505      uint32_t zsmask_full = 0;
506      zsmask_full = util_pack_mask_z_stencil(format, ~0, ~0);
507      zsmask |= ~zsmask_full;
508   }
509
510   if (setup->state == SETUP_ACTIVE) {
511      struct lp_scene *scene = setup->scene;
512
513      /* Add the clear to existing scene.  In the unusual case where
514       * both color and depth-stencil are being cleared when there's
515       * already been some rendering, we could discard the currently
516       * binned scene and start again, but I don't see that as being
517       * a common usage.
518       */
519      if (!lp_scene_bin_everywhere(scene,
520                                   LP_RAST_OP_CLEAR_ZSTENCIL,
521                                   lp_rast_arg_clearzs(zsvalue, zsmask)))
522         return FALSE;
523   }
524   else {
525      /* Put ourselves into the 'pre-clear' state, specifically to try
526       * and accumulate multiple clears to color and depth_stencil
527       * buffers which the app or gallium frontend might issue
528       * separately.
529       */
530      set_scene_state( setup, SETUP_CLEARED, __FUNCTION__ );
531
532      setup->clear.flags |= flags;
533
534      setup->clear.zsmask |= zsmask;
535      setup->clear.zsvalue =
536         (setup->clear.zsvalue & ~zsmask) | (zsvalue & zsmask);
537   }
538
539   return TRUE;
540}
541
542void
543lp_setup_clear( struct lp_setup_context *setup,
544                const union pipe_color_union *color,
545                double depth,
546                unsigned stencil,
547                unsigned flags )
548{
549   unsigned i;
550
551   /*
552    * Note any of these (max 9) clears could fail (but at most there should
553    * be just one failure!). This avoids doing the previous succeeded
554    * clears again (we still clear tiles twice if a clear command succeeded
555    * partially for one buffer).
556    */
557   if (flags & PIPE_CLEAR_DEPTHSTENCIL) {
558      unsigned flagszs = flags & PIPE_CLEAR_DEPTHSTENCIL;
559      if (!lp_setup_try_clear_zs(setup, depth, stencil, flagszs)) {
560         lp_setup_flush(setup, NULL, __FUNCTION__);
561
562         if (!lp_setup_try_clear_zs(setup, depth, stencil, flagszs))
563            assert(0);
564      }
565   }
566
567   if (flags & PIPE_CLEAR_COLOR) {
568      assert(PIPE_CLEAR_COLOR0 == (1 << 2));
569      for (i = 0; i < setup->fb.nr_cbufs; i++) {
570         if ((flags & (1 << (2 + i))) && setup->fb.cbufs[i]) {
571            if (!lp_setup_try_clear_color_buffer(setup, color, i)) {
572               lp_setup_flush(setup, NULL, __FUNCTION__);
573
574               if (!lp_setup_try_clear_color_buffer(setup, color, i))
575                  assert(0);
576            }
577         }
578      }
579   }
580}
581
582
583
584void
585lp_setup_set_triangle_state( struct lp_setup_context *setup,
586                             unsigned cull_mode,
587                             boolean ccw_is_frontface,
588                             boolean scissor,
589                             boolean half_pixel_center,
590                             boolean bottom_edge_rule,
591                             boolean multisample)
592{
593   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
594
595   setup->ccw_is_frontface = ccw_is_frontface;
596   setup->cullmode = cull_mode;
597   setup->triangle = first_triangle;
598   setup->rect = first_rectangle;
599   setup->multisample = multisample;
600   setup->pixel_offset = half_pixel_center ? 0.5f : 0.0f;
601   setup->bottom_edge_rule = bottom_edge_rule;
602
603   if (setup->scissor_test != scissor) {
604      setup->dirty |= LP_SETUP_NEW_SCISSOR;
605      setup->scissor_test = scissor;
606   }
607}
608
609void
610lp_setup_set_line_state( struct lp_setup_context *setup,
611                         float line_width,
612                         boolean line_rectangular)
613{
614   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
615
616   setup->line_width = line_width;
617   setup->rectangular_lines = line_rectangular;
618}
619
620void
621lp_setup_set_point_state( struct lp_setup_context *setup,
622                          float point_size,
623                          boolean point_tri_clip,
624                          boolean point_size_per_vertex,
625                          uint sprite_coord_enable,
626                          uint sprite_coord_origin,
627                          boolean point_quad_rasterization)
628{
629   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
630
631   setup->point_size = point_size;
632   setup->sprite_coord_enable = sprite_coord_enable;
633   setup->sprite_coord_origin = sprite_coord_origin;
634   setup->point_tri_clip = point_tri_clip;
635   setup->point_size_per_vertex = point_size_per_vertex;
636   setup->legacy_points = !point_quad_rasterization;
637}
638
639void
640lp_setup_set_setup_variant( struct lp_setup_context *setup,
641			    const struct lp_setup_variant *variant)
642{
643   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
644
645   setup->setup.variant = variant;
646}
647
648void
649lp_setup_set_fs_variant( struct lp_setup_context *setup,
650                         struct lp_fragment_shader_variant *variant)
651{
652   LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__,
653          variant);
654
655   setup->fs.current.variant = variant;
656   setup->dirty |= LP_SETUP_NEW_FS;
657}
658
659void
660lp_setup_set_fs_constants(struct lp_setup_context *setup,
661                          unsigned num,
662                          struct pipe_constant_buffer *buffers)
663{
664   unsigned i;
665
666   LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__, (void *) buffers);
667
668   assert(num <= ARRAY_SIZE(setup->constants));
669
670   for (i = 0; i < num; ++i) {
671      util_copy_constant_buffer(&setup->constants[i].current, &buffers[i], false);
672   }
673   for (; i < ARRAY_SIZE(setup->constants); i++) {
674      util_copy_constant_buffer(&setup->constants[i].current, NULL, false);
675   }
676   setup->dirty |= LP_SETUP_NEW_CONSTANTS;
677}
678
679void
680lp_setup_set_fs_ssbos(struct lp_setup_context *setup,
681                      unsigned num,
682                      struct pipe_shader_buffer *buffers)
683{
684   unsigned i;
685
686   LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__, (void *) buffers);
687
688   assert(num <= ARRAY_SIZE(setup->ssbos));
689
690   for (i = 0; i < num; ++i) {
691      util_copy_shader_buffer(&setup->ssbos[i].current, &buffers[i]);
692   }
693   for (; i < ARRAY_SIZE(setup->ssbos); i++) {
694      util_copy_shader_buffer(&setup->ssbos[i].current, NULL);
695   }
696   setup->dirty |= LP_SETUP_NEW_SSBOS;
697}
698
699void
700lp_setup_set_fs_images(struct lp_setup_context *setup,
701                       unsigned num,
702                       struct pipe_image_view *images)
703{
704   unsigned i;
705
706   LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__, (void *) images);
707
708   assert(num <= ARRAY_SIZE(setup->images));
709
710   for (i = 0; i < num; ++i) {
711      struct pipe_image_view *image = &images[i];
712      util_copy_image_view(&setup->images[i].current, &images[i]);
713
714      struct pipe_resource *res = image->resource;
715      struct llvmpipe_resource *lp_res = llvmpipe_resource(res);
716      struct lp_jit_image *jit_image;
717
718      jit_image = &setup->fs.current.jit_context.images[i];
719      if (!lp_res)
720         continue;
721      if (!lp_res->dt) {
722         /* regular texture - setup array of mipmap level offsets */
723         if (llvmpipe_resource_is_texture(res)) {
724            jit_image->base = lp_res->tex_data;
725         } else
726            jit_image->base = lp_res->data;
727
728         jit_image->width = res->width0;
729         jit_image->height = res->height0;
730         jit_image->depth = res->depth0;
731         jit_image->num_samples = res->nr_samples;
732
733         if (llvmpipe_resource_is_texture(res)) {
734            uint32_t mip_offset = lp_res->mip_offsets[image->u.tex.level];
735            const uint32_t bw = util_format_get_blockwidth(image->resource->format);
736            const uint32_t bh = util_format_get_blockheight(image->resource->format);
737
738            jit_image->width = DIV_ROUND_UP(jit_image->width, bw);
739            jit_image->height = DIV_ROUND_UP(jit_image->height, bh);
740            jit_image->width = u_minify(jit_image->width, image->u.tex.level);
741            jit_image->height = u_minify(jit_image->height, image->u.tex.level);
742
743            if (res->target == PIPE_TEXTURE_1D_ARRAY ||
744                res->target == PIPE_TEXTURE_2D_ARRAY ||
745                res->target == PIPE_TEXTURE_3D ||
746                res->target == PIPE_TEXTURE_CUBE ||
747                res->target == PIPE_TEXTURE_CUBE_ARRAY) {
748               /*
749                * For array textures, we don't have first_layer, instead
750                * adjust last_layer (stored as depth) plus the mip level offsets
751                * (as we have mip-first layout can't just adjust base ptr).
752                * XXX For mip levels, could do something similar.
753                */
754               jit_image->depth = image->u.tex.last_layer - image->u.tex.first_layer + 1;
755               mip_offset += image->u.tex.first_layer * lp_res->img_stride[image->u.tex.level];
756            } else
757               jit_image->depth = u_minify(jit_image->depth, image->u.tex.level);
758
759            jit_image->row_stride = lp_res->row_stride[image->u.tex.level];
760            jit_image->img_stride = lp_res->img_stride[image->u.tex.level];
761            jit_image->sample_stride = lp_res->sample_stride;
762            jit_image->base = (uint8_t *)jit_image->base + mip_offset;
763         }
764         else {
765            unsigned view_blocksize = util_format_get_blocksize(image->format);
766            jit_image->width = image->u.buf.size / view_blocksize;
767            jit_image->base = (uint8_t *)jit_image->base + image->u.buf.offset;
768         }
769      }
770   }
771   for (; i < ARRAY_SIZE(setup->images); i++) {
772      util_copy_image_view(&setup->images[i].current, NULL);
773   }
774   setup->dirty |= LP_SETUP_NEW_FS;
775}
776
777void
778lp_setup_set_alpha_ref_value( struct lp_setup_context *setup,
779                              float alpha_ref_value )
780{
781   LP_DBG(DEBUG_SETUP, "%s %f\n", __FUNCTION__, alpha_ref_value);
782
783   if(setup->fs.current.jit_context.alpha_ref_value != alpha_ref_value) {
784      setup->fs.current.jit_context.alpha_ref_value = alpha_ref_value;
785      setup->dirty |= LP_SETUP_NEW_FS;
786   }
787}
788
789void
790lp_setup_set_stencil_ref_values( struct lp_setup_context *setup,
791                                 const ubyte refs[2] )
792{
793   LP_DBG(DEBUG_SETUP, "%s %d %d\n", __FUNCTION__, refs[0], refs[1]);
794
795   if (setup->fs.current.jit_context.stencil_ref_front != refs[0] ||
796       setup->fs.current.jit_context.stencil_ref_back != refs[1]) {
797      setup->fs.current.jit_context.stencil_ref_front = refs[0];
798      setup->fs.current.jit_context.stencil_ref_back = refs[1];
799      setup->dirty |= LP_SETUP_NEW_FS;
800   }
801}
802
803void
804lp_setup_set_blend_color( struct lp_setup_context *setup,
805                          const struct pipe_blend_color *blend_color )
806{
807   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
808
809   assert(blend_color);
810
811   if(memcmp(&setup->blend_color.current, blend_color, sizeof *blend_color) != 0) {
812      memcpy(&setup->blend_color.current, blend_color, sizeof *blend_color);
813      setup->dirty |= LP_SETUP_NEW_BLEND_COLOR;
814   }
815}
816
817
818void
819lp_setup_set_scissors( struct lp_setup_context *setup,
820                       const struct pipe_scissor_state *scissors )
821{
822   unsigned i;
823   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
824
825   assert(scissors);
826
827   for (i = 0; i < PIPE_MAX_VIEWPORTS; ++i) {
828      setup->scissors[i].x0 = scissors[i].minx;
829      setup->scissors[i].x1 = scissors[i].maxx-1;
830      setup->scissors[i].y0 = scissors[i].miny;
831      setup->scissors[i].y1 = scissors[i].maxy-1;
832   }
833   setup->dirty |= LP_SETUP_NEW_SCISSOR;
834}
835
836void
837lp_setup_set_sample_mask(struct lp_setup_context *setup,
838                         uint32_t sample_mask)
839{
840   if (setup->fs.current.jit_context.sample_mask != sample_mask) {
841      setup->fs.current.jit_context.sample_mask = sample_mask;
842      setup->dirty |= LP_SETUP_NEW_FS;
843   }
844}
845
846void
847lp_setup_set_flatshade_first(struct lp_setup_context *setup,
848                             boolean flatshade_first)
849{
850   setup->flatshade_first = flatshade_first;
851}
852
853void
854lp_setup_set_rasterizer_discard(struct lp_setup_context *setup,
855                                boolean rasterizer_discard)
856{
857   if (setup->rasterizer_discard != rasterizer_discard) {
858      setup->rasterizer_discard = rasterizer_discard;
859      setup->line = first_line;
860      setup->point = first_point;
861      setup->triangle = first_triangle;
862      setup->rect = first_rectangle;
863   }
864}
865
866void
867lp_setup_set_vertex_info(struct lp_setup_context *setup,
868                         struct vertex_info *vertex_info)
869{
870   /* XXX: just silently holding onto the pointer:
871    */
872   setup->vertex_info = vertex_info;
873}
874
875
876void
877lp_setup_set_linear_mode( struct lp_setup_context *setup,
878                          boolean mode )
879{
880   /* The linear rasterizer requires sse2 both at compile and runtime,
881    * in particular for the code in lp_rast_linear_fallback.c.  This
882    * is more than ten-year-old technology, so it's a reasonable
883    * baseline.
884    */
885#if defined(PIPE_ARCH_SSE)
886   setup->permit_linear_rasterizer = (mode &&
887                                      util_get_cpu_caps()->has_sse2);
888#else
889   setup->permit_linear_rasterizer = FALSE;
890#endif
891}
892
893
894/**
895 * Called during state validation when LP_NEW_VIEWPORT is set.
896 */
897void
898lp_setup_set_viewports(struct lp_setup_context *setup,
899                       unsigned num_viewports,
900                       const struct pipe_viewport_state *viewports)
901{
902   struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
903   float half_height, x0, y0;
904   unsigned i;
905
906   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
907
908   assert(num_viewports <= PIPE_MAX_VIEWPORTS);
909   assert(viewports);
910
911   /*
912    * Linear rasterizer path for scissor/viewport intersection.
913    *
914    * Calculate "scissor" rect from the (first) viewport.
915    * Just like stored scissor rects need inclusive coords.
916    * For rounding, assume half pixel center (d3d9 should not end up
917    * with fractional viewports) - quite obviously for msaa we'd need
918    * fractional values here (and elsewhere for the point bounding box).
919    *
920    * See: lp_setup.c::try_update_scene_state
921    */
922   half_height = fabsf(viewports[0].scale[1]);
923   x0 = viewports[0].translate[0] - viewports[0].scale[0];
924   y0 = viewports[0].translate[1] - half_height;
925   setup->vpwh.x0 = (int)(x0 + 0.5f);
926   setup->vpwh.x1 = (int)(viewports[0].scale[0] * 2.0f + x0 - 0.5f);
927   setup->vpwh.y0 = (int)(y0 + 0.5f);
928   setup->vpwh.y1 = (int)(half_height * 2.0f + y0 - 0.5f);
929   setup->dirty |= LP_SETUP_NEW_SCISSOR;
930
931   /*
932    * For use in lp_state_fs.c, propagate the viewport values for all viewports.
933    */
934   for (i = 0; i < num_viewports; i++) {
935      float min_depth;
936      float max_depth;
937      util_viewport_zmin_zmax(&viewports[i], lp->rasterizer->clip_halfz,
938                              &min_depth, &max_depth);
939
940      if (setup->viewports[i].min_depth != min_depth ||
941          setup->viewports[i].max_depth != max_depth) {
942          setup->viewports[i].min_depth = min_depth;
943          setup->viewports[i].max_depth = max_depth;
944          setup->dirty |= LP_SETUP_NEW_VIEWPORTS;
945      }
946   }
947}
948
949
950/**
951 * Called directly by llvmpipe_set_sampler_views
952 */
953void
954lp_setup_set_fragment_sampler_views(struct lp_setup_context *setup,
955                                    unsigned num,
956                                    struct pipe_sampler_view **views)
957{
958   unsigned i, max_tex_num;
959
960   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
961
962   assert(num <= PIPE_MAX_SHADER_SAMPLER_VIEWS);
963
964   max_tex_num = MAX2(num, setup->fs.current_tex_num);
965
966   for (i = 0; i < max_tex_num; i++) {
967      struct pipe_sampler_view *view = i < num ? views[i] : NULL;
968
969      /* We are going to overwrite/unref the current texture further below. If
970       * set, make sure to unmap its resource to avoid leaking previous
971       * mapping.  */
972      if (setup->fs.current_tex[i])
973         llvmpipe_resource_unmap(setup->fs.current_tex[i], 0, 0);
974
975      if (view) {
976         struct pipe_resource *res = view->texture;
977         struct llvmpipe_resource *lp_tex = llvmpipe_resource(res);
978         struct lp_jit_texture *jit_tex;
979         jit_tex = &setup->fs.current.jit_context.textures[i];
980
981         /* We're referencing the texture's internal data, so save a
982          * reference to it.
983          */
984         pipe_resource_reference(&setup->fs.current_tex[i], res);
985
986         if (!lp_tex->dt) {
987            /* regular texture - setup array of mipmap level offsets */
988            int j;
989            unsigned first_level = 0;
990            unsigned last_level = 0;
991
992            if (llvmpipe_resource_is_texture(res)) {
993               first_level = view->u.tex.first_level;
994               last_level = view->u.tex.last_level;
995               assert(first_level <= last_level);
996               assert(last_level <= res->last_level);
997               jit_tex->base = lp_tex->tex_data;
998            }
999            else {
1000              jit_tex->base = lp_tex->data;
1001            }
1002
1003            if (LP_PERF & PERF_TEX_MEM) {
1004               /* use dummy tile memory */
1005               jit_tex->base = lp_dummy_tile;
1006               jit_tex->width = TILE_SIZE/8;
1007               jit_tex->height = TILE_SIZE/8;
1008               jit_tex->depth = 1;
1009               jit_tex->first_level = 0;
1010               jit_tex->last_level = 0;
1011               jit_tex->mip_offsets[0] = 0;
1012               jit_tex->row_stride[0] = 0;
1013               jit_tex->img_stride[0] = 0;
1014               jit_tex->num_samples = 0;
1015               jit_tex->sample_stride = 0;
1016            }
1017            else {
1018               jit_tex->width = res->width0;
1019               jit_tex->height = res->height0;
1020               jit_tex->depth = res->depth0;
1021               jit_tex->first_level = first_level;
1022               jit_tex->last_level = last_level;
1023               jit_tex->num_samples = res->nr_samples;
1024               jit_tex->sample_stride = 0;
1025
1026               if (llvmpipe_resource_is_texture(res)) {
1027                  for (j = first_level; j <= last_level; j++) {
1028                     jit_tex->mip_offsets[j] = lp_tex->mip_offsets[j];
1029                     jit_tex->row_stride[j] = lp_tex->row_stride[j];
1030                     jit_tex->img_stride[j] = lp_tex->img_stride[j];
1031                  }
1032
1033                  jit_tex->sample_stride = lp_tex->sample_stride;
1034
1035                  if (res->target == PIPE_TEXTURE_1D_ARRAY ||
1036                      res->target == PIPE_TEXTURE_2D_ARRAY ||
1037                      res->target == PIPE_TEXTURE_CUBE ||
1038                      res->target == PIPE_TEXTURE_CUBE_ARRAY) {
1039                     /*
1040                      * For array textures, we don't have first_layer, instead
1041                      * adjust last_layer (stored as depth) plus the mip level offsets
1042                      * (as we have mip-first layout can't just adjust base ptr).
1043                      * XXX For mip levels, could do something similar.
1044                      */
1045                     jit_tex->depth = view->u.tex.last_layer - view->u.tex.first_layer + 1;
1046                     for (j = first_level; j <= last_level; j++) {
1047                        jit_tex->mip_offsets[j] += view->u.tex.first_layer *
1048                                                   lp_tex->img_stride[j];
1049                     }
1050                     if (view->target == PIPE_TEXTURE_CUBE ||
1051                         view->target == PIPE_TEXTURE_CUBE_ARRAY) {
1052                        assert(jit_tex->depth % 6 == 0);
1053                     }
1054                     assert(view->u.tex.first_layer <= view->u.tex.last_layer);
1055                     assert(view->u.tex.last_layer < res->array_size);
1056                  }
1057               }
1058               else {
1059                  /*
1060                   * For buffers, we don't have "offset", instead adjust
1061                   * the size (stored as width) plus the base pointer.
1062                   */
1063                  unsigned view_blocksize = util_format_get_blocksize(view->format);
1064                  /* probably don't really need to fill that out */
1065                  jit_tex->mip_offsets[0] = 0;
1066                  jit_tex->row_stride[0] = 0;
1067                  jit_tex->img_stride[0] = 0;
1068
1069                  /* everything specified in number of elements here. */
1070                  jit_tex->width = view->u.buf.size / view_blocksize;
1071                  jit_tex->base = (uint8_t *)jit_tex->base + view->u.buf.offset;
1072                  /* XXX Unsure if we need to sanitize parameters? */
1073                  assert(view->u.buf.offset + view->u.buf.size <= res->width0);
1074               }
1075            }
1076         }
1077         else {
1078            /* display target texture/surface */
1079            jit_tex->base = llvmpipe_resource_map(res, 0, 0, LP_TEX_USAGE_READ);
1080            jit_tex->row_stride[0] = lp_tex->row_stride[0];
1081            jit_tex->img_stride[0] = lp_tex->img_stride[0];
1082            jit_tex->mip_offsets[0] = 0;
1083            jit_tex->width = res->width0;
1084            jit_tex->height = res->height0;
1085            jit_tex->depth = res->depth0;
1086            jit_tex->first_level = jit_tex->last_level = 0;
1087            jit_tex->num_samples = res->nr_samples;
1088            jit_tex->sample_stride = 0;
1089            assert(jit_tex->base);
1090         }
1091      }
1092      else {
1093         pipe_resource_reference(&setup->fs.current_tex[i], NULL);
1094      }
1095   }
1096   setup->fs.current_tex_num = num;
1097
1098   setup->dirty |= LP_SETUP_NEW_FS;
1099}
1100
1101/**
1102 * Called during state validation when LP_NEW_SAMPLER is set.
1103 */
1104void
1105lp_setup_set_fragment_sampler_state(struct lp_setup_context *setup,
1106                                    unsigned num,
1107                                    struct pipe_sampler_state **samplers)
1108{
1109   unsigned i;
1110
1111   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
1112
1113   assert(num <= PIPE_MAX_SAMPLERS);
1114
1115   for (i = 0; i < PIPE_MAX_SAMPLERS; i++) {
1116      const struct pipe_sampler_state *sampler = i < num ? samplers[i] : NULL;
1117
1118      if (sampler) {
1119         struct lp_jit_sampler *jit_sam;
1120         jit_sam = &setup->fs.current.jit_context.samplers[i];
1121
1122         jit_sam->min_lod = sampler->min_lod;
1123         jit_sam->max_lod = sampler->max_lod;
1124         jit_sam->lod_bias = sampler->lod_bias;
1125         jit_sam->max_aniso = sampler->max_anisotropy;
1126         COPY_4V(jit_sam->border_color, sampler->border_color.f);
1127      }
1128   }
1129
1130   setup->dirty |= LP_SETUP_NEW_FS;
1131}
1132
1133
1134
1135
1136/**
1137 * Is the given texture referenced by any scene?
1138 * Note: we have to check all scenes including any scenes currently
1139 * being rendered and the current scene being built.
1140 */
1141unsigned
1142lp_setup_is_resource_referenced( const struct lp_setup_context *setup,
1143                                const struct pipe_resource *texture )
1144{
1145   unsigned i;
1146
1147   /* check the render targets */
1148   for (i = 0; i < setup->fb.nr_cbufs; i++) {
1149      if (setup->fb.cbufs[i] && setup->fb.cbufs[i]->texture == texture)
1150         return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
1151   }
1152   if (setup->fb.zsbuf && setup->fb.zsbuf->texture == texture) {
1153      return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
1154   }
1155
1156   /* check textures referenced by the scene */
1157   for (i = 0; i < ARRAY_SIZE(setup->scenes); i++) {
1158      if (lp_scene_is_resource_referenced(setup->scenes[i], texture)) {
1159         return LP_REFERENCED_FOR_READ;
1160      }
1161   }
1162
1163   for (i = 0; i < ARRAY_SIZE(setup->ssbos); i++) {
1164      if (setup->ssbos[i].current.buffer == texture)
1165         return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
1166   }
1167
1168   for (i = 0; i < ARRAY_SIZE(setup->images); i++) {
1169      if (setup->images[i].current.resource == texture)
1170         return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
1171   }
1172
1173   return LP_UNREFERENCED;
1174}
1175
1176
1177/**
1178 * Called by vbuf code when we're about to draw something.
1179 *
1180 * This function stores all dirty state in the current scene's display list
1181 * memory, via lp_scene_alloc().  We can not pass pointers of mutable state to
1182 * the JIT functions, as the JIT functions will be called later on, most likely
1183 * on a different thread.
1184 *
1185 * When processing dirty state it is imperative that we don't refer to any
1186 * pointers previously allocated with lp_scene_alloc() in this function (or any
1187 * function) as they may belong to a scene freed since then.
1188 */
1189static boolean
1190try_update_scene_state( struct lp_setup_context *setup )
1191{
1192   static const float fake_const_buf[4];
1193   boolean new_scene = (setup->fs.stored == NULL);
1194   struct lp_scene *scene = setup->scene;
1195   unsigned i;
1196
1197   assert(scene);
1198
1199   if (setup->dirty & LP_SETUP_NEW_VIEWPORTS) {
1200      /*
1201       * Record new depth range state for changes due to viewport updates.
1202       *
1203       * TODO: Collapse the existing viewport and depth range information
1204       *       into one structure, for access by JIT.
1205       */
1206      struct lp_jit_viewport *stored;
1207
1208      stored = (struct lp_jit_viewport *)
1209         lp_scene_alloc(scene, sizeof setup->viewports);
1210
1211      if (!stored) {
1212         assert(!new_scene);
1213         return FALSE;
1214      }
1215
1216      memcpy(stored, setup->viewports, sizeof setup->viewports);
1217
1218      setup->fs.current.jit_context.viewports = stored;
1219      setup->dirty |= LP_SETUP_NEW_FS;
1220   }
1221
1222   if(setup->dirty & LP_SETUP_NEW_BLEND_COLOR) {
1223      uint8_t *stored;
1224      float* fstored;
1225      unsigned i, j;
1226      unsigned size;
1227
1228      /* Alloc u8_blend_color (16 x i8) and f_blend_color (4 or 8 x f32) */
1229      size  = 4 * 16 * sizeof(uint8_t);
1230      size += (LP_MAX_VECTOR_LENGTH / 4) * sizeof(float);
1231      stored = lp_scene_alloc_aligned(scene, size, LP_MIN_VECTOR_ALIGN);
1232
1233      if (!stored) {
1234         assert(!new_scene);
1235         return FALSE;
1236      }
1237
1238      /* Store floating point colour */
1239      fstored = (float*)(stored + 4*16);
1240      for (i = 0; i < (LP_MAX_VECTOR_LENGTH / 4); ++i) {
1241         fstored[i] = setup->blend_color.current.color[i % 4];
1242      }
1243
1244      /* smear each blend color component across 16 ubyte elements */
1245      for (i = 0; i < 4; ++i) {
1246         uint8_t c = float_to_ubyte(setup->blend_color.current.color[i]);
1247         for (j = 0; j < 16; ++j)
1248            stored[i*16 + j] = c;
1249      }
1250
1251      setup->blend_color.stored = stored;
1252      setup->fs.current.jit_context.u8_blend_color = stored;
1253      setup->fs.current.jit_context.f_blend_color = fstored;
1254      setup->dirty |= LP_SETUP_NEW_FS;
1255   }
1256
1257   struct llvmpipe_context *llvmpipe = llvmpipe_context(setup->pipe);
1258   if (llvmpipe->dirty & LP_NEW_FS_CONSTANTS)
1259      lp_setup_set_fs_constants(llvmpipe->setup,
1260                                ARRAY_SIZE(llvmpipe->constants[PIPE_SHADER_FRAGMENT]),
1261                                llvmpipe->constants[PIPE_SHADER_FRAGMENT]);
1262
1263   if (setup->dirty & LP_SETUP_NEW_CONSTANTS) {
1264      for (i = 0; i < ARRAY_SIZE(setup->constants); ++i) {
1265         struct pipe_resource *buffer = setup->constants[i].current.buffer;
1266         const unsigned current_size = MIN2(setup->constants[i].current.buffer_size,
1267                                            LP_MAX_TGSI_CONST_BUFFER_SIZE);
1268         const ubyte *current_data = NULL;
1269         int num_constants;
1270
1271         STATIC_ASSERT(DATA_BLOCK_SIZE >= LP_MAX_TGSI_CONST_BUFFER_SIZE);
1272
1273         if (buffer) {
1274            /* resource buffer */
1275            current_data = (ubyte *) llvmpipe_resource_data(buffer);
1276         }
1277         else if (setup->constants[i].current.user_buffer) {
1278            /* user-space buffer */
1279            current_data = (ubyte *) setup->constants[i].current.user_buffer;
1280         }
1281
1282         if (current_data && current_size >= sizeof(float)) {
1283            current_data += setup->constants[i].current.buffer_offset;
1284
1285            /* TODO: copy only the actually used constants? */
1286
1287            if (setup->constants[i].stored_size != current_size ||
1288               !setup->constants[i].stored_data ||
1289               memcmp(setup->constants[i].stored_data,
1290                      current_data,
1291                      current_size) != 0) {
1292               void *stored;
1293
1294               stored = lp_scene_alloc(scene, current_size);
1295               if (!stored) {
1296                  assert(!new_scene);
1297                  return FALSE;
1298               }
1299
1300               memcpy(stored,
1301                      current_data,
1302                      current_size);
1303               setup->constants[i].stored_size = current_size;
1304               setup->constants[i].stored_data = stored;
1305            }
1306            setup->fs.current.jit_context.constants[i] =
1307               setup->constants[i].stored_data;
1308         }
1309         else {
1310            setup->constants[i].stored_size = 0;
1311            setup->constants[i].stored_data = NULL;
1312            setup->fs.current.jit_context.constants[i] = fake_const_buf;
1313         }
1314
1315         num_constants =
1316            DIV_ROUND_UP(setup->constants[i].stored_size, lp_get_constant_buffer_stride(scene->pipe->screen));
1317         setup->fs.current.jit_context.num_constants[i] = num_constants;
1318         setup->dirty |= LP_SETUP_NEW_FS;
1319      }
1320   }
1321
1322   if (setup->dirty & LP_SETUP_NEW_SSBOS) {
1323      for (i = 0; i < ARRAY_SIZE(setup->ssbos); ++i) {
1324         struct pipe_resource *buffer = setup->ssbos[i].current.buffer;
1325         const ubyte *current_data = NULL;
1326
1327         if (!buffer)
1328            continue;
1329         /* resource buffer */
1330         current_data = (ubyte *) llvmpipe_resource_data(buffer);
1331         if (current_data) {
1332            current_data += setup->ssbos[i].current.buffer_offset;
1333
1334            setup->fs.current.jit_context.ssbos[i] = (const uint32_t *)current_data;
1335            setup->fs.current.jit_context.num_ssbos[i] = setup->ssbos[i].current.buffer_size;
1336         } else {
1337            setup->fs.current.jit_context.ssbos[i] = NULL;
1338            setup->fs.current.jit_context.num_ssbos[i] = 0;
1339         }
1340         setup->dirty |= LP_SETUP_NEW_FS;
1341      }
1342   }
1343   if (setup->dirty & LP_SETUP_NEW_FS) {
1344      if (!setup->fs.stored ||
1345          memcmp(setup->fs.stored,
1346                 &setup->fs.current,
1347                 sizeof setup->fs.current) != 0)
1348      {
1349         struct lp_rast_state *stored;
1350
1351         /* The fs state that's been stored in the scene is different from
1352          * the new, current state.  So allocate a new lp_rast_state object
1353          * and append it to the bin's setup data buffer.
1354          */
1355         stored = (struct lp_rast_state *) lp_scene_alloc(scene, sizeof *stored);
1356         if (!stored) {
1357            assert(!new_scene);
1358            return FALSE;
1359         }
1360
1361         memcpy(&stored->jit_context,
1362                &setup->fs.current.jit_context,
1363                sizeof setup->fs.current.jit_context);
1364         stored->jit_context.aniso_filter_table = lp_build_sample_aniso_filter_table();
1365         stored->variant = setup->fs.current.variant;
1366
1367         if (!lp_scene_add_frag_shader_reference(scene,
1368                                                 setup->fs.current.variant))
1369            return FALSE;
1370         setup->fs.stored = stored;
1371
1372         /* The scene now references the textures in the rasterization
1373          * state record.  Note that now.
1374          */
1375         for (i = 0; i < ARRAY_SIZE(setup->fs.current_tex); i++) {
1376            if (setup->fs.current_tex[i]) {
1377               if (!lp_scene_add_resource_reference(scene,
1378                                                    setup->fs.current_tex[i],
1379                                                    new_scene)) {
1380                  assert(!new_scene);
1381                  return FALSE;
1382               }
1383            }
1384         }
1385      }
1386   }
1387
1388   if (setup->dirty & LP_SETUP_NEW_SCISSOR) {
1389      unsigned i;
1390
1391      for (i = 0; i < PIPE_MAX_VIEWPORTS; ++i) {
1392         setup->draw_regions[i] = setup->framebuffer;
1393         if (setup->scissor_test) {
1394            u_rect_possible_intersection(&setup->scissors[i],
1395                                         &setup->draw_regions[i]);
1396         }
1397      }
1398      if (setup->permit_linear_rasterizer) {
1399         /* NOTE: this only takes first vp into account. */
1400         boolean need_vp_scissoring = !!memcmp(&setup->vpwh, &setup->framebuffer,
1401                                               sizeof(setup->framebuffer));
1402         assert(setup->viewport_index_slot < 0);
1403         if (need_vp_scissoring) {
1404            u_rect_possible_intersection(&setup->vpwh,
1405                                         &setup->draw_regions[0]);
1406         }
1407      }
1408      else if (setup->point_tri_clip) {
1409         /*
1410          * for d3d-style point clipping, we're going to need
1411          * the fake vp scissor too. Hence do the intersection with vp,
1412          * but don't indicate this. As above this will only work for first vp
1413          * which should be ok because we instruct draw to only skip point
1414          * clipping when there's only one viewport (this works because d3d10
1415          * points are always single pixel).
1416          * (Also note that if we have permit_linear_rasterizer this will
1417          * cause large points to always get vp scissored, regardless the
1418          * point_tri_clip setting.)
1419          */
1420         boolean need_vp_scissoring = !!memcmp(&setup->vpwh, &setup->framebuffer,
1421                                               sizeof(setup->framebuffer));
1422         if (need_vp_scissoring) {
1423            u_rect_possible_intersection(&setup->vpwh,
1424                                         &setup->draw_regions[0]);
1425         }
1426      }
1427   }
1428
1429   setup->dirty = 0;
1430
1431   assert(setup->fs.stored);
1432   return TRUE;
1433}
1434
1435boolean
1436lp_setup_update_state( struct lp_setup_context *setup,
1437                       boolean update_scene )
1438{
1439   /* Some of the 'draw' pipeline stages may have changed some driver state.
1440    * Make sure we've processed those state changes before anything else.
1441    *
1442    * XXX this is the only place where llvmpipe_context is used in the
1443    * setup code.  This may get refactored/changed...
1444    */
1445   {
1446      struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
1447      if (lp->dirty) {
1448         llvmpipe_update_derived(lp);
1449      }
1450
1451      if (lp->setup->dirty) {
1452         llvmpipe_update_setup(lp);
1453      }
1454
1455      assert(setup->setup.variant);
1456
1457      /* Will probably need to move this somewhere else, just need
1458       * to know about vertex shader point size attribute.
1459       */
1460      setup->psize_slot = lp->psize_slot;
1461      setup->viewport_index_slot = lp->viewport_index_slot;
1462      setup->layer_slot = lp->layer_slot;
1463      setup->face_slot = lp->face_slot;
1464
1465      assert(lp->dirty == 0);
1466
1467      assert(lp->setup_variant.key.size ==
1468	     setup->setup.variant->key.size);
1469
1470      assert(memcmp(&lp->setup_variant.key,
1471		    &setup->setup.variant->key,
1472		    setup->setup.variant->key.size) == 0);
1473   }
1474
1475   if (update_scene && setup->state != SETUP_ACTIVE) {
1476      if (!set_scene_state( setup, SETUP_ACTIVE, __FUNCTION__ ))
1477         return FALSE;
1478   }
1479
1480   /* Only call into update_scene_state() if we already have a
1481    * scene:
1482    */
1483   if (update_scene && setup->scene) {
1484      assert(setup->state == SETUP_ACTIVE);
1485
1486      if (try_update_scene_state(setup))
1487         return TRUE;
1488
1489      /* Update failed, try to restart the scene.
1490       *
1491       * Cannot call lp_setup_flush_and_restart() directly here
1492       * because of potential recursion.
1493       */
1494      if (!set_scene_state(setup, SETUP_FLUSHED, __FUNCTION__))
1495         return FALSE;
1496
1497      if (!set_scene_state(setup, SETUP_ACTIVE, __FUNCTION__))
1498         return FALSE;
1499
1500      if (!setup->scene)
1501         return FALSE;
1502
1503      return try_update_scene_state(setup);
1504   }
1505
1506   return TRUE;
1507}
1508
1509
1510
1511/* Only caller is lp_setup_vbuf_destroy()
1512 */
1513void
1514lp_setup_destroy( struct lp_setup_context *setup )
1515{
1516   uint i;
1517
1518   lp_setup_reset( setup );
1519
1520   util_unreference_framebuffer_state(&setup->fb);
1521
1522   for (i = 0; i < ARRAY_SIZE(setup->fs.current_tex); i++) {
1523      struct pipe_resource **res_ptr = &setup->fs.current_tex[i];
1524      if (*res_ptr)
1525         llvmpipe_resource_unmap(*res_ptr, 0, 0);
1526      pipe_resource_reference(res_ptr, NULL);
1527   }
1528
1529   for (i = 0; i < ARRAY_SIZE(setup->constants); i++) {
1530      pipe_resource_reference(&setup->constants[i].current.buffer, NULL);
1531   }
1532
1533   for (i = 0; i < ARRAY_SIZE(setup->ssbos); i++) {
1534      pipe_resource_reference(&setup->ssbos[i].current.buffer, NULL);
1535   }
1536
1537   /* free the scenes in the 'empty' queue */
1538   for (i = 0; i < ARRAY_SIZE(setup->scenes); i++) {
1539      struct lp_scene *scene = setup->scenes[i];
1540
1541      if (scene->fence)
1542         lp_fence_wait(scene->fence);
1543
1544      lp_scene_destroy(scene);
1545   }
1546
1547   lp_fence_reference(&setup->last_fence, NULL);
1548
1549   FREE( setup );
1550}
1551
1552
1553/**
1554 * Create a new primitive tiling engine.  Plug it into the backend of
1555 * the draw module.  Currently also creates a rasterizer to use with
1556 * it.
1557 */
1558struct lp_setup_context *
1559lp_setup_create( struct pipe_context *pipe,
1560                 struct draw_context *draw )
1561{
1562   struct llvmpipe_screen *screen = llvmpipe_screen(pipe->screen);
1563   struct lp_setup_context *setup;
1564   unsigned i;
1565
1566   setup = CALLOC_STRUCT(lp_setup_context);
1567   if (!setup) {
1568      goto no_setup;
1569   }
1570
1571   lp_setup_init_vbuf(setup);
1572
1573   /* Used only in update_state():
1574    */
1575   setup->pipe = pipe;
1576
1577
1578   setup->num_threads = screen->num_threads;
1579   setup->vbuf = draw_vbuf_stage(draw, &setup->base);
1580   if (!setup->vbuf) {
1581      goto no_vbuf;
1582   }
1583
1584   draw_set_rasterize_stage(draw, setup->vbuf);
1585   draw_set_render(draw, &setup->base);
1586
1587   /* create some empty scenes */
1588   for (i = 0; i < MAX_SCENES; i++) {
1589      setup->scenes[i] = lp_scene_create( pipe );
1590      if (!setup->scenes[i]) {
1591         goto no_scenes;
1592      }
1593   }
1594
1595   setup->triangle = first_triangle;
1596   setup->line     = first_line;
1597   setup->point    = first_point;
1598
1599   setup->dirty = ~0;
1600
1601   /* Initialize empty default fb correctly, so the rect is empty */
1602   setup->framebuffer.x1 = -1;
1603   setup->framebuffer.y1 = -1;
1604
1605   return setup;
1606
1607no_scenes:
1608   for (i = 0; i < MAX_SCENES; i++) {
1609      if (setup->scenes[i]) {
1610         lp_scene_destroy(setup->scenes[i]);
1611      }
1612   }
1613
1614   setup->vbuf->destroy(setup->vbuf);
1615no_vbuf:
1616   FREE(setup);
1617no_setup:
1618   return NULL;
1619}
1620
1621
1622/**
1623 * Put a BeginQuery command into all bins.
1624 */
1625void
1626lp_setup_begin_query(struct lp_setup_context *setup,
1627                     struct llvmpipe_query *pq)
1628{
1629   set_scene_state(setup, SETUP_ACTIVE, "begin_query");
1630
1631   if (!(pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1632         pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1633         pq->type == PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE ||
1634         pq->type == PIPE_QUERY_PIPELINE_STATISTICS ||
1635         pq->type == PIPE_QUERY_TIME_ELAPSED))
1636      return;
1637
1638   /* init the query to its beginning state */
1639   assert(setup->active_binned_queries < LP_MAX_ACTIVE_BINNED_QUERIES);
1640   /* exceeding list size so just ignore the query */
1641   if (setup->active_binned_queries >= LP_MAX_ACTIVE_BINNED_QUERIES) {
1642      return;
1643   }
1644   assert(setup->active_queries[setup->active_binned_queries] == NULL);
1645   setup->active_queries[setup->active_binned_queries] = pq;
1646   setup->active_binned_queries++;
1647
1648   assert(setup->scene);
1649   if (setup->scene) {
1650      if (!lp_scene_bin_everywhere(setup->scene,
1651                                   LP_RAST_OP_BEGIN_QUERY,
1652                                   lp_rast_arg_query(pq))) {
1653
1654         if (!lp_setup_flush_and_restart(setup))
1655            return;
1656
1657         if (!lp_scene_bin_everywhere(setup->scene,
1658                                      LP_RAST_OP_BEGIN_QUERY,
1659                                      lp_rast_arg_query(pq))) {
1660            return;
1661         }
1662      }
1663      setup->scene->had_queries |= TRUE;
1664   }
1665}
1666
1667
1668/**
1669 * Put an EndQuery command into all bins.
1670 */
1671void
1672lp_setup_end_query(struct lp_setup_context *setup, struct llvmpipe_query *pq)
1673{
1674   set_scene_state(setup, SETUP_ACTIVE, "end_query");
1675
1676   assert(setup->scene);
1677   if (setup->scene) {
1678      /* pq->fence should be the fence of the *last* scene which
1679       * contributed to the query result.
1680       */
1681      lp_fence_reference(&pq->fence, setup->scene->fence);
1682
1683      if (pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1684          pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1685          pq->type == PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE ||
1686          pq->type == PIPE_QUERY_PIPELINE_STATISTICS ||
1687          pq->type == PIPE_QUERY_TIMESTAMP ||
1688          pq->type == PIPE_QUERY_TIME_ELAPSED) {
1689         if (pq->type == PIPE_QUERY_TIMESTAMP &&
1690               !(setup->scene->tiles_x | setup->scene->tiles_y)) {
1691            /*
1692             * If there's a zero width/height framebuffer, there's no bins and
1693             * hence no rast task is ever run. So fill in something here instead.
1694             */
1695            pq->end[0] = os_time_get_nano();
1696         }
1697
1698         if (!lp_scene_bin_everywhere(setup->scene,
1699                                      LP_RAST_OP_END_QUERY,
1700                                      lp_rast_arg_query(pq))) {
1701            if (!lp_setup_flush_and_restart(setup))
1702               goto fail;
1703
1704            if (!lp_scene_bin_everywhere(setup->scene,
1705                                         LP_RAST_OP_END_QUERY,
1706                                         lp_rast_arg_query(pq))) {
1707               goto fail;
1708            }
1709         }
1710         setup->scene->had_queries |= TRUE;
1711      }
1712   }
1713   else {
1714      lp_fence_reference(&pq->fence, setup->last_fence);
1715   }
1716
1717fail:
1718   /* Need to do this now not earlier since it still needs to be marked as
1719    * active when binning it would cause a flush.
1720    */
1721   if (pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1722      pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1723      pq->type == PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE ||
1724      pq->type == PIPE_QUERY_PIPELINE_STATISTICS ||
1725      pq->type == PIPE_QUERY_TIME_ELAPSED) {
1726      unsigned i;
1727
1728      /* remove from active binned query list */
1729      for (i = 0; i < setup->active_binned_queries; i++) {
1730         if (setup->active_queries[i] == pq)
1731            break;
1732      }
1733      assert(i < setup->active_binned_queries);
1734      if (i == setup->active_binned_queries)
1735         return;
1736      setup->active_binned_queries--;
1737      setup->active_queries[i] = setup->active_queries[setup->active_binned_queries];
1738      setup->active_queries[setup->active_binned_queries] = NULL;
1739   }
1740}
1741
1742
1743boolean
1744lp_setup_flush_and_restart(struct lp_setup_context *setup)
1745{
1746   if (0) debug_printf("%s\n", __FUNCTION__);
1747
1748   assert(setup->state == SETUP_ACTIVE);
1749
1750   if (!set_scene_state(setup, SETUP_FLUSHED, __FUNCTION__))
1751      return FALSE;
1752
1753   if (!lp_setup_update_state(setup, TRUE))
1754      return FALSE;
1755
1756   return TRUE;
1757}
1758
1759void
1760lp_setup_add_scissor_planes(const struct u_rect *scissor,
1761                            struct lp_rast_plane *plane_s,
1762                            boolean s_planes[4], bool multisample)
1763{
1764   /*
1765    * When rasterizing scissored tris, use the intersection of the
1766    * triangle bounding box and the scissor rect to generate the
1767    * scissor planes.
1768    *
1769    * This permits us to cut off the triangle "tails" that are present
1770    * in the intermediate recursive levels caused when two of the
1771    * triangles edges don't diverge quickly enough to trivially reject
1772    * exterior blocks from the triangle.
1773    *
1774    * It's not really clear if it's worth worrying about these tails,
1775    * but since we generate the planes for each scissored tri, it's
1776    * free to trim them in this case.
1777    *
1778    * Note that otherwise, the scissor planes only vary in 'C' value,
1779    * and even then only on state-changes.  Could alternatively store
1780    * these planes elsewhere.
1781    * (Or only store the c value together with a bit indicating which
1782    * scissor edge this is, so rasterization would treat them differently
1783    * (easier to evaluate) to ordinary planes.)
1784    */
1785   int adj = multisample ? 127 : 0;
1786   if (s_planes[0]) {
1787      int x0 = scissor->x0 - 1;
1788      plane_s->dcdx = ~0U << 8;
1789      plane_s->dcdy = 0;
1790      plane_s->c = x0 << 8;
1791      plane_s->c += adj;
1792      plane_s->c = -plane_s->c; /* flip sign */
1793      plane_s->eo = 1 << 8;
1794      plane_s++;
1795   }
1796   if (s_planes[1]) {
1797      int x1 = scissor->x1;
1798      plane_s->dcdx = 1 << 8;
1799      plane_s->dcdy = 0;
1800      plane_s->c = x1 << 8;
1801      plane_s->c += 127 + adj;
1802      plane_s->eo = 0 << 8;
1803      plane_s++;
1804   }
1805   if (s_planes[2]) {
1806      int y0 = scissor->y0 - 1;
1807      plane_s->dcdx = 0;
1808      plane_s->dcdy = 1 << 8;
1809      plane_s->c = y0 << 8;
1810      plane_s->c += adj;
1811      plane_s->c = -plane_s->c; /* flip sign */
1812      plane_s->eo = 1 << 8;
1813      plane_s++;
1814   }
1815   if (s_planes[3]) {
1816      int y1 = scissor->y1;
1817      plane_s->dcdx = 0;
1818      plane_s->dcdy = ~0U << 8;
1819      plane_s->c = y1 << 8;
1820      plane_s->c += 127 + adj;
1821      plane_s->eo = 0;
1822      plane_s++;
1823   }
1824}
1825