etnaviv_state.c revision 01e04c3f
1/*
2 * Copyright (c) 2012-2015 Etnaviv Project
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
13 * of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 *
23 * Authors:
24 *    Wladimir J. van der Laan <laanwj@gmail.com>
25 *    Christian Gmeiner <christian.gmeiner@gmail.com>
26 */
27
28#include "etnaviv_state.h"
29
30#include "hw/common.xml.h"
31
32#include "etnaviv_blend.h"
33#include "etnaviv_clear_blit.h"
34#include "etnaviv_context.h"
35#include "etnaviv_format.h"
36#include "etnaviv_shader.h"
37#include "etnaviv_surface.h"
38#include "etnaviv_translate.h"
39#include "etnaviv_util.h"
40#include "util/u_framebuffer.h"
41#include "util/u_helpers.h"
42#include "util/u_inlines.h"
43#include "util/u_math.h"
44#include "util/u_memory.h"
45
46static void
47etna_set_stencil_ref(struct pipe_context *pctx, const struct pipe_stencil_ref *sr)
48{
49   struct etna_context *ctx = etna_context(pctx);
50   struct compiled_stencil_ref *cs = &ctx->stencil_ref;
51
52   ctx->stencil_ref_s = *sr;
53
54   cs->PE_STENCIL_CONFIG = VIVS_PE_STENCIL_CONFIG_REF_FRONT(sr->ref_value[0]);
55   /* rest of bits weaved in from depth_stencil_alpha */
56   cs->PE_STENCIL_CONFIG_EXT =
57      VIVS_PE_STENCIL_CONFIG_EXT_REF_BACK(sr->ref_value[0]);
58   ctx->dirty |= ETNA_DIRTY_STENCIL_REF;
59}
60
61static void
62etna_set_clip_state(struct pipe_context *pctx, const struct pipe_clip_state *pcs)
63{
64   /* NOOP */
65}
66
67static void
68etna_set_sample_mask(struct pipe_context *pctx, unsigned sample_mask)
69{
70   struct etna_context *ctx = etna_context(pctx);
71
72   ctx->sample_mask = sample_mask;
73   ctx->dirty |= ETNA_DIRTY_SAMPLE_MASK;
74}
75
76static void
77etna_set_constant_buffer(struct pipe_context *pctx,
78      enum pipe_shader_type shader, uint index,
79      const struct pipe_constant_buffer *cb)
80{
81   struct etna_context *ctx = etna_context(pctx);
82
83   if (unlikely(index > 0)) {
84      DBG("Unhandled buffer index %i", index);
85      return;
86   }
87
88
89   util_copy_constant_buffer(&ctx->constant_buffer[shader], cb);
90
91   /* Note that the state tracker can unbind constant buffers by
92    * passing NULL here. */
93   if (unlikely(!cb || (!cb->buffer && !cb->user_buffer)))
94      return;
95
96   /* there is no support for ARB_uniform_buffer_object */
97   assert(cb->buffer == NULL && cb->user_buffer != NULL);
98
99   ctx->dirty |= ETNA_DIRTY_CONSTBUF;
100}
101
102static void
103etna_update_render_resource(struct pipe_context *pctx, struct pipe_resource *pres)
104{
105   struct etna_resource *res = etna_resource(pres);
106
107   if (res->texture && etna_resource_older(res, etna_resource(res->texture))) {
108      /* The render buffer is older than the texture buffer. Copy it over. */
109      etna_copy_resource(pctx, pres, res->texture, 0, pres->last_level);
110      res->seqno = etna_resource(res->texture)->seqno;
111   }
112}
113
114static void
115etna_set_framebuffer_state(struct pipe_context *pctx,
116      const struct pipe_framebuffer_state *sv)
117{
118   struct etna_context *ctx = etna_context(pctx);
119   struct compiled_framebuffer_state *cs = &ctx->framebuffer;
120   int nr_samples_color = -1;
121   int nr_samples_depth = -1;
122
123   /* Set up TS as well. Warning: this state is used by both the RS and PE */
124   uint32_t ts_mem_config = 0;
125
126   if (sv->nr_cbufs > 0) { /* at least one color buffer? */
127      struct etna_surface *cbuf = etna_surface(sv->cbufs[0]);
128      struct etna_resource *res = etna_resource(cbuf->base.texture);
129      bool color_supertiled = (res->layout & ETNA_LAYOUT_BIT_SUPER) != 0;
130
131      assert(res->layout & ETNA_LAYOUT_BIT_TILE); /* Cannot render to linear surfaces */
132      etna_update_render_resource(pctx, cbuf->base.texture);
133
134      cs->PE_COLOR_FORMAT =
135         VIVS_PE_COLOR_FORMAT_FORMAT(translate_rs_format(cbuf->base.format)) |
136         VIVS_PE_COLOR_FORMAT_COMPONENTS__MASK |
137         VIVS_PE_COLOR_FORMAT_OVERWRITE |
138         COND(color_supertiled, VIVS_PE_COLOR_FORMAT_SUPER_TILED) |
139         COND(color_supertiled && ctx->specs.halti >= 5, VIVS_PE_COLOR_FORMAT_SUPER_TILED_NEW);
140      /* VIVS_PE_COLOR_FORMAT_COMPONENTS() and
141       * VIVS_PE_COLOR_FORMAT_OVERWRITE comes from blend_state
142       * but only if we set the bits above. */
143      /* merged with depth_stencil_alpha */
144      if ((cbuf->surf.offset & 63) ||
145          (((cbuf->surf.stride * 4) & 63) && cbuf->surf.height > 4)) {
146         /* XXX Must make temporary surface here.
147          * Need the same mechanism on gc2000 when we want to do mipmap
148          * generation by
149          * rendering to levels > 1 due to multitiled / tiled conversion. */
150         BUG("Alignment error, trying to render to offset %08x with tile "
151             "stride %i",
152             cbuf->surf.offset, cbuf->surf.stride * 4);
153      }
154
155      if (ctx->specs.pixel_pipes == 1) {
156         cs->PE_COLOR_ADDR = cbuf->reloc[0];
157         cs->PE_COLOR_ADDR.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
158      } else {
159         /* Rendered textures must always be multi-tiled, or single-buffer mode must be supported */
160         assert((res->layout & ETNA_LAYOUT_BIT_MULTI) || ctx->specs.single_buffer);
161         for (int i = 0; i < ctx->specs.pixel_pipes; i++) {
162            cs->PE_PIPE_COLOR_ADDR[i] = cbuf->reloc[i];
163            cs->PE_PIPE_COLOR_ADDR[i].flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
164         }
165      }
166      cs->PE_COLOR_STRIDE = cbuf->surf.stride;
167
168      if (cbuf->surf.ts_size) {
169         cs->TS_COLOR_CLEAR_VALUE = cbuf->level->clear_value;
170
171         cs->TS_COLOR_STATUS_BASE = cbuf->ts_reloc;
172         cs->TS_COLOR_STATUS_BASE.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
173
174         cs->TS_COLOR_SURFACE_BASE = cbuf->reloc[0];
175         cs->TS_COLOR_SURFACE_BASE.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
176      }
177
178      /* MSAA */
179      if (cbuf->base.texture->nr_samples > 1)
180         ts_mem_config |=
181            VIVS_TS_MEM_CONFIG_COLOR_COMPRESSION | translate_msaa_format(cbuf->base.format);
182
183      nr_samples_color = cbuf->base.texture->nr_samples;
184   } else {
185      /* Clearing VIVS_PE_COLOR_FORMAT_COMPONENTS__MASK and
186       * VIVS_PE_COLOR_FORMAT_OVERWRITE prevents us from overwriting the
187       * color target */
188      cs->PE_COLOR_FORMAT = VIVS_PE_COLOR_FORMAT_OVERWRITE;
189      cs->PE_COLOR_STRIDE = 0;
190      cs->TS_COLOR_STATUS_BASE.bo = NULL;
191      cs->TS_COLOR_SURFACE_BASE.bo = NULL;
192
193      for (int i = 0; i < ETNA_MAX_PIXELPIPES; i++)
194         cs->PE_PIPE_COLOR_ADDR[i].bo = NULL;
195   }
196
197   if (sv->zsbuf != NULL) {
198      struct etna_surface *zsbuf = etna_surface(sv->zsbuf);
199      struct etna_resource *res = etna_resource(zsbuf->base.texture);
200
201      etna_update_render_resource(pctx, zsbuf->base.texture);
202
203      assert(res->layout &ETNA_LAYOUT_BIT_TILE); /* Cannot render to linear surfaces */
204
205      uint32_t depth_format = translate_depth_format(zsbuf->base.format);
206      unsigned depth_bits =
207         depth_format == VIVS_PE_DEPTH_CONFIG_DEPTH_FORMAT_D16 ? 16 : 24;
208      bool depth_supertiled = (res->layout & ETNA_LAYOUT_BIT_SUPER) != 0;
209
210      cs->PE_DEPTH_CONFIG =
211         depth_format |
212         COND(depth_supertiled, VIVS_PE_DEPTH_CONFIG_SUPER_TILED) |
213         VIVS_PE_DEPTH_CONFIG_DEPTH_MODE_Z |
214         COND(ctx->specs.halti >= 5, VIVS_PE_DEPTH_CONFIG_DISABLE_ZS) /* Needs to be enabled on GC7000, otherwise depth writes hang w/ TS - apparently it does something else now */
215         ;
216      /* VIVS_PE_DEPTH_CONFIG_ONLY_DEPTH */
217      /* merged with depth_stencil_alpha */
218
219      if (ctx->specs.pixel_pipes == 1) {
220         cs->PE_DEPTH_ADDR = zsbuf->reloc[0];
221         cs->PE_DEPTH_ADDR.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
222      } else {
223         for (int i = 0; i < ctx->specs.pixel_pipes; i++) {
224            cs->PE_PIPE_DEPTH_ADDR[i] = zsbuf->reloc[i];
225            cs->PE_PIPE_DEPTH_ADDR[i].flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
226         }
227      }
228
229      cs->PE_DEPTH_STRIDE = zsbuf->surf.stride;
230      cs->PE_HDEPTH_CONTROL = VIVS_PE_HDEPTH_CONTROL_FORMAT_DISABLED;
231      cs->PE_DEPTH_NORMALIZE = fui(exp2f(depth_bits) - 1.0f);
232
233      if (zsbuf->surf.ts_size) {
234         cs->TS_DEPTH_CLEAR_VALUE = zsbuf->level->clear_value;
235
236         cs->TS_DEPTH_STATUS_BASE = zsbuf->ts_reloc;
237         cs->TS_DEPTH_STATUS_BASE.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
238
239         cs->TS_DEPTH_SURFACE_BASE = zsbuf->reloc[0];
240         cs->TS_DEPTH_SURFACE_BASE.flags = ETNA_RELOC_READ | ETNA_RELOC_WRITE;
241      }
242
243      ts_mem_config |= COND(depth_bits == 16, VIVS_TS_MEM_CONFIG_DEPTH_16BPP);
244
245      /* MSAA */
246      if (zsbuf->base.texture->nr_samples > 1)
247         /* XXX VIVS_TS_MEM_CONFIG_DEPTH_COMPRESSION;
248          * Disable without MSAA for now, as it causes corruption in glquake. */
249         ts_mem_config |= VIVS_TS_MEM_CONFIG_DEPTH_COMPRESSION;
250
251      nr_samples_depth = zsbuf->base.texture->nr_samples;
252   } else {
253      cs->PE_DEPTH_CONFIG = VIVS_PE_DEPTH_CONFIG_DEPTH_MODE_NONE;
254      cs->PE_DEPTH_ADDR.bo = NULL;
255      cs->PE_DEPTH_STRIDE = 0;
256      cs->TS_DEPTH_STATUS_BASE.bo = NULL;
257      cs->TS_DEPTH_SURFACE_BASE.bo = NULL;
258
259      for (int i = 0; i < ETNA_MAX_PIXELPIPES; i++)
260         cs->PE_PIPE_DEPTH_ADDR[i].bo = NULL;
261   }
262
263   /* MSAA setup */
264   if (nr_samples_depth != -1 && nr_samples_color != -1 &&
265       nr_samples_depth != nr_samples_color) {
266      BUG("Number of samples in color and depth texture must match (%i and %i respectively)",
267          nr_samples_color, nr_samples_depth);
268   }
269
270   switch (MAX2(nr_samples_depth, nr_samples_color)) {
271   case 0:
272   case 1: /* Are 0 and 1 samples allowed? */
273      cs->GL_MULTI_SAMPLE_CONFIG =
274         VIVS_GL_MULTI_SAMPLE_CONFIG_MSAA_SAMPLES_NONE;
275      cs->msaa_mode = false;
276      break;
277   case 2:
278      cs->GL_MULTI_SAMPLE_CONFIG = VIVS_GL_MULTI_SAMPLE_CONFIG_MSAA_SAMPLES_2X;
279      cs->msaa_mode = true; /* Add input to PS */
280      cs->RA_MULTISAMPLE_UNK00E04 = 0x0;
281      cs->RA_MULTISAMPLE_UNK00E10[0] = 0x0000aa22;
282      cs->RA_CENTROID_TABLE[0] = 0x66aa2288;
283      cs->RA_CENTROID_TABLE[1] = 0x88558800;
284      cs->RA_CENTROID_TABLE[2] = 0x88881100;
285      cs->RA_CENTROID_TABLE[3] = 0x33888800;
286      break;
287   case 4:
288      cs->GL_MULTI_SAMPLE_CONFIG = VIVS_GL_MULTI_SAMPLE_CONFIG_MSAA_SAMPLES_4X;
289      cs->msaa_mode = true; /* Add input to PS */
290      cs->RA_MULTISAMPLE_UNK00E04 = 0x0;
291      cs->RA_MULTISAMPLE_UNK00E10[0] = 0xeaa26e26;
292      cs->RA_MULTISAMPLE_UNK00E10[1] = 0xe6ae622a;
293      cs->RA_MULTISAMPLE_UNK00E10[2] = 0xaaa22a22;
294      cs->RA_CENTROID_TABLE[0] = 0x4a6e2688;
295      cs->RA_CENTROID_TABLE[1] = 0x888888a2;
296      cs->RA_CENTROID_TABLE[2] = 0x888888ea;
297      cs->RA_CENTROID_TABLE[3] = 0x888888c6;
298      cs->RA_CENTROID_TABLE[4] = 0x46622a88;
299      cs->RA_CENTROID_TABLE[5] = 0x888888ae;
300      cs->RA_CENTROID_TABLE[6] = 0x888888e6;
301      cs->RA_CENTROID_TABLE[7] = 0x888888ca;
302      cs->RA_CENTROID_TABLE[8] = 0x262a2288;
303      cs->RA_CENTROID_TABLE[9] = 0x886688a2;
304      cs->RA_CENTROID_TABLE[10] = 0x888866aa;
305      cs->RA_CENTROID_TABLE[11] = 0x668888a6;
306      break;
307   }
308
309   /* Scissor setup */
310   cs->SE_SCISSOR_LEFT = 0; /* affected by rasterizer and scissor state as well */
311   cs->SE_SCISSOR_TOP = 0;
312   cs->SE_SCISSOR_RIGHT = (sv->width << 16) + ETNA_SE_SCISSOR_MARGIN_RIGHT;
313   cs->SE_SCISSOR_BOTTOM = (sv->height << 16) + ETNA_SE_SCISSOR_MARGIN_BOTTOM;
314   cs->SE_CLIP_RIGHT = (sv->width << 16) + ETNA_SE_CLIP_MARGIN_RIGHT;
315   cs->SE_CLIP_BOTTOM = (sv->height << 16) + ETNA_SE_CLIP_MARGIN_BOTTOM;
316
317   cs->TS_MEM_CONFIG = ts_mem_config;
318
319   /* Single buffer setup. There is only one switch for this, not a separate
320    * one per color buffer / depth buffer. To keep the logic simple always use
321    * single buffer when this feature is available.
322    */
323   cs->PE_LOGIC_OP = VIVS_PE_LOGIC_OP_SINGLE_BUFFER(ctx->specs.single_buffer ? 3 : 0);
324
325   /* keep copy of original structure */
326   util_copy_framebuffer_state(&ctx->framebuffer_s, sv);
327   ctx->dirty |= ETNA_DIRTY_FRAMEBUFFER | ETNA_DIRTY_DERIVE_TS;
328}
329
330static void
331etna_set_polygon_stipple(struct pipe_context *pctx,
332      const struct pipe_poly_stipple *stipple)
333{
334   /* NOP */
335}
336
337static void
338etna_set_scissor_states(struct pipe_context *pctx, unsigned start_slot,
339      unsigned num_scissors, const struct pipe_scissor_state *ss)
340{
341   struct etna_context *ctx = etna_context(pctx);
342   struct compiled_scissor_state *cs = &ctx->scissor;
343   assert(ss->minx <= ss->maxx);
344   assert(ss->miny <= ss->maxy);
345
346   /* note that this state is only used when rasterizer_state->scissor is on */
347   ctx->scissor_s = *ss;
348   cs->SE_SCISSOR_LEFT = (ss->minx << 16);
349   cs->SE_SCISSOR_TOP = (ss->miny << 16);
350   cs->SE_SCISSOR_RIGHT = (ss->maxx << 16) + ETNA_SE_SCISSOR_MARGIN_RIGHT;
351   cs->SE_SCISSOR_BOTTOM = (ss->maxy << 16) + ETNA_SE_SCISSOR_MARGIN_BOTTOM;
352   cs->SE_CLIP_RIGHT = (ss->maxx << 16) + ETNA_SE_CLIP_MARGIN_RIGHT;
353   cs->SE_CLIP_BOTTOM = (ss->maxy << 16) + ETNA_SE_CLIP_MARGIN_BOTTOM;
354
355   ctx->dirty |= ETNA_DIRTY_SCISSOR;
356}
357
358static void
359etna_set_viewport_states(struct pipe_context *pctx, unsigned start_slot,
360      unsigned num_scissors, const struct pipe_viewport_state *vs)
361{
362   struct etna_context *ctx = etna_context(pctx);
363   struct compiled_viewport_state *cs = &ctx->viewport;
364
365   ctx->viewport_s = *vs;
366   /**
367    * For Vivante GPU, viewport z transformation is 0..1 to 0..1 instead of
368    * -1..1 to 0..1.
369    * scaling and translation to 0..1 already happened, so remove that
370    *
371    * z' = (z * 2 - 1) * scale + translate
372    *    = z * (2 * scale) + (translate - scale)
373    *
374    * scale' = 2 * scale
375    * translate' = translate - scale
376    */
377
378   /* must be fixp as v4 state deltas assume it is */
379   cs->PA_VIEWPORT_SCALE_X = etna_f32_to_fixp16(vs->scale[0]);
380   cs->PA_VIEWPORT_SCALE_Y = etna_f32_to_fixp16(vs->scale[1]);
381   cs->PA_VIEWPORT_SCALE_Z = fui(vs->scale[2] * 2.0f);
382   cs->PA_VIEWPORT_OFFSET_X = etna_f32_to_fixp16(vs->translate[0]);
383   cs->PA_VIEWPORT_OFFSET_Y = etna_f32_to_fixp16(vs->translate[1]);
384   cs->PA_VIEWPORT_OFFSET_Z = fui(vs->translate[2] - vs->scale[2]);
385
386   /* Compute scissor rectangle (fixp) from viewport.
387    * Make sure left is always < right and top always < bottom.
388    */
389   cs->SE_SCISSOR_LEFT = etna_f32_to_fixp16(MAX2(vs->translate[0] - fabsf(vs->scale[0]), 0.0f));
390   cs->SE_SCISSOR_TOP = etna_f32_to_fixp16(MAX2(vs->translate[1] - fabsf(vs->scale[1]), 0.0f));
391   uint32_t right_fixp = etna_f32_to_fixp16(MAX2(vs->translate[0] + fabsf(vs->scale[0]), 0.0f));
392   uint32_t bottom_fixp = etna_f32_to_fixp16(MAX2(vs->translate[1] + fabsf(vs->scale[1]), 0.0f));
393   cs->SE_SCISSOR_RIGHT = right_fixp + ETNA_SE_SCISSOR_MARGIN_RIGHT;
394   cs->SE_SCISSOR_BOTTOM = bottom_fixp + ETNA_SE_SCISSOR_MARGIN_BOTTOM;
395   cs->SE_CLIP_RIGHT = right_fixp + ETNA_SE_CLIP_MARGIN_RIGHT;
396   cs->SE_CLIP_BOTTOM = bottom_fixp + ETNA_SE_CLIP_MARGIN_BOTTOM;
397
398   cs->PE_DEPTH_NEAR = fui(0.0); /* not affected if depth mode is Z (as in GL) */
399   cs->PE_DEPTH_FAR = fui(1.0);
400   ctx->dirty |= ETNA_DIRTY_VIEWPORT;
401}
402
403static void
404etna_set_vertex_buffers(struct pipe_context *pctx, unsigned start_slot,
405      unsigned num_buffers, const struct pipe_vertex_buffer *vb)
406{
407   struct etna_context *ctx = etna_context(pctx);
408   struct etna_vertexbuf_state *so = &ctx->vertex_buffer;
409
410   util_set_vertex_buffers_mask(so->vb, &so->enabled_mask, vb, start_slot, num_buffers);
411   so->count = util_last_bit(so->enabled_mask);
412
413   for (unsigned idx = start_slot; idx < start_slot + num_buffers; ++idx) {
414      struct compiled_set_vertex_buffer *cs = &so->cvb[idx];
415      struct pipe_vertex_buffer *vbi = &so->vb[idx];
416
417      assert(!vbi->is_user_buffer); /* XXX support user_buffer using
418                                       etna_usermem_map */
419
420      if (vbi->buffer.resource) { /* GPU buffer */
421         cs->FE_VERTEX_STREAM_BASE_ADDR.bo = etna_resource(vbi->buffer.resource)->bo;
422         cs->FE_VERTEX_STREAM_BASE_ADDR.offset = vbi->buffer_offset;
423         cs->FE_VERTEX_STREAM_BASE_ADDR.flags = ETNA_RELOC_READ;
424         cs->FE_VERTEX_STREAM_CONTROL =
425            FE_VERTEX_STREAM_CONTROL_VERTEX_STRIDE(vbi->stride);
426      } else {
427         cs->FE_VERTEX_STREAM_BASE_ADDR.bo = NULL;
428         cs->FE_VERTEX_STREAM_CONTROL = 0;
429      }
430   }
431
432   ctx->dirty |= ETNA_DIRTY_VERTEX_BUFFERS;
433}
434
435static void
436etna_blend_state_bind(struct pipe_context *pctx, void *bs)
437{
438   struct etna_context *ctx = etna_context(pctx);
439
440   ctx->blend = bs;
441   ctx->dirty |= ETNA_DIRTY_BLEND;
442}
443
444static void
445etna_blend_state_delete(struct pipe_context *pctx, void *bs)
446{
447   FREE(bs);
448}
449
450static void
451etna_rasterizer_state_bind(struct pipe_context *pctx, void *rs)
452{
453   struct etna_context *ctx = etna_context(pctx);
454
455   ctx->rasterizer = rs;
456   ctx->dirty |= ETNA_DIRTY_RASTERIZER;
457}
458
459static void
460etna_rasterizer_state_delete(struct pipe_context *pctx, void *rs)
461{
462   FREE(rs);
463}
464
465static void
466etna_zsa_state_bind(struct pipe_context *pctx, void *zs)
467{
468   struct etna_context *ctx = etna_context(pctx);
469
470   ctx->zsa = zs;
471   ctx->dirty |= ETNA_DIRTY_ZSA;
472}
473
474static void
475etna_zsa_state_delete(struct pipe_context *pctx, void *zs)
476{
477   FREE(zs);
478}
479
480/** Create vertex element states, which define a layout for fetching
481 * vertices for rendering.
482 */
483static void *
484etna_vertex_elements_state_create(struct pipe_context *pctx,
485      unsigned num_elements, const struct pipe_vertex_element *elements)
486{
487   struct etna_context *ctx = etna_context(pctx);
488   struct compiled_vertex_elements_state *cs = CALLOC_STRUCT(compiled_vertex_elements_state);
489
490   if (!cs)
491      return NULL;
492
493   if (num_elements > ctx->specs.vertex_max_elements) {
494      BUG("number of elements (%u) exceeds chip maximum (%u)", num_elements,
495          ctx->specs.vertex_max_elements);
496      return NULL;
497   }
498
499   /* XXX could minimize number of consecutive stretches here by sorting, and
500    * permuting the inputs in shader or does Mesa do this already? */
501
502   /* Check that vertex element binding is compatible with hardware; thus
503    * elements[idx].vertex_buffer_index are < stream_count. If not, the binding
504    * uses more streams than is supported, and u_vbuf should have done some
505    * reorganization for compatibility. */
506
507   /* TODO: does mesa this for us? */
508   bool incompatible = false;
509   for (unsigned idx = 0; idx < num_elements; ++idx) {
510      if (elements[idx].vertex_buffer_index >= ctx->specs.stream_count || elements[idx].instance_divisor > 0)
511         incompatible = true;
512   }
513
514   cs->num_elements = num_elements;
515   if (incompatible || num_elements == 0) {
516      DBG("Error: zero vertex elements, or more vertex buffers used than supported");
517      FREE(cs);
518      return NULL;
519   }
520
521   unsigned start_offset = 0; /* start of current consecutive stretch */
522   bool nonconsecutive = true; /* previous value of nonconsecutive */
523
524   for (unsigned idx = 0; idx < num_elements; ++idx) {
525      unsigned element_size = util_format_get_blocksize(elements[idx].src_format);
526      unsigned end_offset = elements[idx].src_offset + element_size;
527      uint32_t format_type, normalize;
528
529      if (nonconsecutive)
530         start_offset = elements[idx].src_offset;
531
532      /* maximum vertex size is 256 bytes */
533      assert(element_size != 0 && end_offset <= 256);
534
535      /* check whether next element is consecutive to this one */
536      nonconsecutive = (idx == (num_elements - 1)) ||
537                       elements[idx + 1].vertex_buffer_index != elements[idx].vertex_buffer_index ||
538                       end_offset != elements[idx + 1].src_offset;
539
540      format_type = translate_vertex_format_type(elements[idx].src_format);
541      normalize = translate_vertex_format_normalize(elements[idx].src_format);
542
543      assert(format_type != ETNA_NO_MATCH);
544      assert(normalize != ETNA_NO_MATCH);
545
546      if (ctx->specs.halti < 5) {
547         cs->FE_VERTEX_ELEMENT_CONFIG[idx] =
548            COND(nonconsecutive, VIVS_FE_VERTEX_ELEMENT_CONFIG_NONCONSECUTIVE) |
549            format_type |
550            VIVS_FE_VERTEX_ELEMENT_CONFIG_NUM(util_format_get_nr_components(elements[idx].src_format)) |
551            normalize | VIVS_FE_VERTEX_ELEMENT_CONFIG_ENDIAN(ENDIAN_MODE_NO_SWAP) |
552            VIVS_FE_VERTEX_ELEMENT_CONFIG_STREAM(elements[idx].vertex_buffer_index) |
553            VIVS_FE_VERTEX_ELEMENT_CONFIG_START(elements[idx].src_offset) |
554            VIVS_FE_VERTEX_ELEMENT_CONFIG_END(end_offset - start_offset);
555      } else { /* HALTI5 spread vertex attrib config over two registers */
556         cs->NFE_GENERIC_ATTRIB_CONFIG0[idx] =
557            format_type |
558            VIVS_NFE_GENERIC_ATTRIB_CONFIG0_NUM(util_format_get_nr_components(elements[idx].src_format)) |
559            normalize | VIVS_NFE_GENERIC_ATTRIB_CONFIG0_ENDIAN(ENDIAN_MODE_NO_SWAP) |
560            VIVS_NFE_GENERIC_ATTRIB_CONFIG0_STREAM(elements[idx].vertex_buffer_index) |
561            VIVS_NFE_GENERIC_ATTRIB_CONFIG0_START(elements[idx].src_offset);
562         cs->NFE_GENERIC_ATTRIB_CONFIG1[idx] =
563            COND(nonconsecutive, VIVS_NFE_GENERIC_ATTRIB_CONFIG1_NONCONSECUTIVE) |
564            VIVS_NFE_GENERIC_ATTRIB_CONFIG1_END(end_offset - start_offset);
565      }
566      cs->NFE_GENERIC_ATTRIB_SCALE[idx] = 0x3f800000; /* 1 for integer, 1.0 for float */
567   }
568
569   return cs;
570}
571
572static void
573etna_vertex_elements_state_delete(struct pipe_context *pctx, void *ve)
574{
575   FREE(ve);
576}
577
578static void
579etna_vertex_elements_state_bind(struct pipe_context *pctx, void *ve)
580{
581   struct etna_context *ctx = etna_context(pctx);
582
583   ctx->vertex_elements = ve;
584   ctx->dirty |= ETNA_DIRTY_VERTEX_ELEMENTS;
585}
586
587static bool
588etna_update_ts_config(struct etna_context *ctx)
589{
590   uint32_t new_ts_config = ctx->framebuffer.TS_MEM_CONFIG;
591
592   if (ctx->framebuffer_s.nr_cbufs > 0) {
593      struct etna_surface *c_surf = etna_surface(ctx->framebuffer_s.cbufs[0]);
594
595      if(c_surf->level->ts_size && c_surf->level->ts_valid) {
596         new_ts_config |= VIVS_TS_MEM_CONFIG_COLOR_FAST_CLEAR;
597      } else {
598         new_ts_config &= ~VIVS_TS_MEM_CONFIG_COLOR_FAST_CLEAR;
599      }
600   }
601
602   if (ctx->framebuffer_s.zsbuf) {
603      struct etna_surface *zs_surf = etna_surface(ctx->framebuffer_s.zsbuf);
604
605      if(zs_surf->level->ts_size && zs_surf->level->ts_valid) {
606         new_ts_config |= VIVS_TS_MEM_CONFIG_DEPTH_FAST_CLEAR;
607      } else {
608         new_ts_config &= ~VIVS_TS_MEM_CONFIG_DEPTH_FAST_CLEAR;
609      }
610   }
611
612   if (new_ts_config != ctx->framebuffer.TS_MEM_CONFIG ||
613       (ctx->dirty & ETNA_DIRTY_FRAMEBUFFER)) {
614      ctx->framebuffer.TS_MEM_CONFIG = new_ts_config;
615      ctx->dirty |= ETNA_DIRTY_TS;
616   }
617
618   ctx->dirty &= ~ETNA_DIRTY_DERIVE_TS;
619
620   return true;
621}
622
623struct etna_state_updater {
624   bool (*update)(struct etna_context *ctx);
625   uint32_t dirty;
626};
627
628static const struct etna_state_updater etna_state_updates[] = {
629   {
630      etna_shader_update_vertex, ETNA_DIRTY_SHADER | ETNA_DIRTY_VERTEX_ELEMENTS,
631   },
632   {
633      etna_shader_link, ETNA_DIRTY_SHADER,
634   },
635   {
636      etna_update_blend, ETNA_DIRTY_BLEND | ETNA_DIRTY_FRAMEBUFFER
637   },
638   {
639      etna_update_blend_color, ETNA_DIRTY_BLEND_COLOR | ETNA_DIRTY_FRAMEBUFFER,
640   },
641   {
642      etna_update_ts_config, ETNA_DIRTY_DERIVE_TS,
643   }
644};
645
646bool
647etna_state_update(struct etna_context *ctx)
648{
649   for (unsigned int i = 0; i < ARRAY_SIZE(etna_state_updates); i++)
650      if (ctx->dirty & etna_state_updates[i].dirty)
651         if (!etna_state_updates[i].update(ctx))
652            return false;
653
654   return true;
655}
656
657void
658etna_state_init(struct pipe_context *pctx)
659{
660   pctx->set_blend_color = etna_set_blend_color;
661   pctx->set_stencil_ref = etna_set_stencil_ref;
662   pctx->set_clip_state = etna_set_clip_state;
663   pctx->set_sample_mask = etna_set_sample_mask;
664   pctx->set_constant_buffer = etna_set_constant_buffer;
665   pctx->set_framebuffer_state = etna_set_framebuffer_state;
666   pctx->set_polygon_stipple = etna_set_polygon_stipple;
667   pctx->set_scissor_states = etna_set_scissor_states;
668   pctx->set_viewport_states = etna_set_viewport_states;
669
670   pctx->set_vertex_buffers = etna_set_vertex_buffers;
671
672   pctx->bind_blend_state = etna_blend_state_bind;
673   pctx->delete_blend_state = etna_blend_state_delete;
674
675   pctx->bind_rasterizer_state = etna_rasterizer_state_bind;
676   pctx->delete_rasterizer_state = etna_rasterizer_state_delete;
677
678   pctx->bind_depth_stencil_alpha_state = etna_zsa_state_bind;
679   pctx->delete_depth_stencil_alpha_state = etna_zsa_state_delete;
680
681   pctx->create_vertex_elements_state = etna_vertex_elements_state_create;
682   pctx->delete_vertex_elements_state = etna_vertex_elements_state_delete;
683   pctx->bind_vertex_elements_state = etna_vertex_elements_state_bind;
684}
685