1428d7b3dSmrg/*
2428d7b3dSmrg * Copyright © 2007-2011 Intel Corporation
3428d7b3dSmrg *
4428d7b3dSmrg * Permission is hereby granted, free of charge, to any person obtaining a
5428d7b3dSmrg * copy of this software and associated documentation files (the "Software"),
6428d7b3dSmrg * to deal in the Software without restriction, including without limitation
7428d7b3dSmrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8428d7b3dSmrg * and/or sell copies of the Software, and to permit persons to whom the
9428d7b3dSmrg * Software is furnished to do so, subject to the following conditions:
10428d7b3dSmrg *
11428d7b3dSmrg * The above copyright notice and this permission notice (including the next
12428d7b3dSmrg * paragraph) shall be included in all copies or substantial portions of the
13428d7b3dSmrg * Software.
14428d7b3dSmrg *
15428d7b3dSmrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16428d7b3dSmrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17428d7b3dSmrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18428d7b3dSmrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19428d7b3dSmrg * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20428d7b3dSmrg * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21428d7b3dSmrg * SOFTWARE.
22428d7b3dSmrg *
23428d7b3dSmrg * Authors:
24428d7b3dSmrg *    Eric Anholt <eric@anholt.net>
25428d7b3dSmrg *    Chris Wilson <chris@chris-wilson.co.uk>
26428d7b3dSmrg *
27428d7b3dSmrg */
28428d7b3dSmrg
29428d7b3dSmrg#ifdef HAVE_CONFIG_H
30428d7b3dSmrg#include "config.h"
31428d7b3dSmrg#endif
32428d7b3dSmrg
33428d7b3dSmrg#include <sys/mman.h>
34428d7b3dSmrg#include <assert.h>
35428d7b3dSmrg
36428d7b3dSmrg#include "sna.h"
37428d7b3dSmrg#include "sna_reg.h"
38428d7b3dSmrg
39428d7b3dSmrg#include "gen4_render.h"
40428d7b3dSmrg
41428d7b3dSmrg#include "kgem_debug.h"
42428d7b3dSmrg
43428d7b3dSmrgstatic struct state {
44428d7b3dSmrg	struct vertex_buffer {
45428d7b3dSmrg		int handle;
46428d7b3dSmrg		void *base;
47428d7b3dSmrg		const char *ptr;
48428d7b3dSmrg		int pitch;
49428d7b3dSmrg
50428d7b3dSmrg		struct kgem_bo *current;
51428d7b3dSmrg	} vb[33];
52428d7b3dSmrg	struct vertex_elements {
53428d7b3dSmrg		int buffer;
54428d7b3dSmrg		int offset;
55428d7b3dSmrg		bool valid;
56428d7b3dSmrg		uint32_t type;
57428d7b3dSmrg		uint8_t swizzle[4];
58428d7b3dSmrg	} ve[33];
59428d7b3dSmrg	int num_ve;
60428d7b3dSmrg
61428d7b3dSmrg	struct dynamic_state {
62428d7b3dSmrg		struct kgem_bo *current;
63428d7b3dSmrg		void *base, *ptr;
64428d7b3dSmrg	} dynamic_state;
65428d7b3dSmrg} state;
66428d7b3dSmrg
67428d7b3dSmrgstatic void gen4_update_vertex_buffer(struct kgem *kgem, const uint32_t *data)
68428d7b3dSmrg{
69428d7b3dSmrg	uint32_t reloc = sizeof(uint32_t) * (&data[1] - kgem->batch);
70428d7b3dSmrg	struct kgem_bo *bo = NULL;
71428d7b3dSmrg	void *base, *ptr;
72428d7b3dSmrg	int i;
73428d7b3dSmrg
74428d7b3dSmrg	for (i = 0; i < kgem->nreloc; i++)
75428d7b3dSmrg		if (kgem->reloc[i].offset == reloc)
76428d7b3dSmrg			break;
77428d7b3dSmrg	assert(i < kgem->nreloc);
78428d7b3dSmrg	reloc = kgem->reloc[i].target_handle;
79428d7b3dSmrg
80428d7b3dSmrg	if (reloc == 0) {
81428d7b3dSmrg		base = kgem->batch;
82428d7b3dSmrg	} else {
83428d7b3dSmrg		list_for_each_entry(bo, &kgem->next_request->buffers, request)
84428d7b3dSmrg			if (bo->handle == reloc)
85428d7b3dSmrg				break;
86428d7b3dSmrg		assert(&bo->request != &kgem->next_request->buffers);
87428d7b3dSmrg		base = kgem_bo_map__debug(kgem, bo);
88428d7b3dSmrg	}
89428d7b3dSmrg	ptr = (char *)base + kgem->reloc[i].delta;
90428d7b3dSmrg
91428d7b3dSmrg	i = data[0] >> 27;
92428d7b3dSmrg
93428d7b3dSmrg	state.vb[i].current = bo;
94428d7b3dSmrg	state.vb[i].base = base;
95428d7b3dSmrg	state.vb[i].ptr = ptr;
96428d7b3dSmrg	state.vb[i].pitch = data[0] & 0x7ff;
97428d7b3dSmrg}
98428d7b3dSmrg
99428d7b3dSmrgstatic uint32_t
100428d7b3dSmrgget_ve_component(uint32_t data, int component)
101428d7b3dSmrg{
102428d7b3dSmrg	return (data >> (16 + (3 - component) * 4)) & 0x7;
103428d7b3dSmrg}
104428d7b3dSmrg
105428d7b3dSmrgstatic void gen4_update_vertex_elements(struct kgem *kgem, int id, const uint32_t *data)
106428d7b3dSmrg{
107428d7b3dSmrg	state.ve[id].buffer = data[0] >> 27;
108428d7b3dSmrg	state.ve[id].valid = !!(data[0] & (1 << 26));
109428d7b3dSmrg	state.ve[id].type = (data[0] >> 16) & 0x1ff;
110428d7b3dSmrg	state.ve[id].offset = data[0] & 0x7ff;
111428d7b3dSmrg	state.ve[id].swizzle[0] = get_ve_component(data[1], 0);
112428d7b3dSmrg	state.ve[id].swizzle[1] = get_ve_component(data[1], 1);
113428d7b3dSmrg	state.ve[id].swizzle[2] = get_ve_component(data[1], 2);
114428d7b3dSmrg	state.ve[id].swizzle[3] = get_ve_component(data[1], 3);
115428d7b3dSmrg}
116428d7b3dSmrg
117428d7b3dSmrgstatic void vertices_sint16_out(const struct vertex_elements *ve, const int16_t *v, int max)
118428d7b3dSmrg{
119428d7b3dSmrg	int c;
120428d7b3dSmrg
121428d7b3dSmrg	ErrorF("(");
122428d7b3dSmrg	for (c = 0; c < max; c++) {
123428d7b3dSmrg		switch (ve->swizzle[c]) {
124428d7b3dSmrg		case 0: ErrorF("#"); break;
125428d7b3dSmrg		case 1: ErrorF("%d", v[c]); break;
126428d7b3dSmrg		case 2: ErrorF("0.0"); break;
127428d7b3dSmrg		case 3: ErrorF("1.0"); break;
128428d7b3dSmrg		case 4: ErrorF("0x1"); break;
129428d7b3dSmrg		case 5: break;
130428d7b3dSmrg		default: ErrorF("?");
131428d7b3dSmrg		}
132428d7b3dSmrg		if (c < 3)
133428d7b3dSmrg			ErrorF(", ");
134428d7b3dSmrg	}
135428d7b3dSmrg	for (; c < 4; c++) {
136428d7b3dSmrg		switch (ve->swizzle[c]) {
137428d7b3dSmrg		case 0: ErrorF("#"); break;
138428d7b3dSmrg		case 1: ErrorF("1.0"); break;
139428d7b3dSmrg		case 2: ErrorF("0.0"); break;
140428d7b3dSmrg		case 3: ErrorF("1.0"); break;
141428d7b3dSmrg		case 4: ErrorF("0x1"); break;
142428d7b3dSmrg		case 5: break;
143428d7b3dSmrg		default: ErrorF("?");
144428d7b3dSmrg		}
145428d7b3dSmrg		if (c < 3)
146428d7b3dSmrg			ErrorF(", ");
147428d7b3dSmrg	}
148428d7b3dSmrg	ErrorF(")");
149428d7b3dSmrg}
150428d7b3dSmrg
151428d7b3dSmrgstatic void vertices_float_out(const struct vertex_elements *ve, const float *f, int max)
152428d7b3dSmrg{
153428d7b3dSmrg	int c, o;
154428d7b3dSmrg
155428d7b3dSmrg	ErrorF("(");
156428d7b3dSmrg	for (c = o = 0; c < 4 && o < max; c++) {
157428d7b3dSmrg		switch (ve->swizzle[c]) {
158428d7b3dSmrg		case 0: ErrorF("#"); break;
159428d7b3dSmrg		case 1: ErrorF("%f", f[o++]); break;
160428d7b3dSmrg		case 2: ErrorF("0.0"); break;
161428d7b3dSmrg		case 3: ErrorF("1.0"); break;
162428d7b3dSmrg		case 4: ErrorF("0x1"); break;
163428d7b3dSmrg		case 5: break;
164428d7b3dSmrg		default: ErrorF("?");
165428d7b3dSmrg		}
166428d7b3dSmrg		if (c < 3)
167428d7b3dSmrg			ErrorF(", ");
168428d7b3dSmrg	}
169428d7b3dSmrg	for (; c < 4; c++) {
170428d7b3dSmrg		switch (ve->swizzle[c]) {
171428d7b3dSmrg		case 0: ErrorF("#"); break;
172428d7b3dSmrg		case 1: ErrorF("1.0"); break;
173428d7b3dSmrg		case 2: ErrorF("0.0"); break;
174428d7b3dSmrg		case 3: ErrorF("1.0"); break;
175428d7b3dSmrg		case 4: ErrorF("0x1"); break;
176428d7b3dSmrg		case 5: break;
177428d7b3dSmrg		default: ErrorF("?");
178428d7b3dSmrg		}
179428d7b3dSmrg		if (c < 3)
180428d7b3dSmrg			ErrorF(", ");
181428d7b3dSmrg	}
182428d7b3dSmrg	ErrorF(")");
183428d7b3dSmrg}
184428d7b3dSmrg
185428d7b3dSmrgstatic void ve_out(const struct vertex_elements *ve, const void *ptr)
186428d7b3dSmrg{
187428d7b3dSmrg	switch (ve->type) {
188428d7b3dSmrg	case GEN4_SURFACEFORMAT_R32_FLOAT:
189428d7b3dSmrg		vertices_float_out(ve, ptr, 1);
190428d7b3dSmrg		break;
191428d7b3dSmrg	case GEN4_SURFACEFORMAT_R32G32_FLOAT:
192428d7b3dSmrg		vertices_float_out(ve, ptr, 2);
193428d7b3dSmrg		break;
194428d7b3dSmrg	case GEN4_SURFACEFORMAT_R32G32B32_FLOAT:
195428d7b3dSmrg		vertices_float_out(ve, ptr, 3);
196428d7b3dSmrg		break;
197428d7b3dSmrg	case GEN4_SURFACEFORMAT_R32G32B32A32_FLOAT:
198428d7b3dSmrg		vertices_float_out(ve, ptr, 4);
199428d7b3dSmrg		break;
200428d7b3dSmrg	case GEN4_SURFACEFORMAT_R16_SINT:
201428d7b3dSmrg		vertices_sint16_out(ve, ptr, 1);
202428d7b3dSmrg		break;
203428d7b3dSmrg	case GEN4_SURFACEFORMAT_R16G16_SINT:
204428d7b3dSmrg		vertices_sint16_out(ve, ptr, 2);
205428d7b3dSmrg		break;
206428d7b3dSmrg	case GEN4_SURFACEFORMAT_R16G16B16A16_SINT:
207428d7b3dSmrg		vertices_sint16_out(ve, ptr, 4);
208428d7b3dSmrg		break;
209428d7b3dSmrg	case GEN4_SURFACEFORMAT_R16_SSCALED:
210428d7b3dSmrg		vertices_sint16_out(ve, ptr, 1);
211428d7b3dSmrg		break;
212428d7b3dSmrg	case GEN4_SURFACEFORMAT_R16G16_SSCALED:
213428d7b3dSmrg		vertices_sint16_out(ve, ptr, 2);
214428d7b3dSmrg		break;
215428d7b3dSmrg	case GEN4_SURFACEFORMAT_R16G16B16A16_SSCALED:
216428d7b3dSmrg		vertices_sint16_out(ve, ptr, 4);
217428d7b3dSmrg		break;
218428d7b3dSmrg	}
219428d7b3dSmrg}
220428d7b3dSmrg
221428d7b3dSmrgstatic void indirect_vertex_out(struct kgem *kgem, uint32_t v)
222428d7b3dSmrg{
223428d7b3dSmrg	int i = 0;
224428d7b3dSmrg
225428d7b3dSmrg	do {
226428d7b3dSmrg		const struct vertex_elements *ve = &state.ve[i];
227428d7b3dSmrg		const struct vertex_buffer *vb = &state.vb[ve->buffer];
228428d7b3dSmrg		const void *ptr = vb->ptr + v * vb->pitch + ve->offset;
229428d7b3dSmrg
230428d7b3dSmrg		if (!ve->valid)
231428d7b3dSmrg			continue;
232428d7b3dSmrg
233428d7b3dSmrg		ve_out(ve, ptr);
234428d7b3dSmrg
235428d7b3dSmrg		while (++i <= state.num_ve && !state.ve[i].valid)
236428d7b3dSmrg			;
237428d7b3dSmrg
238428d7b3dSmrg		if (i <= state.num_ve)
239428d7b3dSmrg			ErrorF(", ");
240428d7b3dSmrg	} while (i <= state.num_ve);
241428d7b3dSmrg}
242428d7b3dSmrg
243428d7b3dSmrgstatic void primitive_out(struct kgem *kgem, uint32_t *data)
244428d7b3dSmrg{
245428d7b3dSmrg	int n;
246428d7b3dSmrg
247428d7b3dSmrg	assert((data[0] & (1<<15)) == 0); /* XXX index buffers */
248428d7b3dSmrg
249428d7b3dSmrg	for (n = 0; n < data[1]; n++) {
250428d7b3dSmrg		int v = data[2] + n;
251428d7b3dSmrg		ErrorF("	[%d:%d] = ", n, v);
252428d7b3dSmrg		indirect_vertex_out(kgem, v);
253428d7b3dSmrg		ErrorF("\n");
254428d7b3dSmrg	}
255428d7b3dSmrg}
256428d7b3dSmrg
257428d7b3dSmrgstatic void
258428d7b3dSmrgstate_base_out(uint32_t *data, uint32_t offset, unsigned int index,
259428d7b3dSmrg	       const char *name)
260428d7b3dSmrg{
261428d7b3dSmrg    if (data[index] & 1)
262428d7b3dSmrg	kgem_debug_print(data, offset, index,
263428d7b3dSmrg		  "%s state base address 0x%08x\n",
264428d7b3dSmrg		  name, data[index] & ~1);
265428d7b3dSmrg    else
266428d7b3dSmrg	kgem_debug_print(data, offset, index,
267428d7b3dSmrg		  "%s state base not updated\n",
268428d7b3dSmrg		  name);
269428d7b3dSmrg}
270428d7b3dSmrg
271428d7b3dSmrgstatic void
272428d7b3dSmrgstate_max_out(uint32_t *data, uint32_t offset, unsigned int index,
273428d7b3dSmrg	      const char *name)
274428d7b3dSmrg{
275428d7b3dSmrg	if (data[index] == 1)
276428d7b3dSmrg		kgem_debug_print(data, offset, index,
277428d7b3dSmrg			  "%s state upper bound disabled\n", name);
278428d7b3dSmrg	else if (data[index] & 1)
279428d7b3dSmrg		kgem_debug_print(data, offset, index,
280428d7b3dSmrg			  "%s state upper bound 0x%08x\n",
281428d7b3dSmrg			  name, data[index] & ~1);
282428d7b3dSmrg	else
283428d7b3dSmrg		kgem_debug_print(data, offset, index,
284428d7b3dSmrg			  "%s state upper bound not updated\n",
285428d7b3dSmrg			  name);
286428d7b3dSmrg}
287428d7b3dSmrg
288428d7b3dSmrgstatic const char *
289428d7b3dSmrgget_965_surfacetype(unsigned int surfacetype)
290428d7b3dSmrg{
291428d7b3dSmrg	switch (surfacetype) {
292428d7b3dSmrg	case 0: return "1D";
293428d7b3dSmrg	case 1: return "2D";
294428d7b3dSmrg	case 2: return "3D";
295428d7b3dSmrg	case 3: return "CUBE";
296428d7b3dSmrg	case 4: return "BUFFER";
297428d7b3dSmrg	case 7: return "NULL";
298428d7b3dSmrg	default: return "unknown";
299428d7b3dSmrg	}
300428d7b3dSmrg}
301428d7b3dSmrg
302428d7b3dSmrgstatic const char *
303428d7b3dSmrgget_965_depthformat(unsigned int depthformat)
304428d7b3dSmrg{
305428d7b3dSmrg	switch (depthformat) {
306428d7b3dSmrg	case 0: return "s8_z24float";
307428d7b3dSmrg	case 1: return "z32float";
308428d7b3dSmrg	case 2: return "z24s8";
309428d7b3dSmrg	case 5: return "z16";
310428d7b3dSmrg	default: return "unknown";
311428d7b3dSmrg	}
312428d7b3dSmrg}
313428d7b3dSmrg
314428d7b3dSmrgstatic const char *
315428d7b3dSmrgget_965_element_component(uint32_t data, int component)
316428d7b3dSmrg{
317428d7b3dSmrg	uint32_t component_control = (data >> (16 + (3 - component) * 4)) & 0x7;
318428d7b3dSmrg
319428d7b3dSmrg	switch (component_control) {
320428d7b3dSmrg	case 0:
321428d7b3dSmrg		return "nostore";
322428d7b3dSmrg	case 1:
323428d7b3dSmrg		switch (component) {
324428d7b3dSmrg		case 0: return "X";
325428d7b3dSmrg		case 1: return "Y";
326428d7b3dSmrg		case 2: return "Z";
327428d7b3dSmrg		case 3: return "W";
328428d7b3dSmrg		default: return "fail";
329428d7b3dSmrg		}
330428d7b3dSmrg	case 2:
331428d7b3dSmrg		return "0.0";
332428d7b3dSmrg	case 3:
333428d7b3dSmrg		return "1.0";
334428d7b3dSmrg	case 4:
335428d7b3dSmrg		return "0x1";
336428d7b3dSmrg	case 5:
337428d7b3dSmrg		return "VID";
338428d7b3dSmrg	default:
339428d7b3dSmrg		return "fail";
340428d7b3dSmrg	}
341428d7b3dSmrg}
342428d7b3dSmrg
343428d7b3dSmrgstatic const char *
344428d7b3dSmrgget_965_prim_type(uint32_t data)
345428d7b3dSmrg{
346428d7b3dSmrg	uint32_t primtype = (data >> 10) & 0x1f;
347428d7b3dSmrg
348428d7b3dSmrg	switch (primtype) {
349428d7b3dSmrg	case 0x01: return "point list";
350428d7b3dSmrg	case 0x02: return "line list";
351428d7b3dSmrg	case 0x03: return "line strip";
352428d7b3dSmrg	case 0x04: return "tri list";
353428d7b3dSmrg	case 0x05: return "tri strip";
354428d7b3dSmrg	case 0x06: return "tri fan";
355428d7b3dSmrg	case 0x07: return "quad list";
356428d7b3dSmrg	case 0x08: return "quad strip";
357428d7b3dSmrg	case 0x09: return "line list adj";
358428d7b3dSmrg	case 0x0a: return "line strip adj";
359428d7b3dSmrg	case 0x0b: return "tri list adj";
360428d7b3dSmrg	case 0x0c: return "tri strip adj";
361428d7b3dSmrg	case 0x0d: return "tri strip reverse";
362428d7b3dSmrg	case 0x0e: return "polygon";
363428d7b3dSmrg	case 0x0f: return "rect list";
364428d7b3dSmrg	case 0x10: return "line loop";
365428d7b3dSmrg	case 0x11: return "point list bf";
366428d7b3dSmrg	case 0x12: return "line strip cont";
367428d7b3dSmrg	case 0x13: return "line strip bf";
368428d7b3dSmrg	case 0x14: return "line strip cont bf";
369428d7b3dSmrg	case 0x15: return "tri fan no stipple";
370428d7b3dSmrg	default: return "fail";
371428d7b3dSmrg	}
372428d7b3dSmrg}
373428d7b3dSmrg
374428d7b3dSmrg#if 0
375428d7b3dSmrgstruct reloc {
376428d7b3dSmrg	struct kgem_bo *bo;
377428d7b3dSmrg	void *base;
378428d7b3dSmrg};
379428d7b3dSmrg
380428d7b3dSmrgstatic void *
381428d7b3dSmrgget_reloc(struct kgem *kgem,
382428d7b3dSmrg	  void *base, const uint32_t *reloc,
383428d7b3dSmrg	  struct reloc *r)
384428d7b3dSmrg{
385428d7b3dSmrg	uint32_t delta = *reloc;
386428d7b3dSmrg
387428d7b3dSmrg	memset(r, 0, sizeof(*r));
388428d7b3dSmrg
389428d7b3dSmrg	if (base == 0) {
390428d7b3dSmrg		uint32_t handle = sizeof(uint32_t) * (reloc - kgem->batch);
391428d7b3dSmrg		struct kgem_bo *bo = NULL;
392428d7b3dSmrg		int i;
393428d7b3dSmrg
394428d7b3dSmrg		for (i = 0; i < kgem->nreloc; i++)
395428d7b3dSmrg			if (kgem->reloc[i].offset == handle)
396428d7b3dSmrg				break;
397428d7b3dSmrg		assert(i < kgem->nreloc);
398428d7b3dSmrg		handle = kgem->reloc[i].target_handle;
399428d7b3dSmrg		delta = kgem->reloc[i].delta;
400428d7b3dSmrg
401428d7b3dSmrg		if (handle == 0) {
402428d7b3dSmrg			base = kgem->batch;
403428d7b3dSmrg		} else {
404428d7b3dSmrg			list_for_each_entry(bo, &kgem->next_request->buffers, request)
405428d7b3dSmrg				if (bo->handle == handle)
406428d7b3dSmrg					break;
407428d7b3dSmrg			assert(&bo->request != &kgem->next_request->buffers);
408428d7b3dSmrg			base = kgem_bo_map__debug(kgem, bo);
409428d7b3dSmrg			r->bo = bo;
410428d7b3dSmrg			r->base = base;
411428d7b3dSmrg		}
412428d7b3dSmrg	}
413428d7b3dSmrg
414428d7b3dSmrg	return (char *)base + delta;
415428d7b3dSmrg}
416428d7b3dSmrg#endif
417428d7b3dSmrg
418428d7b3dSmrgint kgem_gen4_decode_3d(struct kgem *kgem, uint32_t offset)
419428d7b3dSmrg{
420428d7b3dSmrg	static const struct {
421428d7b3dSmrg		uint32_t opcode;
422428d7b3dSmrg		int min_len;
423428d7b3dSmrg		int max_len;
424428d7b3dSmrg		const char *name;
425428d7b3dSmrg	} opcodes[] = {
426428d7b3dSmrg		{ 0x6000, 3, 3, "URB_FENCE" },
427428d7b3dSmrg		{ 0x6001, 2, 2, "CS_URB_FENCE" },
428428d7b3dSmrg		{ 0x6002, 2, 2, "CONSTANT_BUFFER" },
429428d7b3dSmrg		{ 0x6101, 6, 6, "STATE_BASE_ADDRESS" },
430428d7b3dSmrg		{ 0x6102, 2, 2 , "STATE_SIP" },
431428d7b3dSmrg		{ 0x6104, 1, 1, "3DSTATE_PIPELINE_SELECT" },
432428d7b3dSmrg		{ 0x680b, 1, 1, "3DSTATE_VF_STATISTICS" },
433428d7b3dSmrg		{ 0x6904, 1, 1, "3DSTATE_PIPELINE_SELECT" },
434428d7b3dSmrg		{ 0x7800, 7, 7, "3DSTATE_PIPELINED_POINTERS" },
435428d7b3dSmrg		{ 0x7801, 6, 6, "3DSTATE_BINDING_TABLE_POINTERS" },
436428d7b3dSmrg		{ 0x7808, 5, 257, "3DSTATE_VERTEX_BUFFERS" },
437428d7b3dSmrg		{ 0x7809, 3, 256, "3DSTATE_VERTEX_ELEMENTS" },
438428d7b3dSmrg		{ 0x780a, 3, 3, "3DSTATE_INDEX_BUFFER" },
439428d7b3dSmrg		{ 0x780b, 1, 1, "3DSTATE_VF_STATISTICS" },
440428d7b3dSmrg		{ 0x7900, 4, 4, "3DSTATE_DRAWING_RECTANGLE" },
441428d7b3dSmrg		{ 0x7901, 5, 5, "3DSTATE_CONSTANT_COLOR" },
442428d7b3dSmrg		{ 0x7905, 5, 7, "3DSTATE_DEPTH_BUFFER" },
443428d7b3dSmrg		{ 0x7906, 2, 2, "3DSTATE_POLY_STIPPLE_OFFSET" },
444428d7b3dSmrg		{ 0x7907, 33, 33, "3DSTATE_POLY_STIPPLE_PATTERN" },
445428d7b3dSmrg		{ 0x7908, 3, 3, "3DSTATE_LINE_STIPPLE" },
446428d7b3dSmrg		{ 0x7909, 2, 2, "3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP" },
447428d7b3dSmrg		{ 0x7909, 2, 2, "3DSTATE_CLEAR_PARAMS" },
448428d7b3dSmrg		{ 0x790a, 3, 3, "3DSTATE_AA_LINE_PARAMETERS" },
449428d7b3dSmrg		{ 0x790b, 4, 4, "3DSTATE_GS_SVB_INDEX" },
450428d7b3dSmrg		{ 0x790d, 3, 3, "3DSTATE_MULTISAMPLE" },
451428d7b3dSmrg		{ 0x7910, 2, 2, "3DSTATE_CLEAR_PARAMS" },
452428d7b3dSmrg		{ 0x7b00, 6, 6, "3DPRIMITIVE" },
453428d7b3dSmrg		{ 0x7805, 3, 3, "3DSTATE_URB" },
454428d7b3dSmrg		{ 0x7815, 5, 5, "3DSTATE_CONSTANT_VS_STATE" },
455428d7b3dSmrg		{ 0x7816, 5, 5, "3DSTATE_CONSTANT_GS_STATE" },
456428d7b3dSmrg		{ 0x7817, 5, 5, "3DSTATE_CONSTANT_PS_STATE" },
457428d7b3dSmrg		{ 0x7818, 2, 2, "3DSTATE_SAMPLE_MASK" },
458428d7b3dSmrg	};
459428d7b3dSmrg	uint32_t *data = kgem->batch + offset;
460428d7b3dSmrg	uint32_t op;
461428d7b3dSmrg	unsigned int len;
462428d7b3dSmrg	int i;
463428d7b3dSmrg	const char *desc1 = NULL;
464428d7b3dSmrg
465428d7b3dSmrg	len = (data[0] & 0xff) + 2;
466428d7b3dSmrg	op = (data[0] & 0xffff0000) >> 16;
467428d7b3dSmrg	switch (op) {
468428d7b3dSmrg	case 0x6000:
469428d7b3dSmrg		assert(len == 3);
470428d7b3dSmrg
471428d7b3dSmrg		kgem_debug_print(data, offset, 0, "URB_FENCE: %s%s%s%s%s%s\n",
472428d7b3dSmrg			  (data[0] >> 13) & 1 ? "cs " : "",
473428d7b3dSmrg			  (data[0] >> 12) & 1 ? "vfe " : "",
474428d7b3dSmrg			  (data[0] >> 11) & 1 ? "sf " : "",
475428d7b3dSmrg			  (data[0] >> 10) & 1 ? "clip " : "",
476428d7b3dSmrg			  (data[0] >> 9)  & 1 ? "gs " : "",
477428d7b3dSmrg			  (data[0] >> 8)  & 1 ? "vs " : "");
478428d7b3dSmrg		kgem_debug_print(data, offset, 1,
479428d7b3dSmrg			  "vs fence: %d, gs_fence: %d, clip_fence: %d\n",
480428d7b3dSmrg			  data[1] & 0x3ff,
481428d7b3dSmrg			  (data[1] >> 10) & 0x3ff,
482428d7b3dSmrg			  (data[1] >> 20) & 0x3ff);
483428d7b3dSmrg		kgem_debug_print(data, offset, 2,
484428d7b3dSmrg			  "sf fence: %d, vfe_fence: %d, cs_fence: %d\n",
485428d7b3dSmrg			   data[2] & 0x3ff,
486428d7b3dSmrg			   (data[2] >> 10) & 0x3ff,
487428d7b3dSmrg			   (data[2] >> 20) & 0x7ff);
488428d7b3dSmrg		return len;
489428d7b3dSmrg
490428d7b3dSmrg	case 0x6001:
491428d7b3dSmrg		kgem_debug_print(data, offset, 0, "CS_URB_STATE\n");
492428d7b3dSmrg		kgem_debug_print(data, offset, 1, "entry_size: %d [%d bytes], n_entries: %d\n",
493428d7b3dSmrg			  (data[1] >> 4) & 0x1f,
494428d7b3dSmrg			  (((data[1] >> 4) & 0x1f) + 1) * 64,
495428d7b3dSmrg			  data[1] & 0x7);
496428d7b3dSmrg		return len;
497428d7b3dSmrg	case 0x6002:
498428d7b3dSmrg		kgem_debug_print(data, offset, 0, "CONSTANT_BUFFER: %s\n",
499428d7b3dSmrg			  (data[0] >> 8) & 1 ? "valid" : "invalid");
500428d7b3dSmrg		kgem_debug_print(data, offset, 1, "offset: 0x%08x, length: %d bytes\n",
501428d7b3dSmrg			  data[1] & ~0x3f, ((data[1] & 0x3f) + 1) * 64);
502428d7b3dSmrg		return len;
503428d7b3dSmrg	case 0x6101:
504428d7b3dSmrg		i = 0;
505428d7b3dSmrg		kgem_debug_print(data, offset, i++, "STATE_BASE_ADDRESS\n");
506428d7b3dSmrg		assert(len == 6);
507428d7b3dSmrg
508428d7b3dSmrg		state_base_out(data, offset, i++, "general");
509428d7b3dSmrg		state_base_out(data, offset, i++, "surface");
510428d7b3dSmrg		state_base_out(data, offset, i++, "media");
511428d7b3dSmrg
512428d7b3dSmrg		state_max_out(data, offset, i++, "general");
513428d7b3dSmrg		state_max_out(data, offset, i++, "media");
514428d7b3dSmrg
515428d7b3dSmrg		return len;
516428d7b3dSmrg
517428d7b3dSmrg	case 0x7801:
518428d7b3dSmrg		assert(len == 6);
519428d7b3dSmrg
520428d7b3dSmrg		kgem_debug_print(data, offset, 0,
521428d7b3dSmrg			  "3DSTATE_BINDING_TABLE_POINTERS\n");
522428d7b3dSmrg		kgem_debug_print(data, offset, 1, "VS binding table\n");
523428d7b3dSmrg		kgem_debug_print(data, offset, 2, "GS binding table\n");
524428d7b3dSmrg		kgem_debug_print(data, offset, 3, "CLIP binding table\n");
525428d7b3dSmrg		kgem_debug_print(data, offset, 4, "SF binding table\n");
526428d7b3dSmrg		kgem_debug_print(data, offset, 5, "WM binding table\n");
527428d7b3dSmrg
528428d7b3dSmrg		return len;
529428d7b3dSmrg
530428d7b3dSmrg	case 0x7808:
531428d7b3dSmrg		assert((len - 1) % 4 == 0);
532428d7b3dSmrg		kgem_debug_print(data, offset, 0, "3DSTATE_VERTEX_BUFFERS\n");
533428d7b3dSmrg
534428d7b3dSmrg		for (i = 1; i < len;) {
535428d7b3dSmrg			gen4_update_vertex_buffer(kgem, data + i);
536428d7b3dSmrg
537428d7b3dSmrg			kgem_debug_print(data, offset, i, "buffer %d: %s, pitch %db\n",
538428d7b3dSmrg				  data[i] >> 27,
539428d7b3dSmrg				  data[i] & (1 << 20) ? "random" : "sequential",
540428d7b3dSmrg				  data[i] & 0x07ff);
541428d7b3dSmrg			i++;
542428d7b3dSmrg			kgem_debug_print(data, offset, i++, "buffer address\n");
543428d7b3dSmrg			kgem_debug_print(data, offset, i++, "max index\n");
544428d7b3dSmrg			kgem_debug_print(data, offset, i++, "mbz\n");
545428d7b3dSmrg		}
546428d7b3dSmrg		return len;
547428d7b3dSmrg
548428d7b3dSmrg	case 0x7809:
549428d7b3dSmrg		assert((len + 1) % 2 == 0);
550428d7b3dSmrg		kgem_debug_print(data, offset, 0, "3DSTATE_VERTEX_ELEMENTS\n");
551428d7b3dSmrg
552428d7b3dSmrg		memset(state.ve, 0, sizeof(state.ve)); /* XXX? */
553428d7b3dSmrg		for (i = 1; i < len;) {
554428d7b3dSmrg			gen4_update_vertex_elements(kgem, (i - 1)/2, data + i);
555428d7b3dSmrg
556428d7b3dSmrg			kgem_debug_print(data, offset, i, "buffer %d: %svalid, type 0x%04x, "
557428d7b3dSmrg				  "src offset 0x%04x bytes\n",
558428d7b3dSmrg				  data[i] >> 27,
559428d7b3dSmrg				  data[i] & (1 << 26) ? "" : "in",
560428d7b3dSmrg				  (data[i] >> 16) & 0x1ff,
561428d7b3dSmrg				  data[i] & 0x07ff);
562428d7b3dSmrg			i++;
563428d7b3dSmrg			kgem_debug_print(data, offset, i, "(%s, %s, %s, %s), "
564428d7b3dSmrg				  "dst offset 0x%02x bytes\n",
565428d7b3dSmrg				  get_965_element_component(data[i], 0),
566428d7b3dSmrg				  get_965_element_component(data[i], 1),
567428d7b3dSmrg				  get_965_element_component(data[i], 2),
568428d7b3dSmrg				  get_965_element_component(data[i], 3),
569428d7b3dSmrg				  (data[i] & 0xff) * 4);
570428d7b3dSmrg			i++;
571428d7b3dSmrg		}
572428d7b3dSmrg		state.num_ve = (len - 1) / 2; /* XXX? */
573428d7b3dSmrg		return len;
574428d7b3dSmrg
575428d7b3dSmrg	case 0x780a:
576428d7b3dSmrg		assert(len == 3);
577428d7b3dSmrg		kgem_debug_print(data, offset, 0, "3DSTATE_INDEX_BUFFER\n");
578428d7b3dSmrg		kgem_debug_print(data, offset, 1, "beginning buffer address\n");
579428d7b3dSmrg		kgem_debug_print(data, offset, 2, "ending buffer address\n");
580428d7b3dSmrg		return len;
581428d7b3dSmrg
582428d7b3dSmrg	case 0x7900:
583428d7b3dSmrg		assert(len == 4);
584428d7b3dSmrg		kgem_debug_print(data, offset, 0,
585428d7b3dSmrg			  "3DSTATE_DRAWING_RECTANGLE\n");
586428d7b3dSmrg		kgem_debug_print(data, offset, 1, "top left: %d,%d\n",
587428d7b3dSmrg			  data[1] & 0xffff,
588428d7b3dSmrg			  (data[1] >> 16) & 0xffff);
589428d7b3dSmrg		kgem_debug_print(data, offset, 2, "bottom right: %d,%d\n",
590428d7b3dSmrg			  data[2] & 0xffff,
591428d7b3dSmrg			  (data[2] >> 16) & 0xffff);
592428d7b3dSmrg		kgem_debug_print(data, offset, 3, "origin: %d,%d\n",
593428d7b3dSmrg			  (int)data[3] & 0xffff,
594428d7b3dSmrg			  ((int)data[3] >> 16) & 0xffff);
595428d7b3dSmrg		return len;
596428d7b3dSmrg
597428d7b3dSmrg	case 0x7905:
598428d7b3dSmrg		assert(len == 7);
599428d7b3dSmrg		kgem_debug_print(data, offset, 0,
600428d7b3dSmrg			  "3DSTATE_DEPTH_BUFFER\n");
601428d7b3dSmrg		kgem_debug_print(data, offset, 1, "%s, %s, pitch = %d bytes, %stiled, HiZ %d, Seperate Stencil %d\n",
602428d7b3dSmrg			  get_965_surfacetype(data[1] >> 29),
603428d7b3dSmrg			  get_965_depthformat((data[1] >> 18) & 0x7),
604428d7b3dSmrg			  (data[1] & 0x0001ffff) + 1,
605428d7b3dSmrg			  data[1] & (1 << 27) ? "" : "not ",
606428d7b3dSmrg			  (data[1] & (1 << 22)) != 0,
607428d7b3dSmrg			  (data[1] & (1 << 21)) != 0);
608428d7b3dSmrg		kgem_debug_print(data, offset, 2, "depth offset\n");
609428d7b3dSmrg		kgem_debug_print(data, offset, 3, "%dx%d\n",
610428d7b3dSmrg			  ((data[3] & 0x0007ffc0) >> 6) + 1,
611428d7b3dSmrg			  ((data[3] & 0xfff80000) >> 19) + 1);
612428d7b3dSmrg		kgem_debug_print(data, offset, 4, "volume depth\n");
613428d7b3dSmrg		kgem_debug_print(data, offset, 5, "\n");
614428d7b3dSmrg		kgem_debug_print(data, offset, 6, "\n");
615428d7b3dSmrg		return len;
616428d7b3dSmrg
617428d7b3dSmrg	case 0x7a00:
618428d7b3dSmrg		assert(len == 4 || len == 5);
619428d7b3dSmrg		switch ((data[1] >> 14) & 0x3) {
620428d7b3dSmrg		case 0: desc1 = "no write"; break;
621428d7b3dSmrg		case 1: desc1 = "qword write"; break;
622428d7b3dSmrg		case 2: desc1 = "PS_DEPTH_COUNT write"; break;
623428d7b3dSmrg		case 3: desc1 = "TIMESTAMP write"; break;
624428d7b3dSmrg		}
625428d7b3dSmrg		kgem_debug_print(data, offset, 0, "PIPE_CONTROL\n");
626428d7b3dSmrg		kgem_debug_print(data, offset, 1,
627428d7b3dSmrg			  "%s, %scs stall, %stlb invalidate, "
628428d7b3dSmrg			  "%ssync gfdt, %sdepth stall, %sRC write flush, "
629428d7b3dSmrg			  "%sinst flush, %sTC flush\n",
630428d7b3dSmrg			  desc1,
631428d7b3dSmrg			  data[1] & (1 << 20) ? "" : "no ",
632428d7b3dSmrg			  data[1] & (1 << 18) ? "" : "no ",
633428d7b3dSmrg			  data[1] & (1 << 17) ? "" : "no ",
634428d7b3dSmrg			  data[1] & (1 << 13) ? "" : "no ",
635428d7b3dSmrg			  data[1] & (1 << 12) ? "" : "no ",
636428d7b3dSmrg			  data[1] & (1 << 11) ? "" : "no ",
637428d7b3dSmrg			  data[1] & (1 << 10) ? "" : "no ");
638428d7b3dSmrg		if (len == 5) {
639428d7b3dSmrg			kgem_debug_print(data, offset, 2, "destination address\n");
640428d7b3dSmrg			kgem_debug_print(data, offset, 3, "immediate dword low\n");
641428d7b3dSmrg			kgem_debug_print(data, offset, 4, "immediate dword high\n");
642428d7b3dSmrg		} else {
643428d7b3dSmrg			for (i = 2; i < len; i++) {
644428d7b3dSmrg				kgem_debug_print(data, offset, i, "\n");
645428d7b3dSmrg			}
646428d7b3dSmrg		}
647428d7b3dSmrg		return len;
648428d7b3dSmrg
649428d7b3dSmrg	case 0x7b00:
650428d7b3dSmrg		assert(len == 6);
651428d7b3dSmrg		kgem_debug_print(data, offset, 0,
652428d7b3dSmrg			  "3DPRIMITIVE: %s %s\n",
653428d7b3dSmrg			  get_965_prim_type(data[0]),
654428d7b3dSmrg			  (data[0] & (1 << 15)) ? "random" : "sequential");
655428d7b3dSmrg		kgem_debug_print(data, offset, 1, "vertex count\n");
656428d7b3dSmrg		kgem_debug_print(data, offset, 2, "start vertex\n");
657428d7b3dSmrg		kgem_debug_print(data, offset, 3, "instance count\n");
658428d7b3dSmrg		kgem_debug_print(data, offset, 4, "start instance\n");
659428d7b3dSmrg		kgem_debug_print(data, offset, 5, "index bias\n");
660428d7b3dSmrg		primitive_out(kgem, data);
661428d7b3dSmrg		return len;
662428d7b3dSmrg	}
663428d7b3dSmrg
664428d7b3dSmrg	/* For the rest, just dump the bytes */
665428d7b3dSmrg	for (i = 0; i < ARRAY_SIZE(opcodes); i++)
666428d7b3dSmrg		if (op == opcodes[i].opcode)
667428d7b3dSmrg			break;
668428d7b3dSmrg
669428d7b3dSmrg	assert(i < ARRAY_SIZE(opcodes));
670428d7b3dSmrg
671428d7b3dSmrg	len = 1;
672428d7b3dSmrg	kgem_debug_print(data, offset, 0, "%s\n", opcodes[i].name);
673428d7b3dSmrg	if (opcodes[i].max_len > 1) {
674428d7b3dSmrg		len = (data[0] & 0xff) + 2;
675428d7b3dSmrg		assert(len >= opcodes[i].min_len &&
676428d7b3dSmrg		       len <= opcodes[i].max_len);
677428d7b3dSmrg	}
678428d7b3dSmrg
679428d7b3dSmrg	for (i = 1; i < len; i++)
680428d7b3dSmrg		kgem_debug_print(data, offset, i, "dword %d\n", i);
681428d7b3dSmrg
682428d7b3dSmrg	return len;
683428d7b3dSmrg}
684428d7b3dSmrg
685428d7b3dSmrgvoid kgem_gen4_finish_state(struct kgem *kgem)
686428d7b3dSmrg{
687428d7b3dSmrg	memset(&state, 0, sizeof(state));
688428d7b3dSmrg}
689