1428d7b3dSmrg/* 2428d7b3dSmrg * Copyright © 2007-2011 Intel Corporation 3428d7b3dSmrg * 4428d7b3dSmrg * Permission is hereby granted, free of charge, to any person obtaining a 5428d7b3dSmrg * copy of this software and associated documentation files (the "Software"), 6428d7b3dSmrg * to deal in the Software without restriction, including without limitation 7428d7b3dSmrg * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8428d7b3dSmrg * and/or sell copies of the Software, and to permit persons to whom the 9428d7b3dSmrg * Software is furnished to do so, subject to the following conditions: 10428d7b3dSmrg * 11428d7b3dSmrg * The above copyright notice and this permission notice (including the next 12428d7b3dSmrg * paragraph) shall be included in all copies or substantial portions of the 13428d7b3dSmrg * Software. 14428d7b3dSmrg * 15428d7b3dSmrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16428d7b3dSmrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17428d7b3dSmrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18428d7b3dSmrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19428d7b3dSmrg * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20428d7b3dSmrg * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21428d7b3dSmrg * SOFTWARE. 22428d7b3dSmrg * 23428d7b3dSmrg * Authors: 24428d7b3dSmrg * Eric Anholt <eric@anholt.net> 25428d7b3dSmrg * Chris Wilson <chris@chris-wilson.co.uk> 26428d7b3dSmrg * 27428d7b3dSmrg */ 28428d7b3dSmrg 29428d7b3dSmrg#ifdef HAVE_CONFIG_H 30428d7b3dSmrg#include "config.h" 31428d7b3dSmrg#endif 32428d7b3dSmrg 33428d7b3dSmrg#include <sys/mman.h> 34428d7b3dSmrg#include <assert.h> 35428d7b3dSmrg 36428d7b3dSmrg#include "sna.h" 37428d7b3dSmrg#include "sna_reg.h" 38428d7b3dSmrg 39428d7b3dSmrg#include "gen4_render.h" 40428d7b3dSmrg 41428d7b3dSmrg#include "kgem_debug.h" 42428d7b3dSmrg 43428d7b3dSmrgstatic struct state { 44428d7b3dSmrg struct vertex_buffer { 45428d7b3dSmrg int handle; 46428d7b3dSmrg void *base; 47428d7b3dSmrg const char *ptr; 48428d7b3dSmrg int pitch; 49428d7b3dSmrg 50428d7b3dSmrg struct kgem_bo *current; 51428d7b3dSmrg } vb[33]; 52428d7b3dSmrg struct vertex_elements { 53428d7b3dSmrg int buffer; 54428d7b3dSmrg int offset; 55428d7b3dSmrg bool valid; 56428d7b3dSmrg uint32_t type; 57428d7b3dSmrg uint8_t swizzle[4]; 58428d7b3dSmrg } ve[33]; 59428d7b3dSmrg int num_ve; 60428d7b3dSmrg 61428d7b3dSmrg struct dynamic_state { 62428d7b3dSmrg struct kgem_bo *current; 63428d7b3dSmrg void *base, *ptr; 64428d7b3dSmrg } dynamic_state; 65428d7b3dSmrg} state; 66428d7b3dSmrg 67428d7b3dSmrgstatic void gen4_update_vertex_buffer(struct kgem *kgem, const uint32_t *data) 68428d7b3dSmrg{ 69428d7b3dSmrg uint32_t reloc = sizeof(uint32_t) * (&data[1] - kgem->batch); 70428d7b3dSmrg struct kgem_bo *bo = NULL; 71428d7b3dSmrg void *base, *ptr; 72428d7b3dSmrg int i; 73428d7b3dSmrg 74428d7b3dSmrg for (i = 0; i < kgem->nreloc; i++) 75428d7b3dSmrg if (kgem->reloc[i].offset == reloc) 76428d7b3dSmrg break; 77428d7b3dSmrg assert(i < kgem->nreloc); 78428d7b3dSmrg reloc = kgem->reloc[i].target_handle; 79428d7b3dSmrg 80428d7b3dSmrg if (reloc == 0) { 81428d7b3dSmrg base = kgem->batch; 82428d7b3dSmrg } else { 83428d7b3dSmrg list_for_each_entry(bo, &kgem->next_request->buffers, request) 84428d7b3dSmrg if (bo->handle == reloc) 85428d7b3dSmrg break; 86428d7b3dSmrg assert(&bo->request != &kgem->next_request->buffers); 87428d7b3dSmrg base = kgem_bo_map__debug(kgem, bo); 88428d7b3dSmrg } 89428d7b3dSmrg ptr = (char *)base + kgem->reloc[i].delta; 90428d7b3dSmrg 91428d7b3dSmrg i = data[0] >> 27; 92428d7b3dSmrg 93428d7b3dSmrg state.vb[i].current = bo; 94428d7b3dSmrg state.vb[i].base = base; 95428d7b3dSmrg state.vb[i].ptr = ptr; 96428d7b3dSmrg state.vb[i].pitch = data[0] & 0x7ff; 97428d7b3dSmrg} 98428d7b3dSmrg 99428d7b3dSmrgstatic uint32_t 100428d7b3dSmrgget_ve_component(uint32_t data, int component) 101428d7b3dSmrg{ 102428d7b3dSmrg return (data >> (16 + (3 - component) * 4)) & 0x7; 103428d7b3dSmrg} 104428d7b3dSmrg 105428d7b3dSmrgstatic void gen4_update_vertex_elements(struct kgem *kgem, int id, const uint32_t *data) 106428d7b3dSmrg{ 107428d7b3dSmrg state.ve[id].buffer = data[0] >> 27; 108428d7b3dSmrg state.ve[id].valid = !!(data[0] & (1 << 26)); 109428d7b3dSmrg state.ve[id].type = (data[0] >> 16) & 0x1ff; 110428d7b3dSmrg state.ve[id].offset = data[0] & 0x7ff; 111428d7b3dSmrg state.ve[id].swizzle[0] = get_ve_component(data[1], 0); 112428d7b3dSmrg state.ve[id].swizzle[1] = get_ve_component(data[1], 1); 113428d7b3dSmrg state.ve[id].swizzle[2] = get_ve_component(data[1], 2); 114428d7b3dSmrg state.ve[id].swizzle[3] = get_ve_component(data[1], 3); 115428d7b3dSmrg} 116428d7b3dSmrg 117428d7b3dSmrgstatic void vertices_sint16_out(const struct vertex_elements *ve, const int16_t *v, int max) 118428d7b3dSmrg{ 119428d7b3dSmrg int c; 120428d7b3dSmrg 121428d7b3dSmrg ErrorF("("); 122428d7b3dSmrg for (c = 0; c < max; c++) { 123428d7b3dSmrg switch (ve->swizzle[c]) { 124428d7b3dSmrg case 0: ErrorF("#"); break; 125428d7b3dSmrg case 1: ErrorF("%d", v[c]); break; 126428d7b3dSmrg case 2: ErrorF("0.0"); break; 127428d7b3dSmrg case 3: ErrorF("1.0"); break; 128428d7b3dSmrg case 4: ErrorF("0x1"); break; 129428d7b3dSmrg case 5: break; 130428d7b3dSmrg default: ErrorF("?"); 131428d7b3dSmrg } 132428d7b3dSmrg if (c < 3) 133428d7b3dSmrg ErrorF(", "); 134428d7b3dSmrg } 135428d7b3dSmrg for (; c < 4; c++) { 136428d7b3dSmrg switch (ve->swizzle[c]) { 137428d7b3dSmrg case 0: ErrorF("#"); break; 138428d7b3dSmrg case 1: ErrorF("1.0"); break; 139428d7b3dSmrg case 2: ErrorF("0.0"); break; 140428d7b3dSmrg case 3: ErrorF("1.0"); break; 141428d7b3dSmrg case 4: ErrorF("0x1"); break; 142428d7b3dSmrg case 5: break; 143428d7b3dSmrg default: ErrorF("?"); 144428d7b3dSmrg } 145428d7b3dSmrg if (c < 3) 146428d7b3dSmrg ErrorF(", "); 147428d7b3dSmrg } 148428d7b3dSmrg ErrorF(")"); 149428d7b3dSmrg} 150428d7b3dSmrg 151428d7b3dSmrgstatic void vertices_float_out(const struct vertex_elements *ve, const float *f, int max) 152428d7b3dSmrg{ 153428d7b3dSmrg int c, o; 154428d7b3dSmrg 155428d7b3dSmrg ErrorF("("); 156428d7b3dSmrg for (c = o = 0; c < 4 && o < max; c++) { 157428d7b3dSmrg switch (ve->swizzle[c]) { 158428d7b3dSmrg case 0: ErrorF("#"); break; 159428d7b3dSmrg case 1: ErrorF("%f", f[o++]); break; 160428d7b3dSmrg case 2: ErrorF("0.0"); break; 161428d7b3dSmrg case 3: ErrorF("1.0"); break; 162428d7b3dSmrg case 4: ErrorF("0x1"); break; 163428d7b3dSmrg case 5: break; 164428d7b3dSmrg default: ErrorF("?"); 165428d7b3dSmrg } 166428d7b3dSmrg if (c < 3) 167428d7b3dSmrg ErrorF(", "); 168428d7b3dSmrg } 169428d7b3dSmrg for (; c < 4; c++) { 170428d7b3dSmrg switch (ve->swizzle[c]) { 171428d7b3dSmrg case 0: ErrorF("#"); break; 172428d7b3dSmrg case 1: ErrorF("1.0"); break; 173428d7b3dSmrg case 2: ErrorF("0.0"); break; 174428d7b3dSmrg case 3: ErrorF("1.0"); break; 175428d7b3dSmrg case 4: ErrorF("0x1"); break; 176428d7b3dSmrg case 5: break; 177428d7b3dSmrg default: ErrorF("?"); 178428d7b3dSmrg } 179428d7b3dSmrg if (c < 3) 180428d7b3dSmrg ErrorF(", "); 181428d7b3dSmrg } 182428d7b3dSmrg ErrorF(")"); 183428d7b3dSmrg} 184428d7b3dSmrg 185428d7b3dSmrgstatic void ve_out(const struct vertex_elements *ve, const void *ptr) 186428d7b3dSmrg{ 187428d7b3dSmrg switch (ve->type) { 188428d7b3dSmrg case GEN4_SURFACEFORMAT_R32_FLOAT: 189428d7b3dSmrg vertices_float_out(ve, ptr, 1); 190428d7b3dSmrg break; 191428d7b3dSmrg case GEN4_SURFACEFORMAT_R32G32_FLOAT: 192428d7b3dSmrg vertices_float_out(ve, ptr, 2); 193428d7b3dSmrg break; 194428d7b3dSmrg case GEN4_SURFACEFORMAT_R32G32B32_FLOAT: 195428d7b3dSmrg vertices_float_out(ve, ptr, 3); 196428d7b3dSmrg break; 197428d7b3dSmrg case GEN4_SURFACEFORMAT_R32G32B32A32_FLOAT: 198428d7b3dSmrg vertices_float_out(ve, ptr, 4); 199428d7b3dSmrg break; 200428d7b3dSmrg case GEN4_SURFACEFORMAT_R16_SINT: 201428d7b3dSmrg vertices_sint16_out(ve, ptr, 1); 202428d7b3dSmrg break; 203428d7b3dSmrg case GEN4_SURFACEFORMAT_R16G16_SINT: 204428d7b3dSmrg vertices_sint16_out(ve, ptr, 2); 205428d7b3dSmrg break; 206428d7b3dSmrg case GEN4_SURFACEFORMAT_R16G16B16A16_SINT: 207428d7b3dSmrg vertices_sint16_out(ve, ptr, 4); 208428d7b3dSmrg break; 209428d7b3dSmrg case GEN4_SURFACEFORMAT_R16_SSCALED: 210428d7b3dSmrg vertices_sint16_out(ve, ptr, 1); 211428d7b3dSmrg break; 212428d7b3dSmrg case GEN4_SURFACEFORMAT_R16G16_SSCALED: 213428d7b3dSmrg vertices_sint16_out(ve, ptr, 2); 214428d7b3dSmrg break; 215428d7b3dSmrg case GEN4_SURFACEFORMAT_R16G16B16A16_SSCALED: 216428d7b3dSmrg vertices_sint16_out(ve, ptr, 4); 217428d7b3dSmrg break; 218428d7b3dSmrg } 219428d7b3dSmrg} 220428d7b3dSmrg 221428d7b3dSmrgstatic void indirect_vertex_out(struct kgem *kgem, uint32_t v) 222428d7b3dSmrg{ 223428d7b3dSmrg int i = 0; 224428d7b3dSmrg 225428d7b3dSmrg do { 226428d7b3dSmrg const struct vertex_elements *ve = &state.ve[i]; 227428d7b3dSmrg const struct vertex_buffer *vb = &state.vb[ve->buffer]; 228428d7b3dSmrg const void *ptr = vb->ptr + v * vb->pitch + ve->offset; 229428d7b3dSmrg 230428d7b3dSmrg if (!ve->valid) 231428d7b3dSmrg continue; 232428d7b3dSmrg 233428d7b3dSmrg ve_out(ve, ptr); 234428d7b3dSmrg 235428d7b3dSmrg while (++i <= state.num_ve && !state.ve[i].valid) 236428d7b3dSmrg ; 237428d7b3dSmrg 238428d7b3dSmrg if (i <= state.num_ve) 239428d7b3dSmrg ErrorF(", "); 240428d7b3dSmrg } while (i <= state.num_ve); 241428d7b3dSmrg} 242428d7b3dSmrg 243428d7b3dSmrgstatic void primitive_out(struct kgem *kgem, uint32_t *data) 244428d7b3dSmrg{ 245428d7b3dSmrg int n; 246428d7b3dSmrg 247428d7b3dSmrg assert((data[0] & (1<<15)) == 0); /* XXX index buffers */ 248428d7b3dSmrg 249428d7b3dSmrg for (n = 0; n < data[1]; n++) { 250428d7b3dSmrg int v = data[2] + n; 251428d7b3dSmrg ErrorF(" [%d:%d] = ", n, v); 252428d7b3dSmrg indirect_vertex_out(kgem, v); 253428d7b3dSmrg ErrorF("\n"); 254428d7b3dSmrg } 255428d7b3dSmrg} 256428d7b3dSmrg 257428d7b3dSmrgstatic void 258428d7b3dSmrgstate_base_out(uint32_t *data, uint32_t offset, unsigned int index, 259428d7b3dSmrg const char *name) 260428d7b3dSmrg{ 261428d7b3dSmrg if (data[index] & 1) 262428d7b3dSmrg kgem_debug_print(data, offset, index, 263428d7b3dSmrg "%s state base address 0x%08x\n", 264428d7b3dSmrg name, data[index] & ~1); 265428d7b3dSmrg else 266428d7b3dSmrg kgem_debug_print(data, offset, index, 267428d7b3dSmrg "%s state base not updated\n", 268428d7b3dSmrg name); 269428d7b3dSmrg} 270428d7b3dSmrg 271428d7b3dSmrgstatic void 272428d7b3dSmrgstate_max_out(uint32_t *data, uint32_t offset, unsigned int index, 273428d7b3dSmrg const char *name) 274428d7b3dSmrg{ 275428d7b3dSmrg if (data[index] == 1) 276428d7b3dSmrg kgem_debug_print(data, offset, index, 277428d7b3dSmrg "%s state upper bound disabled\n", name); 278428d7b3dSmrg else if (data[index] & 1) 279428d7b3dSmrg kgem_debug_print(data, offset, index, 280428d7b3dSmrg "%s state upper bound 0x%08x\n", 281428d7b3dSmrg name, data[index] & ~1); 282428d7b3dSmrg else 283428d7b3dSmrg kgem_debug_print(data, offset, index, 284428d7b3dSmrg "%s state upper bound not updated\n", 285428d7b3dSmrg name); 286428d7b3dSmrg} 287428d7b3dSmrg 288428d7b3dSmrgstatic const char * 289428d7b3dSmrgget_965_surfacetype(unsigned int surfacetype) 290428d7b3dSmrg{ 291428d7b3dSmrg switch (surfacetype) { 292428d7b3dSmrg case 0: return "1D"; 293428d7b3dSmrg case 1: return "2D"; 294428d7b3dSmrg case 2: return "3D"; 295428d7b3dSmrg case 3: return "CUBE"; 296428d7b3dSmrg case 4: return "BUFFER"; 297428d7b3dSmrg case 7: return "NULL"; 298428d7b3dSmrg default: return "unknown"; 299428d7b3dSmrg } 300428d7b3dSmrg} 301428d7b3dSmrg 302428d7b3dSmrgstatic const char * 303428d7b3dSmrgget_965_depthformat(unsigned int depthformat) 304428d7b3dSmrg{ 305428d7b3dSmrg switch (depthformat) { 306428d7b3dSmrg case 0: return "s8_z24float"; 307428d7b3dSmrg case 1: return "z32float"; 308428d7b3dSmrg case 2: return "z24s8"; 309428d7b3dSmrg case 5: return "z16"; 310428d7b3dSmrg default: return "unknown"; 311428d7b3dSmrg } 312428d7b3dSmrg} 313428d7b3dSmrg 314428d7b3dSmrgstatic const char * 315428d7b3dSmrgget_965_element_component(uint32_t data, int component) 316428d7b3dSmrg{ 317428d7b3dSmrg uint32_t component_control = (data >> (16 + (3 - component) * 4)) & 0x7; 318428d7b3dSmrg 319428d7b3dSmrg switch (component_control) { 320428d7b3dSmrg case 0: 321428d7b3dSmrg return "nostore"; 322428d7b3dSmrg case 1: 323428d7b3dSmrg switch (component) { 324428d7b3dSmrg case 0: return "X"; 325428d7b3dSmrg case 1: return "Y"; 326428d7b3dSmrg case 2: return "Z"; 327428d7b3dSmrg case 3: return "W"; 328428d7b3dSmrg default: return "fail"; 329428d7b3dSmrg } 330428d7b3dSmrg case 2: 331428d7b3dSmrg return "0.0"; 332428d7b3dSmrg case 3: 333428d7b3dSmrg return "1.0"; 334428d7b3dSmrg case 4: 335428d7b3dSmrg return "0x1"; 336428d7b3dSmrg case 5: 337428d7b3dSmrg return "VID"; 338428d7b3dSmrg default: 339428d7b3dSmrg return "fail"; 340428d7b3dSmrg } 341428d7b3dSmrg} 342428d7b3dSmrg 343428d7b3dSmrgstatic const char * 344428d7b3dSmrgget_965_prim_type(uint32_t data) 345428d7b3dSmrg{ 346428d7b3dSmrg uint32_t primtype = (data >> 10) & 0x1f; 347428d7b3dSmrg 348428d7b3dSmrg switch (primtype) { 349428d7b3dSmrg case 0x01: return "point list"; 350428d7b3dSmrg case 0x02: return "line list"; 351428d7b3dSmrg case 0x03: return "line strip"; 352428d7b3dSmrg case 0x04: return "tri list"; 353428d7b3dSmrg case 0x05: return "tri strip"; 354428d7b3dSmrg case 0x06: return "tri fan"; 355428d7b3dSmrg case 0x07: return "quad list"; 356428d7b3dSmrg case 0x08: return "quad strip"; 357428d7b3dSmrg case 0x09: return "line list adj"; 358428d7b3dSmrg case 0x0a: return "line strip adj"; 359428d7b3dSmrg case 0x0b: return "tri list adj"; 360428d7b3dSmrg case 0x0c: return "tri strip adj"; 361428d7b3dSmrg case 0x0d: return "tri strip reverse"; 362428d7b3dSmrg case 0x0e: return "polygon"; 363428d7b3dSmrg case 0x0f: return "rect list"; 364428d7b3dSmrg case 0x10: return "line loop"; 365428d7b3dSmrg case 0x11: return "point list bf"; 366428d7b3dSmrg case 0x12: return "line strip cont"; 367428d7b3dSmrg case 0x13: return "line strip bf"; 368428d7b3dSmrg case 0x14: return "line strip cont bf"; 369428d7b3dSmrg case 0x15: return "tri fan no stipple"; 370428d7b3dSmrg default: return "fail"; 371428d7b3dSmrg } 372428d7b3dSmrg} 373428d7b3dSmrg 374428d7b3dSmrg#if 0 375428d7b3dSmrgstruct reloc { 376428d7b3dSmrg struct kgem_bo *bo; 377428d7b3dSmrg void *base; 378428d7b3dSmrg}; 379428d7b3dSmrg 380428d7b3dSmrgstatic void * 381428d7b3dSmrgget_reloc(struct kgem *kgem, 382428d7b3dSmrg void *base, const uint32_t *reloc, 383428d7b3dSmrg struct reloc *r) 384428d7b3dSmrg{ 385428d7b3dSmrg uint32_t delta = *reloc; 386428d7b3dSmrg 387428d7b3dSmrg memset(r, 0, sizeof(*r)); 388428d7b3dSmrg 389428d7b3dSmrg if (base == 0) { 390428d7b3dSmrg uint32_t handle = sizeof(uint32_t) * (reloc - kgem->batch); 391428d7b3dSmrg struct kgem_bo *bo = NULL; 392428d7b3dSmrg int i; 393428d7b3dSmrg 394428d7b3dSmrg for (i = 0; i < kgem->nreloc; i++) 395428d7b3dSmrg if (kgem->reloc[i].offset == handle) 396428d7b3dSmrg break; 397428d7b3dSmrg assert(i < kgem->nreloc); 398428d7b3dSmrg handle = kgem->reloc[i].target_handle; 399428d7b3dSmrg delta = kgem->reloc[i].delta; 400428d7b3dSmrg 401428d7b3dSmrg if (handle == 0) { 402428d7b3dSmrg base = kgem->batch; 403428d7b3dSmrg } else { 404428d7b3dSmrg list_for_each_entry(bo, &kgem->next_request->buffers, request) 405428d7b3dSmrg if (bo->handle == handle) 406428d7b3dSmrg break; 407428d7b3dSmrg assert(&bo->request != &kgem->next_request->buffers); 408428d7b3dSmrg base = kgem_bo_map__debug(kgem, bo); 409428d7b3dSmrg r->bo = bo; 410428d7b3dSmrg r->base = base; 411428d7b3dSmrg } 412428d7b3dSmrg } 413428d7b3dSmrg 414428d7b3dSmrg return (char *)base + delta; 415428d7b3dSmrg} 416428d7b3dSmrg#endif 417428d7b3dSmrg 418428d7b3dSmrgint kgem_gen4_decode_3d(struct kgem *kgem, uint32_t offset) 419428d7b3dSmrg{ 420428d7b3dSmrg static const struct { 421428d7b3dSmrg uint32_t opcode; 422428d7b3dSmrg int min_len; 423428d7b3dSmrg int max_len; 424428d7b3dSmrg const char *name; 425428d7b3dSmrg } opcodes[] = { 426428d7b3dSmrg { 0x6000, 3, 3, "URB_FENCE" }, 427428d7b3dSmrg { 0x6001, 2, 2, "CS_URB_FENCE" }, 428428d7b3dSmrg { 0x6002, 2, 2, "CONSTANT_BUFFER" }, 429428d7b3dSmrg { 0x6101, 6, 6, "STATE_BASE_ADDRESS" }, 430428d7b3dSmrg { 0x6102, 2, 2 , "STATE_SIP" }, 431428d7b3dSmrg { 0x6104, 1, 1, "3DSTATE_PIPELINE_SELECT" }, 432428d7b3dSmrg { 0x680b, 1, 1, "3DSTATE_VF_STATISTICS" }, 433428d7b3dSmrg { 0x6904, 1, 1, "3DSTATE_PIPELINE_SELECT" }, 434428d7b3dSmrg { 0x7800, 7, 7, "3DSTATE_PIPELINED_POINTERS" }, 435428d7b3dSmrg { 0x7801, 6, 6, "3DSTATE_BINDING_TABLE_POINTERS" }, 436428d7b3dSmrg { 0x7808, 5, 257, "3DSTATE_VERTEX_BUFFERS" }, 437428d7b3dSmrg { 0x7809, 3, 256, "3DSTATE_VERTEX_ELEMENTS" }, 438428d7b3dSmrg { 0x780a, 3, 3, "3DSTATE_INDEX_BUFFER" }, 439428d7b3dSmrg { 0x780b, 1, 1, "3DSTATE_VF_STATISTICS" }, 440428d7b3dSmrg { 0x7900, 4, 4, "3DSTATE_DRAWING_RECTANGLE" }, 441428d7b3dSmrg { 0x7901, 5, 5, "3DSTATE_CONSTANT_COLOR" }, 442428d7b3dSmrg { 0x7905, 5, 7, "3DSTATE_DEPTH_BUFFER" }, 443428d7b3dSmrg { 0x7906, 2, 2, "3DSTATE_POLY_STIPPLE_OFFSET" }, 444428d7b3dSmrg { 0x7907, 33, 33, "3DSTATE_POLY_STIPPLE_PATTERN" }, 445428d7b3dSmrg { 0x7908, 3, 3, "3DSTATE_LINE_STIPPLE" }, 446428d7b3dSmrg { 0x7909, 2, 2, "3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP" }, 447428d7b3dSmrg { 0x7909, 2, 2, "3DSTATE_CLEAR_PARAMS" }, 448428d7b3dSmrg { 0x790a, 3, 3, "3DSTATE_AA_LINE_PARAMETERS" }, 449428d7b3dSmrg { 0x790b, 4, 4, "3DSTATE_GS_SVB_INDEX" }, 450428d7b3dSmrg { 0x790d, 3, 3, "3DSTATE_MULTISAMPLE" }, 451428d7b3dSmrg { 0x7910, 2, 2, "3DSTATE_CLEAR_PARAMS" }, 452428d7b3dSmrg { 0x7b00, 6, 6, "3DPRIMITIVE" }, 453428d7b3dSmrg { 0x7805, 3, 3, "3DSTATE_URB" }, 454428d7b3dSmrg { 0x7815, 5, 5, "3DSTATE_CONSTANT_VS_STATE" }, 455428d7b3dSmrg { 0x7816, 5, 5, "3DSTATE_CONSTANT_GS_STATE" }, 456428d7b3dSmrg { 0x7817, 5, 5, "3DSTATE_CONSTANT_PS_STATE" }, 457428d7b3dSmrg { 0x7818, 2, 2, "3DSTATE_SAMPLE_MASK" }, 458428d7b3dSmrg }; 459428d7b3dSmrg uint32_t *data = kgem->batch + offset; 460428d7b3dSmrg uint32_t op; 461428d7b3dSmrg unsigned int len; 462428d7b3dSmrg int i; 463428d7b3dSmrg const char *desc1 = NULL; 464428d7b3dSmrg 465428d7b3dSmrg len = (data[0] & 0xff) + 2; 466428d7b3dSmrg op = (data[0] & 0xffff0000) >> 16; 467428d7b3dSmrg switch (op) { 468428d7b3dSmrg case 0x6000: 469428d7b3dSmrg assert(len == 3); 470428d7b3dSmrg 471428d7b3dSmrg kgem_debug_print(data, offset, 0, "URB_FENCE: %s%s%s%s%s%s\n", 472428d7b3dSmrg (data[0] >> 13) & 1 ? "cs " : "", 473428d7b3dSmrg (data[0] >> 12) & 1 ? "vfe " : "", 474428d7b3dSmrg (data[0] >> 11) & 1 ? "sf " : "", 475428d7b3dSmrg (data[0] >> 10) & 1 ? "clip " : "", 476428d7b3dSmrg (data[0] >> 9) & 1 ? "gs " : "", 477428d7b3dSmrg (data[0] >> 8) & 1 ? "vs " : ""); 478428d7b3dSmrg kgem_debug_print(data, offset, 1, 479428d7b3dSmrg "vs fence: %d, gs_fence: %d, clip_fence: %d\n", 480428d7b3dSmrg data[1] & 0x3ff, 481428d7b3dSmrg (data[1] >> 10) & 0x3ff, 482428d7b3dSmrg (data[1] >> 20) & 0x3ff); 483428d7b3dSmrg kgem_debug_print(data, offset, 2, 484428d7b3dSmrg "sf fence: %d, vfe_fence: %d, cs_fence: %d\n", 485428d7b3dSmrg data[2] & 0x3ff, 486428d7b3dSmrg (data[2] >> 10) & 0x3ff, 487428d7b3dSmrg (data[2] >> 20) & 0x7ff); 488428d7b3dSmrg return len; 489428d7b3dSmrg 490428d7b3dSmrg case 0x6001: 491428d7b3dSmrg kgem_debug_print(data, offset, 0, "CS_URB_STATE\n"); 492428d7b3dSmrg kgem_debug_print(data, offset, 1, "entry_size: %d [%d bytes], n_entries: %d\n", 493428d7b3dSmrg (data[1] >> 4) & 0x1f, 494428d7b3dSmrg (((data[1] >> 4) & 0x1f) + 1) * 64, 495428d7b3dSmrg data[1] & 0x7); 496428d7b3dSmrg return len; 497428d7b3dSmrg case 0x6002: 498428d7b3dSmrg kgem_debug_print(data, offset, 0, "CONSTANT_BUFFER: %s\n", 499428d7b3dSmrg (data[0] >> 8) & 1 ? "valid" : "invalid"); 500428d7b3dSmrg kgem_debug_print(data, offset, 1, "offset: 0x%08x, length: %d bytes\n", 501428d7b3dSmrg data[1] & ~0x3f, ((data[1] & 0x3f) + 1) * 64); 502428d7b3dSmrg return len; 503428d7b3dSmrg case 0x6101: 504428d7b3dSmrg i = 0; 505428d7b3dSmrg kgem_debug_print(data, offset, i++, "STATE_BASE_ADDRESS\n"); 506428d7b3dSmrg assert(len == 6); 507428d7b3dSmrg 508428d7b3dSmrg state_base_out(data, offset, i++, "general"); 509428d7b3dSmrg state_base_out(data, offset, i++, "surface"); 510428d7b3dSmrg state_base_out(data, offset, i++, "media"); 511428d7b3dSmrg 512428d7b3dSmrg state_max_out(data, offset, i++, "general"); 513428d7b3dSmrg state_max_out(data, offset, i++, "media"); 514428d7b3dSmrg 515428d7b3dSmrg return len; 516428d7b3dSmrg 517428d7b3dSmrg case 0x7801: 518428d7b3dSmrg assert(len == 6); 519428d7b3dSmrg 520428d7b3dSmrg kgem_debug_print(data, offset, 0, 521428d7b3dSmrg "3DSTATE_BINDING_TABLE_POINTERS\n"); 522428d7b3dSmrg kgem_debug_print(data, offset, 1, "VS binding table\n"); 523428d7b3dSmrg kgem_debug_print(data, offset, 2, "GS binding table\n"); 524428d7b3dSmrg kgem_debug_print(data, offset, 3, "CLIP binding table\n"); 525428d7b3dSmrg kgem_debug_print(data, offset, 4, "SF binding table\n"); 526428d7b3dSmrg kgem_debug_print(data, offset, 5, "WM binding table\n"); 527428d7b3dSmrg 528428d7b3dSmrg return len; 529428d7b3dSmrg 530428d7b3dSmrg case 0x7808: 531428d7b3dSmrg assert((len - 1) % 4 == 0); 532428d7b3dSmrg kgem_debug_print(data, offset, 0, "3DSTATE_VERTEX_BUFFERS\n"); 533428d7b3dSmrg 534428d7b3dSmrg for (i = 1; i < len;) { 535428d7b3dSmrg gen4_update_vertex_buffer(kgem, data + i); 536428d7b3dSmrg 537428d7b3dSmrg kgem_debug_print(data, offset, i, "buffer %d: %s, pitch %db\n", 538428d7b3dSmrg data[i] >> 27, 539428d7b3dSmrg data[i] & (1 << 20) ? "random" : "sequential", 540428d7b3dSmrg data[i] & 0x07ff); 541428d7b3dSmrg i++; 542428d7b3dSmrg kgem_debug_print(data, offset, i++, "buffer address\n"); 543428d7b3dSmrg kgem_debug_print(data, offset, i++, "max index\n"); 544428d7b3dSmrg kgem_debug_print(data, offset, i++, "mbz\n"); 545428d7b3dSmrg } 546428d7b3dSmrg return len; 547428d7b3dSmrg 548428d7b3dSmrg case 0x7809: 549428d7b3dSmrg assert((len + 1) % 2 == 0); 550428d7b3dSmrg kgem_debug_print(data, offset, 0, "3DSTATE_VERTEX_ELEMENTS\n"); 551428d7b3dSmrg 552428d7b3dSmrg memset(state.ve, 0, sizeof(state.ve)); /* XXX? */ 553428d7b3dSmrg for (i = 1; i < len;) { 554428d7b3dSmrg gen4_update_vertex_elements(kgem, (i - 1)/2, data + i); 555428d7b3dSmrg 556428d7b3dSmrg kgem_debug_print(data, offset, i, "buffer %d: %svalid, type 0x%04x, " 557428d7b3dSmrg "src offset 0x%04x bytes\n", 558428d7b3dSmrg data[i] >> 27, 559428d7b3dSmrg data[i] & (1 << 26) ? "" : "in", 560428d7b3dSmrg (data[i] >> 16) & 0x1ff, 561428d7b3dSmrg data[i] & 0x07ff); 562428d7b3dSmrg i++; 563428d7b3dSmrg kgem_debug_print(data, offset, i, "(%s, %s, %s, %s), " 564428d7b3dSmrg "dst offset 0x%02x bytes\n", 565428d7b3dSmrg get_965_element_component(data[i], 0), 566428d7b3dSmrg get_965_element_component(data[i], 1), 567428d7b3dSmrg get_965_element_component(data[i], 2), 568428d7b3dSmrg get_965_element_component(data[i], 3), 569428d7b3dSmrg (data[i] & 0xff) * 4); 570428d7b3dSmrg i++; 571428d7b3dSmrg } 572428d7b3dSmrg state.num_ve = (len - 1) / 2; /* XXX? */ 573428d7b3dSmrg return len; 574428d7b3dSmrg 575428d7b3dSmrg case 0x780a: 576428d7b3dSmrg assert(len == 3); 577428d7b3dSmrg kgem_debug_print(data, offset, 0, "3DSTATE_INDEX_BUFFER\n"); 578428d7b3dSmrg kgem_debug_print(data, offset, 1, "beginning buffer address\n"); 579428d7b3dSmrg kgem_debug_print(data, offset, 2, "ending buffer address\n"); 580428d7b3dSmrg return len; 581428d7b3dSmrg 582428d7b3dSmrg case 0x7900: 583428d7b3dSmrg assert(len == 4); 584428d7b3dSmrg kgem_debug_print(data, offset, 0, 585428d7b3dSmrg "3DSTATE_DRAWING_RECTANGLE\n"); 586428d7b3dSmrg kgem_debug_print(data, offset, 1, "top left: %d,%d\n", 587428d7b3dSmrg data[1] & 0xffff, 588428d7b3dSmrg (data[1] >> 16) & 0xffff); 589428d7b3dSmrg kgem_debug_print(data, offset, 2, "bottom right: %d,%d\n", 590428d7b3dSmrg data[2] & 0xffff, 591428d7b3dSmrg (data[2] >> 16) & 0xffff); 592428d7b3dSmrg kgem_debug_print(data, offset, 3, "origin: %d,%d\n", 593428d7b3dSmrg (int)data[3] & 0xffff, 594428d7b3dSmrg ((int)data[3] >> 16) & 0xffff); 595428d7b3dSmrg return len; 596428d7b3dSmrg 597428d7b3dSmrg case 0x7905: 598428d7b3dSmrg assert(len == 7); 599428d7b3dSmrg kgem_debug_print(data, offset, 0, 600428d7b3dSmrg "3DSTATE_DEPTH_BUFFER\n"); 601428d7b3dSmrg kgem_debug_print(data, offset, 1, "%s, %s, pitch = %d bytes, %stiled, HiZ %d, Seperate Stencil %d\n", 602428d7b3dSmrg get_965_surfacetype(data[1] >> 29), 603428d7b3dSmrg get_965_depthformat((data[1] >> 18) & 0x7), 604428d7b3dSmrg (data[1] & 0x0001ffff) + 1, 605428d7b3dSmrg data[1] & (1 << 27) ? "" : "not ", 606428d7b3dSmrg (data[1] & (1 << 22)) != 0, 607428d7b3dSmrg (data[1] & (1 << 21)) != 0); 608428d7b3dSmrg kgem_debug_print(data, offset, 2, "depth offset\n"); 609428d7b3dSmrg kgem_debug_print(data, offset, 3, "%dx%d\n", 610428d7b3dSmrg ((data[3] & 0x0007ffc0) >> 6) + 1, 611428d7b3dSmrg ((data[3] & 0xfff80000) >> 19) + 1); 612428d7b3dSmrg kgem_debug_print(data, offset, 4, "volume depth\n"); 613428d7b3dSmrg kgem_debug_print(data, offset, 5, "\n"); 614428d7b3dSmrg kgem_debug_print(data, offset, 6, "\n"); 615428d7b3dSmrg return len; 616428d7b3dSmrg 617428d7b3dSmrg case 0x7a00: 618428d7b3dSmrg assert(len == 4 || len == 5); 619428d7b3dSmrg switch ((data[1] >> 14) & 0x3) { 620428d7b3dSmrg case 0: desc1 = "no write"; break; 621428d7b3dSmrg case 1: desc1 = "qword write"; break; 622428d7b3dSmrg case 2: desc1 = "PS_DEPTH_COUNT write"; break; 623428d7b3dSmrg case 3: desc1 = "TIMESTAMP write"; break; 624428d7b3dSmrg } 625428d7b3dSmrg kgem_debug_print(data, offset, 0, "PIPE_CONTROL\n"); 626428d7b3dSmrg kgem_debug_print(data, offset, 1, 627428d7b3dSmrg "%s, %scs stall, %stlb invalidate, " 628428d7b3dSmrg "%ssync gfdt, %sdepth stall, %sRC write flush, " 629428d7b3dSmrg "%sinst flush, %sTC flush\n", 630428d7b3dSmrg desc1, 631428d7b3dSmrg data[1] & (1 << 20) ? "" : "no ", 632428d7b3dSmrg data[1] & (1 << 18) ? "" : "no ", 633428d7b3dSmrg data[1] & (1 << 17) ? "" : "no ", 634428d7b3dSmrg data[1] & (1 << 13) ? "" : "no ", 635428d7b3dSmrg data[1] & (1 << 12) ? "" : "no ", 636428d7b3dSmrg data[1] & (1 << 11) ? "" : "no ", 637428d7b3dSmrg data[1] & (1 << 10) ? "" : "no "); 638428d7b3dSmrg if (len == 5) { 639428d7b3dSmrg kgem_debug_print(data, offset, 2, "destination address\n"); 640428d7b3dSmrg kgem_debug_print(data, offset, 3, "immediate dword low\n"); 641428d7b3dSmrg kgem_debug_print(data, offset, 4, "immediate dword high\n"); 642428d7b3dSmrg } else { 643428d7b3dSmrg for (i = 2; i < len; i++) { 644428d7b3dSmrg kgem_debug_print(data, offset, i, "\n"); 645428d7b3dSmrg } 646428d7b3dSmrg } 647428d7b3dSmrg return len; 648428d7b3dSmrg 649428d7b3dSmrg case 0x7b00: 650428d7b3dSmrg assert(len == 6); 651428d7b3dSmrg kgem_debug_print(data, offset, 0, 652428d7b3dSmrg "3DPRIMITIVE: %s %s\n", 653428d7b3dSmrg get_965_prim_type(data[0]), 654428d7b3dSmrg (data[0] & (1 << 15)) ? "random" : "sequential"); 655428d7b3dSmrg kgem_debug_print(data, offset, 1, "vertex count\n"); 656428d7b3dSmrg kgem_debug_print(data, offset, 2, "start vertex\n"); 657428d7b3dSmrg kgem_debug_print(data, offset, 3, "instance count\n"); 658428d7b3dSmrg kgem_debug_print(data, offset, 4, "start instance\n"); 659428d7b3dSmrg kgem_debug_print(data, offset, 5, "index bias\n"); 660428d7b3dSmrg primitive_out(kgem, data); 661428d7b3dSmrg return len; 662428d7b3dSmrg } 663428d7b3dSmrg 664428d7b3dSmrg /* For the rest, just dump the bytes */ 665428d7b3dSmrg for (i = 0; i < ARRAY_SIZE(opcodes); i++) 666428d7b3dSmrg if (op == opcodes[i].opcode) 667428d7b3dSmrg break; 668428d7b3dSmrg 669428d7b3dSmrg assert(i < ARRAY_SIZE(opcodes)); 670428d7b3dSmrg 671428d7b3dSmrg len = 1; 672428d7b3dSmrg kgem_debug_print(data, offset, 0, "%s\n", opcodes[i].name); 673428d7b3dSmrg if (opcodes[i].max_len > 1) { 674428d7b3dSmrg len = (data[0] & 0xff) + 2; 675428d7b3dSmrg assert(len >= opcodes[i].min_len && 676428d7b3dSmrg len <= opcodes[i].max_len); 677428d7b3dSmrg } 678428d7b3dSmrg 679428d7b3dSmrg for (i = 1; i < len; i++) 680428d7b3dSmrg kgem_debug_print(data, offset, i, "dword %d\n", i); 681428d7b3dSmrg 682428d7b3dSmrg return len; 683428d7b3dSmrg} 684428d7b3dSmrg 685428d7b3dSmrgvoid kgem_gen4_finish_state(struct kgem *kgem) 686428d7b3dSmrg{ 687428d7b3dSmrg memset(&state, 0, sizeof(state)); 688428d7b3dSmrg} 689