translate_generic.c revision af69d88d
1/************************************************************************** 2 * 3 * Copyright 2007 VMware, Inc. 4 * All Rights Reserved. 5 * 6 * Permission is hereby granted, free of charge, to any person obtaining a 7 * copy of this software and associated documentation files (the 8 * "Software"), to deal in the Software without restriction, including 9 * without limitation the rights to use, copy, modify, merge, publish, 10 * distribute, sub license, and/or sell copies of the Software, and to 11 * permit persons to whom the Software is furnished to do so, subject to 12 * the following conditions: 13 * 14 * The above copyright notice and this permission notice (including the 15 * next paragraph) shall be included in all copies or substantial portions 16 * of the Software. 17 * 18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS 19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. 21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR 22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, 23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE 24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 25 * 26 **************************************************************************/ 27 28 /* 29 * Authors: 30 * Keith Whitwell <keithw@vmware.com> 31 */ 32 33#include "util/u_memory.h" 34#include "util/u_format.h" 35#include "util/u_half.h" 36#include "util/u_math.h" 37#include "pipe/p_state.h" 38#include "translate.h" 39 40 41#define DRAW_DBG 0 42 43typedef void (*fetch_func)(void *dst, 44 const uint8_t *src, 45 unsigned i, unsigned j); 46typedef void (*emit_func)(const void *attrib, void *ptr); 47 48 49 50struct translate_generic { 51 struct translate translate; 52 53 struct { 54 enum translate_element_type type; 55 56 fetch_func fetch; 57 unsigned buffer; 58 unsigned input_offset; 59 unsigned instance_divisor; 60 61 emit_func emit; 62 unsigned output_offset; 63 64 const uint8_t *input_ptr; 65 unsigned input_stride; 66 unsigned max_index; 67 68 /* this value is set to -1 if this is a normal element with output_format != input_format: 69 * in this case, u_format is used to do a full conversion 70 * 71 * this value is set to the format size in bytes if output_format == input_format or for 32-bit instance ids: 72 * in this case, memcpy is used to copy this amount of bytes 73 */ 74 int copy_size; 75 76 } attrib[TRANSLATE_MAX_ATTRIBS]; 77 78 unsigned nr_attrib; 79}; 80 81 82static struct translate_generic *translate_generic( struct translate *translate ) 83{ 84 return (struct translate_generic *)translate; 85} 86 87/** 88 * Fetch a dword[4] vertex attribute from memory, doing format/type 89 * conversion as needed. 90 * 91 * This is probably needed/dupliocated elsewhere, eg format 92 * conversion, texture sampling etc. 93 */ 94#define ATTRIB( NAME, SZ, SRCTYPE, DSTTYPE, TO ) \ 95static void \ 96emit_##NAME(const void *attrib, void *ptr) \ 97{ \ 98 unsigned i; \ 99 SRCTYPE *in = (SRCTYPE *)attrib; \ 100 DSTTYPE *out = (DSTTYPE *)ptr; \ 101 \ 102 for (i = 0; i < SZ; i++) { \ 103 out[i] = TO(in[i]); \ 104 } \ 105} 106 107 108#define TO_64_FLOAT(x) ((double) x) 109#define TO_32_FLOAT(x) (x) 110#define TO_16_FLOAT(x) util_float_to_half(x) 111 112#define TO_8_USCALED(x) ((unsigned char) x) 113#define TO_16_USCALED(x) ((unsigned short) x) 114#define TO_32_USCALED(x) ((unsigned int) x) 115 116#define TO_8_SSCALED(x) ((char) x) 117#define TO_16_SSCALED(x) ((short) x) 118#define TO_32_SSCALED(x) ((int) x) 119 120#define TO_8_UNORM(x) ((unsigned char) (x * 255.0f)) 121#define TO_16_UNORM(x) ((unsigned short) (x * 65535.0f)) 122#define TO_32_UNORM(x) ((unsigned int) (x * 4294967295.0f)) 123 124#define TO_8_SNORM(x) ((char) (x * 127.0f)) 125#define TO_16_SNORM(x) ((short) (x * 32767.0f)) 126#define TO_32_SNORM(x) ((int) (x * 2147483647.0f)) 127 128#define TO_32_FIXED(x) ((int) (x * 65536.0f)) 129 130#define TO_INT(x) (x) 131 132 133ATTRIB( R64G64B64A64_FLOAT, 4, float, double, TO_64_FLOAT ) 134ATTRIB( R64G64B64_FLOAT, 3, float, double, TO_64_FLOAT ) 135ATTRIB( R64G64_FLOAT, 2, float, double, TO_64_FLOAT ) 136ATTRIB( R64_FLOAT, 1, float, double, TO_64_FLOAT ) 137 138ATTRIB( R32G32B32A32_FLOAT, 4, float, float, TO_32_FLOAT ) 139ATTRIB( R32G32B32_FLOAT, 3, float, float, TO_32_FLOAT ) 140ATTRIB( R32G32_FLOAT, 2, float, float, TO_32_FLOAT ) 141ATTRIB( R32_FLOAT, 1, float, float, TO_32_FLOAT ) 142 143ATTRIB( R16G16B16A16_FLOAT, 4, float, ushort, TO_16_FLOAT ) 144ATTRIB( R16G16B16_FLOAT, 3, float, ushort, TO_16_FLOAT ) 145ATTRIB( R16G16_FLOAT, 2, float, ushort, TO_16_FLOAT ) 146ATTRIB( R16_FLOAT, 1, float, ushort, TO_16_FLOAT ) 147 148ATTRIB( R32G32B32A32_USCALED, 4, float, unsigned, TO_32_USCALED ) 149ATTRIB( R32G32B32_USCALED, 3, float, unsigned, TO_32_USCALED ) 150ATTRIB( R32G32_USCALED, 2, float, unsigned, TO_32_USCALED ) 151ATTRIB( R32_USCALED, 1, float, unsigned, TO_32_USCALED ) 152 153ATTRIB( R32G32B32A32_SSCALED, 4, float, int, TO_32_SSCALED ) 154ATTRIB( R32G32B32_SSCALED, 3, float, int, TO_32_SSCALED ) 155ATTRIB( R32G32_SSCALED, 2, float, int, TO_32_SSCALED ) 156ATTRIB( R32_SSCALED, 1, float, int, TO_32_SSCALED ) 157 158ATTRIB( R32G32B32A32_UNORM, 4, float, unsigned, TO_32_UNORM ) 159ATTRIB( R32G32B32_UNORM, 3, float, unsigned, TO_32_UNORM ) 160ATTRIB( R32G32_UNORM, 2, float, unsigned, TO_32_UNORM ) 161ATTRIB( R32_UNORM, 1, float, unsigned, TO_32_UNORM ) 162 163ATTRIB( R32G32B32A32_SNORM, 4, float, int, TO_32_SNORM ) 164ATTRIB( R32G32B32_SNORM, 3, float, int, TO_32_SNORM ) 165ATTRIB( R32G32_SNORM, 2, float, int, TO_32_SNORM ) 166ATTRIB( R32_SNORM, 1, float, int, TO_32_SNORM ) 167 168ATTRIB( R16G16B16A16_USCALED, 4, float, ushort, TO_16_USCALED ) 169ATTRIB( R16G16B16_USCALED, 3, float, ushort, TO_16_USCALED ) 170ATTRIB( R16G16_USCALED, 2, float, ushort, TO_16_USCALED ) 171ATTRIB( R16_USCALED, 1, float, ushort, TO_16_USCALED ) 172 173ATTRIB( R16G16B16A16_SSCALED, 4, float, short, TO_16_SSCALED ) 174ATTRIB( R16G16B16_SSCALED, 3, float, short, TO_16_SSCALED ) 175ATTRIB( R16G16_SSCALED, 2, float, short, TO_16_SSCALED ) 176ATTRIB( R16_SSCALED, 1, float, short, TO_16_SSCALED ) 177 178ATTRIB( R16G16B16A16_UNORM, 4, float, ushort, TO_16_UNORM ) 179ATTRIB( R16G16B16_UNORM, 3, float, ushort, TO_16_UNORM ) 180ATTRIB( R16G16_UNORM, 2, float, ushort, TO_16_UNORM ) 181ATTRIB( R16_UNORM, 1, float, ushort, TO_16_UNORM ) 182 183ATTRIB( R16G16B16A16_SNORM, 4, float, short, TO_16_SNORM ) 184ATTRIB( R16G16B16_SNORM, 3, float, short, TO_16_SNORM ) 185ATTRIB( R16G16_SNORM, 2, float, short, TO_16_SNORM ) 186ATTRIB( R16_SNORM, 1, float, short, TO_16_SNORM ) 187 188ATTRIB( R8G8B8A8_USCALED, 4, float, ubyte, TO_8_USCALED ) 189ATTRIB( R8G8B8_USCALED, 3, float, ubyte, TO_8_USCALED ) 190ATTRIB( R8G8_USCALED, 2, float, ubyte, TO_8_USCALED ) 191ATTRIB( R8_USCALED, 1, float, ubyte, TO_8_USCALED ) 192 193ATTRIB( R8G8B8A8_SSCALED, 4, float, char, TO_8_SSCALED ) 194ATTRIB( R8G8B8_SSCALED, 3, float, char, TO_8_SSCALED ) 195ATTRIB( R8G8_SSCALED, 2, float, char, TO_8_SSCALED ) 196ATTRIB( R8_SSCALED, 1, float, char, TO_8_SSCALED ) 197 198ATTRIB( R8G8B8A8_UNORM, 4, float, ubyte, TO_8_UNORM ) 199ATTRIB( R8G8B8_UNORM, 3, float, ubyte, TO_8_UNORM ) 200ATTRIB( R8G8_UNORM, 2, float, ubyte, TO_8_UNORM ) 201ATTRIB( R8_UNORM, 1, float, ubyte, TO_8_UNORM ) 202 203ATTRIB( R8G8B8A8_SNORM, 4, float, char, TO_8_SNORM ) 204ATTRIB( R8G8B8_SNORM, 3, float, char, TO_8_SNORM ) 205ATTRIB( R8G8_SNORM, 2, float, char, TO_8_SNORM ) 206ATTRIB( R8_SNORM, 1, float, char, TO_8_SNORM ) 207 208ATTRIB( R32G32B32A32_UINT, 4, uint32_t, unsigned, TO_INT ) 209ATTRIB( R32G32B32_UINT, 3, uint32_t, unsigned, TO_INT ) 210ATTRIB( R32G32_UINT, 2, uint32_t, unsigned, TO_INT ) 211ATTRIB( R32_UINT, 1, uint32_t, unsigned, TO_INT ) 212 213ATTRIB( R16G16B16A16_UINT, 4, uint32_t, ushort, TO_INT ) 214ATTRIB( R16G16B16_UINT, 3, uint32_t, ushort, TO_INT ) 215ATTRIB( R16G16_UINT, 2, uint32_t, ushort, TO_INT ) 216ATTRIB( R16_UINT, 1, uint32_t, ushort, TO_INT ) 217 218ATTRIB( R8G8B8A8_UINT, 4, uint32_t, ubyte, TO_INT ) 219ATTRIB( R8G8B8_UINT, 3, uint32_t, ubyte, TO_INT ) 220ATTRIB( R8G8_UINT, 2, uint32_t, ubyte, TO_INT ) 221ATTRIB( R8_UINT, 1, uint32_t, ubyte, TO_INT ) 222 223ATTRIB( R32G32B32A32_SINT, 4, int32_t, int, TO_INT ) 224ATTRIB( R32G32B32_SINT, 3, int32_t, int, TO_INT ) 225ATTRIB( R32G32_SINT, 2, int32_t, int, TO_INT ) 226ATTRIB( R32_SINT, 1, int32_t, int, TO_INT ) 227 228ATTRIB( R16G16B16A16_SINT, 4, int32_t, short, TO_INT ) 229ATTRIB( R16G16B16_SINT, 3, int32_t, short, TO_INT ) 230ATTRIB( R16G16_SINT, 2, int32_t, short, TO_INT ) 231ATTRIB( R16_SINT, 1, int32_t, short, TO_INT ) 232 233ATTRIB( R8G8B8A8_SINT, 4, int32_t, char, TO_INT ) 234ATTRIB( R8G8B8_SINT, 3, int32_t, char, TO_INT ) 235ATTRIB( R8G8_SINT, 2, int32_t, char, TO_INT ) 236ATTRIB( R8_SINT, 1, int32_t, char, TO_INT ) 237 238static void 239emit_A8R8G8B8_UNORM( const void *attrib, void *ptr) 240{ 241 float *in = (float *)attrib; 242 ubyte *out = (ubyte *)ptr; 243 out[0] = TO_8_UNORM(in[3]); 244 out[1] = TO_8_UNORM(in[0]); 245 out[2] = TO_8_UNORM(in[1]); 246 out[3] = TO_8_UNORM(in[2]); 247} 248 249static void 250emit_B8G8R8A8_UNORM( const void *attrib, void *ptr) 251{ 252 float *in = (float *)attrib; 253 ubyte *out = (ubyte *)ptr; 254 out[2] = TO_8_UNORM(in[0]); 255 out[1] = TO_8_UNORM(in[1]); 256 out[0] = TO_8_UNORM(in[2]); 257 out[3] = TO_8_UNORM(in[3]); 258} 259 260static void 261emit_B10G10R10A2_UNORM( const void *attrib, void *ptr ) 262{ 263 float *src = (float *)ptr; 264 uint32_t value = 0; 265 value |= ((uint32_t)(CLAMP(src[2], 0, 1) * 0x3ff)) & 0x3ff; 266 value |= (((uint32_t)(CLAMP(src[1], 0, 1) * 0x3ff)) & 0x3ff) << 10; 267 value |= (((uint32_t)(CLAMP(src[0], 0, 1) * 0x3ff)) & 0x3ff) << 20; 268 value |= ((uint32_t)(CLAMP(src[3], 0, 1) * 0x3)) << 30; 269#ifdef PIPE_ARCH_BIG_ENDIAN 270 value = util_bswap32(value); 271#endif 272 *(uint32_t *)attrib = value; 273} 274 275static void 276emit_B10G10R10A2_USCALED( const void *attrib, void *ptr ) 277{ 278 float *src = (float *)ptr; 279 uint32_t value = 0; 280 value |= ((uint32_t)CLAMP(src[2], 0, 1023)) & 0x3ff; 281 value |= (((uint32_t)CLAMP(src[1], 0, 1023)) & 0x3ff) << 10; 282 value |= (((uint32_t)CLAMP(src[0], 0, 1023)) & 0x3ff) << 20; 283 value |= ((uint32_t)CLAMP(src[3], 0, 3)) << 30; 284#ifdef PIPE_ARCH_BIG_ENDIAN 285 value = util_bswap32(value); 286#endif 287 *(uint32_t *)attrib = value; 288} 289 290static void 291emit_B10G10R10A2_SNORM( const void *attrib, void *ptr ) 292{ 293 float *src = (float *)ptr; 294 uint32_t value = 0; 295 value |= (uint32_t)(((uint32_t)(CLAMP(src[2], -1, 1) * 0x1ff)) & 0x3ff) ; 296 value |= (uint32_t)((((uint32_t)(CLAMP(src[1], -1, 1) * 0x1ff)) & 0x3ff) << 10) ; 297 value |= (uint32_t)((((uint32_t)(CLAMP(src[0], -1, 1) * 0x1ff)) & 0x3ff) << 20) ; 298 value |= (uint32_t)(((uint32_t)(CLAMP(src[3], -1, 1) * 0x1)) << 30) ; 299#ifdef PIPE_ARCH_BIG_ENDIAN 300 value = util_bswap32(value); 301#endif 302 *(uint32_t *)attrib = value; 303} 304 305static void 306emit_B10G10R10A2_SSCALED( const void *attrib, void *ptr ) 307{ 308 float *src = (float *)ptr; 309 uint32_t value = 0; 310 value |= (uint32_t)(((uint32_t)CLAMP(src[2], -512, 511)) & 0x3ff) ; 311 value |= (uint32_t)((((uint32_t)CLAMP(src[1], -512, 511)) & 0x3ff) << 10) ; 312 value |= (uint32_t)((((uint32_t)CLAMP(src[0], -512, 511)) & 0x3ff) << 20) ; 313 value |= (uint32_t)(((uint32_t)CLAMP(src[3], -2, 1)) << 30) ; 314#ifdef PIPE_ARCH_BIG_ENDIAN 315 value = util_bswap32(value); 316#endif 317 *(uint32_t *)attrib = value; 318} 319 320static void 321emit_R10G10B10A2_UNORM( const void *attrib, void *ptr ) 322{ 323 float *src = (float *)ptr; 324 uint32_t value = 0; 325 value |= ((uint32_t)(CLAMP(src[0], 0, 1) * 0x3ff)) & 0x3ff; 326 value |= (((uint32_t)(CLAMP(src[1], 0, 1) * 0x3ff)) & 0x3ff) << 10; 327 value |= (((uint32_t)(CLAMP(src[2], 0, 1) * 0x3ff)) & 0x3ff) << 20; 328 value |= ((uint32_t)(CLAMP(src[3], 0, 1) * 0x3)) << 30; 329#ifdef PIPE_ARCH_BIG_ENDIAN 330 value = util_bswap32(value); 331#endif 332 *(uint32_t *)attrib = value; 333} 334 335static void 336emit_R10G10B10A2_USCALED( const void *attrib, void *ptr ) 337{ 338 float *src = (float *)ptr; 339 uint32_t value = 0; 340 value |= ((uint32_t)CLAMP(src[0], 0, 1023)) & 0x3ff; 341 value |= (((uint32_t)CLAMP(src[1], 0, 1023)) & 0x3ff) << 10; 342 value |= (((uint32_t)CLAMP(src[2], 0, 1023)) & 0x3ff) << 20; 343 value |= ((uint32_t)CLAMP(src[3], 0, 3)) << 30; 344#ifdef PIPE_ARCH_BIG_ENDIAN 345 value = util_bswap32(value); 346#endif 347 *(uint32_t *)attrib = value; 348} 349 350static void 351emit_R10G10B10A2_SNORM( const void *attrib, void *ptr ) 352{ 353 float *src = (float *)ptr; 354 uint32_t value = 0; 355 value |= (uint32_t)(((uint32_t)(CLAMP(src[0], -1, 1) * 0x1ff)) & 0x3ff) ; 356 value |= (uint32_t)((((uint32_t)(CLAMP(src[1], -1, 1) * 0x1ff)) & 0x3ff) << 10) ; 357 value |= (uint32_t)((((uint32_t)(CLAMP(src[2], -1, 1) * 0x1ff)) & 0x3ff) << 20) ; 358 value |= (uint32_t)(((uint32_t)(CLAMP(src[3], -1, 1) * 0x1)) << 30) ; 359#ifdef PIPE_ARCH_BIG_ENDIAN 360 value = util_bswap32(value); 361#endif 362 *(uint32_t *)attrib = value; 363} 364 365static void 366emit_R10G10B10A2_SSCALED( const void *attrib, void *ptr) 367{ 368 float *src = (float *)ptr; 369 uint32_t value = 0; 370 value |= (uint32_t)(((uint32_t)CLAMP(src[0], -512, 511)) & 0x3ff) ; 371 value |= (uint32_t)((((uint32_t)CLAMP(src[1], -512, 511)) & 0x3ff) << 10) ; 372 value |= (uint32_t)((((uint32_t)CLAMP(src[2], -512, 511)) & 0x3ff) << 20) ; 373 value |= (uint32_t)(((uint32_t)CLAMP(src[3], -2, 1)) << 30) ; 374#ifdef PIPE_ARCH_BIG_ENDIAN 375 value = util_bswap32(value); 376#endif 377 *(uint32_t *)attrib = value; 378} 379 380static void 381emit_NULL( const void *attrib, void *ptr ) 382{ 383 /* do nothing is the only sensible option */ 384} 385 386static emit_func get_emit_func( enum pipe_format format ) 387{ 388 switch (format) { 389 case PIPE_FORMAT_R64_FLOAT: 390 return &emit_R64_FLOAT; 391 case PIPE_FORMAT_R64G64_FLOAT: 392 return &emit_R64G64_FLOAT; 393 case PIPE_FORMAT_R64G64B64_FLOAT: 394 return &emit_R64G64B64_FLOAT; 395 case PIPE_FORMAT_R64G64B64A64_FLOAT: 396 return &emit_R64G64B64A64_FLOAT; 397 398 case PIPE_FORMAT_R32_FLOAT: 399 return &emit_R32_FLOAT; 400 case PIPE_FORMAT_R32G32_FLOAT: 401 return &emit_R32G32_FLOAT; 402 case PIPE_FORMAT_R32G32B32_FLOAT: 403 return &emit_R32G32B32_FLOAT; 404 case PIPE_FORMAT_R32G32B32A32_FLOAT: 405 return &emit_R32G32B32A32_FLOAT; 406 407 case PIPE_FORMAT_R16_FLOAT: 408 return &emit_R16_FLOAT; 409 case PIPE_FORMAT_R16G16_FLOAT: 410 return &emit_R16G16_FLOAT; 411 case PIPE_FORMAT_R16G16B16_FLOAT: 412 return &emit_R16G16B16_FLOAT; 413 case PIPE_FORMAT_R16G16B16A16_FLOAT: 414 return &emit_R16G16B16A16_FLOAT; 415 416 case PIPE_FORMAT_R32_UNORM: 417 return &emit_R32_UNORM; 418 case PIPE_FORMAT_R32G32_UNORM: 419 return &emit_R32G32_UNORM; 420 case PIPE_FORMAT_R32G32B32_UNORM: 421 return &emit_R32G32B32_UNORM; 422 case PIPE_FORMAT_R32G32B32A32_UNORM: 423 return &emit_R32G32B32A32_UNORM; 424 425 case PIPE_FORMAT_R32_USCALED: 426 return &emit_R32_USCALED; 427 case PIPE_FORMAT_R32G32_USCALED: 428 return &emit_R32G32_USCALED; 429 case PIPE_FORMAT_R32G32B32_USCALED: 430 return &emit_R32G32B32_USCALED; 431 case PIPE_FORMAT_R32G32B32A32_USCALED: 432 return &emit_R32G32B32A32_USCALED; 433 434 case PIPE_FORMAT_R32_SNORM: 435 return &emit_R32_SNORM; 436 case PIPE_FORMAT_R32G32_SNORM: 437 return &emit_R32G32_SNORM; 438 case PIPE_FORMAT_R32G32B32_SNORM: 439 return &emit_R32G32B32_SNORM; 440 case PIPE_FORMAT_R32G32B32A32_SNORM: 441 return &emit_R32G32B32A32_SNORM; 442 443 case PIPE_FORMAT_R32_SSCALED: 444 return &emit_R32_SSCALED; 445 case PIPE_FORMAT_R32G32_SSCALED: 446 return &emit_R32G32_SSCALED; 447 case PIPE_FORMAT_R32G32B32_SSCALED: 448 return &emit_R32G32B32_SSCALED; 449 case PIPE_FORMAT_R32G32B32A32_SSCALED: 450 return &emit_R32G32B32A32_SSCALED; 451 452 case PIPE_FORMAT_R16_UNORM: 453 return &emit_R16_UNORM; 454 case PIPE_FORMAT_R16G16_UNORM: 455 return &emit_R16G16_UNORM; 456 case PIPE_FORMAT_R16G16B16_UNORM: 457 return &emit_R16G16B16_UNORM; 458 case PIPE_FORMAT_R16G16B16A16_UNORM: 459 return &emit_R16G16B16A16_UNORM; 460 461 case PIPE_FORMAT_R16_USCALED: 462 return &emit_R16_USCALED; 463 case PIPE_FORMAT_R16G16_USCALED: 464 return &emit_R16G16_USCALED; 465 case PIPE_FORMAT_R16G16B16_USCALED: 466 return &emit_R16G16B16_USCALED; 467 case PIPE_FORMAT_R16G16B16A16_USCALED: 468 return &emit_R16G16B16A16_USCALED; 469 470 case PIPE_FORMAT_R16_SNORM: 471 return &emit_R16_SNORM; 472 case PIPE_FORMAT_R16G16_SNORM: 473 return &emit_R16G16_SNORM; 474 case PIPE_FORMAT_R16G16B16_SNORM: 475 return &emit_R16G16B16_SNORM; 476 case PIPE_FORMAT_R16G16B16A16_SNORM: 477 return &emit_R16G16B16A16_SNORM; 478 479 case PIPE_FORMAT_R16_SSCALED: 480 return &emit_R16_SSCALED; 481 case PIPE_FORMAT_R16G16_SSCALED: 482 return &emit_R16G16_SSCALED; 483 case PIPE_FORMAT_R16G16B16_SSCALED: 484 return &emit_R16G16B16_SSCALED; 485 case PIPE_FORMAT_R16G16B16A16_SSCALED: 486 return &emit_R16G16B16A16_SSCALED; 487 488 case PIPE_FORMAT_R8_UNORM: 489 return &emit_R8_UNORM; 490 case PIPE_FORMAT_R8G8_UNORM: 491 return &emit_R8G8_UNORM; 492 case PIPE_FORMAT_R8G8B8_UNORM: 493 return &emit_R8G8B8_UNORM; 494 case PIPE_FORMAT_R8G8B8A8_UNORM: 495 return &emit_R8G8B8A8_UNORM; 496 497 case PIPE_FORMAT_R8_USCALED: 498 return &emit_R8_USCALED; 499 case PIPE_FORMAT_R8G8_USCALED: 500 return &emit_R8G8_USCALED; 501 case PIPE_FORMAT_R8G8B8_USCALED: 502 return &emit_R8G8B8_USCALED; 503 case PIPE_FORMAT_R8G8B8A8_USCALED: 504 return &emit_R8G8B8A8_USCALED; 505 506 case PIPE_FORMAT_R8_SNORM: 507 return &emit_R8_SNORM; 508 case PIPE_FORMAT_R8G8_SNORM: 509 return &emit_R8G8_SNORM; 510 case PIPE_FORMAT_R8G8B8_SNORM: 511 return &emit_R8G8B8_SNORM; 512 case PIPE_FORMAT_R8G8B8A8_SNORM: 513 return &emit_R8G8B8A8_SNORM; 514 515 case PIPE_FORMAT_R8_SSCALED: 516 return &emit_R8_SSCALED; 517 case PIPE_FORMAT_R8G8_SSCALED: 518 return &emit_R8G8_SSCALED; 519 case PIPE_FORMAT_R8G8B8_SSCALED: 520 return &emit_R8G8B8_SSCALED; 521 case PIPE_FORMAT_R8G8B8A8_SSCALED: 522 return &emit_R8G8B8A8_SSCALED; 523 524 case PIPE_FORMAT_B8G8R8A8_UNORM: 525 return &emit_B8G8R8A8_UNORM; 526 527 case PIPE_FORMAT_A8R8G8B8_UNORM: 528 return &emit_A8R8G8B8_UNORM; 529 530 case PIPE_FORMAT_R32_UINT: 531 return &emit_R32_UINT; 532 case PIPE_FORMAT_R32G32_UINT: 533 return &emit_R32G32_UINT; 534 case PIPE_FORMAT_R32G32B32_UINT: 535 return &emit_R32G32B32_UINT; 536 case PIPE_FORMAT_R32G32B32A32_UINT: 537 return &emit_R32G32B32A32_UINT; 538 539 case PIPE_FORMAT_R16_UINT: 540 return &emit_R16_UINT; 541 case PIPE_FORMAT_R16G16_UINT: 542 return &emit_R16G16_UINT; 543 case PIPE_FORMAT_R16G16B16_UINT: 544 return &emit_R16G16B16_UINT; 545 case PIPE_FORMAT_R16G16B16A16_UINT: 546 return &emit_R16G16B16A16_UINT; 547 548 case PIPE_FORMAT_R8_UINT: 549 return &emit_R8_UINT; 550 case PIPE_FORMAT_R8G8_UINT: 551 return &emit_R8G8_UINT; 552 case PIPE_FORMAT_R8G8B8_UINT: 553 return &emit_R8G8B8_UINT; 554 case PIPE_FORMAT_R8G8B8A8_UINT: 555 return &emit_R8G8B8A8_UINT; 556 557 case PIPE_FORMAT_R32_SINT: 558 return &emit_R32_SINT; 559 case PIPE_FORMAT_R32G32_SINT: 560 return &emit_R32G32_SINT; 561 case PIPE_FORMAT_R32G32B32_SINT: 562 return &emit_R32G32B32_SINT; 563 case PIPE_FORMAT_R32G32B32A32_SINT: 564 return &emit_R32G32B32A32_SINT; 565 566 case PIPE_FORMAT_R16_SINT: 567 return &emit_R16_SINT; 568 case PIPE_FORMAT_R16G16_SINT: 569 return &emit_R16G16_SINT; 570 case PIPE_FORMAT_R16G16B16_SINT: 571 return &emit_R16G16B16_SINT; 572 case PIPE_FORMAT_R16G16B16A16_SINT: 573 return &emit_R16G16B16A16_SINT; 574 575 case PIPE_FORMAT_R8_SINT: 576 return &emit_R8_SINT; 577 case PIPE_FORMAT_R8G8_SINT: 578 return &emit_R8G8_SINT; 579 case PIPE_FORMAT_R8G8B8_SINT: 580 return &emit_R8G8B8_SINT; 581 case PIPE_FORMAT_R8G8B8A8_SINT: 582 return &emit_R8G8B8A8_SINT; 583 584 case PIPE_FORMAT_B10G10R10A2_UNORM: 585 return &emit_B10G10R10A2_UNORM; 586 case PIPE_FORMAT_B10G10R10A2_USCALED: 587 return &emit_B10G10R10A2_USCALED; 588 case PIPE_FORMAT_B10G10R10A2_SNORM: 589 return &emit_B10G10R10A2_SNORM; 590 case PIPE_FORMAT_B10G10R10A2_SSCALED: 591 return &emit_B10G10R10A2_SSCALED; 592 593 case PIPE_FORMAT_R10G10B10A2_UNORM: 594 return &emit_R10G10B10A2_UNORM; 595 case PIPE_FORMAT_R10G10B10A2_USCALED: 596 return &emit_R10G10B10A2_USCALED; 597 case PIPE_FORMAT_R10G10B10A2_SNORM: 598 return &emit_R10G10B10A2_SNORM; 599 case PIPE_FORMAT_R10G10B10A2_SSCALED: 600 return &emit_R10G10B10A2_SSCALED; 601 602 default: 603 assert(0); 604 return &emit_NULL; 605 } 606} 607 608static ALWAYS_INLINE void PIPE_CDECL generic_run_one( struct translate_generic *tg, 609 unsigned elt, 610 unsigned start_instance, 611 unsigned instance_id, 612 void *vert ) 613{ 614 unsigned nr_attrs = tg->nr_attrib; 615 unsigned attr; 616 617 for (attr = 0; attr < nr_attrs; attr++) { 618 float data[4]; 619 uint8_t *dst = (uint8_t *)vert + tg->attrib[attr].output_offset; 620 621 if (tg->attrib[attr].type == TRANSLATE_ELEMENT_NORMAL) { 622 const uint8_t *src; 623 unsigned index; 624 int copy_size; 625 626 if (tg->attrib[attr].instance_divisor) { 627 index = start_instance; 628 index += (instance_id / tg->attrib[attr].instance_divisor); 629 /* XXX we need to clamp the index here too, but to a 630 * per-array max value, not the draw->pt.max_index value 631 * that's being given to us via translate->set_buffer(). 632 */ 633 } 634 else { 635 index = elt; 636 /* clamp to avoid going out of bounds */ 637 index = MIN2(index, tg->attrib[attr].max_index); 638 } 639 640 src = tg->attrib[attr].input_ptr + 641 (ptrdiff_t)tg->attrib[attr].input_stride * index; 642 643 copy_size = tg->attrib[attr].copy_size; 644 if(likely(copy_size >= 0)) 645 memcpy(dst, src, copy_size); 646 else 647 { 648 tg->attrib[attr].fetch( data, src, 0, 0 ); 649 650 if (0) 651 debug_printf("Fetch linear attr %d from %p stride %d index %d: " 652 " %f, %f, %f, %f \n", 653 attr, 654 tg->attrib[attr].input_ptr, 655 tg->attrib[attr].input_stride, 656 index, 657 data[0], data[1],data[2], data[3]); 658 659 tg->attrib[attr].emit( data, dst ); 660 } 661 } else { 662 if(likely(tg->attrib[attr].copy_size >= 0)) 663 memcpy(data, &instance_id, 4); 664 else 665 { 666 data[0] = (float)instance_id; 667 tg->attrib[attr].emit( data, dst ); 668 } 669 } 670 } 671} 672 673/** 674 * Fetch vertex attributes for 'count' vertices. 675 */ 676static void PIPE_CDECL generic_run_elts( struct translate *translate, 677 const unsigned *elts, 678 unsigned count, 679 unsigned start_instance, 680 unsigned instance_id, 681 void *output_buffer ) 682{ 683 struct translate_generic *tg = translate_generic(translate); 684 char *vert = output_buffer; 685 unsigned i; 686 687 for (i = 0; i < count; i++) { 688 generic_run_one(tg, *elts++, start_instance, instance_id, vert); 689 vert += tg->translate.key.output_stride; 690 } 691} 692 693static void PIPE_CDECL generic_run_elts16( struct translate *translate, 694 const uint16_t *elts, 695 unsigned count, 696 unsigned start_instance, 697 unsigned instance_id, 698 void *output_buffer ) 699{ 700 struct translate_generic *tg = translate_generic(translate); 701 char *vert = output_buffer; 702 unsigned i; 703 704 for (i = 0; i < count; i++) { 705 generic_run_one(tg, *elts++, start_instance, instance_id, vert); 706 vert += tg->translate.key.output_stride; 707 } 708} 709 710static void PIPE_CDECL generic_run_elts8( struct translate *translate, 711 const uint8_t *elts, 712 unsigned count, 713 unsigned start_instance, 714 unsigned instance_id, 715 void *output_buffer ) 716{ 717 struct translate_generic *tg = translate_generic(translate); 718 char *vert = output_buffer; 719 unsigned i; 720 721 for (i = 0; i < count; i++) { 722 generic_run_one(tg, *elts++, start_instance, instance_id, vert); 723 vert += tg->translate.key.output_stride; 724 } 725} 726 727static void PIPE_CDECL generic_run( struct translate *translate, 728 unsigned start, 729 unsigned count, 730 unsigned start_instance, 731 unsigned instance_id, 732 void *output_buffer ) 733{ 734 struct translate_generic *tg = translate_generic(translate); 735 char *vert = output_buffer; 736 unsigned i; 737 738 for (i = 0; i < count; i++) { 739 generic_run_one(tg, start + i, start_instance, instance_id, vert); 740 vert += tg->translate.key.output_stride; 741 } 742} 743 744 745 746static void generic_set_buffer( struct translate *translate, 747 unsigned buf, 748 const void *ptr, 749 unsigned stride, 750 unsigned max_index ) 751{ 752 struct translate_generic *tg = translate_generic(translate); 753 unsigned i; 754 755 for (i = 0; i < tg->nr_attrib; i++) { 756 if (tg->attrib[i].buffer == buf) { 757 tg->attrib[i].input_ptr = ((const uint8_t *)ptr + 758 tg->attrib[i].input_offset); 759 tg->attrib[i].input_stride = stride; 760 tg->attrib[i].max_index = max_index; 761 } 762 } 763} 764 765 766static void generic_release( struct translate *translate ) 767{ 768 /* Refcount? 769 */ 770 FREE(translate); 771} 772 773static boolean 774is_legal_int_format_combo( const struct util_format_description *src, 775 const struct util_format_description *dst ) 776{ 777 unsigned i; 778 unsigned nr = MIN2(src->nr_channels, dst->nr_channels); 779 780 for (i = 0; i < nr; i++) { 781 /* The signs must match. */ 782 if (src->channel[i].type != dst->channel[i].type) { 783 return FALSE; 784 } 785 786 /* Integers must not lose precision at any point in the pipeline. */ 787 if (src->channel[i].size > dst->channel[i].size) { 788 return FALSE; 789 } 790 } 791 return TRUE; 792} 793 794struct translate *translate_generic_create( const struct translate_key *key ) 795{ 796 struct translate_generic *tg = CALLOC_STRUCT(translate_generic); 797 unsigned i; 798 799 if (tg == NULL) 800 return NULL; 801 802 assert(key->nr_elements <= TRANSLATE_MAX_ATTRIBS); 803 804 tg->translate.key = *key; 805 tg->translate.release = generic_release; 806 tg->translate.set_buffer = generic_set_buffer; 807 tg->translate.run_elts = generic_run_elts; 808 tg->translate.run_elts16 = generic_run_elts16; 809 tg->translate.run_elts8 = generic_run_elts8; 810 tg->translate.run = generic_run; 811 812 for (i = 0; i < key->nr_elements; i++) { 813 const struct util_format_description *format_desc = 814 util_format_description(key->element[i].input_format); 815 816 assert(format_desc); 817 818 tg->attrib[i].type = key->element[i].type; 819 820 if (format_desc->channel[0].pure_integer) { 821 const struct util_format_description *out_format_desc = 822 util_format_description(key->element[i].output_format); 823 824 if (!is_legal_int_format_combo(format_desc, out_format_desc)) { 825 FREE(tg); 826 return NULL; 827 } 828 829 if (format_desc->channel[0].type == UTIL_FORMAT_TYPE_SIGNED) { 830 assert(format_desc->fetch_rgba_sint); 831 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_sint; 832 } else { 833 assert(format_desc->fetch_rgba_uint); 834 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_uint; 835 } 836 } else { 837 assert(format_desc->fetch_rgba_float); 838 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_float; 839 } 840 841 tg->attrib[i].buffer = key->element[i].input_buffer; 842 tg->attrib[i].input_offset = key->element[i].input_offset; 843 tg->attrib[i].instance_divisor = key->element[i].instance_divisor; 844 845 tg->attrib[i].output_offset = key->element[i].output_offset; 846 847 tg->attrib[i].copy_size = -1; 848 if (tg->attrib[i].type == TRANSLATE_ELEMENT_INSTANCE_ID) 849 { 850 if(key->element[i].output_format == PIPE_FORMAT_R32_USCALED 851 || key->element[i].output_format == PIPE_FORMAT_R32_SSCALED) 852 tg->attrib[i].copy_size = 4; 853 } 854 else 855 { 856 if(key->element[i].input_format == key->element[i].output_format 857 && format_desc->block.width == 1 858 && format_desc->block.height == 1 859 && !(format_desc->block.bits & 7)) 860 tg->attrib[i].copy_size = format_desc->block.bits >> 3; 861 } 862 863 if(tg->attrib[i].copy_size < 0) 864 tg->attrib[i].emit = get_emit_func(key->element[i].output_format); 865 else 866 tg->attrib[i].emit = NULL; 867 } 868 869 tg->nr_attrib = key->nr_elements; 870 871 872 return &tg->translate; 873} 874 875boolean translate_generic_is_output_format_supported(enum pipe_format format) 876{ 877 switch(format) 878 { 879 case PIPE_FORMAT_R64G64B64A64_FLOAT: return TRUE; 880 case PIPE_FORMAT_R64G64B64_FLOAT: return TRUE; 881 case PIPE_FORMAT_R64G64_FLOAT: return TRUE; 882 case PIPE_FORMAT_R64_FLOAT: return TRUE; 883 884 case PIPE_FORMAT_R32G32B32A32_FLOAT: return TRUE; 885 case PIPE_FORMAT_R32G32B32_FLOAT: return TRUE; 886 case PIPE_FORMAT_R32G32_FLOAT: return TRUE; 887 case PIPE_FORMAT_R32_FLOAT: return TRUE; 888 889 case PIPE_FORMAT_R16G16B16A16_FLOAT: return TRUE; 890 case PIPE_FORMAT_R16G16B16_FLOAT: return TRUE; 891 case PIPE_FORMAT_R16G16_FLOAT: return TRUE; 892 case PIPE_FORMAT_R16_FLOAT: return TRUE; 893 894 case PIPE_FORMAT_R32G32B32A32_USCALED: return TRUE; 895 case PIPE_FORMAT_R32G32B32_USCALED: return TRUE; 896 case PIPE_FORMAT_R32G32_USCALED: return TRUE; 897 case PIPE_FORMAT_R32_USCALED: return TRUE; 898 899 case PIPE_FORMAT_R32G32B32A32_SSCALED: return TRUE; 900 case PIPE_FORMAT_R32G32B32_SSCALED: return TRUE; 901 case PIPE_FORMAT_R32G32_SSCALED: return TRUE; 902 case PIPE_FORMAT_R32_SSCALED: return TRUE; 903 904 case PIPE_FORMAT_R32G32B32A32_UNORM: return TRUE; 905 case PIPE_FORMAT_R32G32B32_UNORM: return TRUE; 906 case PIPE_FORMAT_R32G32_UNORM: return TRUE; 907 case PIPE_FORMAT_R32_UNORM: return TRUE; 908 909 case PIPE_FORMAT_R32G32B32A32_SNORM: return TRUE; 910 case PIPE_FORMAT_R32G32B32_SNORM: return TRUE; 911 case PIPE_FORMAT_R32G32_SNORM: return TRUE; 912 case PIPE_FORMAT_R32_SNORM: return TRUE; 913 914 case PIPE_FORMAT_R16G16B16A16_USCALED: return TRUE; 915 case PIPE_FORMAT_R16G16B16_USCALED: return TRUE; 916 case PIPE_FORMAT_R16G16_USCALED: return TRUE; 917 case PIPE_FORMAT_R16_USCALED: return TRUE; 918 919 case PIPE_FORMAT_R16G16B16A16_SSCALED: return TRUE; 920 case PIPE_FORMAT_R16G16B16_SSCALED: return TRUE; 921 case PIPE_FORMAT_R16G16_SSCALED: return TRUE; 922 case PIPE_FORMAT_R16_SSCALED: return TRUE; 923 924 case PIPE_FORMAT_R16G16B16A16_UNORM: return TRUE; 925 case PIPE_FORMAT_R16G16B16_UNORM: return TRUE; 926 case PIPE_FORMAT_R16G16_UNORM: return TRUE; 927 case PIPE_FORMAT_R16_UNORM: return TRUE; 928 929 case PIPE_FORMAT_R16G16B16A16_SNORM: return TRUE; 930 case PIPE_FORMAT_R16G16B16_SNORM: return TRUE; 931 case PIPE_FORMAT_R16G16_SNORM: return TRUE; 932 case PIPE_FORMAT_R16_SNORM: return TRUE; 933 934 case PIPE_FORMAT_R8G8B8A8_USCALED: return TRUE; 935 case PIPE_FORMAT_R8G8B8_USCALED: return TRUE; 936 case PIPE_FORMAT_R8G8_USCALED: return TRUE; 937 case PIPE_FORMAT_R8_USCALED: return TRUE; 938 939 case PIPE_FORMAT_R8G8B8A8_SSCALED: return TRUE; 940 case PIPE_FORMAT_R8G8B8_SSCALED: return TRUE; 941 case PIPE_FORMAT_R8G8_SSCALED: return TRUE; 942 case PIPE_FORMAT_R8_SSCALED: return TRUE; 943 944 case PIPE_FORMAT_R8G8B8A8_UNORM: return TRUE; 945 case PIPE_FORMAT_R8G8B8_UNORM: return TRUE; 946 case PIPE_FORMAT_R8G8_UNORM: return TRUE; 947 case PIPE_FORMAT_R8_UNORM: return TRUE; 948 949 case PIPE_FORMAT_R8G8B8A8_SNORM: return TRUE; 950 case PIPE_FORMAT_R8G8B8_SNORM: return TRUE; 951 case PIPE_FORMAT_R8G8_SNORM: return TRUE; 952 case PIPE_FORMAT_R8_SNORM: return TRUE; 953 954 case PIPE_FORMAT_A8R8G8B8_UNORM: return TRUE; 955 case PIPE_FORMAT_B8G8R8A8_UNORM: return TRUE; 956 957 case PIPE_FORMAT_R32G32B32A32_UINT: return TRUE; 958 case PIPE_FORMAT_R32G32B32_UINT: return TRUE; 959 case PIPE_FORMAT_R32G32_UINT: return TRUE; 960 case PIPE_FORMAT_R32_UINT: return TRUE; 961 962 case PIPE_FORMAT_R16G16B16A16_UINT: return TRUE; 963 case PIPE_FORMAT_R16G16B16_UINT: return TRUE; 964 case PIPE_FORMAT_R16G16_UINT: return TRUE; 965 case PIPE_FORMAT_R16_UINT: return TRUE; 966 967 case PIPE_FORMAT_R8G8B8A8_UINT: return TRUE; 968 case PIPE_FORMAT_R8G8B8_UINT: return TRUE; 969 case PIPE_FORMAT_R8G8_UINT: return TRUE; 970 case PIPE_FORMAT_R8_UINT: return TRUE; 971 972 case PIPE_FORMAT_R32G32B32A32_SINT: return TRUE; 973 case PIPE_FORMAT_R32G32B32_SINT: return TRUE; 974 case PIPE_FORMAT_R32G32_SINT: return TRUE; 975 case PIPE_FORMAT_R32_SINT: return TRUE; 976 977 case PIPE_FORMAT_R16G16B16A16_SINT: return TRUE; 978 case PIPE_FORMAT_R16G16B16_SINT: return TRUE; 979 case PIPE_FORMAT_R16G16_SINT: return TRUE; 980 case PIPE_FORMAT_R16_SINT: return TRUE; 981 982 case PIPE_FORMAT_R8G8B8A8_SINT: return TRUE; 983 case PIPE_FORMAT_R8G8B8_SINT: return TRUE; 984 case PIPE_FORMAT_R8G8_SINT: return TRUE; 985 case PIPE_FORMAT_R8_SINT: return TRUE; 986 987 case PIPE_FORMAT_B10G10R10A2_UNORM: return TRUE; 988 case PIPE_FORMAT_B10G10R10A2_USCALED: return TRUE; 989 case PIPE_FORMAT_B10G10R10A2_SNORM: return TRUE; 990 case PIPE_FORMAT_B10G10R10A2_SSCALED: return TRUE; 991 992 case PIPE_FORMAT_R10G10B10A2_UNORM: return TRUE; 993 case PIPE_FORMAT_R10G10B10A2_USCALED: return TRUE; 994 case PIPE_FORMAT_R10G10B10A2_SNORM: return TRUE; 995 case PIPE_FORMAT_R10G10B10A2_SSCALED: return TRUE; 996 997 default: return FALSE; 998 } 999} 1000