radeon_exa.c revision 921a55d8
1209ff23fSmrg/* 2209ff23fSmrg * Copyright 2005 Eric Anholt 3209ff23fSmrg * Copyright 2005 Benjamin Herrenschmidt 4209ff23fSmrg * All Rights Reserved. 5209ff23fSmrg * 6209ff23fSmrg * Permission is hereby granted, free of charge, to any person obtaining a 7209ff23fSmrg * copy of this software and associated documentation files (the "Software"), 8209ff23fSmrg * to deal in the Software without restriction, including without limitation 9209ff23fSmrg * the rights to use, copy, modify, merge, publish, distribute, sublicense, 10209ff23fSmrg * and/or sell copies of the Software, and to permit persons to whom the 11209ff23fSmrg * Software is furnished to do so, subject to the following conditions: 12209ff23fSmrg * 13209ff23fSmrg * The above copyright notice and this permission notice (including the next 14209ff23fSmrg * paragraph) shall be included in all copies or substantial portions of the 15209ff23fSmrg * Software. 16209ff23fSmrg * 17209ff23fSmrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 18209ff23fSmrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 19209ff23fSmrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 20209ff23fSmrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 21209ff23fSmrg * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 22209ff23fSmrg * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 23209ff23fSmrg * SOFTWARE. 24209ff23fSmrg * 25209ff23fSmrg * Authors: 26209ff23fSmrg * Eric Anholt <anholt@FreeBSD.org> 27209ff23fSmrg * Zack Rusin <zrusin@trolltech.com> 28209ff23fSmrg * Benjamin Herrenschmidt <benh@kernel.crashing.org> 29209ff23fSmrg * 30209ff23fSmrg */ 31209ff23fSmrg 32209ff23fSmrg#ifdef HAVE_CONFIG_H 33209ff23fSmrg#include "config.h" 34209ff23fSmrg#endif 35209ff23fSmrg 36209ff23fSmrg#include "radeon.h" 37209ff23fSmrg#include "radeon_reg.h" 38b7e1c893Smrg#include "r600_reg.h" 39209ff23fSmrg#ifdef XF86DRI 40b7e1c893Smrg#include "radeon_drm.h" 41209ff23fSmrg#endif 42209ff23fSmrg#include "radeon_macros.h" 43209ff23fSmrg#include "radeon_probe.h" 44209ff23fSmrg#include "radeon_version.h" 450974d292Smrg#include "radeon_exa_shared.h" 46209ff23fSmrg 47209ff23fSmrg#include "xf86.h" 48209ff23fSmrg 49209ff23fSmrg 50209ff23fSmrg/***********************************************************************/ 51209ff23fSmrg#define RINFO_FROM_SCREEN(pScr) ScrnInfoPtr pScrn = xf86Screens[pScr->myNum]; \ 52209ff23fSmrg RADEONInfoPtr info = RADEONPTR(pScrn) 53209ff23fSmrg 54209ff23fSmrgstatic struct { 55209ff23fSmrg int rop; 56209ff23fSmrg int pattern; 57209ff23fSmrg} RADEON_ROP[] = { 58209ff23fSmrg { RADEON_ROP3_ZERO, RADEON_ROP3_ZERO }, /* GXclear */ 59209ff23fSmrg { RADEON_ROP3_DSa, RADEON_ROP3_DPa }, /* Gxand */ 60209ff23fSmrg { RADEON_ROP3_SDna, RADEON_ROP3_PDna }, /* GXandReverse */ 61209ff23fSmrg { RADEON_ROP3_S, RADEON_ROP3_P }, /* GXcopy */ 62209ff23fSmrg { RADEON_ROP3_DSna, RADEON_ROP3_DPna }, /* GXandInverted */ 63209ff23fSmrg { RADEON_ROP3_D, RADEON_ROP3_D }, /* GXnoop */ 64209ff23fSmrg { RADEON_ROP3_DSx, RADEON_ROP3_DPx }, /* GXxor */ 65209ff23fSmrg { RADEON_ROP3_DSo, RADEON_ROP3_DPo }, /* GXor */ 66209ff23fSmrg { RADEON_ROP3_DSon, RADEON_ROP3_DPon }, /* GXnor */ 67209ff23fSmrg { RADEON_ROP3_DSxn, RADEON_ROP3_PDxn }, /* GXequiv */ 68209ff23fSmrg { RADEON_ROP3_Dn, RADEON_ROP3_Dn }, /* GXinvert */ 69209ff23fSmrg { RADEON_ROP3_SDno, RADEON_ROP3_PDno }, /* GXorReverse */ 70209ff23fSmrg { RADEON_ROP3_Sn, RADEON_ROP3_Pn }, /* GXcopyInverted */ 71209ff23fSmrg { RADEON_ROP3_DSno, RADEON_ROP3_DPno }, /* GXorInverted */ 72209ff23fSmrg { RADEON_ROP3_DSan, RADEON_ROP3_DPan }, /* GXnand */ 73209ff23fSmrg { RADEON_ROP3_ONE, RADEON_ROP3_ONE } /* GXset */ 74209ff23fSmrg}; 75209ff23fSmrg 76209ff23fSmrg/* Compute log base 2 of val. */ 77209ff23fSmrgstatic __inline__ int 78209ff23fSmrgRADEONLog2(int val) 79209ff23fSmrg{ 80209ff23fSmrg int bits; 81209ff23fSmrg#if (defined __i386__ || defined __x86_64__) && (defined __GNUC__) 82209ff23fSmrg __asm volatile("bsrl %1, %0" 83209ff23fSmrg : "=r" (bits) 84209ff23fSmrg : "c" (val) 85209ff23fSmrg ); 86209ff23fSmrg return bits; 87209ff23fSmrg#else 88209ff23fSmrg for (bits = 0; val != 0; val >>= 1, ++bits) 89209ff23fSmrg ; 90209ff23fSmrg return bits - 1; 91209ff23fSmrg#endif 92209ff23fSmrg} 93209ff23fSmrg 94209ff23fSmrgstatic __inline__ uint32_t F_TO_DW(float val) 95209ff23fSmrg{ 96209ff23fSmrg union { 97209ff23fSmrg float f; 98209ff23fSmrg uint32_t l; 99209ff23fSmrg } tmp; 100209ff23fSmrg tmp.f = val; 101209ff23fSmrg return tmp.l; 102209ff23fSmrg} 103209ff23fSmrg 104ad43ddacSmrg 105209ff23fSmrg/* Assumes that depth 15 and 16 can be used as depth 16, which is okay since we 106209ff23fSmrg * require src and dest datatypes to be equal. 107209ff23fSmrg */ 108209ff23fSmrgBool RADEONGetDatatypeBpp(int bpp, uint32_t *type) 109209ff23fSmrg{ 110209ff23fSmrg switch (bpp) { 111209ff23fSmrg case 8: 112209ff23fSmrg *type = ATI_DATATYPE_CI8; 113209ff23fSmrg return TRUE; 114209ff23fSmrg case 16: 115209ff23fSmrg *type = ATI_DATATYPE_RGB565; 116209ff23fSmrg return TRUE; 117209ff23fSmrg case 24: 118209ff23fSmrg *type = ATI_DATATYPE_CI8; 119209ff23fSmrg return TRUE; 120209ff23fSmrg case 32: 121209ff23fSmrg *type = ATI_DATATYPE_ARGB8888; 122209ff23fSmrg return TRUE; 123209ff23fSmrg default: 124209ff23fSmrg RADEON_FALLBACK(("Unsupported bpp: %d\n", bpp)); 125209ff23fSmrg return FALSE; 126209ff23fSmrg } 127209ff23fSmrg} 128209ff23fSmrg 129209ff23fSmrgstatic Bool RADEONPixmapIsColortiled(PixmapPtr pPix) 130209ff23fSmrg{ 131209ff23fSmrg RINFO_FROM_SCREEN(pPix->drawable.pScreen); 132209ff23fSmrg 133209ff23fSmrg /* This doesn't account for the back buffer, which we may want to wrap in 134209ff23fSmrg * a pixmap at some point for the purposes of DRI buffer moves. 135209ff23fSmrg */ 136209ff23fSmrg if (info->tilingEnabled && exaGetPixmapOffset(pPix) == 0) 137209ff23fSmrg return TRUE; 138209ff23fSmrg else 139209ff23fSmrg return FALSE; 140209ff23fSmrg} 141209ff23fSmrg 142209ff23fSmrgstatic Bool RADEONGetOffsetPitch(PixmapPtr pPix, int bpp, uint32_t *pitch_offset, 143209ff23fSmrg unsigned int offset, unsigned int pitch) 144209ff23fSmrg{ 145209ff23fSmrg RINFO_FROM_SCREEN(pPix->drawable.pScreen); 146209ff23fSmrg 147b7e1c893Smrg if (pitch > 16320 || pitch % info->accel_state->exa->pixmapPitchAlign != 0) 148209ff23fSmrg RADEON_FALLBACK(("Bad pitch 0x%08x\n", pitch)); 149209ff23fSmrg 150b7e1c893Smrg if (offset % info->accel_state->exa->pixmapOffsetAlign != 0) 151209ff23fSmrg RADEON_FALLBACK(("Bad offset 0x%08x\n", offset)); 152209ff23fSmrg 153209ff23fSmrg pitch = pitch >> 6; 154209ff23fSmrg *pitch_offset = (pitch << 22) | (offset >> 10); 155209ff23fSmrg 156209ff23fSmrg /* If it's the front buffer, we've got to note that it's tiled? */ 157209ff23fSmrg if (RADEONPixmapIsColortiled(pPix)) 158209ff23fSmrg *pitch_offset |= RADEON_DST_TILE_MACRO; 159209ff23fSmrg return TRUE; 160209ff23fSmrg} 161209ff23fSmrg 162209ff23fSmrgBool RADEONGetPixmapOffsetPitch(PixmapPtr pPix, uint32_t *pitch_offset) 163209ff23fSmrg{ 164209ff23fSmrg uint32_t pitch, offset; 165209ff23fSmrg int bpp; 166209ff23fSmrg 167209ff23fSmrg bpp = pPix->drawable.bitsPerPixel; 168209ff23fSmrg if (bpp == 24) 169209ff23fSmrg bpp = 8; 170209ff23fSmrg 171ad43ddacSmrg offset = radeonGetPixmapOffset(pPix); 172209ff23fSmrg pitch = exaGetPixmapPitch(pPix); 173209ff23fSmrg 174209ff23fSmrg return RADEONGetOffsetPitch(pPix, bpp, pitch_offset, offset, pitch); 175209ff23fSmrg} 176209ff23fSmrg 177921a55d8Smrg/** 178921a55d8Smrg * Returns whether the provided transform is affine. 179921a55d8Smrg * 180921a55d8Smrg * transform may be null. 181921a55d8Smrg */ 182921a55d8SmrgBool radeon_transform_is_affine(PictTransformPtr t) 183921a55d8Smrg{ 184921a55d8Smrg if (t == NULL) 185921a55d8Smrg return TRUE; 186921a55d8Smrg return t->matrix[2][0] == 0 && t->matrix[2][1] == 0; 187921a55d8Smrg} 188921a55d8Smrg 189209ff23fSmrg#if X_BYTE_ORDER == X_BIG_ENDIAN 190209ff23fSmrg 191b7e1c893Smrgstatic unsigned long swapper_surfaces[6]; 192209ff23fSmrg 193ad43ddacSmrgstatic Bool RADEONPrepareAccess_BE(PixmapPtr pPix, int index) 194209ff23fSmrg{ 195209ff23fSmrg RINFO_FROM_SCREEN(pPix->drawable.pScreen); 196209ff23fSmrg unsigned char *RADEONMMIO = info->MMIO; 197209ff23fSmrg uint32_t offset = exaGetPixmapOffset(pPix); 198209ff23fSmrg int bpp, soff; 199209ff23fSmrg uint32_t size, flags; 200209ff23fSmrg 201209ff23fSmrg /* Front buffer is always set with proper swappers */ 202209ff23fSmrg if (offset == 0) 203209ff23fSmrg return TRUE; 204209ff23fSmrg 205209ff23fSmrg /* If same bpp as front buffer, just do nothing as the main 206209ff23fSmrg * swappers will apply 207209ff23fSmrg */ 208209ff23fSmrg bpp = pPix->drawable.bitsPerPixel; 209209ff23fSmrg if (bpp == pScrn->bitsPerPixel) 210209ff23fSmrg return TRUE; 211209ff23fSmrg 212209ff23fSmrg /* We need to setup a separate swapper, let's request a 213209ff23fSmrg * surface. We need to align the size first 214209ff23fSmrg */ 215209ff23fSmrg size = exaGetPixmapSize(pPix); 216ad43ddacSmrg size = RADEON_ALIGN(size, RADEON_GPU_PAGE_SIZE); 217209ff23fSmrg 218209ff23fSmrg /* Set surface to tiling disabled with appropriate swapper */ 219209ff23fSmrg switch (bpp) { 220209ff23fSmrg case 16: 221209ff23fSmrg flags = RADEON_SURF_AP0_SWP_16BPP | RADEON_SURF_AP1_SWP_16BPP; 222209ff23fSmrg break; 223209ff23fSmrg case 32: 224209ff23fSmrg flags = RADEON_SURF_AP0_SWP_32BPP | RADEON_SURF_AP1_SWP_32BPP; 225209ff23fSmrg break; 226209ff23fSmrg default: 227209ff23fSmrg flags = 0; 228209ff23fSmrg } 229209ff23fSmrg#if defined(XF86DRI) 230209ff23fSmrg if (info->directRenderingEnabled && info->allowColorTiling) { 231b7e1c893Smrg struct drm_radeon_surface_alloc drmsurfalloc; 232209ff23fSmrg int rc; 233209ff23fSmrg 234209ff23fSmrg drmsurfalloc.address = offset; 235209ff23fSmrg drmsurfalloc.size = size; 236209ff23fSmrg drmsurfalloc.flags = flags | 1; /* bogus pitch to please DRM */ 237209ff23fSmrg 238b7e1c893Smrg rc = drmCommandWrite(info->dri->drmFD, DRM_RADEON_SURF_ALLOC, 239209ff23fSmrg &drmsurfalloc, sizeof(drmsurfalloc)); 240209ff23fSmrg if (rc < 0) { 241209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_ERROR, 242209ff23fSmrg "drm: could not allocate surface for access" 243209ff23fSmrg " swapper, err: %d!\n", rc); 244209ff23fSmrg return FALSE; 245209ff23fSmrg } 246209ff23fSmrg swapper_surfaces[index] = offset; 247209ff23fSmrg 248209ff23fSmrg return TRUE; 249209ff23fSmrg } 250209ff23fSmrg#endif 251209ff23fSmrg soff = (index + 1) * 0x10; 252209ff23fSmrg OUTREG(RADEON_SURFACE0_INFO + soff, flags); 253209ff23fSmrg OUTREG(RADEON_SURFACE0_LOWER_BOUND + soff, offset); 254209ff23fSmrg OUTREG(RADEON_SURFACE0_UPPER_BOUND + soff, offset + size - 1); 255209ff23fSmrg swapper_surfaces[index] = offset; 256209ff23fSmrg return TRUE; 257209ff23fSmrg} 258209ff23fSmrg 259ad43ddacSmrgstatic void RADEONFinishAccess_BE(PixmapPtr pPix, int index) 260209ff23fSmrg{ 261209ff23fSmrg RINFO_FROM_SCREEN(pPix->drawable.pScreen); 262209ff23fSmrg unsigned char *RADEONMMIO = info->MMIO; 263209ff23fSmrg uint32_t offset = exaGetPixmapOffset(pPix); 264209ff23fSmrg int soff; 265209ff23fSmrg 266209ff23fSmrg /* Front buffer is always set with proper swappers */ 267209ff23fSmrg if (offset == 0) 268209ff23fSmrg return; 269209ff23fSmrg 270209ff23fSmrg if (swapper_surfaces[index] == 0) 271209ff23fSmrg return; 272209ff23fSmrg#if defined(XF86DRI) 273209ff23fSmrg if (info->directRenderingEnabled && info->allowColorTiling) { 274b7e1c893Smrg struct drm_radeon_surface_free drmsurffree; 275209ff23fSmrg 276209ff23fSmrg drmsurffree.address = offset; 277b7e1c893Smrg drmCommandWrite(info->dri->drmFD, DRM_RADEON_SURF_FREE, 278209ff23fSmrg &drmsurffree, sizeof(drmsurffree)); 279209ff23fSmrg swapper_surfaces[index] = 0; 280209ff23fSmrg return; 281209ff23fSmrg } 282209ff23fSmrg#endif 283209ff23fSmrg soff = (index + 1) * 0x10; 284209ff23fSmrg OUTREG(RADEON_SURFACE0_INFO + soff, 0); 285209ff23fSmrg OUTREG(RADEON_SURFACE0_LOWER_BOUND + soff, 0); 286209ff23fSmrg OUTREG(RADEON_SURFACE0_UPPER_BOUND + soff, 0); 287209ff23fSmrg swapper_surfaces[index] = 0; 288209ff23fSmrg} 289209ff23fSmrg 290209ff23fSmrg#endif /* X_BYTE_ORDER == X_BIG_ENDIAN */ 291209ff23fSmrg 292ad43ddacSmrg#ifdef XF86DRM_MODE 293ad43ddacSmrgBool RADEONPrepareAccess_CS(PixmapPtr pPix, int index) 294ad43ddacSmrg{ 295ad43ddacSmrg ScreenPtr pScreen = pPix->drawable.pScreen; 296ad43ddacSmrg ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum]; 297ad43ddacSmrg RADEONInfoPtr info = RADEONPTR(pScrn); 298ad43ddacSmrg struct radeon_exa_pixmap_priv *driver_priv; 2990974d292Smrg uint32_t possible_domains = ~0U; 3000974d292Smrg uint32_t current_domain = 0; 3010974d292Smrg#ifdef EXA_MIXED_PIXMAPS 3020974d292Smrg Bool can_fail = !(pPix->drawable.bitsPerPixel < 8) && 3030974d292Smrg pPix != pScreen->GetScreenPixmap(pScreen) && 3040974d292Smrg (info->accel_state->exa->flags & EXA_MIXED_PIXMAPS); 3050974d292Smrg#else 3060974d292Smrg Bool can_fail = FALSE; 3070974d292Smrg#endif 3080974d292Smrg Bool flush = FALSE; 309ad43ddacSmrg int ret; 310921a55d8Smrg uint32_t tiling_flags = 0, pitch = 0; 311ad43ddacSmrg 312ad43ddacSmrg#if X_BYTE_ORDER == X_BIG_ENDIAN 313ad43ddacSmrg /* May need to handle byte swapping in DownloadFrom/UploadToScreen */ 3140974d292Smrg if (can_fail && pPix->drawable.bitsPerPixel > 8) 315ad43ddacSmrg return FALSE; 316ad43ddacSmrg#endif 317ad43ddacSmrg 318ad43ddacSmrg driver_priv = exaGetPixmapDriverPrivate(pPix); 319ad43ddacSmrg if (!driver_priv) 320ad43ddacSmrg return FALSE; 321ad43ddacSmrg 322921a55d8Smrg /* check if we are tiled */ 323921a55d8Smrg ret = radeon_bo_get_tiling(driver_priv->bo, &tiling_flags, &pitch); 324921a55d8Smrg if (ret) 325921a55d8Smrg return FALSE; 326921a55d8Smrg /* untile in DFS/UTS */ 327921a55d8Smrg if (tiling_flags & (RADEON_TILING_MACRO | RADEON_TILING_MICRO)) 328921a55d8Smrg return FALSE; 329921a55d8Smrg 330ad43ddacSmrg /* if we have more refs than just the BO then flush */ 3310974d292Smrg if (radeon_bo_is_referenced_by_cs(driver_priv->bo, info->cs)) { 3320974d292Smrg flush = TRUE; 3330974d292Smrg 3340974d292Smrg if (can_fail) { 3350974d292Smrg possible_domains = radeon_bo_get_src_domain(driver_priv->bo); 3360974d292Smrg if (possible_domains == RADEON_GEM_DOMAIN_VRAM) 3370974d292Smrg return FALSE; /* use DownloadFromScreen */ 3380974d292Smrg } 3390974d292Smrg } 3400974d292Smrg 3410974d292Smrg /* if the BO might end up in VRAM, prefer DownloadFromScreen */ 3420974d292Smrg if (can_fail && (possible_domains & RADEON_GEM_DOMAIN_VRAM)) { 3430974d292Smrg radeon_bo_is_busy(driver_priv->bo, ¤t_domain); 3440974d292Smrg 3450974d292Smrg if (current_domain & possible_domains) { 3460974d292Smrg if (current_domain == RADEON_GEM_DOMAIN_VRAM) 3470974d292Smrg return FALSE; 3480974d292Smrg } else if (possible_domains & RADEON_GEM_DOMAIN_VRAM) 3490974d292Smrg return FALSE; 3500974d292Smrg } 3510974d292Smrg 3520974d292Smrg if (flush) 353ad43ddacSmrg radeon_cs_flush_indirect(pScrn); 354ad43ddacSmrg 355ad43ddacSmrg /* flush IB */ 356ad43ddacSmrg ret = radeon_bo_map(driver_priv->bo, 1); 357ad43ddacSmrg if (ret) { 358ad43ddacSmrg FatalError("failed to map pixmap %d\n", ret); 359ad43ddacSmrg return FALSE; 360ad43ddacSmrg } 361ad43ddacSmrg driver_priv->bo_mapped = TRUE; 362ad43ddacSmrg 363ad43ddacSmrg pPix->devPrivate.ptr = driver_priv->bo->ptr; 364ad43ddacSmrg 365ad43ddacSmrg return TRUE; 366ad43ddacSmrg} 367ad43ddacSmrg 368ad43ddacSmrgvoid RADEONFinishAccess_CS(PixmapPtr pPix, int index) 369ad43ddacSmrg{ 370ad43ddacSmrg struct radeon_exa_pixmap_priv *driver_priv; 371ad43ddacSmrg 372ad43ddacSmrg driver_priv = exaGetPixmapDriverPrivate(pPix); 373ad43ddacSmrg if (!driver_priv || !driver_priv->bo_mapped) 374ad43ddacSmrg return; 375ad43ddacSmrg 376ad43ddacSmrg radeon_bo_unmap(driver_priv->bo); 3770974d292Smrg driver_priv->bo_mapped = FALSE; 378ad43ddacSmrg pPix->devPrivate.ptr = NULL; 379ad43ddacSmrg} 380ad43ddacSmrg 381ad43ddacSmrg 382ad43ddacSmrgvoid *RADEONEXACreatePixmap(ScreenPtr pScreen, int size, int align) 383ad43ddacSmrg{ 384ad43ddacSmrg ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum]; 385ad43ddacSmrg RADEONInfoPtr info = RADEONPTR(pScrn); 386ad43ddacSmrg struct radeon_exa_pixmap_priv *new_priv; 387ad43ddacSmrg 388ad43ddacSmrg#ifdef EXA_MIXED_PIXMAPS 389ad43ddacSmrg if (info->accel_state->exa->flags & EXA_MIXED_PIXMAPS) { 390ad43ddacSmrg if (size != 0 && !info->exa_force_create && 391ad43ddacSmrg info->exa_pixmaps == FALSE) 392ad43ddacSmrg return NULL; 393ad43ddacSmrg } 394ad43ddacSmrg#endif 395ad43ddacSmrg 3962f39173dSmrg new_priv = calloc(1, sizeof(struct radeon_exa_pixmap_priv)); 397ad43ddacSmrg if (!new_priv) 398ad43ddacSmrg return NULL; 399ad43ddacSmrg 400ad43ddacSmrg if (size == 0) 401ad43ddacSmrg return new_priv; 402ad43ddacSmrg 403ad43ddacSmrg new_priv->bo = radeon_bo_open(info->bufmgr, 0, size, align, 404ad43ddacSmrg RADEON_GEM_DOMAIN_VRAM, 0); 405ad43ddacSmrg if (!new_priv->bo) { 4062f39173dSmrg free(new_priv); 407ad43ddacSmrg ErrorF("Failed to alloc memory\n"); 408ad43ddacSmrg return NULL; 409ad43ddacSmrg } 410ad43ddacSmrg 411ad43ddacSmrg return new_priv; 412ad43ddacSmrg 413ad43ddacSmrg} 414ad43ddacSmrg 4152f39173dSmrgstatic const unsigned MicroBlockTable[5][3][2] = { 4162f39173dSmrg /*linear tiled square-tiled */ 4172f39173dSmrg {{32, 1}, {8, 4}, {0, 0}}, /* 8 bits per pixel */ 4182f39173dSmrg {{16, 1}, {8, 2}, {4, 4}}, /* 16 bits per pixel */ 4192f39173dSmrg {{ 8, 1}, {4, 2}, {0, 0}}, /* 32 bits per pixel */ 4202f39173dSmrg {{ 4, 1}, {0, 0}, {2, 2}}, /* 64 bits per pixel */ 4212f39173dSmrg {{ 2, 1}, {0, 0}, {0, 0}} /* 128 bits per pixel */ 4222f39173dSmrg}; 4232f39173dSmrg 4242f39173dSmrg/* Return true if macrotiling can be enabled */ 4252f39173dSmrgstatic Bool RADEONMacroSwitch(int width, int height, int bpp, 4262f39173dSmrg uint32_t flags, Bool rv350_mode) 4272f39173dSmrg{ 4282f39173dSmrg unsigned tilew, tileh, microtiled, logbpp; 4292f39173dSmrg 4302f39173dSmrg logbpp = RADEONLog2(bpp / 8); 4312f39173dSmrg if (logbpp > 4) 4322f39173dSmrg return 0; 4332f39173dSmrg 4342f39173dSmrg microtiled = !!(flags & RADEON_TILING_MICRO); 4352f39173dSmrg tilew = MicroBlockTable[logbpp][microtiled][0] * 8; 4362f39173dSmrg tileh = MicroBlockTable[logbpp][microtiled][1] * 8; 4372f39173dSmrg 4382f39173dSmrg /* See TX_FILTER1_n.MACRO_SWITCH. */ 4392f39173dSmrg if (rv350_mode) { 4402f39173dSmrg return width >= tilew && height >= tileh; 4412f39173dSmrg } else { 4422f39173dSmrg return width > tilew && height > tileh; 4432f39173dSmrg } 4442f39173dSmrg} 4452f39173dSmrg 446ad43ddacSmrgvoid *RADEONEXACreatePixmap2(ScreenPtr pScreen, int width, int height, 447ad43ddacSmrg int depth, int usage_hint, int bitsPerPixel, 448ad43ddacSmrg int *new_pitch) 449ad43ddacSmrg{ 450ad43ddacSmrg ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum]; 451ad43ddacSmrg RADEONInfoPtr info = RADEONPTR(pScrn); 452ad43ddacSmrg struct radeon_exa_pixmap_priv *new_priv; 453921a55d8Smrg int pitch, base_align; 454ad43ddacSmrg uint32_t size; 455ad43ddacSmrg uint32_t tiling = 0; 456921a55d8Smrg int cpp = bitsPerPixel / 8; 457ad43ddacSmrg 458ad43ddacSmrg#ifdef EXA_MIXED_PIXMAPS 459ad43ddacSmrg if (info->accel_state->exa->flags & EXA_MIXED_PIXMAPS) { 460ad43ddacSmrg if (width != 0 && height != 0 && !info->exa_force_create && 461ad43ddacSmrg info->exa_pixmaps == FALSE) 462ad43ddacSmrg return NULL; 463ad43ddacSmrg } 464ad43ddacSmrg#endif 465ad43ddacSmrg 466ad43ddacSmrg if (usage_hint) { 467ad43ddacSmrg if (info->allowColorTiling) { 468ad43ddacSmrg if (usage_hint & RADEON_CREATE_PIXMAP_TILING_MACRO) 469ad43ddacSmrg tiling |= RADEON_TILING_MACRO; 470ad43ddacSmrg if (usage_hint & RADEON_CREATE_PIXMAP_TILING_MICRO) 471ad43ddacSmrg tiling |= RADEON_TILING_MICRO; 472ad43ddacSmrg } 473ad43ddacSmrg } 474ad43ddacSmrg 4752f39173dSmrg /* Small pixmaps must not be macrotiled on R300, hw cannot sample them 4762f39173dSmrg * correctly because samplers automatically switch to macrolinear. */ 4772f39173dSmrg if (info->ChipFamily >= CHIP_FAMILY_R300 && 4782f39173dSmrg info->ChipFamily <= CHIP_FAMILY_RS740 && 4792f39173dSmrg (tiling & RADEON_TILING_MACRO) && 4802f39173dSmrg !RADEONMacroSwitch(width, height, bitsPerPixel, tiling, 4812f39173dSmrg info->ChipFamily >= CHIP_FAMILY_RV350)) { 4822f39173dSmrg tiling &= ~RADEON_TILING_MACRO; 4832f39173dSmrg } 4842f39173dSmrg 485921a55d8Smrg height = RADEON_ALIGN(height, drmmode_get_height_align(pScrn, tiling)); 486921a55d8Smrg pitch = RADEON_ALIGN(width, drmmode_get_pitch_align(pScrn, cpp, tiling)) * cpp; 487921a55d8Smrg base_align = drmmode_get_base_align(pScrn, cpp, tiling); 488921a55d8Smrg size = RADEON_ALIGN(height * pitch, RADEON_GPU_PAGE_SIZE); 489ad43ddacSmrg 4902f39173dSmrg new_priv = calloc(1, sizeof(struct radeon_exa_pixmap_priv)); 491ad43ddacSmrg if (!new_priv) 492ad43ddacSmrg return NULL; 493ad43ddacSmrg 494ad43ddacSmrg if (size == 0) 495ad43ddacSmrg return new_priv; 496ad43ddacSmrg 497921a55d8Smrg *new_pitch = pitch; 498ad43ddacSmrg 499921a55d8Smrg new_priv->bo = radeon_bo_open(info->bufmgr, 0, size, base_align, 500ad43ddacSmrg RADEON_GEM_DOMAIN_VRAM, 0); 501ad43ddacSmrg if (!new_priv->bo) { 5022f39173dSmrg free(new_priv); 503ad43ddacSmrg ErrorF("Failed to alloc memory\n"); 504ad43ddacSmrg return NULL; 505ad43ddacSmrg } 506ad43ddacSmrg 507ad43ddacSmrg if (tiling) 508ad43ddacSmrg radeon_bo_set_tiling(new_priv->bo, tiling, *new_pitch); 509ad43ddacSmrg 510ad43ddacSmrg return new_priv; 511ad43ddacSmrg} 512ad43ddacSmrg 513ad43ddacSmrgvoid RADEONEXADestroyPixmap(ScreenPtr pScreen, void *driverPriv) 514ad43ddacSmrg{ 515ad43ddacSmrg struct radeon_exa_pixmap_priv *driver_priv = driverPriv; 516ad43ddacSmrg 517ad43ddacSmrg if (!driverPriv) 518ad43ddacSmrg return; 519ad43ddacSmrg 520ad43ddacSmrg if (driver_priv->bo) 521ad43ddacSmrg radeon_bo_unref(driver_priv->bo); 5222f39173dSmrg free(driverPriv); 523ad43ddacSmrg} 524ad43ddacSmrg 525ad43ddacSmrgstruct radeon_bo *radeon_get_pixmap_bo(PixmapPtr pPix) 526ad43ddacSmrg{ 527ad43ddacSmrg struct radeon_exa_pixmap_priv *driver_priv; 528ad43ddacSmrg driver_priv = exaGetPixmapDriverPrivate(pPix); 529ad43ddacSmrg return driver_priv->bo; 530ad43ddacSmrg} 531ad43ddacSmrg 532ad43ddacSmrgvoid radeon_set_pixmap_bo(PixmapPtr pPix, struct radeon_bo *bo) 533ad43ddacSmrg{ 534ad43ddacSmrg struct radeon_exa_pixmap_priv *driver_priv; 535ad43ddacSmrg 536ad43ddacSmrg driver_priv = exaGetPixmapDriverPrivate(pPix); 537ad43ddacSmrg if (driver_priv) { 538ad43ddacSmrg if (driver_priv->bo) 539ad43ddacSmrg radeon_bo_unref(driver_priv->bo); 540ad43ddacSmrg 541ad43ddacSmrg radeon_bo_ref(bo); 542ad43ddacSmrg driver_priv->bo = bo; 543ad43ddacSmrg } 544ad43ddacSmrg} 545ad43ddacSmrg 546ad43ddacSmrgBool RADEONEXAPixmapIsOffscreen(PixmapPtr pPix) 547ad43ddacSmrg{ 548ad43ddacSmrg struct radeon_exa_pixmap_priv *driver_priv; 549ad43ddacSmrg 550ad43ddacSmrg driver_priv = exaGetPixmapDriverPrivate(pPix); 551ad43ddacSmrg 552ad43ddacSmrg if (!driver_priv) 553ad43ddacSmrg return FALSE; 554ad43ddacSmrg if (driver_priv->bo) 555ad43ddacSmrg return TRUE; 556ad43ddacSmrg return FALSE; 557ad43ddacSmrg} 558ad43ddacSmrg#endif 559ad43ddacSmrg 560209ff23fSmrg#define ENTER_DRAW(x) TRACE 561209ff23fSmrg#define LEAVE_DRAW(x) TRACE 562209ff23fSmrg/***********************************************************************/ 563209ff23fSmrg 564209ff23fSmrg#define ACCEL_MMIO 565209ff23fSmrg#define ACCEL_PREAMBLE() unsigned char *RADEONMMIO = info->MMIO 566209ff23fSmrg#define BEGIN_ACCEL(n) RADEONWaitForFifo(pScrn, (n)) 567209ff23fSmrg#define OUT_ACCEL_REG(reg, val) OUTREG(reg, val) 568209ff23fSmrg#define OUT_ACCEL_REG_F(reg, val) OUTREG(reg, F_TO_DW(val)) 569ad43ddacSmrg#define OUT_RELOC(x, read, write) do {} while(0) 570209ff23fSmrg#define FINISH_ACCEL() 571209ff23fSmrg 572209ff23fSmrg#ifdef RENDER 573209ff23fSmrg#include "radeon_exa_render.c" 574209ff23fSmrg#endif 575209ff23fSmrg#include "radeon_exa_funcs.c" 576209ff23fSmrg 577209ff23fSmrg#undef ACCEL_MMIO 578209ff23fSmrg#undef ACCEL_PREAMBLE 579209ff23fSmrg#undef BEGIN_ACCEL 580209ff23fSmrg#undef OUT_ACCEL_REG 581b7e1c893Smrg#undef OUT_ACCEL_REG_F 582209ff23fSmrg#undef FINISH_ACCEL 583ad43ddacSmrg#undef OUT_RELOC 584209ff23fSmrg 585209ff23fSmrg#ifdef XF86DRI 586209ff23fSmrg 587209ff23fSmrg#define ACCEL_CP 588209ff23fSmrg#define ACCEL_PREAMBLE() \ 589209ff23fSmrg RING_LOCALS; \ 590209ff23fSmrg RADEONCP_REFRESH(pScrn, info) 591209ff23fSmrg#define BEGIN_ACCEL(n) BEGIN_RING(2*(n)) 592209ff23fSmrg#define OUT_ACCEL_REG(reg, val) OUT_RING_REG(reg, val) 593209ff23fSmrg#define FINISH_ACCEL() ADVANCE_RING() 594ad43ddacSmrg#define OUT_RELOC(x, read, write) OUT_RING_RELOC(x, read, write) 595209ff23fSmrg 596209ff23fSmrg#define OUT_RING_F(x) OUT_RING(F_TO_DW(x)) 597209ff23fSmrg 598209ff23fSmrg#ifdef RENDER 599209ff23fSmrg#include "radeon_exa_render.c" 600209ff23fSmrg#endif 601209ff23fSmrg#include "radeon_exa_funcs.c" 602209ff23fSmrg 603b7e1c893Smrg#undef ACCEL_CP 604b7e1c893Smrg#undef ACCEL_PREAMBLE 605b7e1c893Smrg#undef BEGIN_ACCEL 606b7e1c893Smrg#undef OUT_ACCEL_REG 607b7e1c893Smrg#undef FINISH_ACCEL 608b7e1c893Smrg#undef OUT_RING_F 609b7e1c893Smrg 610209ff23fSmrg#endif /* XF86DRI */ 611209ff23fSmrg 612209ff23fSmrg/* 613209ff23fSmrg * Once screen->off_screen_base is set, this function 614209ff23fSmrg * allocates the remaining memory appropriately 615209ff23fSmrg */ 616209ff23fSmrgBool RADEONSetupMemEXA (ScreenPtr pScreen) 617209ff23fSmrg{ 618209ff23fSmrg ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum]; 619209ff23fSmrg RADEONInfoPtr info = RADEONPTR(pScrn); 620209ff23fSmrg xf86CrtcConfigPtr xf86_config = XF86_CRTC_CONFIG_PTR(pScrn); 621209ff23fSmrg int cpp = info->CurrentLayout.pixel_bytes; 622209ff23fSmrg int screen_size; 623209ff23fSmrg int byteStride = pScrn->displayWidth * cpp; 624209ff23fSmrg 625b7e1c893Smrg if (info->accel_state->exa != NULL) { 626209ff23fSmrg xf86DrvMsg(pScreen->myNum, X_ERROR, "Memory map already initialized\n"); 627209ff23fSmrg return FALSE; 628209ff23fSmrg } 629b7e1c893Smrg info->accel_state->exa = exaDriverAlloc(); 630b7e1c893Smrg if (info->accel_state->exa == NULL) 631209ff23fSmrg return FALSE; 632209ff23fSmrg 633209ff23fSmrg /* Need to adjust screen size for 16 line tiles, and then make it align to. 634209ff23fSmrg * the buffer alignment requirement. 635209ff23fSmrg */ 636209ff23fSmrg if (info->allowColorTiling) 637209ff23fSmrg screen_size = RADEON_ALIGN(pScrn->virtualY, 16) * byteStride; 638209ff23fSmrg else 639209ff23fSmrg screen_size = pScrn->virtualY * byteStride; 640209ff23fSmrg 641b7e1c893Smrg info->accel_state->exa->memoryBase = info->FB; 642b7e1c893Smrg info->accel_state->exa->memorySize = info->FbMapSize - info->FbSecureSize; 643b7e1c893Smrg info->accel_state->exa->offScreenBase = screen_size; 644209ff23fSmrg 645209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, "Allocating from a screen of %ld kb\n", 646b7e1c893Smrg info->accel_state->exa->memorySize / 1024); 647209ff23fSmrg 648209ff23fSmrg /* Reserve static area for hardware cursor */ 649209ff23fSmrg if (!xf86ReturnOptValBool(info->Options, OPTION_SW_CURSOR, FALSE)) { 650b7e1c893Smrg int cursor_size = 64 * 4 * 64; 651b7e1c893Smrg int align = IS_AVIVO_VARIANT ? 4096 : 256; 652b7e1c893Smrg int c; 653b7e1c893Smrg 654b7e1c893Smrg for (c = 0; c < xf86_config->num_crtc; c++) { 655b7e1c893Smrg xf86CrtcPtr crtc = xf86_config->crtc[c]; 656b7e1c893Smrg RADEONCrtcPrivatePtr radeon_crtc = crtc->driver_private; 657b7e1c893Smrg 658b7e1c893Smrg radeon_crtc->cursor_offset = 659b7e1c893Smrg RADEON_ALIGN(info->accel_state->exa->offScreenBase, align); 660b7e1c893Smrg info->accel_state->exa->offScreenBase = radeon_crtc->cursor_offset + cursor_size; 661b7e1c893Smrg 662b7e1c893Smrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, 663b7e1c893Smrg "Will use %d kb for hardware cursor %d at offset 0x%08x\n", 664b7e1c893Smrg (cursor_size * xf86_config->num_crtc) / 1024, 665b7e1c893Smrg c, 666b7e1c893Smrg (unsigned int)radeon_crtc->cursor_offset); 667b7e1c893Smrg } 668209ff23fSmrg } 669209ff23fSmrg 670209ff23fSmrg#if defined(XF86DRI) 671209ff23fSmrg if (info->directRenderingEnabled) { 672b7e1c893Smrg int depthCpp = (info->dri->depthBits - 8) / 4, l, next, depth_size; 673209ff23fSmrg 674b7e1c893Smrg info->dri->frontOffset = 0; 675b7e1c893Smrg info->dri->frontPitch = pScrn->displayWidth; 676209ff23fSmrg 677209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, 678209ff23fSmrg "Will use %d kb for front buffer at offset 0x%08x\n", 679b7e1c893Smrg screen_size / 1024, info->dri->frontOffset); 680209ff23fSmrg RADEONDRIAllocatePCIGARTTable(pScreen); 681209ff23fSmrg 682209ff23fSmrg if (info->cardType==CARD_PCIE) 683209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, 684209ff23fSmrg "Will use %d kb for PCI GART at offset 0x%08x\n", 685b7e1c893Smrg info->dri->pciGartSize / 1024, 686b7e1c893Smrg (int)info->dri->pciGartOffset); 687209ff23fSmrg 688209ff23fSmrg /* Reserve a static area for the back buffer the same size as the 689209ff23fSmrg * visible screen. XXX: This would be better initialized in ati_dri.c 690209ff23fSmrg * when GLX is set up, but the offscreen memory manager's allocations 691209ff23fSmrg * don't last through VT switches, while the kernel's understanding of 692209ff23fSmrg * offscreen locations does. 693209ff23fSmrg */ 694b7e1c893Smrg info->dri->backPitch = pScrn->displayWidth; 695ad43ddacSmrg next = RADEON_ALIGN(info->accel_state->exa->offScreenBase, RADEON_GPU_PAGE_SIZE); 696b7e1c893Smrg if (!info->dri->noBackBuffer && 697b7e1c893Smrg next + screen_size <= info->accel_state->exa->memorySize) 698209ff23fSmrg { 699b7e1c893Smrg info->dri->backOffset = next; 700b7e1c893Smrg info->accel_state->exa->offScreenBase = next + screen_size; 701209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, 702209ff23fSmrg "Will use %d kb for back buffer at offset 0x%08x\n", 703b7e1c893Smrg screen_size / 1024, info->dri->backOffset); 704209ff23fSmrg } 705209ff23fSmrg 706209ff23fSmrg /* Reserve the static depth buffer, and adjust pitch and height to 707209ff23fSmrg * handle tiling. 708209ff23fSmrg */ 709b7e1c893Smrg info->dri->depthPitch = RADEON_ALIGN(pScrn->displayWidth, 32); 710b7e1c893Smrg depth_size = RADEON_ALIGN(pScrn->virtualY, 16) * info->dri->depthPitch * depthCpp; 711ad43ddacSmrg next = RADEON_ALIGN(info->accel_state->exa->offScreenBase, RADEON_GPU_PAGE_SIZE); 712b7e1c893Smrg if (next + depth_size <= info->accel_state->exa->memorySize) 713209ff23fSmrg { 714b7e1c893Smrg info->dri->depthOffset = next; 715b7e1c893Smrg info->accel_state->exa->offScreenBase = next + depth_size; 716209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, 717209ff23fSmrg "Will use %d kb for depth buffer at offset 0x%08x\n", 718b7e1c893Smrg depth_size / 1024, info->dri->depthOffset); 719209ff23fSmrg } 720209ff23fSmrg 721b7e1c893Smrg info->dri->textureSize *= (info->accel_state->exa->memorySize - 722b7e1c893Smrg info->accel_state->exa->offScreenBase) / 100; 723209ff23fSmrg 724b7e1c893Smrg l = RADEONLog2(info->dri->textureSize / RADEON_NR_TEX_REGIONS); 725209ff23fSmrg if (l < RADEON_LOG_TEX_GRANULARITY) 726209ff23fSmrg l = RADEON_LOG_TEX_GRANULARITY; 727b7e1c893Smrg info->dri->textureSize = (info->dri->textureSize >> l) << l; 728b7e1c893Smrg if (info->dri->textureSize >= 512 * 1024) { 729b7e1c893Smrg info->dri->textureOffset = info->accel_state->exa->offScreenBase; 730b7e1c893Smrg info->accel_state->exa->offScreenBase += info->dri->textureSize; 731209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, 732209ff23fSmrg "Will use %d kb for textures at offset 0x%08x\n", 733b7e1c893Smrg info->dri->textureSize / 1024, info->dri->textureOffset); 734209ff23fSmrg } else { 735209ff23fSmrg /* Minimum texture size is for 2 256x256x32bpp textures */ 736b7e1c893Smrg info->dri->textureSize = 0; 737209ff23fSmrg } 738209ff23fSmrg } else 739209ff23fSmrg#endif /* XF86DRI */ 740209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, 741209ff23fSmrg "Will use %d kb for front buffer at offset 0x%08x\n", 742209ff23fSmrg screen_size / 1024, 0); 743209ff23fSmrg 744209ff23fSmrg xf86DrvMsg(pScrn->scrnIndex, X_INFO, 745209ff23fSmrg "Will use %ld kb for X Server offscreen at offset 0x%08lx\n", 746b7e1c893Smrg (info->accel_state->exa->memorySize - info->accel_state->exa->offScreenBase) / 747b7e1c893Smrg 1024, info->accel_state->exa->offScreenBase); 748209ff23fSmrg 749209ff23fSmrg return TRUE; 750209ff23fSmrg} 751209ff23fSmrg 752209ff23fSmrg#ifdef XF86DRI 753209ff23fSmrg 754209ff23fSmrg#ifndef ExaOffscreenMarkUsed 755209ff23fSmrgextern void ExaOffscreenMarkUsed(PixmapPtr); 756209ff23fSmrg#endif 757209ff23fSmrg 758209ff23fSmrgunsigned long long 759209ff23fSmrgRADEONTexOffsetStart(PixmapPtr pPix) 760209ff23fSmrg{ 761b7e1c893Smrg RINFO_FROM_SCREEN(pPix->drawable.pScreen); 762b7e1c893Smrg unsigned long long offset; 763ad43ddacSmrg 764ad43ddacSmrg if (exaGetPixmapDriverPrivate(pPix)) 765ad43ddacSmrg return -1; 766ad43ddacSmrg 767209ff23fSmrg exaMoveInPixmap(pPix); 768209ff23fSmrg ExaOffscreenMarkUsed(pPix); 769209ff23fSmrg 770b7e1c893Smrg offset = exaGetPixmapOffset(pPix); 771b7e1c893Smrg 772b7e1c893Smrg if (offset > info->FbMapSize) 773b7e1c893Smrg return ~0ULL; 774b7e1c893Smrg else 775b7e1c893Smrg return info->fbLocation + offset; 776209ff23fSmrg} 777209ff23fSmrg#endif 778