radeon_exa.c revision 921a55d8
1209ff23fSmrg/*
2209ff23fSmrg * Copyright 2005 Eric Anholt
3209ff23fSmrg * Copyright 2005 Benjamin Herrenschmidt
4209ff23fSmrg * All Rights Reserved.
5209ff23fSmrg *
6209ff23fSmrg * Permission is hereby granted, free of charge, to any person obtaining a
7209ff23fSmrg * copy of this software and associated documentation files (the "Software"),
8209ff23fSmrg * to deal in the Software without restriction, including without limitation
9209ff23fSmrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10209ff23fSmrg * and/or sell copies of the Software, and to permit persons to whom the
11209ff23fSmrg * Software is furnished to do so, subject to the following conditions:
12209ff23fSmrg *
13209ff23fSmrg * The above copyright notice and this permission notice (including the next
14209ff23fSmrg * paragraph) shall be included in all copies or substantial portions of the
15209ff23fSmrg * Software.
16209ff23fSmrg *
17209ff23fSmrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18209ff23fSmrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19209ff23fSmrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
20209ff23fSmrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21209ff23fSmrg * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22209ff23fSmrg * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23209ff23fSmrg * SOFTWARE.
24209ff23fSmrg *
25209ff23fSmrg * Authors:
26209ff23fSmrg *    Eric Anholt <anholt@FreeBSD.org>
27209ff23fSmrg *    Zack Rusin <zrusin@trolltech.com>
28209ff23fSmrg *    Benjamin Herrenschmidt <benh@kernel.crashing.org>
29209ff23fSmrg *
30209ff23fSmrg */
31209ff23fSmrg
32209ff23fSmrg#ifdef HAVE_CONFIG_H
33209ff23fSmrg#include "config.h"
34209ff23fSmrg#endif
35209ff23fSmrg
36209ff23fSmrg#include "radeon.h"
37209ff23fSmrg#include "radeon_reg.h"
38b7e1c893Smrg#include "r600_reg.h"
39209ff23fSmrg#ifdef XF86DRI
40b7e1c893Smrg#include "radeon_drm.h"
41209ff23fSmrg#endif
42209ff23fSmrg#include "radeon_macros.h"
43209ff23fSmrg#include "radeon_probe.h"
44209ff23fSmrg#include "radeon_version.h"
450974d292Smrg#include "radeon_exa_shared.h"
46209ff23fSmrg
47209ff23fSmrg#include "xf86.h"
48209ff23fSmrg
49209ff23fSmrg
50209ff23fSmrg/***********************************************************************/
51209ff23fSmrg#define RINFO_FROM_SCREEN(pScr) ScrnInfoPtr pScrn =  xf86Screens[pScr->myNum]; \
52209ff23fSmrg    RADEONInfoPtr info   = RADEONPTR(pScrn)
53209ff23fSmrg
54209ff23fSmrgstatic struct {
55209ff23fSmrg    int rop;
56209ff23fSmrg    int pattern;
57209ff23fSmrg} RADEON_ROP[] = {
58209ff23fSmrg    { RADEON_ROP3_ZERO, RADEON_ROP3_ZERO }, /* GXclear        */
59209ff23fSmrg    { RADEON_ROP3_DSa,  RADEON_ROP3_DPa  }, /* Gxand          */
60209ff23fSmrg    { RADEON_ROP3_SDna, RADEON_ROP3_PDna }, /* GXandReverse   */
61209ff23fSmrg    { RADEON_ROP3_S,    RADEON_ROP3_P    }, /* GXcopy         */
62209ff23fSmrg    { RADEON_ROP3_DSna, RADEON_ROP3_DPna }, /* GXandInverted  */
63209ff23fSmrg    { RADEON_ROP3_D,    RADEON_ROP3_D    }, /* GXnoop         */
64209ff23fSmrg    { RADEON_ROP3_DSx,  RADEON_ROP3_DPx  }, /* GXxor          */
65209ff23fSmrg    { RADEON_ROP3_DSo,  RADEON_ROP3_DPo  }, /* GXor           */
66209ff23fSmrg    { RADEON_ROP3_DSon, RADEON_ROP3_DPon }, /* GXnor          */
67209ff23fSmrg    { RADEON_ROP3_DSxn, RADEON_ROP3_PDxn }, /* GXequiv        */
68209ff23fSmrg    { RADEON_ROP3_Dn,   RADEON_ROP3_Dn   }, /* GXinvert       */
69209ff23fSmrg    { RADEON_ROP3_SDno, RADEON_ROP3_PDno }, /* GXorReverse    */
70209ff23fSmrg    { RADEON_ROP3_Sn,   RADEON_ROP3_Pn   }, /* GXcopyInverted */
71209ff23fSmrg    { RADEON_ROP3_DSno, RADEON_ROP3_DPno }, /* GXorInverted   */
72209ff23fSmrg    { RADEON_ROP3_DSan, RADEON_ROP3_DPan }, /* GXnand         */
73209ff23fSmrg    { RADEON_ROP3_ONE,  RADEON_ROP3_ONE  }  /* GXset          */
74209ff23fSmrg};
75209ff23fSmrg
76209ff23fSmrg/* Compute log base 2 of val. */
77209ff23fSmrgstatic __inline__ int
78209ff23fSmrgRADEONLog2(int val)
79209ff23fSmrg{
80209ff23fSmrg	int bits;
81209ff23fSmrg#if (defined __i386__ || defined __x86_64__) && (defined __GNUC__)
82209ff23fSmrg	__asm volatile("bsrl	%1, %0"
83209ff23fSmrg		: "=r" (bits)
84209ff23fSmrg		: "c" (val)
85209ff23fSmrg	);
86209ff23fSmrg	return bits;
87209ff23fSmrg#else
88209ff23fSmrg	for (bits = 0; val != 0; val >>= 1, ++bits)
89209ff23fSmrg		;
90209ff23fSmrg	return bits - 1;
91209ff23fSmrg#endif
92209ff23fSmrg}
93209ff23fSmrg
94209ff23fSmrgstatic __inline__ uint32_t F_TO_DW(float val)
95209ff23fSmrg{
96209ff23fSmrg    union {
97209ff23fSmrg	float f;
98209ff23fSmrg	uint32_t l;
99209ff23fSmrg    } tmp;
100209ff23fSmrg    tmp.f = val;
101209ff23fSmrg    return tmp.l;
102209ff23fSmrg}
103209ff23fSmrg
104ad43ddacSmrg
105209ff23fSmrg/* Assumes that depth 15 and 16 can be used as depth 16, which is okay since we
106209ff23fSmrg * require src and dest datatypes to be equal.
107209ff23fSmrg */
108209ff23fSmrgBool RADEONGetDatatypeBpp(int bpp, uint32_t *type)
109209ff23fSmrg{
110209ff23fSmrg	switch (bpp) {
111209ff23fSmrg	case 8:
112209ff23fSmrg		*type = ATI_DATATYPE_CI8;
113209ff23fSmrg		return TRUE;
114209ff23fSmrg	case 16:
115209ff23fSmrg		*type = ATI_DATATYPE_RGB565;
116209ff23fSmrg		return TRUE;
117209ff23fSmrg	case 24:
118209ff23fSmrg		*type = ATI_DATATYPE_CI8;
119209ff23fSmrg		return TRUE;
120209ff23fSmrg	case 32:
121209ff23fSmrg		*type = ATI_DATATYPE_ARGB8888;
122209ff23fSmrg		return TRUE;
123209ff23fSmrg	default:
124209ff23fSmrg		RADEON_FALLBACK(("Unsupported bpp: %d\n", bpp));
125209ff23fSmrg		return FALSE;
126209ff23fSmrg	}
127209ff23fSmrg}
128209ff23fSmrg
129209ff23fSmrgstatic Bool RADEONPixmapIsColortiled(PixmapPtr pPix)
130209ff23fSmrg{
131209ff23fSmrg    RINFO_FROM_SCREEN(pPix->drawable.pScreen);
132209ff23fSmrg
133209ff23fSmrg    /* This doesn't account for the back buffer, which we may want to wrap in
134209ff23fSmrg     * a pixmap at some point for the purposes of DRI buffer moves.
135209ff23fSmrg     */
136209ff23fSmrg    if (info->tilingEnabled && exaGetPixmapOffset(pPix) == 0)
137209ff23fSmrg	return TRUE;
138209ff23fSmrg    else
139209ff23fSmrg	return FALSE;
140209ff23fSmrg}
141209ff23fSmrg
142209ff23fSmrgstatic Bool RADEONGetOffsetPitch(PixmapPtr pPix, int bpp, uint32_t *pitch_offset,
143209ff23fSmrg				 unsigned int offset, unsigned int pitch)
144209ff23fSmrg{
145209ff23fSmrg	RINFO_FROM_SCREEN(pPix->drawable.pScreen);
146209ff23fSmrg
147b7e1c893Smrg	if (pitch > 16320 || pitch % info->accel_state->exa->pixmapPitchAlign != 0)
148209ff23fSmrg		RADEON_FALLBACK(("Bad pitch 0x%08x\n", pitch));
149209ff23fSmrg
150b7e1c893Smrg	if (offset % info->accel_state->exa->pixmapOffsetAlign != 0)
151209ff23fSmrg		RADEON_FALLBACK(("Bad offset 0x%08x\n", offset));
152209ff23fSmrg
153209ff23fSmrg	pitch = pitch >> 6;
154209ff23fSmrg	*pitch_offset = (pitch << 22) | (offset >> 10);
155209ff23fSmrg
156209ff23fSmrg	/* If it's the front buffer, we've got to note that it's tiled? */
157209ff23fSmrg	if (RADEONPixmapIsColortiled(pPix))
158209ff23fSmrg		*pitch_offset |= RADEON_DST_TILE_MACRO;
159209ff23fSmrg	return TRUE;
160209ff23fSmrg}
161209ff23fSmrg
162209ff23fSmrgBool RADEONGetPixmapOffsetPitch(PixmapPtr pPix, uint32_t *pitch_offset)
163209ff23fSmrg{
164209ff23fSmrg	uint32_t pitch, offset;
165209ff23fSmrg	int bpp;
166209ff23fSmrg
167209ff23fSmrg	bpp = pPix->drawable.bitsPerPixel;
168209ff23fSmrg	if (bpp == 24)
169209ff23fSmrg		bpp = 8;
170209ff23fSmrg
171ad43ddacSmrg	offset = radeonGetPixmapOffset(pPix);
172209ff23fSmrg	pitch = exaGetPixmapPitch(pPix);
173209ff23fSmrg
174209ff23fSmrg	return RADEONGetOffsetPitch(pPix, bpp, pitch_offset, offset, pitch);
175209ff23fSmrg}
176209ff23fSmrg
177921a55d8Smrg/**
178921a55d8Smrg * Returns whether the provided transform is affine.
179921a55d8Smrg *
180921a55d8Smrg * transform may be null.
181921a55d8Smrg */
182921a55d8SmrgBool radeon_transform_is_affine(PictTransformPtr t)
183921a55d8Smrg{
184921a55d8Smrg	if (t == NULL)
185921a55d8Smrg		return TRUE;
186921a55d8Smrg	return t->matrix[2][0] == 0 && t->matrix[2][1] == 0;
187921a55d8Smrg}
188921a55d8Smrg
189209ff23fSmrg#if X_BYTE_ORDER == X_BIG_ENDIAN
190209ff23fSmrg
191b7e1c893Smrgstatic unsigned long swapper_surfaces[6];
192209ff23fSmrg
193ad43ddacSmrgstatic Bool RADEONPrepareAccess_BE(PixmapPtr pPix, int index)
194209ff23fSmrg{
195209ff23fSmrg    RINFO_FROM_SCREEN(pPix->drawable.pScreen);
196209ff23fSmrg    unsigned char *RADEONMMIO = info->MMIO;
197209ff23fSmrg    uint32_t offset = exaGetPixmapOffset(pPix);
198209ff23fSmrg    int bpp, soff;
199209ff23fSmrg    uint32_t size, flags;
200209ff23fSmrg
201209ff23fSmrg    /* Front buffer is always set with proper swappers */
202209ff23fSmrg    if (offset == 0)
203209ff23fSmrg        return TRUE;
204209ff23fSmrg
205209ff23fSmrg    /* If same bpp as front buffer, just do nothing as the main
206209ff23fSmrg     * swappers will apply
207209ff23fSmrg     */
208209ff23fSmrg    bpp = pPix->drawable.bitsPerPixel;
209209ff23fSmrg    if (bpp == pScrn->bitsPerPixel)
210209ff23fSmrg        return TRUE;
211209ff23fSmrg
212209ff23fSmrg    /* We need to setup a separate swapper, let's request a
213209ff23fSmrg     * surface. We need to align the size first
214209ff23fSmrg     */
215209ff23fSmrg    size = exaGetPixmapSize(pPix);
216ad43ddacSmrg    size = RADEON_ALIGN(size, RADEON_GPU_PAGE_SIZE);
217209ff23fSmrg
218209ff23fSmrg    /* Set surface to tiling disabled with appropriate swapper */
219209ff23fSmrg    switch (bpp) {
220209ff23fSmrg    case 16:
221209ff23fSmrg        flags = RADEON_SURF_AP0_SWP_16BPP | RADEON_SURF_AP1_SWP_16BPP;
222209ff23fSmrg	break;
223209ff23fSmrg    case 32:
224209ff23fSmrg        flags = RADEON_SURF_AP0_SWP_32BPP | RADEON_SURF_AP1_SWP_32BPP;
225209ff23fSmrg	break;
226209ff23fSmrg    default:
227209ff23fSmrg        flags = 0;
228209ff23fSmrg    }
229209ff23fSmrg#if defined(XF86DRI)
230209ff23fSmrg    if (info->directRenderingEnabled && info->allowColorTiling) {
231b7e1c893Smrg	struct drm_radeon_surface_alloc drmsurfalloc;
232209ff23fSmrg	int rc;
233209ff23fSmrg
234209ff23fSmrg        drmsurfalloc.address = offset;
235209ff23fSmrg        drmsurfalloc.size = size;
236209ff23fSmrg	drmsurfalloc.flags = flags | 1; /* bogus pitch to please DRM */
237209ff23fSmrg
238b7e1c893Smrg        rc = drmCommandWrite(info->dri->drmFD, DRM_RADEON_SURF_ALLOC,
239209ff23fSmrg			     &drmsurfalloc, sizeof(drmsurfalloc));
240209ff23fSmrg	if (rc < 0) {
241209ff23fSmrg	    xf86DrvMsg(pScrn->scrnIndex, X_ERROR,
242209ff23fSmrg		       "drm: could not allocate surface for access"
243209ff23fSmrg		       " swapper, err: %d!\n", rc);
244209ff23fSmrg	    return FALSE;
245209ff23fSmrg	}
246209ff23fSmrg	swapper_surfaces[index] = offset;
247209ff23fSmrg
248209ff23fSmrg	return TRUE;
249209ff23fSmrg    }
250209ff23fSmrg#endif
251209ff23fSmrg    soff = (index + 1) * 0x10;
252209ff23fSmrg    OUTREG(RADEON_SURFACE0_INFO + soff, flags);
253209ff23fSmrg    OUTREG(RADEON_SURFACE0_LOWER_BOUND + soff, offset);
254209ff23fSmrg    OUTREG(RADEON_SURFACE0_UPPER_BOUND + soff, offset + size - 1);
255209ff23fSmrg    swapper_surfaces[index] = offset;
256209ff23fSmrg    return TRUE;
257209ff23fSmrg}
258209ff23fSmrg
259ad43ddacSmrgstatic void RADEONFinishAccess_BE(PixmapPtr pPix, int index)
260209ff23fSmrg{
261209ff23fSmrg    RINFO_FROM_SCREEN(pPix->drawable.pScreen);
262209ff23fSmrg    unsigned char *RADEONMMIO = info->MMIO;
263209ff23fSmrg    uint32_t offset = exaGetPixmapOffset(pPix);
264209ff23fSmrg    int soff;
265209ff23fSmrg
266209ff23fSmrg    /* Front buffer is always set with proper swappers */
267209ff23fSmrg    if (offset == 0)
268209ff23fSmrg        return;
269209ff23fSmrg
270209ff23fSmrg    if (swapper_surfaces[index] == 0)
271209ff23fSmrg        return;
272209ff23fSmrg#if defined(XF86DRI)
273209ff23fSmrg    if (info->directRenderingEnabled && info->allowColorTiling) {
274b7e1c893Smrg	struct drm_radeon_surface_free drmsurffree;
275209ff23fSmrg
276209ff23fSmrg	drmsurffree.address = offset;
277b7e1c893Smrg	drmCommandWrite(info->dri->drmFD, DRM_RADEON_SURF_FREE,
278209ff23fSmrg			&drmsurffree, sizeof(drmsurffree));
279209ff23fSmrg	swapper_surfaces[index] = 0;
280209ff23fSmrg	return;
281209ff23fSmrg    }
282209ff23fSmrg#endif
283209ff23fSmrg    soff = (index + 1) * 0x10;
284209ff23fSmrg    OUTREG(RADEON_SURFACE0_INFO + soff, 0);
285209ff23fSmrg    OUTREG(RADEON_SURFACE0_LOWER_BOUND + soff, 0);
286209ff23fSmrg    OUTREG(RADEON_SURFACE0_UPPER_BOUND + soff, 0);
287209ff23fSmrg    swapper_surfaces[index] = 0;
288209ff23fSmrg}
289209ff23fSmrg
290209ff23fSmrg#endif /* X_BYTE_ORDER == X_BIG_ENDIAN */
291209ff23fSmrg
292ad43ddacSmrg#ifdef XF86DRM_MODE
293ad43ddacSmrgBool RADEONPrepareAccess_CS(PixmapPtr pPix, int index)
294ad43ddacSmrg{
295ad43ddacSmrg    ScreenPtr pScreen = pPix->drawable.pScreen;
296ad43ddacSmrg    ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum];
297ad43ddacSmrg    RADEONInfoPtr info = RADEONPTR(pScrn);
298ad43ddacSmrg    struct radeon_exa_pixmap_priv *driver_priv;
2990974d292Smrg    uint32_t possible_domains = ~0U;
3000974d292Smrg    uint32_t current_domain = 0;
3010974d292Smrg#ifdef EXA_MIXED_PIXMAPS
3020974d292Smrg    Bool can_fail = !(pPix->drawable.bitsPerPixel < 8) &&
3030974d292Smrg	pPix != pScreen->GetScreenPixmap(pScreen) &&
3040974d292Smrg        (info->accel_state->exa->flags & EXA_MIXED_PIXMAPS);
3050974d292Smrg#else
3060974d292Smrg    Bool can_fail = FALSE;
3070974d292Smrg#endif
3080974d292Smrg    Bool flush = FALSE;
309ad43ddacSmrg    int ret;
310921a55d8Smrg    uint32_t tiling_flags = 0, pitch = 0;
311ad43ddacSmrg
312ad43ddacSmrg#if X_BYTE_ORDER == X_BIG_ENDIAN
313ad43ddacSmrg    /* May need to handle byte swapping in DownloadFrom/UploadToScreen */
3140974d292Smrg    if (can_fail && pPix->drawable.bitsPerPixel > 8)
315ad43ddacSmrg	return FALSE;
316ad43ddacSmrg#endif
317ad43ddacSmrg
318ad43ddacSmrg    driver_priv = exaGetPixmapDriverPrivate(pPix);
319ad43ddacSmrg    if (!driver_priv)
320ad43ddacSmrg      return FALSE;
321ad43ddacSmrg
322921a55d8Smrg    /* check if we are tiled */
323921a55d8Smrg    ret = radeon_bo_get_tiling(driver_priv->bo, &tiling_flags, &pitch);
324921a55d8Smrg    if (ret)
325921a55d8Smrg	return FALSE;
326921a55d8Smrg    /* untile in DFS/UTS */
327921a55d8Smrg    if (tiling_flags & (RADEON_TILING_MACRO | RADEON_TILING_MICRO))
328921a55d8Smrg	return FALSE;
329921a55d8Smrg
330ad43ddacSmrg    /* if we have more refs than just the BO then flush */
3310974d292Smrg    if (radeon_bo_is_referenced_by_cs(driver_priv->bo, info->cs)) {
3320974d292Smrg	flush = TRUE;
3330974d292Smrg
3340974d292Smrg	if (can_fail) {
3350974d292Smrg	    possible_domains = radeon_bo_get_src_domain(driver_priv->bo);
3360974d292Smrg	    if (possible_domains == RADEON_GEM_DOMAIN_VRAM)
3370974d292Smrg		return FALSE; /* use DownloadFromScreen */
3380974d292Smrg	}
3390974d292Smrg    }
3400974d292Smrg
3410974d292Smrg    /* if the BO might end up in VRAM, prefer DownloadFromScreen */
3420974d292Smrg    if (can_fail && (possible_domains & RADEON_GEM_DOMAIN_VRAM)) {
3430974d292Smrg	radeon_bo_is_busy(driver_priv->bo, &current_domain);
3440974d292Smrg
3450974d292Smrg	if (current_domain & possible_domains) {
3460974d292Smrg	    if (current_domain == RADEON_GEM_DOMAIN_VRAM)
3470974d292Smrg		return FALSE;
3480974d292Smrg	} else if (possible_domains & RADEON_GEM_DOMAIN_VRAM)
3490974d292Smrg	    return FALSE;
3500974d292Smrg    }
3510974d292Smrg
3520974d292Smrg    if (flush)
353ad43ddacSmrg        radeon_cs_flush_indirect(pScrn);
354ad43ddacSmrg
355ad43ddacSmrg    /* flush IB */
356ad43ddacSmrg    ret = radeon_bo_map(driver_priv->bo, 1);
357ad43ddacSmrg    if (ret) {
358ad43ddacSmrg      FatalError("failed to map pixmap %d\n", ret);
359ad43ddacSmrg      return FALSE;
360ad43ddacSmrg    }
361ad43ddacSmrg    driver_priv->bo_mapped = TRUE;
362ad43ddacSmrg
363ad43ddacSmrg    pPix->devPrivate.ptr = driver_priv->bo->ptr;
364ad43ddacSmrg
365ad43ddacSmrg    return TRUE;
366ad43ddacSmrg}
367ad43ddacSmrg
368ad43ddacSmrgvoid RADEONFinishAccess_CS(PixmapPtr pPix, int index)
369ad43ddacSmrg{
370ad43ddacSmrg    struct radeon_exa_pixmap_priv *driver_priv;
371ad43ddacSmrg
372ad43ddacSmrg    driver_priv = exaGetPixmapDriverPrivate(pPix);
373ad43ddacSmrg    if (!driver_priv || !driver_priv->bo_mapped)
374ad43ddacSmrg        return;
375ad43ddacSmrg
376ad43ddacSmrg    radeon_bo_unmap(driver_priv->bo);
3770974d292Smrg    driver_priv->bo_mapped = FALSE;
378ad43ddacSmrg    pPix->devPrivate.ptr = NULL;
379ad43ddacSmrg}
380ad43ddacSmrg
381ad43ddacSmrg
382ad43ddacSmrgvoid *RADEONEXACreatePixmap(ScreenPtr pScreen, int size, int align)
383ad43ddacSmrg{
384ad43ddacSmrg    ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum];
385ad43ddacSmrg    RADEONInfoPtr info = RADEONPTR(pScrn);
386ad43ddacSmrg    struct radeon_exa_pixmap_priv *new_priv;
387ad43ddacSmrg
388ad43ddacSmrg#ifdef EXA_MIXED_PIXMAPS
389ad43ddacSmrg    if (info->accel_state->exa->flags & EXA_MIXED_PIXMAPS) {
390ad43ddacSmrg        if (size != 0 && !info->exa_force_create &&
391ad43ddacSmrg	    info->exa_pixmaps == FALSE)
392ad43ddacSmrg            return NULL;
393ad43ddacSmrg    }
394ad43ddacSmrg#endif
395ad43ddacSmrg
3962f39173dSmrg    new_priv = calloc(1, sizeof(struct radeon_exa_pixmap_priv));
397ad43ddacSmrg    if (!new_priv)
398ad43ddacSmrg	return NULL;
399ad43ddacSmrg
400ad43ddacSmrg    if (size == 0)
401ad43ddacSmrg	return new_priv;
402ad43ddacSmrg
403ad43ddacSmrg    new_priv->bo = radeon_bo_open(info->bufmgr, 0, size, align,
404ad43ddacSmrg				  RADEON_GEM_DOMAIN_VRAM, 0);
405ad43ddacSmrg    if (!new_priv->bo) {
4062f39173dSmrg	free(new_priv);
407ad43ddacSmrg	ErrorF("Failed to alloc memory\n");
408ad43ddacSmrg	return NULL;
409ad43ddacSmrg    }
410ad43ddacSmrg
411ad43ddacSmrg    return new_priv;
412ad43ddacSmrg
413ad43ddacSmrg}
414ad43ddacSmrg
4152f39173dSmrgstatic const unsigned MicroBlockTable[5][3][2] = {
4162f39173dSmrg    /*linear  tiled   square-tiled */
4172f39173dSmrg    {{32, 1}, {8, 4}, {0, 0}}, /*   8 bits per pixel */
4182f39173dSmrg    {{16, 1}, {8, 2}, {4, 4}}, /*  16 bits per pixel */
4192f39173dSmrg    {{ 8, 1}, {4, 2}, {0, 0}}, /*  32 bits per pixel */
4202f39173dSmrg    {{ 4, 1}, {0, 0}, {2, 2}}, /*  64 bits per pixel */
4212f39173dSmrg    {{ 2, 1}, {0, 0}, {0, 0}}  /* 128 bits per pixel */
4222f39173dSmrg};
4232f39173dSmrg
4242f39173dSmrg/* Return true if macrotiling can be enabled */
4252f39173dSmrgstatic Bool RADEONMacroSwitch(int width, int height, int bpp,
4262f39173dSmrg                              uint32_t flags, Bool rv350_mode)
4272f39173dSmrg{
4282f39173dSmrg    unsigned tilew, tileh, microtiled, logbpp;
4292f39173dSmrg
4302f39173dSmrg    logbpp = RADEONLog2(bpp / 8);
4312f39173dSmrg    if (logbpp > 4)
4322f39173dSmrg        return 0;
4332f39173dSmrg
4342f39173dSmrg    microtiled = !!(flags & RADEON_TILING_MICRO);
4352f39173dSmrg    tilew = MicroBlockTable[logbpp][microtiled][0] * 8;
4362f39173dSmrg    tileh = MicroBlockTable[logbpp][microtiled][1] * 8;
4372f39173dSmrg
4382f39173dSmrg    /* See TX_FILTER1_n.MACRO_SWITCH. */
4392f39173dSmrg    if (rv350_mode) {
4402f39173dSmrg        return width >= tilew && height >= tileh;
4412f39173dSmrg    } else {
4422f39173dSmrg        return width > tilew && height > tileh;
4432f39173dSmrg    }
4442f39173dSmrg}
4452f39173dSmrg
446ad43ddacSmrgvoid *RADEONEXACreatePixmap2(ScreenPtr pScreen, int width, int height,
447ad43ddacSmrg			     int depth, int usage_hint, int bitsPerPixel,
448ad43ddacSmrg			     int *new_pitch)
449ad43ddacSmrg{
450ad43ddacSmrg    ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum];
451ad43ddacSmrg    RADEONInfoPtr info = RADEONPTR(pScrn);
452ad43ddacSmrg    struct radeon_exa_pixmap_priv *new_priv;
453921a55d8Smrg    int pitch, base_align;
454ad43ddacSmrg    uint32_t size;
455ad43ddacSmrg    uint32_t tiling = 0;
456921a55d8Smrg    int cpp = bitsPerPixel / 8;
457ad43ddacSmrg
458ad43ddacSmrg#ifdef EXA_MIXED_PIXMAPS
459ad43ddacSmrg    if (info->accel_state->exa->flags & EXA_MIXED_PIXMAPS) {
460ad43ddacSmrg	if (width != 0 && height != 0 && !info->exa_force_create &&
461ad43ddacSmrg	    info->exa_pixmaps == FALSE)
462ad43ddacSmrg            return NULL;
463ad43ddacSmrg    }
464ad43ddacSmrg#endif
465ad43ddacSmrg
466ad43ddacSmrg    if (usage_hint) {
467ad43ddacSmrg	if (info->allowColorTiling) {
468ad43ddacSmrg    	    if (usage_hint & RADEON_CREATE_PIXMAP_TILING_MACRO)
469ad43ddacSmrg 	   	tiling |= RADEON_TILING_MACRO;
470ad43ddacSmrg    	    if (usage_hint & RADEON_CREATE_PIXMAP_TILING_MICRO)
471ad43ddacSmrg                tiling |= RADEON_TILING_MICRO;
472ad43ddacSmrg	}
473ad43ddacSmrg    }
474ad43ddacSmrg
4752f39173dSmrg    /* Small pixmaps must not be macrotiled on R300, hw cannot sample them
4762f39173dSmrg     * correctly because samplers automatically switch to macrolinear. */
4772f39173dSmrg    if (info->ChipFamily >= CHIP_FAMILY_R300 &&
4782f39173dSmrg        info->ChipFamily <= CHIP_FAMILY_RS740 &&
4792f39173dSmrg        (tiling & RADEON_TILING_MACRO) &&
4802f39173dSmrg        !RADEONMacroSwitch(width, height, bitsPerPixel, tiling,
4812f39173dSmrg                           info->ChipFamily >= CHIP_FAMILY_RV350)) {
4822f39173dSmrg        tiling &= ~RADEON_TILING_MACRO;
4832f39173dSmrg    }
4842f39173dSmrg
485921a55d8Smrg    height = RADEON_ALIGN(height, drmmode_get_height_align(pScrn, tiling));
486921a55d8Smrg    pitch = RADEON_ALIGN(width, drmmode_get_pitch_align(pScrn, cpp, tiling)) * cpp;
487921a55d8Smrg    base_align = drmmode_get_base_align(pScrn, cpp, tiling);
488921a55d8Smrg    size = RADEON_ALIGN(height * pitch, RADEON_GPU_PAGE_SIZE);
489ad43ddacSmrg
4902f39173dSmrg    new_priv = calloc(1, sizeof(struct radeon_exa_pixmap_priv));
491ad43ddacSmrg    if (!new_priv)
492ad43ddacSmrg	return NULL;
493ad43ddacSmrg
494ad43ddacSmrg    if (size == 0)
495ad43ddacSmrg	return new_priv;
496ad43ddacSmrg
497921a55d8Smrg    *new_pitch = pitch;
498ad43ddacSmrg
499921a55d8Smrg    new_priv->bo = radeon_bo_open(info->bufmgr, 0, size, base_align,
500ad43ddacSmrg				  RADEON_GEM_DOMAIN_VRAM, 0);
501ad43ddacSmrg    if (!new_priv->bo) {
5022f39173dSmrg	free(new_priv);
503ad43ddacSmrg	ErrorF("Failed to alloc memory\n");
504ad43ddacSmrg	return NULL;
505ad43ddacSmrg    }
506ad43ddacSmrg
507ad43ddacSmrg    if (tiling)
508ad43ddacSmrg	radeon_bo_set_tiling(new_priv->bo, tiling, *new_pitch);
509ad43ddacSmrg
510ad43ddacSmrg    return new_priv;
511ad43ddacSmrg}
512ad43ddacSmrg
513ad43ddacSmrgvoid RADEONEXADestroyPixmap(ScreenPtr pScreen, void *driverPriv)
514ad43ddacSmrg{
515ad43ddacSmrg    struct radeon_exa_pixmap_priv *driver_priv = driverPriv;
516ad43ddacSmrg
517ad43ddacSmrg    if (!driverPriv)
518ad43ddacSmrg      return;
519ad43ddacSmrg
520ad43ddacSmrg    if (driver_priv->bo)
521ad43ddacSmrg	radeon_bo_unref(driver_priv->bo);
5222f39173dSmrg    free(driverPriv);
523ad43ddacSmrg}
524ad43ddacSmrg
525ad43ddacSmrgstruct radeon_bo *radeon_get_pixmap_bo(PixmapPtr pPix)
526ad43ddacSmrg{
527ad43ddacSmrg    struct radeon_exa_pixmap_priv *driver_priv;
528ad43ddacSmrg    driver_priv = exaGetPixmapDriverPrivate(pPix);
529ad43ddacSmrg    return driver_priv->bo;
530ad43ddacSmrg}
531ad43ddacSmrg
532ad43ddacSmrgvoid radeon_set_pixmap_bo(PixmapPtr pPix, struct radeon_bo *bo)
533ad43ddacSmrg{
534ad43ddacSmrg    struct radeon_exa_pixmap_priv *driver_priv;
535ad43ddacSmrg
536ad43ddacSmrg    driver_priv = exaGetPixmapDriverPrivate(pPix);
537ad43ddacSmrg    if (driver_priv) {
538ad43ddacSmrg	if (driver_priv->bo)
539ad43ddacSmrg	    radeon_bo_unref(driver_priv->bo);
540ad43ddacSmrg
541ad43ddacSmrg	radeon_bo_ref(bo);
542ad43ddacSmrg	driver_priv->bo = bo;
543ad43ddacSmrg    }
544ad43ddacSmrg}
545ad43ddacSmrg
546ad43ddacSmrgBool RADEONEXAPixmapIsOffscreen(PixmapPtr pPix)
547ad43ddacSmrg{
548ad43ddacSmrg    struct radeon_exa_pixmap_priv *driver_priv;
549ad43ddacSmrg
550ad43ddacSmrg    driver_priv = exaGetPixmapDriverPrivate(pPix);
551ad43ddacSmrg
552ad43ddacSmrg    if (!driver_priv)
553ad43ddacSmrg       return FALSE;
554ad43ddacSmrg    if (driver_priv->bo)
555ad43ddacSmrg       return TRUE;
556ad43ddacSmrg    return FALSE;
557ad43ddacSmrg}
558ad43ddacSmrg#endif
559ad43ddacSmrg
560209ff23fSmrg#define ENTER_DRAW(x) TRACE
561209ff23fSmrg#define LEAVE_DRAW(x) TRACE
562209ff23fSmrg/***********************************************************************/
563209ff23fSmrg
564209ff23fSmrg#define ACCEL_MMIO
565209ff23fSmrg#define ACCEL_PREAMBLE()	unsigned char *RADEONMMIO = info->MMIO
566209ff23fSmrg#define BEGIN_ACCEL(n)		RADEONWaitForFifo(pScrn, (n))
567209ff23fSmrg#define OUT_ACCEL_REG(reg, val)	OUTREG(reg, val)
568209ff23fSmrg#define OUT_ACCEL_REG_F(reg, val) OUTREG(reg, F_TO_DW(val))
569ad43ddacSmrg#define OUT_RELOC(x, read, write)            do {} while(0)
570209ff23fSmrg#define FINISH_ACCEL()
571209ff23fSmrg
572209ff23fSmrg#ifdef RENDER
573209ff23fSmrg#include "radeon_exa_render.c"
574209ff23fSmrg#endif
575209ff23fSmrg#include "radeon_exa_funcs.c"
576209ff23fSmrg
577209ff23fSmrg#undef ACCEL_MMIO
578209ff23fSmrg#undef ACCEL_PREAMBLE
579209ff23fSmrg#undef BEGIN_ACCEL
580209ff23fSmrg#undef OUT_ACCEL_REG
581b7e1c893Smrg#undef OUT_ACCEL_REG_F
582209ff23fSmrg#undef FINISH_ACCEL
583ad43ddacSmrg#undef OUT_RELOC
584209ff23fSmrg
585209ff23fSmrg#ifdef XF86DRI
586209ff23fSmrg
587209ff23fSmrg#define ACCEL_CP
588209ff23fSmrg#define ACCEL_PREAMBLE()						\
589209ff23fSmrg    RING_LOCALS;							\
590209ff23fSmrg    RADEONCP_REFRESH(pScrn, info)
591209ff23fSmrg#define BEGIN_ACCEL(n)		BEGIN_RING(2*(n))
592209ff23fSmrg#define OUT_ACCEL_REG(reg, val)	OUT_RING_REG(reg, val)
593209ff23fSmrg#define FINISH_ACCEL()		ADVANCE_RING()
594ad43ddacSmrg#define OUT_RELOC(x, read, write) OUT_RING_RELOC(x, read, write)
595209ff23fSmrg
596209ff23fSmrg#define OUT_RING_F(x) OUT_RING(F_TO_DW(x))
597209ff23fSmrg
598209ff23fSmrg#ifdef RENDER
599209ff23fSmrg#include "radeon_exa_render.c"
600209ff23fSmrg#endif
601209ff23fSmrg#include "radeon_exa_funcs.c"
602209ff23fSmrg
603b7e1c893Smrg#undef ACCEL_CP
604b7e1c893Smrg#undef ACCEL_PREAMBLE
605b7e1c893Smrg#undef BEGIN_ACCEL
606b7e1c893Smrg#undef OUT_ACCEL_REG
607b7e1c893Smrg#undef FINISH_ACCEL
608b7e1c893Smrg#undef OUT_RING_F
609b7e1c893Smrg
610209ff23fSmrg#endif /* XF86DRI */
611209ff23fSmrg
612209ff23fSmrg/*
613209ff23fSmrg * Once screen->off_screen_base is set, this function
614209ff23fSmrg * allocates the remaining memory appropriately
615209ff23fSmrg */
616209ff23fSmrgBool RADEONSetupMemEXA (ScreenPtr pScreen)
617209ff23fSmrg{
618209ff23fSmrg    ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum];
619209ff23fSmrg    RADEONInfoPtr info = RADEONPTR(pScrn);
620209ff23fSmrg    xf86CrtcConfigPtr   xf86_config = XF86_CRTC_CONFIG_PTR(pScrn);
621209ff23fSmrg    int cpp = info->CurrentLayout.pixel_bytes;
622209ff23fSmrg    int screen_size;
623209ff23fSmrg    int byteStride = pScrn->displayWidth * cpp;
624209ff23fSmrg
625b7e1c893Smrg    if (info->accel_state->exa != NULL) {
626209ff23fSmrg	xf86DrvMsg(pScreen->myNum, X_ERROR, "Memory map already initialized\n");
627209ff23fSmrg	return FALSE;
628209ff23fSmrg    }
629b7e1c893Smrg    info->accel_state->exa = exaDriverAlloc();
630b7e1c893Smrg    if (info->accel_state->exa == NULL)
631209ff23fSmrg	return FALSE;
632209ff23fSmrg
633209ff23fSmrg    /* Need to adjust screen size for 16 line tiles, and then make it align to.
634209ff23fSmrg     * the buffer alignment requirement.
635209ff23fSmrg     */
636209ff23fSmrg    if (info->allowColorTiling)
637209ff23fSmrg	screen_size = RADEON_ALIGN(pScrn->virtualY, 16) * byteStride;
638209ff23fSmrg    else
639209ff23fSmrg	screen_size = pScrn->virtualY * byteStride;
640209ff23fSmrg
641b7e1c893Smrg    info->accel_state->exa->memoryBase = info->FB;
642b7e1c893Smrg    info->accel_state->exa->memorySize = info->FbMapSize - info->FbSecureSize;
643b7e1c893Smrg    info->accel_state->exa->offScreenBase = screen_size;
644209ff23fSmrg
645209ff23fSmrg    xf86DrvMsg(pScrn->scrnIndex, X_INFO, "Allocating from a screen of %ld kb\n",
646b7e1c893Smrg	       info->accel_state->exa->memorySize / 1024);
647209ff23fSmrg
648209ff23fSmrg    /* Reserve static area for hardware cursor */
649209ff23fSmrg    if (!xf86ReturnOptValBool(info->Options, OPTION_SW_CURSOR, FALSE)) {
650b7e1c893Smrg        int cursor_size = 64 * 4 * 64;
651b7e1c893Smrg        int align = IS_AVIVO_VARIANT ? 4096 : 256;
652b7e1c893Smrg        int c;
653b7e1c893Smrg
654b7e1c893Smrg        for (c = 0; c < xf86_config->num_crtc; c++) {
655b7e1c893Smrg            xf86CrtcPtr crtc = xf86_config->crtc[c];
656b7e1c893Smrg            RADEONCrtcPrivatePtr radeon_crtc = crtc->driver_private;
657b7e1c893Smrg
658b7e1c893Smrg            radeon_crtc->cursor_offset =
659b7e1c893Smrg                RADEON_ALIGN(info->accel_state->exa->offScreenBase, align);
660b7e1c893Smrg            info->accel_state->exa->offScreenBase = radeon_crtc->cursor_offset + cursor_size;
661b7e1c893Smrg
662b7e1c893Smrg            xf86DrvMsg(pScrn->scrnIndex, X_INFO,
663b7e1c893Smrg                       "Will use %d kb for hardware cursor %d at offset 0x%08x\n",
664b7e1c893Smrg                       (cursor_size * xf86_config->num_crtc) / 1024,
665b7e1c893Smrg                       c,
666b7e1c893Smrg                       (unsigned int)radeon_crtc->cursor_offset);
667b7e1c893Smrg        }
668209ff23fSmrg    }
669209ff23fSmrg
670209ff23fSmrg#if defined(XF86DRI)
671209ff23fSmrg    if (info->directRenderingEnabled) {
672b7e1c893Smrg	int depthCpp = (info->dri->depthBits - 8) / 4, l, next, depth_size;
673209ff23fSmrg
674b7e1c893Smrg	info->dri->frontOffset = 0;
675b7e1c893Smrg	info->dri->frontPitch = pScrn->displayWidth;
676209ff23fSmrg
677209ff23fSmrg        xf86DrvMsg(pScrn->scrnIndex, X_INFO,
678209ff23fSmrg	       "Will use %d kb for front buffer at offset 0x%08x\n",
679b7e1c893Smrg	       screen_size / 1024, info->dri->frontOffset);
680209ff23fSmrg	RADEONDRIAllocatePCIGARTTable(pScreen);
681209ff23fSmrg
682209ff23fSmrg	if (info->cardType==CARD_PCIE)
683209ff23fSmrg	  xf86DrvMsg(pScrn->scrnIndex, X_INFO,
684209ff23fSmrg		     "Will use %d kb for PCI GART at offset 0x%08x\n",
685b7e1c893Smrg		     info->dri->pciGartSize / 1024,
686b7e1c893Smrg		     (int)info->dri->pciGartOffset);
687209ff23fSmrg
688209ff23fSmrg	/* Reserve a static area for the back buffer the same size as the
689209ff23fSmrg	 * visible screen.  XXX: This would be better initialized in ati_dri.c
690209ff23fSmrg	 * when GLX is set up, but the offscreen memory manager's allocations
691209ff23fSmrg	 * don't last through VT switches, while the kernel's understanding of
692209ff23fSmrg	 * offscreen locations does.
693209ff23fSmrg	 */
694b7e1c893Smrg	info->dri->backPitch = pScrn->displayWidth;
695ad43ddacSmrg	next = RADEON_ALIGN(info->accel_state->exa->offScreenBase, RADEON_GPU_PAGE_SIZE);
696b7e1c893Smrg	if (!info->dri->noBackBuffer &&
697b7e1c893Smrg	    next + screen_size <= info->accel_state->exa->memorySize)
698209ff23fSmrg	{
699b7e1c893Smrg	    info->dri->backOffset = next;
700b7e1c893Smrg	    info->accel_state->exa->offScreenBase = next + screen_size;
701209ff23fSmrg	    xf86DrvMsg(pScrn->scrnIndex, X_INFO,
702209ff23fSmrg		       "Will use %d kb for back buffer at offset 0x%08x\n",
703b7e1c893Smrg		       screen_size / 1024, info->dri->backOffset);
704209ff23fSmrg	}
705209ff23fSmrg
706209ff23fSmrg	/* Reserve the static depth buffer, and adjust pitch and height to
707209ff23fSmrg	 * handle tiling.
708209ff23fSmrg	 */
709b7e1c893Smrg	info->dri->depthPitch = RADEON_ALIGN(pScrn->displayWidth, 32);
710b7e1c893Smrg	depth_size = RADEON_ALIGN(pScrn->virtualY, 16) * info->dri->depthPitch * depthCpp;
711ad43ddacSmrg	next = RADEON_ALIGN(info->accel_state->exa->offScreenBase, RADEON_GPU_PAGE_SIZE);
712b7e1c893Smrg	if (next + depth_size <= info->accel_state->exa->memorySize)
713209ff23fSmrg	{
714b7e1c893Smrg	    info->dri->depthOffset = next;
715b7e1c893Smrg	    info->accel_state->exa->offScreenBase = next + depth_size;
716209ff23fSmrg	    xf86DrvMsg(pScrn->scrnIndex, X_INFO,
717209ff23fSmrg		       "Will use %d kb for depth buffer at offset 0x%08x\n",
718b7e1c893Smrg		       depth_size / 1024, info->dri->depthOffset);
719209ff23fSmrg	}
720209ff23fSmrg
721b7e1c893Smrg	info->dri->textureSize *= (info->accel_state->exa->memorySize -
722b7e1c893Smrg				   info->accel_state->exa->offScreenBase) / 100;
723209ff23fSmrg
724b7e1c893Smrg	l = RADEONLog2(info->dri->textureSize / RADEON_NR_TEX_REGIONS);
725209ff23fSmrg	if (l < RADEON_LOG_TEX_GRANULARITY)
726209ff23fSmrg	    l = RADEON_LOG_TEX_GRANULARITY;
727b7e1c893Smrg	info->dri->textureSize = (info->dri->textureSize >> l) << l;
728b7e1c893Smrg	if (info->dri->textureSize >= 512 * 1024) {
729b7e1c893Smrg	    info->dri->textureOffset = info->accel_state->exa->offScreenBase;
730b7e1c893Smrg	    info->accel_state->exa->offScreenBase += info->dri->textureSize;
731209ff23fSmrg	    xf86DrvMsg(pScrn->scrnIndex, X_INFO,
732209ff23fSmrg		       "Will use %d kb for textures at offset 0x%08x\n",
733b7e1c893Smrg		       info->dri->textureSize / 1024, info->dri->textureOffset);
734209ff23fSmrg	} else {
735209ff23fSmrg	    /* Minimum texture size is for 2 256x256x32bpp textures */
736b7e1c893Smrg	    info->dri->textureSize = 0;
737209ff23fSmrg	}
738209ff23fSmrg    } else
739209ff23fSmrg#endif /* XF86DRI */
740209ff23fSmrg    	xf86DrvMsg(pScrn->scrnIndex, X_INFO,
741209ff23fSmrg		       "Will use %d kb for front buffer at offset 0x%08x\n",
742209ff23fSmrg		       screen_size / 1024, 0);
743209ff23fSmrg
744209ff23fSmrg    xf86DrvMsg(pScrn->scrnIndex, X_INFO,
745209ff23fSmrg	       "Will use %ld kb for X Server offscreen at offset 0x%08lx\n",
746b7e1c893Smrg	       (info->accel_state->exa->memorySize - info->accel_state->exa->offScreenBase) /
747b7e1c893Smrg	       1024, info->accel_state->exa->offScreenBase);
748209ff23fSmrg
749209ff23fSmrg    return TRUE;
750209ff23fSmrg}
751209ff23fSmrg
752209ff23fSmrg#ifdef XF86DRI
753209ff23fSmrg
754209ff23fSmrg#ifndef ExaOffscreenMarkUsed
755209ff23fSmrgextern void ExaOffscreenMarkUsed(PixmapPtr);
756209ff23fSmrg#endif
757209ff23fSmrg
758209ff23fSmrgunsigned long long
759209ff23fSmrgRADEONTexOffsetStart(PixmapPtr pPix)
760209ff23fSmrg{
761b7e1c893Smrg    RINFO_FROM_SCREEN(pPix->drawable.pScreen);
762b7e1c893Smrg    unsigned long long offset;
763ad43ddacSmrg
764ad43ddacSmrg    if (exaGetPixmapDriverPrivate(pPix))
765ad43ddacSmrg	return -1;
766ad43ddacSmrg
767209ff23fSmrg    exaMoveInPixmap(pPix);
768209ff23fSmrg    ExaOffscreenMarkUsed(pPix);
769209ff23fSmrg
770b7e1c893Smrg    offset = exaGetPixmapOffset(pPix);
771b7e1c893Smrg
772b7e1c893Smrg    if (offset > info->FbMapSize)
773b7e1c893Smrg	return ~0ULL;
774b7e1c893Smrg    else
775b7e1c893Smrg	return info->fbLocation + offset;
776209ff23fSmrg}
777209ff23fSmrg#endif
778