nvc0_xv.c revision fda9279d
1fda9279dSmrg/*
2fda9279dSmrg * Copyright 2008 Ben Skeggs
3fda9279dSmrg *
4fda9279dSmrg * Permission is hereby granted, free of charge, to any person obtaining a
5fda9279dSmrg * copy of this software and associated documentation files (the "Software"),
6fda9279dSmrg * to deal in the Software without restriction, including without limitation
7fda9279dSmrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8fda9279dSmrg * and/or sell copies of the Software, and to permit persons to whom the
9fda9279dSmrg * Software is furnished to do so, subject to the following conditions:
10fda9279dSmrg *
11fda9279dSmrg * The above copyright notice and this permission notice shall be included in
12fda9279dSmrg * all copies or substantial portions of the Software.
13fda9279dSmrg *
14fda9279dSmrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15fda9279dSmrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16fda9279dSmrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17fda9279dSmrg * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
18fda9279dSmrg * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
19fda9279dSmrg * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
20fda9279dSmrg * SOFTWARE.
21fda9279dSmrg */
22fda9279dSmrg
23fda9279dSmrg#ifdef HAVE_CONFIG_H
24fda9279dSmrg#include "config.h"
25fda9279dSmrg#endif
26fda9279dSmrg
27fda9279dSmrg#include "xf86xv.h"
28fda9279dSmrg#include <X11/extensions/Xv.h>
29fda9279dSmrg#include "exa.h"
30fda9279dSmrg#include "damage.h"
31fda9279dSmrg#include "dixstruct.h"
32fda9279dSmrg#include "fourcc.h"
33fda9279dSmrg
34fda9279dSmrg#include "nv_include.h"
35fda9279dSmrg#include "nvc0_accel.h"
36fda9279dSmrg
37fda9279dSmrgextern Atom xvSyncToVBlank, xvSetDefaults;
38fda9279dSmrg
39fda9279dSmrgstatic Bool
40fda9279dSmrgnvc0_xv_check_image_put(PixmapPtr ppix)
41fda9279dSmrg{
42fda9279dSmrg	switch (ppix->drawable.bitsPerPixel) {
43fda9279dSmrg	case 32:
44fda9279dSmrg	case 24:
45fda9279dSmrg	case 16:
46fda9279dSmrg	case 15:
47fda9279dSmrg		break;
48fda9279dSmrg	default:
49fda9279dSmrg		return FALSE;
50fda9279dSmrg	}
51fda9279dSmrg
52fda9279dSmrg	if (!nv50_style_tiled_pixmap(ppix))
53fda9279dSmrg		return FALSE;
54fda9279dSmrg
55fda9279dSmrg	return TRUE;
56fda9279dSmrg}
57fda9279dSmrg
58fda9279dSmrgint
59fda9279dSmrgnvc0_xv_image_put(ScrnInfoPtr pScrn,
60fda9279dSmrg		  struct nouveau_bo *src, int packed_y, int uv,
61fda9279dSmrg		  int id, int src_pitch, BoxPtr dstBox,
62fda9279dSmrg		  int x1, int y1, int x2, int y2,
63fda9279dSmrg		  uint16_t width, uint16_t height,
64fda9279dSmrg		  uint16_t src_w, uint16_t src_h,
65fda9279dSmrg		  uint16_t drw_w, uint16_t drw_h,
66fda9279dSmrg		  RegionPtr clipBoxes, PixmapPtr ppix,
67fda9279dSmrg		  NVPortPrivPtr pPriv)
68fda9279dSmrg{
69fda9279dSmrg	NVPtr pNv = NVPTR(pScrn);
70fda9279dSmrg	struct nouveau_bo *dst = nouveau_pixmap_bo(ppix);
71fda9279dSmrg	struct nouveau_pushbuf_refn refs[] = {
72fda9279dSmrg		{ pNv->scratch, NOUVEAU_BO_VRAM | NOUVEAU_BO_RDWR },
73fda9279dSmrg		{ src, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD },
74fda9279dSmrg		{ dst, NOUVEAU_BO_VRAM | NOUVEAU_BO_WR },
75fda9279dSmrg	};
76fda9279dSmrg	struct nouveau_pushbuf *push = pNv->pushbuf;
77fda9279dSmrg	uint32_t mode = 0xd0005000 | (src->config.nvc0.tile_mode << 18);
78fda9279dSmrg	float X1, X2, Y1, Y2;
79fda9279dSmrg	BoxPtr pbox;
80fda9279dSmrg	int nbox;
81fda9279dSmrg
82fda9279dSmrg	if (!nvc0_xv_check_image_put(ppix))
83fda9279dSmrg		return BadMatch;
84fda9279dSmrg
85fda9279dSmrg	if (!PUSH_SPACE(push, 256))
86fda9279dSmrg		return BadImplementation;
87fda9279dSmrg
88fda9279dSmrg	BEGIN_NVC0(push, NVC0_3D(RT_ADDRESS_HIGH(0)), 8);
89fda9279dSmrg	PUSH_DATA (push, dst->offset >> 32);
90fda9279dSmrg	PUSH_DATA (push, dst->offset);
91fda9279dSmrg	PUSH_DATA (push, ppix->drawable.width);
92fda9279dSmrg	PUSH_DATA (push, ppix->drawable.height);
93fda9279dSmrg	switch (ppix->drawable.bitsPerPixel) {
94fda9279dSmrg	case 32: PUSH_DATA (push, NV50_SURFACE_FORMAT_BGRA8_UNORM); break;
95fda9279dSmrg	case 24: PUSH_DATA (push, NV50_SURFACE_FORMAT_BGRX8_UNORM); break;
96fda9279dSmrg	case 16: PUSH_DATA (push, NV50_SURFACE_FORMAT_B5G6R5_UNORM); break;
97fda9279dSmrg	case 15: PUSH_DATA (push, NV50_SURFACE_FORMAT_BGR5_X1_UNORM); break;
98fda9279dSmrg	}
99fda9279dSmrg	PUSH_DATA (push, dst->config.nvc0.tile_mode);
100fda9279dSmrg	PUSH_DATA (push, 1);
101fda9279dSmrg	PUSH_DATA (push, 0);
102fda9279dSmrg
103fda9279dSmrg	BEGIN_NVC0(push, NVC0_3D(BLEND_ENABLE(0)), 1);
104fda9279dSmrg	PUSH_DATA (push, 0);
105fda9279dSmrg
106fda9279dSmrg	PUSH_DATAu(push, pNv->scratch, TIC_OFFSET, 16);
107fda9279dSmrg	if (id == FOURCC_YV12 || id == FOURCC_I420) {
108fda9279dSmrg	PUSH_DATA (push, NV50TIC_0_0_MAPA_C0 | NV50TIC_0_0_TYPEA_UNORM |
109fda9279dSmrg			 NV50TIC_0_0_MAPB_ZERO | NV50TIC_0_0_TYPEB_UNORM |
110fda9279dSmrg			 NV50TIC_0_0_MAPG_ZERO | NV50TIC_0_0_TYPEG_UNORM |
111fda9279dSmrg			 NV50TIC_0_0_MAPR_ZERO | NV50TIC_0_0_TYPER_UNORM |
112fda9279dSmrg			 NV50TIC_0_0_FMT_8);
113fda9279dSmrg	PUSH_DATA (push, ((src->offset + packed_y)));
114fda9279dSmrg	PUSH_DATA (push, ((src->offset + packed_y) >> 32) | mode);
115fda9279dSmrg	PUSH_DATA (push, 0x00300000);
116fda9279dSmrg	PUSH_DATA (push, width);
117fda9279dSmrg	PUSH_DATA (push, (1 << NV50TIC_0_5_DEPTH_SHIFT) | height);
118fda9279dSmrg	PUSH_DATA (push, 0x03000000);
119fda9279dSmrg	PUSH_DATA (push, 0x00000000);
120fda9279dSmrg	PUSH_DATA (push, NV50TIC_0_0_MAPA_C1 | NV50TIC_0_0_TYPEA_UNORM |
121fda9279dSmrg			 NV50TIC_0_0_MAPB_C0 | NV50TIC_0_0_TYPEB_UNORM |
122fda9279dSmrg			 NV50TIC_0_0_MAPG_ZERO | NV50TIC_0_0_TYPEG_UNORM |
123fda9279dSmrg			 NV50TIC_0_0_MAPR_ZERO | NV50TIC_0_0_TYPER_UNORM |
124fda9279dSmrg			 NV50TIC_0_0_FMT_8_8);
125fda9279dSmrg	PUSH_DATA (push, ((src->offset + uv)));
126fda9279dSmrg	PUSH_DATA (push, ((src->offset + uv) >> 32) | mode);
127fda9279dSmrg	PUSH_DATA (push, 0x00300000);
128fda9279dSmrg	PUSH_DATA (push, width >> 1);
129fda9279dSmrg	PUSH_DATA (push, (1 << NV50TIC_0_5_DEPTH_SHIFT) | (height >> 1));
130fda9279dSmrg	PUSH_DATA (push, 0x03000000);
131fda9279dSmrg	PUSH_DATA (push, 0x00000000);
132fda9279dSmrg	} else {
133fda9279dSmrg	if (id == FOURCC_UYVY) {
134fda9279dSmrg	PUSH_DATA (push, NV50TIC_0_0_MAPA_C1 | NV50TIC_0_0_TYPEA_UNORM |
135fda9279dSmrg			 NV50TIC_0_0_MAPB_ZERO | NV50TIC_0_0_TYPEB_UNORM |
136fda9279dSmrg			 NV50TIC_0_0_MAPG_ZERO | NV50TIC_0_0_TYPEG_UNORM |
137fda9279dSmrg			 NV50TIC_0_0_MAPR_ZERO | NV50TIC_0_0_TYPER_UNORM |
138fda9279dSmrg			 NV50TIC_0_0_FMT_8_8);
139fda9279dSmrg	} else {
140fda9279dSmrg	PUSH_DATA (push, NV50TIC_0_0_MAPA_C0 | NV50TIC_0_0_TYPEA_UNORM |
141fda9279dSmrg			 NV50TIC_0_0_MAPB_ZERO | NV50TIC_0_0_TYPEB_UNORM |
142fda9279dSmrg			 NV50TIC_0_0_MAPG_ZERO | NV50TIC_0_0_TYPEG_UNORM |
143fda9279dSmrg			 NV50TIC_0_0_MAPR_ZERO | NV50TIC_0_0_TYPER_UNORM |
144fda9279dSmrg			 NV50TIC_0_0_FMT_8_8);
145fda9279dSmrg	}
146fda9279dSmrg	PUSH_DATA (push, ((src->offset + packed_y)));
147fda9279dSmrg	PUSH_DATA (push, ((src->offset + packed_y) >> 32) | mode);
148fda9279dSmrg	PUSH_DATA (push, 0x00300000);
149fda9279dSmrg	PUSH_DATA (push, width);
150fda9279dSmrg	PUSH_DATA (push, (1 << NV50TIC_0_5_DEPTH_SHIFT) | height);
151fda9279dSmrg	PUSH_DATA (push, 0x03000000);
152fda9279dSmrg	PUSH_DATA (push, 0x00000000);
153fda9279dSmrg	if (id == FOURCC_UYVY) {
154fda9279dSmrg	PUSH_DATA (push, NV50TIC_0_0_MAPA_C2 | NV50TIC_0_0_TYPEA_UNORM |
155fda9279dSmrg			 NV50TIC_0_0_MAPB_C0 | NV50TIC_0_0_TYPEB_UNORM |
156fda9279dSmrg			 NV50TIC_0_0_MAPG_ZERO | NV50TIC_0_0_TYPEG_UNORM |
157fda9279dSmrg			 NV50TIC_0_0_MAPR_ZERO | NV50TIC_0_0_TYPER_UNORM |
158fda9279dSmrg			 NV50TIC_0_0_FMT_8_8_8_8);
159fda9279dSmrg	} else {
160fda9279dSmrg	PUSH_DATA (push, NV50TIC_0_0_MAPA_C3 | NV50TIC_0_0_TYPEA_UNORM |
161fda9279dSmrg			 NV50TIC_0_0_MAPB_C1 | NV50TIC_0_0_TYPEB_UNORM |
162fda9279dSmrg			 NV50TIC_0_0_MAPG_ZERO | NV50TIC_0_0_TYPEG_UNORM |
163fda9279dSmrg			 NV50TIC_0_0_MAPR_ZERO | NV50TIC_0_0_TYPER_UNORM |
164fda9279dSmrg			 NV50TIC_0_0_FMT_8_8_8_8);
165fda9279dSmrg	}
166fda9279dSmrg	PUSH_DATA (push, ((src->offset + packed_y)));
167fda9279dSmrg	PUSH_DATA (push, ((src->offset + packed_y) >> 32) | mode);
168fda9279dSmrg	PUSH_DATA (push, 0x00300000);
169fda9279dSmrg	PUSH_DATA (push, (width >> 1));
170fda9279dSmrg	PUSH_DATA (push, (1 << NV50TIC_0_5_DEPTH_SHIFT) | height);
171fda9279dSmrg	PUSH_DATA (push, 0x03000000);
172fda9279dSmrg	PUSH_DATA (push, 0x00000000);
173fda9279dSmrg	}
174fda9279dSmrg
175fda9279dSmrg	PUSH_DATAu(push, pNv->scratch, TSC_OFFSET, 16);
176fda9279dSmrg	PUSH_DATA (push, NV50TSC_1_0_WRAPS_CLAMP_TO_EDGE |
177fda9279dSmrg			 NV50TSC_1_0_WRAPT_CLAMP_TO_EDGE |
178fda9279dSmrg			 NV50TSC_1_0_WRAPR_CLAMP_TO_EDGE);
179fda9279dSmrg	PUSH_DATA (push, NV50TSC_1_1_MAGF_LINEAR |
180fda9279dSmrg			 NV50TSC_1_1_MINF_LINEAR |
181fda9279dSmrg			 NV50TSC_1_1_MIPF_NONE);
182fda9279dSmrg	PUSH_DATA (push, 0x00000000);
183fda9279dSmrg	PUSH_DATA (push, 0x00000000);
184fda9279dSmrg	PUSH_DATA (push, 0x00000000);
185fda9279dSmrg	PUSH_DATA (push, 0x00000000);
186fda9279dSmrg	PUSH_DATA (push, 0x00000000);
187fda9279dSmrg	PUSH_DATA (push, 0x00000000);
188fda9279dSmrg	PUSH_DATA (push, NV50TSC_1_0_WRAPS_CLAMP_TO_EDGE |
189fda9279dSmrg			 NV50TSC_1_0_WRAPT_CLAMP_TO_EDGE |
190fda9279dSmrg			 NV50TSC_1_0_WRAPR_CLAMP_TO_EDGE);
191fda9279dSmrg	PUSH_DATA (push, NV50TSC_1_1_MAGF_LINEAR |
192fda9279dSmrg			 NV50TSC_1_1_MINF_LINEAR |
193fda9279dSmrg			 NV50TSC_1_1_MIPF_NONE);
194fda9279dSmrg	PUSH_DATA (push, 0x00000000);
195fda9279dSmrg	PUSH_DATA (push, 0x00000000);
196fda9279dSmrg	PUSH_DATA (push, 0x00000000);
197fda9279dSmrg	PUSH_DATA (push, 0x00000000);
198fda9279dSmrg	PUSH_DATA (push, 0x00000000);
199fda9279dSmrg	PUSH_DATA (push, 0x00000000);
200fda9279dSmrg
201fda9279dSmrg	BEGIN_NVC0(push, NVC0_3D(SP_START_ID(5)), 1);
202fda9279dSmrg	PUSH_DATA (push, PFP_NV12);
203fda9279dSmrg
204fda9279dSmrg	BEGIN_NVC0(push, NVC0_3D(TSC_FLUSH), 1);
205fda9279dSmrg	PUSH_DATA (push, 0);
206fda9279dSmrg	BEGIN_NVC0(push, NVC0_3D(TIC_FLUSH), 1);
207fda9279dSmrg	PUSH_DATA (push, 0);
208fda9279dSmrg	BEGIN_NVC0(push, NVC0_3D(TEX_CACHE_CTL), 1);
209fda9279dSmrg	PUSH_DATA (push, 0);
210fda9279dSmrg
211fda9279dSmrg	PUSH_DATAu(push, pNv->scratch, PVP_DATA, 11);
212fda9279dSmrg	PUSH_DATAf(push, 1.0);
213fda9279dSmrg	PUSH_DATAf(push, 0.0);
214fda9279dSmrg	PUSH_DATAf(push, 0.0);
215fda9279dSmrg	PUSH_DATAf(push, 0.0);
216fda9279dSmrg	PUSH_DATAf(push, 1.0);
217fda9279dSmrg	PUSH_DATAf(push, 0.0);
218fda9279dSmrg	PUSH_DATAf(push, 0.0);
219fda9279dSmrg	PUSH_DATAf(push, 0.0);
220fda9279dSmrg	PUSH_DATAf(push, 1.0);
221fda9279dSmrg	PUSH_DATAf(push, 1.0 / width);
222fda9279dSmrg	PUSH_DATAf(push, 1.0 / height);
223fda9279dSmrg
224fda9279dSmrg	if (pPriv->SyncToVBlank) {
225fda9279dSmrg		NVC0SyncToVBlank(ppix, dstBox);
226fda9279dSmrg	}
227fda9279dSmrg
228fda9279dSmrg	/* These are fixed point values in the 16.16 format. */
229fda9279dSmrg	X1 = (float)(x1>>16)+(float)(x1&0xFFFF)/(float)0x10000;
230fda9279dSmrg	Y1 = (float)(y1>>16)+(float)(y1&0xFFFF)/(float)0x10000;
231fda9279dSmrg	X2 = (float)(x2>>16)+(float)(x2&0xFFFF)/(float)0x10000;
232fda9279dSmrg	Y2 = (float)(y2>>16)+(float)(y2&0xFFFF)/(float)0x10000;
233fda9279dSmrg
234fda9279dSmrg	pbox = REGION_RECTS(clipBoxes);
235fda9279dSmrg	nbox = REGION_NUM_RECTS(clipBoxes);
236fda9279dSmrg	while(nbox--) {
237fda9279dSmrg		float tx1=X1+(float)(pbox->x1 - dstBox->x1)*(X2-X1)/(float)(drw_w);
238fda9279dSmrg		float tx2=X1+(float)(pbox->x2 - dstBox->x1)*(src_w)/(float)(drw_w);
239fda9279dSmrg		float ty1=Y1+(float)(pbox->y1 - dstBox->y1)*(Y2-Y1)/(float)(drw_h);
240fda9279dSmrg		float ty2=Y1+(float)(pbox->y2 - dstBox->y1)*(src_h)/(float)(drw_h);
241fda9279dSmrg		int sx1=pbox->x1;
242fda9279dSmrg		int sx2=pbox->x2;
243fda9279dSmrg		int sy1=pbox->y1;
244fda9279dSmrg		int sy2=pbox->y2;
245fda9279dSmrg
246fda9279dSmrg		if (nouveau_pushbuf_space(push, 64, 0, 0) ||
247fda9279dSmrg		    nouveau_pushbuf_refn (push, refs, 3))
248fda9279dSmrg			return BadImplementation;
249fda9279dSmrg
250fda9279dSmrg		BEGIN_NVC0(push, NVC0_3D(SCISSOR_HORIZ(0)), 2);
251fda9279dSmrg		PUSH_DATA (push, sx2 << NVC0_3D_SCISSOR_HORIZ_MAX__SHIFT | sx1);
252fda9279dSmrg		PUSH_DATA (push, sy2 << NVC0_3D_SCISSOR_VERT_MAX__SHIFT | sy1 );
253fda9279dSmrg
254fda9279dSmrg		BEGIN_NVC0(push, NVC0_3D(VERTEX_BEGIN_GL), 1);
255fda9279dSmrg		PUSH_DATA (push, NVC0_3D_VERTEX_BEGIN_GL_PRIMITIVE_TRIANGLES);
256fda9279dSmrg		PUSH_VTX1s(push, tx1, ty1, sx1, sy1);
257fda9279dSmrg		PUSH_VTX1s(push, tx2+(tx2-tx1), ty1, sx2+(sx2-sx1), sy1);
258fda9279dSmrg		PUSH_VTX1s(push, tx1, ty2+(ty2-ty1), sx1, sy2+(sy2-sy1));
259fda9279dSmrg		BEGIN_NVC0(push, NVC0_3D(VERTEX_END_GL), 1);
260fda9279dSmrg		PUSH_DATA (push, 0);
261fda9279dSmrg
262fda9279dSmrg		pbox++;
263fda9279dSmrg	}
264fda9279dSmrg
265fda9279dSmrg	PUSH_KICK(push);
266fda9279dSmrg	return Success;
267fda9279dSmrg}
268fda9279dSmrg
269fda9279dSmrgvoid
270fda9279dSmrgnvc0_xv_csc_update(NVPtr pNv, float yco, float *off, float *uco, float *vco)
271fda9279dSmrg{
272fda9279dSmrg	struct nouveau_pushbuf *push = pNv->pushbuf;
273fda9279dSmrg
274fda9279dSmrg	if (nouveau_pushbuf_space(push, 64, 0, 0) ||
275fda9279dSmrg	    nouveau_pushbuf_refn (push, &(struct nouveau_pushbuf_refn) {
276fda9279dSmrg					pNv->scratch, NOUVEAU_BO_WR |
277fda9279dSmrg					NOUVEAU_BO_VRAM }, 1))
278fda9279dSmrg		return;
279fda9279dSmrg
280fda9279dSmrg	BEGIN_NVC0(push, NVC0_3D(CB_SIZE), 3);
281fda9279dSmrg	PUSH_DATA (push, 256);
282fda9279dSmrg	PUSH_DATA (push, (pNv->scratch->offset + PFP_DATA) >> 32);
283fda9279dSmrg	PUSH_DATA (push, (pNv->scratch->offset + PFP_DATA));
284fda9279dSmrg	BEGIN_NVC0(push, NVC0_3D(CB_POS), 11);
285fda9279dSmrg	PUSH_DATA (push, 0);
286fda9279dSmrg	PUSH_DATAf(push, yco);
287fda9279dSmrg	PUSH_DATAf(push, off[0]);
288fda9279dSmrg	PUSH_DATAf(push, off[1]);
289fda9279dSmrg	PUSH_DATAf(push, off[2]);
290fda9279dSmrg	PUSH_DATAf(push, uco[0]);
291fda9279dSmrg	PUSH_DATAf(push, uco[1]);
292fda9279dSmrg	PUSH_DATAf(push, uco[2]);
293fda9279dSmrg	PUSH_DATAf(push, vco[0]);
294fda9279dSmrg	PUSH_DATAf(push, vco[1]);
295fda9279dSmrg	PUSH_DATAf(push, vco[2]);
296fda9279dSmrg}
297