rasops24.c revision 1.47 1 1.47 rin /* $NetBSD: rasops24.c,v 1.47 2019/08/07 11:47:33 rin Exp $ */
2 1.1 ad
3 1.6 ad /*-
4 1.6 ad * Copyright (c) 1999 The NetBSD Foundation, Inc.
5 1.1 ad * All rights reserved.
6 1.1 ad *
7 1.6 ad * This code is derived from software contributed to The NetBSD Foundation
8 1.13 ad * by Andrew Doran.
9 1.6 ad *
10 1.1 ad * Redistribution and use in source and binary forms, with or without
11 1.1 ad * modification, are permitted provided that the following conditions
12 1.1 ad * are met:
13 1.1 ad * 1. Redistributions of source code must retain the above copyright
14 1.1 ad * notice, this list of conditions and the following disclaimer.
15 1.1 ad * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 ad * notice, this list of conditions and the following disclaimer in the
17 1.1 ad * documentation and/or other materials provided with the distribution.
18 1.1 ad *
19 1.6 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.6 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.6 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.6 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.6 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.6 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.6 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.6 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.6 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.6 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.6 ad * POSSIBILITY OF SUCH DAMAGE.
30 1.1 ad */
31 1.2 ad
32 1.15 lukem #include <sys/cdefs.h>
33 1.47 rin __KERNEL_RCSID(0, "$NetBSD: rasops24.c,v 1.47 2019/08/07 11:47:33 rin Exp $");
34 1.15 lukem
35 1.1 ad #include "opt_rasops.h"
36 1.1 ad
37 1.1 ad #include <sys/param.h>
38 1.1 ad #include <sys/systm.h>
39 1.1 ad #include <sys/time.h>
40 1.1 ad
41 1.4 ad #include <machine/endian.h>
42 1.22 dsl #include <sys/bswap.h>
43 1.4 ad
44 1.1 ad #include <dev/wscons/wsdisplayvar.h>
45 1.1 ad #include <dev/wscons/wsconsio.h>
46 1.40 rin
47 1.40 rin #define _RASOPS_PRIVATE
48 1.44 rin #define RASOPS_DEPTH 24
49 1.1 ad #include <dev/rasops/rasops.h>
50 1.1 ad
51 1.18 perry static void rasops24_erasecols(void *, int, int, int, long);
52 1.18 perry static void rasops24_eraserows(void *, int, int, long);
53 1.36 rin static void rasops24_putchar(void *, int, int, u_int, long);
54 1.37 rin static void rasops24_putchar_aa(void *, int, int, u_int, long);
55 1.43 rin static __inline void
56 1.43 rin rasops24_makestamp1(struct rasops_info *, uint32_t *,
57 1.43 rin uint32_t, uint32_t, uint32_t, uint32_t);
58 1.9 ad #ifndef RASOPS_SMALL
59 1.36 rin static void rasops24_putchar8(void *, int, int, u_int, long);
60 1.36 rin static void rasops24_putchar12(void *, int, int, u_int, long);
61 1.36 rin static void rasops24_putchar16(void *, int, int, u_int, long);
62 1.18 perry static void rasops24_makestamp(struct rasops_info *, long);
63 1.29 njoly #endif
64 1.4 ad
#ifndef RASOPS_SMALL
/*
 * 4x1 stamp for optimized character blitting, plus the attribute and
 * rasops_info it was most recently built for (recorded by
 * rasops24_makestamp()).
 *
 * Each of the 16 possible 4-bit font patterns owns four consecutive
 * words (16 bytes) of the table; rasops24_makestamp() fills the first
 * three of them.
 */
static uint32_t			stamp[64];
static long			stamp_attr;
static struct rasops_info	*stamp_ri;

/*
 * Stamp lookup:
 *
 *	offset = STAMP_SHIFT(fontbits, nibble #) & STAMP_MASK
 *	destination uint32_t[0] = STAMP_READ(offset)
 *	destination uint32_t[1] = STAMP_READ(offset + 4)
 *	destination uint32_t[2] = STAMP_READ(offset + 8)
 *
 * `offset' is a byte offset into stamp[]; STAMP_MASK keeps it a
 * multiple of 16.
 */
#define	STAMP_SHIFT(fb, n)	((n) ? (fb) : (fb) << 4)
#define	STAMP_MASK		(0xf << 4)
#define	STAMP_READ(o)		(*(uint32_t *)((uint8_t *)stamp + (o)))
#endif
81 1.4 ad
82 1.1 ad /*
83 1.14 wiz * Initialize rasops_info struct for this colordepth.
84 1.1 ad */
85 1.1 ad void
86 1.26 dsl rasops24_init(struct rasops_info *ri)
87 1.1 ad {
88 1.1 ad
89 1.36 rin if (ri->ri_rnum == 0) {
90 1.36 rin ri->ri_rnum = ri->ri_gnum = ri->ri_bnum = 8;
91 1.36 rin
92 1.36 rin ri->ri_rpos = 0;
93 1.36 rin ri->ri_gpos = 8;
94 1.36 rin ri->ri_bpos = 16;
95 1.36 rin }
96 1.36 rin
97 1.36 rin ri->ri_ops.erasecols = rasops24_erasecols;
98 1.36 rin ri->ri_ops.eraserows = rasops24_eraserows;
99 1.36 rin
100 1.37 rin if (FONT_IS_ALPHA(ri->ri_font)) {
101 1.37 rin ri->ri_ops.putchar = rasops24_putchar_aa;
102 1.37 rin return;
103 1.37 rin }
104 1.37 rin
105 1.1 ad switch (ri->ri_font->fontwidth) {
106 1.9 ad #ifndef RASOPS_SMALL
107 1.1 ad case 8:
108 1.4 ad ri->ri_ops.putchar = rasops24_putchar8;
109 1.1 ad break;
110 1.1 ad case 12:
111 1.4 ad ri->ri_ops.putchar = rasops24_putchar12;
112 1.1 ad break;
113 1.1 ad case 16:
114 1.4 ad ri->ri_ops.putchar = rasops24_putchar16;
115 1.1 ad break;
116 1.9 ad #endif
117 1.1 ad default:
118 1.4 ad ri->ri_ops.putchar = rasops24_putchar;
119 1.41 rin return;
120 1.1 ad }
121 1.41 rin
122 1.41 rin #ifndef RASOPS_SMALL
123 1.47 rin stamp_attr = 0;
124 1.47 rin stamp_ri = NULL;
125 1.41 rin #endif
126 1.1 ad }
127 1.1 ad
128 1.35 rin #include "rasops_putchar.h"
129 1.37 rin #include "rasops_putchar_aa.h"
130 1.1 ad
131 1.43 rin static __inline void
132 1.47 rin rasops24_makestamp1(struct rasops_info *ri, uint32_t *xstamp,
133 1.43 rin uint32_t c1, uint32_t c2, uint32_t c3, uint32_t c4)
134 1.43 rin {
135 1.43 rin
136 1.47 rin xstamp[0] = (c1 << 8) | (c2 >> 16);
137 1.47 rin xstamp[1] = (c2 << 16) | (c3 >> 8);
138 1.47 rin xstamp[2] = (c3 << 24) | c4;
139 1.43 rin
140 1.43 rin #if BYTE_ORDER == LITTLE_ENDIAN
141 1.43 rin if ((ri->ri_flg & RI_BSWAP) == 0)
142 1.43 rin #else
143 1.43 rin if ((ri->ri_flg & RI_BSWAP) != 0)
144 1.43 rin #endif
145 1.43 rin {
146 1.47 rin xstamp[0] = bswap32(xstamp[0]);
147 1.47 rin xstamp[1] = bswap32(xstamp[1]);
148 1.47 rin xstamp[2] = bswap32(xstamp[2]);
149 1.43 rin }
150 1.43 rin }
151 1.43 rin
152 1.9 ad #ifndef RASOPS_SMALL
153 1.9 ad /*
154 1.9 ad * Recompute the blitting stamp.
155 1.9 ad */
156 1.9 ad static void
157 1.26 dsl rasops24_makestamp(struct rasops_info *ri, long attr)
158 1.9 ad {
159 1.36 rin uint32_t fg, bg, c1, c2, c3, c4;
160 1.9 ad int i;
161 1.12 pk
162 1.47 rin stamp_attr = attr;
163 1.47 rin stamp_ri = ri;
164 1.47 rin
165 1.36 rin fg = ri->ri_devcmap[((uint32_t)attr >> 24) & 0xf] & 0xffffff;
166 1.36 rin bg = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
167 1.12 pk
168 1.9 ad for (i = 0; i < 64; i += 4) {
169 1.9 ad #if BYTE_ORDER == LITTLE_ENDIAN
170 1.36 rin c1 = i & 32 ? fg : bg;
171 1.36 rin c2 = i & 16 ? fg : bg;
172 1.36 rin c3 = i & 8 ? fg : bg;
173 1.36 rin c4 = i & 4 ? fg : bg;
174 1.9 ad #else
175 1.36 rin c1 = i & 8 ? fg : bg;
176 1.36 rin c2 = i & 4 ? fg : bg;
177 1.36 rin c3 = i & 16 ? fg : bg;
178 1.36 rin c4 = i & 32 ? fg : bg;
179 1.9 ad #endif
180 1.43 rin rasops24_makestamp1(ri, &stamp[i], c1, c2, c3, c4);
181 1.9 ad }
182 1.9 ad }
183 1.1 ad
184 1.35 rin #define RASOPS_WIDTH 8
185 1.35 rin #include "rasops_putchar_width.h"
186 1.35 rin #undef RASOPS_WIDTH
187 1.35 rin
188 1.35 rin #define RASOPS_WIDTH 12
189 1.35 rin #include "rasops_putchar_width.h"
190 1.35 rin #undef RASOPS_WIDTH
191 1.35 rin
192 1.35 rin #define RASOPS_WIDTH 16
193 1.35 rin #include "rasops_putchar_width.h"
194 1.35 rin #undef RASOPS_WIDTH
195 1.12 pk
196 1.11 ad #endif /* !RASOPS_SMALL */
197 1.1 ad
198 1.1 ad /*
199 1.4 ad * Erase rows. This is nice and easy due to alignment.
200 1.1 ad */
201 1.1 ad static void
202 1.27 dsl rasops24_eraserows(void *cookie, int row, int num, long attr)
203 1.1 ad {
204 1.39 rin struct rasops_info *ri = (struct rasops_info *)cookie;
205 1.42 rin int full, slop, cnt, stride;
206 1.47 rin uint32_t *rp, *dp, *hp, clr, xstamp[3];
207 1.39 rin
208 1.39 rin hp = NULL; /* XXX GCC */
209 1.12 pk
210 1.12 pk /*
211 1.4 ad * If the color is gray, we can cheat and use the generic routines
212 1.4 ad * (which are faster, hopefully) since the r,g,b values are the same.
213 1.4 ad */
214 1.30 mlelstv if ((attr & WSATTR_PRIVATE2) != 0) {
215 1.4 ad rasops_eraserows(cookie, row, num, attr);
216 1.4 ad return;
217 1.4 ad }
218 1.4 ad
219 1.1 ad #ifdef RASOPS_CLIPPING
220 1.1 ad if (row < 0) {
221 1.1 ad num += row;
222 1.1 ad row = 0;
223 1.1 ad }
224 1.1 ad
225 1.39 rin if (row + num > ri->ri_rows)
226 1.1 ad num = ri->ri_rows - row;
227 1.12 pk
228 1.1 ad if (num <= 0)
229 1.1 ad return;
230 1.1 ad #endif
231 1.12 pk
232 1.36 rin clr = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
233 1.47 rin rasops24_makestamp1(ri, xstamp, clr, clr, clr, clr);
234 1.4 ad
235 1.12 pk /*
236 1.7 ad * XXX the wsdisplay_emulops interface seems a little deficient in
237 1.12 pk * that there is no way to clear the *entire* screen. We provide a
238 1.12 pk * workaround here: if the entire console area is being cleared, and
239 1.7 ad * the RI_FULLCLEAR flag is set, clear the entire display.
240 1.12 pk */
241 1.7 ad if (num == ri->ri_rows && (ri->ri_flg & RI_FULLCLEAR) != 0) {
242 1.7 ad stride = ri->ri_stride;
243 1.7 ad num = ri->ri_height;
244 1.39 rin rp = (uint32_t *)ri->ri_origbits;
245 1.39 rin if (ri->ri_hwbits)
246 1.39 rin hp = (uint32_t *)ri->ri_hworigbits;
247 1.7 ad } else {
248 1.7 ad stride = ri->ri_emustride;
249 1.7 ad num *= ri->ri_font->fontheight;
250 1.39 rin rp = (uint32_t *)(ri->ri_bits + row * ri->ri_yscale);
251 1.39 rin if (ri->ri_hwbits)
252 1.39 rin hp = (uint32_t *)(ri->ri_hwbits + row * ri->ri_yscale);
253 1.7 ad }
254 1.7 ad
255 1.42 rin full = stride / (4 * 3);
256 1.42 rin slop = (stride - full * (4 * 3)) / 4;
257 1.12 pk
258 1.47 rin while (num--) {
259 1.47 rin dp = rp;
260 1.47 rin for (cnt = full; cnt; cnt--) {
261 1.47 rin dp[0] = xstamp[0];
262 1.47 rin dp[1] = xstamp[1];
263 1.47 rin dp[2] = xstamp[2];
264 1.47 rin dp += 3;
265 1.47 rin }
266 1.47 rin for (cnt = 0; cnt < slop; cnt++)
267 1.47 rin *dp++ = xstamp[cnt];
268 1.1 ad
269 1.39 rin if (ri->ri_hwbits) {
270 1.47 rin memcpy(hp, rp, stride);
271 1.39 rin DELTA(hp, ri->ri_stride, uint32_t *);
272 1.39 rin }
273 1.47 rin
274 1.47 rin DELTA(rp, ri->ri_stride, uint32_t *);
275 1.4 ad }
276 1.4 ad }
277 1.4 ad
278 1.4 ad /*
279 1.4 ad * Erase columns.
280 1.4 ad */
281 1.4 ad static void
282 1.27 dsl rasops24_erasecols(void *cookie, int row, int col, int num, long attr)
283 1.4 ad {
284 1.39 rin struct rasops_info *ri = (struct rasops_info *)cookie;
285 1.47 rin int height, cnt, slop1, slop2, full;
286 1.47 rin uint32_t clr, xstamp[3], *dp;
287 1.39 rin uint8_t *rp, *hp, *dbp;
288 1.39 rin
289 1.39 rin hp = NULL; /* XXX GCC */
290 1.4 ad
291 1.12 pk /*
292 1.4 ad * If the color is gray, we can cheat and use the generic routines
293 1.4 ad * (which are faster, hopefully) since the r,g,b values are the same.
294 1.4 ad */
295 1.30 mlelstv if ((attr & WSATTR_PRIVATE2) != 0) {
296 1.4 ad rasops_erasecols(cookie, row, col, num, attr);
297 1.4 ad return;
298 1.4 ad }
299 1.12 pk
300 1.12 pk #ifdef RASOPS_CLIPPING
301 1.12 pk /* Catches 'row < 0' case too */
302 1.4 ad if ((unsigned)row >= (unsigned)ri->ri_rows)
303 1.4 ad return;
304 1.4 ad
305 1.4 ad if (col < 0) {
306 1.4 ad num += col;
307 1.4 ad col = 0;
308 1.4 ad }
309 1.4 ad
310 1.39 rin if (col + num > ri->ri_cols)
311 1.4 ad num = ri->ri_cols - col;
312 1.12 pk
313 1.4 ad if (num <= 0)
314 1.4 ad return;
315 1.4 ad #endif
316 1.12 pk
317 1.39 rin rp = ri->ri_bits + row * ri->ri_yscale + col * ri->ri_xscale;
318 1.39 rin if (ri->ri_hwbits)
319 1.39 rin hp = ri->ri_hwbits + row * ri->ri_yscale + col * ri->ri_xscale;
320 1.39 rin
321 1.47 rin num *= ri->ri_xscale;
322 1.4 ad height = ri->ri_font->fontheight;
323 1.4 ad
324 1.36 rin clr = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
325 1.47 rin rasops24_makestamp1(ri, xstamp, clr, clr, clr, clr);
326 1.12 pk
327 1.47 rin /*
328 1.47 rin * Align to word boundary by 24-bit-wise operations:
329 1.47 rin *
330 1.47 rin * rp % 4 == 1 ---> slop1 = 3:
331 1.47 rin * 0123
332 1.47 rin * -RGB
333 1.47 rin *
334 1.47 rin * rp % 4 == 2 ---> slop1 = 6:
335 1.47 rin * 0123 0123
336 1.47 rin * --RG BRGB
337 1.47 rin *
338 1.47 rin * rp % 4 == 3 ---> slop1 = 9:
339 1.47 rin * 0123 0123 0123
340 1.47 rin * ---R GBRG BRGB
341 1.47 rin */
342 1.47 rin slop1 = 3 * ((uintptr_t)rp % 4);
343 1.47 rin slop2 = (num - slop1) % 12;
344 1.47 rin full = (num - slop1 /* - slop2 */) / 12;
345 1.47 rin
346 1.47 rin while (height--) {
347 1.47 rin /* Align to word boundary */
348 1.47 rin dbp = rp;
349 1.47 rin for (cnt = slop1; cnt; cnt -= 3) {
350 1.47 rin *dbp++ = (clr >> 16);
351 1.47 rin *dbp++ = (clr >> 8);
352 1.47 rin *dbp++ = clr;
353 1.47 rin }
354 1.47 rin
355 1.47 rin /* 4 pels per loop */
356 1.47 rin dp = (uint32_t *)dbp;
357 1.47 rin for (cnt = full; cnt; cnt--) {
358 1.47 rin dp[0] = xstamp[0];
359 1.47 rin dp[1] = xstamp[1];
360 1.47 rin dp[2] = xstamp[2];
361 1.47 rin dp += 3;
362 1.47 rin }
363 1.4 ad
364 1.47 rin /* Trailing slop */
365 1.47 rin dbp = (uint8_t *)dp;
366 1.47 rin for (cnt = slop2; cnt; cnt -= 3) {
367 1.47 rin *dbp++ = (clr >> 16);
368 1.47 rin *dbp++ = (clr >> 8);
369 1.47 rin *dbp++ = clr;
370 1.47 rin }
371 1.39 rin
372 1.39 rin if (ri->ri_hwbits) {
373 1.47 rin memcpy(hp, rp, num);
374 1.39 rin hp += ri->ri_stride;
375 1.12 pk }
376 1.47 rin
377 1.47 rin rp += ri->ri_stride;
378 1.1 ad }
379 1.1 ad }
380