rasops24.c revision 1.40 1 1.40 rin /* $NetBSD: rasops24.c,v 1.40 2019/07/31 00:14:25 rin Exp $ */
2 1.1 ad
3 1.6 ad /*-
4 1.6 ad * Copyright (c) 1999 The NetBSD Foundation, Inc.
5 1.1 ad * All rights reserved.
6 1.1 ad *
7 1.6 ad * This code is derived from software contributed to The NetBSD Foundation
8 1.13 ad * by Andrew Doran.
9 1.6 ad *
10 1.1 ad * Redistribution and use in source and binary forms, with or without
11 1.1 ad * modification, are permitted provided that the following conditions
12 1.1 ad * are met:
13 1.1 ad * 1. Redistributions of source code must retain the above copyright
14 1.1 ad * notice, this list of conditions and the following disclaimer.
15 1.1 ad * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 ad * notice, this list of conditions and the following disclaimer in the
17 1.1 ad * documentation and/or other materials provided with the distribution.
18 1.1 ad *
19 1.6 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.6 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.6 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.6 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.6 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.6 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.6 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.6 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.6 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.6 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.6 ad * POSSIBILITY OF SUCH DAMAGE.
30 1.1 ad */
31 1.2 ad
32 1.15 lukem #include <sys/cdefs.h>
33 1.40 rin __KERNEL_RCSID(0, "$NetBSD: rasops24.c,v 1.40 2019/07/31 00:14:25 rin Exp $");
34 1.15 lukem
35 1.1 ad #include "opt_rasops.h"
36 1.1 ad
37 1.1 ad #include <sys/param.h>
38 1.1 ad #include <sys/systm.h>
39 1.1 ad #include <sys/time.h>
40 1.1 ad
41 1.4 ad #include <machine/endian.h>
42 1.22 dsl #include <sys/bswap.h>
43 1.4 ad
44 1.1 ad #include <dev/wscons/wsdisplayvar.h>
45 1.1 ad #include <dev/wscons/wsconsio.h>
46 1.40 rin
47 1.40 rin #define _RASOPS_PRIVATE
48 1.1 ad #include <dev/rasops/rasops.h>
49 1.1 ad
50 1.18 perry static void rasops24_erasecols(void *, int, int, int, long);
51 1.18 perry static void rasops24_eraserows(void *, int, int, long);
52 1.36 rin static void rasops24_putchar(void *, int, int, u_int, long);
53 1.37 rin static void rasops24_putchar_aa(void *, int, int, u_int, long);
54 1.9 ad #ifndef RASOPS_SMALL
55 1.36 rin static void rasops24_putchar8(void *, int, int, u_int, long);
56 1.36 rin static void rasops24_putchar12(void *, int, int, u_int, long);
57 1.36 rin static void rasops24_putchar16(void *, int, int, u_int, long);
58 1.18 perry static void rasops24_makestamp(struct rasops_info *, long);
59 1.1 ad
60 1.12 pk /*
61 1.12 pk * 4x1 stamp for optimized character blitting
62 1.4 ad */
63 1.32 rin static uint32_t stamp[64];
64 1.4 ad static long stamp_attr;
65 1.4 ad static int stamp_mutex; /* XXX see note in readme */
66 1.29 njoly #endif
67 1.4 ad
68 1.4 ad /*
69 1.4 ad * offset = STAMP_SHIFT(fontbits, nibble #) & STAMP_MASK
70 1.32 rin * destination uint32_t[0] = STAMP_READ(offset)
71 1.32 rin * destination uint32_t[1] = STAMP_READ(offset + 4)
72 1.32 rin * destination uint32_t[2] = STAMP_READ(offset + 8)
73 1.4 ad */
74 1.36 rin #define STAMP_SHIFT(fb, n) ((n) ? (fb) : (fb) << 4)
75 1.36 rin #define STAMP_MASK (0xf << 4)
76 1.36 rin #define STAMP_READ(o) (*(uint32_t *)((uint8_t *)stamp + (o)))
77 1.4 ad
78 1.1 ad /*
79 1.14 wiz * Initialize rasops_info struct for this colordepth.
80 1.1 ad */
81 1.1 ad void
82 1.26 dsl rasops24_init(struct rasops_info *ri)
83 1.1 ad {
84 1.1 ad
85 1.38 rin #ifndef RASOPS_SMALL
86 1.38 rin /*
87 1.38 rin * Different devcmap's are used depending on font widths,
88 1.38 rin * therefore we need reset stamp here.
89 1.38 rin */
90 1.38 rin stamp_attr = 0;
91 1.38 rin #endif
92 1.38 rin
93 1.36 rin if (ri->ri_rnum == 0) {
94 1.36 rin ri->ri_rnum = ri->ri_gnum = ri->ri_bnum = 8;
95 1.36 rin
96 1.36 rin ri->ri_rpos = 0;
97 1.36 rin ri->ri_gpos = 8;
98 1.36 rin ri->ri_bpos = 16;
99 1.36 rin }
100 1.36 rin
101 1.36 rin ri->ri_ops.erasecols = rasops24_erasecols;
102 1.36 rin ri->ri_ops.eraserows = rasops24_eraserows;
103 1.36 rin
104 1.37 rin if (FONT_IS_ALPHA(ri->ri_font)) {
105 1.37 rin ri->ri_ops.putchar = rasops24_putchar_aa;
106 1.37 rin return;
107 1.37 rin }
108 1.37 rin
109 1.1 ad switch (ri->ri_font->fontwidth) {
110 1.9 ad #ifndef RASOPS_SMALL
111 1.1 ad case 8:
112 1.4 ad ri->ri_ops.putchar = rasops24_putchar8;
113 1.1 ad break;
114 1.1 ad case 12:
115 1.4 ad ri->ri_ops.putchar = rasops24_putchar12;
116 1.1 ad break;
117 1.1 ad case 16:
118 1.4 ad ri->ri_ops.putchar = rasops24_putchar16;
119 1.1 ad break;
120 1.9 ad #endif
121 1.1 ad default:
122 1.4 ad ri->ri_ops.putchar = rasops24_putchar;
123 1.1 ad break;
124 1.1 ad }
125 1.1 ad }
126 1.1 ad
127 1.35 rin #define RASOPS_DEPTH 24
128 1.35 rin #include "rasops_putchar.h"
129 1.37 rin #include "rasops_putchar_aa.h"
130 1.1 ad
131 1.9 ad #ifndef RASOPS_SMALL
132 1.9 ad /*
133 1.9 ad * Recompute the blitting stamp.
134 1.9 ad */
135 1.9 ad static void
136 1.26 dsl rasops24_makestamp(struct rasops_info *ri, long attr)
137 1.9 ad {
138 1.36 rin uint32_t fg, bg, c1, c2, c3, c4;
139 1.9 ad int i;
140 1.12 pk
141 1.36 rin fg = ri->ri_devcmap[((uint32_t)attr >> 24) & 0xf] & 0xffffff;
142 1.36 rin bg = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
143 1.9 ad stamp_attr = attr;
144 1.12 pk
145 1.9 ad for (i = 0; i < 64; i += 4) {
146 1.9 ad #if BYTE_ORDER == LITTLE_ENDIAN
147 1.36 rin c1 = i & 32 ? fg : bg;
148 1.36 rin c2 = i & 16 ? fg : bg;
149 1.36 rin c3 = i & 8 ? fg : bg;
150 1.36 rin c4 = i & 4 ? fg : bg;
151 1.9 ad #else
152 1.36 rin c1 = i & 8 ? fg : bg;
153 1.36 rin c2 = i & 4 ? fg : bg;
154 1.36 rin c3 = i & 16 ? fg : bg;
155 1.36 rin c4 = i & 32 ? fg : bg;
156 1.9 ad #endif
157 1.36 rin stamp[i + 0] = (c1 << 8) | (c2 >> 16);
158 1.36 rin stamp[i + 1] = (c2 << 16) | (c3 >> 8);
159 1.36 rin stamp[i + 2] = (c3 << 24) | c4;
160 1.9 ad
161 1.9 ad #if BYTE_ORDER == LITTLE_ENDIAN
162 1.9 ad if ((ri->ri_flg & RI_BSWAP) == 0) {
163 1.9 ad #else
164 1.9 ad if ((ri->ri_flg & RI_BSWAP) != 0) {
165 1.9 ad #endif
166 1.36 rin stamp[i + 0] = bswap32(stamp[i + 0]);
167 1.36 rin stamp[i + 1] = bswap32(stamp[i + 1]);
168 1.36 rin stamp[i + 2] = bswap32(stamp[i + 2]);
169 1.9 ad }
170 1.9 ad }
171 1.9 ad }
172 1.1 ad
173 1.35 rin #define RASOPS_WIDTH 8
174 1.35 rin #include "rasops_putchar_width.h"
175 1.35 rin #undef RASOPS_WIDTH
176 1.35 rin
177 1.35 rin #define RASOPS_WIDTH 12
178 1.35 rin #include "rasops_putchar_width.h"
179 1.35 rin #undef RASOPS_WIDTH
180 1.35 rin
181 1.35 rin #define RASOPS_WIDTH 16
182 1.35 rin #include "rasops_putchar_width.h"
183 1.35 rin #undef RASOPS_WIDTH
184 1.12 pk
185 1.11 ad #endif /* !RASOPS_SMALL */
186 1.1 ad
187 1.1 ad /*
188 1.4 ad * Erase rows. This is nice and easy due to alignment.
189 1.1 ad */
190 1.1 ad static void
191 1.27 dsl rasops24_eraserows(void *cookie, int row, int num, long attr)
192 1.1 ad {
193 1.39 rin struct rasops_info *ri = (struct rasops_info *)cookie;
194 1.39 rin int n9, n3, n1, cnt, stride;
195 1.39 rin uint32_t *rp, *dp, *hp, clr, xstamp[3];
196 1.39 rin
197 1.39 rin hp = NULL; /* XXX GCC */
198 1.12 pk
199 1.12 pk /*
200 1.4 ad * If the color is gray, we can cheat and use the generic routines
201 1.4 ad * (which are faster, hopefully) since the r,g,b values are the same.
202 1.4 ad */
203 1.30 mlelstv if ((attr & WSATTR_PRIVATE2) != 0) {
204 1.4 ad rasops_eraserows(cookie, row, num, attr);
205 1.4 ad return;
206 1.4 ad }
207 1.4 ad
208 1.1 ad #ifdef RASOPS_CLIPPING
209 1.1 ad if (row < 0) {
210 1.1 ad num += row;
211 1.1 ad row = 0;
212 1.1 ad }
213 1.1 ad
214 1.39 rin if (row + num > ri->ri_rows)
215 1.1 ad num = ri->ri_rows - row;
216 1.12 pk
217 1.1 ad if (num <= 0)
218 1.1 ad return;
219 1.1 ad #endif
220 1.12 pk
221 1.36 rin clr = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
222 1.20 christos xstamp[0] = (clr << 8) | (clr >> 16);
223 1.20 christos xstamp[1] = (clr << 16) | (clr >> 8);
224 1.39 rin xstamp[2] = (clr << 24) | clr;
225 1.4 ad
226 1.4 ad #if BYTE_ORDER == LITTLE_ENDIAN
227 1.7 ad if ((ri->ri_flg & RI_BSWAP) == 0) {
228 1.4 ad #else
229 1.7 ad if ((ri->ri_flg & RI_BSWAP) != 0) {
230 1.4 ad #endif
231 1.20 christos xstamp[0] = bswap32(xstamp[0]);
232 1.20 christos xstamp[1] = bswap32(xstamp[1]);
233 1.20 christos xstamp[2] = bswap32(xstamp[2]);
234 1.4 ad }
235 1.4 ad
236 1.12 pk /*
237 1.7 ad * XXX the wsdisplay_emulops interface seems a little deficient in
238 1.12 pk * that there is no way to clear the *entire* screen. We provide a
239 1.12 pk * workaround here: if the entire console area is being cleared, and
240 1.7 ad * the RI_FULLCLEAR flag is set, clear the entire display.
241 1.12 pk */
242 1.7 ad if (num == ri->ri_rows && (ri->ri_flg & RI_FULLCLEAR) != 0) {
243 1.7 ad stride = ri->ri_stride;
244 1.7 ad num = ri->ri_height;
245 1.39 rin rp = (uint32_t *)ri->ri_origbits;
246 1.39 rin if (ri->ri_hwbits)
247 1.39 rin hp = (uint32_t *)ri->ri_hworigbits;
248 1.7 ad } else {
249 1.7 ad stride = ri->ri_emustride;
250 1.7 ad num *= ri->ri_font->fontheight;
251 1.39 rin rp = (uint32_t *)(ri->ri_bits + row * ri->ri_yscale);
252 1.39 rin if (ri->ri_hwbits)
253 1.39 rin hp = (uint32_t *)(ri->ri_hwbits + row * ri->ri_yscale);
254 1.7 ad }
255 1.7 ad
256 1.39 rin n9 = stride / (4 * 9);
257 1.39 rin cnt = n9 * (4 * 9);
258 1.39 rin n3 = (stride - cnt) / (4 * 3);
259 1.39 rin cnt += n3 * (4 * 3);
260 1.39 rin n1 = (stride - cnt) / 4;
261 1.12 pk
262 1.4 ad while (num--) {
263 1.39 rin dp = rp;
264 1.4 ad for (cnt = n9; cnt; cnt--) {
265 1.39 rin dp[0] = xstamp[0]; dp[1] = xstamp[1]; dp[2] = xstamp[2];
266 1.39 rin dp[3] = xstamp[0]; dp[4] = xstamp[1]; dp[5] = xstamp[2];
267 1.39 rin dp[6] = xstamp[0]; dp[7] = xstamp[1]; dp[8] = xstamp[2];
268 1.4 ad dp += 9;
269 1.4 ad }
270 1.1 ad
271 1.4 ad for (cnt = n3; cnt; cnt--) {
272 1.39 rin dp[0] = xstamp[0]; dp[1] = xstamp[1]; dp[2] = xstamp[2];
273 1.4 ad dp += 3;
274 1.4 ad }
275 1.12 pk
276 1.4 ad for (cnt = 0; cnt < n1; cnt++)
277 1.20 christos *dp++ = xstamp[cnt];
278 1.12 pk
279 1.39 rin if (ri->ri_hwbits) {
280 1.39 rin memcpy(hp, rp, stride);
281 1.39 rin DELTA(hp, ri->ri_stride, uint32_t *);
282 1.39 rin }
283 1.39 rin DELTA(rp, ri->ri_stride, uint32_t *);
284 1.4 ad }
285 1.4 ad }
286 1.4 ad
287 1.4 ad /*
288 1.4 ad * Erase columns.
289 1.4 ad */
290 1.4 ad static void
291 1.27 dsl rasops24_erasecols(void *cookie, int row, int col, int num, long attr)
292 1.4 ad {
293 1.39 rin struct rasops_info *ri = (struct rasops_info *)cookie;
294 1.39 rin int n12, n4, height, cnt, slop1, slop2, clr, xstamp[3];
295 1.39 rin uint32_t *dp;
296 1.39 rin uint8_t *rp, *hp, *dbp;
297 1.39 rin
298 1.39 rin hp = NULL; /* XXX GCC */
299 1.4 ad
300 1.12 pk /*
301 1.4 ad * If the color is gray, we can cheat and use the generic routines
302 1.4 ad * (which are faster, hopefully) since the r,g,b values are the same.
303 1.4 ad */
304 1.30 mlelstv if ((attr & WSATTR_PRIVATE2) != 0) {
305 1.4 ad rasops_erasecols(cookie, row, col, num, attr);
306 1.4 ad return;
307 1.4 ad }
308 1.12 pk
309 1.12 pk #ifdef RASOPS_CLIPPING
310 1.12 pk /* Catches 'row < 0' case too */
311 1.4 ad if ((unsigned)row >= (unsigned)ri->ri_rows)
312 1.4 ad return;
313 1.4 ad
314 1.4 ad if (col < 0) {
315 1.4 ad num += col;
316 1.4 ad col = 0;
317 1.4 ad }
318 1.4 ad
319 1.39 rin if (col + num > ri->ri_cols)
320 1.4 ad num = ri->ri_cols - col;
321 1.12 pk
322 1.4 ad if (num <= 0)
323 1.4 ad return;
324 1.4 ad #endif
325 1.12 pk
326 1.39 rin rp = ri->ri_bits + row * ri->ri_yscale + col * ri->ri_xscale;
327 1.39 rin if (ri->ri_hwbits)
328 1.39 rin hp = ri->ri_hwbits + row * ri->ri_yscale + col * ri->ri_xscale;
329 1.39 rin
330 1.4 ad num *= ri->ri_font->fontwidth;
331 1.4 ad height = ri->ri_font->fontheight;
332 1.4 ad
333 1.36 rin clr = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
334 1.20 christos xstamp[0] = (clr << 8) | (clr >> 16);
335 1.20 christos xstamp[1] = (clr << 16) | (clr >> 8);
336 1.39 rin xstamp[2] = (clr << 24) | clr;
337 1.4 ad
338 1.4 ad #if BYTE_ORDER == LITTLE_ENDIAN
339 1.7 ad if ((ri->ri_flg & RI_BSWAP) == 0) {
340 1.4 ad #else
341 1.7 ad if ((ri->ri_flg & RI_BSWAP) != 0) {
342 1.4 ad #endif
343 1.20 christos xstamp[0] = bswap32(xstamp[0]);
344 1.20 christos xstamp[1] = bswap32(xstamp[1]);
345 1.20 christos xstamp[2] = bswap32(xstamp[2]);
346 1.4 ad }
347 1.12 pk
348 1.12 pk /*
349 1.4 ad * The current byte offset mod 4 tells us the number of 24-bit pels
350 1.4 ad * we need to write for alignment to 32-bits. Once we're aligned on
351 1.4 ad * a 32-bit boundary, we're also aligned on a 4 pixel boundary, so
352 1.4 ad * the stamp does not need to be rotated. The following shows the
353 1.9 ad * layout of 4 pels in a 3 word region and illustrates this:
354 1.4 ad *
355 1.4 ad * aaab bbcc cddd
356 1.4 ad */
357 1.39 rin slop1 = (uintptr_t)rp & 3;
358 1.39 rin cnt = slop1;
359 1.39 rin n12 = (num - cnt) / 12;
360 1.39 rin cnt += n12 * 12;
361 1.39 rin n4 = (num - cnt) / 4;
362 1.39 rin cnt += n4 * 4;
363 1.39 rin slop2 = num - cnt;
364 1.12 pk
365 1.4 ad while (height--) {
366 1.39 rin dbp = rp;
367 1.4 ad
368 1.4 ad /* Align to 4 bytes */
369 1.7 ad /* XXX handle with masks, bring under control of RI_BSWAP */
370 1.39 rin for (cnt = slop1; cnt; cnt--) {
371 1.4 ad *dbp++ = (clr >> 16);
372 1.4 ad *dbp++ = (clr >> 8);
373 1.39 rin *dbp++ = clr;
374 1.12 pk }
375 1.4 ad
376 1.32 rin dp = (uint32_t *)dbp;
377 1.12 pk
378 1.4 ad /* 12 pels per loop */
379 1.4 ad for (cnt = n12; cnt; cnt--) {
380 1.39 rin dp[0] = xstamp[0]; dp[1] = xstamp[1]; dp[2] = xstamp[2];
381 1.39 rin dp[3] = xstamp[0]; dp[4] = xstamp[1]; dp[5] = xstamp[2];
382 1.39 rin dp[6] = xstamp[0]; dp[7] = xstamp[1]; dp[8] = xstamp[2];
383 1.4 ad dp += 9;
384 1.1 ad }
385 1.1 ad
386 1.4 ad /* 4 pels per loop */
387 1.4 ad for (cnt = n4; cnt; cnt--) {
388 1.39 rin dp[0] = xstamp[0]; dp[1] = xstamp[1]; dp[2] = xstamp[2];
389 1.4 ad dp += 3;
390 1.4 ad }
391 1.12 pk
392 1.4 ad /* Trailing slop */
393 1.7 ad /* XXX handle with masks, bring under control of RI_BSWAP */
394 1.31 rin dbp = (uint8_t *)dp;
395 1.39 rin for (cnt = slop2; cnt; cnt--) {
396 1.4 ad *dbp++ = (clr >> 16);
397 1.4 ad *dbp++ = (clr >> 8);
398 1.39 rin *dbp++ = clr;
399 1.39 rin }
400 1.39 rin
401 1.39 rin if (ri->ri_hwbits) {
402 1.39 rin memcpy(hp, rp, num * 3);
403 1.39 rin hp += ri->ri_stride;
404 1.12 pk }
405 1.39 rin rp += ri->ri_stride;
406 1.1 ad }
407 1.1 ad }
408