Home | History | Annotate | Line # | Download | only in rasops
rasops24.c revision 1.39
      1  1.39       rin /* 	$NetBSD: rasops24.c,v 1.39 2019/07/30 15:23:23 rin Exp $	*/
      2   1.1        ad 
      3   1.6        ad /*-
      4   1.6        ad  * Copyright (c) 1999 The NetBSD Foundation, Inc.
      5   1.1        ad  * All rights reserved.
      6   1.1        ad  *
      7   1.6        ad  * This code is derived from software contributed to The NetBSD Foundation
      8  1.13        ad  * by Andrew Doran.
      9   1.6        ad  *
     10   1.1        ad  * Redistribution and use in source and binary forms, with or without
     11   1.1        ad  * modification, are permitted provided that the following conditions
     12   1.1        ad  * are met:
     13   1.1        ad  * 1. Redistributions of source code must retain the above copyright
     14   1.1        ad  *    notice, this list of conditions and the following disclaimer.
     15   1.1        ad  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1        ad  *    notice, this list of conditions and the following disclaimer in the
     17   1.1        ad  *    documentation and/or other materials provided with the distribution.
     18   1.1        ad  *
     19   1.6        ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.6        ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.6        ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.6        ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.6        ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.6        ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.6        ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.6        ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.6        ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.6        ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.6        ad  * POSSIBILITY OF SUCH DAMAGE.
     30   1.1        ad  */
     31   1.2        ad 
     32  1.15     lukem #include <sys/cdefs.h>
     33  1.39       rin __KERNEL_RCSID(0, "$NetBSD: rasops24.c,v 1.39 2019/07/30 15:23:23 rin Exp $");
     34  1.15     lukem 
     35   1.1        ad #include "opt_rasops.h"
     36   1.1        ad 
     37   1.1        ad #include <sys/param.h>
     38   1.1        ad #include <sys/systm.h>
     39   1.1        ad #include <sys/time.h>
     40   1.1        ad 
     41   1.4        ad #include <machine/endian.h>
     42  1.22       dsl #include <sys/bswap.h>
     43   1.4        ad 
     44   1.1        ad #include <dev/wscons/wsdisplayvar.h>
     45   1.1        ad #include <dev/wscons/wsconsio.h>
     46   1.1        ad #include <dev/rasops/rasops.h>
     47   1.1        ad 
     48  1.18     perry static void 	rasops24_erasecols(void *, int, int, int, long);
     49  1.18     perry static void 	rasops24_eraserows(void *, int, int, long);
     50  1.36       rin static void 	rasops24_putchar(void *, int, int, u_int, long);
     51  1.37       rin static void 	rasops24_putchar_aa(void *, int, int, u_int, long);
     52   1.9        ad #ifndef RASOPS_SMALL
     53  1.36       rin static void 	rasops24_putchar8(void *, int, int, u_int, long);
     54  1.36       rin static void 	rasops24_putchar12(void *, int, int, u_int, long);
     55  1.36       rin static void 	rasops24_putchar16(void *, int, int, u_int, long);
     56  1.18     perry static void	rasops24_makestamp(struct rasops_info *, long);
     57   1.1        ad 
     58  1.12        pk /*
     59  1.12        pk  * 4x1 stamp for optimized character blitting
     60   1.4        ad  */
     61  1.32       rin static uint32_t	stamp[64];
     62   1.4        ad static long	stamp_attr;
     63   1.4        ad static int	stamp_mutex;	/* XXX see note in readme */
     64  1.29     njoly #endif
     65   1.4        ad 
     66   1.4        ad /*
     67   1.4        ad  * offset = STAMP_SHIFT(fontbits, nibble #) & STAMP_MASK
     68  1.32       rin  * destination uint32_t[0] = STAMP_READ(offset)
     69  1.32       rin  * destination uint32_t[1] = STAMP_READ(offset + 4)
     70  1.32       rin  * destination uint32_t[2] = STAMP_READ(offset + 8)
     71   1.4        ad  */
     72  1.36       rin #define	STAMP_SHIFT(fb, n)	((n) ? (fb) : (fb) << 4)
     73  1.36       rin #define	STAMP_MASK		(0xf << 4)
     74  1.36       rin #define	STAMP_READ(o)		(*(uint32_t *)((uint8_t *)stamp + (o)))
     75   1.4        ad 
     76   1.1        ad /*
     77  1.14       wiz  * Initialize rasops_info struct for this colordepth.
     78   1.1        ad  */
     79   1.1        ad void
     80  1.26       dsl rasops24_init(struct rasops_info *ri)
     81   1.1        ad {
     82   1.1        ad 
     83  1.38       rin #ifndef RASOPS_SMALL
     84  1.38       rin 	/*
     85  1.38       rin 	 * Different devcmap's are used depending on font widths,
     86  1.38       rin 	 * therefore we need reset stamp here.
     87  1.38       rin 	 */
     88  1.38       rin 	stamp_attr = 0;
     89  1.38       rin #endif
     90  1.38       rin 
     91  1.36       rin 	if (ri->ri_rnum == 0) {
     92  1.36       rin 		ri->ri_rnum = ri->ri_gnum = ri->ri_bnum = 8;
     93  1.36       rin 
     94  1.36       rin 		ri->ri_rpos = 0;
     95  1.36       rin 		ri->ri_gpos = 8;
     96  1.36       rin 		ri->ri_bpos = 16;
     97  1.36       rin 	}
     98  1.36       rin 
     99  1.36       rin 	ri->ri_ops.erasecols = rasops24_erasecols;
    100  1.36       rin 	ri->ri_ops.eraserows = rasops24_eraserows;
    101  1.36       rin 
    102  1.37       rin 	if (FONT_IS_ALPHA(ri->ri_font)) {
    103  1.37       rin 		ri->ri_ops.putchar = rasops24_putchar_aa;
    104  1.37       rin 		return;
    105  1.37       rin 	}
    106  1.37       rin 
    107   1.1        ad 	switch (ri->ri_font->fontwidth) {
    108   1.9        ad #ifndef RASOPS_SMALL
    109   1.1        ad 	case 8:
    110   1.4        ad 		ri->ri_ops.putchar = rasops24_putchar8;
    111   1.1        ad 		break;
    112   1.1        ad 	case 12:
    113   1.4        ad 		ri->ri_ops.putchar = rasops24_putchar12;
    114   1.1        ad 		break;
    115   1.1        ad 	case 16:
    116   1.4        ad 		ri->ri_ops.putchar = rasops24_putchar16;
    117   1.1        ad 		break;
    118   1.9        ad #endif
    119   1.1        ad 	default:
    120   1.4        ad 		ri->ri_ops.putchar = rasops24_putchar;
    121   1.1        ad 		break;
    122   1.1        ad 	}
    123   1.1        ad }
    124   1.1        ad 
    125  1.35       rin #define	RASOPS_DEPTH	24
    126  1.35       rin #include "rasops_putchar.h"
    127  1.37       rin #include "rasops_putchar_aa.h"
    128   1.1        ad 
    129   1.9        ad #ifndef RASOPS_SMALL
    130   1.9        ad /*
    131   1.9        ad  * Recompute the blitting stamp.
    132   1.9        ad  */
    133   1.9        ad static void
    134  1.26       dsl rasops24_makestamp(struct rasops_info *ri, long attr)
    135   1.9        ad {
    136  1.36       rin 	uint32_t fg, bg, c1, c2, c3, c4;
    137   1.9        ad 	int i;
    138  1.12        pk 
    139  1.36       rin 	fg = ri->ri_devcmap[((uint32_t)attr >> 24) & 0xf] & 0xffffff;
    140  1.36       rin 	bg = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
    141   1.9        ad 	stamp_attr = attr;
    142  1.12        pk 
    143   1.9        ad 	for (i = 0; i < 64; i += 4) {
    144   1.9        ad #if BYTE_ORDER == LITTLE_ENDIAN
    145  1.36       rin 		c1 = i & 32 ? fg : bg;
    146  1.36       rin 		c2 = i & 16 ? fg : bg;
    147  1.36       rin 		c3 = i &  8 ? fg : bg;
    148  1.36       rin 		c4 = i &  4 ? fg : bg;
    149   1.9        ad #else
    150  1.36       rin 		c1 = i &  8 ? fg : bg;
    151  1.36       rin 		c2 = i &  4 ? fg : bg;
    152  1.36       rin 		c3 = i & 16 ? fg : bg;
    153  1.36       rin 		c4 = i & 32 ? fg : bg;
    154   1.9        ad #endif
    155  1.36       rin 		stamp[i + 0] = (c1 <<  8) | (c2 >> 16);
    156  1.36       rin 		stamp[i + 1] = (c2 << 16) | (c3 >>  8);
    157  1.36       rin 		stamp[i + 2] = (c3 << 24) |  c4;
    158   1.9        ad 
    159   1.9        ad #if BYTE_ORDER == LITTLE_ENDIAN
    160   1.9        ad 		if ((ri->ri_flg & RI_BSWAP) == 0) {
    161   1.9        ad #else
    162   1.9        ad 		if ((ri->ri_flg & RI_BSWAP) != 0) {
    163   1.9        ad #endif
    164  1.36       rin 			stamp[i + 0] = bswap32(stamp[i + 0]);
    165  1.36       rin 			stamp[i + 1] = bswap32(stamp[i + 1]);
    166  1.36       rin 			stamp[i + 2] = bswap32(stamp[i + 2]);
    167   1.9        ad 		}
    168   1.9        ad 	}
    169   1.9        ad }
    170   1.1        ad 
    171  1.35       rin #define	RASOPS_WIDTH	8
    172  1.35       rin #include "rasops_putchar_width.h"
    173  1.35       rin #undef	RASOPS_WIDTH
    174  1.35       rin 
    175  1.35       rin #define	RASOPS_WIDTH	12
    176  1.35       rin #include "rasops_putchar_width.h"
    177  1.35       rin #undef	RASOPS_WIDTH
    178  1.35       rin 
    179  1.35       rin #define	RASOPS_WIDTH	16
    180  1.35       rin #include "rasops_putchar_width.h"
    181  1.35       rin #undef	RASOPS_WIDTH
    182  1.12        pk 
    183  1.11        ad #endif	/* !RASOPS_SMALL */
    184   1.1        ad 
    185   1.1        ad /*
    186   1.4        ad  * Erase rows. This is nice and easy due to alignment.
    187   1.1        ad  */
    188   1.1        ad static void
    189  1.27       dsl rasops24_eraserows(void *cookie, int row, int num, long attr)
    190   1.1        ad {
    191  1.39       rin 	struct rasops_info *ri = (struct rasops_info *)cookie;
    192  1.39       rin 	int n9, n3, n1, cnt, stride;
    193  1.39       rin 	uint32_t *rp, *dp, *hp, clr, xstamp[3];
    194  1.39       rin 
    195  1.39       rin 	hp = NULL;	/* XXX GCC */
    196  1.12        pk 
    197  1.12        pk 	/*
    198   1.4        ad 	 * If the color is gray, we can cheat and use the generic routines
    199   1.4        ad 	 * (which are faster, hopefully) since the r,g,b values are the same.
    200   1.4        ad 	 */
    201  1.30   mlelstv 	if ((attr & WSATTR_PRIVATE2) != 0) {
    202   1.4        ad 		rasops_eraserows(cookie, row, num, attr);
    203   1.4        ad 		return;
    204   1.4        ad 	}
    205   1.4        ad 
    206   1.1        ad #ifdef RASOPS_CLIPPING
    207   1.1        ad 	if (row < 0) {
    208   1.1        ad 		num += row;
    209   1.1        ad 		row = 0;
    210   1.1        ad 	}
    211   1.1        ad 
    212  1.39       rin 	if (row + num > ri->ri_rows)
    213   1.1        ad 		num = ri->ri_rows - row;
    214  1.12        pk 
    215   1.1        ad 	if (num <= 0)
    216   1.1        ad 		return;
    217   1.1        ad #endif
    218  1.12        pk 
    219  1.36       rin 	clr = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
    220  1.20  christos 	xstamp[0] = (clr <<  8) | (clr >> 16);
    221  1.20  christos 	xstamp[1] = (clr << 16) | (clr >>  8);
    222  1.39       rin 	xstamp[2] = (clr << 24) |  clr;
    223   1.4        ad 
    224   1.4        ad #if BYTE_ORDER == LITTLE_ENDIAN
    225   1.7        ad 	if ((ri->ri_flg & RI_BSWAP) == 0) {
    226   1.4        ad #else
    227   1.7        ad 	if ((ri->ri_flg & RI_BSWAP) != 0) {
    228   1.4        ad #endif
    229  1.20  christos 		xstamp[0] = bswap32(xstamp[0]);
    230  1.20  christos 		xstamp[1] = bswap32(xstamp[1]);
    231  1.20  christos 		xstamp[2] = bswap32(xstamp[2]);
    232   1.4        ad 	}
    233   1.4        ad 
    234  1.12        pk 	/*
    235   1.7        ad 	 * XXX the wsdisplay_emulops interface seems a little deficient in
    236  1.12        pk 	 * that there is no way to clear the *entire* screen. We provide a
    237  1.12        pk 	 * workaround here: if the entire console area is being cleared, and
    238   1.7        ad 	 * the RI_FULLCLEAR flag is set, clear the entire display.
    239  1.12        pk 	 */
    240   1.7        ad 	if (num == ri->ri_rows && (ri->ri_flg & RI_FULLCLEAR) != 0) {
    241   1.7        ad 		stride = ri->ri_stride;
    242   1.7        ad 		num = ri->ri_height;
    243  1.39       rin 		rp = (uint32_t *)ri->ri_origbits;
    244  1.39       rin 		if (ri->ri_hwbits)
    245  1.39       rin 			hp = (uint32_t *)ri->ri_hworigbits;
    246   1.7        ad 	} else {
    247   1.7        ad 		stride = ri->ri_emustride;
    248   1.7        ad 		num *= ri->ri_font->fontheight;
    249  1.39       rin 		rp = (uint32_t *)(ri->ri_bits + row * ri->ri_yscale);
    250  1.39       rin 		if (ri->ri_hwbits)
    251  1.39       rin 			hp = (uint32_t *)(ri->ri_hwbits + row * ri->ri_yscale);
    252   1.7        ad 	}
    253   1.7        ad 
    254  1.39       rin 	n9 = stride / (4 * 9);
    255  1.39       rin 	cnt = n9 * (4 * 9);
    256  1.39       rin 	n3 = (stride - cnt) / (4 * 3);
    257  1.39       rin 	cnt += n3 * (4 * 3);
    258  1.39       rin 	n1 = (stride - cnt) / 4;
    259  1.12        pk 
    260   1.4        ad 	while (num--) {
    261  1.39       rin 		dp = rp;
    262   1.4        ad 		for (cnt = n9; cnt; cnt--) {
    263  1.39       rin 			dp[0] = xstamp[0]; dp[1] = xstamp[1]; dp[2] = xstamp[2];
    264  1.39       rin 			dp[3] = xstamp[0]; dp[4] = xstamp[1]; dp[5] = xstamp[2];
    265  1.39       rin 			dp[6] = xstamp[0]; dp[7] = xstamp[1]; dp[8] = xstamp[2];
    266   1.4        ad 			dp += 9;
    267   1.4        ad 		}
    268   1.1        ad 
    269   1.4        ad 		for (cnt = n3; cnt; cnt--) {
    270  1.39       rin 			dp[0] = xstamp[0]; dp[1] = xstamp[1]; dp[2] = xstamp[2];
    271   1.4        ad 			dp += 3;
    272   1.4        ad 		}
    273  1.12        pk 
    274   1.4        ad 		for (cnt = 0; cnt < n1; cnt++)
    275  1.20  christos 			*dp++ = xstamp[cnt];
    276  1.12        pk 
    277  1.39       rin 		if (ri->ri_hwbits) {
    278  1.39       rin 			memcpy(hp, rp, stride);
    279  1.39       rin 			DELTA(hp, ri->ri_stride, uint32_t *);
    280  1.39       rin 		}
    281  1.39       rin 		DELTA(rp, ri->ri_stride, uint32_t *);
    282   1.4        ad 	}
    283   1.4        ad }
    284   1.4        ad 
    285   1.4        ad /*
    286   1.4        ad  * Erase columns.
    287   1.4        ad  */
    288   1.4        ad static void
    289  1.27       dsl rasops24_erasecols(void *cookie, int row, int col, int num, long attr)
    290   1.4        ad {
    291  1.39       rin 	struct rasops_info *ri = (struct rasops_info *)cookie;
    292  1.39       rin 	int n12, n4, height, cnt, slop1, slop2, clr, xstamp[3];
    293  1.39       rin 	uint32_t *dp;
    294  1.39       rin 	uint8_t *rp, *hp, *dbp;
    295  1.39       rin 
    296  1.39       rin 	hp = NULL;	/* XXX GCC */
    297   1.4        ad 
    298  1.12        pk 	/*
    299   1.4        ad 	 * If the color is gray, we can cheat and use the generic routines
    300   1.4        ad 	 * (which are faster, hopefully) since the r,g,b values are the same.
    301   1.4        ad 	 */
    302  1.30   mlelstv 	if ((attr & WSATTR_PRIVATE2) != 0) {
    303   1.4        ad 		rasops_erasecols(cookie, row, col, num, attr);
    304   1.4        ad 		return;
    305   1.4        ad 	}
    306  1.12        pk 
    307  1.12        pk #ifdef RASOPS_CLIPPING
    308  1.12        pk 	/* Catches 'row < 0' case too */
    309   1.4        ad 	if ((unsigned)row >= (unsigned)ri->ri_rows)
    310   1.4        ad 		return;
    311   1.4        ad 
    312   1.4        ad 	if (col < 0) {
    313   1.4        ad 		num += col;
    314   1.4        ad 		col = 0;
    315   1.4        ad 	}
    316   1.4        ad 
    317  1.39       rin 	if (col + num > ri->ri_cols)
    318   1.4        ad 		num = ri->ri_cols - col;
    319  1.12        pk 
    320   1.4        ad 	if (num <= 0)
    321   1.4        ad 		return;
    322   1.4        ad #endif
    323  1.12        pk 
    324  1.39       rin 	rp = ri->ri_bits + row * ri->ri_yscale + col * ri->ri_xscale;
    325  1.39       rin 	if (ri->ri_hwbits)
    326  1.39       rin 		hp = ri->ri_hwbits + row * ri->ri_yscale + col * ri->ri_xscale;
    327  1.39       rin 
    328   1.4        ad 	num *= ri->ri_font->fontwidth;
    329   1.4        ad 	height = ri->ri_font->fontheight;
    330   1.4        ad 
    331  1.36       rin 	clr = ri->ri_devcmap[((uint32_t)attr >> 16) & 0xf] & 0xffffff;
    332  1.20  christos 	xstamp[0] = (clr <<  8) | (clr >> 16);
    333  1.20  christos 	xstamp[1] = (clr << 16) | (clr >>  8);
    334  1.39       rin 	xstamp[2] = (clr << 24) |  clr;
    335   1.4        ad 
    336   1.4        ad #if BYTE_ORDER == LITTLE_ENDIAN
    337   1.7        ad 	if ((ri->ri_flg & RI_BSWAP) == 0) {
    338   1.4        ad #else
    339   1.7        ad 	if ((ri->ri_flg & RI_BSWAP) != 0) {
    340   1.4        ad #endif
    341  1.20  christos 		xstamp[0] = bswap32(xstamp[0]);
    342  1.20  christos 		xstamp[1] = bswap32(xstamp[1]);
    343  1.20  christos 		xstamp[2] = bswap32(xstamp[2]);
    344   1.4        ad 	}
    345  1.12        pk 
    346  1.12        pk 	/*
    347   1.4        ad 	 * The current byte offset mod 4 tells us the number of 24-bit pels
    348   1.4        ad 	 * we need to write for alignment to 32-bits. Once we're aligned on
    349   1.4        ad 	 * a 32-bit boundary, we're also aligned on a 4 pixel boundary, so
    350   1.4        ad 	 * the stamp does not need to be rotated. The following shows the
    351   1.9        ad 	 * layout of 4 pels in a 3 word region and illustrates this:
    352   1.4        ad 	 *
    353   1.4        ad 	 *	aaab bbcc cddd
    354   1.4        ad 	 */
    355  1.39       rin 	slop1 = (uintptr_t)rp & 3;
    356  1.39       rin 	cnt = slop1;
    357  1.39       rin 	n12 = (num - cnt) / 12;
    358  1.39       rin 	cnt += n12 * 12;
    359  1.39       rin 	n4 = (num - cnt) / 4;
    360  1.39       rin 	cnt += n4 * 4;
    361  1.39       rin 	slop2 = num - cnt;
    362  1.12        pk 
    363   1.4        ad 	while (height--) {
    364  1.39       rin 		dbp = rp;
    365   1.4        ad 
    366   1.4        ad 		/* Align to 4 bytes */
    367   1.7        ad 		/* XXX handle with masks, bring under control of RI_BSWAP */
    368  1.39       rin 		for (cnt = slop1; cnt; cnt--) {
    369   1.4        ad 			*dbp++ = (clr >> 16);
    370   1.4        ad 			*dbp++ = (clr >> 8);
    371  1.39       rin 			*dbp++ =  clr;
    372  1.12        pk 		}
    373   1.4        ad 
    374  1.32       rin 		dp = (uint32_t *)dbp;
    375  1.12        pk 
    376   1.4        ad 		/* 12 pels per loop */
    377   1.4        ad 		for (cnt = n12; cnt; cnt--) {
    378  1.39       rin 			dp[0] = xstamp[0]; dp[1] = xstamp[1]; dp[2] = xstamp[2];
    379  1.39       rin 			dp[3] = xstamp[0]; dp[4] = xstamp[1]; dp[5] = xstamp[2];
    380  1.39       rin 			dp[6] = xstamp[0]; dp[7] = xstamp[1]; dp[8] = xstamp[2];
    381   1.4        ad 			dp += 9;
    382   1.1        ad 		}
    383   1.1        ad 
    384   1.4        ad 		/* 4 pels per loop */
    385   1.4        ad 		for (cnt = n4; cnt; cnt--) {
    386  1.39       rin 			dp[0] = xstamp[0]; dp[1] = xstamp[1]; dp[2] = xstamp[2];
    387   1.4        ad 			dp += 3;
    388   1.4        ad 		}
    389  1.12        pk 
    390   1.4        ad 		/* Trailing slop */
    391   1.7        ad 		/* XXX handle with masks, bring under control of RI_BSWAP */
    392  1.31       rin 		dbp = (uint8_t *)dp;
    393  1.39       rin 		for (cnt = slop2; cnt; cnt--) {
    394   1.4        ad 			*dbp++ = (clr >> 16);
    395   1.4        ad 			*dbp++ = (clr >> 8);
    396  1.39       rin 			*dbp++ =  clr;
    397  1.39       rin 		}
    398  1.39       rin 
    399  1.39       rin 		if (ri->ri_hwbits) {
    400  1.39       rin 			memcpy(hp, rp, num * 3);
    401  1.39       rin 			hp += ri->ri_stride;
    402  1.12        pk 		}
    403  1.39       rin 		rp += ri->ri_stride;
    404   1.1        ad 	}
    405   1.1        ad }
    406