if_le_ioasic.c revision 1.35 1 1.35 rin /* $NetBSD: if_le_ioasic.c,v 1.35 2022/05/29 10:43:46 rin Exp $ */
2 1.1 cgd
3 1.1 cgd /*
4 1.1 cgd * Copyright (c) 1996 Carnegie-Mellon University.
5 1.1 cgd * All rights reserved.
6 1.1 cgd *
7 1.1 cgd * Author: Chris G. Demetriou
8 1.1 cgd *
9 1.1 cgd * Permission to use, copy, modify and distribute this software and
10 1.1 cgd * its documentation is hereby granted, provided that both the copyright
11 1.1 cgd * notice and this permission notice appear in all copies of the
12 1.1 cgd * software, derivative works or modified versions, and any portions
13 1.1 cgd * thereof, and that both notices appear in supporting documentation.
14 1.1 cgd *
15 1.1 cgd * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
16 1.1 cgd * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
17 1.1 cgd * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
18 1.1 cgd *
19 1.1 cgd * Carnegie Mellon requests users of this software to return to
20 1.1 cgd *
21 1.1 cgd * Software Distribution Coordinator or Software.Distribution (at) CS.CMU.EDU
22 1.1 cgd * School of Computer Science
23 1.1 cgd * Carnegie Mellon University
24 1.1 cgd * Pittsburgh PA 15213-3890
25 1.1 cgd *
26 1.1 cgd * any improvements or extensions that they make and grant Carnegie the
27 1.1 cgd * rights to redistribute these changes.
28 1.1 cgd */
29 1.1 cgd
30 1.1 cgd /*
31 1.1 cgd * LANCE on DEC IOCTL ASIC.
32 1.1 cgd */
33 1.9 jonathan
34 1.18 lukem #include <sys/cdefs.h>
35 1.35 rin __KERNEL_RCSID(0, "$NetBSD: if_le_ioasic.c,v 1.35 2022/05/29 10:43:46 rin Exp $");
36 1.11 jonathan
37 1.11 jonathan #include "opt_inet.h"
38 1.1 cgd
39 1.1 cgd #include <sys/param.h>
40 1.1 cgd #include <sys/systm.h>
41 1.1 cgd #include <sys/mbuf.h>
42 1.1 cgd #include <sys/syslog.h>
43 1.1 cgd #include <sys/socket.h>
44 1.1 cgd #include <sys/device.h>
45 1.1 cgd
46 1.1 cgd #include <net/if.h>
47 1.5 cgd #include <net/if_ether.h>
48 1.6 thorpej #include <net/if_media.h>
49 1.1 cgd
50 1.1 cgd #ifdef INET
51 1.1 cgd #include <netinet/in.h>
52 1.4 is #include <netinet/if_inarp.h>
53 1.1 cgd #endif
54 1.1 cgd
55 1.12 drochner #include <dev/ic/lancereg.h>
56 1.12 drochner #include <dev/ic/lancevar.h>
57 1.1 cgd #include <dev/ic/am7990reg.h>
58 1.1 cgd #include <dev/ic/am7990var.h>
59 1.1 cgd
60 1.2 thorpej #include <dev/tc/if_levar.h>
61 1.1 cgd #include <dev/tc/tcvar.h>
62 1.13 nisimura #include <dev/tc/ioasicreg.h>
63 1.1 cgd #include <dev/tc/ioasicvar.h>
64 1.1 cgd
65 1.16 nisimura struct le_ioasic_softc {
66 1.16 nisimura struct am7990_softc sc_am7990; /* glue to MI code */
67 1.16 nisimura struct lereg1 *sc_r1; /* LANCE registers */
68 1.16 nisimura /* XXX must match with le_softc of if_levar.h XXX */
69 1.12 drochner
70 1.16 nisimura bus_dma_tag_t sc_dmat; /* bus dma tag */
71 1.16 nisimura bus_dmamap_t sc_dmamap; /* bus dmamap */
72 1.16 nisimura };
73 1.13 nisimura
74 1.30 tsutsui static int le_ioasic_match(device_t, cfdata_t, void *);
75 1.30 tsutsui static void le_ioasic_attach(device_t, device_t, void *);
76 1.13 nisimura
77 1.30 tsutsui CFATTACH_DECL_NEW(le_ioasic, sizeof(struct le_softc),
78 1.21 thorpej le_ioasic_match, le_ioasic_attach, NULL, NULL);
79 1.13 nisimura
80 1.22 perry static void le_ioasic_copytobuf_gap2(struct lance_softc *, void *, int, int);
81 1.22 perry static void le_ioasic_copyfrombuf_gap2(struct lance_softc *, void *, int, int);
82 1.22 perry static void le_ioasic_copytobuf_gap16(struct lance_softc *, void *, int, int);
83 1.22 perry static void le_ioasic_copyfrombuf_gap16(struct lance_softc *, void *,
84 1.22 perry int, int);
85 1.22 perry static void le_ioasic_zerobuf_gap16(struct lance_softc *, int, int);
86 1.2 thorpej
87 1.16 nisimura static int
88 1.30 tsutsui le_ioasic_match(device_t parent, cfdata_t cf, void *aux)
89 1.1 cgd {
90 1.1 cgd struct ioasicdev_attach_args *d = aux;
91 1.1 cgd
92 1.16 nisimura if (strncmp("PMAD-BA ", d->iada_modname, TC_ROM_LLEN) != 0)
93 1.16 nisimura return 0;
94 1.1 cgd
95 1.16 nisimura return 1;
96 1.1 cgd }
97 1.1 cgd
98 1.16 nisimura /* IOASIC LANCE DMA needs 128KB boundary aligned 128KB chunk */
99 1.30 tsutsui #define LE_IOASIC_MEMSIZE (128 * 1024)
100 1.30 tsutsui #define LE_IOASIC_MEMALIGN (128 * 1024)
101 1.16 nisimura
102 1.16 nisimura static void
103 1.30 tsutsui le_ioasic_attach(device_t parent, device_t self, void *aux)
104 1.1 cgd {
105 1.25 thorpej struct le_ioasic_softc *sc = device_private(self);
106 1.1 cgd struct ioasicdev_attach_args *d = aux;
107 1.16 nisimura struct lance_softc *le = &sc->sc_am7990.lsc;
108 1.26 thorpej struct ioasic_softc *iosc = device_private(parent);
109 1.16 nisimura bus_space_tag_t ioasic_bst;
110 1.16 nisimura bus_space_handle_t ioasic_bsh;
111 1.16 nisimura bus_dma_tag_t dmat;
112 1.16 nisimura bus_dma_segment_t seg;
113 1.16 nisimura tc_addr_t tca;
114 1.30 tsutsui uint32_t ssr;
115 1.16 nisimura int rseg;
116 1.28 christos void *le_iomem;
117 1.1 cgd
118 1.30 tsutsui le->sc_dev = self;
119 1.26 thorpej ioasic_bst = iosc->sc_bst;
120 1.26 thorpej ioasic_bsh = iosc->sc_bsh;
121 1.26 thorpej dmat = sc->sc_dmat = iosc->sc_dmat;
122 1.16 nisimura /*
123 1.16 nisimura * Allocate a DMA area for the chip.
124 1.16 nisimura */
125 1.16 nisimura if (bus_dmamem_alloc(dmat, LE_IOASIC_MEMSIZE, LE_IOASIC_MEMALIGN,
126 1.16 nisimura 0, &seg, 1, &rseg, BUS_DMA_NOWAIT)) {
127 1.30 tsutsui aprint_error(": can't allocate DMA area for LANCE\n");
128 1.16 nisimura return;
129 1.16 nisimura }
130 1.16 nisimura if (bus_dmamem_map(dmat, &seg, rseg, LE_IOASIC_MEMSIZE,
131 1.16 nisimura &le_iomem, BUS_DMA_NOWAIT|BUS_DMA_COHERENT)) {
132 1.30 tsutsui aprint_error(": can't map DMA area for LANCE\n");
133 1.35 rin goto bad_free;
134 1.13 nisimura }
135 1.16 nisimura /*
136 1.16 nisimura * Create and load the DMA map for the DMA area.
137 1.16 nisimura */
138 1.16 nisimura if (bus_dmamap_create(dmat, LE_IOASIC_MEMSIZE, 1,
139 1.16 nisimura LE_IOASIC_MEMSIZE, 0, BUS_DMA_NOWAIT, &sc->sc_dmamap)) {
140 1.30 tsutsui aprint_error(": can't create DMA map\n");
141 1.35 rin goto bad_unmap;
142 1.16 nisimura }
143 1.16 nisimura if (bus_dmamap_load(dmat, sc->sc_dmamap,
144 1.16 nisimura le_iomem, LE_IOASIC_MEMSIZE, NULL, BUS_DMA_NOWAIT)) {
145 1.30 tsutsui aprint_error(": can't load DMA map\n");
146 1.35 rin goto bad_destroy;
147 1.16 nisimura }
148 1.16 nisimura /*
149 1.16 nisimura * Bind 128KB buffer with IOASIC DMA.
150 1.16 nisimura */
151 1.17 thorpej tca = IOASIC_DMA_ADDR(sc->sc_dmamap->dm_segs[0].ds_addr);
152 1.16 nisimura bus_space_write_4(ioasic_bst, ioasic_bsh, IOASIC_LANCE_DMAPTR, tca);
153 1.16 nisimura ssr = bus_space_read_4(ioasic_bst, ioasic_bsh, IOASIC_CSR);
154 1.16 nisimura ssr |= IOASIC_CSR_DMAEN_LANCE;
155 1.16 nisimura bus_space_write_4(ioasic_bst, ioasic_bsh, IOASIC_CSR, ssr);
156 1.13 nisimura
157 1.16 nisimura sc->sc_r1 = (struct lereg1 *)
158 1.1 cgd TC_DENSE_TO_SPARSE(TC_PHYS_TO_UNCACHED(d->iada_addr));
159 1.16 nisimura le->sc_mem = (void *)TC_PHYS_TO_UNCACHED(le_iomem);
160 1.16 nisimura le->sc_copytodesc = le_ioasic_copytobuf_gap2;
161 1.16 nisimura le->sc_copyfromdesc = le_ioasic_copyfrombuf_gap2;
162 1.16 nisimura le->sc_copytobuf = le_ioasic_copytobuf_gap16;
163 1.16 nisimura le->sc_copyfrombuf = le_ioasic_copyfrombuf_gap16;
164 1.16 nisimura le->sc_zerobuf = le_ioasic_zerobuf_gap16;
165 1.16 nisimura
166 1.16 nisimura dec_le_common_attach(&sc->sc_am7990,
167 1.30 tsutsui (uint8_t *)iosc->sc_base + IOASIC_SLOT_2_START);
168 1.1 cgd
169 1.2 thorpej ioasic_intr_establish(parent, d->iada_cookie, TC_IPL_NET,
170 1.2 thorpej am7990_intr, sc);
171 1.16 nisimura return;
172 1.16 nisimura
173 1.35 rin bad_destroy:
174 1.35 rin bus_dmamap_destroy(dmat, sc->sc_dmamap);
175 1.35 rin bad_unmap:
176 1.16 nisimura bus_dmamem_unmap(dmat, le_iomem, LE_IOASIC_MEMSIZE);
177 1.35 rin bad_free:
178 1.16 nisimura bus_dmamem_free(dmat, &seg, rseg);
179 1.2 thorpej }
180 1.2 thorpej
181 1.2 thorpej /*
182 1.2 thorpej * Special memory access functions needed by ioasic-attached LANCE
183 1.2 thorpej * chips.
184 1.2 thorpej */
185 1.2 thorpej
186 1.2 thorpej /*
187 1.2 thorpej * gap2: two bytes of data followed by two bytes of pad.
188 1.2 thorpej *
189 1.2 thorpej * Buffers must be 4-byte aligned. The code doesn't worry about
190 1.2 thorpej * doing an extra byte.
191 1.2 thorpej */
192 1.2 thorpej
193 1.2 thorpej void
194 1.27 thorpej le_ioasic_copytobuf_gap2(struct lance_softc *sc, void *fromv, int boff, int len)
195 1.2 thorpej {
196 1.28 christos volatile void *buf = sc->sc_mem;
197 1.30 tsutsui uint8_t *from = fromv;
198 1.30 tsutsui volatile uint16_t *bptr;
199 1.2 thorpej
200 1.2 thorpej if (boff & 0x1) {
201 1.2 thorpej /* handle unaligned first byte */
202 1.30 tsutsui bptr = ((volatile uint16_t *)buf) + (boff - 1);
203 1.2 thorpej *bptr = (*from++ << 8) | (*bptr & 0xff);
204 1.23 perry bptr += 2;
205 1.2 thorpej len--;
206 1.2 thorpej } else
207 1.30 tsutsui bptr = ((volatile uint16_t *)buf) + boff;
208 1.2 thorpej while (len > 1) {
209 1.2 thorpej *bptr = (from[1] << 8) | (from[0] & 0xff);
210 1.2 thorpej bptr += 2;
211 1.2 thorpej from += 2;
212 1.2 thorpej len -= 2;
213 1.2 thorpej }
214 1.2 thorpej if (len == 1)
215 1.30 tsutsui *bptr = (uint16_t)*from;
216 1.2 thorpej }
217 1.2 thorpej
218 1.2 thorpej void
219 1.27 thorpej le_ioasic_copyfrombuf_gap2(struct lance_softc *sc, void *tov, int boff, int len)
220 1.2 thorpej {
221 1.28 christos volatile void *buf = sc->sc_mem;
222 1.30 tsutsui uint8_t *to = tov;
223 1.30 tsutsui volatile uint16_t *bptr;
224 1.30 tsutsui uint16_t tmp;
225 1.2 thorpej
226 1.2 thorpej if (boff & 0x1) {
227 1.2 thorpej /* handle unaligned first byte */
228 1.30 tsutsui bptr = ((volatile uint16_t *)buf) + (boff - 1);
229 1.2 thorpej *to++ = (*bptr >> 8) & 0xff;
230 1.2 thorpej bptr += 2;
231 1.2 thorpej len--;
232 1.2 thorpej } else
233 1.30 tsutsui bptr = ((volatile uint16_t *)buf) + boff;
234 1.2 thorpej while (len > 1) {
235 1.2 thorpej tmp = *bptr;
236 1.2 thorpej *to++ = tmp & 0xff;
237 1.2 thorpej *to++ = (tmp >> 8) & 0xff;
238 1.2 thorpej bptr += 2;
239 1.2 thorpej len -= 2;
240 1.2 thorpej }
241 1.2 thorpej if (len == 1)
242 1.2 thorpej *to = *bptr & 0xff;
243 1.2 thorpej }
244 1.2 thorpej
245 1.2 thorpej /*
246 1.2 thorpej * gap16: 16 bytes of data followed by 16 bytes of pad.
247 1.2 thorpej *
248 1.2 thorpej * Buffers must be 32-byte aligned.
249 1.2 thorpej */
250 1.2 thorpej
251 1.2 thorpej void
252 1.27 thorpej le_ioasic_copytobuf_gap16(struct lance_softc *sc, void *fromv, int boff,
253 1.27 thorpej int len)
254 1.2 thorpej {
255 1.30 tsutsui uint8_t *buf = sc->sc_mem;
256 1.30 tsutsui uint8_t *from = fromv;
257 1.30 tsutsui uint8_t *bptr;
258 1.2 thorpej
259 1.2 thorpej bptr = buf + ((boff << 1) & ~0x1f);
260 1.2 thorpej boff &= 0xf;
261 1.8 jonathan
262 1.8 jonathan /*
263 1.8 jonathan * Dispose of boff so destination of subsequent copies is
264 1.8 jonathan * 16-byte aligned.
265 1.8 jonathan */
266 1.8 jonathan if (boff) {
267 1.15 augustss int xfer;
268 1.34 riastrad xfer = uimin(len, 16 - boff);
269 1.33 tsutsui memcpy(bptr + boff, from, xfer);
270 1.2 thorpej from += xfer;
271 1.2 thorpej bptr += 32;
272 1.2 thorpej len -= xfer;
273 1.2 thorpej }
274 1.8 jonathan
275 1.8 jonathan /* Destination of copies is now 16-byte aligned. */
276 1.8 jonathan if (len >= 16)
277 1.30 tsutsui switch ((u_long)from & (sizeof(uint32_t) -1)) {
278 1.8 jonathan case 2:
279 1.8 jonathan /* Ethernet headers make this the dominant case. */
280 1.8 jonathan do {
281 1.30 tsutsui uint32_t *dst = (uint32_t *)bptr;
282 1.30 tsutsui uint16_t t0;
283 1.30 tsutsui uint32_t t1, t2, t3, t4;
284 1.8 jonathan
285 1.8 jonathan /* read from odd-16-bit-aligned, cached src */
286 1.30 tsutsui t0 = *(uint16_t *)(from + 0);
287 1.30 tsutsui t1 = *(uint32_t *)(from + 2);
288 1.30 tsutsui t2 = *(uint32_t *)(from + 6);
289 1.30 tsutsui t3 = *(uint32_t *)(from + 10);
290 1.30 tsutsui t4 = *(uint16_t *)(from + 14);
291 1.8 jonathan
292 1.8 jonathan /* DMA buffer is uncached on mips */
293 1.8 jonathan dst[0] = t0 | (t1 << 16);
294 1.8 jonathan dst[1] = (t1 >> 16) | (t2 << 16);
295 1.8 jonathan dst[2] = (t2 >> 16) | (t3 << 16);
296 1.8 jonathan dst[3] = (t3 >> 16) | (t4 << 16);
297 1.8 jonathan
298 1.8 jonathan from += 16;
299 1.8 jonathan bptr += 32;
300 1.8 jonathan len -= 16;
301 1.8 jonathan } while (len >= 16);
302 1.8 jonathan break;
303 1.8 jonathan
304 1.8 jonathan case 0:
305 1.8 jonathan do {
306 1.30 tsutsui uint32_t *src = (uint32_t*)from;
307 1.30 tsutsui uint32_t *dst = (uint32_t*)bptr;
308 1.30 tsutsui uint32_t t0, t1, t2, t3;
309 1.8 jonathan
310 1.8 jonathan t0 = src[0]; t1 = src[1]; t2 = src[2]; t3 = src[3];
311 1.8 jonathan dst[0] = t0; dst[1] = t1; dst[2] = t2; dst[3] = t3;
312 1.8 jonathan
313 1.8 jonathan from += 16;
314 1.8 jonathan bptr += 32;
315 1.8 jonathan len -= 16;
316 1.8 jonathan } while (len >= 16);
317 1.8 jonathan break;
318 1.8 jonathan
319 1.23 perry default:
320 1.8 jonathan /* Does odd-aligned case ever happen? */
321 1.8 jonathan do {
322 1.33 tsutsui memcpy(bptr, from, 16);
323 1.8 jonathan from += 16;
324 1.8 jonathan bptr += 32;
325 1.8 jonathan len -= 16;
326 1.8 jonathan } while (len >= 16);
327 1.8 jonathan break;
328 1.8 jonathan }
329 1.8 jonathan if (len)
330 1.33 tsutsui memcpy(bptr, from, len);
331 1.2 thorpej }
332 1.2 thorpej
333 1.2 thorpej void
334 1.27 thorpej le_ioasic_copyfrombuf_gap16(struct lance_softc *sc, void *tov, int boff,
335 1.27 thorpej int len)
336 1.2 thorpej {
337 1.30 tsutsui uint8_t *buf = sc->sc_mem;
338 1.30 tsutsui uint8_t *to = tov;
339 1.30 tsutsui uint8_t *bptr;
340 1.2 thorpej
341 1.2 thorpej bptr = buf + ((boff << 1) & ~0x1f);
342 1.2 thorpej boff &= 0xf;
343 1.8 jonathan
344 1.8 jonathan /* Dispose of boff. source of copy is subsequently 16-byte aligned. */
345 1.8 jonathan if (boff) {
346 1.15 augustss int xfer;
347 1.34 riastrad xfer = uimin(len, 16 - boff);
348 1.33 tsutsui memcpy(to, bptr + boff, xfer);
349 1.2 thorpej to += xfer;
350 1.2 thorpej bptr += 32;
351 1.2 thorpej len -= xfer;
352 1.2 thorpej }
353 1.8 jonathan if (len >= 16)
354 1.30 tsutsui switch ((u_long)to & (sizeof(uint32_t) -1)) {
355 1.8 jonathan case 2:
356 1.8 jonathan /*
357 1.8 jonathan * to is aligned to an odd 16-bit boundary. Ethernet headers
358 1.8 jonathan * make this the dominant case (98% or more).
359 1.8 jonathan */
360 1.8 jonathan do {
361 1.30 tsutsui uint32_t *src = (uint32_t *)bptr;
362 1.30 tsutsui uint32_t t0, t1, t2, t3;
363 1.8 jonathan
364 1.8 jonathan /* read from uncached aligned DMA buf */
365 1.8 jonathan t0 = src[0]; t1 = src[1]; t2 = src[2]; t3 = src[3];
366 1.8 jonathan
367 1.8 jonathan /* write to odd-16-bit-word aligned dst */
368 1.30 tsutsui *(uint16_t *)(to + 0) = (uint16_t)t0;
369 1.30 tsutsui *(uint32_t *)(to + 2) = (t0 >> 16) | (t1 << 16);
370 1.30 tsutsui *(uint32_t *)(to + 6) = (t1 >> 16) | (t2 << 16);
371 1.30 tsutsui *(uint32_t *)(to + 10) = (t2 >> 16) | (t3 << 16);
372 1.30 tsutsui *(uint16_t *)(to + 14) = (t3 >> 16);
373 1.8 jonathan bptr += 32;
374 1.8 jonathan to += 16;
375 1.8 jonathan len -= 16;
376 1.8 jonathan } while (len > 16);
377 1.8 jonathan break;
378 1.8 jonathan case 0:
379 1.8 jonathan /* 32-bit aligned aligned copy. Rare. */
380 1.8 jonathan do {
381 1.30 tsutsui uint32_t *src = (uint32_t *)bptr;
382 1.30 tsutsui uint32_t *dst = (uint32_t *)to;
383 1.30 tsutsui uint32_t t0, t1, t2, t3;
384 1.8 jonathan
385 1.8 jonathan t0 = src[0]; t1 = src[1]; t2 = src[2]; t3 = src[3];
386 1.8 jonathan dst[0] = t0; dst[1] = t1; dst[2] = t2; dst[3] = t3;
387 1.8 jonathan to += 16;
388 1.8 jonathan bptr += 32;
389 1.8 jonathan len -= 16;
390 1.8 jonathan } while (len > 16);
391 1.8 jonathan break;
392 1.8 jonathan
393 1.8 jonathan /* XXX Does odd-byte-aligned case ever happen? */
394 1.8 jonathan default:
395 1.8 jonathan do {
396 1.33 tsutsui memcpy(to, bptr, 16);
397 1.8 jonathan to += 16;
398 1.8 jonathan bptr += 32;
399 1.8 jonathan len -= 16;
400 1.8 jonathan } while (len > 16);
401 1.8 jonathan break;
402 1.8 jonathan }
403 1.8 jonathan if (len)
404 1.33 tsutsui memcpy(to, bptr, len);
405 1.2 thorpej }
406 1.2 thorpej
407 1.2 thorpej void
408 1.27 thorpej le_ioasic_zerobuf_gap16(struct lance_softc *sc, int boff, int len)
409 1.2 thorpej {
410 1.30 tsutsui uint8_t *buf = sc->sc_mem;
411 1.30 tsutsui uint8_t *bptr;
412 1.15 augustss int xfer;
413 1.2 thorpej
414 1.2 thorpej bptr = buf + ((boff << 1) & ~0x1f);
415 1.2 thorpej boff &= 0xf;
416 1.34 riastrad xfer = uimin(len, 16 - boff);
417 1.2 thorpej while (len > 0) {
418 1.31 cegger memset(bptr + boff, 0, xfer);
419 1.2 thorpej bptr += 32;
420 1.2 thorpej boff = 0;
421 1.2 thorpej len -= xfer;
422 1.34 riastrad xfer = uimin(len, 16);
423 1.2 thorpej }
424 1.1 cgd }
425