1 1.35 rin /* $NetBSD: if_le_ioasic.c,v 1.35 2022/05/29 10:43:46 rin Exp $ */ 2 1.1 cgd 3 1.1 cgd /* 4 1.1 cgd * Copyright (c) 1996 Carnegie-Mellon University. 5 1.1 cgd * All rights reserved. 6 1.1 cgd * 7 1.1 cgd * Author: Chris G. Demetriou 8 1.1 cgd * 9 1.1 cgd * Permission to use, copy, modify and distribute this software and 10 1.1 cgd * its documentation is hereby granted, provided that both the copyright 11 1.1 cgd * notice and this permission notice appear in all copies of the 12 1.1 cgd * software, derivative works or modified versions, and any portions 13 1.1 cgd * thereof, and that both notices appear in supporting documentation. 14 1.1 cgd * 15 1.1 cgd * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS" 16 1.1 cgd * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND 17 1.1 cgd * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE. 18 1.1 cgd * 19 1.1 cgd * Carnegie Mellon requests users of this software to return to 20 1.1 cgd * 21 1.1 cgd * Software Distribution Coordinator or Software.Distribution (at) CS.CMU.EDU 22 1.1 cgd * School of Computer Science 23 1.1 cgd * Carnegie Mellon University 24 1.1 cgd * Pittsburgh PA 15213-3890 25 1.1 cgd * 26 1.1 cgd * any improvements or extensions that they make and grant Carnegie the 27 1.1 cgd * rights to redistribute these changes. 28 1.1 cgd */ 29 1.1 cgd 30 1.1 cgd /* 31 1.1 cgd * LANCE on DEC IOCTL ASIC. 32 1.1 cgd */ 33 1.9 jonathan 34 1.18 lukem #include <sys/cdefs.h> 35 1.35 rin __KERNEL_RCSID(0, "$NetBSD: if_le_ioasic.c,v 1.35 2022/05/29 10:43:46 rin Exp $"); 36 1.11 jonathan 37 1.11 jonathan #include "opt_inet.h" 38 1.1 cgd 39 1.1 cgd #include <sys/param.h> 40 1.1 cgd #include <sys/systm.h> 41 1.1 cgd #include <sys/mbuf.h> 42 1.1 cgd #include <sys/syslog.h> 43 1.1 cgd #include <sys/socket.h> 44 1.1 cgd #include <sys/device.h> 45 1.1 cgd 46 1.1 cgd #include <net/if.h> 47 1.5 cgd #include <net/if_ether.h> 48 1.6 thorpej #include <net/if_media.h> 49 1.1 cgd 50 1.1 cgd #ifdef INET 51 1.1 cgd #include <netinet/in.h> 52 1.4 is #include <netinet/if_inarp.h> 53 1.1 cgd #endif 54 1.1 cgd 55 1.12 drochner #include <dev/ic/lancereg.h> 56 1.12 drochner #include <dev/ic/lancevar.h> 57 1.1 cgd #include <dev/ic/am7990reg.h> 58 1.1 cgd #include <dev/ic/am7990var.h> 59 1.1 cgd 60 1.2 thorpej #include <dev/tc/if_levar.h> 61 1.1 cgd #include <dev/tc/tcvar.h> 62 1.13 nisimura #include <dev/tc/ioasicreg.h> 63 1.1 cgd #include <dev/tc/ioasicvar.h> 64 1.1 cgd 65 1.16 nisimura struct le_ioasic_softc { 66 1.16 nisimura struct am7990_softc sc_am7990; /* glue to MI code */ 67 1.16 nisimura struct lereg1 *sc_r1; /* LANCE registers */ 68 1.16 nisimura /* XXX must match with le_softc of if_levar.h XXX */ 69 1.12 drochner 70 1.16 nisimura bus_dma_tag_t sc_dmat; /* bus dma tag */ 71 1.16 nisimura bus_dmamap_t sc_dmamap; /* bus dmamap */ 72 1.16 nisimura }; 73 1.13 nisimura 74 1.30 tsutsui static int le_ioasic_match(device_t, cfdata_t, void *); 75 1.30 tsutsui static void le_ioasic_attach(device_t, device_t, void *); 76 1.13 nisimura 77 1.30 tsutsui CFATTACH_DECL_NEW(le_ioasic, sizeof(struct le_softc), 78 1.21 thorpej le_ioasic_match, le_ioasic_attach, NULL, NULL); 79 1.13 nisimura 80 1.22 perry static void le_ioasic_copytobuf_gap2(struct lance_softc *, void *, int, int); 81 1.22 perry static void le_ioasic_copyfrombuf_gap2(struct lance_softc *, void *, int, int); 82 1.22 perry static void le_ioasic_copytobuf_gap16(struct lance_softc *, void *, int, int); 83 1.22 perry static void le_ioasic_copyfrombuf_gap16(struct lance_softc *, void *, 84 1.22 perry int, int); 85 1.22 perry static void le_ioasic_zerobuf_gap16(struct lance_softc *, int, int); 86 1.2 thorpej 87 1.16 nisimura static int 88 1.30 tsutsui le_ioasic_match(device_t parent, cfdata_t cf, void *aux) 89 1.1 cgd { 90 1.1 cgd struct ioasicdev_attach_args *d = aux; 91 1.1 cgd 92 1.16 nisimura if (strncmp("PMAD-BA ", d->iada_modname, TC_ROM_LLEN) != 0) 93 1.16 nisimura return 0; 94 1.1 cgd 95 1.16 nisimura return 1; 96 1.1 cgd } 97 1.1 cgd 98 1.16 nisimura /* IOASIC LANCE DMA needs 128KB boundary aligned 128KB chunk */ 99 1.30 tsutsui #define LE_IOASIC_MEMSIZE (128 * 1024) 100 1.30 tsutsui #define LE_IOASIC_MEMALIGN (128 * 1024) 101 1.16 nisimura 102 1.16 nisimura static void 103 1.30 tsutsui le_ioasic_attach(device_t parent, device_t self, void *aux) 104 1.1 cgd { 105 1.25 thorpej struct le_ioasic_softc *sc = device_private(self); 106 1.1 cgd struct ioasicdev_attach_args *d = aux; 107 1.16 nisimura struct lance_softc *le = &sc->sc_am7990.lsc; 108 1.26 thorpej struct ioasic_softc *iosc = device_private(parent); 109 1.16 nisimura bus_space_tag_t ioasic_bst; 110 1.16 nisimura bus_space_handle_t ioasic_bsh; 111 1.16 nisimura bus_dma_tag_t dmat; 112 1.16 nisimura bus_dma_segment_t seg; 113 1.16 nisimura tc_addr_t tca; 114 1.30 tsutsui uint32_t ssr; 115 1.16 nisimura int rseg; 116 1.28 christos void *le_iomem; 117 1.1 cgd 118 1.30 tsutsui le->sc_dev = self; 119 1.26 thorpej ioasic_bst = iosc->sc_bst; 120 1.26 thorpej ioasic_bsh = iosc->sc_bsh; 121 1.26 thorpej dmat = sc->sc_dmat = iosc->sc_dmat; 122 1.16 nisimura /* 123 1.16 nisimura * Allocate a DMA area for the chip. 124 1.16 nisimura */ 125 1.16 nisimura if (bus_dmamem_alloc(dmat, LE_IOASIC_MEMSIZE, LE_IOASIC_MEMALIGN, 126 1.16 nisimura 0, &seg, 1, &rseg, BUS_DMA_NOWAIT)) { 127 1.30 tsutsui aprint_error(": can't allocate DMA area for LANCE\n"); 128 1.16 nisimura return; 129 1.16 nisimura } 130 1.16 nisimura if (bus_dmamem_map(dmat, &seg, rseg, LE_IOASIC_MEMSIZE, 131 1.16 nisimura &le_iomem, BUS_DMA_NOWAIT|BUS_DMA_COHERENT)) { 132 1.30 tsutsui aprint_error(": can't map DMA area for LANCE\n"); 133 1.35 rin goto bad_free; 134 1.13 nisimura } 135 1.16 nisimura /* 136 1.16 nisimura * Create and load the DMA map for the DMA area. 137 1.16 nisimura */ 138 1.16 nisimura if (bus_dmamap_create(dmat, LE_IOASIC_MEMSIZE, 1, 139 1.16 nisimura LE_IOASIC_MEMSIZE, 0, BUS_DMA_NOWAIT, &sc->sc_dmamap)) { 140 1.30 tsutsui aprint_error(": can't create DMA map\n"); 141 1.35 rin goto bad_unmap; 142 1.16 nisimura } 143 1.16 nisimura if (bus_dmamap_load(dmat, sc->sc_dmamap, 144 1.16 nisimura le_iomem, LE_IOASIC_MEMSIZE, NULL, BUS_DMA_NOWAIT)) { 145 1.30 tsutsui aprint_error(": can't load DMA map\n"); 146 1.35 rin goto bad_destroy; 147 1.16 nisimura } 148 1.16 nisimura /* 149 1.16 nisimura * Bind 128KB buffer with IOASIC DMA. 150 1.16 nisimura */ 151 1.17 thorpej tca = IOASIC_DMA_ADDR(sc->sc_dmamap->dm_segs[0].ds_addr); 152 1.16 nisimura bus_space_write_4(ioasic_bst, ioasic_bsh, IOASIC_LANCE_DMAPTR, tca); 153 1.16 nisimura ssr = bus_space_read_4(ioasic_bst, ioasic_bsh, IOASIC_CSR); 154 1.16 nisimura ssr |= IOASIC_CSR_DMAEN_LANCE; 155 1.16 nisimura bus_space_write_4(ioasic_bst, ioasic_bsh, IOASIC_CSR, ssr); 156 1.13 nisimura 157 1.16 nisimura sc->sc_r1 = (struct lereg1 *) 158 1.1 cgd TC_DENSE_TO_SPARSE(TC_PHYS_TO_UNCACHED(d->iada_addr)); 159 1.16 nisimura le->sc_mem = (void *)TC_PHYS_TO_UNCACHED(le_iomem); 160 1.16 nisimura le->sc_copytodesc = le_ioasic_copytobuf_gap2; 161 1.16 nisimura le->sc_copyfromdesc = le_ioasic_copyfrombuf_gap2; 162 1.16 nisimura le->sc_copytobuf = le_ioasic_copytobuf_gap16; 163 1.16 nisimura le->sc_copyfrombuf = le_ioasic_copyfrombuf_gap16; 164 1.16 nisimura le->sc_zerobuf = le_ioasic_zerobuf_gap16; 165 1.16 nisimura 166 1.16 nisimura dec_le_common_attach(&sc->sc_am7990, 167 1.30 tsutsui (uint8_t *)iosc->sc_base + IOASIC_SLOT_2_START); 168 1.1 cgd 169 1.2 thorpej ioasic_intr_establish(parent, d->iada_cookie, TC_IPL_NET, 170 1.2 thorpej am7990_intr, sc); 171 1.16 nisimura return; 172 1.16 nisimura 173 1.35 rin bad_destroy: 174 1.35 rin bus_dmamap_destroy(dmat, sc->sc_dmamap); 175 1.35 rin bad_unmap: 176 1.16 nisimura bus_dmamem_unmap(dmat, le_iomem, LE_IOASIC_MEMSIZE); 177 1.35 rin bad_free: 178 1.16 nisimura bus_dmamem_free(dmat, &seg, rseg); 179 1.2 thorpej } 180 1.2 thorpej 181 1.2 thorpej /* 182 1.2 thorpej * Special memory access functions needed by ioasic-attached LANCE 183 1.2 thorpej * chips. 184 1.2 thorpej */ 185 1.2 thorpej 186 1.2 thorpej /* 187 1.2 thorpej * gap2: two bytes of data followed by two bytes of pad. 188 1.2 thorpej * 189 1.2 thorpej * Buffers must be 4-byte aligned. The code doesn't worry about 190 1.2 thorpej * doing an extra byte. 191 1.2 thorpej */ 192 1.2 thorpej 193 1.2 thorpej void 194 1.27 thorpej le_ioasic_copytobuf_gap2(struct lance_softc *sc, void *fromv, int boff, int len) 195 1.2 thorpej { 196 1.28 christos volatile void *buf = sc->sc_mem; 197 1.30 tsutsui uint8_t *from = fromv; 198 1.30 tsutsui volatile uint16_t *bptr; 199 1.2 thorpej 200 1.2 thorpej if (boff & 0x1) { 201 1.2 thorpej /* handle unaligned first byte */ 202 1.30 tsutsui bptr = ((volatile uint16_t *)buf) + (boff - 1); 203 1.2 thorpej *bptr = (*from++ << 8) | (*bptr & 0xff); 204 1.23 perry bptr += 2; 205 1.2 thorpej len--; 206 1.2 thorpej } else 207 1.30 tsutsui bptr = ((volatile uint16_t *)buf) + boff; 208 1.2 thorpej while (len > 1) { 209 1.2 thorpej *bptr = (from[1] << 8) | (from[0] & 0xff); 210 1.2 thorpej bptr += 2; 211 1.2 thorpej from += 2; 212 1.2 thorpej len -= 2; 213 1.2 thorpej } 214 1.2 thorpej if (len == 1) 215 1.30 tsutsui *bptr = (uint16_t)*from; 216 1.2 thorpej } 217 1.2 thorpej 218 1.2 thorpej void 219 1.27 thorpej le_ioasic_copyfrombuf_gap2(struct lance_softc *sc, void *tov, int boff, int len) 220 1.2 thorpej { 221 1.28 christos volatile void *buf = sc->sc_mem; 222 1.30 tsutsui uint8_t *to = tov; 223 1.30 tsutsui volatile uint16_t *bptr; 224 1.30 tsutsui uint16_t tmp; 225 1.2 thorpej 226 1.2 thorpej if (boff & 0x1) { 227 1.2 thorpej /* handle unaligned first byte */ 228 1.30 tsutsui bptr = ((volatile uint16_t *)buf) + (boff - 1); 229 1.2 thorpej *to++ = (*bptr >> 8) & 0xff; 230 1.2 thorpej bptr += 2; 231 1.2 thorpej len--; 232 1.2 thorpej } else 233 1.30 tsutsui bptr = ((volatile uint16_t *)buf) + boff; 234 1.2 thorpej while (len > 1) { 235 1.2 thorpej tmp = *bptr; 236 1.2 thorpej *to++ = tmp & 0xff; 237 1.2 thorpej *to++ = (tmp >> 8) & 0xff; 238 1.2 thorpej bptr += 2; 239 1.2 thorpej len -= 2; 240 1.2 thorpej } 241 1.2 thorpej if (len == 1) 242 1.2 thorpej *to = *bptr & 0xff; 243 1.2 thorpej } 244 1.2 thorpej 245 1.2 thorpej /* 246 1.2 thorpej * gap16: 16 bytes of data followed by 16 bytes of pad. 247 1.2 thorpej * 248 1.2 thorpej * Buffers must be 32-byte aligned. 249 1.2 thorpej */ 250 1.2 thorpej 251 1.2 thorpej void 252 1.27 thorpej le_ioasic_copytobuf_gap16(struct lance_softc *sc, void *fromv, int boff, 253 1.27 thorpej int len) 254 1.2 thorpej { 255 1.30 tsutsui uint8_t *buf = sc->sc_mem; 256 1.30 tsutsui uint8_t *from = fromv; 257 1.30 tsutsui uint8_t *bptr; 258 1.2 thorpej 259 1.2 thorpej bptr = buf + ((boff << 1) & ~0x1f); 260 1.2 thorpej boff &= 0xf; 261 1.8 jonathan 262 1.8 jonathan /* 263 1.8 jonathan * Dispose of boff so destination of subsequent copies is 264 1.8 jonathan * 16-byte aligned. 265 1.8 jonathan */ 266 1.8 jonathan if (boff) { 267 1.15 augustss int xfer; 268 1.34 riastrad xfer = uimin(len, 16 - boff); 269 1.33 tsutsui memcpy(bptr + boff, from, xfer); 270 1.2 thorpej from += xfer; 271 1.2 thorpej bptr += 32; 272 1.2 thorpej len -= xfer; 273 1.2 thorpej } 274 1.8 jonathan 275 1.8 jonathan /* Destination of copies is now 16-byte aligned. */ 276 1.8 jonathan if (len >= 16) 277 1.30 tsutsui switch ((u_long)from & (sizeof(uint32_t) -1)) { 278 1.8 jonathan case 2: 279 1.8 jonathan /* Ethernet headers make this the dominant case. */ 280 1.8 jonathan do { 281 1.30 tsutsui uint32_t *dst = (uint32_t *)bptr; 282 1.30 tsutsui uint16_t t0; 283 1.30 tsutsui uint32_t t1, t2, t3, t4; 284 1.8 jonathan 285 1.8 jonathan /* read from odd-16-bit-aligned, cached src */ 286 1.30 tsutsui t0 = *(uint16_t *)(from + 0); 287 1.30 tsutsui t1 = *(uint32_t *)(from + 2); 288 1.30 tsutsui t2 = *(uint32_t *)(from + 6); 289 1.30 tsutsui t3 = *(uint32_t *)(from + 10); 290 1.30 tsutsui t4 = *(uint16_t *)(from + 14); 291 1.8 jonathan 292 1.8 jonathan /* DMA buffer is uncached on mips */ 293 1.8 jonathan dst[0] = t0 | (t1 << 16); 294 1.8 jonathan dst[1] = (t1 >> 16) | (t2 << 16); 295 1.8 jonathan dst[2] = (t2 >> 16) | (t3 << 16); 296 1.8 jonathan dst[3] = (t3 >> 16) | (t4 << 16); 297 1.8 jonathan 298 1.8 jonathan from += 16; 299 1.8 jonathan bptr += 32; 300 1.8 jonathan len -= 16; 301 1.8 jonathan } while (len >= 16); 302 1.8 jonathan break; 303 1.8 jonathan 304 1.8 jonathan case 0: 305 1.8 jonathan do { 306 1.30 tsutsui uint32_t *src = (uint32_t*)from; 307 1.30 tsutsui uint32_t *dst = (uint32_t*)bptr; 308 1.30 tsutsui uint32_t t0, t1, t2, t3; 309 1.8 jonathan 310 1.8 jonathan t0 = src[0]; t1 = src[1]; t2 = src[2]; t3 = src[3]; 311 1.8 jonathan dst[0] = t0; dst[1] = t1; dst[2] = t2; dst[3] = t3; 312 1.8 jonathan 313 1.8 jonathan from += 16; 314 1.8 jonathan bptr += 32; 315 1.8 jonathan len -= 16; 316 1.8 jonathan } while (len >= 16); 317 1.8 jonathan break; 318 1.8 jonathan 319 1.23 perry default: 320 1.8 jonathan /* Does odd-aligned case ever happen? */ 321 1.8 jonathan do { 322 1.33 tsutsui memcpy(bptr, from, 16); 323 1.8 jonathan from += 16; 324 1.8 jonathan bptr += 32; 325 1.8 jonathan len -= 16; 326 1.8 jonathan } while (len >= 16); 327 1.8 jonathan break; 328 1.8 jonathan } 329 1.8 jonathan if (len) 330 1.33 tsutsui memcpy(bptr, from, len); 331 1.2 thorpej } 332 1.2 thorpej 333 1.2 thorpej void 334 1.27 thorpej le_ioasic_copyfrombuf_gap16(struct lance_softc *sc, void *tov, int boff, 335 1.27 thorpej int len) 336 1.2 thorpej { 337 1.30 tsutsui uint8_t *buf = sc->sc_mem; 338 1.30 tsutsui uint8_t *to = tov; 339 1.30 tsutsui uint8_t *bptr; 340 1.2 thorpej 341 1.2 thorpej bptr = buf + ((boff << 1) & ~0x1f); 342 1.2 thorpej boff &= 0xf; 343 1.8 jonathan 344 1.8 jonathan /* Dispose of boff. source of copy is subsequently 16-byte aligned. */ 345 1.8 jonathan if (boff) { 346 1.15 augustss int xfer; 347 1.34 riastrad xfer = uimin(len, 16 - boff); 348 1.33 tsutsui memcpy(to, bptr + boff, xfer); 349 1.2 thorpej to += xfer; 350 1.2 thorpej bptr += 32; 351 1.2 thorpej len -= xfer; 352 1.2 thorpej } 353 1.8 jonathan if (len >= 16) 354 1.30 tsutsui switch ((u_long)to & (sizeof(uint32_t) -1)) { 355 1.8 jonathan case 2: 356 1.8 jonathan /* 357 1.8 jonathan * to is aligned to an odd 16-bit boundary. Ethernet headers 358 1.8 jonathan * make this the dominant case (98% or more). 359 1.8 jonathan */ 360 1.8 jonathan do { 361 1.30 tsutsui uint32_t *src = (uint32_t *)bptr; 362 1.30 tsutsui uint32_t t0, t1, t2, t3; 363 1.8 jonathan 364 1.8 jonathan /* read from uncached aligned DMA buf */ 365 1.8 jonathan t0 = src[0]; t1 = src[1]; t2 = src[2]; t3 = src[3]; 366 1.8 jonathan 367 1.8 jonathan /* write to odd-16-bit-word aligned dst */ 368 1.30 tsutsui *(uint16_t *)(to + 0) = (uint16_t)t0; 369 1.30 tsutsui *(uint32_t *)(to + 2) = (t0 >> 16) | (t1 << 16); 370 1.30 tsutsui *(uint32_t *)(to + 6) = (t1 >> 16) | (t2 << 16); 371 1.30 tsutsui *(uint32_t *)(to + 10) = (t2 >> 16) | (t3 << 16); 372 1.30 tsutsui *(uint16_t *)(to + 14) = (t3 >> 16); 373 1.8 jonathan bptr += 32; 374 1.8 jonathan to += 16; 375 1.8 jonathan len -= 16; 376 1.8 jonathan } while (len > 16); 377 1.8 jonathan break; 378 1.8 jonathan case 0: 379 1.8 jonathan /* 32-bit aligned aligned copy. Rare. */ 380 1.8 jonathan do { 381 1.30 tsutsui uint32_t *src = (uint32_t *)bptr; 382 1.30 tsutsui uint32_t *dst = (uint32_t *)to; 383 1.30 tsutsui uint32_t t0, t1, t2, t3; 384 1.8 jonathan 385 1.8 jonathan t0 = src[0]; t1 = src[1]; t2 = src[2]; t3 = src[3]; 386 1.8 jonathan dst[0] = t0; dst[1] = t1; dst[2] = t2; dst[3] = t3; 387 1.8 jonathan to += 16; 388 1.8 jonathan bptr += 32; 389 1.8 jonathan len -= 16; 390 1.8 jonathan } while (len > 16); 391 1.8 jonathan break; 392 1.8 jonathan 393 1.8 jonathan /* XXX Does odd-byte-aligned case ever happen? */ 394 1.8 jonathan default: 395 1.8 jonathan do { 396 1.33 tsutsui memcpy(to, bptr, 16); 397 1.8 jonathan to += 16; 398 1.8 jonathan bptr += 32; 399 1.8 jonathan len -= 16; 400 1.8 jonathan } while (len > 16); 401 1.8 jonathan break; 402 1.8 jonathan } 403 1.8 jonathan if (len) 404 1.33 tsutsui memcpy(to, bptr, len); 405 1.2 thorpej } 406 1.2 thorpej 407 1.2 thorpej void 408 1.27 thorpej le_ioasic_zerobuf_gap16(struct lance_softc *sc, int boff, int len) 409 1.2 thorpej { 410 1.30 tsutsui uint8_t *buf = sc->sc_mem; 411 1.30 tsutsui uint8_t *bptr; 412 1.15 augustss int xfer; 413 1.2 thorpej 414 1.2 thorpej bptr = buf + ((boff << 1) & ~0x1f); 415 1.2 thorpej boff &= 0xf; 416 1.34 riastrad xfer = uimin(len, 16 - boff); 417 1.2 thorpej while (len > 0) { 418 1.31 cegger memset(bptr + boff, 0, xfer); 419 1.2 thorpej bptr += 32; 420 1.2 thorpej boff = 0; 421 1.2 thorpej len -= xfer; 422 1.34 riastrad xfer = uimin(len, 16); 423 1.2 thorpej } 424 1.1 cgd } 425