Home | History | Annotate | Line # | Download | only in dev
mm.c revision 1.15.6.1
      1  1.15.6.1       mrg /*	$NetBSD: mm.c,v 1.15.6.1 2012/02/24 09:11:41 mrg Exp $	*/
      2       1.1  christos 
      3       1.1  christos /*-
      4      1.14     rmind  * Copyright (c) 2002, 2008, 2010 The NetBSD Foundation, Inc.
      5       1.1  christos  * All rights reserved.
      6       1.1  christos  *
      7       1.1  christos  * This code is derived from software contributed to The NetBSD Foundation
      8      1.14     rmind  * by Christos Zoulas, Joerg Sonnenberger and Mindaugas Rasiukevicius.
      9       1.1  christos  *
     10       1.1  christos  * Redistribution and use in source and binary forms, with or without
     11       1.1  christos  * modification, are permitted provided that the following conditions
     12       1.1  christos  * are met:
     13       1.1  christos  * 1. Redistributions of source code must retain the above copyright
     14       1.1  christos  *    notice, this list of conditions and the following disclaimer.
     15       1.1  christos  * 2. Redistributions in binary form must reproduce the above copyright
     16       1.1  christos  *    notice, this list of conditions and the following disclaimer in the
     17       1.1  christos  *    documentation and/or other materials provided with the distribution.
     18       1.1  christos  *
     19       1.1  christos  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20       1.1  christos  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21       1.1  christos  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22       1.1  christos  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23       1.1  christos  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24       1.1  christos  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25       1.1  christos  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26       1.1  christos  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27       1.1  christos  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28       1.1  christos  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29       1.1  christos  * POSSIBILITY OF SUCH DAMAGE.
     30       1.1  christos  */
     31       1.1  christos 
     32      1.14     rmind /*
     33      1.14     rmind  * Special /dev/{mem,kmem,zero,null} memory devices.
     34      1.14     rmind  */
     35       1.1  christos 
     36       1.1  christos #include <sys/cdefs.h>
     37  1.15.6.1       mrg __KERNEL_RCSID(0, "$NetBSD: mm.c,v 1.15.6.1 2012/02/24 09:11:41 mrg Exp $");
     38       1.1  christos 
     39      1.14     rmind #include "opt_compat_netbsd.h"
     40       1.1  christos 
     41       1.1  christos #include <sys/param.h>
     42       1.1  christos #include <sys/conf.h>
     43      1.14     rmind #include <sys/ioctl.h>
     44      1.14     rmind #include <sys/mman.h>
     45       1.1  christos #include <sys/uio.h>
     46      1.13     oster #include <sys/termios.h>
     47       1.2   gehenna 
     48      1.14     rmind #include <dev/mm.h>
     49      1.14     rmind 
     50      1.14     rmind #include <uvm/uvm_extern.h>
     51      1.14     rmind 
     52      1.14     rmind static void *		dev_zero_page	__read_mostly;
     53      1.14     rmind static kmutex_t		dev_mem_lock	__cacheline_aligned;
     54      1.14     rmind static vaddr_t		dev_mem_addr	__read_mostly;
     55      1.14     rmind 
     56      1.14     rmind static dev_type_read(mm_readwrite);
     57      1.14     rmind static dev_type_ioctl(mm_ioctl);
     58      1.14     rmind static dev_type_mmap(mm_mmap);
     59      1.14     rmind static dev_type_ioctl(mm_ioctl);
     60      1.14     rmind 
     61      1.14     rmind const struct cdevsw mem_cdevsw = {
     62      1.14     rmind #ifdef __HAVE_MM_MD_OPEN
     63      1.14     rmind 	mm_md_open,
     64      1.14     rmind #else
     65      1.14     rmind 	nullopen,
     66      1.14     rmind #endif
     67      1.14     rmind 	nullclose, mm_readwrite, mm_readwrite,
     68      1.14     rmind 	mm_ioctl, nostop, notty, nopoll, mm_mmap, nokqfilter,
     69      1.14     rmind 	D_MPSAFE
     70      1.14     rmind };
     71      1.14     rmind 
#ifdef pmax	/* XXX */
/*
 * Second device switch, built only for pmax.  It always uses nullopen,
 * even when a machine-dependent open hook exists.
 */
const struct cdevsw mem_ultrix_cdevsw = {
	nullopen,
	nullclose,
	mm_readwrite,
	mm_readwrite,
	mm_ioctl,
	nostop,
	notty,
	nopoll,
	mm_mmap,
	nokqfilter,
	D_MPSAFE
};
#endif
     78      1.14     rmind 
     79      1.14     rmind /*
     80      1.14     rmind  * mm_init: initialize memory device driver.
     81      1.14     rmind  */
     82      1.14     rmind void
     83      1.14     rmind mm_init(void)
     84      1.14     rmind {
     85      1.14     rmind 	vaddr_t pg;
     86      1.14     rmind 
     87      1.14     rmind 	mutex_init(&dev_mem_lock, MUTEX_DEFAULT, IPL_NONE);
     88      1.14     rmind 
     89      1.14     rmind 	/* Read-only zero-page. */
     90      1.14     rmind 	pg = uvm_km_alloc(kernel_map, PAGE_SIZE, 0, UVM_KMF_WIRED|UVM_KMF_ZERO);
     91      1.14     rmind 	KASSERT(pg != 0);
     92      1.14     rmind 	pmap_protect(pmap_kernel(), pg, pg + PAGE_SIZE, VM_PROT_READ);
     93      1.14     rmind 	pmap_update(pmap_kernel());
     94      1.14     rmind 	dev_zero_page = (void *)pg;
     95      1.14     rmind 
     96      1.14     rmind #ifndef __HAVE_MM_MD_CACHE_ALIASING
     97      1.14     rmind 	/* KVA for mappings during I/O. */
     98      1.14     rmind 	dev_mem_addr = uvm_km_alloc(kernel_map, PAGE_SIZE, 0,
     99      1.14     rmind 	    UVM_KMF_VAONLY|UVM_KMF_WAITVA);
    100      1.14     rmind 	KASSERT(dev_mem_addr != 0);
    101      1.14     rmind #else
    102      1.14     rmind 	dev_mem_addr = 0;
    103      1.14     rmind #endif
    104      1.14     rmind }
    105      1.14     rmind 
    106      1.14     rmind 
    107      1.14     rmind /*
    108      1.14     rmind  * dev_mem_getva: get a special virtual address.  If architecture requires,
    109      1.14     rmind  * allocate VA according to PA, which avoids cache-aliasing issues.  Use a
    110      1.14     rmind  * constant, general mapping address otherwise.
    111      1.14     rmind  */
    112      1.14     rmind static inline vaddr_t
    113      1.14     rmind dev_mem_getva(paddr_t pa)
    114      1.14     rmind {
    115      1.14     rmind #ifdef __HAVE_MM_MD_CACHE_ALIASING
    116      1.14     rmind 	const vsize_t coloroff = trunc_page(pa) & ptoa(uvmexp.colormask);
    117      1.14     rmind 	const vaddr_t kva = uvm_km_alloc(kernel_map, PAGE_SIZE + coloroff,
    118      1.14     rmind 	    ptoa(uvmexp.ncolors), UVM_KMF_VAONLY | UVM_KMF_WAITVA);
    119      1.14     rmind 
    120      1.14     rmind 	return kva + coloroff;
    121      1.14     rmind #else
    122      1.14     rmind 	return dev_mem_addr;
    123      1.14     rmind #endif
    124      1.14     rmind }
    125      1.14     rmind 
    126      1.14     rmind static inline void
    127      1.14     rmind dev_mem_relva(paddr_t pa, vaddr_t va)
    128      1.14     rmind {
    129      1.14     rmind #ifdef __HAVE_MM_MD_CACHE_ALIASING
    130      1.14     rmind 	const vsize_t coloroff = trunc_page(pa) & ptoa(uvmexp.colormask);
    131      1.14     rmind 	const vaddr_t origva = va - coloroff;
    132      1.14     rmind 
    133      1.14     rmind 	uvm_km_free(kernel_map, origva, PAGE_SIZE + coloroff, UVM_KMF_VAONLY);
    134      1.14     rmind #else
    135      1.14     rmind 	KASSERT(dev_mem_addr == va);
    136      1.14     rmind #endif
    137      1.14     rmind }
    138      1.14     rmind 
    139      1.14     rmind /*
    140      1.14     rmind  * dev_kmem_readwrite: helper for DEV_MEM (/dev/mem) case of R/W.
    141      1.14     rmind  */
    142      1.14     rmind static int
    143      1.14     rmind dev_mem_readwrite(struct uio *uio, struct iovec *iov)
    144      1.14     rmind {
    145      1.14     rmind 	paddr_t paddr;
    146      1.14     rmind 	vaddr_t vaddr;
    147      1.14     rmind 	vm_prot_t prot;
    148      1.14     rmind 	size_t len, offset;
    149      1.14     rmind 	bool have_direct;
    150      1.14     rmind 	int error;
    151      1.14     rmind 
    152      1.14     rmind 	/* Check for wrap around. */
    153      1.14     rmind 	if ((intptr_t)uio->uio_offset != uio->uio_offset) {
    154      1.14     rmind 		return EFAULT;
    155      1.14     rmind 	}
    156      1.14     rmind 	paddr = uio->uio_offset & ~PAGE_MASK;
    157      1.14     rmind 	prot = (uio->uio_rw == UIO_WRITE) ? VM_PROT_WRITE : VM_PROT_READ;
    158      1.14     rmind 	error = mm_md_physacc(paddr, prot);
    159      1.14     rmind 	if (error) {
    160      1.14     rmind 		return error;
    161      1.14     rmind 	}
    162      1.14     rmind 	offset = uio->uio_offset & PAGE_MASK;
    163      1.14     rmind 	len = MIN(uio->uio_resid, PAGE_SIZE - offset);
    164      1.14     rmind 
    165      1.14     rmind #ifdef __HAVE_MM_MD_DIRECT_MAPPED_PHYS
    166      1.14     rmind 	/* Is physical address directly mapped?  Return VA. */
    167      1.14     rmind 	have_direct = mm_md_direct_mapped_phys(paddr, &vaddr);
    168      1.14     rmind #else
    169      1.15     joerg 	vaddr = 0;
    170      1.14     rmind 	have_direct = false;
    171      1.14     rmind #endif
    172      1.14     rmind 	if (!have_direct) {
    173      1.14     rmind 		/* Get a special virtual address. */
    174      1.14     rmind 		const vaddr_t va = dev_mem_getva(paddr);
    175      1.14     rmind 
    176      1.14     rmind 		/* Map selected KVA to physical address. */
    177      1.14     rmind 		mutex_enter(&dev_mem_lock);
    178      1.14     rmind 		pmap_kenter_pa(va, paddr, prot, 0);
    179      1.14     rmind 		pmap_update(pmap_kernel());
    180      1.14     rmind 
    181      1.14     rmind 		/* Perform I/O. */
    182      1.14     rmind 		vaddr = va + offset;
    183      1.14     rmind 		error = uiomove((void *)vaddr, len, uio);
    184      1.14     rmind 
    185      1.14     rmind 		/* Unmap, flush before unlock. */
    186      1.14     rmind 		pmap_kremove(va, PAGE_SIZE);
    187      1.14     rmind 		pmap_update(pmap_kernel());
    188      1.14     rmind 		mutex_exit(&dev_mem_lock);
    189      1.14     rmind 
    190      1.14     rmind 		/* "Release" the virtual address. */
    191      1.14     rmind 		dev_mem_relva(paddr, va);
    192      1.14     rmind 	} else {
    193      1.14     rmind 		/* Direct map, just perform I/O. */
    194      1.14     rmind 		vaddr += offset;
    195      1.14     rmind 		error = uiomove((void *)vaddr, len, uio);
    196      1.14     rmind 	}
    197      1.14     rmind 	return error;
    198      1.14     rmind }
    199      1.14     rmind 
    200      1.14     rmind /*
    201      1.14     rmind  * dev_kmem_readwrite: helper for DEV_KMEM (/dev/kmem) case of R/W.
    202      1.14     rmind  */
    203      1.14     rmind static int
    204      1.14     rmind dev_kmem_readwrite(struct uio *uio, struct iovec *iov)
    205      1.14     rmind {
    206      1.14     rmind 	void *addr;
    207      1.14     rmind 	size_t len, offset;
    208      1.14     rmind 	vm_prot_t prot;
    209      1.14     rmind 	int error;
    210      1.14     rmind 	bool md_kva;
    211      1.14     rmind 
    212      1.14     rmind 	/* Check for wrap around. */
    213      1.14     rmind 	addr = (void *)(intptr_t)uio->uio_offset;
    214      1.14     rmind 	if ((uintptr_t)addr != uio->uio_offset) {
    215      1.14     rmind 		return EFAULT;
    216      1.14     rmind 	}
    217      1.14     rmind 	/*
    218      1.14     rmind 	 * Handle non-page aligned offset.
    219      1.14     rmind 	 * Otherwise, we operate in page-by-page basis.
    220      1.14     rmind 	 */
    221      1.14     rmind 	offset = uio->uio_offset & PAGE_MASK;
    222      1.14     rmind 	len = MIN(uio->uio_resid, PAGE_SIZE - offset);
    223      1.14     rmind 	prot = (uio->uio_rw == UIO_WRITE) ? VM_PROT_WRITE : VM_PROT_READ;
    224      1.14     rmind 
    225      1.14     rmind 	md_kva = false;
    226      1.14     rmind 
    227      1.14     rmind #ifdef __HAVE_MM_MD_DIRECT_MAPPED_IO
    228      1.14     rmind 	paddr_t paddr;
    229      1.14     rmind 	/* MD case: is this is a directly mapped address? */
    230      1.14     rmind 	if (mm_md_direct_mapped_io(addr, &paddr)) {
    231      1.14     rmind 		/* If so, validate physical address. */
    232      1.14     rmind 		error = mm_md_physacc(paddr, prot);
    233      1.14     rmind 		if (error) {
    234      1.14     rmind 			return error;
    235      1.14     rmind 		}
    236      1.14     rmind 		md_kva = true;
    237      1.14     rmind 	}
    238      1.14     rmind #endif
    239      1.14     rmind 	if (!md_kva) {
    240      1.14     rmind 		bool checked = false;
    241      1.14     rmind 
    242      1.14     rmind #ifdef __HAVE_MM_MD_KERNACC
    243      1.14     rmind 		/* MD check for the address. */
    244      1.14     rmind 		error = mm_md_kernacc(addr, prot, &checked);
    245      1.14     rmind 		if (error) {
    246      1.14     rmind 			return error;
    247      1.14     rmind 		}
    248      1.14     rmind #endif
    249      1.14     rmind 		/* UVM check for the address (unless MD indicated to not). */
    250      1.14     rmind 		if (!checked && !uvm_kernacc(addr, len, prot)) {
    251      1.14     rmind 			return EFAULT;
    252      1.14     rmind 		}
    253      1.14     rmind 	}
    254      1.14     rmind 	error = uiomove(addr, len, uio);
    255      1.14     rmind 	return error;
    256      1.14     rmind }
    257      1.14     rmind 
    258      1.14     rmind /*
    259      1.14     rmind  * dev_zero_readwrite: helper for DEV_ZERO (/dev/null) case of R/W.
    260      1.14     rmind  */
    261      1.14     rmind static inline int
    262      1.14     rmind dev_zero_readwrite(struct uio *uio, struct iovec *iov)
    263      1.14     rmind {
    264      1.14     rmind 	size_t len;
    265      1.14     rmind 
    266      1.14     rmind 	/* Nothing to do for the write case. */
    267      1.14     rmind 	if (uio->uio_rw == UIO_WRITE) {
    268      1.14     rmind 		uio->uio_resid = 0;
    269      1.14     rmind 		return 0;
    270      1.14     rmind 	}
    271      1.14     rmind 	/*
    272      1.14     rmind 	 * Read in page-by-page basis, caller will continue.
    273      1.14     rmind 	 * Cut appropriately for a single/last-iteration cases.
    274      1.14     rmind 	 */
    275      1.14     rmind 	len = MIN(iov->iov_len, PAGE_SIZE);
    276      1.14     rmind 	return uiomove(dev_zero_page, len, uio);
    277      1.14     rmind }
    278       1.1  christos 
    279      1.14     rmind /*
    280      1.14     rmind  * mm_readwrite: general memory R/W function.
    281      1.14     rmind  */
    282      1.14     rmind static int
    283      1.14     rmind mm_readwrite(dev_t dev, struct uio *uio, int flags)
    284       1.1  christos {
    285      1.14     rmind 	struct iovec *iov;
    286      1.14     rmind 	int error;
    287      1.14     rmind 
    288      1.14     rmind #ifdef __HAVE_MM_MD_READWRITE
    289      1.14     rmind 	/* If defined - there are extra MD cases. */
    290       1.1  christos 	switch (minor(dev)) {
    291      1.14     rmind 	case DEV_MEM:
    292      1.14     rmind 	case DEV_KMEM:
    293      1.14     rmind 	case DEV_NULL:
    294      1.14     rmind 	case DEV_ZERO:
    295      1.14     rmind #if defined(COMPAT_16) && defined(__arm)
    296      1.14     rmind 	case _DEV_ZERO_oARM:
    297      1.14     rmind #endif
    298      1.14     rmind 		break;
    299       1.6  jdolecek 	default:
    300      1.14     rmind 		return mm_md_readwrite(dev, uio);
    301      1.14     rmind 	}
    302      1.14     rmind #endif
    303      1.14     rmind 	error = 0;
    304      1.14     rmind 	while (uio->uio_resid > 0 && error == 0) {
    305      1.14     rmind 		iov = uio->uio_iov;
    306      1.14     rmind 		if (iov->iov_len == 0) {
    307      1.14     rmind 			/* Processed; next I/O vector. */
    308      1.14     rmind 			uio->uio_iov++;
    309      1.14     rmind 			uio->uio_iovcnt--;
    310      1.14     rmind 			KASSERT(uio->uio_iovcnt >= 0);
    311      1.14     rmind 			continue;
    312      1.14     rmind 		}
    313      1.14     rmind 		/* Helper functions will process in page-by-page basis. */
    314      1.14     rmind 		switch (minor(dev)) {
    315      1.14     rmind 		case DEV_MEM:
    316      1.14     rmind 			error = dev_mem_readwrite(uio, iov);
    317      1.14     rmind 			break;
    318      1.14     rmind 		case DEV_KMEM:
    319      1.14     rmind 			error = dev_kmem_readwrite(uio, iov);
    320      1.14     rmind 			break;
    321      1.14     rmind 		case DEV_NULL:
    322      1.14     rmind 			if (uio->uio_rw == UIO_WRITE) {
    323      1.14     rmind 				uio->uio_resid = 0;
    324      1.14     rmind 			}
    325      1.14     rmind 			/* Break directly out of the loop. */
    326       1.1  christos 			return 0;
    327      1.14     rmind #if defined(COMPAT_16) && defined(__arm)
    328      1.14     rmind 		case _DEV_ZERO_oARM:
    329      1.14     rmind #endif
    330      1.14     rmind 		case DEV_ZERO:
    331      1.14     rmind 			error = dev_zero_readwrite(uio, iov);
    332      1.14     rmind 			break;
    333      1.14     rmind 		default:
    334      1.14     rmind 			error = ENXIO;
    335      1.14     rmind 			break;
    336       1.1  christos 		}
    337      1.14     rmind 	}
    338      1.14     rmind 	return error;
    339      1.14     rmind }
    340      1.14     rmind 
    341      1.14     rmind /*
    342      1.14     rmind  * mm_mmap: general mmap() handler.
    343      1.14     rmind  */
    344      1.14     rmind static paddr_t
    345      1.14     rmind mm_mmap(dev_t dev, off_t off, int acc)
    346      1.14     rmind {
    347      1.14     rmind 	vm_prot_t prot;
    348      1.14     rmind 
    349      1.14     rmind #ifdef __HAVE_MM_MD_MMAP
    350      1.14     rmind 	/* If defined - there are extra mmap() MD cases. */
    351      1.14     rmind 	switch (minor(dev)) {
    352      1.14     rmind 	case DEV_MEM:
    353      1.14     rmind 	case DEV_KMEM:
    354      1.14     rmind 	case DEV_NULL:
    355      1.14     rmind #if defined(COMPAT_16) && defined(__arm)
    356      1.14     rmind 	case _DEV_ZERO_oARM:
    357      1.14     rmind #endif
    358      1.14     rmind 	case DEV_ZERO:
    359      1.14     rmind 		break;
    360      1.14     rmind 	default:
    361      1.14     rmind 		return mm_md_mmap(dev, off, acc);
    362      1.14     rmind 	}
    363      1.14     rmind #endif
    364      1.14     rmind 	/*
    365      1.14     rmind 	 * /dev/null does not make sense, /dev/kmem is volatile and
    366      1.14     rmind 	 * /dev/zero is handled in mmap already.
    367      1.14     rmind 	 */
    368      1.14     rmind 	if (minor(dev) != DEV_MEM) {
    369      1.14     rmind 		return -1;
    370      1.14     rmind 	}
    371      1.14     rmind 
    372      1.14     rmind 	prot = 0;
    373      1.14     rmind 	if (acc & PROT_EXEC)
    374      1.14     rmind 		prot |= VM_PROT_EXECUTE;
    375      1.14     rmind 	if (acc & PROT_READ)
    376      1.14     rmind 		prot |= VM_PROT_READ;
    377      1.14     rmind 	if (acc & PROT_WRITE)
    378      1.14     rmind 		prot |= VM_PROT_WRITE;
    379      1.14     rmind 
    380      1.14     rmind 	/* Validate the physical address. */
    381      1.14     rmind 	if (mm_md_physacc(off, prot) != 0) {
    382      1.14     rmind 		return -1;
    383      1.14     rmind 	}
    384      1.14     rmind 	return off >> PGSHIFT;
    385      1.14     rmind }
    386      1.14     rmind 
    387      1.14     rmind static int
    388      1.14     rmind mm_ioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
    389      1.14     rmind {
    390      1.14     rmind 
    391      1.14     rmind 	switch (cmd) {
    392      1.14     rmind 	case FIONBIO:
    393      1.14     rmind 		/* We never block anyway. */
    394      1.14     rmind 		return 0;
    395      1.14     rmind 
    396      1.14     rmind 	case FIOSETOWN:
    397      1.14     rmind 	case FIOGETOWN:
    398      1.14     rmind 	case TIOCGPGRP:
    399      1.14     rmind 	case TIOCSPGRP:
    400      1.14     rmind 	case TIOCGETA:
    401      1.14     rmind 		return ENOTTY;
    402      1.14     rmind 
    403      1.14     rmind 	case FIOASYNC:
    404      1.14     rmind 		if ((*(int *)data) == 0) {
    405      1.14     rmind 			return 0;
    406      1.14     rmind 		}
    407      1.14     rmind 		/* FALLTHROUGH */
    408      1.14     rmind 	default:
    409       1.1  christos 		return EOPNOTSUPP;
    410       1.1  christos 	}
    411       1.1  christos }
    412