Home | History | Annotate | Line # | Download | only in x86
xen_bus_dma.c revision 1.20
      1 /*	$NetBSD: xen_bus_dma.c,v 1.20 2010/03/09 23:12:06 jym Exp $	*/
      2 /*	NetBSD bus_dma.c,v 1.21 2005/04/16 07:53:35 yamt Exp */
      3 
      4 /*-
      5  * Copyright (c) 1996, 1997, 1998 The NetBSD Foundation, Inc.
      6  * All rights reserved.
      7  *
      8  * This code is derived from software contributed to The NetBSD Foundation
      9  * by Charles M. Hannum and by Jason R. Thorpe of the Numerical Aerospace
     10  * Simulation Facility, NASA Ames Research Center.
     11  *
     12  * Redistribution and use in source and binary forms, with or without
     13  * modification, are permitted provided that the following conditions
     14  * are met:
     15  * 1. Redistributions of source code must retain the above copyright
     16  *    notice, this list of conditions and the following disclaimer.
     17  * 2. Redistributions in binary form must reproduce the above copyright
     18  *    notice, this list of conditions and the following disclaimer in the
     19  *    documentation and/or other materials provided with the distribution.
     20  *
     21  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     22  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     23  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     24  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     25  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     26  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     27  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     28  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     29  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     30  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     31  * POSSIBILITY OF SUCH DAMAGE.
     32  */
     33 
     34 #include <sys/cdefs.h>
     35 __KERNEL_RCSID(0, "$NetBSD: xen_bus_dma.c,v 1.20 2010/03/09 23:12:06 jym Exp $");
     36 
     37 #include <sys/param.h>
     38 #include <sys/systm.h>
     39 #include <sys/kernel.h>
     40 #include <sys/mbuf.h>
     41 #include <sys/proc.h>
     42 
     43 #include <machine/bus.h>
     44 #include <machine/bus_private.h>
     45 
     46 #include <uvm/uvm_extern.h>
     47 
     48 extern paddr_t avail_end;
     49 
     50 /* Pure 2^n version of get_order */
     51 static inline int get_order(unsigned long size)
     52 {
     53 	int order = -1;
     54 	size = (size - 1) >> (PAGE_SHIFT - 1);
     55 	do {
     56 		size >>= 1;
     57 		order++;
     58 	} while (size);
     59 	return order;
     60 }
     61 
     62 static int
     63 _xen_alloc_contig(bus_size_t size, bus_size_t alignment, bus_size_t boundary,
     64     struct pglist *mlistp, int flags, bus_addr_t low, bus_addr_t high)
     65 {
     66 	int order, i;
     67 	unsigned long npagesreq, npages, mfn;
     68 	bus_addr_t pa;
     69 	struct vm_page *pg, *pgnext;
     70 	int s, error;
     71 	struct xen_memory_reservation res;
     72 
     73 	/*
     74 	 * When requesting a contigous memory region, the hypervisor will
     75 	 * return a memory range aligned on size. This will automagically
     76 	 * handle "boundary", but the only way to enforce alignment
     77 	 * is to request a memory region of size max(alignment, size).
     78 	 */
     79 	order = max(get_order(size), get_order(alignment));
     80 	npages = (1 << order);
     81 	npagesreq = (size >> PAGE_SHIFT);
     82 	KASSERT(npages >= npagesreq);
     83 
     84 	/* get npages from UVM, and give them back to the hypervisor */
     85 	error = uvm_pglistalloc(((psize_t)npages) << PAGE_SHIFT,
     86             0, avail_end, 0, 0, mlistp, npages, (flags & BUS_DMA_NOWAIT) == 0);
     87 	if (error)
     88 		return (error);
     89 
     90 	for (pg = mlistp->tqh_first; pg != NULL; pg = pg->pageq.queue.tqe_next) {
     91 		pa = VM_PAGE_TO_PHYS(pg);
     92 		mfn = xpmap_ptom(pa) >> PAGE_SHIFT;
     93 		xpmap_phys_to_machine_mapping[
     94 		    (pa - XPMAP_OFFSET) >> PAGE_SHIFT] = INVALID_P2M_ENTRY;
     95 		xenguest_handle(res.extent_start) = &mfn;
     96 		res.nr_extents = 1;
     97 		res.extent_order = 0;
     98 		res.address_bits = 0;
     99 		res.domid = DOMID_SELF;
    100 		error = HYPERVISOR_memory_op(XENMEM_decrease_reservation, &res);
    101 		if (error != 1) {
    102 #ifdef DEBUG
    103 			printf("xen_alloc_contig: XENMEM_decrease_reservation "
    104 			    "failed: err %d (pa %#" PRIxPADDR " mfn %#lx)\n",
    105 			    error, pa, mfn);
    106 #endif
    107 			xpmap_phys_to_machine_mapping[
    108 			    (pa - XPMAP_OFFSET) >> PAGE_SHIFT] = mfn;
    109 
    110 			error = ENOMEM;
    111 			goto failed;
    112 		}
    113 	}
    114 	/* Get the new contiguous memory extent */
    115 	xenguest_handle(res.extent_start) = &mfn;
    116 	res.nr_extents = 1;
    117 	res.extent_order = order;
    118 	res.address_bits = get_order(high) + PAGE_SHIFT;
    119 	res.domid = DOMID_SELF;
    120 	error = HYPERVISOR_memory_op(XENMEM_increase_reservation, &res);
    121 	if (error != 1) {
    122 #ifdef DEBUG
    123 		printf("xen_alloc_contig: XENMEM_increase_reservation "
    124 		    "failed: %d (order %d address_bits %d)\n",
    125 		    error, order, res.address_bits);
    126 #endif
    127 		error = ENOMEM;
    128 		pg = NULL;
    129 		goto failed;
    130 	}
    131 	s = splvm();
    132 	/* Map the new extent in place of the old pages */
    133 	for (pg = mlistp->tqh_first, i = 0; pg != NULL; pg = pgnext, i++) {
    134 		pgnext = pg->pageq.queue.tqe_next;
    135 		pa = VM_PAGE_TO_PHYS(pg);
    136 		xpmap_phys_to_machine_mapping[
    137 		    (pa - XPMAP_OFFSET) >> PAGE_SHIFT] = mfn+i;
    138 		xpq_queue_machphys_update(((paddr_t)(mfn+i)) << PAGE_SHIFT, pa);
    139 		/* while here, give extra pages back to UVM */
    140 		if (i >= npagesreq) {
    141 			TAILQ_REMOVE(mlistp, pg, pageq.queue);
    142 			uvm_pagefree(pg);
    143 		}
    144 	}
    145 	/* Flush updates through and flush the TLB */
    146 	xpq_queue_tlb_flush();
    147 	splx(s);
    148 	return 0;
    149 
    150 failed:
    151 	/*
    152 	 * Attempt to recover from a failed decrease or increase reservation:
    153 	 * if decrease_reservation failed, we don't have given all pages
    154 	 * back to Xen; give them back to UVM, and get the missing pages
    155 	 * from Xen.
    156 	 * if increase_reservation failed, we expect pg to be NULL and we just
    157 	 * get back the missing pages from Xen one by one.
    158 	 */
    159 	/* give back remaining pages to UVM */
    160 	for (; pg != NULL; pg = pgnext) {
    161 		pgnext = pg->pageq.queue.tqe_next;
    162 		TAILQ_REMOVE(mlistp, pg, pageq.queue);
    163 		uvm_pagefree(pg);
    164 	}
    165 	/* remplace the pages that we already gave to Xen */
    166 	s = splvm();
    167 	for (pg = mlistp->tqh_first; pg != NULL; pg = pgnext) {
    168 		pgnext = pg->pageq.queue.tqe_next;
    169 		xenguest_handle(res.extent_start) = &mfn;
    170 		res.nr_extents = 1;
    171 		res.extent_order = 0;
    172 		res.address_bits = 32;
    173 		res.domid = DOMID_SELF;
    174 		if (HYPERVISOR_memory_op(XENMEM_increase_reservation, &res)
    175 		    < 0) {
    176 			printf("xen_alloc_contig: recovery "
    177 			    "XENMEM_increase_reservation failed!\n");
    178 			break;
    179 		}
    180 		pa = VM_PAGE_TO_PHYS(pg);
    181 		xpmap_phys_to_machine_mapping[
    182 		    (pa - XPMAP_OFFSET) >> PAGE_SHIFT] = mfn;
    183 		xpq_queue_machphys_update(((paddr_t)mfn) << PAGE_SHIFT, pa);
    184 		TAILQ_REMOVE(mlistp, pg, pageq.queue);
    185 		uvm_pagefree(pg);
    186 	}
    187 	/* Flush updates through and flush the TLB */
    188 	xpq_queue_tlb_flush();
    189 	splx(s);
    190 	return error;
    191 }
    192 
    193 
    194 /*
    195  * Allocate physical memory from the given physical address range.
    196  * Called by DMA-safe memory allocation methods.
    197  * We need our own version to deal with physical vs machine addresses.
    198  */
    199 int
    200 _xen_bus_dmamem_alloc_range(bus_dma_tag_t t, bus_size_t size,
    201     bus_size_t alignment, bus_size_t boundary, bus_dma_segment_t *segs,
    202     int nsegs, int *rsegs, int flags, bus_addr_t low, bus_addr_t high)
    203 {
    204 	bus_addr_t curaddr, lastaddr;
    205 	struct vm_page *m;
    206 	struct pglist mlist;
    207 	int curseg, error;
    208 	int doingrealloc = 0;
    209 
    210 	/* Always round the size. */
    211 	size = round_page(size);
    212 
    213 	KASSERT((alignment & (alignment - 1)) == 0);
    214 	KASSERT((boundary & (boundary - 1)) == 0);
    215 	if (alignment < PAGE_SIZE)
    216 		alignment = PAGE_SIZE;
    217 	if (boundary != 0 && boundary < size)
    218 		return (EINVAL);
    219 
    220 	/*
    221 	 * Allocate pages from the VM system.
    222 	 */
    223 	error = uvm_pglistalloc(size, 0, avail_end, alignment, boundary,
    224 	    &mlist, nsegs, (flags & BUS_DMA_NOWAIT) == 0);
    225 	if (error)
    226 		return (error);
    227 again:
    228 
    229 	/*
    230 	 * Compute the location, size, and number of segments actually
    231 	 * returned by the VM code.
    232 	 */
    233 	m = mlist.tqh_first;
    234 	curseg = 0;
    235 	curaddr = lastaddr = segs[curseg].ds_addr = _BUS_VM_PAGE_TO_BUS(m);
    236 	if (curaddr < low || curaddr >= high)
    237 		goto badaddr;
    238 	segs[curseg].ds_len = PAGE_SIZE;
    239 	m = m->pageq.queue.tqe_next;
    240 	if ((segs[curseg].ds_addr & (alignment - 1)) != 0)
    241 		goto dorealloc;
    242 
    243 	for (; m != NULL; m = m->pageq.queue.tqe_next) {
    244 		curaddr = _BUS_VM_PAGE_TO_BUS(m);
    245 		if (curaddr < low || curaddr >= high)
    246 			goto badaddr;
    247 		if (curaddr == (lastaddr + PAGE_SIZE)) {
    248 			segs[curseg].ds_len += PAGE_SIZE;
    249 			if ((lastaddr & boundary) != (curaddr & boundary))
    250 				goto dorealloc;
    251 		} else {
    252 			curseg++;
    253 			if (curseg >= nsegs || (curaddr & (alignment - 1)) != 0)
    254 				goto dorealloc;
    255 			segs[curseg].ds_addr = curaddr;
    256 			segs[curseg].ds_len = PAGE_SIZE;
    257 		}
    258 		lastaddr = curaddr;
    259 	}
    260 
    261 	*rsegs = curseg + 1;
    262 	return (0);
    263 
    264 badaddr:
    265 	if (doingrealloc == 0)
    266 		goto dorealloc;
    267 	if (curaddr < low) {
    268 		/* no way to enforce this */
    269 		printf("_xen_bus_dmamem_alloc_range: no way to "
    270 		    "enforce address range (0x%" PRIx64 " - 0x%" PRIx64 ")\n",
    271 		    (uint64_t)low, (uint64_t)high);
    272 		uvm_pglistfree(&mlist);
    273 		return EINVAL;
    274 	}
    275 	printf("xen_bus_dmamem_alloc_range: "
    276 	    "curraddr=0x%lx > high=0x%lx\n",
    277 	    (u_long)curaddr, (u_long)high);
    278 	panic("xen_bus_dmamem_alloc_range 1");
    279 dorealloc:
    280 	if (doingrealloc == 1)
    281 		panic("_xen_bus_dmamem_alloc_range: "
    282 		   "xen_alloc_contig returned "
    283 		   "too much segments");
    284 	doingrealloc = 1;
    285 	/*
    286 	 * Too much segments, or memory doesn't fit
    287 	 * constraints. Free this memory and
    288 	 * get a contigous segment from the hypervisor.
    289 	 */
    290 	uvm_pglistfree(&mlist);
    291 	for (curseg = 0; curseg < nsegs; curseg++) {
    292 		segs[curseg].ds_addr = 0;
    293 		segs[curseg].ds_len = 0;
    294 	}
    295 	error = _xen_alloc_contig(size, alignment,
    296 	    boundary, &mlist, flags, low, high);
    297 	if (error)
    298 		return error;
    299 	goto again;
    300 }
    301