Home | History | Annotate | Line # | Download | only in x86
xen_bus_dma.c revision 1.19
      1  1.19     jym /*	$NetBSD: xen_bus_dma.c,v 1.19 2010/03/02 00:13:50 jym Exp $	*/
      2   1.1  bouyer /*	NetBSD bus_dma.c,v 1.21 2005/04/16 07:53:35 yamt Exp */
      3   1.1  bouyer 
      4   1.1  bouyer /*-
      5   1.1  bouyer  * Copyright (c) 1996, 1997, 1998 The NetBSD Foundation, Inc.
      6   1.1  bouyer  * All rights reserved.
      7   1.1  bouyer  *
      8   1.1  bouyer  * This code is derived from software contributed to The NetBSD Foundation
      9   1.1  bouyer  * by Charles M. Hannum and by Jason R. Thorpe of the Numerical Aerospace
     10   1.1  bouyer  * Simulation Facility, NASA Ames Research Center.
     11   1.1  bouyer  *
     12   1.1  bouyer  * Redistribution and use in source and binary forms, with or without
     13   1.1  bouyer  * modification, are permitted provided that the following conditions
     14   1.1  bouyer  * are met:
     15   1.1  bouyer  * 1. Redistributions of source code must retain the above copyright
     16   1.1  bouyer  *    notice, this list of conditions and the following disclaimer.
     17   1.1  bouyer  * 2. Redistributions in binary form must reproduce the above copyright
     18   1.1  bouyer  *    notice, this list of conditions and the following disclaimer in the
     19   1.1  bouyer  *    documentation and/or other materials provided with the distribution.
     20   1.1  bouyer  *
     21   1.1  bouyer  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     22   1.1  bouyer  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     23   1.1  bouyer  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     24   1.1  bouyer  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     25   1.1  bouyer  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     26   1.1  bouyer  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     27   1.1  bouyer  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     28   1.1  bouyer  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     29   1.1  bouyer  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     30   1.1  bouyer  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     31   1.1  bouyer  * POSSIBILITY OF SUCH DAMAGE.
     32   1.1  bouyer  */
     33   1.1  bouyer 
     34   1.1  bouyer #include <sys/cdefs.h>
     35  1.19     jym __KERNEL_RCSID(0, "$NetBSD: xen_bus_dma.c,v 1.19 2010/03/02 00:13:50 jym Exp $");
     36   1.1  bouyer 
     37   1.1  bouyer #include <sys/param.h>
     38   1.1  bouyer #include <sys/systm.h>
     39   1.1  bouyer #include <sys/kernel.h>
     40   1.1  bouyer #include <sys/mbuf.h>
     41   1.1  bouyer #include <sys/proc.h>
     42   1.1  bouyer 
     43   1.1  bouyer #include <machine/bus.h>
     44   1.1  bouyer #include <machine/bus_private.h>
     45   1.1  bouyer 
     46   1.1  bouyer #include <uvm/uvm_extern.h>
     47   1.1  bouyer 
     48   1.1  bouyer extern paddr_t avail_end;
     49   1.1  bouyer 
     50   1.1  bouyer /* Pure 2^n version of get_order */
     51   1.5   perry static inline int get_order(unsigned long size)
     52   1.1  bouyer {
     53   1.1  bouyer 	int order = -1;
     54   1.1  bouyer 	size = (size - 1) >> (PAGE_SHIFT - 1);
     55   1.1  bouyer 	do {
     56   1.1  bouyer 		size >>= 1;
     57   1.1  bouyer 		order++;
     58   1.1  bouyer 	} while (size);
     59   1.1  bouyer 	return order;
     60   1.1  bouyer }
     61   1.1  bouyer 
     62   1.1  bouyer static int
     63   1.1  bouyer _xen_alloc_contig(bus_size_t size, bus_size_t alignment, bus_size_t boundary,
     64   1.9  bouyer     struct pglist *mlistp, int flags, bus_addr_t low, bus_addr_t high)
     65   1.1  bouyer {
     66   1.1  bouyer 	int order, i;
     67   1.1  bouyer 	unsigned long npagesreq, npages, mfn;
     68   1.1  bouyer 	bus_addr_t pa;
     69   1.1  bouyer 	struct vm_page *pg, *pgnext;
     70   1.1  bouyer 	int s, error;
     71   1.6  bouyer 	struct xen_memory_reservation res;
     72   1.1  bouyer 
     73   1.1  bouyer 	/*
     74   1.1  bouyer 	 * When requesting a contigous memory region, the hypervisor will
     75   1.1  bouyer 	 * return a memory range aligned on size. This will automagically
     76   1.1  bouyer 	 * handle "boundary", but the only way to enforce alignment
     77   1.1  bouyer 	 * is to request a memory region of size max(alignment, size).
     78   1.1  bouyer 	 */
     79   1.1  bouyer 	order = max(get_order(size), get_order(alignment));
     80   1.1  bouyer 	npages = (1 << order);
     81   1.1  bouyer 	npagesreq = (size >> PAGE_SHIFT);
     82   1.1  bouyer 	KASSERT(npages >= npagesreq);
     83   1.1  bouyer 
     84  1.19     jym 	/* get npages from UVM, and give them back to the hypervisor */
     85  1.16  cegger 	error = uvm_pglistalloc(((psize_t)npages) << PAGE_SHIFT,
     86  1.16  cegger             0, avail_end, 0, 0, mlistp, npages, (flags & BUS_DMA_NOWAIT) == 0);
     87   1.1  bouyer 	if (error)
     88   1.1  bouyer 		return (error);
     89   1.1  bouyer 
     90  1.11      ad 	for (pg = mlistp->tqh_first; pg != NULL; pg = pg->pageq.queue.tqe_next) {
     91   1.1  bouyer 		pa = VM_PAGE_TO_PHYS(pg);
     92   1.1  bouyer 		mfn = xpmap_ptom(pa) >> PAGE_SHIFT;
     93   1.1  bouyer 		xpmap_phys_to_machine_mapping[
     94   1.1  bouyer 		    (pa - XPMAP_OFFSET) >> PAGE_SHIFT] = INVALID_P2M_ENTRY;
     95  1.12  cegger 		xenguest_handle(res.extent_start) = &mfn;
     96   1.6  bouyer 		res.nr_extents = 1;
     97   1.6  bouyer 		res.extent_order = 0;
     98   1.6  bouyer 		res.domid = DOMID_SELF;
     99  1.19     jym 		error = HYPERVISOR_memory_op(XENMEM_decrease_reservation, &res);
    100  1.19     jym 		if (error != 1) {
    101   1.8  bouyer #ifdef DEBUG
    102   1.6  bouyer 			printf("xen_alloc_contig: XENMEM_decrease_reservation "
    103  1.18     jym 			    "failed: err %d (pa %#" PRIxPADDR " mfn %#lx)\n",
    104  1.18     jym 			    error, pa, mfn);
    105   1.8  bouyer #endif
    106   1.7  bouyer 			xpmap_phys_to_machine_mapping[
    107   1.7  bouyer 			    (pa - XPMAP_OFFSET) >> PAGE_SHIFT] = mfn;
    108   1.7  bouyer 
    109   1.7  bouyer 			error = ENOMEM;
    110   1.7  bouyer 			goto failed;
    111   1.6  bouyer 		}
    112   1.1  bouyer 	}
    113   1.1  bouyer 	/* Get the new contiguous memory extent */
    114  1.12  cegger 	xenguest_handle(res.extent_start) = &mfn;
    115   1.6  bouyer 	res.nr_extents = 1;
    116   1.6  bouyer 	res.extent_order = order;
    117   1.9  bouyer 	res.address_bits = get_order(high) + PAGE_SHIFT;
    118   1.6  bouyer 	res.domid = DOMID_SELF;
    119  1.14  bouyer 	error = HYPERVISOR_memory_op(XENMEM_increase_reservation, &res);
    120  1.14  bouyer 	if (error != 1) {
    121   1.8  bouyer #ifdef DEBUG
    122   1.6  bouyer 		printf("xen_alloc_contig: XENMEM_increase_reservation "
    123  1.14  bouyer 		    "failed: %d (order %d address_bits %d)\n",
    124  1.14  bouyer 		    error, order, res.address_bits);
    125   1.8  bouyer #endif
    126   1.7  bouyer 		error = ENOMEM;
    127   1.7  bouyer 		pg = NULL;
    128   1.7  bouyer 		goto failed;
    129   1.6  bouyer 	}
    130   1.1  bouyer 	s = splvm();
    131   1.1  bouyer 	/* Map the new extent in place of the old pages */
    132   1.1  bouyer 	for (pg = mlistp->tqh_first, i = 0; pg != NULL; pg = pgnext, i++) {
    133  1.11      ad 		pgnext = pg->pageq.queue.tqe_next;
    134   1.1  bouyer 		pa = VM_PAGE_TO_PHYS(pg);
    135   1.1  bouyer 		xpmap_phys_to_machine_mapping[
    136   1.1  bouyer 		    (pa - XPMAP_OFFSET) >> PAGE_SHIFT] = mfn+i;
    137  1.16  cegger 		xpq_queue_machphys_update(((paddr_t)(mfn+i)) << PAGE_SHIFT, pa);
    138   1.1  bouyer 		/* while here, give extra pages back to UVM */
    139   1.1  bouyer 		if (i >= npagesreq) {
    140  1.11      ad 			TAILQ_REMOVE(mlistp, pg, pageq.queue);
    141   1.1  bouyer 			uvm_pagefree(pg);
    142   1.1  bouyer 		}
    143   1.1  bouyer 	}
    144   1.1  bouyer 	/* Flush updates through and flush the TLB */
    145   1.1  bouyer 	xpq_queue_tlb_flush();
    146   1.1  bouyer 	splx(s);
    147   1.1  bouyer 	return 0;
    148   1.7  bouyer 
    149   1.7  bouyer failed:
    150   1.7  bouyer 	/*
    151   1.7  bouyer 	 * Attempt to recover from a failed decrease or increase reservation:
    152   1.7  bouyer 	 * if decrease_reservation failed, we don't have given all pages
    153   1.7  bouyer 	 * back to Xen; give them back to UVM, and get the missing pages
    154   1.7  bouyer 	 * from Xen.
    155   1.7  bouyer 	 * if increase_reservation failed, we expect pg to be NULL and we just
    156   1.7  bouyer 	 * get back the missing pages from Xen one by one.
    157   1.7  bouyer 	 */
    158   1.7  bouyer 	/* give back remaining pages to UVM */
    159   1.7  bouyer 	for (; pg != NULL; pg = pgnext) {
    160  1.11      ad 		pgnext = pg->pageq.queue.tqe_next;
    161  1.11      ad 		TAILQ_REMOVE(mlistp, pg, pageq.queue);
    162   1.7  bouyer 		uvm_pagefree(pg);
    163   1.7  bouyer 	}
    164   1.7  bouyer 	/* remplace the pages that we already gave to Xen */
    165   1.7  bouyer 	s = splvm();
    166   1.7  bouyer 	for (pg = mlistp->tqh_first; pg != NULL; pg = pgnext) {
    167  1.11      ad 		pgnext = pg->pageq.queue.tqe_next;
    168  1.12  cegger 		xenguest_handle(res.extent_start) = &mfn;
    169   1.7  bouyer 		res.nr_extents = 1;
    170   1.7  bouyer 		res.extent_order = 0;
    171   1.9  bouyer 		res.address_bits = 32;
    172   1.7  bouyer 		res.domid = DOMID_SELF;
    173   1.7  bouyer 		if (HYPERVISOR_memory_op(XENMEM_increase_reservation, &res)
    174   1.7  bouyer 		    < 0) {
    175   1.7  bouyer 			printf("xen_alloc_contig: recovery "
    176   1.7  bouyer 			    "XENMEM_increase_reservation failed!\n");
    177   1.7  bouyer 			break;
    178   1.7  bouyer 		}
    179   1.7  bouyer 		pa = VM_PAGE_TO_PHYS(pg);
    180   1.7  bouyer 		xpmap_phys_to_machine_mapping[
    181   1.7  bouyer 		    (pa - XPMAP_OFFSET) >> PAGE_SHIFT] = mfn;
    182  1.16  cegger 		xpq_queue_machphys_update(((paddr_t)mfn) << PAGE_SHIFT, pa);
    183  1.11      ad 		TAILQ_REMOVE(mlistp, pg, pageq.queue);
    184   1.7  bouyer 		uvm_pagefree(pg);
    185   1.7  bouyer 	}
    186   1.7  bouyer 	/* Flush updates through and flush the TLB */
    187   1.7  bouyer 	xpq_queue_tlb_flush();
    188   1.7  bouyer 	splx(s);
    189   1.7  bouyer 	return error;
    190   1.1  bouyer }
    191   1.1  bouyer 
    192   1.1  bouyer 
    193   1.1  bouyer /*
    194   1.1  bouyer  * Allocate physical memory from the given physical address range.
    195   1.1  bouyer  * Called by DMA-safe memory allocation methods.
    196   1.1  bouyer  * We need our own version to deal with physical vs machine addresses.
    197   1.1  bouyer  */
    198   1.1  bouyer int
    199   1.1  bouyer _xen_bus_dmamem_alloc_range(bus_dma_tag_t t, bus_size_t size,
    200   1.1  bouyer     bus_size_t alignment, bus_size_t boundary, bus_dma_segment_t *segs,
    201   1.1  bouyer     int nsegs, int *rsegs, int flags, bus_addr_t low, bus_addr_t high)
    202   1.1  bouyer {
    203   1.7  bouyer 	bus_addr_t curaddr, lastaddr;
    204   1.1  bouyer 	struct vm_page *m;
    205   1.1  bouyer 	struct pglist mlist;
    206   1.1  bouyer 	int curseg, error;
    207   1.1  bouyer 	int doingrealloc = 0;
    208   1.1  bouyer 
    209   1.1  bouyer 	/* Always round the size. */
    210   1.1  bouyer 	size = round_page(size);
    211   1.1  bouyer 
    212   1.2  bouyer 	KASSERT((alignment & (alignment - 1)) == 0);
    213   1.2  bouyer 	KASSERT((boundary & (boundary - 1)) == 0);
    214   1.2  bouyer 	if (alignment < PAGE_SIZE)
    215   1.2  bouyer 		alignment = PAGE_SIZE;
    216   1.2  bouyer 	if (boundary != 0 && boundary < size)
    217   1.2  bouyer 		return (EINVAL);
    218   1.2  bouyer 
    219   1.1  bouyer 	/*
    220   1.1  bouyer 	 * Allocate pages from the VM system.
    221   1.1  bouyer 	 */
    222   1.1  bouyer 	error = uvm_pglistalloc(size, 0, avail_end, alignment, boundary,
    223   1.1  bouyer 	    &mlist, nsegs, (flags & BUS_DMA_NOWAIT) == 0);
    224   1.1  bouyer 	if (error)
    225   1.1  bouyer 		return (error);
    226   1.1  bouyer again:
    227   1.1  bouyer 
    228   1.1  bouyer 	/*
    229   1.1  bouyer 	 * Compute the location, size, and number of segments actually
    230   1.1  bouyer 	 * returned by the VM code.
    231   1.1  bouyer 	 */
    232   1.1  bouyer 	m = mlist.tqh_first;
    233   1.1  bouyer 	curseg = 0;
    234   1.9  bouyer 	curaddr = lastaddr = segs[curseg].ds_addr = _BUS_VM_PAGE_TO_BUS(m);
    235   1.9  bouyer 	if (curaddr < low || curaddr >= high)
    236   1.9  bouyer 		goto badaddr;
    237   1.1  bouyer 	segs[curseg].ds_len = PAGE_SIZE;
    238  1.11      ad 	m = m->pageq.queue.tqe_next;
    239   1.7  bouyer 	if ((segs[curseg].ds_addr & (alignment - 1)) != 0)
    240   1.2  bouyer 		goto dorealloc;
    241   1.1  bouyer 
    242  1.11      ad 	for (; m != NULL; m = m->pageq.queue.tqe_next) {
    243   1.7  bouyer 		curaddr = _BUS_VM_PAGE_TO_BUS(m);
    244   1.9  bouyer 		if (curaddr < low || curaddr >= high)
    245   1.9  bouyer 			goto badaddr;
    246   1.7  bouyer 		if (curaddr == (lastaddr + PAGE_SIZE)) {
    247   1.1  bouyer 			segs[curseg].ds_len += PAGE_SIZE;
    248   1.9  bouyer 			if ((lastaddr & boundary) != (curaddr & boundary))
    249   1.2  bouyer 				goto dorealloc;
    250   1.7  bouyer 		} else {
    251   1.1  bouyer 			curseg++;
    252   1.9  bouyer 			if (curseg >= nsegs || (curaddr & (alignment - 1)) != 0)
    253   1.9  bouyer 				goto dorealloc;
    254   1.1  bouyer 			segs[curseg].ds_addr = curaddr;
    255   1.1  bouyer 			segs[curseg].ds_len = PAGE_SIZE;
    256   1.1  bouyer 		}
    257   1.1  bouyer 		lastaddr = curaddr;
    258   1.1  bouyer 	}
    259   1.1  bouyer 
    260   1.1  bouyer 	*rsegs = curseg + 1;
    261   1.9  bouyer 	return (0);
    262   1.1  bouyer 
    263   1.9  bouyer badaddr:
    264   1.9  bouyer 	if (doingrealloc == 0)
    265   1.9  bouyer 		goto dorealloc;
    266   1.9  bouyer 	if (curaddr < low) {
    267   1.9  bouyer 		/* no way to enforce this */
    268   1.9  bouyer 		printf("_xen_bus_dmamem_alloc_range: no way to "
    269  1.14  bouyer 		    "enforce address range (0x%" PRIx64 " - 0x%" PRIx64 ")\n",
    270  1.14  bouyer 		    (uint64_t)low, (uint64_t)high);
    271   1.9  bouyer 		uvm_pglistfree(&mlist);
    272   1.9  bouyer 		return EINVAL;
    273   1.9  bouyer 	}
    274   1.9  bouyer 	printf("xen_bus_dmamem_alloc_range: "
    275   1.9  bouyer 	    "curraddr=0x%lx > high=0x%lx\n",
    276   1.9  bouyer 	    (u_long)curaddr, (u_long)high);
    277   1.9  bouyer 	panic("xen_bus_dmamem_alloc_range 1");
    278   1.9  bouyer dorealloc:
    279   1.9  bouyer 	if (doingrealloc == 1)
    280   1.9  bouyer 		panic("_xen_bus_dmamem_alloc_range: "
    281   1.9  bouyer 		   "xen_alloc_contig returned "
    282   1.9  bouyer 		   "too much segments");
    283   1.9  bouyer 	doingrealloc = 1;
    284   1.9  bouyer 	/*
    285   1.9  bouyer 	 * Too much segments, or memory doesn't fit
    286   1.9  bouyer 	 * constraints. Free this memory and
    287   1.9  bouyer 	 * get a contigous segment from the hypervisor.
    288   1.9  bouyer 	 */
    289   1.9  bouyer 	uvm_pglistfree(&mlist);
    290   1.9  bouyer 	for (curseg = 0; curseg < nsegs; curseg++) {
    291   1.9  bouyer 		segs[curseg].ds_addr = 0;
    292   1.9  bouyer 		segs[curseg].ds_len = 0;
    293   1.9  bouyer 	}
    294   1.9  bouyer 	error = _xen_alloc_contig(size, alignment,
    295   1.9  bouyer 	    boundary, &mlist, flags, low, high);
    296   1.9  bouyer 	if (error)
    297   1.9  bouyer 		return error;
    298   1.9  bouyer 	goto again;
    299   1.1  bouyer }
    300