/*
 * Copyright (c) 1997, 1998 Justin T. Gibbs.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions, and the following disclaimer,
 *    without modification, immediately at the beginning of the file.
 * 2. The name of the author may not be used to endorse or promote products
 *    derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * $FreeBSD: src/sys/i386/i386/busdma_machdep.c,v 1.16.2.2 2003/01/23 00:55:27 scottl Exp $
 * $DragonFly: src/sys/platform/pc32/i386/busdma_machdep.c,v 1.23 2008/06/05 18:06:32 swildner Exp $
 */

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/malloc.h>
#include <sys/mbuf.h>
#include <sys/uio.h>
#include <sys/thread2.h>
#include <sys/bus_dma.h>
#include <sys/kernel.h>
#include <sys/sysctl.h>

#include <vm/vm.h>
#include <vm/vm_page.h>

/* XXX needed to access the pmap to convert per-proc virtual to physical */
#include <sys/proc.h>
#include <vm/vm_map.h>

#include <machine/md_var.h>

#define MAX_BPAGES 1024

struct bus_dma_tag {
	bus_dma_tag_t	parent;
	bus_size_t	alignment;
	bus_size_t	boundary;
	bus_addr_t	lowaddr;
	bus_addr_t	highaddr;
	bus_dma_filter_t *filter;
	void		*filterarg;
	bus_size_t	maxsize;
	int		nsegments;
	bus_size_t	maxsegsz;
	int		flags;
	int		ref_count;
	int		map_count;
	bus_dma_segment_t *segments;
};

/*
 * bus_dma_tag private flags
 */
#define BUS_DMA_MIN_ALLOC_COMP BUS_DMA_BUS4

struct bounce_page {
	vm_offset_t	vaddr;		/* kva of bounce buffer */
	bus_addr_t	busaddr;	/* Physical address */
	vm_offset_t	datavaddr;	/* kva of client data */
	bus_size_t	datacount;	/* client data count */
	STAILQ_ENTRY(bounce_page) links;
};

int busdma_swi_pending;

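/*
 * Bounce page pool bookkeeping: pages move between the free, reserved
 * and active counts as loads reserve, use, and release them; the three
 * counts always sum to total_bpages.
 */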
static STAILQ_HEAD(bp_list, bounce_page) bounce_page_list;
static int free_bpages;
static int reserved_bpages;
static int active_bpages;
static int total_bpages;
static bus_addr_t bounce_lowaddr = BUS_SPACE_MAXADDR;

struct bus_dmamap {
	struct bp_list	bpages;
	int		pagesneeded;
	int		pagesreserved;
	bus_dma_tag_t	dmat;
	void		*buf;		/* unmapped buffer pointer */
	bus_size_t	buflen;		/* unmapped buffer length */
	bus_dmamap_callback_t *callback;
	void		*callback_arg;
	STAILQ_ENTRY(bus_dmamap) links;
};

static STAILQ_HEAD(, bus_dmamap) bounce_map_waitinglist;
static STAILQ_HEAD(, bus_dmamap) bounce_map_callbacklist;
static struct bus_dmamap nobounce_dmamap;

static int alloc_bounce_pages(bus_dma_tag_t, u_int);
static int reserve_bounce_pages(bus_dma_tag_t, bus_dmamap_t);
static bus_addr_t add_bounce_page(bus_dma_tag_t, bus_dmamap_t,
		vm_offset_t, bus_size_t);
static void free_bounce_page(bus_dma_tag_t, struct bounce_page *);

SYSCTL_NODE(_hw, OID_AUTO, busdma, CTLFLAG_RD, 0, "Busdma parameters");
SYSCTL_INT(_hw_busdma, OID_AUTO, total_bpages, CTLFLAG_RD, &total_bpages, 0,
	   "Total bounce pages");

static int
run_filter(bus_dma_tag_t dmat, bus_addr_t paddr)
{
	int retval = 0;

	do {
		if (paddr > dmat->lowaddr
		 && paddr <= dmat->highaddr
		 && (dmat->filter == NULL
		  || (*dmat->filter)(dmat->filterarg, paddr) != 0))
			retval = 1;
		dmat = dmat->parent;
	} while (retval == 0 && dmat != NULL);
	return (retval);
}

/*
 * Allocate a device specific dma_tag.
 */
int
bus_dma_tag_create(bus_dma_tag_t parent, bus_size_t alignment,
		   bus_size_t boundary, bus_addr_t lowaddr,
		   bus_addr_t highaddr, bus_dma_filter_t *filter,
		   void *filterarg, bus_size_t maxsize, int nsegments,
		   bus_size_t maxsegsz, int flags, bus_dma_tag_t *dmat)
{
	bus_dma_tag_t newtag;
	int error = 0;

	/* Return a NULL tag on failure */
	*dmat = NULL;

	newtag = kmalloc(sizeof(*newtag), M_DEVBUF, M_INTWAIT);

	newtag->parent = parent;
	newtag->alignment = alignment;
	newtag->boundary = boundary;
	newtag->lowaddr = trunc_page((vm_paddr_t)lowaddr) + (PAGE_SIZE - 1);
	newtag->highaddr = trunc_page((vm_paddr_t)highaddr) + (PAGE_SIZE - 1);
	newtag->filter = filter;
	newtag->filterarg = filterarg;
	newtag->maxsize = maxsize;
	newtag->nsegments = nsegments;
	newtag->maxsegsz = maxsegsz;
	newtag->flags = flags;
	newtag->ref_count = 1; /* Count ourself */
	newtag->map_count = 0;
	newtag->segments = NULL;

	/* Take into account any restrictions imposed by our parent tag */
	if (parent != NULL) {
		newtag->lowaddr = MIN(parent->lowaddr, newtag->lowaddr);
		newtag->highaddr = MAX(parent->highaddr, newtag->highaddr);
		/*
		 * XXX Not really correct??? Probably need to honor boundary
		 * all the way up the inheritance chain.
		 */
		newtag->boundary = MAX(parent->boundary, newtag->boundary);
		if (newtag->filter == NULL) {
			/*
			 * Short circuit looking at our parent directly
			 * since we have encapsulated all of its information.
			 */
			newtag->filter = parent->filter;
			newtag->filterarg = parent->filterarg;
			newtag->parent = parent->parent;
		}
		if (newtag->parent != NULL)
			newtag->parent->ref_count++;
	}

	if (newtag->lowaddr < ptoa(Maxmem) &&
	    (flags & BUS_DMA_ALLOCNOW) != 0) {
		/* Must bounce */
		if (lowaddr > bounce_lowaddr) {
			/*
			 * Go through the pool and kill any pages
			 * that don't reside below lowaddr.
			 */
			panic("bus_dma_tag_create: page reallocation "
			      "not implemented");
		}
		if (ptoa(total_bpages) < maxsize) {
			int pages;

			pages = atop(maxsize) - total_bpages;

			/* Add pages to our bounce pool */
			if (alloc_bounce_pages(newtag, pages) < pages)
				error = ENOMEM;
		}
		/* Performed initial allocation */
		newtag->flags |= BUS_DMA_MIN_ALLOC_COMP;
	}

	if (error != 0)
		kfree(newtag, M_DEVBUF);
	else
		*dmat = newtag;
	return (error);
}

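/*
 * Example (illustrative sketch only, not part of this file): a driver
 * whose device can DMA anywhere in the low 4GB might create its tag
 * like this; "sc" and "sc->parent_tag" are hypothetical names.
 *
 *	error = bus_dma_tag_create(sc->parent_tag,
 *				   1,			(alignment)
 *				   0,			(boundary)
 *				   BUS_SPACE_MAXADDR_32BIT,	(lowaddr)
 *				   BUS_SPACE_MAXADDR,	(highaddr)
 *				   NULL, NULL,		(filter, filterarg)
 *				   MAXBSIZE,		(maxsize)
 *				   1,			(nsegments)
 *				   BUS_SPACE_MAXSIZE_32BIT,	(maxsegsz)
 *				   0,			(flags)
 *				   &sc->buffer_dmat);
 */
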
int
bus_dma_tag_destroy(bus_dma_tag_t dmat)
{
	if (dmat != NULL) {
		if (dmat->map_count != 0)
			return (EBUSY);

		while (dmat != NULL) {
			bus_dma_tag_t parent;

			parent = dmat->parent;
			dmat->ref_count--;
			if (dmat->ref_count == 0) {
				if (dmat->segments != NULL)
					kfree(dmat->segments, M_DEVBUF);
				kfree(dmat, M_DEVBUF);
				/*
				 * Last reference count, so
				 * release our reference
				 * count on our parent.
				 */
				dmat = parent;
			} else {
				dmat = NULL;
			}
		}
	}
	return (0);
}

/*
 * Allocate a handle for mapping from kva/uva/physical
 * address space into bus device space.
 */
int
bus_dmamap_create(bus_dma_tag_t dmat, int flags, bus_dmamap_t *mapp)
{
	int error = 0;

	if (dmat->segments == NULL) {
		KKASSERT(dmat->nsegments && dmat->nsegments < 16384);
		dmat->segments = kmalloc(sizeof(bus_dma_segment_t) *
					 dmat->nsegments, M_DEVBUF, M_INTWAIT);
	}

	if (dmat->lowaddr < ptoa(Maxmem)) {
		/* Must bounce */
		int maxpages;

		*mapp = kmalloc(sizeof(**mapp), M_DEVBUF, M_INTWAIT | M_ZERO);

		/* Initialize the new map */
		STAILQ_INIT(&((*mapp)->bpages));

		/*
		 * Attempt to add pages to our pool on a per-instance
		 * basis up to a sane limit.
		 */
		maxpages = MIN(MAX_BPAGES, Maxmem - atop(dmat->lowaddr));
		if ((dmat->flags & BUS_DMA_MIN_ALLOC_COMP) == 0
		 || (dmat->map_count > 0
		  && total_bpages < maxpages)) {
			int pages;

			if (dmat->lowaddr > bounce_lowaddr) {
				/*
				 * Go through the pool and kill any pages
				 * that don't reside below lowaddr.
				 */
				panic("bus_dmamap_create: page reallocation "
				      "not implemented");
			}

			pages = MAX(atop(dmat->maxsize), 1);
			pages = MIN(maxpages - total_bpages, pages);
			pages = MAX(pages, 1);
			if (alloc_bounce_pages(dmat, pages) < pages)
				error = ENOMEM;

			if ((dmat->flags & BUS_DMA_MIN_ALLOC_COMP) == 0) {
				if (error == 0)
					dmat->flags |= BUS_DMA_MIN_ALLOC_COMP;
			} else {
				error = 0;
			}
		}
	} else {
		*mapp = NULL;
	}
	if (error == 0)
		dmat->map_count++;
	return (error);
}

/*
 * Destroy a handle for mapping from kva/uva/physical
 * address space into bus device space.
 */
int
bus_dmamap_destroy(bus_dma_tag_t dmat, bus_dmamap_t map)
{
	if (map != NULL) {
		if (STAILQ_FIRST(&map->bpages) != NULL)
			return (EBUSY);
		kfree(map, M_DEVBUF);
	}
	dmat->map_count--;
	return (0);
}

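/*
 * Typical map life cycle, as a sketch (hypothetical driver code; the
 * public bus_dmamap_unload()/bus_dmamap_sync() wrappers are expected to
 * resolve to the _bus_dmamap_* implementations below):
 *
 *	bus_dmamap_create(tag, 0, &map);
 *	bus_dmamap_load(tag, map, buf, len, foo_callback, sc, 0);
 *	... bus_dmamap_sync() around the transfer, then ...
 *	bus_dmamap_unload(tag, map);
 *	bus_dmamap_destroy(tag, map);
 */
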
/*
 * Allocate a piece of memory that can be efficiently mapped into
 * bus device space based on the constraints listed in the dma tag.
 *
 * mapp is degenerate.  By definition this allocation should not require
 * bounce buffers, so do not allocate a dma map.
 */
int
bus_dmamem_alloc(bus_dma_tag_t dmat, void **vaddr, int flags,
		 bus_dmamap_t *mapp)
{
	int mflags;

	/* If we succeed, no mapping/bouncing will be required */
	*mapp = NULL;

	if (dmat->segments == NULL) {
		KKASSERT(dmat->nsegments < 16384);
		dmat->segments = kmalloc(sizeof(bus_dma_segment_t) *
					 dmat->nsegments, M_DEVBUF, M_INTWAIT);
	}

	if (flags & BUS_DMA_NOWAIT)
		mflags = M_NOWAIT;
	else
		mflags = M_WAITOK;
	if (flags & BUS_DMA_ZERO)
		mflags |= M_ZERO;

	if ((dmat->maxsize <= PAGE_SIZE) &&
	    dmat->lowaddr >= ptoa(Maxmem)) {
		*vaddr = kmalloc(dmat->maxsize, M_DEVBUF, mflags);
		/*
		 * XXX Check whether the allocation crossed a page boundary
		 * and retry with power-of-2 alignment in that case.
		 */
		if ((((intptr_t)*vaddr) & PAGE_MASK) !=
		    (((intptr_t)*vaddr + dmat->maxsize) & PAGE_MASK)) {
			size_t size;

			kfree(*vaddr, M_DEVBUF);
			/* XXX check for overflow? */
			for (size = 1; size <= dmat->maxsize; size <<= 1)
				;
			*vaddr = kmalloc(size, M_DEVBUF, mflags);
		}
	} else {
		/*
		 * XXX Use Contigmalloc until it is merged into this facility
		 * and handles multi-seg allocations.  Nobody is doing
		 * multi-seg allocations yet though.
		 */
		*vaddr = contigmalloc(dmat->maxsize, M_DEVBUF, mflags,
		    0ul, dmat->lowaddr,
		    dmat->alignment ? dmat->alignment : 1ul,
		    dmat->boundary);
	}
	if (*vaddr == NULL)
		return (ENOMEM);
	return (0);
}

/*
 * Free a piece of memory and its associated dmamap that was allocated
 * via bus_dmamem_alloc.  Make the same choice for free/contigfree.
 */
void
bus_dmamem_free(bus_dma_tag_t dmat, void *vaddr, bus_dmamap_t map)
{
	/*
	 * dmamem does not need to be bounced, so the map should be
	 * NULL
	 */
	if (map != NULL)
		panic("bus_dmamem_free: Invalid map freed\n");
	if ((dmat->maxsize <= PAGE_SIZE) &&
	    dmat->lowaddr >= ptoa(Maxmem))
		kfree(vaddr, M_DEVBUF);
	else
		contigfree(vaddr, dmat->maxsize, M_DEVBUF);
}

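/*
 * Example (sketch; "ring_dmat", "ring_va" and "ring_map" are hypothetical
 * names): allocating a zeroed descriptor ring that satisfies the tag's
 * constraints, and releasing it again:
 *
 *	if (bus_dmamem_alloc(ring_dmat, &ring_va, BUS_DMA_ZERO, &ring_map))
 *		return (ENOMEM);
 *	...
 *	bus_dmamem_free(ring_dmat, ring_va, ring_map);
 */
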
#define BUS_DMAMAP_NSEGS ((BUS_SPACE_MAXSIZE / PAGE_SIZE) + 1)
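/*
 * Worst case for BUS_DMAMAP_NSEGS: a transfer of BUS_SPACE_MAXSIZE bytes
 * that does not start on a page boundary touches one page per PAGE_SIZE
 * of length plus one more, hence the "+ 1".
 */
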
/*
 * Map the buffer buf into bus space using the dmamap map.
 */
int
bus_dmamap_load(bus_dma_tag_t dmat, bus_dmamap_t map, void *buf,
		bus_size_t buflen, bus_dmamap_callback_t *callback,
		void *callback_arg, int flags)
{
	vm_offset_t vaddr;
	vm_paddr_t paddr;
	bus_dma_segment_t *sg;
	int seg;
	int error = 0;
	vm_paddr_t nextpaddr;
	bus_addr_t bmask;

	if (map == NULL)
		map = &nobounce_dmamap;

	/*
	 * If we are being called during a callback, pagesneeded will
	 * be non-zero, so we can avoid doing the work twice.
	 */
	if (dmat->lowaddr < ptoa(Maxmem) &&
	    map->pagesneeded == 0) {
		vm_offset_t vendaddr;

		/*
		 * Count the number of bounce pages
		 * needed in order to complete this transfer
		 */
		vaddr = trunc_page((vm_offset_t)buf);
		vendaddr = (vm_offset_t)buf + buflen;

		while (vaddr < vendaddr) {
			paddr = pmap_kextract(vaddr);
			if (run_filter(dmat, paddr) != 0)
				map->pagesneeded++;
			vaddr += PAGE_SIZE;
		}
	}

	/* Reserve Necessary Bounce Pages */
	if (map->pagesneeded != 0) {
		crit_enter();
		if (reserve_bounce_pages(dmat, map) != 0) {
			/* Queue us for resources */
			map->dmat = dmat;
			map->buf = buf;
			map->buflen = buflen;
			map->callback = callback;
			map->callback_arg = callback_arg;

			STAILQ_INSERT_TAIL(&bounce_map_waitinglist, map, links);
			crit_exit();

			return (EINPROGRESS);
		}
		crit_exit();
	}

	vaddr = (vm_offset_t)buf;
	sg = dmat->segments;
	seg = 1;
	sg->ds_len = 0;
	nextpaddr = 0;

	bmask = ~(dmat->boundary - 1);	/* note: will be 0 if boundary is 0 */

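	/*
	 * Example: boundary = 0x10000 gives bmask = 0xffff0000; two
	 * addresses may share a segment only if they agree in those upper
	 * bits, i.e. lie within the same 64KB window.
	 */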
	/* force at least one segment */
	do {
		bus_size_t size;

		paddr = pmap_kextract(vaddr);
		size = PAGE_SIZE - (paddr & PAGE_MASK);
		if (size > buflen)
			size = buflen;

		if (map->pagesneeded != 0 && run_filter(dmat, paddr)) {
			/*
			 * note: this paddr has the same in-page offset
			 * as vaddr and thus the paddr above, so the
			 * size does not have to be recalculated
			 */
			paddr = add_bounce_page(dmat, map, vaddr, size);
		}

		/*
		 * Fill in the bus_dma_segment
		 */
		if (sg->ds_len == 0) {
			sg->ds_addr = paddr;
			sg->ds_len = size;
		} else if (paddr == nextpaddr) {
			sg->ds_len += size;
		} else {
			sg++;
			seg++;
			if (seg > dmat->nsegments)
				break;
			sg->ds_addr = paddr;
			sg->ds_len = size;
		}
		nextpaddr = paddr + size;

		/*
		 * Handle maxsegsz and boundary issues with a nested loop
		 */
		for (;;) {
			bus_size_t tmpsize;

			/*
			 * Limit to the boundary and maximum segment size
			 */
			if (((nextpaddr - 1) ^ sg->ds_addr) & bmask) {
				tmpsize = dmat->boundary -
					  (sg->ds_addr & ~bmask);
				if (tmpsize > dmat->maxsegsz)
					tmpsize = dmat->maxsegsz;
				KKASSERT(tmpsize < sg->ds_len);
			} else if (sg->ds_len > dmat->maxsegsz) {
				tmpsize = dmat->maxsegsz;
			} else {
				break;
			}

			/*
			 * Futz, split the data into a new segment.
			 */
			if (seg >= dmat->nsegments)
				goto fail;
			sg[1].ds_len = sg[0].ds_len - tmpsize;
			sg[1].ds_addr = sg[0].ds_addr + tmpsize;
			sg[0].ds_len = tmpsize;
			sg++;
			seg++;
		}

		vaddr += size;
		buflen -= size;
	} while (buflen > 0);
fail:
	if (buflen != 0) {
		kprintf("bus_dmamap_load: Too many segs! buf_len = 0x%lx\n",
			(u_long)buflen);
		error = EFBIG;
	}

	(*callback)(callback_arg, dmat->segments, seg, error);

	return (0);
}

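/*
 * Usage sketch (hypothetical driver code): the callback receives the
 * finished segment list and typically copies it into the device's
 * scatter/gather descriptors:
 *
 *	static void
 *	foo_dma_callback(void *arg, bus_dma_segment_t *segs, int nseg,
 *	    int error)
 *	{
 *		struct foo_softc *sc = arg;
 *		int i;
 *
 *		if (error)
 *			return;
 *		for (i = 0; i < nseg; i++)
 *			foo_set_sg_entry(sc, i, segs[i].ds_addr,
 *			    segs[i].ds_len);
 *	}
 *
 * A return value of EINPROGRESS means the load was deferred for bounce
 * pages; the callback runs later, from busdma_swi().
 */
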
/*
 * Utility function to load a linear buffer.  lastaddrp holds state
 * between invocations (for multiple-buffer loads).  segp contains
 * the starting segment on entrance, and the ending segment on exit.
 * first indicates if this is the first invocation of this function.
 */
static int
_bus_dmamap_load_buffer(bus_dma_tag_t dmat,
			void *buf, bus_size_t buflen,
			struct thread *td,
			int flags,
			vm_offset_t *lastaddrp,
			int *segp,
			int first)
{
	bus_dma_segment_t *segs;
	bus_size_t sgsize;
	bus_addr_t curaddr, lastaddr, baddr, bmask;
	vm_offset_t vaddr = (vm_offset_t)buf;
	int seg;
	pmap_t pmap;

	if (td->td_proc != NULL)
		pmap = vmspace_pmap(td->td_proc->p_vmspace);
	else
		pmap = NULL;

	segs = dmat->segments;
	lastaddr = *lastaddrp;
	bmask = ~(dmat->boundary - 1);

	for (seg = *segp; buflen > 0 ; ) {
		/*
		 * Get the physical address for this segment.
		 */
		if (pmap)
			curaddr = pmap_extract(pmap, vaddr);
		else
			curaddr = pmap_kextract(vaddr);

		/*
		 * Compute the segment size, and adjust counts.
		 */
		sgsize = PAGE_SIZE - ((u_long)curaddr & PAGE_MASK);
		if (buflen < sgsize)
			sgsize = buflen;

		/*
		 * Make sure we don't cross any boundaries.
		 */
		if (dmat->boundary > 0) {
			baddr = (curaddr + dmat->boundary) & bmask;
			if (sgsize > (baddr - curaddr))
				sgsize = (baddr - curaddr);
		}

		/*
		 * Insert chunk into a segment, coalescing with
		 * previous segment if possible.
		 */
		if (first) {
			segs[seg].ds_addr = curaddr;
			segs[seg].ds_len = sgsize;
			first = 0;
		} else {
			if (curaddr == lastaddr &&
			    (segs[seg].ds_len + sgsize) <= dmat->maxsegsz &&
			    (dmat->boundary == 0 ||
			     (segs[seg].ds_addr & bmask) == (curaddr & bmask))) {
				segs[seg].ds_len += sgsize;
			} else {
				if (++seg >= dmat->nsegments)
					break;
				segs[seg].ds_addr = curaddr;
				segs[seg].ds_len = sgsize;
			}
		}

		lastaddr = curaddr + sgsize;
		vaddr += sgsize;
		buflen -= sgsize;
	}

	*segp = seg;
	*lastaddrp = lastaddr;

	/*
	 * Did we fit?
	 */
	return (buflen != 0 ? EFBIG : 0); /* XXX better return value here? */
}

/*
 * Like _bus_dmamap_load(), but for mbufs.
 */
int
bus_dmamap_load_mbuf(bus_dma_tag_t dmat, bus_dmamap_t map,
		     struct mbuf *m0,
		     bus_dmamap_callback2_t *callback, void *callback_arg,
		     int flags)
{
	int nsegs, error;

	KASSERT(dmat->lowaddr >= ptoa(Maxmem) || map != NULL,
		("bus_dmamap_load_mbuf: No support for bounce pages!"));
	KASSERT(m0->m_flags & M_PKTHDR,
		("bus_dmamap_load_mbuf: no packet header"));

	nsegs = 0;
	error = 0;
	if (m0->m_pkthdr.len <= dmat->maxsize) {
		int first = 1;
		vm_offset_t lastaddr = 0;
		struct mbuf *m;

		for (m = m0; m != NULL && error == 0; m = m->m_next) {
			if (m->m_len == 0)
				continue;
			error = _bus_dmamap_load_buffer(dmat,
					m->m_data, m->m_len,
					curthread, flags, &lastaddr,
					&nsegs, first);
			first = 0;
		}
	} else {
		error = EINVAL;
	}

	if (error) {
		/* force "no valid mappings" in callback */
		(*callback)(callback_arg, dmat->segments, 0, 0, error);
	} else {
		(*callback)(callback_arg, dmat->segments,
			    nsegs+1, m0->m_pkthdr.len, error);
	}
	return (error);
}

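/*
 * Sketch of a network driver transmit path using this (names are
 * hypothetical):
 *
 *	error = bus_dmamap_load_mbuf(sc->tx_dmat, tx_map, m,
 *				     foo_txdma_callback, txd, BUS_DMA_NOWAIT);
 *
 * The callback2 form also receives the total mapped size
 * (m0->m_pkthdr.len here) in addition to the segment list.
 */
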
/*
 * Like _bus_dmamap_load(), but for uios.
 */
int
bus_dmamap_load_uio(bus_dma_tag_t dmat, bus_dmamap_t map,
		    struct uio *uio,
		    bus_dmamap_callback2_t *callback, void *callback_arg,
		    int flags)
{
	vm_offset_t lastaddr;
	int nsegs, error, first, i;
	bus_size_t resid;
	struct iovec *iov;
	struct thread *td = NULL;

	KASSERT(dmat->lowaddr >= ptoa(Maxmem) || map != NULL,
		("bus_dmamap_load_uio: No support for bounce pages!"));

	resid = uio->uio_resid;
	iov = uio->uio_iov;

	if (uio->uio_segflg == UIO_USERSPACE) {
		td = uio->uio_td;
		KASSERT(td != NULL && td->td_proc != NULL,
			("bus_dmamap_load_uio: USERSPACE but no proc"));
	}

	nsegs = 0;
	error = 0;
	first = 1;
	lastaddr = 0;
	for (i = 0; i < uio->uio_iovcnt && resid != 0 && !error; i++) {
		/*
		 * Now at the first iovec to load.  Load each iovec
		 * until we have exhausted the residual count.
		 */
		bus_size_t minlen =
			resid < iov[i].iov_len ? resid : iov[i].iov_len;
		caddr_t addr = (caddr_t) iov[i].iov_base;

		error = _bus_dmamap_load_buffer(dmat,
				addr, minlen,
				td, flags, &lastaddr, &nsegs, first);
		first = 0;

		resid -= minlen;
	}

	if (error) {
		/* force "no valid mappings" in callback */
		(*callback)(callback_arg, dmat->segments, 0, 0, error);
	} else {
		(*callback)(callback_arg, dmat->segments,
			    nsegs+1, uio->uio_resid, error);
	}
	return (error);
}

/*
 * Release the mapping held by map.
 */
void
_bus_dmamap_unload(bus_dma_tag_t dmat, bus_dmamap_t map)
{
	struct bounce_page *bpage;

	while ((bpage = STAILQ_FIRST(&map->bpages)) != NULL) {
		STAILQ_REMOVE_HEAD(&map->bpages, links);
		free_bounce_page(dmat, bpage);
	}
}

void
_bus_dmamap_sync(bus_dma_tag_t dmat, bus_dmamap_t map, bus_dmasync_op_t op)
{
	struct bounce_page *bpage;

	if ((bpage = STAILQ_FIRST(&map->bpages)) != NULL) {
		/*
		 * Handle data bouncing.  We might also
		 * want to add support for invalidating
		 * the caches on broken hardware
		 */
		switch (op) {
		case BUS_DMASYNC_PREWRITE:
			while (bpage != NULL) {
				bcopy((void *)bpage->datavaddr,
				      (void *)bpage->vaddr,
				      bpage->datacount);
				bpage = STAILQ_NEXT(bpage, links);
			}
			break;

		case BUS_DMASYNC_POSTREAD:
			while (bpage != NULL) {
				bcopy((void *)bpage->vaddr,
				      (void *)bpage->datavaddr,
				      bpage->datacount);
				bpage = STAILQ_NEXT(bpage, links);
			}
			break;

		case BUS_DMASYNC_PREREAD:
		case BUS_DMASYNC_POSTWRITE:
			break;
		}
	}
}

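/*
 * Ordering sketch for a driver using bounce buffers: call
 * bus_dmamap_sync(..., BUS_DMASYNC_PREWRITE) after filling the buffer
 * and before the device reads from it (client data is copied into the
 * bounce pages), and bus_dmamap_sync(..., BUS_DMASYNC_POSTREAD) after
 * the device has written and before the CPU examines the data (bounce
 * pages are copied back to the client buffer).
 */
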
static int
alloc_bounce_pages(bus_dma_tag_t dmat, u_int numpages)
{
	int count = 0;

	if (total_bpages == 0) {
		STAILQ_INIT(&bounce_page_list);
		STAILQ_INIT(&bounce_map_waitinglist);
		STAILQ_INIT(&bounce_map_callbacklist);
	}

	while (numpages > 0) {
		struct bounce_page *bpage;

		bpage = kmalloc(sizeof(*bpage), M_DEVBUF, M_INTWAIT | M_ZERO);

		bpage->vaddr = (vm_offset_t)contigmalloc(PAGE_SIZE, M_DEVBUF,
							 M_NOWAIT, 0ul,
							 dmat->lowaddr,
							 PAGE_SIZE,
							 0);
		if (bpage->vaddr == 0) {
			kfree(bpage, M_DEVBUF);
			break;
		}
		bpage->busaddr = pmap_kextract(bpage->vaddr);
		crit_enter();
		STAILQ_INSERT_TAIL(&bounce_page_list, bpage, links);
		total_bpages++;
		free_bpages++;
		crit_exit();
		count++;
		numpages--;
	}
	return (count);
}

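/*
 * Reserve as many free bounce pages as possible for the map.  Returns
 * the number of pages still outstanding; 0 means the map is fully
 * reserved and its deferred load may proceed.
 */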
static int
reserve_bounce_pages(bus_dma_tag_t dmat, bus_dmamap_t map)
{
	int pages;

	pages = MIN(free_bpages, map->pagesneeded - map->pagesreserved);
	free_bpages -= pages;
	reserved_bpages += pages;
	map->pagesreserved += pages;
	pages = map->pagesneeded - map->pagesreserved;

	return (pages);
}

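/*
 * Consume one reserved bounce page to shadow the client buffer at vaddr
 * for size bytes, and return the bus address the device should use in
 * place of the client buffer's physical address.
 */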
static bus_addr_t
add_bounce_page(bus_dma_tag_t dmat, bus_dmamap_t map, vm_offset_t vaddr,
		bus_size_t size)
{
	struct bounce_page *bpage;

	if (map->pagesneeded == 0)
		panic("add_bounce_page: map doesn't need any pages");
	map->pagesneeded--;

	if (map->pagesreserved == 0)
		panic("add_bounce_page: map doesn't need any pages");
	map->pagesreserved--;

	crit_enter();
	bpage = STAILQ_FIRST(&bounce_page_list);
	if (bpage == NULL)
		panic("add_bounce_page: free page list is empty");

	STAILQ_REMOVE_HEAD(&bounce_page_list, links);
	reserved_bpages--;
	active_bpages++;
	crit_exit();

	bpage->datavaddr = vaddr;
	bpage->datacount = size;
	STAILQ_INSERT_TAIL(&(map->bpages), bpage, links);
	return (bpage->busaddr);
}

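/*
 * Return a bounce page to the free pool.  If a deferred map is waiting
 * and can now be fully reserved, move it to the callback list and flag
 * the busdma software interrupt to re-run its load.
 */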
static void
free_bounce_page(bus_dma_tag_t dmat, struct bounce_page *bpage)
{
	struct bus_dmamap *map;

	bpage->datavaddr = 0;
	bpage->datacount = 0;

	crit_enter();
	STAILQ_INSERT_HEAD(&bounce_page_list, bpage, links);
	free_bpages++;
	active_bpages--;
	if ((map = STAILQ_FIRST(&bounce_map_waitinglist)) != NULL) {
		if (reserve_bounce_pages(map->dmat, map) == 0) {
			STAILQ_REMOVE_HEAD(&bounce_map_waitinglist, links);
			STAILQ_INSERT_TAIL(&bounce_map_callbacklist,
					   map, links);
			busdma_swi_pending = 1;
		}
	}
	crit_exit();
}

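/*
 * Software interrupt handler for queued deferred loads: re-issue
 * bus_dmamap_load() for each map that has obtained its bounce pages;
 * the client's original callback runs from here.
 */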
void
busdma_swi(void)
{
	struct bus_dmamap *map;

	crit_enter();
	while ((map = STAILQ_FIRST(&bounce_map_callbacklist)) != NULL) {
		STAILQ_REMOVE_HEAD(&bounce_map_callbacklist, links);
		crit_exit();
		bus_dmamap_load(map->dmat, map, map->buf, map->buflen,
				map->callback, map->callback_arg, /*flags*/0);
		crit_enter();
	}
	crit_exit();
}