2 ** PARISC 1.1 Dynamic DMA mapping support.
3 ** This implementation is for PA-RISC platforms that do not support
4 ** I/O TLBs (aka DMA address translation hardware).
5 ** See Documentation/DMA-mapping.txt for interface definitions.
7 ** (c) Copyright 1999,2000 Hewlett-Packard Company
8 ** (c) Copyright 2000 Grant Grundler
9 ** (c) Copyright 2000 Philipp Rumpf <prumpf@tux.org>
10 ** (c) Copyright 2000 John Marvin
12 ** "leveraged" from 2.3.47: arch/ia64/kernel/pci-dma.c.
13 ** (I assume it's from David Mosberger-Tang but there was no Copyright)
15 ** AFAIK, all PA7100LC and PA7300LC platforms can use this code.
20 #include <linux/init.h>
22 #include <linux/pci.h>
23 #include <linux/proc_fs.h>
24 #include <linux/slab.h>
25 #include <linux/string.h>
26 #include <linux/types.h>
28 #include <asm/cacheflush.h>
29 #include <asm/dma.h> /* for DMA_CHUNK_SIZE */
31 #include <asm/page.h> /* get_order */
32 #include <asm/pgalloc.h>
33 #include <asm/uaccess.h>
37 #define ASSERT(expr) \
39 printk("\n%s:%d: Assertion " #expr " failed!\n", \
40 __FILE__, __LINE__); \
48 static struct proc_dir_entry * proc_gsc_root = NULL;
49 static int pcxl_proc_info(char *buffer, char **start, off_t offset, int length);
50 static unsigned long pcxl_used_bytes = 0;
51 static unsigned long pcxl_used_pages = 0;
53 extern unsigned long pcxl_dma_start; /* Start of pcxl dma mapping area */
54 static spinlock_t pcxl_res_lock;
55 static char *pcxl_res_map;
56 static int pcxl_res_hint;
57 static int pcxl_res_size;
59 #ifdef DEBUG_PCXL_RESOURCE
60 #define DBG_RES(x...) printk(x)
67 ** Dump a hex representation of the resource map.
72 void dump_resmap(void)
74 u_long *res_ptr = (unsigned long *)pcxl_res_map;
78 for(; i < (pcxl_res_size / sizeof(unsigned long)); ++i, ++res_ptr)
79 printk("%08lx ", *res_ptr);
84 static inline void dump_resmap(void) {;}
87 static int pa11_dma_supported( struct device *dev, u64 mask)
92 static inline int map_pte_uncached(pte_t * pte,
94 unsigned long size, unsigned long *paddr_ptr)
97 unsigned long orig_vaddr = vaddr;
105 printk(KERN_ERR "map_pte_uncached: page already exists\n");
106 set_pte(pte, __mk_pte(*paddr_ptr, PAGE_KERNEL_UNC));
108 pdtlb_kernel(orig_vaddr);
111 orig_vaddr += PAGE_SIZE;
112 (*paddr_ptr) += PAGE_SIZE;
114 } while (vaddr < end);
118 static inline int map_pmd_uncached(pmd_t * pmd, unsigned long vaddr,
119 unsigned long size, unsigned long *paddr_ptr)
122 unsigned long orig_vaddr = vaddr;
124 vaddr &= ~PGDIR_MASK;
126 if (end > PGDIR_SIZE)
129 pte_t * pte = pte_alloc_kernel(&init_mm, pmd, vaddr);
132 if (map_pte_uncached(pte, orig_vaddr, end - vaddr, paddr_ptr))
134 vaddr = (vaddr + PMD_SIZE) & PMD_MASK;
135 orig_vaddr += PMD_SIZE;
137 } while (vaddr < end);
141 static inline int map_uncached_pages(unsigned long vaddr, unsigned long size,
145 unsigned long end = vaddr + size;
147 dir = pgd_offset_k(vaddr);
151 pmd = pmd_alloc(NULL, dir, vaddr);
154 if (map_pmd_uncached(pmd, vaddr, end - vaddr, &paddr))
156 vaddr = vaddr + PGDIR_SIZE;
158 } while (vaddr && (vaddr < end));
162 static inline void unmap_uncached_pte(pmd_t * pmd, unsigned long vaddr,
167 unsigned long orig_vaddr = vaddr;
176 pte = pte_offset_map(pmd, vaddr);
185 pdtlb_kernel(orig_vaddr);
188 orig_vaddr += PAGE_SIZE;
190 if (pte_none(page) || pte_present(page))
192 printk(KERN_CRIT "Whee.. Swapped out page in kernel page table\n");
193 } while (vaddr < end);
196 static inline void unmap_uncached_pmd(pgd_t * dir, unsigned long vaddr,
201 unsigned long orig_vaddr = vaddr;
210 pmd = pmd_offset(dir, vaddr);
211 vaddr &= ~PGDIR_MASK;
213 if (end > PGDIR_SIZE)
216 unmap_uncached_pte(pmd, orig_vaddr, end - vaddr);
217 vaddr = (vaddr + PMD_SIZE) & PMD_MASK;
218 orig_vaddr += PMD_SIZE;
220 } while (vaddr < end);
223 static void unmap_uncached_pages(unsigned long vaddr, unsigned long size)
226 unsigned long end = vaddr + size;
228 dir = pgd_offset_k(vaddr);
230 unmap_uncached_pmd(dir, vaddr, end - vaddr);
231 vaddr = vaddr + PGDIR_SIZE;
233 } while (vaddr && (vaddr < end));
236 #define PCXL_SEARCH_LOOP(idx, mask, size) \
237 for(; res_ptr < res_end; ++res_ptr) \
239 if(0 == ((*res_ptr) & mask)) { \
241 idx = (int)((u_long)res_ptr - (u_long)pcxl_res_map); \
242 pcxl_res_hint = idx + (size >> 3); \
243 goto resource_found; \
247 #define PCXL_FIND_FREE_MAPPING(idx, mask, size) { \
248 u##size *res_ptr = (u##size *)&(pcxl_res_map[pcxl_res_hint & ~((size >> 3) - 1)]); \
249 u##size *res_end = (u##size *)&pcxl_res_map[pcxl_res_size]; \
250 PCXL_SEARCH_LOOP(idx, mask, size); \
251 res_ptr = (u##size *)&pcxl_res_map[0]; \
252 PCXL_SEARCH_LOOP(idx, mask, size); \
256 pcxl_alloc_range(size_t size)
260 unsigned int pages_needed = size >> PAGE_SHIFT;
262 ASSERT(pages_needed);
263 ASSERT((pages_needed * PAGE_SIZE) < DMA_CHUNK_SIZE);
264 ASSERT(pages_needed < (BITS_PER_LONG - PAGE_SHIFT));
267 mask >>= BITS_PER_LONG - pages_needed;
269 DBG_RES("pcxl_alloc_range() size: %d pages_needed %d pages_mask 0x%08lx\n",
270 size, pages_needed, mask);
272 spin_lock_irqsave(&pcxl_res_lock, flags);
274 if(pages_needed <= 8) {
275 PCXL_FIND_FREE_MAPPING(res_idx, mask, 8);
276 } else if(pages_needed <= 16) {
277 PCXL_FIND_FREE_MAPPING(res_idx, mask, 16);
278 } else if(pages_needed <= 32) {
279 PCXL_FIND_FREE_MAPPING(res_idx, mask, 32);
281 panic("%s: pcxl_alloc_range() Too many pages to map.\n",
286 panic("%s: pcxl_alloc_range() out of dma mapping resources\n",
291 DBG_RES("pcxl_alloc_range() res_idx %d mask 0x%08lx res_hint: %d\n",
292 res_idx, mask, pcxl_res_hint);
294 pcxl_used_pages += pages_needed;
295 pcxl_used_bytes += ((pages_needed >> 3) ? (pages_needed >> 3) : 1);
297 spin_unlock_irqrestore(&pcxl_res_lock, flags);
302 ** return the corresponding vaddr in the pcxl dma map
304 return (pcxl_dma_start + (res_idx << (PAGE_SHIFT + 3)));
307 #define PCXL_FREE_MAPPINGS(idx, m, size) \
308 u##size *res_ptr = (u##size *)&(pcxl_res_map[(idx) + (((size >> 3) - 1) & (~((size >> 3) - 1)))]); \
309 ASSERT((*res_ptr & m) == m); \
313 ** clear bits in the pcxl resource map
316 pcxl_free_range(unsigned long vaddr, size_t size)
319 unsigned int res_idx = (vaddr - pcxl_dma_start) >> (PAGE_SHIFT + 3);
320 unsigned int pages_mapped = size >> PAGE_SHIFT;
322 ASSERT(pages_mapped);
323 ASSERT((pages_mapped * PAGE_SIZE) < DMA_CHUNK_SIZE);
324 ASSERT(pages_mapped < (BITS_PER_LONG - PAGE_SHIFT));
327 mask >>= BITS_PER_LONG - pages_mapped;
329 DBG_RES("pcxl_free_range() res_idx: %d size: %d pages_mapped %d mask 0x%08lx\n",
330 res_idx, size, pages_mapped, mask);
332 spin_lock_irqsave(&pcxl_res_lock, flags);
334 if(pages_mapped <= 8) {
335 PCXL_FREE_MAPPINGS(res_idx, mask, 8);
336 } else if(pages_mapped <= 16) {
337 PCXL_FREE_MAPPINGS(res_idx, mask, 16);
338 } else if(pages_mapped <= 32) {
339 PCXL_FREE_MAPPINGS(res_idx, mask, 32);
341 panic("%s: pcxl_free_range() Too many pages to unmap.\n",
345 pcxl_used_pages -= (pages_mapped ? pages_mapped : 1);
346 pcxl_used_bytes -= ((pages_mapped >> 3) ? (pages_mapped >> 3) : 1);
348 spin_unlock_irqrestore(&pcxl_res_lock, flags);
356 if (pcxl_dma_start == 0)
359 spin_lock_init(&pcxl_res_lock);
360 pcxl_res_size = PCXL_DMA_MAP_SIZE >> (PAGE_SHIFT + 3);
362 pcxl_res_map = (char *)__get_free_pages(GFP_KERNEL,
363 get_order(pcxl_res_size));
364 memset(pcxl_res_map, 0, pcxl_res_size);
365 proc_gsc_root = proc_mkdir("gsc", 0);
366 create_proc_info_entry("dino", 0, proc_gsc_root, pcxl_proc_info);
370 __initcall(pcxl_dma_init);
372 static void * pa11_dma_alloc_consistent (struct device *dev, size_t size, dma_addr_t *dma_handle, int flag)
378 order = get_order(size);
379 size = 1 << (order + PAGE_SHIFT);
380 vaddr = pcxl_alloc_range(size);
381 paddr = __get_free_pages(flag, order);
382 flush_kernel_dcache_range(paddr, size);
384 map_uncached_pages(vaddr, size, paddr);
385 *dma_handle = (dma_addr_t) paddr;
388 /* This probably isn't needed to support EISA cards.
389 ** ISA cards will certainly only support 24-bit DMA addressing.
390 ** Not clear if we can, want, or need to support ISA.
392 if (!dev || *dev->coherent_dma_mask < 0xffffffff)
395 return (void *)vaddr;
398 static void pa11_dma_free_consistent (struct device *dev, size_t size, void *vaddr, dma_addr_t dma_handle)
402 order = get_order(size);
403 size = 1 << (order + PAGE_SHIFT);
404 unmap_uncached_pages((unsigned long)vaddr, size);
405 pcxl_free_range((unsigned long)vaddr, size);
406 free_pages((unsigned long)__va(dma_handle), order);
409 static dma_addr_t pa11_dma_map_single(struct device *dev, void *addr, size_t size, enum dma_data_direction direction)
411 if (direction == DMA_NONE) {
412 printk(KERN_ERR "pa11_dma_map_single(PCI_DMA_NONE) called by %p\n", __builtin_return_address(0));
416 flush_kernel_dcache_range((unsigned long) addr, size);
417 return virt_to_phys(addr);
420 static void pa11_dma_unmap_single(struct device *dev, dma_addr_t dma_handle, size_t size, enum dma_data_direction direction)
422 if (direction == DMA_NONE) {
423 printk(KERN_ERR "pa11_dma_unmap_single(PCI_DMA_NONE) called by %p\n", __builtin_return_address(0));
427 if (direction == DMA_TO_DEVICE)
431 * For PCI_DMA_FROMDEVICE this flush is not necessary for the
432 * simple map/unmap case. However, it IS necessary if if
433 * pci_dma_sync_single_* has been called and the buffer reused.
436 flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle), size);
440 static int pa11_dma_map_sg(struct device *dev, struct scatterlist *sglist, int nents, enum dma_data_direction direction)
444 if (direction == DMA_NONE)
447 for (i = 0; i < nents; i++, sglist++ ) {
448 unsigned long vaddr = sg_virt_addr(sglist);
449 sg_dma_address(sglist) = (dma_addr_t) virt_to_phys(vaddr);
450 sg_dma_len(sglist) = sglist->length;
451 flush_kernel_dcache_range(vaddr, sglist->length);
456 static void pa11_dma_unmap_sg(struct device *dev, struct scatterlist *sglist, int nents, enum dma_data_direction direction)
460 if (direction == DMA_NONE)
463 if (direction == DMA_TO_DEVICE)
466 /* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */
468 for (i = 0; i < nents; i++, sglist++ )
469 flush_kernel_dcache_range(sg_virt_addr(sglist), sglist->length);
473 static void pa11_dma_sync_single_for_cpu(struct device *dev, dma_addr_t dma_handle, unsigned long offset, size_t size, enum dma_data_direction direction)
475 if (direction == DMA_NONE)
478 flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle) + offset, size);
481 static void pa11_dma_sync_single_for_device(struct device *dev, dma_addr_t dma_handle, unsigned long offset, size_t size, enum dma_data_direction direction)
483 if (direction == DMA_NONE)
486 flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle) + offset, size);
489 static void pa11_dma_sync_sg_for_cpu(struct device *dev, struct scatterlist *sglist, int nents, enum dma_data_direction direction)
493 /* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */
495 for (i = 0; i < nents; i++, sglist++ )
496 flush_kernel_dcache_range(sg_virt_addr(sglist), sglist->length);
499 static void pa11_dma_sync_sg_for_device(struct device *dev, struct scatterlist *sglist, int nents, enum dma_data_direction direction)
503 /* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */
505 for (i = 0; i < nents; i++, sglist++ )
506 flush_kernel_dcache_range(sg_virt_addr(sglist), sglist->length);
509 struct hppa_dma_ops pcxl_dma_ops = {
510 .dma_supported = pa11_dma_supported,
511 .alloc_consistent = pa11_dma_alloc_consistent,
512 .alloc_noncoherent = pa11_dma_alloc_consistent,
513 .free_consistent = pa11_dma_free_consistent,
514 .map_single = pa11_dma_map_single,
515 .unmap_single = pa11_dma_unmap_single,
516 .map_sg = pa11_dma_map_sg,
517 .unmap_sg = pa11_dma_unmap_sg,
518 .dma_sync_single_for_cpu = pa11_dma_sync_single_for_cpu,
519 .dma_sync_single_for_device = pa11_dma_sync_single_for_device,
520 .dma_sync_sg_for_cpu = pa11_dma_sync_sg_for_cpu,
521 .dma_sync_sg_for_device = pa11_dma_sync_sg_for_device,
524 static void *fail_alloc_consistent(struct device *dev, size_t size,
525 dma_addr_t *dma_handle, int flag)
530 static void *pa11_dma_alloc_noncoherent(struct device *dev, size_t size,
531 dma_addr_t *dma_handle, int flag)
535 /* rely on kmalloc to be cacheline aligned */
536 addr = kmalloc(size, flag);
538 *dma_handle = (dma_addr_t)virt_to_phys(addr);
543 static void pa11_dma_free_noncoherent(struct device *dev, size_t size,
544 void *vaddr, dma_addr_t iova)
550 struct hppa_dma_ops pcx_dma_ops = {
551 .dma_supported = pa11_dma_supported,
552 .alloc_consistent = fail_alloc_consistent,
553 .alloc_noncoherent = pa11_dma_alloc_noncoherent,
554 .free_consistent = pa11_dma_free_noncoherent,
555 .map_single = pa11_dma_map_single,
556 .unmap_single = pa11_dma_unmap_single,
557 .map_sg = pa11_dma_map_sg,
558 .unmap_sg = pa11_dma_unmap_sg,
559 .dma_sync_single_for_cpu = pa11_dma_sync_single_for_cpu,
560 .dma_sync_single_for_device = pa11_dma_sync_single_for_device,
561 .dma_sync_sg_for_cpu = pa11_dma_sync_sg_for_cpu,
562 .dma_sync_sg_for_device = pa11_dma_sync_sg_for_device,
566 static int pcxl_proc_info(char *buf, char **start, off_t offset, int len)
569 unsigned long *res_ptr = (u_long *)pcxl_res_map;
570 unsigned long total_pages = pcxl_res_size << 3; /* 8 bits per byte */
572 sprintf(buf, "\nDMA Mapping Area size : %d bytes (%d pages)\n",
574 (pcxl_res_size << 3) ); /* 1 bit per page */
576 sprintf(buf, "%sResource bitmap : %d bytes (%d pages)\n",
577 buf, pcxl_res_size, pcxl_res_size << 3); /* 8 bits per byte */
579 strcat(buf, " total: free: used: % used:\n");
580 sprintf(buf, "%sblocks %8d %8ld %8ld %8ld%%\n", buf, pcxl_res_size,
581 pcxl_res_size - pcxl_used_bytes, pcxl_used_bytes,
582 (pcxl_used_bytes * 100) / pcxl_res_size);
584 sprintf(buf, "%spages %8ld %8ld %8ld %8ld%%\n", buf, total_pages,
585 total_pages - pcxl_used_pages, pcxl_used_pages,
586 (pcxl_used_pages * 100 / total_pages));
588 strcat(buf, "\nResource bitmap:");
590 for(; i < (pcxl_res_size / sizeof(u_long)); ++i, ++res_ptr) {
593 sprintf(buf, "%s %08lx", buf, *res_ptr);