/*
** PARISC 1.1 Dynamic DMA mapping support.
** This implementation is for PA-RISC platforms that do not support
** I/O TLBs (aka DMA address translation hardware).
** See Documentation/DMA-API-HOWTO.txt for interface definitions.
**
**	(c) Copyright 1999,2000 Hewlett-Packard Company
**	(c) Copyright 2000 Grant Grundler
**	(c) Copyright 2000 Philipp Rumpf <prumpf@tux.org>
**	(c) Copyright 2000 John Marvin
**
** "leveraged" from 2.3.47: arch/ia64/kernel/pci-dma.c.
** (I assume it's from David Mosberger-Tang but there was no Copyright)
**
** AFAIK, all PA7100LC and PA7300LC platforms can use this code.
*/
#include <linux/init.h>
#include <linux/gfp.h>
#include <linux/mm.h>
#include <linux/pci.h>
#include <linux/proc_fs.h>
#include <linux/seq_file.h>
#include <linux/string.h>
#include <linux/types.h>
#include <linux/scatterlist.h>
#include <linux/export.h>

#include <asm/cacheflush.h>
#include <asm/dma.h>		/* for DMA_CHUNK_SIZE */
#include <asm/io.h>		/* for virt_to_phys()/phys_to_virt() */
#include <asm/page.h>		/* for get_order() */
#include <asm/pgalloc.h>
#include <linux/uaccess.h>
#include <asm/tlbflush.h>	/* for purge_tlb_*() macros */
static struct proc_dir_entry *proc_gsc_root __read_mostly = NULL;
static unsigned long pcxl_used_bytes __read_mostly = 0;
static unsigned long pcxl_used_pages __read_mostly = 0;

extern unsigned long pcxl_dma_start;	/* start of pcxl dma mapping area */
static spinlock_t pcxl_res_lock;
static char *pcxl_res_map;
static int pcxl_res_hint;
static int pcxl_res_size;
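
/*
** pcxl_res_map is a bitmap covering the pcxl dma mapping area: one bit
** per page, so each byte of the map tracks eight pages.  pcxl_res_hint
** records the byte offset just past the most recent allocation so the
** next search can start there instead of rescanning from the beginning.
*/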
#ifdef DEBUG_PCXL_RESOURCE
#define DBG_RES(x...)	printk(x)
#else
#define DBG_RES(x...)
#endif

/*
** Dump a hex representation of the resource map.
*/

#ifdef DUMP_RESMAP
static
void dump_resmap(void)
{
	u_long *res_ptr = (u_long *)pcxl_res_map;
	u_long i = 0;

	printk("res_map: ");
	for (; i < (pcxl_res_size / sizeof(u_long)); ++i, ++res_ptr)
		printk("%08lx ", *res_ptr);

	printk("\n");
}
#else
static inline void dump_resmap(void) {;}
#endif
static int pa11_dma_supported(struct device *dev, u64 mask)
{
	return 1;
}
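
/*
** The next three routines walk the kernel page tables (pgd -> pmd -> pte)
** and install uncached translations (PAGE_KERNEL_UNC) for a virtual range
** inside the pcxl dma mapping area, so the CPU and a DMA device share a
** coherent view of the buffer without a cache flush on every access.
*/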
static inline int map_pte_uncached(pte_t *pte, unsigned long vaddr,
		unsigned long size, unsigned long *paddr_ptr)
{
	unsigned long end;
	unsigned long orig_vaddr = vaddr;

	vaddr &= ~PMD_MASK;
	end = vaddr + size;
	if (end > PMD_SIZE)
		end = PMD_SIZE;
	do {
		unsigned long flags;

		if (!pte_none(*pte))
			printk(KERN_ERR "map_pte_uncached: page already exists\n");
		purge_tlb_start(flags);
		set_pte(pte, __mk_pte(*paddr_ptr, PAGE_KERNEL_UNC));
		pdtlb_kernel(orig_vaddr);
		purge_tlb_end(flags);
		vaddr += PAGE_SIZE;
		orig_vaddr += PAGE_SIZE;
		(*paddr_ptr) += PAGE_SIZE;
		pte++;
	} while (vaddr < end);
	return 0;
}
static inline int map_pmd_uncached(pmd_t *pmd, unsigned long vaddr,
		unsigned long size, unsigned long *paddr_ptr)
{
	unsigned long end;
	unsigned long orig_vaddr = vaddr;

	vaddr &= ~PGDIR_MASK;
	end = vaddr + size;
	if (end > PGDIR_SIZE)
		end = PGDIR_SIZE;
	do {
		pte_t *pte = pte_alloc_kernel(pmd, vaddr);

		if (!pte)
			return -ENOMEM;
		if (map_pte_uncached(pte, orig_vaddr, end - vaddr, paddr_ptr))
			return -ENOMEM;
		vaddr = (vaddr + PMD_SIZE) & PMD_MASK;
		orig_vaddr += PMD_SIZE;
		pmd++;
	} while (vaddr < end);
	return 0;
}
static inline int map_uncached_pages(unsigned long vaddr, unsigned long size,
		unsigned long paddr)
{
	pgd_t *dir;
	unsigned long end = vaddr + size;

	dir = pgd_offset_k(vaddr);
	do {
		pmd_t *pmd;

		pmd = pmd_alloc(NULL, dir, vaddr);
		if (!pmd)
			return -ENOMEM;
		if (map_pmd_uncached(pmd, vaddr, end - vaddr, &paddr))
			return -ENOMEM;
		vaddr = vaddr + PGDIR_SIZE;
		dir++;
	} while (vaddr && (vaddr < end));
	return 0;
}
static inline void unmap_uncached_pte(pmd_t *pmd, unsigned long vaddr,
		unsigned long size)
{
	pte_t *pte;
	unsigned long end;
	unsigned long orig_vaddr = vaddr;

	if (pmd_none(*pmd))
		return;
	if (pmd_bad(*pmd)) {
		pmd_ERROR(*pmd);
		pmd_clear(pmd);
		return;
	}
	pte = pte_offset_map(pmd, vaddr);
	vaddr &= ~PMD_MASK;
	end = vaddr + size;
	if (end > PMD_SIZE)
		end = PMD_SIZE;
	do {
		unsigned long flags;
		pte_t page = *pte;

		pte_clear(&init_mm, vaddr, pte);
		purge_tlb_start(flags);
		pdtlb_kernel(orig_vaddr);
		purge_tlb_end(flags);
		vaddr += PAGE_SIZE;
		orig_vaddr += PAGE_SIZE;
		pte++;
		if (pte_none(page) || pte_present(page))
			continue;
		printk(KERN_CRIT "Whee.. Swapped out page in kernel page table\n");
	} while (vaddr < end);
}
static inline void unmap_uncached_pmd(pgd_t *dir, unsigned long vaddr,
		unsigned long size)
{
	pmd_t *pmd;
	unsigned long end;
	unsigned long orig_vaddr = vaddr;

	if (pgd_none(*dir))
		return;
	if (pgd_bad(*dir)) {
		pgd_ERROR(*dir);
		pgd_clear(dir);
		return;
	}
	pmd = pmd_offset(dir, vaddr);
	vaddr &= ~PGDIR_MASK;
	end = vaddr + size;
	if (end > PGDIR_SIZE)
		end = PGDIR_SIZE;
	do {
		unmap_uncached_pte(pmd, orig_vaddr, end - vaddr);
		vaddr = (vaddr + PMD_SIZE) & PMD_MASK;
		orig_vaddr += PMD_SIZE;
		pmd++;
	} while (vaddr < end);
}
static void unmap_uncached_pages(unsigned long vaddr, unsigned long size)
{
	pgd_t *dir;
	unsigned long end = vaddr + size;

	dir = pgd_offset_k(vaddr);
	do {
		unmap_uncached_pmd(dir, vaddr, end - vaddr);
		vaddr = vaddr + PGDIR_SIZE;
		dir++;
	} while (vaddr && (vaddr < end));
}
#define PCXL_SEARCH_LOOP(idx, mask, size)  \
	for (; res_ptr < res_end; ++res_ptr) \
	{ \
		if (0 == ((*res_ptr) & mask)) { \
			*res_ptr |= mask; \
			idx = (int)((u_long)res_ptr - (u_long)pcxl_res_map); \
			pcxl_res_hint = idx + (size >> 3); \
			goto resource_found; \
		} \
	}

#define PCXL_FIND_FREE_MAPPING(idx, mask, size)  { \
	u##size *res_ptr = (u##size *)&(pcxl_res_map[pcxl_res_hint & ~((size >> 3) - 1)]); \
	u##size *res_end = (u##size *)&pcxl_res_map[pcxl_res_size]; \
	PCXL_SEARCH_LOOP(idx, mask, size); \
	res_ptr = (u##size *)&pcxl_res_map[0]; \
	PCXL_SEARCH_LOOP(idx, mask, size); \
}
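
/*
** Example: a four-page allocation builds mask = 0xf and scans the map in
** u8 cells.  The first cell whose low four bits are all clear satisfies
** the request; the mask is OR'd in to claim it, and idx becomes that
** cell's byte offset into pcxl_res_map.  The second PCXL_SEARCH_LOOP pass
** restarts from the beginning of the map in case the hint skipped free
** space earlier in the bitmap.
*/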
unsigned long
pcxl_alloc_range(size_t size)
{
	int res_idx;
	u_long mask, flags;
	unsigned int pages_needed = size >> PAGE_SHIFT;

	mask = (u_long) -1L;
	mask >>= BITS_PER_LONG - pages_needed;

	DBG_RES("pcxl_alloc_range() size: %d pages_needed %d pages_mask 0x%08lx\n",
		size, pages_needed, mask);

	spin_lock_irqsave(&pcxl_res_lock, flags);

	if (pages_needed <= 8) {
		PCXL_FIND_FREE_MAPPING(res_idx, mask, 8);
	} else if (pages_needed <= 16) {
		PCXL_FIND_FREE_MAPPING(res_idx, mask, 16);
	} else if (pages_needed <= 32) {
		PCXL_FIND_FREE_MAPPING(res_idx, mask, 32);
	} else {
		panic("%s: pcxl_alloc_range() Too many pages to map.\n",
		      __FILE__);
	}

	dump_resmap();
	panic("%s: pcxl_alloc_range() out of dma mapping resources\n",
	      __FILE__);

resource_found:

	DBG_RES("pcxl_alloc_range() res_idx %d mask 0x%08lx res_hint: %d\n",
		res_idx, mask, pcxl_res_hint);

	pcxl_used_pages += pages_needed;
	pcxl_used_bytes += ((pages_needed >> 3) ? (pages_needed >> 3) : 1);

	spin_unlock_irqrestore(&pcxl_res_lock, flags);

	dump_resmap();

	/*
	** return the corresponding vaddr in the pcxl dma map
	*/
	return (pcxl_dma_start + (res_idx << (PAGE_SHIFT + 3)));
}
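
/*
** Note on the shift above: res_idx is a byte offset into the resource
** map and each byte covers eight pages, so the matching virtual address
** is pcxl_dma_start + res_idx * 8 * PAGE_SIZE, i.e.
** res_idx << (PAGE_SHIFT + 3).  A consequence is that every allocation
** starts on an 8-page boundary within the mapping area.
*/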
#define PCXL_FREE_MAPPINGS(idx, m, size) \
	u##size *res_ptr = (u##size *)&(pcxl_res_map[(idx) + (((size >> 3) - 1) & (~((size >> 3) - 1)))]); \
	/* BUG_ON((*res_ptr & m) != m); */ \
	*res_ptr &= ~m;
/*
** clear bits in the pcxl resource map
*/
static void
pcxl_free_range(unsigned long vaddr, size_t size)
{
	u_long mask, flags;
	unsigned int res_idx = (vaddr - pcxl_dma_start) >> (PAGE_SHIFT + 3);
	unsigned int pages_mapped = size >> PAGE_SHIFT;

	mask = (u_long) -1L;
	mask >>= BITS_PER_LONG - pages_mapped;

	DBG_RES("pcxl_free_range() res_idx: %d size: %d pages_mapped %d mask 0x%08lx\n",
		res_idx, size, pages_mapped, mask);

	spin_lock_irqsave(&pcxl_res_lock, flags);

	if (pages_mapped <= 8) {
		PCXL_FREE_MAPPINGS(res_idx, mask, 8);
	} else if (pages_mapped <= 16) {
		PCXL_FREE_MAPPINGS(res_idx, mask, 16);
	} else if (pages_mapped <= 32) {
		PCXL_FREE_MAPPINGS(res_idx, mask, 32);
	} else {
		panic("%s: pcxl_free_range() Too many pages to unmap.\n",
		      __FILE__);
	}

	pcxl_used_pages -= (pages_mapped ? pages_mapped : 1);
	pcxl_used_bytes -= ((pages_mapped >> 3) ? (pages_mapped >> 3) : 1);

	spin_unlock_irqrestore(&pcxl_res_lock, flags);

	dump_resmap();
}
static int proc_pcxl_dma_show(struct seq_file *m, void *v)
{
#if 0
	u_long i = 0;
	unsigned long *res_ptr = (u_long *)pcxl_res_map;
#endif
	unsigned long total_pages = pcxl_res_size << 3;	/* 8 bits per byte */

	seq_printf(m, "\nDMA Mapping Area size    : %d bytes (%ld pages)\n",
		PCXL_DMA_MAP_SIZE, total_pages);

	seq_printf(m, "Resource bitmap : %d bytes\n", pcxl_res_size);

	seq_puts(m,  "            total:    free:    used:   % used:\n");
	seq_printf(m, "blocks  %8d %8ld %8ld %8ld%%\n", pcxl_res_size,
		pcxl_res_size - pcxl_used_bytes, pcxl_used_bytes,
		(pcxl_used_bytes * 100) / pcxl_res_size);

	seq_printf(m, "pages   %8ld %8ld %8ld %8ld%%\n", total_pages,
		total_pages - pcxl_used_pages, pcxl_used_pages,
		(pcxl_used_pages * 100 / total_pages));

#if 0
	seq_puts(m, "\nResource bitmap:");

	for (; i < (pcxl_res_size / sizeof(u_long)); ++i, ++res_ptr) {
		if ((i & 7) == 0)
			seq_puts(m, "\n   ");
		seq_printf(m, "%s %08lx", buf, *res_ptr);
	}
#endif
	seq_putc(m, '\n');
	return 0;
}
static int proc_pcxl_dma_open(struct inode *inode, struct file *file)
{
	return single_open(file, proc_pcxl_dma_show, NULL);
}

static const struct file_operations proc_pcxl_dma_ops = {
	.owner		= THIS_MODULE,
	.open		= proc_pcxl_dma_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
static int __init
pcxl_dma_init(void)
{
	if (pcxl_dma_start == 0)
		return 0;

	spin_lock_init(&pcxl_res_lock);
	pcxl_res_size = PCXL_DMA_MAP_SIZE >> (PAGE_SHIFT + 3);
	pcxl_res_hint = 0;
	pcxl_res_map = (char *)__get_free_pages(GFP_KERNEL,
					    get_order(pcxl_res_size));
	memset(pcxl_res_map, 0, pcxl_res_size);
	proc_gsc_root = proc_mkdir("gsc", NULL);
	if (!proc_gsc_root)
		printk(KERN_WARNING
			"pcxl_dma_init: Unable to create gsc /proc dir entry\n");
	else {
		struct proc_dir_entry *ent;

		ent = proc_create("pcxl_dma", 0, proc_gsc_root,
				  &proc_pcxl_dma_ops);
		if (!ent)
			printk(KERN_WARNING
				"pci-dma.c: Unable to create pcxl_dma /proc entry.\n");
	}
	return 0;
}

__initcall(pcxl_dma_init);
static void *pa11_dma_alloc(struct device *dev, size_t size,
		dma_addr_t *dma_handle, gfp_t flag, unsigned long attrs)
{
	unsigned long vaddr;
	unsigned long paddr;
	int order;

	order = get_order(size);
	size = 1 << (order + PAGE_SHIFT);
	vaddr = pcxl_alloc_range(size);
	paddr = __get_free_pages(flag, order);
	/* flush the cached kernel mapping before converting to physical */
	flush_kernel_dcache_range(paddr, size);
	paddr = __pa(paddr);
	map_uncached_pages(vaddr, size, paddr);
	*dma_handle = (dma_addr_t) paddr;

#if 0
/* This probably isn't needed to support EISA cards.
** ISA cards will certainly only support 24-bit DMA addressing.
** Not clear if we can, want, or need to support ISA.
*/
	if (!dev || *dev->coherent_dma_mask < 0xffffffff)
		gfp |= GFP_DMA;
#endif
	return (void *)vaddr;
}
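
/*
** Drivers reach pa11_dma_alloc() through the generic DMA API rather than
** by calling it directly.  A minimal sketch of a caller (hypothetical
** device, sizes for illustration only):
**
**	void *cpu_addr;
**	dma_addr_t bus_addr;
**
**	cpu_addr = dma_alloc_coherent(dev, PAGE_SIZE, &bus_addr, GFP_KERNEL);
**	...	(cpu_addr is an uncached pcxl vaddr, bus_addr the
**		 physical address handed to the device)
**	dma_free_coherent(dev, PAGE_SIZE, cpu_addr, bus_addr);
**
** The buffer ends up with two mappings: the normal cached kernel mapping
** of the pages from __get_free_pages() (flushed once above) and the
** uncached pcxl mapping returned to the caller.
*/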
static void pa11_dma_free(struct device *dev, size_t size, void *vaddr,
		dma_addr_t dma_handle, unsigned long attrs)
{
	int order;

	order = get_order(size);
	size = 1 << (order + PAGE_SHIFT);
	unmap_uncached_pages((unsigned long)vaddr, size);
	pcxl_free_range((unsigned long)vaddr, size);
	free_pages((unsigned long)__va(dma_handle), order);
}
static dma_addr_t pa11_dma_map_page(struct device *dev, struct page *page,
		unsigned long offset, size_t size,
		enum dma_data_direction direction, unsigned long attrs)
{
	void *addr = page_address(page) + offset;

	BUG_ON(direction == DMA_NONE);

	if (!(attrs & DMA_ATTR_SKIP_CPU_SYNC))
		flush_kernel_dcache_range((unsigned long) addr, size);

	return virt_to_phys(addr);
}
static void pa11_dma_unmap_page(struct device *dev, dma_addr_t dma_handle,
		size_t size, enum dma_data_direction direction,
		unsigned long attrs)
{
	BUG_ON(direction == DMA_NONE);

	if (attrs & DMA_ATTR_SKIP_CPU_SYNC)
		return;

	if (direction == DMA_TO_DEVICE)
		return;

	/*
	 * For PCI_DMA_FROMDEVICE this flush is not necessary for the
	 * simple map/unmap case. However, it IS necessary if
	 * pci_dma_sync_single_* has been called and the buffer reused.
	 */

	flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle),
			size);
}
static int pa11_dma_map_sg(struct device *dev, struct scatterlist *sglist,
		int nents, enum dma_data_direction direction,
		unsigned long attrs)
{
	int i;
	struct scatterlist *sg;

	BUG_ON(direction == DMA_NONE);

	for_each_sg(sglist, sg, nents, i) {
		unsigned long vaddr = (unsigned long)sg_virt(sg);

		sg_dma_address(sg) = (dma_addr_t) virt_to_phys(vaddr);
		sg_dma_len(sg) = sg->length;

		if (attrs & DMA_ATTR_SKIP_CPU_SYNC)
			continue;

		flush_kernel_dcache_range(vaddr, sg->length);
	}
	return nents;
}
static void pa11_dma_unmap_sg(struct device *dev, struct scatterlist *sglist,
		int nents, enum dma_data_direction direction,
		unsigned long attrs)
{
	int i;
	struct scatterlist *sg;

	BUG_ON(direction == DMA_NONE);

	if (attrs & DMA_ATTR_SKIP_CPU_SYNC)
		return;

	if (direction == DMA_TO_DEVICE)
		return;

	/* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */

	for_each_sg(sglist, sg, nents, i)
		flush_kernel_vmap_range(sg_virt(sg), sg->length);
}
static void pa11_dma_sync_single_for_cpu(struct device *dev,
		dma_addr_t dma_handle, size_t size,
		enum dma_data_direction direction)
{
	BUG_ON(direction == DMA_NONE);

	flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle),
			size);
}

static void pa11_dma_sync_single_for_device(struct device *dev,
		dma_addr_t dma_handle, size_t size,
		enum dma_data_direction direction)
{
	BUG_ON(direction == DMA_NONE);

	flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle),
			size);
}
static void pa11_dma_sync_sg_for_cpu(struct device *dev,
		struct scatterlist *sglist, int nents,
		enum dma_data_direction direction)
{
	int i;
	struct scatterlist *sg;

	/* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */

	for_each_sg(sglist, sg, nents, i)
		flush_kernel_vmap_range(sg_virt(sg), sg->length);
}

static void pa11_dma_sync_sg_for_device(struct device *dev,
		struct scatterlist *sglist, int nents,
		enum dma_data_direction direction)
{
	int i;
	struct scatterlist *sg;

	/* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */

	for_each_sg(sglist, sg, nents, i)
		flush_kernel_vmap_range(sg_virt(sg), sg->length);
}
const struct dma_map_ops pcxl_dma_ops = {
	.dma_supported =	pa11_dma_supported,
	.alloc =		pa11_dma_alloc,
	.free =			pa11_dma_free,
	.map_page =		pa11_dma_map_page,
	.unmap_page =		pa11_dma_unmap_page,
	.map_sg =		pa11_dma_map_sg,
	.unmap_sg =		pa11_dma_unmap_sg,
	.sync_single_for_cpu =	pa11_dma_sync_single_for_cpu,
	.sync_single_for_device = pa11_dma_sync_single_for_device,
	.sync_sg_for_cpu =	pa11_dma_sync_sg_for_cpu,
	.sync_sg_for_device =	pa11_dma_sync_sg_for_device,
};
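
/*
** PCX (non-PCXL) machines cannot create uncached mappings, so they get a
** reduced ops table below: allocation only succeeds for
** DMA_ATTR_NON_CONSISTENT requests, where the caller accepts explicit
** dma_sync_* calls in place of a coherent buffer.
*/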
static void *pcx_dma_alloc(struct device *dev, size_t size,
		dma_addr_t *dma_handle, gfp_t flag, unsigned long attrs)
{
	void *addr;

	if ((attrs & DMA_ATTR_NON_CONSISTENT) == 0)
		return NULL;

	addr = (void *)__get_free_pages(flag, get_order(size));
	if (addr)
		*dma_handle = (dma_addr_t)virt_to_phys(addr);

	return addr;
}
*dev
, size_t size
, void *vaddr
,
605 dma_addr_t iova
, unsigned long attrs
)
607 free_pages((unsigned long)vaddr
, get_order(size
));
const struct dma_map_ops pcx_dma_ops = {
	.dma_supported =	pa11_dma_supported,
	.alloc =		pcx_dma_alloc,
	.free =			pcx_dma_free,
	.map_page =		pa11_dma_map_page,
	.unmap_page =		pa11_dma_unmap_page,
	.map_sg =		pa11_dma_map_sg,
	.unmap_sg =		pa11_dma_unmap_sg,
	.sync_single_for_cpu =	pa11_dma_sync_single_for_cpu,
	.sync_single_for_device = pa11_dma_sync_single_for_device,
	.sync_sg_for_cpu =	pa11_dma_sync_sg_for_cpu,
	.sync_sg_for_device =	pa11_dma_sync_sg_for_device,
};