/*
** PARISC 1.1 Dynamic DMA mapping support.
** This implementation is for PA-RISC platforms that do not support
** I/O TLBs (aka DMA address translation hardware).
** See Documentation/DMA-mapping.txt for interface definitions.
**
** (c) Copyright 1999,2000 Hewlett-Packard Company
** (c) Copyright 2000 Grant Grundler
** (c) Copyright 2000 Philipp Rumpf <prumpf@tux.org>
** (c) Copyright 2000 John Marvin
**
** "leveraged" from 2.3.47: arch/ia64/kernel/pci-dma.c.
** (I assume it's from David Mosberger-Tang but there was no Copyright)
**
** AFAIK, all PA7100LC and PA7300LC platforms can use this code.
**
** - ggg
*/

#include <linux/init.h>
#include <linux/mm.h>
#include <linux/pci.h>
#include <linux/proc_fs.h>
#include <linux/seq_file.h>
#include <linux/slab.h>
#include <linux/string.h>
#include <linux/types.h>

#include <asm/cacheflush.h>
#include <asm/dma.h>		/* for DMA_CHUNK_SIZE */
#include <asm/io.h>
#include <asm/page.h>		/* get_order */
#include <asm/pgalloc.h>
#include <asm/uaccess.h>
#include <asm/tlbflush.h>	/* for purge_tlb_*() macros */

static struct proc_dir_entry * proc_gsc_root __read_mostly = NULL;
static unsigned long pcxl_used_bytes __read_mostly = 0;
static unsigned long pcxl_used_pages __read_mostly = 0;

extern unsigned long pcxl_dma_start; /* Start of pcxl dma mapping area */
static spinlock_t pcxl_res_lock;
static char    *pcxl_res_map;
static int     pcxl_res_hint;
static int     pcxl_res_size;

#ifdef DEBUG_PCXL_RESOURCE
#define DBG_RES(x...)	printk(x)
#else
#define DBG_RES(x...)
#endif


/*
** Dump a hex representation of the resource map.
*/

#ifdef DUMP_RESMAP
static
void dump_resmap(void)
{
	u_long *res_ptr = (unsigned long *)pcxl_res_map;
	u_long i = 0;

	printk("res_map: ");
	for(; i < (pcxl_res_size / sizeof(unsigned long)); ++i, ++res_ptr)
		printk("%08lx ", *res_ptr);

	printk("\n");
}
#else
static inline void dump_resmap(void) {;}
#endif

static int pa11_dma_supported(struct device *dev, u64 mask)
{
	return 1;
}

static inline int map_pte_uncached(pte_t * pte,
		unsigned long vaddr,
		unsigned long size, unsigned long *paddr_ptr)
{
	unsigned long end;
	unsigned long orig_vaddr = vaddr;

	vaddr &= ~PMD_MASK;
	end = vaddr + size;
	if (end > PMD_SIZE)
		end = PMD_SIZE;
	do {
		if (!pte_none(*pte))
			printk(KERN_ERR "map_pte_uncached: page already exists\n");
		set_pte(pte, __mk_pte(*paddr_ptr, PAGE_KERNEL_UNC));
		purge_tlb_start();
		pdtlb_kernel(orig_vaddr);
		purge_tlb_end();
		vaddr += PAGE_SIZE;
		orig_vaddr += PAGE_SIZE;
		(*paddr_ptr) += PAGE_SIZE;
		pte++;
	} while (vaddr < end);
	return 0;
}

static inline int map_pmd_uncached(pmd_t * pmd, unsigned long vaddr,
		unsigned long size, unsigned long *paddr_ptr)
{
	unsigned long end;
	unsigned long orig_vaddr = vaddr;

	vaddr &= ~PGDIR_MASK;
	end = vaddr + size;
	if (end > PGDIR_SIZE)
		end = PGDIR_SIZE;
	do {
		pte_t * pte = pte_alloc_kernel(pmd, vaddr);
		if (!pte)
			return -ENOMEM;
		if (map_pte_uncached(pte, orig_vaddr, end - vaddr, paddr_ptr))
			return -ENOMEM;
		vaddr = (vaddr + PMD_SIZE) & PMD_MASK;
		orig_vaddr += PMD_SIZE;
		pmd++;
	} while (vaddr < end);
	return 0;
}

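/*
** map_uncached_pages() below is the top of the walk: it steps through the
** kernel page directory one PGDIR_SIZE chunk at a time and lets
** map_pmd_uncached()/map_pte_uncached() above fill in the lower levels,
** purging the TLB as each uncached PTE is installed.  A minimal sketch of
** the intended call pattern (illustrative only; "buf" and "bytes" are a
** caller's values, not defined in this file):
**
**	unsigned long va = pcxl_alloc_range(bytes);
**	unsigned long pa = __pa(buf);
**	map_uncached_pages(va, bytes, pa);   -- va now maps pa, uncached
*/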
static inline int map_uncached_pages(unsigned long vaddr, unsigned long size,
		unsigned long paddr)
{
	pgd_t * dir;
	unsigned long end = vaddr + size;

	dir = pgd_offset_k(vaddr);
	do {
		pmd_t *pmd;

		pmd = pmd_alloc(NULL, dir, vaddr);
		if (!pmd)
			return -ENOMEM;
		if (map_pmd_uncached(pmd, vaddr, end - vaddr, &paddr))
			return -ENOMEM;
		vaddr = vaddr + PGDIR_SIZE;
		dir++;
	} while (vaddr && (vaddr < end));
	return 0;
}

static inline void unmap_uncached_pte(pmd_t * pmd, unsigned long vaddr,
		unsigned long size)
{
	pte_t * pte;
	unsigned long end;
	unsigned long orig_vaddr = vaddr;

	if (pmd_none(*pmd))
		return;
	if (pmd_bad(*pmd)) {
		pmd_ERROR(*pmd);
		pmd_clear(pmd);
		return;
	}
	pte = pte_offset_map(pmd, vaddr);
	vaddr &= ~PMD_MASK;
	end = vaddr + size;
	if (end > PMD_SIZE)
		end = PMD_SIZE;
	do {
		pte_t page = *pte;
		pte_clear(&init_mm, vaddr, pte);
		purge_tlb_start();
		pdtlb_kernel(orig_vaddr);
		purge_tlb_end();
		vaddr += PAGE_SIZE;
		orig_vaddr += PAGE_SIZE;
		pte++;
		if (pte_none(page) || pte_present(page))
			continue;
		printk(KERN_CRIT "Whee.. Swapped out page in kernel page table\n");
	} while (vaddr < end);
}

static inline void unmap_uncached_pmd(pgd_t * dir, unsigned long vaddr,
		unsigned long size)
{
	pmd_t * pmd;
	unsigned long end;
	unsigned long orig_vaddr = vaddr;

	if (pgd_none(*dir))
		return;
	if (pgd_bad(*dir)) {
		pgd_ERROR(*dir);
		pgd_clear(dir);
		return;
	}
	pmd = pmd_offset(dir, vaddr);
	vaddr &= ~PGDIR_MASK;
	end = vaddr + size;
	if (end > PGDIR_SIZE)
		end = PGDIR_SIZE;
	do {
		unmap_uncached_pte(pmd, orig_vaddr, end - vaddr);
		vaddr = (vaddr + PMD_SIZE) & PMD_MASK;
		orig_vaddr += PMD_SIZE;
		pmd++;
	} while (vaddr < end);
}

static void unmap_uncached_pages(unsigned long vaddr, unsigned long size)
{
	pgd_t * dir;
	unsigned long end = vaddr + size;

	dir = pgd_offset_k(vaddr);
	do {
		unmap_uncached_pmd(dir, vaddr, end - vaddr);
		vaddr = vaddr + PGDIR_SIZE;
		dir++;
	} while (vaddr && (vaddr < end));
}

#define PCXL_SEARCH_LOOP(idx, mask, size)  \
	for(; res_ptr < res_end; ++res_ptr) \
	{ \
		if(0 == ((*res_ptr) & mask)) { \
			*res_ptr |= mask; \
			idx = (int)((u_long)res_ptr - (u_long)pcxl_res_map); \
			pcxl_res_hint = idx + (size >> 3); \
			goto resource_found; \
		} \
	}

#define PCXL_FIND_FREE_MAPPING(idx, mask, size)  { \
	u##size *res_ptr = (u##size *)&(pcxl_res_map[pcxl_res_hint & ~((size >> 3) - 1)]); \
	u##size *res_end = (u##size *)&pcxl_res_map[pcxl_res_size]; \
	PCXL_SEARCH_LOOP(idx, mask, size); \
	res_ptr = (u##size *)&pcxl_res_map[0]; \
	PCXL_SEARCH_LOOP(idx, mask, size); \
}

unsigned long
pcxl_alloc_range(size_t size)
{
	int res_idx;
	u_long mask, flags;
	unsigned int pages_needed = size >> PAGE_SHIFT;

	mask = (u_long) -1L;
	mask >>= BITS_PER_LONG - pages_needed;

	DBG_RES("pcxl_alloc_range() size: %d pages_needed %d pages_mask 0x%08lx\n",
		size, pages_needed, mask);

	spin_lock_irqsave(&pcxl_res_lock, flags);

	if(pages_needed <= 8) {
		PCXL_FIND_FREE_MAPPING(res_idx, mask, 8);
	} else if(pages_needed <= 16) {
		PCXL_FIND_FREE_MAPPING(res_idx, mask, 16);
	} else if(pages_needed <= 32) {
		PCXL_FIND_FREE_MAPPING(res_idx, mask, 32);
	} else {
		panic("%s: pcxl_alloc_range() Too many pages to map.\n",
		      __FILE__);
	}

	dump_resmap();
	panic("%s: pcxl_alloc_range() out of dma mapping resources\n",
	      __FILE__);

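	/*
	** Control reaches the panic() above only when both passes of
	** PCXL_FIND_FREE_MAPPING() fail; a successful PCXL_SEARCH_LOOP()
	** jumps here instead.  The search mask built earlier is simply the
	** low pages_needed bits: e.g. pages_needed = 3 gives mask = 0x7, so
	** a free run of three map bits is claimed with a single OR.
	*/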
resource_found:

	DBG_RES("pcxl_alloc_range() res_idx %d mask 0x%08lx res_hint: %d\n",
		res_idx, mask, pcxl_res_hint);

	pcxl_used_pages += pages_needed;
	pcxl_used_bytes += ((pages_needed >> 3) ? (pages_needed >> 3) : 1);

	spin_unlock_irqrestore(&pcxl_res_lock, flags);

	dump_resmap();

	/*
	** return the corresponding vaddr in the pcxl dma map
	*/
	return (pcxl_dma_start + (res_idx << (PAGE_SHIFT + 3)));
}

#define PCXL_FREE_MAPPINGS(idx, m, size) \
	u##size *res_ptr = (u##size *)&(pcxl_res_map[(idx) + (((size >> 3) - 1) & (~((size >> 3) - 1)))]); \
	/* BUG_ON((*res_ptr & m) != m); */ \
	*res_ptr &= ~m;

/*
** clear bits in the pcxl resource map
*/
static void
pcxl_free_range(unsigned long vaddr, size_t size)
{
	u_long mask, flags;
	unsigned int res_idx = (vaddr - pcxl_dma_start) >> (PAGE_SHIFT + 3);
	unsigned int pages_mapped = size >> PAGE_SHIFT;

	mask = (u_long) -1L;
	mask >>= BITS_PER_LONG - pages_mapped;

	DBG_RES("pcxl_free_range() res_idx: %d size: %d pages_mapped %d mask 0x%08lx\n",
		res_idx, size, pages_mapped, mask);

	spin_lock_irqsave(&pcxl_res_lock, flags);

	if(pages_mapped <= 8) {
		PCXL_FREE_MAPPINGS(res_idx, mask, 8);
	} else if(pages_mapped <= 16) {
		PCXL_FREE_MAPPINGS(res_idx, mask, 16);
	} else if(pages_mapped <= 32) {
		PCXL_FREE_MAPPINGS(res_idx, mask, 32);
	} else {
		panic("%s: pcxl_free_range() Too many pages to unmap.\n",
		      __FILE__);
	}

	pcxl_used_pages -= (pages_mapped ? pages_mapped : 1);
	pcxl_used_bytes -= ((pages_mapped >> 3) ? (pages_mapped >> 3) : 1);

	spin_unlock_irqrestore(&pcxl_res_lock, flags);

	dump_resmap();
}

static int proc_pcxl_dma_show(struct seq_file *m, void *v)
{
	unsigned long total_pages = pcxl_res_size << 3;	/* 8 bits per byte */

	seq_printf(m, "\nDMA Mapping Area size: %d bytes (%ld pages)\n",
		PCXL_DMA_MAP_SIZE, total_pages);

	seq_printf(m, "Resource bitmap : %d bytes\n", pcxl_res_size);

	seq_puts(m,  "          total:    free:    used:   %% used:\n");
	seq_printf(m, "blocks  %8d %8ld %8ld %8ld%%\n", pcxl_res_size,
		pcxl_res_size - pcxl_used_bytes, pcxl_used_bytes,
		(pcxl_used_bytes * 100) / pcxl_res_size);

	seq_printf(m, "pages   %8ld %8ld %8ld %8ld%%\n", total_pages,
		total_pages - pcxl_used_pages, pcxl_used_pages,
		(pcxl_used_pages * 100 / total_pages));

	seq_putc(m, '\n');
	return 0;
}

static int proc_pcxl_dma_open(struct inode *inode, struct file *file)
{
	return single_open(file, proc_pcxl_dma_show, NULL);
}

static const struct file_operations proc_pcxl_dma_ops = {
	.owner		= THIS_MODULE,
	.open		= proc_pcxl_dma_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};

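/*
** Sizing note (a worked example, not a constant taken from this file):
** the resource map spends one bit per DMA page, so pcxl_dma_init() below
** computes pcxl_res_size = PCXL_DMA_MAP_SIZE >> (PAGE_SHIFT + 3), i.e.
** map_bytes = map_area_bytes / page_size / 8.  An 8MB map area with 4kB
** pages, for instance, would need 8MB / 4kB / 8 = 256 bytes of bitmap.
*/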
static int __init
pcxl_dma_init(void)
{
	if (pcxl_dma_start == 0)
		return 0;

	spin_lock_init(&pcxl_res_lock);
	pcxl_res_size = PCXL_DMA_MAP_SIZE >> (PAGE_SHIFT + 3);
	pcxl_res_hint = 0;
	pcxl_res_map = (char *)__get_free_pages(GFP_KERNEL,
					    get_order(pcxl_res_size));
	memset(pcxl_res_map, 0, pcxl_res_size);
	proc_gsc_root = proc_mkdir("gsc", NULL);
	if (!proc_gsc_root)
		printk(KERN_WARNING
			"pcxl_dma_init: Unable to create gsc /proc dir entry\n");
	else {
		struct proc_dir_entry* ent;
		ent = create_proc_entry("pcxl_dma", 0, proc_gsc_root);
		if (ent)
			ent->proc_fops = &proc_pcxl_dma_ops;
		else
			printk(KERN_WARNING
				"pci-dma.c: Unable to create pcxl_dma /proc entry.\n");
	}
	return 0;
}

__initcall(pcxl_dma_init);

static void * pa11_dma_alloc_consistent (struct device *dev, size_t size, dma_addr_t *dma_handle, gfp_t flag)
{
	unsigned long vaddr;
	unsigned long paddr;
	int order;

	order = get_order(size);
	size = 1 << (order + PAGE_SHIFT);
	vaddr = pcxl_alloc_range(size);
	paddr = __get_free_pages(flag, order);
	flush_kernel_dcache_range(paddr, size);
	paddr = __pa(paddr);
	map_uncached_pages(vaddr, size, paddr);
	*dma_handle = (dma_addr_t) paddr;

	return (void *)vaddr;
}

static void pa11_dma_free_consistent (struct device *dev, size_t size, void *vaddr, dma_addr_t dma_handle)
{
	int order;

	order = get_order(size);
	size = 1 << (order + PAGE_SHIFT);
	unmap_uncached_pages((unsigned long)vaddr, size);
	pcxl_free_range((unsigned long)vaddr, size);
	free_pages((unsigned long)__va(dma_handle), order);
}

static dma_addr_t pa11_dma_map_single(struct device *dev, void *addr, size_t size, enum dma_data_direction direction)
{
	if (direction == DMA_NONE) {
		printk(KERN_ERR "pa11_dma_map_single(PCI_DMA_NONE) called by %p\n", __builtin_return_address(0));
		BUG();
	}

	flush_kernel_dcache_range((unsigned long) addr, size);
	return virt_to_phys(addr);
}

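/*
** PA 1.1 caches are not DMA-coherent, so the streaming routines bracket
** device access with explicit dcache flushes.  A hedged sketch of the
** pattern these ops back (driver-side names are illustrative, not
** defined in this file):
**
**	dma_addr_t h = pa11_dma_map_single(dev, buf, len, DMA_TO_DEVICE);
**	... device reads from h ...
**	pa11_dma_unmap_single(dev, h, len, DMA_TO_DEVICE);
*/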
static void pa11_dma_unmap_single(struct device *dev, dma_addr_t dma_handle, size_t size, enum dma_data_direction direction)
{
	if (direction == DMA_NONE) {
		printk(KERN_ERR "pa11_dma_unmap_single(PCI_DMA_NONE) called by %p\n", __builtin_return_address(0));
		BUG();
	}

	if (direction == DMA_TO_DEVICE)
		return;

	/*
	 * For PCI_DMA_FROMDEVICE this flush is not necessary for the
	 * simple map/unmap case. However, it IS necessary if
	 * pci_dma_sync_single_* has been called and the buffer reused.
	 */

	flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle), size);
	return;
}

static int pa11_dma_map_sg(struct device *dev, struct scatterlist *sglist, int nents, enum dma_data_direction direction)
{
	int i;

	if (direction == DMA_NONE)
		BUG();

	for (i = 0; i < nents; i++, sglist++ ) {
		unsigned long vaddr = sg_virt_addr(sglist);
		sg_dma_address(sglist) = (dma_addr_t) virt_to_phys(vaddr);
		sg_dma_len(sglist) = sglist->length;
		flush_kernel_dcache_range(vaddr, sglist->length);
	}
	return nents;
}

static void pa11_dma_unmap_sg(struct device *dev, struct scatterlist *sglist, int nents, enum dma_data_direction direction)
{
	int i;

	if (direction == DMA_NONE)
		BUG();

	if (direction == DMA_TO_DEVICE)
		return;

	/* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */

	for (i = 0; i < nents; i++, sglist++ )
		flush_kernel_dcache_range(sg_virt_addr(sglist), sglist->length);
	return;
}

static void pa11_dma_sync_single_for_cpu(struct device *dev, dma_addr_t dma_handle, unsigned long offset, size_t size, enum dma_data_direction direction)
{
	if (direction == DMA_NONE)
		BUG();

	flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle) + offset, size);
}

static void pa11_dma_sync_single_for_device(struct device *dev, dma_addr_t dma_handle, unsigned long offset, size_t size, enum dma_data_direction direction)
{
	if (direction == DMA_NONE)
		BUG();

	flush_kernel_dcache_range((unsigned long) phys_to_virt(dma_handle) + offset, size);
}

static void pa11_dma_sync_sg_for_cpu(struct device *dev, struct scatterlist *sglist, int nents, enum dma_data_direction direction)
{
	int i;

	/* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */

	for (i = 0; i < nents; i++, sglist++ )
		flush_kernel_dcache_range(sg_virt_addr(sglist), sglist->length);
}

static void pa11_dma_sync_sg_for_device(struct device *dev, struct scatterlist *sglist, int nents, enum dma_data_direction direction)
{
	int i;

	/* once we do combining we'll need to use phys_to_virt(sg_dma_address(sglist)) */

	for (i = 0; i < nents; i++, sglist++ )
		flush_kernel_dcache_range(sg_virt_addr(sglist), sglist->length);
}

struct hppa_dma_ops pcxl_dma_ops = {
	.dma_supported =	pa11_dma_supported,
	.alloc_consistent =	pa11_dma_alloc_consistent,
	.alloc_noncoherent =	pa11_dma_alloc_consistent,
	.free_consistent =	pa11_dma_free_consistent,
	.map_single =		pa11_dma_map_single,
	.unmap_single =		pa11_dma_unmap_single,
	.map_sg =		pa11_dma_map_sg,
	.unmap_sg =		pa11_dma_unmap_sg,
	.dma_sync_single_for_cpu =	pa11_dma_sync_single_for_cpu,
	.dma_sync_single_for_device =	pa11_dma_sync_single_for_device,
	.dma_sync_sg_for_cpu =		pa11_dma_sync_sg_for_cpu,
	.dma_sync_sg_for_device =	pa11_dma_sync_sg_for_device,
};

static void *fail_alloc_consistent(struct device *dev, size_t size,
				   dma_addr_t *dma_handle, gfp_t flag)
{
	return NULL;
}

static void *pa11_dma_alloc_noncoherent(struct device *dev, size_t size,
					dma_addr_t *dma_handle, gfp_t flag)
{
	void *addr = NULL;

	/* rely on kmalloc to be cacheline aligned */
	addr = kmalloc(size, flag);
	if(addr)
		*dma_handle = (dma_addr_t)virt_to_phys(addr);

	return addr;
}

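/*
** PCX machines lack the uncached-mapping support used above, so their
** ops table (pcx_dma_ops, below) wires alloc_consistent to
** fail_alloc_consistent and offers only this kmalloc-backed noncoherent
** allocator; callers must then pair it with explicit syncs.  A hedged
** sketch ("dev", "len" and "h" are a caller's values):
**
**	void *buf = pa11_dma_alloc_noncoherent(dev, len, &h, GFP_KERNEL);
**	pa11_dma_sync_single_for_device(dev, h, 0, len, DMA_TO_DEVICE);
*/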
static void pa11_dma_free_noncoherent(struct device *dev, size_t size,
					void *vaddr, dma_addr_t iova)
{
	kfree(vaddr);
	return;
}

struct hppa_dma_ops pcx_dma_ops = {
	.dma_supported =	pa11_dma_supported,
	.alloc_consistent =	fail_alloc_consistent,
	.alloc_noncoherent =	pa11_dma_alloc_noncoherent,
	.free_consistent =	pa11_dma_free_noncoherent,
	.map_single =		pa11_dma_map_single,
	.unmap_single =		pa11_dma_unmap_single,
	.map_sg =		pa11_dma_map_sg,
	.unmap_sg =		pa11_dma_unmap_sg,
	.dma_sync_single_for_cpu =	pa11_dma_sync_single_for_cpu,
	.dma_sync_single_for_device =	pa11_dma_sync_single_for_device,
	.dma_sync_sg_for_cpu =		pa11_dma_sync_sg_for_cpu,
	.dma_sync_sg_for_device =	pa11_dma_sync_sg_for_device,
};
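/*
** Neither ops table is used directly by drivers.  Platform setup code
** (outside this file) is expected to select pcxl_dma_ops on
** PA7100LC/PA7300LC-class machines, which can create the uncached
** mappings above, and pcx_dma_ops otherwise; the generic DMA API then
** routes through the chosen hppa_dma_ops entry points.  This note is a
** summary of that arrangement, not code taken from this file.
*/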