alpha: use iommu_is_span_boundary helper function
[deliverable/linux.git] / arch / alpha / kernel / pci_iommu.c
1 /*
2 * linux/arch/alpha/kernel/pci_iommu.c
3 */
4
5 #include <linux/kernel.h>
6 #include <linux/mm.h>
7 #include <linux/pci.h>
8 #include <linux/slab.h>
9 #include <linux/bootmem.h>
10 #include <linux/scatterlist.h>
11 #include <linux/log2.h>
12 #include <linux/dma-mapping.h>
13 #include <linux/iommu-helper.h>
14
15 #include <asm/io.h>
16 #include <asm/hwrpb.h>
17
18 #include "proto.h"
19 #include "pci_impl.h"
20
21
22 #define DEBUG_ALLOC 0
23 #if DEBUG_ALLOC > 0
24 # define DBGA(args...) printk(KERN_DEBUG args)
25 #else
26 # define DBGA(args...)
27 #endif
28 #if DEBUG_ALLOC > 1
29 # define DBGA2(args...) printk(KERN_DEBUG args)
30 #else
31 # define DBGA2(args...)
32 #endif
33
34 #define DEBUG_NODIRECT 0
35
36 #define ISA_DMA_MASK 0x00ffffff
37
38 static inline unsigned long
39 mk_iommu_pte(unsigned long paddr)
40 {
41 return (paddr >> (PAGE_SHIFT-1)) | 1;
42 }
43
44 static inline long
45 calc_npages(long bytes)
46 {
47 return (bytes + PAGE_SIZE - 1) >> PAGE_SHIFT;
48 }
49 \f
50
51 /* Return the minimum of MAX or the first power of two larger
52 than main memory. */
53
54 unsigned long
55 size_for_memory(unsigned long max)
56 {
57 unsigned long mem = max_low_pfn << PAGE_SHIFT;
58 if (mem < max)
59 max = roundup_pow_of_two(mem);
60 return max;
61 }
62 \f
63 struct pci_iommu_arena * __init
64 iommu_arena_new_node(int nid, struct pci_controller *hose, dma_addr_t base,
65 unsigned long window_size, unsigned long align)
66 {
67 unsigned long mem_size;
68 struct pci_iommu_arena *arena;
69
70 mem_size = window_size / (PAGE_SIZE / sizeof(unsigned long));
71
72 /* Note that the TLB lookup logic uses bitwise concatenation,
73 not addition, so the required arena alignment is based on
74 the size of the window. Retain the align parameter so that
75 particular systems can over-align the arena. */
76 if (align < mem_size)
77 align = mem_size;
78
79
80 #ifdef CONFIG_DISCONTIGMEM
81
82 if (!NODE_DATA(nid) ||
83 (NULL == (arena = alloc_bootmem_node(NODE_DATA(nid),
84 sizeof(*arena))))) {
85 printk("%s: couldn't allocate arena from node %d\n"
86 " falling back to system-wide allocation\n",
87 __FUNCTION__, nid);
88 arena = alloc_bootmem(sizeof(*arena));
89 }
90
91 if (!NODE_DATA(nid) ||
92 (NULL == (arena->ptes = __alloc_bootmem_node(NODE_DATA(nid),
93 mem_size,
94 align,
95 0)))) {
96 printk("%s: couldn't allocate arena ptes from node %d\n"
97 " falling back to system-wide allocation\n",
98 __FUNCTION__, nid);
99 arena->ptes = __alloc_bootmem(mem_size, align, 0);
100 }
101
102 #else /* CONFIG_DISCONTIGMEM */
103
104 arena = alloc_bootmem(sizeof(*arena));
105 arena->ptes = __alloc_bootmem(mem_size, align, 0);
106
107 #endif /* CONFIG_DISCONTIGMEM */
108
109 spin_lock_init(&arena->lock);
110 arena->hose = hose;
111 arena->dma_base = base;
112 arena->size = window_size;
113 arena->next_entry = 0;
114
115 /* Align allocations to a multiple of a page size. Not needed
116 unless there are chip bugs. */
117 arena->align_entry = 1;
118
119 return arena;
120 }
121
122 struct pci_iommu_arena * __init
123 iommu_arena_new(struct pci_controller *hose, dma_addr_t base,
124 unsigned long window_size, unsigned long align)
125 {
126 return iommu_arena_new_node(0, hose, base, window_size, align);
127 }
128
129 /* Must be called with the arena lock held */
130 static long
131 iommu_arena_find_pages(struct device *dev, struct pci_iommu_arena *arena,
132 long n, long mask)
133 {
134 unsigned long *ptes;
135 long i, p, nent;
136 int pass = 0;
137 unsigned long base;
138 unsigned long boundary_size;
139
140 base = arena->dma_base >> PAGE_SHIFT;
141 if (dev) {
142 boundary_size = dma_get_seg_boundary(dev) + 1;
143 boundary_size >>= PAGE_SHIFT;
144 } else {
145 boundary_size = 1UL << (32 - PAGE_SHIFT);
146 }
147
148 /* Search forward for the first mask-aligned sequence of N free ptes */
149 ptes = arena->ptes;
150 nent = arena->size >> PAGE_SHIFT;
151 p = ALIGN(arena->next_entry, mask + 1);
152 i = 0;
153
154 again:
155 while (i < n && p+i < nent) {
156 if (!i && iommu_is_span_boundary(p, n, base, boundary_size)) {
157 p = ALIGN(p + 1, mask + 1);
158 goto again;
159 }
160
161 if (ptes[p+i])
162 p = ALIGN(p + i + 1, mask + 1), i = 0;
163 else
164 i = i + 1;
165 }
166
167 if (i < n) {
168 if (pass < 1) {
169 /*
170 * Reached the end. Flush the TLB and restart
171 * the search from the beginning.
172 */
173 alpha_mv.mv_pci_tbi(arena->hose, 0, -1);
174
175 pass++;
176 p = 0;
177 i = 0;
178 goto again;
179 } else
180 return -1;
181 }
182
183 /* Success. It's the responsibility of the caller to mark them
184 in use before releasing the lock */
185 return p;
186 }
187
188 static long
189 iommu_arena_alloc(struct device *dev, struct pci_iommu_arena *arena, long n,
190 unsigned int align)
191 {
192 unsigned long flags;
193 unsigned long *ptes;
194 long i, p, mask;
195
196 spin_lock_irqsave(&arena->lock, flags);
197
198 /* Search for N empty ptes */
199 ptes = arena->ptes;
200 mask = max(align, arena->align_entry) - 1;
201 p = iommu_arena_find_pages(dev, arena, n, mask);
202 if (p < 0) {
203 spin_unlock_irqrestore(&arena->lock, flags);
204 return -1;
205 }
206
207 /* Success. Mark them all in use, ie not zero and invalid
208 for the iommu tlb that could load them from under us.
209 The chip specific bits will fill this in with something
210 kosher when we return. */
211 for (i = 0; i < n; ++i)
212 ptes[p+i] = IOMMU_INVALID_PTE;
213
214 arena->next_entry = p + n;
215 spin_unlock_irqrestore(&arena->lock, flags);
216
217 return p;
218 }
219
220 static void
221 iommu_arena_free(struct pci_iommu_arena *arena, long ofs, long n)
222 {
223 unsigned long *p;
224 long i;
225
226 p = arena->ptes + ofs;
227 for (i = 0; i < n; ++i)
228 p[i] = 0;
229 }
230 \f
231 /* True if the machine supports DAC addressing, and DEV can
232 make use of it given MASK. */
233 static int pci_dac_dma_supported(struct pci_dev *hwdev, u64 mask);
234
235 /* Map a single buffer of the indicated size for PCI DMA in streaming
236 mode. The 32-bit PCI bus mastering address to use is returned.
237 Once the device is given the dma address, the device owns this memory
238 until either pci_unmap_single or pci_dma_sync_single is performed. */
239
240 static dma_addr_t
241 pci_map_single_1(struct pci_dev *pdev, void *cpu_addr, size_t size,
242 int dac_allowed)
243 {
244 struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose;
245 dma_addr_t max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
246 struct pci_iommu_arena *arena;
247 long npages, dma_ofs, i;
248 unsigned long paddr;
249 dma_addr_t ret;
250 unsigned int align = 0;
251 struct device *dev = pdev ? &pdev->dev : NULL;
252
253 paddr = __pa(cpu_addr);
254
255 #if !DEBUG_NODIRECT
256 /* First check to see if we can use the direct map window. */
257 if (paddr + size + __direct_map_base - 1 <= max_dma
258 && paddr + size <= __direct_map_size) {
259 ret = paddr + __direct_map_base;
260
261 DBGA2("pci_map_single: [%p,%lx] -> direct %lx from %p\n",
262 cpu_addr, size, ret, __builtin_return_address(0));
263
264 return ret;
265 }
266 #endif
267
268 /* Next, use DAC if selected earlier. */
269 if (dac_allowed) {
270 ret = paddr + alpha_mv.pci_dac_offset;
271
272 DBGA2("pci_map_single: [%p,%lx] -> DAC %lx from %p\n",
273 cpu_addr, size, ret, __builtin_return_address(0));
274
275 return ret;
276 }
277
278 /* If the machine doesn't define a pci_tbi routine, we have to
279 assume it doesn't support sg mapping, and, since we tried to
280 use direct_map above, it now must be considered an error. */
281 if (! alpha_mv.mv_pci_tbi) {
282 static int been_here = 0; /* Only print the message once. */
283 if (!been_here) {
284 printk(KERN_WARNING "pci_map_single: no HW sg\n");
285 been_here = 1;
286 }
287 return 0;
288 }
289
290 arena = hose->sg_pci;
291 if (!arena || arena->dma_base + arena->size - 1 > max_dma)
292 arena = hose->sg_isa;
293
294 npages = calc_npages((paddr & ~PAGE_MASK) + size);
295
296 /* Force allocation to 64KB boundary for ISA bridges. */
297 if (pdev && pdev == isa_bridge)
298 align = 8;
299 dma_ofs = iommu_arena_alloc(dev, arena, npages, align);
300 if (dma_ofs < 0) {
301 printk(KERN_WARNING "pci_map_single failed: "
302 "could not allocate dma page tables\n");
303 return 0;
304 }
305
306 paddr &= PAGE_MASK;
307 for (i = 0; i < npages; ++i, paddr += PAGE_SIZE)
308 arena->ptes[i + dma_ofs] = mk_iommu_pte(paddr);
309
310 ret = arena->dma_base + dma_ofs * PAGE_SIZE;
311 ret += (unsigned long)cpu_addr & ~PAGE_MASK;
312
313 DBGA2("pci_map_single: [%p,%lx] np %ld -> sg %lx from %p\n",
314 cpu_addr, size, npages, ret, __builtin_return_address(0));
315
316 return ret;
317 }
318
319 dma_addr_t
320 pci_map_single(struct pci_dev *pdev, void *cpu_addr, size_t size, int dir)
321 {
322 int dac_allowed;
323
324 if (dir == PCI_DMA_NONE)
325 BUG();
326
327 dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;
328 return pci_map_single_1(pdev, cpu_addr, size, dac_allowed);
329 }
330 EXPORT_SYMBOL(pci_map_single);
331
332 dma_addr_t
333 pci_map_page(struct pci_dev *pdev, struct page *page, unsigned long offset,
334 size_t size, int dir)
335 {
336 int dac_allowed;
337
338 if (dir == PCI_DMA_NONE)
339 BUG();
340
341 dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;
342 return pci_map_single_1(pdev, (char *)page_address(page) + offset,
343 size, dac_allowed);
344 }
345 EXPORT_SYMBOL(pci_map_page);
346
347 /* Unmap a single streaming mode DMA translation. The DMA_ADDR and
348 SIZE must match what was provided for in a previous pci_map_single
349 call. All other usages are undefined. After this call, reads by
350 the cpu to the buffer are guaranteed to see whatever the device
351 wrote there. */
352
353 void
354 pci_unmap_single(struct pci_dev *pdev, dma_addr_t dma_addr, size_t size,
355 int direction)
356 {
357 unsigned long flags;
358 struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose;
359 struct pci_iommu_arena *arena;
360 long dma_ofs, npages;
361
362 if (direction == PCI_DMA_NONE)
363 BUG();
364
365 if (dma_addr >= __direct_map_base
366 && dma_addr < __direct_map_base + __direct_map_size) {
367 /* Nothing to do. */
368
369 DBGA2("pci_unmap_single: direct [%lx,%lx] from %p\n",
370 dma_addr, size, __builtin_return_address(0));
371
372 return;
373 }
374
375 if (dma_addr > 0xffffffff) {
376 DBGA2("pci64_unmap_single: DAC [%lx,%lx] from %p\n",
377 dma_addr, size, __builtin_return_address(0));
378 return;
379 }
380
381 arena = hose->sg_pci;
382 if (!arena || dma_addr < arena->dma_base)
383 arena = hose->sg_isa;
384
385 dma_ofs = (dma_addr - arena->dma_base) >> PAGE_SHIFT;
386 if (dma_ofs * PAGE_SIZE >= arena->size) {
387 printk(KERN_ERR "Bogus pci_unmap_single: dma_addr %lx "
388 " base %lx size %x\n", dma_addr, arena->dma_base,
389 arena->size);
390 return;
391 BUG();
392 }
393
394 npages = calc_npages((dma_addr & ~PAGE_MASK) + size);
395
396 spin_lock_irqsave(&arena->lock, flags);
397
398 iommu_arena_free(arena, dma_ofs, npages);
399
400 /* If we're freeing ptes above the `next_entry' pointer (they
401 may have snuck back into the TLB since the last wrap flush),
402 we need to flush the TLB before reallocating the latter. */
403 if (dma_ofs >= arena->next_entry)
404 alpha_mv.mv_pci_tbi(hose, dma_addr, dma_addr + size - 1);
405
406 spin_unlock_irqrestore(&arena->lock, flags);
407
408 DBGA2("pci_unmap_single: sg [%lx,%lx] np %ld from %p\n",
409 dma_addr, size, npages, __builtin_return_address(0));
410 }
411 EXPORT_SYMBOL(pci_unmap_single);
412
413 void
414 pci_unmap_page(struct pci_dev *pdev, dma_addr_t dma_addr,
415 size_t size, int direction)
416 {
417 pci_unmap_single(pdev, dma_addr, size, direction);
418 }
419 EXPORT_SYMBOL(pci_unmap_page);
420
421 /* Allocate and map kernel buffer using consistent mode DMA for PCI
422 device. Returns non-NULL cpu-view pointer to the buffer if
423 successful and sets *DMA_ADDRP to the pci side dma address as well,
424 else DMA_ADDRP is undefined. */
425
426 void *
427 pci_alloc_consistent(struct pci_dev *pdev, size_t size, dma_addr_t *dma_addrp)
428 {
429 void *cpu_addr;
430 long order = get_order(size);
431 gfp_t gfp = GFP_ATOMIC;
432
433 try_again:
434 cpu_addr = (void *)__get_free_pages(gfp, order);
435 if (! cpu_addr) {
436 printk(KERN_INFO "pci_alloc_consistent: "
437 "get_free_pages failed from %p\n",
438 __builtin_return_address(0));
439 /* ??? Really atomic allocation? Otherwise we could play
440 with vmalloc and sg if we can't find contiguous memory. */
441 return NULL;
442 }
443 memset(cpu_addr, 0, size);
444
445 *dma_addrp = pci_map_single_1(pdev, cpu_addr, size, 0);
446 if (*dma_addrp == 0) {
447 free_pages((unsigned long)cpu_addr, order);
448 if (alpha_mv.mv_pci_tbi || (gfp & GFP_DMA))
449 return NULL;
450 /* The address doesn't fit required mask and we
451 do not have iommu. Try again with GFP_DMA. */
452 gfp |= GFP_DMA;
453 goto try_again;
454 }
455
456 DBGA2("pci_alloc_consistent: %lx -> [%p,%x] from %p\n",
457 size, cpu_addr, *dma_addrp, __builtin_return_address(0));
458
459 return cpu_addr;
460 }
461 EXPORT_SYMBOL(pci_alloc_consistent);
462
463 /* Free and unmap a consistent DMA buffer. CPU_ADDR and DMA_ADDR must
464 be values that were returned from pci_alloc_consistent. SIZE must
465 be the same as what as passed into pci_alloc_consistent.
466 References to the memory and mappings associated with CPU_ADDR or
467 DMA_ADDR past this call are illegal. */
468
469 void
470 pci_free_consistent(struct pci_dev *pdev, size_t size, void *cpu_addr,
471 dma_addr_t dma_addr)
472 {
473 pci_unmap_single(pdev, dma_addr, size, PCI_DMA_BIDIRECTIONAL);
474 free_pages((unsigned long)cpu_addr, get_order(size));
475
476 DBGA2("pci_free_consistent: [%x,%lx] from %p\n",
477 dma_addr, size, __builtin_return_address(0));
478 }
479 EXPORT_SYMBOL(pci_free_consistent);
480
481 /* Classify the elements of the scatterlist. Write dma_address
482 of each element with:
483 0 : Followers all physically adjacent.
484 1 : Followers all virtually adjacent.
485 -1 : Not leader, physically adjacent to previous.
486 -2 : Not leader, virtually adjacent to previous.
487 Write dma_length of each leader with the combined lengths of
488 the mergable followers. */
489
490 #define SG_ENT_VIRT_ADDRESS(SG) (sg_virt((SG)))
491 #define SG_ENT_PHYS_ADDRESS(SG) __pa(SG_ENT_VIRT_ADDRESS(SG))
492
493 static void
494 sg_classify(struct device *dev, struct scatterlist *sg, struct scatterlist *end,
495 int virt_ok)
496 {
497 unsigned long next_paddr;
498 struct scatterlist *leader;
499 long leader_flag, leader_length;
500 unsigned int max_seg_size;
501
502 leader = sg;
503 leader_flag = 0;
504 leader_length = leader->length;
505 next_paddr = SG_ENT_PHYS_ADDRESS(leader) + leader_length;
506
507 /* we will not marge sg without device. */
508 max_seg_size = dev ? dma_get_max_seg_size(dev) : 0;
509 for (++sg; sg < end; ++sg) {
510 unsigned long addr, len;
511 addr = SG_ENT_PHYS_ADDRESS(sg);
512 len = sg->length;
513
514 if (leader_length + len > max_seg_size)
515 goto new_segment;
516
517 if (next_paddr == addr) {
518 sg->dma_address = -1;
519 leader_length += len;
520 } else if (((next_paddr | addr) & ~PAGE_MASK) == 0 && virt_ok) {
521 sg->dma_address = -2;
522 leader_flag = 1;
523 leader_length += len;
524 } else {
525 new_segment:
526 leader->dma_address = leader_flag;
527 leader->dma_length = leader_length;
528 leader = sg;
529 leader_flag = 0;
530 leader_length = len;
531 }
532
533 next_paddr = addr + len;
534 }
535
536 leader->dma_address = leader_flag;
537 leader->dma_length = leader_length;
538 }
539
540 /* Given a scatterlist leader, choose an allocation method and fill
541 in the blanks. */
542
543 static int
544 sg_fill(struct device *dev, struct scatterlist *leader, struct scatterlist *end,
545 struct scatterlist *out, struct pci_iommu_arena *arena,
546 dma_addr_t max_dma, int dac_allowed)
547 {
548 unsigned long paddr = SG_ENT_PHYS_ADDRESS(leader);
549 long size = leader->dma_length;
550 struct scatterlist *sg;
551 unsigned long *ptes;
552 long npages, dma_ofs, i;
553
554 #if !DEBUG_NODIRECT
555 /* If everything is physically contiguous, and the addresses
556 fall into the direct-map window, use it. */
557 if (leader->dma_address == 0
558 && paddr + size + __direct_map_base - 1 <= max_dma
559 && paddr + size <= __direct_map_size) {
560 out->dma_address = paddr + __direct_map_base;
561 out->dma_length = size;
562
563 DBGA(" sg_fill: [%p,%lx] -> direct %lx\n",
564 __va(paddr), size, out->dma_address);
565
566 return 0;
567 }
568 #endif
569
570 /* If physically contiguous and DAC is available, use it. */
571 if (leader->dma_address == 0 && dac_allowed) {
572 out->dma_address = paddr + alpha_mv.pci_dac_offset;
573 out->dma_length = size;
574
575 DBGA(" sg_fill: [%p,%lx] -> DAC %lx\n",
576 __va(paddr), size, out->dma_address);
577
578 return 0;
579 }
580
581 /* Otherwise, we'll use the iommu to make the pages virtually
582 contiguous. */
583
584 paddr &= ~PAGE_MASK;
585 npages = calc_npages(paddr + size);
586 dma_ofs = iommu_arena_alloc(dev, arena, npages, 0);
587 if (dma_ofs < 0) {
588 /* If we attempted a direct map above but failed, die. */
589 if (leader->dma_address == 0)
590 return -1;
591
592 /* Otherwise, break up the remaining virtually contiguous
593 hunks into individual direct maps and retry. */
594 sg_classify(dev, leader, end, 0);
595 return sg_fill(dev, leader, end, out, arena, max_dma, dac_allowed);
596 }
597
598 out->dma_address = arena->dma_base + dma_ofs*PAGE_SIZE + paddr;
599 out->dma_length = size;
600
601 DBGA(" sg_fill: [%p,%lx] -> sg %lx np %ld\n",
602 __va(paddr), size, out->dma_address, npages);
603
604 /* All virtually contiguous. We need to find the length of each
605 physically contiguous subsegment to fill in the ptes. */
606 ptes = &arena->ptes[dma_ofs];
607 sg = leader;
608 do {
609 #if DEBUG_ALLOC > 0
610 struct scatterlist *last_sg = sg;
611 #endif
612
613 size = sg->length;
614 paddr = SG_ENT_PHYS_ADDRESS(sg);
615
616 while (sg+1 < end && (int) sg[1].dma_address == -1) {
617 size += sg[1].length;
618 sg++;
619 }
620
621 npages = calc_npages((paddr & ~PAGE_MASK) + size);
622
623 paddr &= PAGE_MASK;
624 for (i = 0; i < npages; ++i, paddr += PAGE_SIZE)
625 *ptes++ = mk_iommu_pte(paddr);
626
627 #if DEBUG_ALLOC > 0
628 DBGA(" (%ld) [%p,%x] np %ld\n",
629 last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg),
630 last_sg->length, npages);
631 while (++last_sg <= sg) {
632 DBGA(" (%ld) [%p,%x] cont\n",
633 last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg),
634 last_sg->length);
635 }
636 #endif
637 } while (++sg < end && (int) sg->dma_address < 0);
638
639 return 1;
640 }
641
642 int
643 pci_map_sg(struct pci_dev *pdev, struct scatterlist *sg, int nents,
644 int direction)
645 {
646 struct scatterlist *start, *end, *out;
647 struct pci_controller *hose;
648 struct pci_iommu_arena *arena;
649 dma_addr_t max_dma;
650 int dac_allowed;
651 struct device *dev;
652
653 if (direction == PCI_DMA_NONE)
654 BUG();
655
656 dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;
657
658 dev = pdev ? &pdev->dev : NULL;
659
660 /* Fast path single entry scatterlists. */
661 if (nents == 1) {
662 sg->dma_length = sg->length;
663 sg->dma_address
664 = pci_map_single_1(pdev, SG_ENT_VIRT_ADDRESS(sg),
665 sg->length, dac_allowed);
666 return sg->dma_address != 0;
667 }
668
669 start = sg;
670 end = sg + nents;
671
672 /* First, prepare information about the entries. */
673 sg_classify(dev, sg, end, alpha_mv.mv_pci_tbi != 0);
674
675 /* Second, figure out where we're going to map things. */
676 if (alpha_mv.mv_pci_tbi) {
677 hose = pdev ? pdev->sysdata : pci_isa_hose;
678 max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
679 arena = hose->sg_pci;
680 if (!arena || arena->dma_base + arena->size - 1 > max_dma)
681 arena = hose->sg_isa;
682 } else {
683 max_dma = -1;
684 arena = NULL;
685 hose = NULL;
686 }
687
688 /* Third, iterate over the scatterlist leaders and allocate
689 dma space as needed. */
690 for (out = sg; sg < end; ++sg) {
691 if ((int) sg->dma_address < 0)
692 continue;
693 if (sg_fill(dev, sg, end, out, arena, max_dma, dac_allowed) < 0)
694 goto error;
695 out++;
696 }
697
698 /* Mark the end of the list for pci_unmap_sg. */
699 if (out < end)
700 out->dma_length = 0;
701
702 if (out - start == 0)
703 printk(KERN_WARNING "pci_map_sg failed: no entries?\n");
704 DBGA("pci_map_sg: %ld entries\n", out - start);
705
706 return out - start;
707
708 error:
709 printk(KERN_WARNING "pci_map_sg failed: "
710 "could not allocate dma page tables\n");
711
712 /* Some allocation failed while mapping the scatterlist
713 entries. Unmap them now. */
714 if (out > start)
715 pci_unmap_sg(pdev, start, out - start, direction);
716 return 0;
717 }
718 EXPORT_SYMBOL(pci_map_sg);
719
720 /* Unmap a set of streaming mode DMA translations. Again, cpu read
721 rules concerning calls here are the same as for pci_unmap_single()
722 above. */
723
724 void
725 pci_unmap_sg(struct pci_dev *pdev, struct scatterlist *sg, int nents,
726 int direction)
727 {
728 unsigned long flags;
729 struct pci_controller *hose;
730 struct pci_iommu_arena *arena;
731 struct scatterlist *end;
732 dma_addr_t max_dma;
733 dma_addr_t fbeg, fend;
734
735 if (direction == PCI_DMA_NONE)
736 BUG();
737
738 if (! alpha_mv.mv_pci_tbi)
739 return;
740
741 hose = pdev ? pdev->sysdata : pci_isa_hose;
742 max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
743 arena = hose->sg_pci;
744 if (!arena || arena->dma_base + arena->size - 1 > max_dma)
745 arena = hose->sg_isa;
746
747 fbeg = -1, fend = 0;
748
749 spin_lock_irqsave(&arena->lock, flags);
750
751 for (end = sg + nents; sg < end; ++sg) {
752 dma64_addr_t addr;
753 size_t size;
754 long npages, ofs;
755 dma_addr_t tend;
756
757 addr = sg->dma_address;
758 size = sg->dma_length;
759 if (!size)
760 break;
761
762 if (addr > 0xffffffff) {
763 /* It's a DAC address -- nothing to do. */
764 DBGA(" (%ld) DAC [%lx,%lx]\n",
765 sg - end + nents, addr, size);
766 continue;
767 }
768
769 if (addr >= __direct_map_base
770 && addr < __direct_map_base + __direct_map_size) {
771 /* Nothing to do. */
772 DBGA(" (%ld) direct [%lx,%lx]\n",
773 sg - end + nents, addr, size);
774 continue;
775 }
776
777 DBGA(" (%ld) sg [%lx,%lx]\n",
778 sg - end + nents, addr, size);
779
780 npages = calc_npages((addr & ~PAGE_MASK) + size);
781 ofs = (addr - arena->dma_base) >> PAGE_SHIFT;
782 iommu_arena_free(arena, ofs, npages);
783
784 tend = addr + size - 1;
785 if (fbeg > addr) fbeg = addr;
786 if (fend < tend) fend = tend;
787 }
788
789 /* If we're freeing ptes above the `next_entry' pointer (they
790 may have snuck back into the TLB since the last wrap flush),
791 we need to flush the TLB before reallocating the latter. */
792 if ((fend - arena->dma_base) >> PAGE_SHIFT >= arena->next_entry)
793 alpha_mv.mv_pci_tbi(hose, fbeg, fend);
794
795 spin_unlock_irqrestore(&arena->lock, flags);
796
797 DBGA("pci_unmap_sg: %ld entries\n", nents - (end - sg));
798 }
799 EXPORT_SYMBOL(pci_unmap_sg);
800
801
802 /* Return whether the given PCI device DMA address mask can be
803 supported properly. */
804
805 int
806 pci_dma_supported(struct pci_dev *pdev, u64 mask)
807 {
808 struct pci_controller *hose;
809 struct pci_iommu_arena *arena;
810
811 /* If there exists a direct map, and the mask fits either
812 the entire direct mapped space or the total system memory as
813 shifted by the map base */
814 if (__direct_map_size != 0
815 && (__direct_map_base + __direct_map_size - 1 <= mask ||
816 __direct_map_base + (max_low_pfn << PAGE_SHIFT) - 1 <= mask))
817 return 1;
818
819 /* Check that we have a scatter-gather arena that fits. */
820 hose = pdev ? pdev->sysdata : pci_isa_hose;
821 arena = hose->sg_isa;
822 if (arena && arena->dma_base + arena->size - 1 <= mask)
823 return 1;
824 arena = hose->sg_pci;
825 if (arena && arena->dma_base + arena->size - 1 <= mask)
826 return 1;
827
828 /* As last resort try ZONE_DMA. */
829 if (!__direct_map_base && MAX_DMA_ADDRESS - IDENT_ADDR - 1 <= mask)
830 return 1;
831
832 return 0;
833 }
834 EXPORT_SYMBOL(pci_dma_supported);
835
836 \f
837 /*
838 * AGP GART extensions to the IOMMU
839 */
840 int
841 iommu_reserve(struct pci_iommu_arena *arena, long pg_count, long align_mask)
842 {
843 unsigned long flags;
844 unsigned long *ptes;
845 long i, p;
846
847 if (!arena) return -EINVAL;
848
849 spin_lock_irqsave(&arena->lock, flags);
850
851 /* Search for N empty ptes. */
852 ptes = arena->ptes;
853 p = iommu_arena_find_pages(NULL, arena, pg_count, align_mask);
854 if (p < 0) {
855 spin_unlock_irqrestore(&arena->lock, flags);
856 return -1;
857 }
858
859 /* Success. Mark them all reserved (ie not zero and invalid)
860 for the iommu tlb that could load them from under us.
861 They will be filled in with valid bits by _bind() */
862 for (i = 0; i < pg_count; ++i)
863 ptes[p+i] = IOMMU_RESERVED_PTE;
864
865 arena->next_entry = p + pg_count;
866 spin_unlock_irqrestore(&arena->lock, flags);
867
868 return p;
869 }
870
871 int
872 iommu_release(struct pci_iommu_arena *arena, long pg_start, long pg_count)
873 {
874 unsigned long *ptes;
875 long i;
876
877 if (!arena) return -EINVAL;
878
879 ptes = arena->ptes;
880
881 /* Make sure they're all reserved first... */
882 for(i = pg_start; i < pg_start + pg_count; i++)
883 if (ptes[i] != IOMMU_RESERVED_PTE)
884 return -EBUSY;
885
886 iommu_arena_free(arena, pg_start, pg_count);
887 return 0;
888 }
889
890 int
891 iommu_bind(struct pci_iommu_arena *arena, long pg_start, long pg_count,
892 unsigned long *physaddrs)
893 {
894 unsigned long flags;
895 unsigned long *ptes;
896 long i, j;
897
898 if (!arena) return -EINVAL;
899
900 spin_lock_irqsave(&arena->lock, flags);
901
902 ptes = arena->ptes;
903
904 for(j = pg_start; j < pg_start + pg_count; j++) {
905 if (ptes[j] != IOMMU_RESERVED_PTE) {
906 spin_unlock_irqrestore(&arena->lock, flags);
907 return -EBUSY;
908 }
909 }
910
911 for(i = 0, j = pg_start; i < pg_count; i++, j++)
912 ptes[j] = mk_iommu_pte(physaddrs[i]);
913
914 spin_unlock_irqrestore(&arena->lock, flags);
915
916 return 0;
917 }
918
919 int
920 iommu_unbind(struct pci_iommu_arena *arena, long pg_start, long pg_count)
921 {
922 unsigned long *p;
923 long i;
924
925 if (!arena) return -EINVAL;
926
927 p = arena->ptes + pg_start;
928 for(i = 0; i < pg_count; i++)
929 p[i] = IOMMU_RESERVED_PTE;
930
931 return 0;
932 }
933
934 /* True if the machine supports DAC addressing, and DEV can
935 make use of it given MASK. */
936
937 static int
938 pci_dac_dma_supported(struct pci_dev *dev, u64 mask)
939 {
940 dma64_addr_t dac_offset = alpha_mv.pci_dac_offset;
941 int ok = 1;
942
943 /* If this is not set, the machine doesn't support DAC at all. */
944 if (dac_offset == 0)
945 ok = 0;
946
947 /* The device has to be able to address our DAC bit. */
948 if ((dac_offset & dev->dma_mask) != dac_offset)
949 ok = 0;
950
951 /* If both conditions above are met, we are fine. */
952 DBGA("pci_dac_dma_supported %s from %p\n",
953 ok ? "yes" : "no", __builtin_return_address(0));
954
955 return ok;
956 }
957
958 /* Helper for generic DMA-mapping functions. */
959
960 struct pci_dev *
961 alpha_gendev_to_pci(struct device *dev)
962 {
963 if (dev && dev->bus == &pci_bus_type)
964 return to_pci_dev(dev);
965
966 /* Assume that non-PCI devices asking for DMA are either ISA or EISA,
967 BUG() otherwise. */
968 BUG_ON(!isa_bridge);
969
970 /* Assume non-busmaster ISA DMA when dma_mask is not set (the ISA
971 bridge is bus master then). */
972 if (!dev || !dev->dma_mask || !*dev->dma_mask)
973 return isa_bridge;
974
975 /* For EISA bus masters, return isa_bridge (it might have smaller
976 dma_mask due to wiring limitations). */
977 if (*dev->dma_mask >= isa_bridge->dma_mask)
978 return isa_bridge;
979
980 /* This assumes ISA bus master with dma_mask 0xffffff. */
981 return NULL;
982 }
983 EXPORT_SYMBOL(alpha_gendev_to_pci);
984
985 int
986 dma_set_mask(struct device *dev, u64 mask)
987 {
988 if (!dev->dma_mask ||
989 !pci_dma_supported(alpha_gendev_to_pci(dev), mask))
990 return -EIO;
991
992 *dev->dma_mask = mask;
993
994 return 0;
995 }
996 EXPORT_SYMBOL(dma_set_mask);
This page took 0.122256 seconds and 5 git commands to generate.