x86: dma-ops on highmem fix
[deliverable/linux.git] / arch / x86 / kernel / pci-dma_64.c
1 /*
2 * Dynamic DMA mapping support.
3 */
4
5 #include <linux/types.h>
6 #include <linux/mm.h>
7 #include <linux/string.h>
8 #include <linux/pci.h>
9 #include <linux/module.h>
10 #include <linux/dmar.h>
11 #include <linux/bootmem.h>
12 #include <asm/proto.h>
13 #include <asm/io.h>
14 #include <asm/gart.h>
15 #include <asm/calgary.h>
16
17 int iommu_merge __read_mostly = 0;
18
19 dma_addr_t bad_dma_address __read_mostly;
20 EXPORT_SYMBOL(bad_dma_address);
21
22 /* This tells the BIO block layer to assume merging. Default to off
23 because we cannot guarantee merging later. */
24 int iommu_bio_merge __read_mostly = 0;
25 EXPORT_SYMBOL(iommu_bio_merge);
26
27 static int iommu_sac_force __read_mostly = 0;
28
29 int no_iommu __read_mostly;
30 #ifdef CONFIG_IOMMU_DEBUG
31 int panic_on_overflow __read_mostly = 1;
32 int force_iommu __read_mostly = 1;
33 #else
34 int panic_on_overflow __read_mostly = 0;
35 int force_iommu __read_mostly= 0;
36 #endif
37
38 /* Set this to 1 if there is a HW IOMMU in the system */
39 int iommu_detected __read_mostly = 0;
40
41 /* Dummy device used for NULL arguments (normally ISA). Better would
42 be probably a smaller DMA mask, but this is bug-to-bug compatible
43 to i386. */
44 struct device fallback_dev = {
45 .bus_id = "fallback device",
46 .coherent_dma_mask = DMA_32BIT_MASK,
47 .dma_mask = &fallback_dev.coherent_dma_mask,
48 };
49
50 /* Allocate DMA memory on node near device */
51 noinline static void *
52 dma_alloc_pages(struct device *dev, gfp_t gfp, unsigned order)
53 {
54 struct page *page;
55 int node;
56
57 node = dev_to_node(dev);
58
59 page = alloc_pages_node(node, gfp, order);
60 return page ? page_address(page) : NULL;
61 }
62
63 /*
64 * Allocate memory for a coherent mapping.
65 */
66 void *
67 dma_alloc_coherent(struct device *dev, size_t size, dma_addr_t *dma_handle,
68 gfp_t gfp)
69 {
70 void *memory;
71 unsigned long dma_mask = 0;
72 u64 bus;
73
74 if (!dev)
75 dev = &fallback_dev;
76 dma_mask = dev->coherent_dma_mask;
77 if (dma_mask == 0)
78 dma_mask = DMA_32BIT_MASK;
79
80 /* Device not DMA able */
81 if (dev->dma_mask == NULL)
82 return NULL;
83
84 /* Don't invoke OOM killer */
85 gfp |= __GFP_NORETRY;
86
87 /* Kludge to make it bug-to-bug compatible with i386. i386
88 uses the normal dma_mask for alloc_coherent. */
89 dma_mask &= *dev->dma_mask;
90
91 /* Why <=? Even when the mask is smaller than 4GB it is often
92 larger than 16MB and in this case we have a chance of
93 finding fitting memory in the next higher zone first. If
94 not retry with true GFP_DMA. -AK */
95 if (dma_mask <= DMA_32BIT_MASK)
96 gfp |= GFP_DMA32;
97
98 again:
99 memory = dma_alloc_pages(dev, gfp, get_order(size));
100 if (memory == NULL)
101 return NULL;
102
103 {
104 int high, mmu;
105 bus = virt_to_bus(memory);
106 high = (bus + size) >= dma_mask;
107 mmu = high;
108 if (force_iommu && !(gfp & GFP_DMA))
109 mmu = 1;
110 else if (high) {
111 free_pages((unsigned long)memory,
112 get_order(size));
113
114 /* Don't use the 16MB ZONE_DMA unless absolutely
115 needed. It's better to use remapping first. */
116 if (dma_mask < DMA_32BIT_MASK && !(gfp & GFP_DMA)) {
117 gfp = (gfp & ~GFP_DMA32) | GFP_DMA;
118 goto again;
119 }
120
121 /* Let low level make its own zone decisions */
122 gfp &= ~(GFP_DMA32|GFP_DMA);
123
124 if (dma_ops->alloc_coherent)
125 return dma_ops->alloc_coherent(dev, size,
126 dma_handle, gfp);
127 return NULL;
128 }
129
130 memset(memory, 0, size);
131 if (!mmu) {
132 *dma_handle = virt_to_bus(memory);
133 return memory;
134 }
135 }
136
137 if (dma_ops->alloc_coherent) {
138 free_pages((unsigned long)memory, get_order(size));
139 gfp &= ~(GFP_DMA|GFP_DMA32);
140 return dma_ops->alloc_coherent(dev, size, dma_handle, gfp);
141 }
142
143 if (dma_ops->map_simple) {
144 *dma_handle = dma_ops->map_simple(dev, virt_to_phys(memory),
145 size,
146 PCI_DMA_BIDIRECTIONAL);
147 if (*dma_handle != bad_dma_address)
148 return memory;
149 }
150
151 if (panic_on_overflow)
152 panic("dma_alloc_coherent: IOMMU overflow by %lu bytes\n",size);
153 free_pages((unsigned long)memory, get_order(size));
154 return NULL;
155 }
156 EXPORT_SYMBOL(dma_alloc_coherent);
157
158 /*
159 * Unmap coherent memory.
160 * The caller must ensure that the device has finished accessing the mapping.
161 */
162 void dma_free_coherent(struct device *dev, size_t size,
163 void *vaddr, dma_addr_t bus)
164 {
165 WARN_ON(irqs_disabled()); /* for portability */
166 if (dma_ops->unmap_single)
167 dma_ops->unmap_single(dev, bus, size, 0);
168 free_pages((unsigned long)vaddr, get_order(size));
169 }
170 EXPORT_SYMBOL(dma_free_coherent);
171
172 static int forbid_dac __read_mostly;
173
174 int dma_supported(struct device *dev, u64 mask)
175 {
176 #ifdef CONFIG_PCI
177 if (mask > 0xffffffff && forbid_dac > 0) {
178
179
180
181 printk(KERN_INFO "PCI: Disallowing DAC for device %s\n", dev->bus_id);
182 return 0;
183 }
184 #endif
185
186 if (dma_ops->dma_supported)
187 return dma_ops->dma_supported(dev, mask);
188
189 /* Copied from i386. Doesn't make much sense, because it will
190 only work for pci_alloc_coherent.
191 The caller just has to use GFP_DMA in this case. */
192 if (mask < DMA_24BIT_MASK)
193 return 0;
194
195 /* Tell the device to use SAC when IOMMU force is on. This
196 allows the driver to use cheaper accesses in some cases.
197
198 Problem with this is that if we overflow the IOMMU area and
199 return DAC as fallback address the device may not handle it
200 correctly.
201
202 As a special case some controllers have a 39bit address
203 mode that is as efficient as 32bit (aic79xx). Don't force
204 SAC for these. Assume all masks <= 40 bits are of this
205 type. Normally this doesn't make any difference, but gives
206 more gentle handling of IOMMU overflow. */
207 if (iommu_sac_force && (mask >= DMA_40BIT_MASK)) {
208 printk(KERN_INFO "%s: Force SAC with mask %Lx\n", dev->bus_id,mask);
209 return 0;
210 }
211
212 return 1;
213 }
214 EXPORT_SYMBOL(dma_supported);
215
216 int dma_set_mask(struct device *dev, u64 mask)
217 {
218 if (!dev->dma_mask || !dma_supported(dev, mask))
219 return -EIO;
220 *dev->dma_mask = mask;
221 return 0;
222 }
223 EXPORT_SYMBOL(dma_set_mask);
224
225 /*
226 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
227 * documentation.
228 */
229 static __init int iommu_setup(char *p)
230 {
231 iommu_merge = 1;
232
233 if (!p)
234 return -EINVAL;
235
236 while (*p) {
237 if (!strncmp(p, "off", 3))
238 no_iommu = 1;
239 /* gart_parse_options has more force support */
240 if (!strncmp(p, "force", 5))
241 force_iommu = 1;
242 if (!strncmp(p, "noforce", 7)) {
243 iommu_merge = 0;
244 force_iommu = 0;
245 }
246
247 if (!strncmp(p, "biomerge", 8)) {
248 iommu_bio_merge = 4096;
249 iommu_merge = 1;
250 force_iommu = 1;
251 }
252 if (!strncmp(p, "panic", 5))
253 panic_on_overflow = 1;
254 if (!strncmp(p, "nopanic", 7))
255 panic_on_overflow = 0;
256 if (!strncmp(p, "merge", 5)) {
257 iommu_merge = 1;
258 force_iommu = 1;
259 }
260 if (!strncmp(p, "nomerge", 7))
261 iommu_merge = 0;
262 if (!strncmp(p, "forcesac", 8))
263 iommu_sac_force = 1;
264 if (!strncmp(p, "allowdac", 8))
265 forbid_dac = 0;
266 if (!strncmp(p, "nodac", 5))
267 forbid_dac = -1;
268
269 #ifdef CONFIG_SWIOTLB
270 if (!strncmp(p, "soft", 4))
271 swiotlb = 1;
272 #endif
273
274 #ifdef CONFIG_GART_IOMMU
275 gart_parse_options(p);
276 #endif
277
278 #ifdef CONFIG_CALGARY_IOMMU
279 if (!strncmp(p, "calgary", 7))
280 use_calgary = 1;
281 #endif /* CONFIG_CALGARY_IOMMU */
282
283 p += strcspn(p, ",");
284 if (*p == ',')
285 ++p;
286 }
287 return 0;
288 }
289 early_param("iommu", iommu_setup);
290
291 static __initdata void *dma32_bootmem_ptr;
292 static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
293
294 static int __init parse_dma32_size_opt(char *p)
295 {
296 if (!p)
297 return -EINVAL;
298 dma32_bootmem_size = memparse(p, &p);
299 return 0;
300 }
301 early_param("dma32_size", parse_dma32_size_opt);
302
303 void __init dma32_reserve_bootmem(void)
304 {
305 unsigned long size, align;
306 if (end_pfn <= MAX_DMA32_PFN)
307 return;
308
309 align = 64ULL<<20;
310 size = round_up(dma32_bootmem_size, align);
311 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
312 __pa(MAX_DMA_ADDRESS));
313 if (dma32_bootmem_ptr)
314 dma32_bootmem_size = size;
315 else
316 dma32_bootmem_size = 0;
317 }
318 static void __init dma32_free_bootmem(void)
319 {
320 int node;
321
322 if (end_pfn <= MAX_DMA32_PFN)
323 return;
324
325 if (!dma32_bootmem_ptr)
326 return;
327
328 for_each_online_node(node)
329 free_bootmem_node(NODE_DATA(node), __pa(dma32_bootmem_ptr),
330 dma32_bootmem_size);
331
332 dma32_bootmem_ptr = NULL;
333 dma32_bootmem_size = 0;
334 }
335
336 void __init pci_iommu_alloc(void)
337 {
338 /* free the range so iommu could get some range less than 4G */
339 dma32_free_bootmem();
340 /*
341 * The order of these functions is important for
342 * fall-back/fail-over reasons
343 */
344 #ifdef CONFIG_GART_IOMMU
345 gart_iommu_hole_init();
346 #endif
347
348 #ifdef CONFIG_CALGARY_IOMMU
349 detect_calgary();
350 #endif
351
352 detect_intel_iommu();
353
354 #ifdef CONFIG_SWIOTLB
355 pci_swiotlb_init();
356 #endif
357 }
358
359 static int __init pci_iommu_init(void)
360 {
361 #ifdef CONFIG_CALGARY_IOMMU
362 calgary_iommu_init();
363 #endif
364
365 intel_iommu_init();
366
367 #ifdef CONFIG_GART_IOMMU
368 gart_iommu_init();
369 #endif
370
371 no_iommu_init();
372 return 0;
373 }
374
375 void pci_iommu_shutdown(void)
376 {
377 gart_iommu_shutdown();
378 }
379
380 #ifdef CONFIG_PCI
381 /* Many VIA bridges seem to corrupt data for DAC. Disable it here */
382
383 static __devinit void via_no_dac(struct pci_dev *dev)
384 {
385 if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI && forbid_dac == 0) {
386 printk(KERN_INFO "PCI: VIA PCI bridge detected. Disabling DAC.\n");
387 forbid_dac = 1;
388 }
389 }
390 DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
391 #endif
392 /* Must execute after PCI subsystem */
393 fs_initcall(pci_iommu_init);
This page took 0.039477 seconds and 5 git commands to generate.