intel-iommu: Performance improvement for dma_pte_free_pagetable()
[deliverable/linux.git] / arch / x86 / kernel / pci-dma.c
CommitLineData
459121c9 1#include <linux/dma-mapping.h>
2118d0c5 2#include <linux/dma-debug.h>
cb5867a5 3#include <linux/dmar.h>
116890d5 4#include <linux/bootmem.h>
bca5c096 5#include <linux/pci.h>
cb5867a5 6
116890d5
GC
7#include <asm/proto.h>
8#include <asm/dma.h>
46a7fa27 9#include <asm/iommu.h>
1d9b16d1 10#include <asm/gart.h>
cb5867a5 11#include <asm/calgary.h>
a69ca340 12#include <asm/amd_iommu.h>
459121c9 13
3b15e581
FY
14static int forbid_dac __read_mostly;
15
160c1d8e 16struct dma_map_ops *dma_ops;
85c246ee
GC
17EXPORT_SYMBOL(dma_ops);
18
b4cdc430 19static int iommu_sac_force __read_mostly;
8e0c3797 20
f9c258de
GC
21#ifdef CONFIG_IOMMU_DEBUG
22int panic_on_overflow __read_mostly = 1;
23int force_iommu __read_mostly = 1;
24#else
25int panic_on_overflow __read_mostly = 0;
26int force_iommu __read_mostly = 0;
27#endif
28
fae9a0d8
GC
29int iommu_merge __read_mostly = 0;
30
31int no_iommu __read_mostly;
32/* Set this to 1 if there is a HW IOMMU in the system */
33int iommu_detected __read_mostly = 0;
34
aed5d5f4
FY
35int iommu_pass_through;
36
cac67877
GC
37dma_addr_t bad_dma_address __read_mostly = 0;
38EXPORT_SYMBOL(bad_dma_address);
fae9a0d8 39
098cb7f2
GC
40/* Dummy device used for NULL arguments (normally ISA). Better would
41 be probably a smaller DMA mask, but this is bug-to-bug compatible
42 to older i386. */
6c505ce3 43struct device x86_dma_fallback_dev = {
1a927133 44 .init_name = "fallback device",
284901a9 45 .coherent_dma_mask = DMA_BIT_MASK(32),
6c505ce3 46 .dma_mask = &x86_dma_fallback_dev.coherent_dma_mask,
098cb7f2 47};
6c505ce3 48EXPORT_SYMBOL(x86_dma_fallback_dev);
098cb7f2 49
2118d0c5
JR
50/* Number of entries preallocated for DMA-API debugging */
51#define PREALLOC_DMA_DEBUG_ENTRIES 32768
52
459121c9
GC
53int dma_set_mask(struct device *dev, u64 mask)
54{
55 if (!dev->dma_mask || !dma_supported(dev, mask))
56 return -EIO;
57
58 *dev->dma_mask = mask;
59
60 return 0;
61}
62EXPORT_SYMBOL(dma_set_mask);
63
116890d5
GC
64#ifdef CONFIG_X86_64
65static __initdata void *dma32_bootmem_ptr;
66static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
67
68static int __init parse_dma32_size_opt(char *p)
69{
70 if (!p)
71 return -EINVAL;
72 dma32_bootmem_size = memparse(p, &p);
73 return 0;
74}
75early_param("dma32_size", parse_dma32_size_opt);
76
77void __init dma32_reserve_bootmem(void)
78{
79 unsigned long size, align;
c987d12f 80 if (max_pfn <= MAX_DMA32_PFN)
116890d5
GC
81 return;
82
7677b2ef
YL
83 /*
84 * check aperture_64.c allocate_aperture() for reason about
85 * using 512M as goal
86 */
116890d5 87 align = 64ULL<<20;
1ddb5518 88 size = roundup(dma32_bootmem_size, align);
116890d5 89 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
7677b2ef 90 512ULL<<20);
116890d5
GC
91 if (dma32_bootmem_ptr)
92 dma32_bootmem_size = size;
93 else
94 dma32_bootmem_size = 0;
95}
96static void __init dma32_free_bootmem(void)
97{
116890d5 98
c987d12f 99 if (max_pfn <= MAX_DMA32_PFN)
116890d5
GC
100 return;
101
102 if (!dma32_bootmem_ptr)
103 return;
104
330fce23 105 free_bootmem(__pa(dma32_bootmem_ptr), dma32_bootmem_size);
116890d5
GC
106
107 dma32_bootmem_ptr = NULL;
108 dma32_bootmem_size = 0;
109}
cfb80c9e 110#endif
116890d5
GC
111
112void __init pci_iommu_alloc(void)
113{
cfb80c9e 114#ifdef CONFIG_X86_64
116890d5
GC
115 /* free the range so iommu could get some range less than 4G */
116 dma32_free_bootmem();
cfb80c9e
JF
117#endif
118
116890d5
GC
119 /*
120 * The order of these functions is important for
121 * fall-back/fail-over reasons
122 */
116890d5 123 gart_iommu_hole_init();
116890d5 124
116890d5 125 detect_calgary();
116890d5
GC
126
127 detect_intel_iommu();
128
a69ca340
JR
129 amd_iommu_detect();
130
116890d5 131 pci_swiotlb_init();
116890d5 132}
8978b742 133
9f6ac577
FT
134void *dma_generic_alloc_coherent(struct device *dev, size_t size,
135 dma_addr_t *dma_addr, gfp_t flag)
136{
137 unsigned long dma_mask;
138 struct page *page;
139 dma_addr_t addr;
140
141 dma_mask = dma_alloc_coherent_mask(dev, flag);
142
143 flag |= __GFP_ZERO;
144again:
145 page = alloc_pages_node(dev_to_node(dev), flag, get_order(size));
146 if (!page)
147 return NULL;
148
149 addr = page_to_phys(page);
150 if (!is_buffer_dma_capable(dma_mask, addr, size)) {
151 __free_pages(page, get_order(size));
152
284901a9 153 if (dma_mask < DMA_BIT_MASK(32) && !(flag & GFP_DMA)) {
9f6ac577
FT
154 flag = (flag & ~GFP_DMA32) | GFP_DMA;
155 goto again;
156 }
157
158 return NULL;
159 }
160
161 *dma_addr = addr;
162 return page_address(page);
163}
164
fae9a0d8
GC
165/*
166 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
167 * documentation.
168 */
169static __init int iommu_setup(char *p)
170{
171 iommu_merge = 1;
172
173 if (!p)
174 return -EINVAL;
175
176 while (*p) {
177 if (!strncmp(p, "off", 3))
178 no_iommu = 1;
179 /* gart_parse_options has more force support */
180 if (!strncmp(p, "force", 5))
181 force_iommu = 1;
182 if (!strncmp(p, "noforce", 7)) {
183 iommu_merge = 0;
184 force_iommu = 0;
185 }
186
187 if (!strncmp(p, "biomerge", 8)) {
fae9a0d8
GC
188 iommu_merge = 1;
189 force_iommu = 1;
190 }
191 if (!strncmp(p, "panic", 5))
192 panic_on_overflow = 1;
193 if (!strncmp(p, "nopanic", 7))
194 panic_on_overflow = 0;
195 if (!strncmp(p, "merge", 5)) {
196 iommu_merge = 1;
197 force_iommu = 1;
198 }
199 if (!strncmp(p, "nomerge", 7))
200 iommu_merge = 0;
201 if (!strncmp(p, "forcesac", 8))
202 iommu_sac_force = 1;
203 if (!strncmp(p, "allowdac", 8))
204 forbid_dac = 0;
205 if (!strncmp(p, "nodac", 5))
206 forbid_dac = -1;
207 if (!strncmp(p, "usedac", 6)) {
208 forbid_dac = -1;
209 return 1;
210 }
211#ifdef CONFIG_SWIOTLB
212 if (!strncmp(p, "soft", 4))
213 swiotlb = 1;
4ed0d3e6
FY
214 if (!strncmp(p, "pt", 2)) {
215 iommu_pass_through = 1;
216 return 1;
217 }
fae9a0d8
GC
218#endif
219
fae9a0d8 220 gart_parse_options(p);
fae9a0d8
GC
221
222#ifdef CONFIG_CALGARY_IOMMU
223 if (!strncmp(p, "calgary", 7))
224 use_calgary = 1;
225#endif /* CONFIG_CALGARY_IOMMU */
226
227 p += strcspn(p, ",");
228 if (*p == ',')
229 ++p;
230 }
231 return 0;
232}
233early_param("iommu", iommu_setup);
234
8e0c3797
GC
235int dma_supported(struct device *dev, u64 mask)
236{
160c1d8e 237 struct dma_map_ops *ops = get_dma_ops(dev);
8d8bb39b 238
8e0c3797
GC
239#ifdef CONFIG_PCI
240 if (mask > 0xffffffff && forbid_dac > 0) {
fc3a8828 241 dev_info(dev, "PCI: Disallowing DAC for device\n");
8e0c3797
GC
242 return 0;
243 }
244#endif
245
8d8bb39b
FT
246 if (ops->dma_supported)
247 return ops->dma_supported(dev, mask);
8e0c3797
GC
248
249 /* Copied from i386. Doesn't make much sense, because it will
250 only work for pci_alloc_coherent.
251 The caller just has to use GFP_DMA in this case. */
2f4f27d4 252 if (mask < DMA_BIT_MASK(24))
8e0c3797
GC
253 return 0;
254
255 /* Tell the device to use SAC when IOMMU force is on. This
256 allows the driver to use cheaper accesses in some cases.
257
258 Problem with this is that if we overflow the IOMMU area and
259 return DAC as fallback address the device may not handle it
260 correctly.
261
262 As a special case some controllers have a 39bit address
263 mode that is as efficient as 32bit (aic79xx). Don't force
264 SAC for these. Assume all masks <= 40 bits are of this
265 type. Normally this doesn't make any difference, but gives
266 more gentle handling of IOMMU overflow. */
50cf156a 267 if (iommu_sac_force && (mask >= DMA_BIT_MASK(40))) {
fc3a8828 268 dev_info(dev, "Force SAC with mask %Lx\n", mask);
8e0c3797
GC
269 return 0;
270 }
271
272 return 1;
273}
274EXPORT_SYMBOL(dma_supported);
275
cb5867a5
GC
276static int __init pci_iommu_init(void)
277{
2118d0c5
JR
278 dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES);
279
86f31952
JR
280#ifdef CONFIG_PCI
281 dma_debug_add_bus(&pci_bus_type);
282#endif
283
cb5867a5 284 calgary_iommu_init();
cb5867a5
GC
285
286 intel_iommu_init();
287
a69ca340
JR
288 amd_iommu_init();
289
cb5867a5 290 gart_iommu_init();
459121c9 291
cb5867a5
GC
292 no_iommu_init();
293 return 0;
294}
295
296void pci_iommu_shutdown(void)
297{
298 gart_iommu_shutdown();
09759042
JR
299
300 amd_iommu_shutdown();
cb5867a5
GC
301}
302/* Must execute after PCI subsystem */
303fs_initcall(pci_iommu_init);
3b15e581
FY
304
305#ifdef CONFIG_PCI
306/* Many VIA bridges seem to corrupt data for DAC. Disable it here */
307
308static __devinit void via_no_dac(struct pci_dev *dev)
309{
310 if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI && forbid_dac == 0) {
13bf7576 311 dev_info(&dev->dev, "disabling DAC on VIA PCI bridge\n");
3b15e581
FY
312 forbid_dac = 1;
313 }
314}
315DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
316#endif
This page took 0.193506 seconds and 5 git commands to generate.