x86: unify pci iommu setup and allow swiotlb to compile for 32 bit
[linux-2.6/mini2440.git] / arch / x86 / kernel / pci-dma.c
blob00e07447a5bd4881f474e843f5a93abdf52fcb49
1 #include <linux/dma-mapping.h>
2 #include <linux/dmar.h>
3 #include <linux/bootmem.h>
4 #include <linux/pci.h>
6 #include <asm/proto.h>
7 #include <asm/dma.h>
8 #include <asm/iommu.h>
9 #include <asm/calgary.h>
10 #include <asm/amd_iommu.h>
12 static int forbid_dac __read_mostly;
14 struct dma_mapping_ops *dma_ops;
15 EXPORT_SYMBOL(dma_ops);
17 static int iommu_sac_force __read_mostly;
19 #ifdef CONFIG_IOMMU_DEBUG
20 int panic_on_overflow __read_mostly = 1;
21 int force_iommu __read_mostly = 1;
22 #else
23 int panic_on_overflow __read_mostly = 0;
24 int force_iommu __read_mostly = 0;
25 #endif
27 int iommu_merge __read_mostly = 0;
29 int no_iommu __read_mostly;
30 /* Set this to 1 if there is a HW IOMMU in the system */
31 int iommu_detected __read_mostly = 0;
33 /* This tells the BIO block layer to assume merging. Default to off
34 because we cannot guarantee merging later. */
35 int iommu_bio_merge __read_mostly = 0;
36 EXPORT_SYMBOL(iommu_bio_merge);
38 dma_addr_t bad_dma_address __read_mostly = 0;
39 EXPORT_SYMBOL(bad_dma_address);
41 /* Dummy device used for NULL arguments (normally ISA). Better would
42 be probably a smaller DMA mask, but this is bug-to-bug compatible
43 to older i386. */
44 struct device x86_dma_fallback_dev = {
45 .bus_id = "fallback device",
46 .coherent_dma_mask = DMA_32BIT_MASK,
47 .dma_mask = &x86_dma_fallback_dev.coherent_dma_mask,
49 EXPORT_SYMBOL(x86_dma_fallback_dev);
51 int dma_set_mask(struct device *dev, u64 mask)
53 if (!dev->dma_mask || !dma_supported(dev, mask))
54 return -EIO;
56 *dev->dma_mask = mask;
58 return 0;
60 EXPORT_SYMBOL(dma_set_mask);
62 #ifdef CONFIG_X86_64
63 static __initdata void *dma32_bootmem_ptr;
64 static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
66 static int __init parse_dma32_size_opt(char *p)
68 if (!p)
69 return -EINVAL;
70 dma32_bootmem_size = memparse(p, &p);
71 return 0;
73 early_param("dma32_size", parse_dma32_size_opt);
75 void __init dma32_reserve_bootmem(void)
77 unsigned long size, align;
78 if (max_pfn <= MAX_DMA32_PFN)
79 return;
82 * check aperture_64.c allocate_aperture() for reason about
83 * using 512M as goal
85 align = 64ULL<<20;
86 size = roundup(dma32_bootmem_size, align);
87 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
88 512ULL<<20);
89 if (dma32_bootmem_ptr)
90 dma32_bootmem_size = size;
91 else
92 dma32_bootmem_size = 0;
94 static void __init dma32_free_bootmem(void)
97 if (max_pfn <= MAX_DMA32_PFN)
98 return;
100 if (!dma32_bootmem_ptr)
101 return;
103 free_bootmem(__pa(dma32_bootmem_ptr), dma32_bootmem_size);
105 dma32_bootmem_ptr = NULL;
106 dma32_bootmem_size = 0;
108 #endif
110 void __init pci_iommu_alloc(void)
112 #ifdef CONFIG_X86_64
113 /* free the range so iommu could get some range less than 4G */
114 dma32_free_bootmem();
115 #endif
118 * The order of these functions is important for
119 * fall-back/fail-over reasons
121 gart_iommu_hole_init();
123 detect_calgary();
125 detect_intel_iommu();
127 amd_iommu_detect();
129 pci_swiotlb_init();
132 void *dma_generic_alloc_coherent(struct device *dev, size_t size,
133 dma_addr_t *dma_addr, gfp_t flag)
135 unsigned long dma_mask;
136 struct page *page;
137 dma_addr_t addr;
139 dma_mask = dma_alloc_coherent_mask(dev, flag);
141 flag |= __GFP_ZERO;
142 again:
143 page = alloc_pages_node(dev_to_node(dev), flag, get_order(size));
144 if (!page)
145 return NULL;
147 addr = page_to_phys(page);
148 if (!is_buffer_dma_capable(dma_mask, addr, size)) {
149 __free_pages(page, get_order(size));
151 if (dma_mask < DMA_32BIT_MASK && !(flag & GFP_DMA)) {
152 flag = (flag & ~GFP_DMA32) | GFP_DMA;
153 goto again;
156 return NULL;
159 *dma_addr = addr;
160 return page_address(page);
164 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
165 * documentation.
167 static __init int iommu_setup(char *p)
169 iommu_merge = 1;
171 if (!p)
172 return -EINVAL;
174 while (*p) {
175 if (!strncmp(p, "off", 3))
176 no_iommu = 1;
177 /* gart_parse_options has more force support */
178 if (!strncmp(p, "force", 5))
179 force_iommu = 1;
180 if (!strncmp(p, "noforce", 7)) {
181 iommu_merge = 0;
182 force_iommu = 0;
185 if (!strncmp(p, "biomerge", 8)) {
186 iommu_bio_merge = 4096;
187 iommu_merge = 1;
188 force_iommu = 1;
190 if (!strncmp(p, "panic", 5))
191 panic_on_overflow = 1;
192 if (!strncmp(p, "nopanic", 7))
193 panic_on_overflow = 0;
194 if (!strncmp(p, "merge", 5)) {
195 iommu_merge = 1;
196 force_iommu = 1;
198 if (!strncmp(p, "nomerge", 7))
199 iommu_merge = 0;
200 if (!strncmp(p, "forcesac", 8))
201 iommu_sac_force = 1;
202 if (!strncmp(p, "allowdac", 8))
203 forbid_dac = 0;
204 if (!strncmp(p, "nodac", 5))
205 forbid_dac = -1;
206 if (!strncmp(p, "usedac", 6)) {
207 forbid_dac = -1;
208 return 1;
210 #ifdef CONFIG_SWIOTLB
211 if (!strncmp(p, "soft", 4))
212 swiotlb = 1;
213 #endif
215 gart_parse_options(p);
217 #ifdef CONFIG_CALGARY_IOMMU
218 if (!strncmp(p, "calgary", 7))
219 use_calgary = 1;
220 #endif /* CONFIG_CALGARY_IOMMU */
222 p += strcspn(p, ",");
223 if (*p == ',')
224 ++p;
226 return 0;
228 early_param("iommu", iommu_setup);
230 int dma_supported(struct device *dev, u64 mask)
232 struct dma_mapping_ops *ops = get_dma_ops(dev);
234 #ifdef CONFIG_PCI
235 if (mask > 0xffffffff && forbid_dac > 0) {
236 dev_info(dev, "PCI: Disallowing DAC for device\n");
237 return 0;
239 #endif
241 if (ops->dma_supported)
242 return ops->dma_supported(dev, mask);
244 /* Copied from i386. Doesn't make much sense, because it will
245 only work for pci_alloc_coherent.
246 The caller just has to use GFP_DMA in this case. */
247 if (mask < DMA_24BIT_MASK)
248 return 0;
250 /* Tell the device to use SAC when IOMMU force is on. This
251 allows the driver to use cheaper accesses in some cases.
253 Problem with this is that if we overflow the IOMMU area and
254 return DAC as fallback address the device may not handle it
255 correctly.
257 As a special case some controllers have a 39bit address
258 mode that is as efficient as 32bit (aic79xx). Don't force
259 SAC for these. Assume all masks <= 40 bits are of this
260 type. Normally this doesn't make any difference, but gives
261 more gentle handling of IOMMU overflow. */
262 if (iommu_sac_force && (mask >= DMA_40BIT_MASK)) {
263 dev_info(dev, "Force SAC with mask %Lx\n", mask);
264 return 0;
267 return 1;
269 EXPORT_SYMBOL(dma_supported);
271 static int __init pci_iommu_init(void)
273 calgary_iommu_init();
275 intel_iommu_init();
277 amd_iommu_init();
279 gart_iommu_init();
281 no_iommu_init();
282 return 0;
285 void pci_iommu_shutdown(void)
287 gart_iommu_shutdown();
289 /* Must execute after PCI subsystem */
290 fs_initcall(pci_iommu_init);
292 #ifdef CONFIG_PCI
293 /* Many VIA bridges seem to corrupt data for DAC. Disable it here */
295 static __devinit void via_no_dac(struct pci_dev *dev)
297 if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI && forbid_dac == 0) {
298 printk(KERN_INFO "PCI: VIA PCI bridge detected."
299 "Disabling DAC.\n");
300 forbid_dac = 1;
303 DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
304 #endif