blob: 05d745ede561320a6c50d0a47c5a3cbb26cdf1f1 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Dynamic DMA mapping support.
3 */
4
5#include <linux/types.h>
6#include <linux/mm.h>
7#include <linux/string.h>
8#include <linux/pci.h>
9#include <linux/module.h>
10#include <asm/io.h>
Yinghai Luf2cf8e02007-07-21 17:11:31 +020011#include <asm/iommu.h>
Jon Masone4650582006-06-26 13:58:14 +020012#include <asm/calgary.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010014int iommu_merge __read_mostly = 0;
15EXPORT_SYMBOL(iommu_merge);
16
17dma_addr_t bad_dma_address __read_mostly;
18EXPORT_SYMBOL(bad_dma_address);
19
20/* This tells the BIO block layer to assume merging. Default to off
21 because we cannot guarantee merging later. */
22int iommu_bio_merge __read_mostly = 0;
23EXPORT_SYMBOL(iommu_bio_merge);
24
Jan Beulichcaa51712007-07-09 11:55:51 -070025static int iommu_sac_force __read_mostly = 0;
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010026
27int no_iommu __read_mostly;
28#ifdef CONFIG_IOMMU_DEBUG
29int panic_on_overflow __read_mostly = 1;
30int force_iommu __read_mostly = 1;
31#else
32int panic_on_overflow __read_mostly = 0;
33int force_iommu __read_mostly= 0;
34#endif
35
Jon Mason8d4f6b92006-06-26 13:58:05 +020036/* Set this to 1 if there is a HW IOMMU in the system */
37int iommu_detected __read_mostly = 0;
38
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010039/* Dummy device used for NULL arguments (normally ISA). Better would
40 be probably a smaller DMA mask, but this is bug-to-bug compatible
41 to i386. */
42struct device fallback_dev = {
43 .bus_id = "fallback device",
Jon Mason9f2036f2006-06-26 13:56:19 +020044 .coherent_dma_mask = DMA_32BIT_MASK,
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010045 .dma_mask = &fallback_dev.coherent_dma_mask,
46};
47
48/* Allocate DMA memory on node near device */
49noinline static void *
50dma_alloc_pages(struct device *dev, gfp_t gfp, unsigned order)
Linus Torvalds1da177e2005-04-16 15:20:36 -070051{
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010052 struct page *page;
53 int node;
Andi Kleenfa47dd02006-04-07 19:49:33 +020054#ifdef CONFIG_PCI
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010055 if (dev->bus == &pci_bus_type)
56 node = pcibus_to_node(to_pci_dev(dev)->bus);
57 else
Andi Kleenfa47dd02006-04-07 19:49:33 +020058#endif
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010059 node = numa_node_id();
Daniel Yeisley0d015322006-05-30 22:47:57 +020060
61 if (node < first_node(node_online_map))
62 node = first_node(node_online_map);
63
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010064 page = alloc_pages_node(node, gfp, order);
65 return page ? page_address(page) : NULL;
66}
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010068/*
69 * Allocate memory for a coherent mapping.
70 */
71void *
72dma_alloc_coherent(struct device *dev, size_t size, dma_addr_t *dma_handle,
73 gfp_t gfp)
74{
75 void *memory;
76 unsigned long dma_mask = 0;
77 u64 bus;
78
79 if (!dev)
80 dev = &fallback_dev;
81 dma_mask = dev->coherent_dma_mask;
82 if (dma_mask == 0)
Jon Mason9f2036f2006-06-26 13:56:19 +020083 dma_mask = DMA_32BIT_MASK;
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010084
Andi Kleen3056d6b2006-03-25 16:30:43 +010085 /* Don't invoke OOM killer */
86 gfp |= __GFP_NORETRY;
87
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010088 /* Kludge to make it bug-to-bug compatible with i386. i386
89 uses the normal dma_mask for alloc_coherent. */
90 dma_mask &= *dev->dma_mask;
91
92 /* Why <=? Even when the mask is smaller than 4GB it is often
93 larger than 16MB and in this case we have a chance of
94 finding fitting memory in the next higher zone first. If
95 not retry with true GFP_DMA. -AK */
Jon Mason9f2036f2006-06-26 13:56:19 +020096 if (dma_mask <= DMA_32BIT_MASK)
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010097 gfp |= GFP_DMA32;
98
99 again:
100 memory = dma_alloc_pages(dev, gfp, get_order(size));
101 if (memory == NULL)
102 return NULL;
103
104 {
105 int high, mmu;
106 bus = virt_to_bus(memory);
107 high = (bus + size) >= dma_mask;
108 mmu = high;
109 if (force_iommu && !(gfp & GFP_DMA))
110 mmu = 1;
111 else if (high) {
112 free_pages((unsigned long)memory,
113 get_order(size));
114
115 /* Don't use the 16MB ZONE_DMA unless absolutely
116 needed. It's better to use remapping first. */
Jon Mason9f2036f2006-06-26 13:56:19 +0200117 if (dma_mask < DMA_32BIT_MASK && !(gfp & GFP_DMA)) {
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100118 gfp = (gfp & ~GFP_DMA32) | GFP_DMA;
119 goto again;
120 }
121
Andi Kleen6bca52b2006-02-03 21:50:59 +0100122 /* Let low level make its own zone decisions */
123 gfp &= ~(GFP_DMA32|GFP_DMA);
124
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100125 if (dma_ops->alloc_coherent)
126 return dma_ops->alloc_coherent(dev, size,
127 dma_handle, gfp);
128 return NULL;
129 }
130
131 memset(memory, 0, size);
132 if (!mmu) {
133 *dma_handle = virt_to_bus(memory);
134 return memory;
135 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700136 }
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100137
138 if (dma_ops->alloc_coherent) {
139 free_pages((unsigned long)memory, get_order(size));
140 gfp &= ~(GFP_DMA|GFP_DMA32);
141 return dma_ops->alloc_coherent(dev, size, dma_handle, gfp);
142 }
143
144 if (dma_ops->map_simple) {
145 *dma_handle = dma_ops->map_simple(dev, memory,
146 size,
147 PCI_DMA_BIDIRECTIONAL);
148 if (*dma_handle != bad_dma_address)
149 return memory;
150 }
151
152 if (panic_on_overflow)
153 panic("dma_alloc_coherent: IOMMU overflow by %lu bytes\n",size);
154 free_pages((unsigned long)memory, get_order(size));
155 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156}
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100157EXPORT_SYMBOL(dma_alloc_coherent);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100159/*
160 * Unmap coherent memory.
161 * The caller must ensure that the device has finished accessing the mapping.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700162 */
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100163void dma_free_coherent(struct device *dev, size_t size,
164 void *vaddr, dma_addr_t bus)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165{
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100166 if (dma_ops->unmap_single)
167 dma_ops->unmap_single(dev, bus, size, 0);
168 free_pages((unsigned long)vaddr, get_order(size));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169}
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100170EXPORT_SYMBOL(dma_free_coherent);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171
Andi Kleenece66842006-09-30 01:47:55 +0200172static int forbid_dac __read_mostly;
173
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100174int dma_supported(struct device *dev, u64 mask)
175{
Andi Kleenece66842006-09-30 01:47:55 +0200176#ifdef CONFIG_PCI
177 if (mask > 0xffffffff && forbid_dac > 0) {
178
179
180
181 printk(KERN_INFO "PCI: Disallowing DAC for device %s\n", dev->bus_id);
182 return 0;
183 }
184#endif
185
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100186 if (dma_ops->dma_supported)
187 return dma_ops->dma_supported(dev, mask);
188
189 /* Copied from i386. Doesn't make much sense, because it will
190 only work for pci_alloc_coherent.
191 The caller just has to use GFP_DMA in this case. */
Jon Mason9f2036f2006-06-26 13:56:19 +0200192 if (mask < DMA_24BIT_MASK)
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100193 return 0;
194
195 /* Tell the device to use SAC when IOMMU force is on. This
196 allows the driver to use cheaper accesses in some cases.
197
198 Problem with this is that if we overflow the IOMMU area and
199 return DAC as fallback address the device may not handle it
200 correctly.
201
202 As a special case some controllers have a 39bit address
203 mode that is as efficient as 32bit (aic79xx). Don't force
204 SAC for these. Assume all masks <= 40 bits are of this
205 type. Normally this doesn't make any difference, but gives
206 more gentle handling of IOMMU overflow. */
Jon Mason9f2036f2006-06-26 13:56:19 +0200207 if (iommu_sac_force && (mask >= DMA_40BIT_MASK)) {
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100208 printk(KERN_INFO "%s: Force SAC with mask %Lx\n", dev->bus_id,mask);
209 return 0;
210 }
211
212 return 1;
213}
214EXPORT_SYMBOL(dma_supported);
215
216int dma_set_mask(struct device *dev, u64 mask)
217{
218 if (!dev->dma_mask || !dma_supported(dev, mask))
219 return -EIO;
220 *dev->dma_mask = mask;
221 return 0;
222}
223EXPORT_SYMBOL(dma_set_mask);
224
Karsten Weiss55588702007-02-13 13:26:21 +0100225/*
226 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
227 * documentation.
228 */
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100229__init int iommu_setup(char *p)
230{
Andi Kleended318e2006-09-30 01:47:55 +0200231 iommu_merge = 1;
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100232
Andi Kleen2c8c0e62006-09-26 10:52:32 +0200233 if (!p)
234 return -EINVAL;
235
Andi Kleended318e2006-09-30 01:47:55 +0200236 while (*p) {
237 if (!strncmp(p,"off",3))
238 no_iommu = 1;
239 /* gart_parse_options has more force support */
240 if (!strncmp(p,"force",5))
241 force_iommu = 1;
242 if (!strncmp(p,"noforce",7)) {
243 iommu_merge = 0;
244 force_iommu = 0;
245 }
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100246
Andi Kleended318e2006-09-30 01:47:55 +0200247 if (!strncmp(p, "biomerge",8)) {
248 iommu_bio_merge = 4096;
249 iommu_merge = 1;
250 force_iommu = 1;
251 }
252 if (!strncmp(p, "panic",5))
253 panic_on_overflow = 1;
254 if (!strncmp(p, "nopanic",7))
255 panic_on_overflow = 0;
256 if (!strncmp(p, "merge",5)) {
257 iommu_merge = 1;
258 force_iommu = 1;
259 }
260 if (!strncmp(p, "nomerge",7))
261 iommu_merge = 0;
262 if (!strncmp(p, "forcesac",8))
263 iommu_sac_force = 1;
264 if (!strncmp(p, "allowdac", 8))
265 forbid_dac = 0;
266 if (!strncmp(p, "nodac", 5))
267 forbid_dac = -1;
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100268
269#ifdef CONFIG_SWIOTLB
Andi Kleended318e2006-09-30 01:47:55 +0200270 if (!strncmp(p, "soft",4))
271 swiotlb = 1;
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100272#endif
273
Andi Kleena813ce42006-06-26 13:57:22 +0200274#ifdef CONFIG_IOMMU
Andi Kleended318e2006-09-30 01:47:55 +0200275 gart_parse_options(p);
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100276#endif
277
Muli Ben-Yehudabff65472006-12-07 02:14:07 +0100278#ifdef CONFIG_CALGARY_IOMMU
279 if (!strncmp(p, "calgary", 7))
280 use_calgary = 1;
281#endif /* CONFIG_CALGARY_IOMMU */
282
Andi Kleended318e2006-09-30 01:47:55 +0200283 p += strcspn(p, ",");
284 if (*p == ',')
285 ++p;
286 }
287 return 0;
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +0100288}
Andi Kleen2c8c0e62006-09-26 10:52:32 +0200289early_param("iommu", iommu_setup);
Jon Mason0dc243a2006-06-26 13:58:11 +0200290
291void __init pci_iommu_alloc(void)
292{
293 /*
294 * The order of these functions is important for
295 * fall-back/fail-over reasons
296 */
297#ifdef CONFIG_IOMMU
298 iommu_hole_init();
299#endif
300
Jon Masone4650582006-06-26 13:58:14 +0200301#ifdef CONFIG_CALGARY_IOMMU
302 detect_calgary();
303#endif
304
Jon Mason0dc243a2006-06-26 13:58:11 +0200305#ifdef CONFIG_SWIOTLB
306 pci_swiotlb_init();
307#endif
308}
309
310static int __init pci_iommu_init(void)
311{
Jon Masone4650582006-06-26 13:58:14 +0200312#ifdef CONFIG_CALGARY_IOMMU
313 calgary_iommu_init();
314#endif
315
Jon Mason0dc243a2006-06-26 13:58:11 +0200316#ifdef CONFIG_IOMMU
317 gart_iommu_init();
318#endif
319
320 no_iommu_init();
321 return 0;
322}
323
Yinghai Lubc2cea62007-07-21 17:11:28 +0200324void pci_iommu_shutdown(void)
325{
326 gart_iommu_shutdown();
327}
328
Andi Kleen388c19e2007-06-20 12:23:32 +0200329#ifdef CONFIG_PCI
330/* Many VIA bridges seem to corrupt data for DAC. Disable it here */
331
332static __devinit void via_no_dac(struct pci_dev *dev)
333{
334 if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI && forbid_dac == 0) {
335 printk(KERN_INFO "PCI: VIA PCI bridge detected. Disabling DAC.\n");
336 forbid_dac = 1;
337 }
338}
339DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
340#endif
Jon Mason0dc243a2006-06-26 13:58:11 +0200341/* Must execute after PCI subsystem */
342fs_initcall(pci_iommu_init);