blob: 9f07cfcbd3a5e60db651c952c9a66fa21dd68d87 [file] [log] [blame]
Glauber Costa459121c92008-04-08 13:20:43 -03001#include <linux/dma-mapping.h>
Joerg Roedel2118d0c2009-01-09 15:13:15 +01002#include <linux/dma-debug.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03003#include <linux/dmar.h>
Glauber Costa116890d2008-04-08 13:20:54 -03004#include <linux/bootmem.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +09005#include <linux/gfp.h>
Glauber Costabca5c092008-04-08 13:20:53 -03006#include <linux/pci.h>
Catalin Marinasacde31d2009-08-27 14:29:20 +01007#include <linux/kmemleak.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03008
Glauber Costa116890d2008-04-08 13:20:54 -03009#include <asm/proto.h>
10#include <asm/dma.h>
FUJITA Tomonori46a7fa22008-07-11 10:23:42 +090011#include <asm/iommu.h>
Joerg Roedel1d9b16d2008-11-27 18:39:15 +010012#include <asm/gart.h>
Glauber Costacb5867a2008-04-08 13:20:51 -030013#include <asm/calgary.h>
Joerg Roedela69ca342008-06-26 21:28:08 +020014#include <asm/amd_iommu.h>
Ingo Molnarb4941a92009-11-10 14:37:58 +010015#include <asm/x86_init.h>
Konrad Rzeszutek Wilkfe96eb42010-03-18 13:53:24 -040016#include <asm/xen/swiotlb-xen.h>
Glauber Costa459121c92008-04-08 13:20:43 -030017
Fenghua Yu3b15e582008-10-23 16:51:00 -070018static int forbid_dac __read_mostly;
19
FUJITA Tomonoria3b28ee2009-11-14 20:46:36 +090020struct dma_map_ops *dma_ops = &nommu_dma_ops;
Glauber Costa85c246e2008-04-08 13:20:50 -030021EXPORT_SYMBOL(dma_ops);
22
Dmitri Vorobievb4cdc432008-04-28 03:15:58 +040023static int iommu_sac_force __read_mostly;
Glauber Costa8e0c3792008-04-08 13:20:55 -030024
Glauber Costaf9c258d2008-04-08 13:20:52 -030025#ifdef CONFIG_IOMMU_DEBUG
26int panic_on_overflow __read_mostly = 1;
27int force_iommu __read_mostly = 1;
28#else
29int panic_on_overflow __read_mostly = 0;
30int force_iommu __read_mostly = 0;
31#endif
32
Glauber Costafae9a0d2008-04-08 13:20:56 -030033int iommu_merge __read_mostly = 0;
34
35int no_iommu __read_mostly;
36/* Set this to 1 if there is a HW IOMMU in the system */
37int iommu_detected __read_mostly = 0;
38
Joerg Roedelac0101d2009-09-01 16:00:35 +020039/*
40 * This variable becomes 1 if iommu=pt is passed on the kernel command line.
Marin Mitove3be7852009-10-03 20:45:02 +030041 * If this variable is 1, IOMMU implementations do no DMA translation for
Joerg Roedelac0101d2009-09-01 16:00:35 +020042 * devices and allow every device to access to whole physical memory. This is
Justin P. Mattockfb637f32010-01-14 22:16:16 -080043 * useful if a user wants to use an IOMMU only for KVM device assignment to
Joerg Roedelac0101d2009-09-01 16:00:35 +020044 * guests and not for driver dma translation.
45 */
46int iommu_pass_through __read_mostly;
Fenghua Yuaed5d5f2009-04-30 17:57:11 -070047
Jan Beulicheb647132009-11-08 12:12:14 +010048/* Dummy device used for NULL arguments (normally ISA). */
Joerg Roedel6c505ce2008-08-19 16:32:45 +020049struct device x86_dma_fallback_dev = {
Kay Sievers1a927132008-10-30 02:17:49 +010050 .init_name = "fallback device",
Jan Beulicheb647132009-11-08 12:12:14 +010051 .coherent_dma_mask = ISA_DMA_BIT_MASK,
Joerg Roedel6c505ce2008-08-19 16:32:45 +020052 .dma_mask = &x86_dma_fallback_dev.coherent_dma_mask,
Glauber Costa098cb7f2008-04-09 13:18:10 -030053};
Joerg Roedel6c505ce2008-08-19 16:32:45 +020054EXPORT_SYMBOL(x86_dma_fallback_dev);
Glauber Costa098cb7f2008-04-09 13:18:10 -030055
Joerg Roedel2118d0c2009-01-09 15:13:15 +010056/* Number of entries preallocated for DMA-API debugging */
57#define PREALLOC_DMA_DEBUG_ENTRIES 32768
58
Glauber Costa459121c92008-04-08 13:20:43 -030059int dma_set_mask(struct device *dev, u64 mask)
60{
61 if (!dev->dma_mask || !dma_supported(dev, mask))
62 return -EIO;
63
64 *dev->dma_mask = mask;
65
66 return 0;
67}
68EXPORT_SYMBOL(dma_set_mask);
69
Yinghai Luc252a5b2010-02-10 01:20:19 -080070#if defined(CONFIG_X86_64) && !defined(CONFIG_NUMA)
Glauber Costa116890d2008-04-08 13:20:54 -030071static __initdata void *dma32_bootmem_ptr;
72static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
73
74static int __init parse_dma32_size_opt(char *p)
75{
76 if (!p)
77 return -EINVAL;
78 dma32_bootmem_size = memparse(p, &p);
79 return 0;
80}
81early_param("dma32_size", parse_dma32_size_opt);
82
83void __init dma32_reserve_bootmem(void)
84{
85 unsigned long size, align;
Yinghai Luc987d122008-06-24 22:14:09 -070086 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -030087 return;
88
Yinghai Lu7677b2e2008-04-14 20:40:37 -070089 /*
90 * check aperture_64.c allocate_aperture() for reason about
91 * using 512M as goal
92 */
Glauber Costa116890d2008-04-08 13:20:54 -030093 align = 64ULL<<20;
Joerg Roedel1ddb5512008-07-25 16:48:55 +020094 size = roundup(dma32_bootmem_size, align);
Glauber Costa116890d2008-04-08 13:20:54 -030095 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
Yinghai Lu7677b2e2008-04-14 20:40:37 -070096 512ULL<<20);
Catalin Marinasacde31d2009-08-27 14:29:20 +010097 /*
98 * Kmemleak should not scan this block as it may not be mapped via the
99 * kernel direct mapping.
100 */
101 kmemleak_ignore(dma32_bootmem_ptr);
Glauber Costa116890d2008-04-08 13:20:54 -0300102 if (dma32_bootmem_ptr)
103 dma32_bootmem_size = size;
104 else
105 dma32_bootmem_size = 0;
106}
107static void __init dma32_free_bootmem(void)
108{
Glauber Costa116890d2008-04-08 13:20:54 -0300109
Yinghai Luc987d122008-06-24 22:14:09 -0700110 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -0300111 return;
112
113 if (!dma32_bootmem_ptr)
114 return;
115
Yinghai Lu330fce22008-04-19 01:31:45 -0700116 free_bootmem(__pa(dma32_bootmem_ptr), dma32_bootmem_size);
Glauber Costa116890d2008-04-08 13:20:54 -0300117
118 dma32_bootmem_ptr = NULL;
119 dma32_bootmem_size = 0;
120}
Yinghai Luc252a5b2010-02-10 01:20:19 -0800121#else
122void __init dma32_reserve_bootmem(void)
123{
124}
125static void __init dma32_free_bootmem(void)
126{
127}
128
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800129#endif
Glauber Costa116890d2008-04-08 13:20:54 -0300130
131void __init pci_iommu_alloc(void)
132{
133 /* free the range so iommu could get some range less than 4G */
134 dma32_free_bootmem();
Yinghai Luc252a5b2010-02-10 01:20:19 -0800135
Konrad Rzeszutek Wilkfe96eb42010-03-18 13:53:24 -0400136 if (pci_xen_swiotlb_detect() || pci_swiotlb_detect())
FUJITA Tomonori186a2502009-12-15 20:47:56 +0900137 goto out;
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800138
Glauber Costa116890d2008-04-08 13:20:54 -0300139 gart_iommu_hole_init();
Glauber Costa116890d2008-04-08 13:20:54 -0300140
Glauber Costa116890d2008-04-08 13:20:54 -0300141 detect_calgary();
Glauber Costa116890d2008-04-08 13:20:54 -0300142
143 detect_intel_iommu();
144
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900145 /* needs to be called after gart_iommu_hole_init */
Joerg Roedela69ca342008-06-26 21:28:08 +0200146 amd_iommu_detect();
FUJITA Tomonori186a2502009-12-15 20:47:56 +0900147out:
Konrad Rzeszutek Wilkfe96eb42010-03-18 13:53:24 -0400148 pci_xen_swiotlb_init();
149
FUJITA Tomonori186a2502009-12-15 20:47:56 +0900150 pci_swiotlb_init();
Glauber Costa116890d2008-04-08 13:20:54 -0300151}
FUJITA Tomonori8978b742008-07-29 13:38:53 +0900152
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900153void *dma_generic_alloc_coherent(struct device *dev, size_t size,
154 dma_addr_t *dma_addr, gfp_t flag)
155{
156 unsigned long dma_mask;
157 struct page *page;
158 dma_addr_t addr;
159
160 dma_mask = dma_alloc_coherent_mask(dev, flag);
161
162 flag |= __GFP_ZERO;
163again:
164 page = alloc_pages_node(dev_to_node(dev), flag, get_order(size));
165 if (!page)
166 return NULL;
167
168 addr = page_to_phys(page);
FUJITA Tomonoria4c2baa2009-07-10 10:04:55 +0900169 if (addr + size > dma_mask) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900170 __free_pages(page, get_order(size));
171
Yang Hongyang284901a2009-04-06 19:01:15 -0700172 if (dma_mask < DMA_BIT_MASK(32) && !(flag & GFP_DMA)) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900173 flag = (flag & ~GFP_DMA32) | GFP_DMA;
174 goto again;
175 }
176
177 return NULL;
178 }
179
180 *dma_addr = addr;
181 return page_address(page);
182}
183
Glauber Costafae9a0d2008-04-08 13:20:56 -0300184/*
185 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
186 * documentation.
187 */
188static __init int iommu_setup(char *p)
189{
190 iommu_merge = 1;
191
192 if (!p)
193 return -EINVAL;
194
195 while (*p) {
196 if (!strncmp(p, "off", 3))
197 no_iommu = 1;
198 /* gart_parse_options has more force support */
199 if (!strncmp(p, "force", 5))
200 force_iommu = 1;
201 if (!strncmp(p, "noforce", 7)) {
202 iommu_merge = 0;
203 force_iommu = 0;
204 }
205
206 if (!strncmp(p, "biomerge", 8)) {
Glauber Costafae9a0d2008-04-08 13:20:56 -0300207 iommu_merge = 1;
208 force_iommu = 1;
209 }
210 if (!strncmp(p, "panic", 5))
211 panic_on_overflow = 1;
212 if (!strncmp(p, "nopanic", 7))
213 panic_on_overflow = 0;
214 if (!strncmp(p, "merge", 5)) {
215 iommu_merge = 1;
216 force_iommu = 1;
217 }
218 if (!strncmp(p, "nomerge", 7))
219 iommu_merge = 0;
220 if (!strncmp(p, "forcesac", 8))
221 iommu_sac_force = 1;
222 if (!strncmp(p, "allowdac", 8))
223 forbid_dac = 0;
224 if (!strncmp(p, "nodac", 5))
Tejun Heo2ae8bb72009-10-26 15:41:46 +0100225 forbid_dac = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300226 if (!strncmp(p, "usedac", 6)) {
227 forbid_dac = -1;
228 return 1;
229 }
230#ifdef CONFIG_SWIOTLB
231 if (!strncmp(p, "soft", 4))
232 swiotlb = 1;
David Woodhouse3238c0c2009-07-01 18:56:16 +0100233#endif
Alex Williamson80286872009-07-30 16:15:18 -0600234 if (!strncmp(p, "pt", 2))
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700235 iommu_pass_through = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300236
Glauber Costafae9a0d2008-04-08 13:20:56 -0300237 gart_parse_options(p);
Glauber Costafae9a0d2008-04-08 13:20:56 -0300238
239#ifdef CONFIG_CALGARY_IOMMU
240 if (!strncmp(p, "calgary", 7))
241 use_calgary = 1;
242#endif /* CONFIG_CALGARY_IOMMU */
243
244 p += strcspn(p, ",");
245 if (*p == ',')
246 ++p;
247 }
248 return 0;
249}
250early_param("iommu", iommu_setup);
251
Glauber Costa8e0c3792008-04-08 13:20:55 -0300252int dma_supported(struct device *dev, u64 mask)
253{
FUJITA Tomonori160c1d82009-01-05 23:59:02 +0900254 struct dma_map_ops *ops = get_dma_ops(dev);
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700255
Glauber Costa8e0c3792008-04-08 13:20:55 -0300256#ifdef CONFIG_PCI
257 if (mask > 0xffffffff && forbid_dac > 0) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200258 dev_info(dev, "PCI: Disallowing DAC for device\n");
Glauber Costa8e0c3792008-04-08 13:20:55 -0300259 return 0;
260 }
261#endif
262
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700263 if (ops->dma_supported)
264 return ops->dma_supported(dev, mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300265
266 /* Copied from i386. Doesn't make much sense, because it will
267 only work for pci_alloc_coherent.
268 The caller just has to use GFP_DMA in this case. */
Yang Hongyang2f4f27d2009-04-06 19:01:18 -0700269 if (mask < DMA_BIT_MASK(24))
Glauber Costa8e0c3792008-04-08 13:20:55 -0300270 return 0;
271
272 /* Tell the device to use SAC when IOMMU force is on. This
273 allows the driver to use cheaper accesses in some cases.
274
275 Problem with this is that if we overflow the IOMMU area and
276 return DAC as fallback address the device may not handle it
277 correctly.
278
279 As a special case some controllers have a 39bit address
280 mode that is as efficient as 32bit (aic79xx). Don't force
281 SAC for these. Assume all masks <= 40 bits are of this
282 type. Normally this doesn't make any difference, but gives
283 more gentle handling of IOMMU overflow. */
Yang Hongyang50cf1562009-04-06 19:01:14 -0700284 if (iommu_sac_force && (mask >= DMA_BIT_MASK(40))) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200285 dev_info(dev, "Force SAC with mask %Lx\n", mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300286 return 0;
287 }
288
289 return 1;
290}
291EXPORT_SYMBOL(dma_supported);
292
Glauber Costacb5867a2008-04-08 13:20:51 -0300293static int __init pci_iommu_init(void)
294{
Joerg Roedel2118d0c2009-01-09 15:13:15 +0100295 dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES);
296
Joerg Roedel86f31952009-03-16 17:50:28 +0100297#ifdef CONFIG_PCI
298 dma_debug_add_bus(&pci_bus_type);
299#endif
FUJITA Tomonorid07c1be2009-11-10 19:46:12 +0900300 x86_init.iommu.iommu_init();
301
Konrad Rzeszutek Wilkfe96eb42010-03-18 13:53:24 -0400302 if (swiotlb || xen_swiotlb) {
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900303 printk(KERN_INFO "PCI-DMA: "
304 "Using software bounce buffering for IO (SWIOTLB)\n");
305 swiotlb_print_info();
306 } else
307 swiotlb_free();
308
Glauber Costacb5867a2008-04-08 13:20:51 -0300309 return 0;
310}
Glauber Costacb5867a2008-04-08 13:20:51 -0300311/* Must execute after PCI subsystem */
David Woodhouse9a821b22009-10-12 12:59:29 +0100312rootfs_initcall(pci_iommu_init);
Fenghua Yu3b15e582008-10-23 16:51:00 -0700313
#ifdef CONFIG_PCI
/* Many VIA bridges seem to corrupt data for DAC. Disable it here */

/*
 * PCI fixup run for every VIA device: when the device is a PCI-to-PCI
 * bridge and forbid_dac is still 0, switch DAC off.  A nonzero
 * forbid_dac (either direction) is left alone.
 */
static __devinit void via_no_dac(struct pci_dev *dev)
{
	if (forbid_dac != 0)
		return;

	if ((dev->class >> 8) != PCI_CLASS_BRIDGE_PCI)
		return;

	dev_info(&dev->dev, "disabling DAC on VIA PCI bridge\n");
	forbid_dac = 1;
}
DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
#endif