blob: 9ea999a4dcc178ce4e27dd069a957ff050d1dee7 [file] [log] [blame]
Glauber Costa459121c92008-04-08 13:20:43 -03001#include <linux/dma-mapping.h>
Joerg Roedel2118d0c2009-01-09 15:13:15 +01002#include <linux/dma-debug.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03003#include <linux/dmar.h>
Glauber Costa116890d2008-04-08 13:20:54 -03004#include <linux/bootmem.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +09005#include <linux/gfp.h>
Glauber Costabca5c092008-04-08 13:20:53 -03006#include <linux/pci.h>
Catalin Marinasacde31d2009-08-27 14:29:20 +01007#include <linux/kmemleak.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03008
Glauber Costa116890d2008-04-08 13:20:54 -03009#include <asm/proto.h>
10#include <asm/dma.h>
FUJITA Tomonori46a7fa22008-07-11 10:23:42 +090011#include <asm/iommu.h>
Joerg Roedel1d9b16d2008-11-27 18:39:15 +010012#include <asm/gart.h>
Glauber Costacb5867a2008-04-08 13:20:51 -030013#include <asm/calgary.h>
Ingo Molnarb4941a92009-11-10 14:37:58 +010014#include <asm/x86_init.h>
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -040015#include <asm/iommu_table.h>
Glauber Costa459121c92008-04-08 13:20:43 -030016
Fenghua Yu3b15e582008-10-23 16:51:00 -070017static int forbid_dac __read_mostly;
18
FUJITA Tomonoria3b28ee2009-11-14 20:46:36 +090019struct dma_map_ops *dma_ops = &nommu_dma_ops;
Glauber Costa85c246e2008-04-08 13:20:50 -030020EXPORT_SYMBOL(dma_ops);
21
Dmitri Vorobievb4cdc432008-04-28 03:15:58 +040022static int iommu_sac_force __read_mostly;
Glauber Costa8e0c3792008-04-08 13:20:55 -030023
Glauber Costaf9c258d2008-04-08 13:20:52 -030024#ifdef CONFIG_IOMMU_DEBUG
25int panic_on_overflow __read_mostly = 1;
26int force_iommu __read_mostly = 1;
27#else
28int panic_on_overflow __read_mostly = 0;
29int force_iommu __read_mostly = 0;
30#endif
31
Glauber Costafae9a0d2008-04-08 13:20:56 -030032int iommu_merge __read_mostly = 0;
33
34int no_iommu __read_mostly;
35/* Set this to 1 if there is a HW IOMMU in the system */
36int iommu_detected __read_mostly = 0;
37
Joerg Roedelac0101d2009-09-01 16:00:35 +020038/*
39 * This variable becomes 1 if iommu=pt is passed on the kernel command line.
Marin Mitove3be7852009-10-03 20:45:02 +030040 * If this variable is 1, IOMMU implementations do no DMA translation for
Joerg Roedelac0101d2009-09-01 16:00:35 +020041 * devices and allow every device to access to whole physical memory. This is
Justin P. Mattockfb637f32010-01-14 22:16:16 -080042 * useful if a user wants to use an IOMMU only for KVM device assignment to
Joerg Roedelac0101d2009-09-01 16:00:35 +020043 * guests and not for driver dma translation.
44 */
45int iommu_pass_through __read_mostly;
Fenghua Yuaed5d5f2009-04-30 17:57:11 -070046
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -040047extern struct iommu_table_entry __iommu_table[], __iommu_table_end[];
48
Jan Beulicheb647132009-11-08 12:12:14 +010049/* Dummy device used for NULL arguments (normally ISA). */
Joerg Roedel6c505ce2008-08-19 16:32:45 +020050struct device x86_dma_fallback_dev = {
Kay Sievers1a927132008-10-30 02:17:49 +010051 .init_name = "fallback device",
Jan Beulicheb647132009-11-08 12:12:14 +010052 .coherent_dma_mask = ISA_DMA_BIT_MASK,
Joerg Roedel6c505ce2008-08-19 16:32:45 +020053 .dma_mask = &x86_dma_fallback_dev.coherent_dma_mask,
Glauber Costa098cb7f2008-04-09 13:18:10 -030054};
Joerg Roedel6c505ce2008-08-19 16:32:45 +020055EXPORT_SYMBOL(x86_dma_fallback_dev);
Glauber Costa098cb7f2008-04-09 13:18:10 -030056
/* Entry count handed to dma_debug_init() for DMA-API debugging (32768). */
#define PREALLOC_DMA_DEBUG_ENTRIES (1 << 15)
59
Glauber Costa459121c92008-04-08 13:20:43 -030060int dma_set_mask(struct device *dev, u64 mask)
61{
62 if (!dev->dma_mask || !dma_supported(dev, mask))
63 return -EIO;
64
65 *dev->dma_mask = mask;
66
67 return 0;
68}
69EXPORT_SYMBOL(dma_set_mask);
70
Yinghai Luc252a5b2010-02-10 01:20:19 -080071#if defined(CONFIG_X86_64) && !defined(CONFIG_NUMA)
Glauber Costa116890d2008-04-08 13:20:54 -030072static __initdata void *dma32_bootmem_ptr;
73static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
74
75static int __init parse_dma32_size_opt(char *p)
76{
77 if (!p)
78 return -EINVAL;
79 dma32_bootmem_size = memparse(p, &p);
80 return 0;
81}
82early_param("dma32_size", parse_dma32_size_opt);
83
84void __init dma32_reserve_bootmem(void)
85{
86 unsigned long size, align;
Yinghai Luc987d122008-06-24 22:14:09 -070087 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -030088 return;
89
Yinghai Lu7677b2e2008-04-14 20:40:37 -070090 /*
91 * check aperture_64.c allocate_aperture() for reason about
92 * using 512M as goal
93 */
Glauber Costa116890d2008-04-08 13:20:54 -030094 align = 64ULL<<20;
Joerg Roedel1ddb5512008-07-25 16:48:55 +020095 size = roundup(dma32_bootmem_size, align);
Glauber Costa116890d2008-04-08 13:20:54 -030096 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
Yinghai Lu7677b2e2008-04-14 20:40:37 -070097 512ULL<<20);
Catalin Marinasacde31d2009-08-27 14:29:20 +010098 /*
99 * Kmemleak should not scan this block as it may not be mapped via the
100 * kernel direct mapping.
101 */
102 kmemleak_ignore(dma32_bootmem_ptr);
Glauber Costa116890d2008-04-08 13:20:54 -0300103 if (dma32_bootmem_ptr)
104 dma32_bootmem_size = size;
105 else
106 dma32_bootmem_size = 0;
107}
108static void __init dma32_free_bootmem(void)
109{
Glauber Costa116890d2008-04-08 13:20:54 -0300110
Yinghai Luc987d122008-06-24 22:14:09 -0700111 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -0300112 return;
113
114 if (!dma32_bootmem_ptr)
115 return;
116
Yinghai Lu330fce22008-04-19 01:31:45 -0700117 free_bootmem(__pa(dma32_bootmem_ptr), dma32_bootmem_size);
Glauber Costa116890d2008-04-08 13:20:54 -0300118
119 dma32_bootmem_ptr = NULL;
120 dma32_bootmem_size = 0;
121}
Yinghai Luc252a5b2010-02-10 01:20:19 -0800122#else
123void __init dma32_reserve_bootmem(void)
124{
125}
126static void __init dma32_free_bootmem(void)
127{
128}
129
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800130#endif
Glauber Costa116890d2008-04-08 13:20:54 -0300131
132void __init pci_iommu_alloc(void)
133{
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -0400134 struct iommu_table_entry *p;
135
Glauber Costa116890d2008-04-08 13:20:54 -0300136 /* free the range so iommu could get some range less than 4G */
137 dma32_free_bootmem();
Yinghai Luc252a5b2010-02-10 01:20:19 -0800138
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -0400139 sort_iommu_table(__iommu_table, __iommu_table_end);
140 check_iommu_entries(__iommu_table, __iommu_table_end);
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800141
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -0400142 for (p = __iommu_table; p < __iommu_table_end; p++) {
143 if (p && p->detect && p->detect() > 0) {
144 p->flags |= IOMMU_DETECTED;
145 if (p->early_init)
146 p->early_init();
147 if (p->flags & IOMMU_FINISH_IF_DETECTED)
148 break;
149 }
150 }
Glauber Costa116890d2008-04-08 13:20:54 -0300151}
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900152void *dma_generic_alloc_coherent(struct device *dev, size_t size,
153 dma_addr_t *dma_addr, gfp_t flag)
154{
155 unsigned long dma_mask;
156 struct page *page;
157 dma_addr_t addr;
158
159 dma_mask = dma_alloc_coherent_mask(dev, flag);
160
161 flag |= __GFP_ZERO;
162again:
163 page = alloc_pages_node(dev_to_node(dev), flag, get_order(size));
164 if (!page)
165 return NULL;
166
167 addr = page_to_phys(page);
FUJITA Tomonoria4c2baa2009-07-10 10:04:55 +0900168 if (addr + size > dma_mask) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900169 __free_pages(page, get_order(size));
170
Yang Hongyang284901a2009-04-06 19:01:15 -0700171 if (dma_mask < DMA_BIT_MASK(32) && !(flag & GFP_DMA)) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900172 flag = (flag & ~GFP_DMA32) | GFP_DMA;
173 goto again;
174 }
175
176 return NULL;
177 }
178
179 *dma_addr = addr;
180 return page_address(page);
181}
182
Glauber Costafae9a0d2008-04-08 13:20:56 -0300183/*
184 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
185 * documentation.
186 */
187static __init int iommu_setup(char *p)
188{
189 iommu_merge = 1;
190
191 if (!p)
192 return -EINVAL;
193
194 while (*p) {
195 if (!strncmp(p, "off", 3))
196 no_iommu = 1;
197 /* gart_parse_options has more force support */
198 if (!strncmp(p, "force", 5))
199 force_iommu = 1;
200 if (!strncmp(p, "noforce", 7)) {
201 iommu_merge = 0;
202 force_iommu = 0;
203 }
204
205 if (!strncmp(p, "biomerge", 8)) {
Glauber Costafae9a0d2008-04-08 13:20:56 -0300206 iommu_merge = 1;
207 force_iommu = 1;
208 }
209 if (!strncmp(p, "panic", 5))
210 panic_on_overflow = 1;
211 if (!strncmp(p, "nopanic", 7))
212 panic_on_overflow = 0;
213 if (!strncmp(p, "merge", 5)) {
214 iommu_merge = 1;
215 force_iommu = 1;
216 }
217 if (!strncmp(p, "nomerge", 7))
218 iommu_merge = 0;
219 if (!strncmp(p, "forcesac", 8))
220 iommu_sac_force = 1;
221 if (!strncmp(p, "allowdac", 8))
222 forbid_dac = 0;
223 if (!strncmp(p, "nodac", 5))
Tejun Heo2ae8bb72009-10-26 15:41:46 +0100224 forbid_dac = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300225 if (!strncmp(p, "usedac", 6)) {
226 forbid_dac = -1;
227 return 1;
228 }
229#ifdef CONFIG_SWIOTLB
230 if (!strncmp(p, "soft", 4))
231 swiotlb = 1;
David Woodhouse3238c0c2009-07-01 18:56:16 +0100232#endif
Alex Williamson80286872009-07-30 16:15:18 -0600233 if (!strncmp(p, "pt", 2))
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700234 iommu_pass_through = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300235
Glauber Costafae9a0d2008-04-08 13:20:56 -0300236 gart_parse_options(p);
Glauber Costafae9a0d2008-04-08 13:20:56 -0300237
238#ifdef CONFIG_CALGARY_IOMMU
239 if (!strncmp(p, "calgary", 7))
240 use_calgary = 1;
241#endif /* CONFIG_CALGARY_IOMMU */
242
243 p += strcspn(p, ",");
244 if (*p == ',')
245 ++p;
246 }
247 return 0;
248}
249early_param("iommu", iommu_setup);
250
Glauber Costa8e0c3792008-04-08 13:20:55 -0300251int dma_supported(struct device *dev, u64 mask)
252{
FUJITA Tomonori160c1d82009-01-05 23:59:02 +0900253 struct dma_map_ops *ops = get_dma_ops(dev);
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700254
Glauber Costa8e0c3792008-04-08 13:20:55 -0300255#ifdef CONFIG_PCI
256 if (mask > 0xffffffff && forbid_dac > 0) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200257 dev_info(dev, "PCI: Disallowing DAC for device\n");
Glauber Costa8e0c3792008-04-08 13:20:55 -0300258 return 0;
259 }
260#endif
261
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700262 if (ops->dma_supported)
263 return ops->dma_supported(dev, mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300264
265 /* Copied from i386. Doesn't make much sense, because it will
266 only work for pci_alloc_coherent.
267 The caller just has to use GFP_DMA in this case. */
Yang Hongyang2f4f27d2009-04-06 19:01:18 -0700268 if (mask < DMA_BIT_MASK(24))
Glauber Costa8e0c3792008-04-08 13:20:55 -0300269 return 0;
270
271 /* Tell the device to use SAC when IOMMU force is on. This
272 allows the driver to use cheaper accesses in some cases.
273
274 Problem with this is that if we overflow the IOMMU area and
275 return DAC as fallback address the device may not handle it
276 correctly.
277
278 As a special case some controllers have a 39bit address
279 mode that is as efficient as 32bit (aic79xx). Don't force
280 SAC for these. Assume all masks <= 40 bits are of this
281 type. Normally this doesn't make any difference, but gives
282 more gentle handling of IOMMU overflow. */
Yang Hongyang50cf1562009-04-06 19:01:14 -0700283 if (iommu_sac_force && (mask >= DMA_BIT_MASK(40))) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200284 dev_info(dev, "Force SAC with mask %Lx\n", mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300285 return 0;
286 }
287
288 return 1;
289}
290EXPORT_SYMBOL(dma_supported);
291
Glauber Costacb5867a2008-04-08 13:20:51 -0300292static int __init pci_iommu_init(void)
293{
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -0400294 struct iommu_table_entry *p;
Joerg Roedel2118d0c2009-01-09 15:13:15 +0100295 dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES);
296
Joerg Roedel86f31952009-03-16 17:50:28 +0100297#ifdef CONFIG_PCI
298 dma_debug_add_bus(&pci_bus_type);
299#endif
FUJITA Tomonorid07c1be2009-11-10 19:46:12 +0900300 x86_init.iommu.iommu_init();
301
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -0400302 for (p = __iommu_table; p < __iommu_table_end; p++) {
303 if (p && (p->flags & IOMMU_DETECTED) && p->late_init)
304 p->late_init();
305 }
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900306
Glauber Costacb5867a2008-04-08 13:20:51 -0300307 return 0;
308}
Glauber Costacb5867a2008-04-08 13:20:51 -0300309/* Must execute after PCI subsystem */
David Woodhouse9a821b22009-10-12 12:59:29 +0100310rootfs_initcall(pci_iommu_init);
Fenghua Yu3b15e582008-10-23 16:51:00 -0700311
312#ifdef CONFIG_PCI
313/* Many VIA bridges seem to corrupt data for DAC. Disable it here */
314
315static __devinit void via_no_dac(struct pci_dev *dev)
316{
317 if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI && forbid_dac == 0) {
Bjorn Helgaas13bf7572009-02-24 10:38:22 -0700318 dev_info(&dev->dev, "disabling DAC on VIA PCI bridge\n");
Fenghua Yu3b15e582008-10-23 16:51:00 -0700319 forbid_dac = 1;
320 }
321}
322DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
323#endif