blob: 75e14e21f61a728cb120590a475ff8e0f3e2c37d [file] [log] [blame]
Glauber Costa459121c92008-04-08 13:20:43 -03001#include <linux/dma-mapping.h>
Joerg Roedel2118d0c2009-01-09 15:13:15 +01002#include <linux/dma-debug.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03003#include <linux/dmar.h>
Glauber Costa116890d2008-04-08 13:20:54 -03004#include <linux/bootmem.h>
Glauber Costabca5c092008-04-08 13:20:53 -03005#include <linux/pci.h>
Catalin Marinasacde31d2009-08-27 14:29:20 +01006#include <linux/kmemleak.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03007
Glauber Costa116890d2008-04-08 13:20:54 -03008#include <asm/proto.h>
9#include <asm/dma.h>
FUJITA Tomonori46a7fa22008-07-11 10:23:42 +090010#include <asm/iommu.h>
Joerg Roedel1d9b16d2008-11-27 18:39:15 +010011#include <asm/gart.h>
Glauber Costacb5867a2008-04-08 13:20:51 -030012#include <asm/calgary.h>
Joerg Roedela69ca342008-06-26 21:28:08 +020013#include <asm/amd_iommu.h>
Ingo Molnarb4941a92009-11-10 14:37:58 +010014#include <asm/x86_init.h>
Glauber Costa459121c92008-04-08 13:20:43 -030015
/*
 * DAC policy flag.  dma_supported() refuses masks above 32 bits while this
 * is > 0.  "iommu=nodac" and the VIA bridge quirk set it to 1,
 * "iommu=allowdac" sets it to 0, and "iommu=usedac" sets it to -1, which
 * keeps the VIA quirk (it only acts when the value is 0) from changing it.
 */
static int forbid_dac __read_mostly;

/* DMA mapping operations in use; defaults to nommu_dma_ops. */
struct dma_map_ops *dma_ops = &nommu_dma_ops;
EXPORT_SYMBOL(dma_ops);

/*
 * Set by "iommu=forcesac".  When set, the fallback path of dma_supported()
 * rejects masks of 40 bits or more.
 */
static int iommu_sac_force __read_mostly;

/*
 * Both flags default to 1 with CONFIG_IOMMU_DEBUG and to 0 otherwise; the
 * "iommu=" option parser can change them.
 */
#ifdef CONFIG_IOMMU_DEBUG
int panic_on_overflow __read_mostly = 1;
int force_iommu __read_mostly = 1;
#else
int panic_on_overflow __read_mostly = 0;
int force_iommu __read_mostly = 0;
#endif

/* Set to 1 as soon as an "iommu=" option is parsed; cleared by nomerge/noforce. */
int iommu_merge __read_mostly = 0;

/* Set by "iommu=off". */
int no_iommu __read_mostly;
/* Set this to 1 if there is a HW IOMMU in the system */
int iommu_detected __read_mostly = 0;
36
/*
 * This variable becomes 1 if iommu=pt is passed on the kernel command line.
 * If this variable is 1, IOMMU implementations do no DMA translation for
 * devices and allow every device to access the whole physical memory. This is
 * useful if a user wants to use an IOMMU only for KVM device assignment to
 * guests and not for driver DMA translation.
 */
44int iommu_pass_through __read_mostly;
Fenghua Yuaed5d5f2009-04-30 17:57:11 -070045
/*
 * Dummy device used for NULL arguments (normally ISA).
 *
 * The coherent mask is ISA_DMA_BIT_MASK, and dma_mask points at that same
 * field, so both masks share a single value.
 */
struct device x86_dma_fallback_dev = {
	.init_name = "fallback device",
	.coherent_dma_mask = ISA_DMA_BIT_MASK,
	.dma_mask = &x86_dma_fallback_dev.coherent_dma_mask,
};
EXPORT_SYMBOL(x86_dma_fallback_dev);
Glauber Costa098cb7f2008-04-09 13:18:10 -030053
Joerg Roedel2118d0c2009-01-09 15:13:15 +010054/* Number of entries preallocated for DMA-API debugging */
55#define PREALLOC_DMA_DEBUG_ENTRIES 32768
56
Glauber Costa459121c92008-04-08 13:20:43 -030057int dma_set_mask(struct device *dev, u64 mask)
58{
59 if (!dev->dma_mask || !dma_supported(dev, mask))
60 return -EIO;
61
62 *dev->dma_mask = mask;
63
64 return 0;
65}
66EXPORT_SYMBOL(dma_set_mask);
67
Glauber Costa116890d2008-04-08 13:20:54 -030068#ifdef CONFIG_X86_64
69static __initdata void *dma32_bootmem_ptr;
70static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
71
72static int __init parse_dma32_size_opt(char *p)
73{
74 if (!p)
75 return -EINVAL;
76 dma32_bootmem_size = memparse(p, &p);
77 return 0;
78}
79early_param("dma32_size", parse_dma32_size_opt);
80
81void __init dma32_reserve_bootmem(void)
82{
83 unsigned long size, align;
Yinghai Luc987d122008-06-24 22:14:09 -070084 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -030085 return;
86
Yinghai Lu7677b2e2008-04-14 20:40:37 -070087 /*
88 * check aperture_64.c allocate_aperture() for reason about
89 * using 512M as goal
90 */
Glauber Costa116890d2008-04-08 13:20:54 -030091 align = 64ULL<<20;
Joerg Roedel1ddb5512008-07-25 16:48:55 +020092 size = roundup(dma32_bootmem_size, align);
Glauber Costa116890d2008-04-08 13:20:54 -030093 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
Yinghai Lu7677b2e2008-04-14 20:40:37 -070094 512ULL<<20);
Catalin Marinasacde31d2009-08-27 14:29:20 +010095 /*
96 * Kmemleak should not scan this block as it may not be mapped via the
97 * kernel direct mapping.
98 */
99 kmemleak_ignore(dma32_bootmem_ptr);
Glauber Costa116890d2008-04-08 13:20:54 -0300100 if (dma32_bootmem_ptr)
101 dma32_bootmem_size = size;
102 else
103 dma32_bootmem_size = 0;
104}
105static void __init dma32_free_bootmem(void)
106{
Glauber Costa116890d2008-04-08 13:20:54 -0300107
Yinghai Luc987d122008-06-24 22:14:09 -0700108 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -0300109 return;
110
111 if (!dma32_bootmem_ptr)
112 return;
113
Yinghai Lu330fce22008-04-19 01:31:45 -0700114 free_bootmem(__pa(dma32_bootmem_ptr), dma32_bootmem_size);
Glauber Costa116890d2008-04-08 13:20:54 -0300115
116 dma32_bootmem_ptr = NULL;
117 dma32_bootmem_size = 0;
118}
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800119#endif
Glauber Costa116890d2008-04-08 13:20:54 -0300120
121void __init pci_iommu_alloc(void)
122{
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800123#ifdef CONFIG_X86_64
Glauber Costa116890d2008-04-08 13:20:54 -0300124 /* free the range so iommu could get some range less than 4G */
125 dma32_free_bootmem();
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800126#endif
FUJITA Tomonori186a2502009-12-15 20:47:56 +0900127 if (pci_swiotlb_detect())
128 goto out;
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800129
Glauber Costa116890d2008-04-08 13:20:54 -0300130 gart_iommu_hole_init();
Glauber Costa116890d2008-04-08 13:20:54 -0300131
Glauber Costa116890d2008-04-08 13:20:54 -0300132 detect_calgary();
Glauber Costa116890d2008-04-08 13:20:54 -0300133
134 detect_intel_iommu();
135
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900136 /* needs to be called after gart_iommu_hole_init */
Joerg Roedela69ca342008-06-26 21:28:08 +0200137 amd_iommu_detect();
FUJITA Tomonori186a2502009-12-15 20:47:56 +0900138out:
139 pci_swiotlb_init();
Glauber Costa116890d2008-04-08 13:20:54 -0300140}
FUJITA Tomonori8978b742008-07-29 13:38:53 +0900141
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900142void *dma_generic_alloc_coherent(struct device *dev, size_t size,
143 dma_addr_t *dma_addr, gfp_t flag)
144{
145 unsigned long dma_mask;
146 struct page *page;
147 dma_addr_t addr;
148
149 dma_mask = dma_alloc_coherent_mask(dev, flag);
150
151 flag |= __GFP_ZERO;
152again:
153 page = alloc_pages_node(dev_to_node(dev), flag, get_order(size));
154 if (!page)
155 return NULL;
156
157 addr = page_to_phys(page);
FUJITA Tomonoria4c2baa2009-07-10 10:04:55 +0900158 if (addr + size > dma_mask) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900159 __free_pages(page, get_order(size));
160
Yang Hongyang284901a2009-04-06 19:01:15 -0700161 if (dma_mask < DMA_BIT_MASK(32) && !(flag & GFP_DMA)) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900162 flag = (flag & ~GFP_DMA32) | GFP_DMA;
163 goto again;
164 }
165
166 return NULL;
167 }
168
169 *dma_addr = addr;
170 return page_address(page);
171}
172
Glauber Costafae9a0d2008-04-08 13:20:56 -0300173/*
174 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
175 * documentation.
176 */
177static __init int iommu_setup(char *p)
178{
179 iommu_merge = 1;
180
181 if (!p)
182 return -EINVAL;
183
184 while (*p) {
185 if (!strncmp(p, "off", 3))
186 no_iommu = 1;
187 /* gart_parse_options has more force support */
188 if (!strncmp(p, "force", 5))
189 force_iommu = 1;
190 if (!strncmp(p, "noforce", 7)) {
191 iommu_merge = 0;
192 force_iommu = 0;
193 }
194
195 if (!strncmp(p, "biomerge", 8)) {
Glauber Costafae9a0d2008-04-08 13:20:56 -0300196 iommu_merge = 1;
197 force_iommu = 1;
198 }
199 if (!strncmp(p, "panic", 5))
200 panic_on_overflow = 1;
201 if (!strncmp(p, "nopanic", 7))
202 panic_on_overflow = 0;
203 if (!strncmp(p, "merge", 5)) {
204 iommu_merge = 1;
205 force_iommu = 1;
206 }
207 if (!strncmp(p, "nomerge", 7))
208 iommu_merge = 0;
209 if (!strncmp(p, "forcesac", 8))
210 iommu_sac_force = 1;
211 if (!strncmp(p, "allowdac", 8))
212 forbid_dac = 0;
213 if (!strncmp(p, "nodac", 5))
Tejun Heo2ae8bb72009-10-26 15:41:46 +0100214 forbid_dac = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300215 if (!strncmp(p, "usedac", 6)) {
216 forbid_dac = -1;
217 return 1;
218 }
219#ifdef CONFIG_SWIOTLB
220 if (!strncmp(p, "soft", 4))
221 swiotlb = 1;
David Woodhouse3238c0c2009-07-01 18:56:16 +0100222#endif
Alex Williamson80286872009-07-30 16:15:18 -0600223 if (!strncmp(p, "pt", 2))
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700224 iommu_pass_through = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300225
Glauber Costafae9a0d2008-04-08 13:20:56 -0300226 gart_parse_options(p);
Glauber Costafae9a0d2008-04-08 13:20:56 -0300227
228#ifdef CONFIG_CALGARY_IOMMU
229 if (!strncmp(p, "calgary", 7))
230 use_calgary = 1;
231#endif /* CONFIG_CALGARY_IOMMU */
232
233 p += strcspn(p, ",");
234 if (*p == ',')
235 ++p;
236 }
237 return 0;
238}
239early_param("iommu", iommu_setup);
240
Glauber Costa8e0c3792008-04-08 13:20:55 -0300241int dma_supported(struct device *dev, u64 mask)
242{
FUJITA Tomonori160c1d82009-01-05 23:59:02 +0900243 struct dma_map_ops *ops = get_dma_ops(dev);
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700244
Glauber Costa8e0c3792008-04-08 13:20:55 -0300245#ifdef CONFIG_PCI
246 if (mask > 0xffffffff && forbid_dac > 0) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200247 dev_info(dev, "PCI: Disallowing DAC for device\n");
Glauber Costa8e0c3792008-04-08 13:20:55 -0300248 return 0;
249 }
250#endif
251
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700252 if (ops->dma_supported)
253 return ops->dma_supported(dev, mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300254
255 /* Copied from i386. Doesn't make much sense, because it will
256 only work for pci_alloc_coherent.
257 The caller just has to use GFP_DMA in this case. */
Yang Hongyang2f4f27d2009-04-06 19:01:18 -0700258 if (mask < DMA_BIT_MASK(24))
Glauber Costa8e0c3792008-04-08 13:20:55 -0300259 return 0;
260
261 /* Tell the device to use SAC when IOMMU force is on. This
262 allows the driver to use cheaper accesses in some cases.
263
264 Problem with this is that if we overflow the IOMMU area and
265 return DAC as fallback address the device may not handle it
266 correctly.
267
268 As a special case some controllers have a 39bit address
269 mode that is as efficient as 32bit (aic79xx). Don't force
270 SAC for these. Assume all masks <= 40 bits are of this
271 type. Normally this doesn't make any difference, but gives
272 more gentle handling of IOMMU overflow. */
Yang Hongyang50cf1562009-04-06 19:01:14 -0700273 if (iommu_sac_force && (mask >= DMA_BIT_MASK(40))) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200274 dev_info(dev, "Force SAC with mask %Lx\n", mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300275 return 0;
276 }
277
278 return 1;
279}
280EXPORT_SYMBOL(dma_supported);
281
Glauber Costacb5867a2008-04-08 13:20:51 -0300282static int __init pci_iommu_init(void)
283{
Joerg Roedel2118d0c2009-01-09 15:13:15 +0100284 dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES);
285
Joerg Roedel86f31952009-03-16 17:50:28 +0100286#ifdef CONFIG_PCI
287 dma_debug_add_bus(&pci_bus_type);
288#endif
FUJITA Tomonorid07c1be2009-11-10 19:46:12 +0900289 x86_init.iommu.iommu_init();
290
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900291 if (swiotlb) {
292 printk(KERN_INFO "PCI-DMA: "
293 "Using software bounce buffering for IO (SWIOTLB)\n");
294 swiotlb_print_info();
295 } else
296 swiotlb_free();
297
Glauber Costacb5867a2008-04-08 13:20:51 -0300298 return 0;
299}
Glauber Costacb5867a2008-04-08 13:20:51 -0300300/* Must execute after PCI subsystem */
David Woodhouse9a821b22009-10-12 12:59:29 +0100301rootfs_initcall(pci_iommu_init);
Fenghua Yu3b15e582008-10-23 16:51:00 -0700302
303#ifdef CONFIG_PCI
304/* Many VIA bridges seem to corrupt data for DAC. Disable it here */
305
306static __devinit void via_no_dac(struct pci_dev *dev)
307{
308 if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI && forbid_dac == 0) {
Bjorn Helgaas13bf7572009-02-24 10:38:22 -0700309 dev_info(&dev->dev, "disabling DAC on VIA PCI bridge\n");
Fenghua Yu3b15e582008-10-23 16:51:00 -0700310 forbid_dac = 1;
311 }
312}
313DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
314#endif