blob: 63eebee80e754e7383319b8dc4a3d9ec37ec5e80 [file] [log] [blame]
Glauber Costa459121c92008-04-08 13:20:43 -03001#include <linux/dma-mapping.h>
Joerg Roedel2118d0c2009-01-09 15:13:15 +01002#include <linux/dma-debug.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03003#include <linux/dmar.h>
Glauber Costa116890d2008-04-08 13:20:54 -03004#include <linux/bootmem.h>
Glauber Costabca5c092008-04-08 13:20:53 -03005#include <linux/pci.h>
Catalin Marinasacde31d2009-08-27 14:29:20 +01006#include <linux/kmemleak.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03007
Glauber Costa116890d2008-04-08 13:20:54 -03008#include <asm/proto.h>
9#include <asm/dma.h>
FUJITA Tomonori46a7fa22008-07-11 10:23:42 +090010#include <asm/iommu.h>
Joerg Roedel1d9b16d2008-11-27 18:39:15 +010011#include <asm/gart.h>
Glauber Costacb5867a2008-04-08 13:20:51 -030012#include <asm/calgary.h>
Joerg Roedela69ca342008-06-26 21:28:08 +020013#include <asm/amd_iommu.h>
Glauber Costa459121c92008-04-08 13:20:43 -030014
Fenghua Yu3b15e582008-10-23 16:51:00 -070015static int forbid_dac __read_mostly;
16
FUJITA Tomonori160c1d82009-01-05 23:59:02 +090017struct dma_map_ops *dma_ops;
Glauber Costa85c246e2008-04-08 13:20:50 -030018EXPORT_SYMBOL(dma_ops);
19
Dmitri Vorobievb4cdc432008-04-28 03:15:58 +040020static int iommu_sac_force __read_mostly;
Glauber Costa8e0c3792008-04-08 13:20:55 -030021
Glauber Costaf9c258d2008-04-08 13:20:52 -030022#ifdef CONFIG_IOMMU_DEBUG
23int panic_on_overflow __read_mostly = 1;
24int force_iommu __read_mostly = 1;
25#else
26int panic_on_overflow __read_mostly = 0;
27int force_iommu __read_mostly = 0;
28#endif
29
Glauber Costafae9a0d2008-04-08 13:20:56 -030030int iommu_merge __read_mostly = 0;
31
32int no_iommu __read_mostly;
33/* Set this to 1 if there is a HW IOMMU in the system */
34int iommu_detected __read_mostly = 0;
35
Joerg Roedelac0101d2009-09-01 16:00:35 +020036/*
37 * This variable becomes 1 if iommu=pt is passed on the kernel command line.
Marin Mitove3be7852009-10-03 20:45:02 +030038 * If this variable is 1, IOMMU implementations do no DMA translation for
Joerg Roedelac0101d2009-09-01 16:00:35 +020039 * devices and allow every device to access to whole physical memory. This is
40 * useful if a user want to use an IOMMU only for KVM device assignment to
41 * guests and not for driver dma translation.
42 */
43int iommu_pass_through __read_mostly;
Fenghua Yuaed5d5f2009-04-30 17:57:11 -070044
Glauber Costacac67872008-04-08 13:21:00 -030045dma_addr_t bad_dma_address __read_mostly = 0;
46EXPORT_SYMBOL(bad_dma_address);
Glauber Costafae9a0d2008-04-08 13:20:56 -030047
Glauber Costa098cb7f2008-04-09 13:18:10 -030048/* Dummy device used for NULL arguments (normally ISA). Better would
49 be probably a smaller DMA mask, but this is bug-to-bug compatible
50 to older i386. */
Joerg Roedel6c505ce2008-08-19 16:32:45 +020051struct device x86_dma_fallback_dev = {
Kay Sievers1a927132008-10-30 02:17:49 +010052 .init_name = "fallback device",
Yang Hongyang284901a2009-04-06 19:01:15 -070053 .coherent_dma_mask = DMA_BIT_MASK(32),
Joerg Roedel6c505ce2008-08-19 16:32:45 +020054 .dma_mask = &x86_dma_fallback_dev.coherent_dma_mask,
Glauber Costa098cb7f2008-04-09 13:18:10 -030055};
Joerg Roedel6c505ce2008-08-19 16:32:45 +020056EXPORT_SYMBOL(x86_dma_fallback_dev);
Glauber Costa098cb7f2008-04-09 13:18:10 -030057
/* How many DMA-API debugging entries to preallocate (32768) */
#define PREALLOC_DMA_DEBUG_ENTRIES (1 << 15)
60
Glauber Costa459121c92008-04-08 13:20:43 -030061int dma_set_mask(struct device *dev, u64 mask)
62{
63 if (!dev->dma_mask || !dma_supported(dev, mask))
64 return -EIO;
65
66 *dev->dma_mask = mask;
67
68 return 0;
69}
70EXPORT_SYMBOL(dma_set_mask);
71
Glauber Costa116890d2008-04-08 13:20:54 -030072#ifdef CONFIG_X86_64
73static __initdata void *dma32_bootmem_ptr;
74static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
75
76static int __init parse_dma32_size_opt(char *p)
77{
78 if (!p)
79 return -EINVAL;
80 dma32_bootmem_size = memparse(p, &p);
81 return 0;
82}
83early_param("dma32_size", parse_dma32_size_opt);
84
85void __init dma32_reserve_bootmem(void)
86{
87 unsigned long size, align;
Yinghai Luc987d122008-06-24 22:14:09 -070088 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -030089 return;
90
Yinghai Lu7677b2e2008-04-14 20:40:37 -070091 /*
92 * check aperture_64.c allocate_aperture() for reason about
93 * using 512M as goal
94 */
Glauber Costa116890d2008-04-08 13:20:54 -030095 align = 64ULL<<20;
Joerg Roedel1ddb5512008-07-25 16:48:55 +020096 size = roundup(dma32_bootmem_size, align);
Glauber Costa116890d2008-04-08 13:20:54 -030097 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
Yinghai Lu7677b2e2008-04-14 20:40:37 -070098 512ULL<<20);
Catalin Marinasacde31d2009-08-27 14:29:20 +010099 /*
100 * Kmemleak should not scan this block as it may not be mapped via the
101 * kernel direct mapping.
102 */
103 kmemleak_ignore(dma32_bootmem_ptr);
Glauber Costa116890d2008-04-08 13:20:54 -0300104 if (dma32_bootmem_ptr)
105 dma32_bootmem_size = size;
106 else
107 dma32_bootmem_size = 0;
108}
109static void __init dma32_free_bootmem(void)
110{
Glauber Costa116890d2008-04-08 13:20:54 -0300111
Yinghai Luc987d122008-06-24 22:14:09 -0700112 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -0300113 return;
114
115 if (!dma32_bootmem_ptr)
116 return;
117
Yinghai Lu330fce22008-04-19 01:31:45 -0700118 free_bootmem(__pa(dma32_bootmem_ptr), dma32_bootmem_size);
Glauber Costa116890d2008-04-08 13:20:54 -0300119
120 dma32_bootmem_ptr = NULL;
121 dma32_bootmem_size = 0;
122}
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800123#endif
Glauber Costa116890d2008-04-08 13:20:54 -0300124
125void __init pci_iommu_alloc(void)
126{
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900127 /* swiotlb is forced by the boot option */
128 int use_swiotlb = swiotlb;
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800129#ifdef CONFIG_X86_64
Glauber Costa116890d2008-04-08 13:20:54 -0300130 /* free the range so iommu could get some range less than 4G */
131 dma32_free_bootmem();
FUJITA Tomonori72d03802009-11-10 21:35:17 +0900132#else
133 dma_ops = &nommu_dma_ops;
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800134#endif
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900135 pci_swiotlb_init();
136 if (use_swiotlb)
137 return;
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800138
Glauber Costa116890d2008-04-08 13:20:54 -0300139 gart_iommu_hole_init();
Glauber Costa116890d2008-04-08 13:20:54 -0300140
Glauber Costa116890d2008-04-08 13:20:54 -0300141 detect_calgary();
Glauber Costa116890d2008-04-08 13:20:54 -0300142
143 detect_intel_iommu();
144
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900145 /* needs to be called after gart_iommu_hole_init */
Joerg Roedela69ca342008-06-26 21:28:08 +0200146 amd_iommu_detect();
Glauber Costa116890d2008-04-08 13:20:54 -0300147}
FUJITA Tomonori8978b742008-07-29 13:38:53 +0900148
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900149void *dma_generic_alloc_coherent(struct device *dev, size_t size,
150 dma_addr_t *dma_addr, gfp_t flag)
151{
152 unsigned long dma_mask;
153 struct page *page;
154 dma_addr_t addr;
155
156 dma_mask = dma_alloc_coherent_mask(dev, flag);
157
158 flag |= __GFP_ZERO;
159again:
160 page = alloc_pages_node(dev_to_node(dev), flag, get_order(size));
161 if (!page)
162 return NULL;
163
164 addr = page_to_phys(page);
FUJITA Tomonoria4c2baa2009-07-10 10:04:55 +0900165 if (addr + size > dma_mask) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900166 __free_pages(page, get_order(size));
167
Yang Hongyang284901a2009-04-06 19:01:15 -0700168 if (dma_mask < DMA_BIT_MASK(32) && !(flag & GFP_DMA)) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900169 flag = (flag & ~GFP_DMA32) | GFP_DMA;
170 goto again;
171 }
172
173 return NULL;
174 }
175
176 *dma_addr = addr;
177 return page_address(page);
178}
179
Glauber Costafae9a0d2008-04-08 13:20:56 -0300180/*
181 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
182 * documentation.
183 */
184static __init int iommu_setup(char *p)
185{
186 iommu_merge = 1;
187
188 if (!p)
189 return -EINVAL;
190
191 while (*p) {
192 if (!strncmp(p, "off", 3))
193 no_iommu = 1;
194 /* gart_parse_options has more force support */
195 if (!strncmp(p, "force", 5))
196 force_iommu = 1;
197 if (!strncmp(p, "noforce", 7)) {
198 iommu_merge = 0;
199 force_iommu = 0;
200 }
201
202 if (!strncmp(p, "biomerge", 8)) {
Glauber Costafae9a0d2008-04-08 13:20:56 -0300203 iommu_merge = 1;
204 force_iommu = 1;
205 }
206 if (!strncmp(p, "panic", 5))
207 panic_on_overflow = 1;
208 if (!strncmp(p, "nopanic", 7))
209 panic_on_overflow = 0;
210 if (!strncmp(p, "merge", 5)) {
211 iommu_merge = 1;
212 force_iommu = 1;
213 }
214 if (!strncmp(p, "nomerge", 7))
215 iommu_merge = 0;
216 if (!strncmp(p, "forcesac", 8))
217 iommu_sac_force = 1;
218 if (!strncmp(p, "allowdac", 8))
219 forbid_dac = 0;
220 if (!strncmp(p, "nodac", 5))
Tejun Heo2ae8bb72009-10-26 15:41:46 +0100221 forbid_dac = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300222 if (!strncmp(p, "usedac", 6)) {
223 forbid_dac = -1;
224 return 1;
225 }
226#ifdef CONFIG_SWIOTLB
227 if (!strncmp(p, "soft", 4))
228 swiotlb = 1;
David Woodhouse3238c0c2009-07-01 18:56:16 +0100229#endif
Alex Williamson80286872009-07-30 16:15:18 -0600230 if (!strncmp(p, "pt", 2))
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700231 iommu_pass_through = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300232
Glauber Costafae9a0d2008-04-08 13:20:56 -0300233 gart_parse_options(p);
Glauber Costafae9a0d2008-04-08 13:20:56 -0300234
235#ifdef CONFIG_CALGARY_IOMMU
236 if (!strncmp(p, "calgary", 7))
237 use_calgary = 1;
238#endif /* CONFIG_CALGARY_IOMMU */
239
240 p += strcspn(p, ",");
241 if (*p == ',')
242 ++p;
243 }
244 return 0;
245}
246early_param("iommu", iommu_setup);
247
Glauber Costa8e0c3792008-04-08 13:20:55 -0300248int dma_supported(struct device *dev, u64 mask)
249{
FUJITA Tomonori160c1d82009-01-05 23:59:02 +0900250 struct dma_map_ops *ops = get_dma_ops(dev);
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700251
Glauber Costa8e0c3792008-04-08 13:20:55 -0300252#ifdef CONFIG_PCI
253 if (mask > 0xffffffff && forbid_dac > 0) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200254 dev_info(dev, "PCI: Disallowing DAC for device\n");
Glauber Costa8e0c3792008-04-08 13:20:55 -0300255 return 0;
256 }
257#endif
258
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700259 if (ops->dma_supported)
260 return ops->dma_supported(dev, mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300261
262 /* Copied from i386. Doesn't make much sense, because it will
263 only work for pci_alloc_coherent.
264 The caller just has to use GFP_DMA in this case. */
Yang Hongyang2f4f27d2009-04-06 19:01:18 -0700265 if (mask < DMA_BIT_MASK(24))
Glauber Costa8e0c3792008-04-08 13:20:55 -0300266 return 0;
267
268 /* Tell the device to use SAC when IOMMU force is on. This
269 allows the driver to use cheaper accesses in some cases.
270
271 Problem with this is that if we overflow the IOMMU area and
272 return DAC as fallback address the device may not handle it
273 correctly.
274
275 As a special case some controllers have a 39bit address
276 mode that is as efficient as 32bit (aic79xx). Don't force
277 SAC for these. Assume all masks <= 40 bits are of this
278 type. Normally this doesn't make any difference, but gives
279 more gentle handling of IOMMU overflow. */
Yang Hongyang50cf1562009-04-06 19:01:14 -0700280 if (iommu_sac_force && (mask >= DMA_BIT_MASK(40))) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200281 dev_info(dev, "Force SAC with mask %Lx\n", mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300282 return 0;
283 }
284
285 return 1;
286}
287EXPORT_SYMBOL(dma_supported);
288
Glauber Costacb5867a2008-04-08 13:20:51 -0300289static int __init pci_iommu_init(void)
290{
Joerg Roedel2118d0c2009-01-09 15:13:15 +0100291 dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES);
292
Joerg Roedel86f31952009-03-16 17:50:28 +0100293#ifdef CONFIG_PCI
294 dma_debug_add_bus(&pci_bus_type);
295#endif
FUJITA Tomonorid07c1be2009-11-10 19:46:12 +0900296 x86_init.iommu.iommu_init();
297
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900298 if (swiotlb) {
299 printk(KERN_INFO "PCI-DMA: "
300 "Using software bounce buffering for IO (SWIOTLB)\n");
301 swiotlb_print_info();
302 } else
303 swiotlb_free();
304
Glauber Costacb5867a2008-04-08 13:20:51 -0300305 return 0;
306}
Glauber Costacb5867a2008-04-08 13:20:51 -0300307/* Must execute after PCI subsystem */
David Woodhouse9a821b22009-10-12 12:59:29 +0100308rootfs_initcall(pci_iommu_init);
Fenghua Yu3b15e582008-10-23 16:51:00 -0700309
310#ifdef CONFIG_PCI
311/* Many VIA bridges seem to corrupt data for DAC. Disable it here */
312
313static __devinit void via_no_dac(struct pci_dev *dev)
314{
315 if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI && forbid_dac == 0) {
Bjorn Helgaas13bf7572009-02-24 10:38:22 -0700316 dev_info(&dev->dev, "disabling DAC on VIA PCI bridge\n");
Fenghua Yu3b15e582008-10-23 16:51:00 -0700317 forbid_dac = 1;
318 }
319}
320DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
321#endif