blob: 1c4d769e21ea07053f81f75b7aed2b21ab1f397f [file] [log] [blame]
Glauber Costa459121c92008-04-08 13:20:43 -03001#include <linux/dma-mapping.h>
Joerg Roedel2118d0c2009-01-09 15:13:15 +01002#include <linux/dma-debug.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03003#include <linux/dmar.h>
Paul Gortmaker69c60c82011-05-26 12:22:53 -04004#include <linux/export.h>
Glauber Costa116890d2008-04-08 13:20:54 -03005#include <linux/bootmem.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +09006#include <linux/gfp.h>
Glauber Costabca5c092008-04-08 13:20:53 -03007#include <linux/pci.h>
Catalin Marinasacde31d2009-08-27 14:29:20 +01008#include <linux/kmemleak.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03009
Glauber Costa116890d2008-04-08 13:20:54 -030010#include <asm/proto.h>
11#include <asm/dma.h>
FUJITA Tomonori46a7fa22008-07-11 10:23:42 +090012#include <asm/iommu.h>
Joerg Roedel1d9b16d2008-11-27 18:39:15 +010013#include <asm/gart.h>
Glauber Costacb5867a2008-04-08 13:20:51 -030014#include <asm/calgary.h>
Ingo Molnarb4941a92009-11-10 14:37:58 +010015#include <asm/x86_init.h>
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -040016#include <asm/iommu_table.h>
Glauber Costa459121c92008-04-08 13:20:43 -030017
Fenghua Yu3b15e582008-10-23 16:51:00 -070018static int forbid_dac __read_mostly;
19
FUJITA Tomonoria3b28ee2009-11-14 20:46:36 +090020struct dma_map_ops *dma_ops = &nommu_dma_ops;
Glauber Costa85c246e2008-04-08 13:20:50 -030021EXPORT_SYMBOL(dma_ops);
22
Dmitri Vorobievb4cdc432008-04-28 03:15:58 +040023static int iommu_sac_force __read_mostly;
Glauber Costa8e0c3792008-04-08 13:20:55 -030024
Glauber Costaf9c258d2008-04-08 13:20:52 -030025#ifdef CONFIG_IOMMU_DEBUG
26int panic_on_overflow __read_mostly = 1;
27int force_iommu __read_mostly = 1;
28#else
29int panic_on_overflow __read_mostly = 0;
30int force_iommu __read_mostly = 0;
31#endif
32
Glauber Costafae9a0d2008-04-08 13:20:56 -030033int iommu_merge __read_mostly = 0;
34
35int no_iommu __read_mostly;
36/* Set this to 1 if there is a HW IOMMU in the system */
37int iommu_detected __read_mostly = 0;
38
Joerg Roedelac0101d2009-09-01 16:00:35 +020039/*
40 * This variable becomes 1 if iommu=pt is passed on the kernel command line.
Marin Mitove3be7852009-10-03 20:45:02 +030041 * If this variable is 1, IOMMU implementations do no DMA translation for
Joerg Roedelac0101d2009-09-01 16:00:35 +020042 * devices and allow every device to access to whole physical memory. This is
Justin P. Mattockfb637f32010-01-14 22:16:16 -080043 * useful if a user wants to use an IOMMU only for KVM device assignment to
Joerg Roedelac0101d2009-09-01 16:00:35 +020044 * guests and not for driver dma translation.
45 */
46int iommu_pass_through __read_mostly;
Fenghua Yuaed5d5f2009-04-30 17:57:11 -070047
Alex Williamsonbcb71ab2011-10-21 15:56:24 -040048/*
49 * Group multi-function PCI devices into a single device-group for the
50 * iommu_device_group interface. This tells the iommu driver to pretend
51 * it cannot distinguish between functions of a device, exposing only one
52 * group for the device. Useful for disallowing use of individual PCI
53 * functions from userspace drivers.
54 */
55int iommu_group_mf __read_mostly;
56
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -040057extern struct iommu_table_entry __iommu_table[], __iommu_table_end[];
58
Jan Beulicheb647132009-11-08 12:12:14 +010059/* Dummy device used for NULL arguments (normally ISA). */
Joerg Roedel6c505ce2008-08-19 16:32:45 +020060struct device x86_dma_fallback_dev = {
Kay Sievers1a927132008-10-30 02:17:49 +010061 .init_name = "fallback device",
Jan Beulicheb647132009-11-08 12:12:14 +010062 .coherent_dma_mask = ISA_DMA_BIT_MASK,
Joerg Roedel6c505ce2008-08-19 16:32:45 +020063 .dma_mask = &x86_dma_fallback_dev.coherent_dma_mask,
Glauber Costa098cb7f2008-04-09 13:18:10 -030064};
Joerg Roedel6c505ce2008-08-19 16:32:45 +020065EXPORT_SYMBOL(x86_dma_fallback_dev);
Glauber Costa098cb7f2008-04-09 13:18:10 -030066
Joerg Roedel2118d0c2009-01-09 15:13:15 +010067/* Number of entries preallocated for DMA-API debugging */
68#define PREALLOC_DMA_DEBUG_ENTRIES 32768
69
Glauber Costa459121c92008-04-08 13:20:43 -030070int dma_set_mask(struct device *dev, u64 mask)
71{
72 if (!dev->dma_mask || !dma_supported(dev, mask))
73 return -EIO;
74
75 *dev->dma_mask = mask;
76
77 return 0;
78}
79EXPORT_SYMBOL(dma_set_mask);
80
Glauber Costa116890d2008-04-08 13:20:54 -030081void __init pci_iommu_alloc(void)
82{
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -040083 struct iommu_table_entry *p;
84
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -040085 sort_iommu_table(__iommu_table, __iommu_table_end);
86 check_iommu_entries(__iommu_table, __iommu_table_end);
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -080087
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -040088 for (p = __iommu_table; p < __iommu_table_end; p++) {
89 if (p && p->detect && p->detect() > 0) {
90 p->flags |= IOMMU_DETECTED;
91 if (p->early_init)
92 p->early_init();
93 if (p->flags & IOMMU_FINISH_IF_DETECTED)
94 break;
95 }
96 }
Glauber Costa116890d2008-04-08 13:20:54 -030097}
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +090098void *dma_generic_alloc_coherent(struct device *dev, size_t size,
99 dma_addr_t *dma_addr, gfp_t flag)
100{
101 unsigned long dma_mask;
102 struct page *page;
103 dma_addr_t addr;
104
105 dma_mask = dma_alloc_coherent_mask(dev, flag);
106
107 flag |= __GFP_ZERO;
108again:
109 page = alloc_pages_node(dev_to_node(dev), flag, get_order(size));
110 if (!page)
111 return NULL;
112
113 addr = page_to_phys(page);
FUJITA Tomonoria4c2baa2009-07-10 10:04:55 +0900114 if (addr + size > dma_mask) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900115 __free_pages(page, get_order(size));
116
Yang Hongyang284901a2009-04-06 19:01:15 -0700117 if (dma_mask < DMA_BIT_MASK(32) && !(flag & GFP_DMA)) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900118 flag = (flag & ~GFP_DMA32) | GFP_DMA;
119 goto again;
120 }
121
122 return NULL;
123 }
124
125 *dma_addr = addr;
126 return page_address(page);
127}
128
Glauber Costafae9a0d2008-04-08 13:20:56 -0300129/*
Paul Bolle395cf962011-08-15 02:02:26 +0200130 * See <Documentation/x86/x86_64/boot-options.txt> for the iommu kernel
131 * parameter documentation.
Glauber Costafae9a0d2008-04-08 13:20:56 -0300132 */
133static __init int iommu_setup(char *p)
134{
135 iommu_merge = 1;
136
137 if (!p)
138 return -EINVAL;
139
140 while (*p) {
141 if (!strncmp(p, "off", 3))
142 no_iommu = 1;
143 /* gart_parse_options has more force support */
144 if (!strncmp(p, "force", 5))
145 force_iommu = 1;
146 if (!strncmp(p, "noforce", 7)) {
147 iommu_merge = 0;
148 force_iommu = 0;
149 }
150
151 if (!strncmp(p, "biomerge", 8)) {
Glauber Costafae9a0d2008-04-08 13:20:56 -0300152 iommu_merge = 1;
153 force_iommu = 1;
154 }
155 if (!strncmp(p, "panic", 5))
156 panic_on_overflow = 1;
157 if (!strncmp(p, "nopanic", 7))
158 panic_on_overflow = 0;
159 if (!strncmp(p, "merge", 5)) {
160 iommu_merge = 1;
161 force_iommu = 1;
162 }
163 if (!strncmp(p, "nomerge", 7))
164 iommu_merge = 0;
165 if (!strncmp(p, "forcesac", 8))
166 iommu_sac_force = 1;
167 if (!strncmp(p, "allowdac", 8))
168 forbid_dac = 0;
169 if (!strncmp(p, "nodac", 5))
Tejun Heo2ae8bb72009-10-26 15:41:46 +0100170 forbid_dac = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300171 if (!strncmp(p, "usedac", 6)) {
172 forbid_dac = -1;
173 return 1;
174 }
175#ifdef CONFIG_SWIOTLB
176 if (!strncmp(p, "soft", 4))
177 swiotlb = 1;
David Woodhouse3238c0c2009-07-01 18:56:16 +0100178#endif
Alex Williamson80286872009-07-30 16:15:18 -0600179 if (!strncmp(p, "pt", 2))
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700180 iommu_pass_through = 1;
Alex Williamsonbcb71ab2011-10-21 15:56:24 -0400181 if (!strncmp(p, "group_mf", 8))
182 iommu_group_mf = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300183
Glauber Costafae9a0d2008-04-08 13:20:56 -0300184 gart_parse_options(p);
Glauber Costafae9a0d2008-04-08 13:20:56 -0300185
186#ifdef CONFIG_CALGARY_IOMMU
187 if (!strncmp(p, "calgary", 7))
188 use_calgary = 1;
189#endif /* CONFIG_CALGARY_IOMMU */
190
191 p += strcspn(p, ",");
192 if (*p == ',')
193 ++p;
194 }
195 return 0;
196}
197early_param("iommu", iommu_setup);
198
Glauber Costa8e0c3792008-04-08 13:20:55 -0300199int dma_supported(struct device *dev, u64 mask)
200{
FUJITA Tomonori160c1d82009-01-05 23:59:02 +0900201 struct dma_map_ops *ops = get_dma_ops(dev);
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700202
Glauber Costa8e0c3792008-04-08 13:20:55 -0300203#ifdef CONFIG_PCI
204 if (mask > 0xffffffff && forbid_dac > 0) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200205 dev_info(dev, "PCI: Disallowing DAC for device\n");
Glauber Costa8e0c3792008-04-08 13:20:55 -0300206 return 0;
207 }
208#endif
209
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700210 if (ops->dma_supported)
211 return ops->dma_supported(dev, mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300212
213 /* Copied from i386. Doesn't make much sense, because it will
214 only work for pci_alloc_coherent.
215 The caller just has to use GFP_DMA in this case. */
Yang Hongyang2f4f27d2009-04-06 19:01:18 -0700216 if (mask < DMA_BIT_MASK(24))
Glauber Costa8e0c3792008-04-08 13:20:55 -0300217 return 0;
218
219 /* Tell the device to use SAC when IOMMU force is on. This
220 allows the driver to use cheaper accesses in some cases.
221
222 Problem with this is that if we overflow the IOMMU area and
223 return DAC as fallback address the device may not handle it
224 correctly.
225
226 As a special case some controllers have a 39bit address
227 mode that is as efficient as 32bit (aic79xx). Don't force
228 SAC for these. Assume all masks <= 40 bits are of this
229 type. Normally this doesn't make any difference, but gives
230 more gentle handling of IOMMU overflow. */
Yang Hongyang50cf1562009-04-06 19:01:14 -0700231 if (iommu_sac_force && (mask >= DMA_BIT_MASK(40))) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200232 dev_info(dev, "Force SAC with mask %Lx\n", mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300233 return 0;
234 }
235
236 return 1;
237}
238EXPORT_SYMBOL(dma_supported);
239
Glauber Costacb5867a2008-04-08 13:20:51 -0300240static int __init pci_iommu_init(void)
241{
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -0400242 struct iommu_table_entry *p;
Joerg Roedel2118d0c2009-01-09 15:13:15 +0100243 dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES);
244
Joerg Roedel86f31952009-03-16 17:50:28 +0100245#ifdef CONFIG_PCI
246 dma_debug_add_bus(&pci_bus_type);
247#endif
FUJITA Tomonorid07c1be2009-11-10 19:46:12 +0900248 x86_init.iommu.iommu_init();
249
Konrad Rzeszutek Wilkee1f2842010-08-26 13:58:05 -0400250 for (p = __iommu_table; p < __iommu_table_end; p++) {
251 if (p && (p->flags & IOMMU_DETECTED) && p->late_init)
252 p->late_init();
253 }
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900254
Glauber Costacb5867a2008-04-08 13:20:51 -0300255 return 0;
256}
Glauber Costacb5867a2008-04-08 13:20:51 -0300257/* Must execute after PCI subsystem */
David Woodhouse9a821b22009-10-12 12:59:29 +0100258rootfs_initcall(pci_iommu_init);
Fenghua Yu3b15e582008-10-23 16:51:00 -0700259
#ifdef CONFIG_PCI
/*
 * Many VIA bridges seem to corrupt data for DAC. Disable it here.
 *
 * The quirk only acts while forbid_dac is still 0, so a value already
 * set to something else is left untouched.
 */
static __devinit void via_no_dac(struct pci_dev *dev)
{
	if (forbid_dac != 0)
		return;

	/* Only PCI-to-PCI bridges are affected. */
	if ((dev->class >> 8) != PCI_CLASS_BRIDGE_PCI)
		return;

	dev_info(&dev->dev, "disabling DAC on VIA PCI bridge\n");
	forbid_dac = 1;
}
DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
#endif