blob: cd634795aa9cda898c4f129b46e94e7d1475c785 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/arch/alpha/kernel/pci_iommu.c
3 */
4
5#include <linux/kernel.h>
6#include <linux/mm.h>
7#include <linux/pci.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +09008#include <linux/gfp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -07009#include <linux/bootmem.h>
Paul Gortmaker00cd1172011-08-01 13:50:15 -040010#include <linux/export.h>
Jens Axboe944bda22007-10-23 12:31:05 +020011#include <linux/scatterlist.h>
Richard Henderson74fd1b62007-05-29 16:01:35 -070012#include <linux/log2.h>
FUJITA Tomonori7c536642008-02-04 22:27:58 -080013#include <linux/dma-mapping.h>
FUJITA Tomonorifd288412008-03-13 12:32:40 -070014#include <linux/iommu-helper.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070015
16#include <asm/io.h>
17#include <asm/hwrpb.h>
18
19#include "proto.h"
20#include "pci_impl.h"
21
22
23#define DEBUG_ALLOC 0
24#if DEBUG_ALLOC > 0
25# define DBGA(args...) printk(KERN_DEBUG args)
26#else
27# define DBGA(args...)
28#endif
29#if DEBUG_ALLOC > 1
30# define DBGA2(args...) printk(KERN_DEBUG args)
31#else
32# define DBGA2(args...)
33#endif
34
35#define DEBUG_NODIRECT 0
Linus Torvalds1da177e2005-04-16 15:20:36 -070036
37#define ISA_DMA_MASK 0x00ffffff
38
39static inline unsigned long
40mk_iommu_pte(unsigned long paddr)
41{
42 return (paddr >> (PAGE_SHIFT-1)) | 1;
43}
44
Linus Torvalds1da177e2005-04-16 15:20:36 -070045/* Return the minimum of MAX or the first power of two larger
46 than main memory. */
47
48unsigned long
49size_for_memory(unsigned long max)
50{
51 unsigned long mem = max_low_pfn << PAGE_SHIFT;
52 if (mem < max)
Richard Henderson74fd1b62007-05-29 16:01:35 -070053 max = roundup_pow_of_two(mem);
Linus Torvalds1da177e2005-04-16 15:20:36 -070054 return max;
55}
56
Al Viroed5f6562007-07-26 17:34:19 +010057struct pci_iommu_arena * __init
Linus Torvalds1da177e2005-04-16 15:20:36 -070058iommu_arena_new_node(int nid, struct pci_controller *hose, dma_addr_t base,
59 unsigned long window_size, unsigned long align)
60{
61 unsigned long mem_size;
62 struct pci_iommu_arena *arena;
63
64 mem_size = window_size / (PAGE_SIZE / sizeof(unsigned long));
65
66 /* Note that the TLB lookup logic uses bitwise concatenation,
67 not addition, so the required arena alignment is based on
68 the size of the window. Retain the align parameter so that
69 particular systems can over-align the arena. */
70 if (align < mem_size)
71 align = mem_size;
72
73
74#ifdef CONFIG_DISCONTIGMEM
75
Harvey Harrisonbbb8d342008-04-28 02:13:46 -070076 arena = alloc_bootmem_node(NODE_DATA(nid), sizeof(*arena));
77 if (!NODE_DATA(nid) || !arena) {
78 printk("%s: couldn't allocate arena from node %d\n"
79 " falling back to system-wide allocation\n",
80 __func__, nid);
81 arena = alloc_bootmem(sizeof(*arena));
82 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070083
Harvey Harrisonbbb8d342008-04-28 02:13:46 -070084 arena->ptes = __alloc_bootmem_node(NODE_DATA(nid), mem_size, align, 0);
85 if (!NODE_DATA(nid) || !arena->ptes) {
86 printk("%s: couldn't allocate arena ptes from node %d\n"
87 " falling back to system-wide allocation\n",
88 __func__, nid);
89 arena->ptes = __alloc_bootmem(mem_size, align, 0);
90 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070091
92#else /* CONFIG_DISCONTIGMEM */
93
94 arena = alloc_bootmem(sizeof(*arena));
95 arena->ptes = __alloc_bootmem(mem_size, align, 0);
96
97#endif /* CONFIG_DISCONTIGMEM */
98
99 spin_lock_init(&arena->lock);
100 arena->hose = hose;
101 arena->dma_base = base;
102 arena->size = window_size;
103 arena->next_entry = 0;
104
105 /* Align allocations to a multiple of a page size. Not needed
106 unless there are chip bugs. */
107 arena->align_entry = 1;
108
109 return arena;
110}
111
Al Viroed5f6562007-07-26 17:34:19 +0100112struct pci_iommu_arena * __init
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113iommu_arena_new(struct pci_controller *hose, dma_addr_t base,
114 unsigned long window_size, unsigned long align)
115{
116 return iommu_arena_new_node(0, hose, base, window_size, align);
117}
118
119/* Must be called with the arena lock held */
120static long
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800121iommu_arena_find_pages(struct device *dev, struct pci_iommu_arena *arena,
122 long n, long mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700123{
124 unsigned long *ptes;
125 long i, p, nent;
FUJITA Tomonori23d7e032008-03-04 14:28:57 -0800126 int pass = 0;
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800127 unsigned long base;
128 unsigned long boundary_size;
129
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800130 base = arena->dma_base >> PAGE_SHIFT;
Ivan Kokshayskyab875cf2008-03-09 16:31:17 +0300131 if (dev) {
132 boundary_size = dma_get_seg_boundary(dev) + 1;
Ivan Kokshayskyab875cf2008-03-09 16:31:17 +0300133 boundary_size >>= PAGE_SHIFT;
134 } else {
135 boundary_size = 1UL << (32 - PAGE_SHIFT);
136 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137
138 /* Search forward for the first mask-aligned sequence of N free ptes */
139 ptes = arena->ptes;
140 nent = arena->size >> PAGE_SHIFT;
FUJITA Tomonori3c5f1de2008-03-04 14:28:54 -0800141 p = ALIGN(arena->next_entry, mask + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142 i = 0;
FUJITA Tomonori23d7e032008-03-04 14:28:57 -0800143
144again:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145 while (i < n && p+i < nent) {
FUJITA Tomonorifd288412008-03-13 12:32:40 -0700146 if (!i && iommu_is_span_boundary(p, n, base, boundary_size)) {
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800147 p = ALIGN(p + 1, mask + 1);
148 goto again;
149 }
150
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151 if (ptes[p+i])
FUJITA Tomonori3c5f1de2008-03-04 14:28:54 -0800152 p = ALIGN(p + i + 1, mask + 1), i = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 else
154 i = i + 1;
155 }
156
157 if (i < n) {
FUJITA Tomonori23d7e032008-03-04 14:28:57 -0800158 if (pass < 1) {
159 /*
160 * Reached the end. Flush the TLB and restart
161 * the search from the beginning.
162 */
163 alpha_mv.mv_pci_tbi(arena->hose, 0, -1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164
FUJITA Tomonori23d7e032008-03-04 14:28:57 -0800165 pass++;
166 p = 0;
167 i = 0;
168 goto again;
169 } else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700170 return -1;
171 }
172
173 /* Success. It's the responsibility of the caller to mark them
174 in use before releasing the lock */
175 return p;
176}
177
178static long
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800179iommu_arena_alloc(struct device *dev, struct pci_iommu_arena *arena, long n,
180 unsigned int align)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181{
182 unsigned long flags;
183 unsigned long *ptes;
184 long i, p, mask;
185
186 spin_lock_irqsave(&arena->lock, flags);
187
188 /* Search for N empty ptes */
189 ptes = arena->ptes;
190 mask = max(align, arena->align_entry) - 1;
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800191 p = iommu_arena_find_pages(dev, arena, n, mask);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192 if (p < 0) {
193 spin_unlock_irqrestore(&arena->lock, flags);
194 return -1;
195 }
196
197 /* Success. Mark them all in use, ie not zero and invalid
198 for the iommu tlb that could load them from under us.
199 The chip specific bits will fill this in with something
200 kosher when we return. */
201 for (i = 0; i < n; ++i)
202 ptes[p+i] = IOMMU_INVALID_PTE;
203
204 arena->next_entry = p + n;
205 spin_unlock_irqrestore(&arena->lock, flags);
206
207 return p;
208}
209
210static void
211iommu_arena_free(struct pci_iommu_arena *arena, long ofs, long n)
212{
213 unsigned long *p;
214 long i;
215
216 p = arena->ptes + ofs;
217 for (i = 0; i < n; ++i)
218 p[i] = 0;
219}
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800220
221/*
222 * True if the machine supports DAC addressing, and DEV can
223 * make use of it given MASK.
224 */
225static int pci_dac_dma_supported(struct pci_dev *dev, u64 mask)
226{
FUJITA Tomonorif49d2eb2010-10-27 15:34:48 -0700227 dma_addr_t dac_offset = alpha_mv.pci_dac_offset;
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800228 int ok = 1;
229
230 /* If this is not set, the machine doesn't support DAC at all. */
231 if (dac_offset == 0)
232 ok = 0;
233
234 /* The device has to be able to address our DAC bit. */
235 if ((dac_offset & dev->dma_mask) != dac_offset)
236 ok = 0;
237
238 /* If both conditions above are met, we are fine. */
239 DBGA("pci_dac_dma_supported %s from %p\n",
240 ok ? "yes" : "no", __builtin_return_address(0));
241
242 return ok;
243}
Jan Beulichcaa51712007-07-09 11:55:51 -0700244
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245/* Map a single buffer of the indicated size for PCI DMA in streaming
246 mode. The 32-bit PCI bus mastering address to use is returned.
247 Once the device is given the dma address, the device owns this memory
248 until either pci_unmap_single or pci_dma_sync_single is performed. */
249
250static dma_addr_t
251pci_map_single_1(struct pci_dev *pdev, void *cpu_addr, size_t size,
252 int dac_allowed)
253{
254 struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose;
255 dma_addr_t max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
256 struct pci_iommu_arena *arena;
257 long npages, dma_ofs, i;
258 unsigned long paddr;
259 dma_addr_t ret;
260 unsigned int align = 0;
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800261 struct device *dev = pdev ? &pdev->dev : NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262
263 paddr = __pa(cpu_addr);
264
265#if !DEBUG_NODIRECT
266 /* First check to see if we can use the direct map window. */
267 if (paddr + size + __direct_map_base - 1 <= max_dma
268 && paddr + size <= __direct_map_size) {
269 ret = paddr + __direct_map_base;
270
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700271 DBGA2("pci_map_single: [%p,%zx] -> direct %llx from %p\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272 cpu_addr, size, ret, __builtin_return_address(0));
273
274 return ret;
275 }
276#endif
277
278 /* Next, use DAC if selected earlier. */
279 if (dac_allowed) {
280 ret = paddr + alpha_mv.pci_dac_offset;
281
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700282 DBGA2("pci_map_single: [%p,%zx] -> DAC %llx from %p\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283 cpu_addr, size, ret, __builtin_return_address(0));
284
285 return ret;
286 }
287
288 /* If the machine doesn't define a pci_tbi routine, we have to
289 assume it doesn't support sg mapping, and, since we tried to
290 use direct_map above, it now must be considered an error. */
291 if (! alpha_mv.mv_pci_tbi) {
Marcin Slusarz62173192009-09-21 17:04:01 -0700292 printk_once(KERN_WARNING "pci_map_single: no HW sg\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293 return 0;
294 }
295
296 arena = hose->sg_pci;
297 if (!arena || arena->dma_base + arena->size - 1 > max_dma)
298 arena = hose->sg_isa;
299
Joerg Roedeleb117d32008-10-15 22:02:13 -0700300 npages = iommu_num_pages(paddr, size, PAGE_SIZE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301
302 /* Force allocation to 64KB boundary for ISA bridges. */
303 if (pdev && pdev == isa_bridge)
304 align = 8;
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800305 dma_ofs = iommu_arena_alloc(dev, arena, npages, align);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306 if (dma_ofs < 0) {
307 printk(KERN_WARNING "pci_map_single failed: "
308 "could not allocate dma page tables\n");
309 return 0;
310 }
311
312 paddr &= PAGE_MASK;
313 for (i = 0; i < npages; ++i, paddr += PAGE_SIZE)
314 arena->ptes[i + dma_ofs] = mk_iommu_pte(paddr);
315
316 ret = arena->dma_base + dma_ofs * PAGE_SIZE;
317 ret += (unsigned long)cpu_addr & ~PAGE_MASK;
318
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700319 DBGA2("pci_map_single: [%p,%zx] np %ld -> sg %llx from %p\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320 cpu_addr, size, npages, ret, __builtin_return_address(0));
321
322 return ret;
323}
324
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800325/* Helper for generic DMA-mapping functions. */
326static struct pci_dev *alpha_gendev_to_pci(struct device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327{
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800328 if (dev && dev->bus == &pci_bus_type)
329 return to_pci_dev(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800331 /* Assume that non-PCI devices asking for DMA are either ISA or EISA,
332 BUG() otherwise. */
333 BUG_ON(!isa_bridge);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800335 /* Assume non-busmaster ISA DMA when dma_mask is not set (the ISA
336 bridge is bus master then). */
337 if (!dev || !dev->dma_mask || !*dev->dma_mask)
338 return isa_bridge;
339
340 /* For EISA bus masters, return isa_bridge (it might have smaller
341 dma_mask due to wiring limitations). */
342 if (*dev->dma_mask >= isa_bridge->dma_mask)
343 return isa_bridge;
344
345 /* This assumes ISA bus master with dma_mask 0xffffff. */
346 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700347}
348
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800349static dma_addr_t alpha_pci_map_page(struct device *dev, struct page *page,
350 unsigned long offset, size_t size,
351 enum dma_data_direction dir,
352 struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353{
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800354 struct pci_dev *pdev = alpha_gendev_to_pci(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355 int dac_allowed;
356
357 if (dir == PCI_DMA_NONE)
358 BUG();
359
360 dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;
361 return pci_map_single_1(pdev, (char *)page_address(page) + offset,
362 size, dac_allowed);
363}
364
365/* Unmap a single streaming mode DMA translation. The DMA_ADDR and
366 SIZE must match what was provided for in a previous pci_map_single
367 call. All other usages are undefined. After this call, reads by
368 the cpu to the buffer are guaranteed to see whatever the device
369 wrote there. */
370
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800371static void alpha_pci_unmap_page(struct device *dev, dma_addr_t dma_addr,
372 size_t size, enum dma_data_direction dir,
373 struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374{
375 unsigned long flags;
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800376 struct pci_dev *pdev = alpha_gendev_to_pci(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700377 struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose;
378 struct pci_iommu_arena *arena;
379 long dma_ofs, npages;
380
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800381 if (dir == PCI_DMA_NONE)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382 BUG();
383
384 if (dma_addr >= __direct_map_base
385 && dma_addr < __direct_map_base + __direct_map_size) {
386 /* Nothing to do. */
387
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700388 DBGA2("pci_unmap_single: direct [%llx,%zx] from %p\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700389 dma_addr, size, __builtin_return_address(0));
390
391 return;
392 }
393
394 if (dma_addr > 0xffffffff) {
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700395 DBGA2("pci64_unmap_single: DAC [%llx,%zx] from %p\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700396 dma_addr, size, __builtin_return_address(0));
397 return;
398 }
399
400 arena = hose->sg_pci;
401 if (!arena || dma_addr < arena->dma_base)
402 arena = hose->sg_isa;
403
404 dma_ofs = (dma_addr - arena->dma_base) >> PAGE_SHIFT;
405 if (dma_ofs * PAGE_SIZE >= arena->size) {
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700406 printk(KERN_ERR "Bogus pci_unmap_single: dma_addr %llx "
407 " base %llx size %x\n",
408 dma_addr, arena->dma_base, arena->size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700409 return;
410 BUG();
411 }
412
Joerg Roedeleb117d32008-10-15 22:02:13 -0700413 npages = iommu_num_pages(dma_addr, size, PAGE_SIZE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414
415 spin_lock_irqsave(&arena->lock, flags);
416
417 iommu_arena_free(arena, dma_ofs, npages);
418
419 /* If we're freeing ptes above the `next_entry' pointer (they
420 may have snuck back into the TLB since the last wrap flush),
421 we need to flush the TLB before reallocating the latter. */
422 if (dma_ofs >= arena->next_entry)
423 alpha_mv.mv_pci_tbi(hose, dma_addr, dma_addr + size - 1);
424
425 spin_unlock_irqrestore(&arena->lock, flags);
426
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700427 DBGA2("pci_unmap_single: sg [%llx,%zx] np %ld from %p\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700428 dma_addr, size, npages, __builtin_return_address(0));
429}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700430
431/* Allocate and map kernel buffer using consistent mode DMA for PCI
432 device. Returns non-NULL cpu-view pointer to the buffer if
433 successful and sets *DMA_ADDRP to the pci side dma address as well,
434 else DMA_ADDRP is undefined. */
435
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800436static void *alpha_pci_alloc_coherent(struct device *dev, size_t size,
Andrzej Pietrasiewicz4ce9a912011-12-22 13:58:21 +0100437 dma_addr_t *dma_addrp, gfp_t gfp,
438 struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700439{
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800440 struct pci_dev *pdev = alpha_gendev_to_pci(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700441 void *cpu_addr;
442 long order = get_order(size);
Ivan Kokshayskyc143d432008-04-02 13:04:43 -0700443
444 gfp &= ~GFP_DMA;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445
446try_again:
447 cpu_addr = (void *)__get_free_pages(gfp, order);
448 if (! cpu_addr) {
449 printk(KERN_INFO "pci_alloc_consistent: "
450 "get_free_pages failed from %p\n",
451 __builtin_return_address(0));
452 /* ??? Really atomic allocation? Otherwise we could play
453 with vmalloc and sg if we can't find contiguous memory. */
454 return NULL;
455 }
456 memset(cpu_addr, 0, size);
457
458 *dma_addrp = pci_map_single_1(pdev, cpu_addr, size, 0);
459 if (*dma_addrp == 0) {
460 free_pages((unsigned long)cpu_addr, order);
461 if (alpha_mv.mv_pci_tbi || (gfp & GFP_DMA))
462 return NULL;
463 /* The address doesn't fit required mask and we
464 do not have iommu. Try again with GFP_DMA. */
465 gfp |= GFP_DMA;
466 goto try_again;
467 }
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800468
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700469 DBGA2("pci_alloc_consistent: %zx -> [%p,%llx] from %p\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700470 size, cpu_addr, *dma_addrp, __builtin_return_address(0));
471
472 return cpu_addr;
473}
474
475/* Free and unmap a consistent DMA buffer. CPU_ADDR and DMA_ADDR must
476 be values that were returned from pci_alloc_consistent. SIZE must
477 be the same as what as passed into pci_alloc_consistent.
478 References to the memory and mappings associated with CPU_ADDR or
479 DMA_ADDR past this call are illegal. */
480
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800481static void alpha_pci_free_coherent(struct device *dev, size_t size,
Andrzej Pietrasiewicz4ce9a912011-12-22 13:58:21 +0100482 void *cpu_addr, dma_addr_t dma_addr,
483 struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700484{
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800485 struct pci_dev *pdev = alpha_gendev_to_pci(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700486 pci_unmap_single(pdev, dma_addr, size, PCI_DMA_BIDIRECTIONAL);
487 free_pages((unsigned long)cpu_addr, get_order(size));
488
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700489 DBGA2("pci_free_consistent: [%llx,%zx] from %p\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490 dma_addr, size, __builtin_return_address(0));
491}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700492
493/* Classify the elements of the scatterlist. Write dma_address
494 of each element with:
495 0 : Followers all physically adjacent.
496 1 : Followers all virtually adjacent.
497 -1 : Not leader, physically adjacent to previous.
498 -2 : Not leader, virtually adjacent to previous.
499 Write dma_length of each leader with the combined lengths of
500 the mergable followers. */
501
Jens Axboe58b053e2007-10-22 20:02:46 +0200502#define SG_ENT_VIRT_ADDRESS(SG) (sg_virt((SG)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700503#define SG_ENT_PHYS_ADDRESS(SG) __pa(SG_ENT_VIRT_ADDRESS(SG))
504
505static void
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800506sg_classify(struct device *dev, struct scatterlist *sg, struct scatterlist *end,
507 int virt_ok)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508{
509 unsigned long next_paddr;
510 struct scatterlist *leader;
511 long leader_flag, leader_length;
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800512 unsigned int max_seg_size;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700513
514 leader = sg;
515 leader_flag = 0;
516 leader_length = leader->length;
517 next_paddr = SG_ENT_PHYS_ADDRESS(leader) + leader_length;
518
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800519 /* we will not marge sg without device. */
520 max_seg_size = dev ? dma_get_max_seg_size(dev) : 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 for (++sg; sg < end; ++sg) {
522 unsigned long addr, len;
523 addr = SG_ENT_PHYS_ADDRESS(sg);
524 len = sg->length;
525
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800526 if (leader_length + len > max_seg_size)
527 goto new_segment;
528
Linus Torvalds1da177e2005-04-16 15:20:36 -0700529 if (next_paddr == addr) {
530 sg->dma_address = -1;
531 leader_length += len;
532 } else if (((next_paddr | addr) & ~PAGE_MASK) == 0 && virt_ok) {
533 sg->dma_address = -2;
534 leader_flag = 1;
535 leader_length += len;
536 } else {
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800537new_segment:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700538 leader->dma_address = leader_flag;
539 leader->dma_length = leader_length;
540 leader = sg;
541 leader_flag = 0;
542 leader_length = len;
543 }
544
545 next_paddr = addr + len;
546 }
547
548 leader->dma_address = leader_flag;
549 leader->dma_length = leader_length;
550}
551
552/* Given a scatterlist leader, choose an allocation method and fill
553 in the blanks. */
554
555static int
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800556sg_fill(struct device *dev, struct scatterlist *leader, struct scatterlist *end,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700557 struct scatterlist *out, struct pci_iommu_arena *arena,
558 dma_addr_t max_dma, int dac_allowed)
559{
560 unsigned long paddr = SG_ENT_PHYS_ADDRESS(leader);
561 long size = leader->dma_length;
562 struct scatterlist *sg;
563 unsigned long *ptes;
564 long npages, dma_ofs, i;
565
566#if !DEBUG_NODIRECT
567 /* If everything is physically contiguous, and the addresses
568 fall into the direct-map window, use it. */
569 if (leader->dma_address == 0
570 && paddr + size + __direct_map_base - 1 <= max_dma
571 && paddr + size <= __direct_map_size) {
572 out->dma_address = paddr + __direct_map_base;
573 out->dma_length = size;
574
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700575 DBGA(" sg_fill: [%p,%lx] -> direct %llx\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700576 __va(paddr), size, out->dma_address);
577
578 return 0;
579 }
580#endif
581
582 /* If physically contiguous and DAC is available, use it. */
583 if (leader->dma_address == 0 && dac_allowed) {
584 out->dma_address = paddr + alpha_mv.pci_dac_offset;
585 out->dma_length = size;
586
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700587 DBGA(" sg_fill: [%p,%lx] -> DAC %llx\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 __va(paddr), size, out->dma_address);
589
590 return 0;
591 }
592
593 /* Otherwise, we'll use the iommu to make the pages virtually
594 contiguous. */
595
596 paddr &= ~PAGE_MASK;
Joerg Roedeleb117d32008-10-15 22:02:13 -0700597 npages = iommu_num_pages(paddr, size, PAGE_SIZE);
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800598 dma_ofs = iommu_arena_alloc(dev, arena, npages, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700599 if (dma_ofs < 0) {
600 /* If we attempted a direct map above but failed, die. */
601 if (leader->dma_address == 0)
602 return -1;
603
604 /* Otherwise, break up the remaining virtually contiguous
605 hunks into individual direct maps and retry. */
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800606 sg_classify(dev, leader, end, 0);
607 return sg_fill(dev, leader, end, out, arena, max_dma, dac_allowed);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700608 }
609
610 out->dma_address = arena->dma_base + dma_ofs*PAGE_SIZE + paddr;
611 out->dma_length = size;
612
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700613 DBGA(" sg_fill: [%p,%lx] -> sg %llx np %ld\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700614 __va(paddr), size, out->dma_address, npages);
615
616 /* All virtually contiguous. We need to find the length of each
617 physically contiguous subsegment to fill in the ptes. */
618 ptes = &arena->ptes[dma_ofs];
619 sg = leader;
620 do {
621#if DEBUG_ALLOC > 0
622 struct scatterlist *last_sg = sg;
623#endif
624
625 size = sg->length;
626 paddr = SG_ENT_PHYS_ADDRESS(sg);
627
628 while (sg+1 < end && (int) sg[1].dma_address == -1) {
629 size += sg[1].length;
630 sg++;
631 }
632
Joerg Roedeleb117d32008-10-15 22:02:13 -0700633 npages = iommu_num_pages(paddr, size, PAGE_SIZE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634
635 paddr &= PAGE_MASK;
636 for (i = 0; i < npages; ++i, paddr += PAGE_SIZE)
637 *ptes++ = mk_iommu_pte(paddr);
638
639#if DEBUG_ALLOC > 0
640 DBGA(" (%ld) [%p,%x] np %ld\n",
641 last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg),
642 last_sg->length, npages);
643 while (++last_sg <= sg) {
644 DBGA(" (%ld) [%p,%x] cont\n",
645 last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg),
646 last_sg->length);
647 }
648#endif
649 } while (++sg < end && (int) sg->dma_address < 0);
650
651 return 1;
652}
653
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800654static int alpha_pci_map_sg(struct device *dev, struct scatterlist *sg,
655 int nents, enum dma_data_direction dir,
656 struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700657{
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800658 struct pci_dev *pdev = alpha_gendev_to_pci(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700659 struct scatterlist *start, *end, *out;
660 struct pci_controller *hose;
661 struct pci_iommu_arena *arena;
662 dma_addr_t max_dma;
663 int dac_allowed;
664
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800665 if (dir == PCI_DMA_NONE)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700666 BUG();
667
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800668 dac_allowed = dev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800669
Linus Torvalds1da177e2005-04-16 15:20:36 -0700670 /* Fast path single entry scatterlists. */
671 if (nents == 1) {
672 sg->dma_length = sg->length;
673 sg->dma_address
674 = pci_map_single_1(pdev, SG_ENT_VIRT_ADDRESS(sg),
675 sg->length, dac_allowed);
676 return sg->dma_address != 0;
677 }
678
679 start = sg;
680 end = sg + nents;
681
682 /* First, prepare information about the entries. */
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800683 sg_classify(dev, sg, end, alpha_mv.mv_pci_tbi != 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700684
685 /* Second, figure out where we're going to map things. */
686 if (alpha_mv.mv_pci_tbi) {
687 hose = pdev ? pdev->sysdata : pci_isa_hose;
688 max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
689 arena = hose->sg_pci;
690 if (!arena || arena->dma_base + arena->size - 1 > max_dma)
691 arena = hose->sg_isa;
692 } else {
693 max_dma = -1;
694 arena = NULL;
695 hose = NULL;
696 }
697
698 /* Third, iterate over the scatterlist leaders and allocate
699 dma space as needed. */
700 for (out = sg; sg < end; ++sg) {
701 if ((int) sg->dma_address < 0)
702 continue;
FUJITA Tomonori7c536642008-02-04 22:27:58 -0800703 if (sg_fill(dev, sg, end, out, arena, max_dma, dac_allowed) < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700704 goto error;
705 out++;
706 }
707
708 /* Mark the end of the list for pci_unmap_sg. */
709 if (out < end)
710 out->dma_length = 0;
711
712 if (out - start == 0)
713 printk(KERN_WARNING "pci_map_sg failed: no entries?\n");
714 DBGA("pci_map_sg: %ld entries\n", out - start);
715
716 return out - start;
717
718 error:
719 printk(KERN_WARNING "pci_map_sg failed: "
720 "could not allocate dma page tables\n");
721
722 /* Some allocation failed while mapping the scatterlist
723 entries. Unmap them now. */
724 if (out > start)
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800725 pci_unmap_sg(pdev, start, out - start, dir);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726 return 0;
727}
728
729/* Unmap a set of streaming mode DMA translations. Again, cpu read
730 rules concerning calls here are the same as for pci_unmap_single()
731 above. */
732
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800733static void alpha_pci_unmap_sg(struct device *dev, struct scatterlist *sg,
734 int nents, enum dma_data_direction dir,
735 struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700736{
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800737 struct pci_dev *pdev = alpha_gendev_to_pci(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700738 unsigned long flags;
739 struct pci_controller *hose;
740 struct pci_iommu_arena *arena;
741 struct scatterlist *end;
742 dma_addr_t max_dma;
743 dma_addr_t fbeg, fend;
744
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800745 if (dir == PCI_DMA_NONE)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700746 BUG();
747
748 if (! alpha_mv.mv_pci_tbi)
749 return;
750
751 hose = pdev ? pdev->sysdata : pci_isa_hose;
752 max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
753 arena = hose->sg_pci;
754 if (!arena || arena->dma_base + arena->size - 1 > max_dma)
755 arena = hose->sg_isa;
756
757 fbeg = -1, fend = 0;
758
759 spin_lock_irqsave(&arena->lock, flags);
760
761 for (end = sg + nents; sg < end; ++sg) {
FUJITA Tomonorif49d2eb2010-10-27 15:34:48 -0700762 dma_addr_t addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700763 size_t size;
764 long npages, ofs;
765 dma_addr_t tend;
766
767 addr = sg->dma_address;
768 size = sg->dma_length;
769 if (!size)
770 break;
771
772 if (addr > 0xffffffff) {
773 /* It's a DAC address -- nothing to do. */
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700774 DBGA(" (%ld) DAC [%llx,%zx]\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775 sg - end + nents, addr, size);
776 continue;
777 }
778
779 if (addr >= __direct_map_base
780 && addr < __direct_map_base + __direct_map_size) {
781 /* Nothing to do. */
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700782 DBGA(" (%ld) direct [%llx,%zx]\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700783 sg - end + nents, addr, size);
784 continue;
785 }
786
Randy Dunlap5f0e3da2009-03-31 15:23:36 -0700787 DBGA(" (%ld) sg [%llx,%zx]\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -0700788 sg - end + nents, addr, size);
789
Joerg Roedeleb117d32008-10-15 22:02:13 -0700790 npages = iommu_num_pages(addr, size, PAGE_SIZE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700791 ofs = (addr - arena->dma_base) >> PAGE_SHIFT;
792 iommu_arena_free(arena, ofs, npages);
793
794 tend = addr + size - 1;
795 if (fbeg > addr) fbeg = addr;
796 if (fend < tend) fend = tend;
797 }
798
799 /* If we're freeing ptes above the `next_entry' pointer (they
800 may have snuck back into the TLB since the last wrap flush),
801 we need to flush the TLB before reallocating the latter. */
802 if ((fend - arena->dma_base) >> PAGE_SHIFT >= arena->next_entry)
803 alpha_mv.mv_pci_tbi(hose, fbeg, fend);
804
805 spin_unlock_irqrestore(&arena->lock, flags);
806
807 DBGA("pci_unmap_sg: %ld entries\n", nents - (end - sg));
808}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700809
810/* Return whether the given PCI device DMA address mask can be
811 supported properly. */
812
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800813static int alpha_pci_supported(struct device *dev, u64 mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700814{
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800815 struct pci_dev *pdev = alpha_gendev_to_pci(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700816 struct pci_controller *hose;
817 struct pci_iommu_arena *arena;
818
819 /* If there exists a direct map, and the mask fits either
820 the entire direct mapped space or the total system memory as
821 shifted by the map base */
822 if (__direct_map_size != 0
823 && (__direct_map_base + __direct_map_size - 1 <= mask ||
824 __direct_map_base + (max_low_pfn << PAGE_SHIFT) - 1 <= mask))
825 return 1;
826
827 /* Check that we have a scatter-gather arena that fits. */
828 hose = pdev ? pdev->sysdata : pci_isa_hose;
829 arena = hose->sg_isa;
830 if (arena && arena->dma_base + arena->size - 1 <= mask)
831 return 1;
832 arena = hose->sg_pci;
833 if (arena && arena->dma_base + arena->size - 1 <= mask)
834 return 1;
835
836 /* As last resort try ZONE_DMA. */
837 if (!__direct_map_base && MAX_DMA_ADDRESS - IDENT_ADDR - 1 <= mask)
838 return 1;
839
840 return 0;
841}
842
843
844/*
845 * AGP GART extensions to the IOMMU
846 */
847int
848iommu_reserve(struct pci_iommu_arena *arena, long pg_count, long align_mask)
849{
850 unsigned long flags;
851 unsigned long *ptes;
852 long i, p;
853
854 if (!arena) return -EINVAL;
855
856 spin_lock_irqsave(&arena->lock, flags);
857
858 /* Search for N empty ptes. */
859 ptes = arena->ptes;
FUJITA Tomonoricf540142008-03-04 14:28:57 -0800860 p = iommu_arena_find_pages(NULL, arena, pg_count, align_mask);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700861 if (p < 0) {
862 spin_unlock_irqrestore(&arena->lock, flags);
863 return -1;
864 }
865
866 /* Success. Mark them all reserved (ie not zero and invalid)
867 for the iommu tlb that could load them from under us.
868 They will be filled in with valid bits by _bind() */
869 for (i = 0; i < pg_count; ++i)
870 ptes[p+i] = IOMMU_RESERVED_PTE;
871
872 arena->next_entry = p + pg_count;
873 spin_unlock_irqrestore(&arena->lock, flags);
874
875 return p;
876}
877
878int
879iommu_release(struct pci_iommu_arena *arena, long pg_start, long pg_count)
880{
881 unsigned long *ptes;
882 long i;
883
884 if (!arena) return -EINVAL;
885
886 ptes = arena->ptes;
887
888 /* Make sure they're all reserved first... */
889 for(i = pg_start; i < pg_start + pg_count; i++)
890 if (ptes[i] != IOMMU_RESERVED_PTE)
891 return -EBUSY;
892
893 iommu_arena_free(arena, pg_start, pg_count);
894 return 0;
895}
896
897int
898iommu_bind(struct pci_iommu_arena *arena, long pg_start, long pg_count,
Ivan Kokshayskyd68721e2009-09-23 15:57:42 -0700899 struct page **pages)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700900{
901 unsigned long flags;
902 unsigned long *ptes;
903 long i, j;
904
905 if (!arena) return -EINVAL;
906
907 spin_lock_irqsave(&arena->lock, flags);
908
909 ptes = arena->ptes;
910
911 for(j = pg_start; j < pg_start + pg_count; j++) {
912 if (ptes[j] != IOMMU_RESERVED_PTE) {
913 spin_unlock_irqrestore(&arena->lock, flags);
914 return -EBUSY;
915 }
916 }
917
918 for(i = 0, j = pg_start; i < pg_count; i++, j++)
Ivan Kokshayskyd68721e2009-09-23 15:57:42 -0700919 ptes[j] = mk_iommu_pte(page_to_phys(pages[i]));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700920
921 spin_unlock_irqrestore(&arena->lock, flags);
922
923 return 0;
924}
925
926int
927iommu_unbind(struct pci_iommu_arena *arena, long pg_start, long pg_count)
928{
929 unsigned long *p;
930 long i;
931
932 if (!arena) return -EINVAL;
933
934 p = arena->ptes + pg_start;
935 for(i = 0; i < pg_count; i++)
936 p[i] = IOMMU_RESERVED_PTE;
937
938 return 0;
939}
940
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800941static int alpha_pci_mapping_error(struct device *dev, dma_addr_t dma_addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700942{
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800943 return dma_addr == 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700944}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700945
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800946static int alpha_pci_set_mask(struct device *dev, u64 mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700947{
948 if (!dev->dma_mask ||
949 !pci_dma_supported(alpha_gendev_to_pci(dev), mask))
950 return -EIO;
951
952 *dev->dma_mask = mask;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700953 return 0;
954}
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800955
956struct dma_map_ops alpha_pci_ops = {
Andrzej Pietrasiewicz4ce9a912011-12-22 13:58:21 +0100957 .alloc = alpha_pci_alloc_coherent,
958 .free = alpha_pci_free_coherent,
FUJITA Tomonoric186cac2010-03-10 15:23:37 -0800959 .map_page = alpha_pci_map_page,
960 .unmap_page = alpha_pci_unmap_page,
961 .map_sg = alpha_pci_map_sg,
962 .unmap_sg = alpha_pci_unmap_sg,
963 .mapping_error = alpha_pci_mapping_error,
964 .dma_supported = alpha_pci_supported,
965 .set_dma_mask = alpha_pci_set_mask,
966};
967
968struct dma_map_ops *dma_ops = &alpha_pci_ops;
969EXPORT_SYMBOL(dma_ops);