| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* | 
 | 2 |  *	linux/arch/alpha/kernel/pci_iommu.c | 
 | 3 |  */ | 
 | 4 |  | 
 | 5 | #include <linux/kernel.h> | 
 | 6 | #include <linux/mm.h> | 
 | 7 | #include <linux/pci.h> | 
 | 8 | #include <linux/slab.h> | 
 | 9 | #include <linux/bootmem.h> | 
| Jens Axboe | 944bda2 | 2007-10-23 12:31:05 +0200 | [diff] [blame] | 10 | #include <linux/scatterlist.h> | 
| Richard Henderson | 74fd1b6 | 2007-05-29 16:01:35 -0700 | [diff] [blame] | 11 | #include <linux/log2.h> | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 12 | #include <linux/dma-mapping.h> | 
| FUJITA Tomonori | fd28841 | 2008-03-13 12:32:40 -0700 | [diff] [blame] | 13 | #include <linux/iommu-helper.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 14 |  | 
 | 15 | #include <asm/io.h> | 
 | 16 | #include <asm/hwrpb.h> | 
 | 17 |  | 
 | 18 | #include "proto.h" | 
 | 19 | #include "pci_impl.h" | 
 | 20 |  | 
 | 21 |  | 
 | 22 | #define DEBUG_ALLOC 0 | 
 | 23 | #if DEBUG_ALLOC > 0 | 
 | 24 | # define DBGA(args...)		printk(KERN_DEBUG args) | 
 | 25 | #else | 
 | 26 | # define DBGA(args...) | 
 | 27 | #endif | 
 | 28 | #if DEBUG_ALLOC > 1 | 
 | 29 | # define DBGA2(args...)		printk(KERN_DEBUG args) | 
 | 30 | #else | 
 | 31 | # define DBGA2(args...) | 
 | 32 | #endif | 
 | 33 |  | 
 | 34 | #define DEBUG_NODIRECT 0 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 35 |  | 
 | 36 | #define ISA_DMA_MASK		0x00ffffff | 
 | 37 |  | 
 | 38 | static inline unsigned long | 
 | 39 | mk_iommu_pte(unsigned long paddr) | 
 | 40 | { | 
 | 41 | 	return (paddr >> (PAGE_SHIFT-1)) | 1; | 
 | 42 | } | 
 | 43 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 44 | /* Return the minimum of MAX or the first power of two larger | 
 | 45 |    than main memory.  */ | 
 | 46 |  | 
 | 47 | unsigned long | 
 | 48 | size_for_memory(unsigned long max) | 
 | 49 | { | 
 | 50 | 	unsigned long mem = max_low_pfn << PAGE_SHIFT; | 
 | 51 | 	if (mem < max) | 
| Richard Henderson | 74fd1b6 | 2007-05-29 16:01:35 -0700 | [diff] [blame] | 52 | 		max = roundup_pow_of_two(mem); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 53 | 	return max; | 
 | 54 | } | 
 | 55 |  | 
| Al Viro | ed5f656 | 2007-07-26 17:34:19 +0100 | [diff] [blame] | 56 | struct pci_iommu_arena * __init | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 57 | iommu_arena_new_node(int nid, struct pci_controller *hose, dma_addr_t base, | 
 | 58 | 		     unsigned long window_size, unsigned long align) | 
 | 59 | { | 
 | 60 | 	unsigned long mem_size; | 
 | 61 | 	struct pci_iommu_arena *arena; | 
 | 62 |  | 
 | 63 | 	mem_size = window_size / (PAGE_SIZE / sizeof(unsigned long)); | 
 | 64 |  | 
 | 65 | 	/* Note that the TLB lookup logic uses bitwise concatenation, | 
 | 66 | 	   not addition, so the required arena alignment is based on | 
 | 67 | 	   the size of the window.  Retain the align parameter so that | 
 | 68 | 	   particular systems can over-align the arena.  */ | 
 | 69 | 	if (align < mem_size) | 
 | 70 | 		align = mem_size; | 
 | 71 |  | 
 | 72 |  | 
 | 73 | #ifdef CONFIG_DISCONTIGMEM | 
 | 74 |  | 
| Harvey Harrison | bbb8d34 | 2008-04-28 02:13:46 -0700 | [diff] [blame] | 75 | 	arena = alloc_bootmem_node(NODE_DATA(nid), sizeof(*arena)); | 
 | 76 | 	if (!NODE_DATA(nid) || !arena) { | 
 | 77 | 		printk("%s: couldn't allocate arena from node %d\n" | 
 | 78 | 		       "    falling back to system-wide allocation\n", | 
 | 79 | 		       __func__, nid); | 
 | 80 | 		arena = alloc_bootmem(sizeof(*arena)); | 
 | 81 | 	} | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 82 |  | 
| Harvey Harrison | bbb8d34 | 2008-04-28 02:13:46 -0700 | [diff] [blame] | 83 | 	arena->ptes = __alloc_bootmem_node(NODE_DATA(nid), mem_size, align, 0); | 
 | 84 | 	if (!NODE_DATA(nid) || !arena->ptes) { | 
 | 85 | 		printk("%s: couldn't allocate arena ptes from node %d\n" | 
 | 86 | 		       "    falling back to system-wide allocation\n", | 
 | 87 | 		       __func__, nid); | 
 | 88 | 		arena->ptes = __alloc_bootmem(mem_size, align, 0); | 
 | 89 | 	} | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 90 |  | 
 | 91 | #else /* CONFIG_DISCONTIGMEM */ | 
 | 92 |  | 
 | 93 | 	arena = alloc_bootmem(sizeof(*arena)); | 
 | 94 | 	arena->ptes = __alloc_bootmem(mem_size, align, 0); | 
 | 95 |  | 
 | 96 | #endif /* CONFIG_DISCONTIGMEM */ | 
 | 97 |  | 
 | 98 | 	spin_lock_init(&arena->lock); | 
 | 99 | 	arena->hose = hose; | 
 | 100 | 	arena->dma_base = base; | 
 | 101 | 	arena->size = window_size; | 
 | 102 | 	arena->next_entry = 0; | 
 | 103 |  | 
 | 104 | 	/* Align allocations to a multiple of a page size.  Not needed | 
 | 105 | 	   unless there are chip bugs.  */ | 
 | 106 | 	arena->align_entry = 1; | 
 | 107 |  | 
 | 108 | 	return arena; | 
 | 109 | } | 
 | 110 |  | 
| Al Viro | ed5f656 | 2007-07-26 17:34:19 +0100 | [diff] [blame] | 111 | struct pci_iommu_arena * __init | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 112 | iommu_arena_new(struct pci_controller *hose, dma_addr_t base, | 
 | 113 | 		unsigned long window_size, unsigned long align) | 
 | 114 | { | 
 | 115 | 	return iommu_arena_new_node(0, hose, base, window_size, align); | 
 | 116 | } | 
 | 117 |  | 
 | 118 | /* Must be called with the arena lock held */ | 
 | 119 | static long | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 120 | iommu_arena_find_pages(struct device *dev, struct pci_iommu_arena *arena, | 
 | 121 | 		       long n, long mask) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 122 | { | 
 | 123 | 	unsigned long *ptes; | 
 | 124 | 	long i, p, nent; | 
| FUJITA Tomonori | 23d7e03 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 125 | 	int pass = 0; | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 126 | 	unsigned long base; | 
 | 127 | 	unsigned long boundary_size; | 
 | 128 |  | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 129 | 	base = arena->dma_base >> PAGE_SHIFT; | 
| Ivan Kokshaysky | ab875cf | 2008-03-09 16:31:17 +0300 | [diff] [blame] | 130 | 	if (dev) { | 
 | 131 | 		boundary_size = dma_get_seg_boundary(dev) + 1; | 
| Ivan Kokshaysky | ab875cf | 2008-03-09 16:31:17 +0300 | [diff] [blame] | 132 | 		boundary_size >>= PAGE_SHIFT; | 
 | 133 | 	} else { | 
 | 134 | 		boundary_size = 1UL << (32 - PAGE_SHIFT); | 
 | 135 | 	} | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 136 |  | 
 | 137 | 	/* Search forward for the first mask-aligned sequence of N free ptes */ | 
 | 138 | 	ptes = arena->ptes; | 
 | 139 | 	nent = arena->size >> PAGE_SHIFT; | 
| FUJITA Tomonori | 3c5f1de | 2008-03-04 14:28:54 -0800 | [diff] [blame] | 140 | 	p = ALIGN(arena->next_entry, mask + 1); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 141 | 	i = 0; | 
| FUJITA Tomonori | 23d7e03 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 142 |  | 
 | 143 | again: | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 144 | 	while (i < n && p+i < nent) { | 
| FUJITA Tomonori | fd28841 | 2008-03-13 12:32:40 -0700 | [diff] [blame] | 145 | 		if (!i && iommu_is_span_boundary(p, n, base, boundary_size)) { | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 146 | 			p = ALIGN(p + 1, mask + 1); | 
 | 147 | 			goto again; | 
 | 148 | 		} | 
 | 149 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 150 | 		if (ptes[p+i]) | 
| FUJITA Tomonori | 3c5f1de | 2008-03-04 14:28:54 -0800 | [diff] [blame] | 151 | 			p = ALIGN(p + i + 1, mask + 1), i = 0; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 152 | 		else | 
 | 153 | 			i = i + 1; | 
 | 154 | 	} | 
 | 155 |  | 
 | 156 | 	if (i < n) { | 
| FUJITA Tomonori | 23d7e03 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 157 | 		if (pass < 1) { | 
 | 158 | 			/* | 
 | 159 | 			 * Reached the end.  Flush the TLB and restart | 
 | 160 | 			 * the search from the beginning. | 
 | 161 | 			*/ | 
 | 162 | 			alpha_mv.mv_pci_tbi(arena->hose, 0, -1); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 163 |  | 
| FUJITA Tomonori | 23d7e03 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 164 | 			pass++; | 
 | 165 | 			p = 0; | 
 | 166 | 			i = 0; | 
 | 167 | 			goto again; | 
 | 168 | 		} else | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 169 | 			return -1; | 
 | 170 | 	} | 
 | 171 |  | 
 | 172 | 	/* Success. It's the responsibility of the caller to mark them | 
 | 173 | 	   in use before releasing the lock */ | 
 | 174 | 	return p; | 
 | 175 | } | 
 | 176 |  | 
 | 177 | static long | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 178 | iommu_arena_alloc(struct device *dev, struct pci_iommu_arena *arena, long n, | 
 | 179 | 		  unsigned int align) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 180 | { | 
 | 181 | 	unsigned long flags; | 
 | 182 | 	unsigned long *ptes; | 
 | 183 | 	long i, p, mask; | 
 | 184 |  | 
 | 185 | 	spin_lock_irqsave(&arena->lock, flags); | 
 | 186 |  | 
 | 187 | 	/* Search for N empty ptes */ | 
 | 188 | 	ptes = arena->ptes; | 
 | 189 | 	mask = max(align, arena->align_entry) - 1; | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 190 | 	p = iommu_arena_find_pages(dev, arena, n, mask); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 191 | 	if (p < 0) { | 
 | 192 | 		spin_unlock_irqrestore(&arena->lock, flags); | 
 | 193 | 		return -1; | 
 | 194 | 	} | 
 | 195 |  | 
 | 196 | 	/* Success.  Mark them all in use, ie not zero and invalid | 
 | 197 | 	   for the iommu tlb that could load them from under us. | 
 | 198 | 	   The chip specific bits will fill this in with something | 
 | 199 | 	   kosher when we return.  */ | 
 | 200 | 	for (i = 0; i < n; ++i) | 
 | 201 | 		ptes[p+i] = IOMMU_INVALID_PTE; | 
 | 202 |  | 
 | 203 | 	arena->next_entry = p + n; | 
 | 204 | 	spin_unlock_irqrestore(&arena->lock, flags); | 
 | 205 |  | 
 | 206 | 	return p; | 
 | 207 | } | 
 | 208 |  | 
 | 209 | static void | 
 | 210 | iommu_arena_free(struct pci_iommu_arena *arena, long ofs, long n) | 
 | 211 | { | 
 | 212 | 	unsigned long *p; | 
 | 213 | 	long i; | 
 | 214 |  | 
 | 215 | 	p = arena->ptes + ofs; | 
 | 216 | 	for (i = 0; i < n; ++i) | 
 | 217 | 		p[i] = 0; | 
 | 218 | } | 
 | 219 |  | 
| Jan Beulich | caa5171 | 2007-07-09 11:55:51 -0700 | [diff] [blame] | 220 | /* True if the machine supports DAC addressing, and DEV can | 
 | 221 |    make use of it given MASK.  */ | 
 | 222 | static int pci_dac_dma_supported(struct pci_dev *hwdev, u64 mask); | 
 | 223 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 224 | /* Map a single buffer of the indicated size for PCI DMA in streaming | 
 | 225 |    mode.  The 32-bit PCI bus mastering address to use is returned. | 
 | 226 |    Once the device is given the dma address, the device owns this memory | 
 | 227 |    until either pci_unmap_single or pci_dma_sync_single is performed.  */ | 
 | 228 |  | 
 | 229 | static dma_addr_t | 
 | 230 | pci_map_single_1(struct pci_dev *pdev, void *cpu_addr, size_t size, | 
 | 231 | 		 int dac_allowed) | 
 | 232 | { | 
 | 233 | 	struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose; | 
 | 234 | 	dma_addr_t max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK; | 
 | 235 | 	struct pci_iommu_arena *arena; | 
 | 236 | 	long npages, dma_ofs, i; | 
 | 237 | 	unsigned long paddr; | 
 | 238 | 	dma_addr_t ret; | 
 | 239 | 	unsigned int align = 0; | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 240 | 	struct device *dev = pdev ? &pdev->dev : NULL; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 241 |  | 
 | 242 | 	paddr = __pa(cpu_addr); | 
 | 243 |  | 
 | 244 | #if !DEBUG_NODIRECT | 
 | 245 | 	/* First check to see if we can use the direct map window.  */ | 
 | 246 | 	if (paddr + size + __direct_map_base - 1 <= max_dma | 
 | 247 | 	    && paddr + size <= __direct_map_size) { | 
 | 248 | 		ret = paddr + __direct_map_base; | 
 | 249 |  | 
 | 250 | 		DBGA2("pci_map_single: [%p,%lx] -> direct %lx from %p\n", | 
 | 251 | 		      cpu_addr, size, ret, __builtin_return_address(0)); | 
 | 252 |  | 
 | 253 | 		return ret; | 
 | 254 | 	} | 
 | 255 | #endif | 
 | 256 |  | 
 | 257 | 	/* Next, use DAC if selected earlier.  */ | 
 | 258 | 	if (dac_allowed) { | 
 | 259 | 		ret = paddr + alpha_mv.pci_dac_offset; | 
 | 260 |  | 
 | 261 | 		DBGA2("pci_map_single: [%p,%lx] -> DAC %lx from %p\n", | 
 | 262 | 		      cpu_addr, size, ret, __builtin_return_address(0)); | 
 | 263 |  | 
 | 264 | 		return ret; | 
 | 265 | 	} | 
 | 266 |  | 
 | 267 | 	/* If the machine doesn't define a pci_tbi routine, we have to | 
 | 268 | 	   assume it doesn't support sg mapping, and, since we tried to | 
 | 269 | 	   use direct_map above, it now must be considered an error. */ | 
 | 270 | 	if (! alpha_mv.mv_pci_tbi) { | 
 | 271 | 		static int been_here = 0; /* Only print the message once. */ | 
 | 272 | 		if (!been_here) { | 
 | 273 | 		    printk(KERN_WARNING "pci_map_single: no HW sg\n"); | 
 | 274 | 		    been_here = 1; | 
 | 275 | 		} | 
 | 276 | 		return 0; | 
 | 277 | 	} | 
 | 278 |  | 
 | 279 | 	arena = hose->sg_pci; | 
 | 280 | 	if (!arena || arena->dma_base + arena->size - 1 > max_dma) | 
 | 281 | 		arena = hose->sg_isa; | 
 | 282 |  | 
| Joerg Roedel | eb117d3 | 2008-10-15 22:02:13 -0700 | [diff] [blame] | 283 | 	npages = iommu_num_pages(paddr, size, PAGE_SIZE); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 284 |  | 
 | 285 | 	/* Force allocation to 64KB boundary for ISA bridges. */ | 
 | 286 | 	if (pdev && pdev == isa_bridge) | 
 | 287 | 		align = 8; | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 288 | 	dma_ofs = iommu_arena_alloc(dev, arena, npages, align); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 289 | 	if (dma_ofs < 0) { | 
 | 290 | 		printk(KERN_WARNING "pci_map_single failed: " | 
 | 291 | 		       "could not allocate dma page tables\n"); | 
 | 292 | 		return 0; | 
 | 293 | 	} | 
 | 294 |  | 
 | 295 | 	paddr &= PAGE_MASK; | 
 | 296 | 	for (i = 0; i < npages; ++i, paddr += PAGE_SIZE) | 
 | 297 | 		arena->ptes[i + dma_ofs] = mk_iommu_pte(paddr); | 
 | 298 |  | 
 | 299 | 	ret = arena->dma_base + dma_ofs * PAGE_SIZE; | 
 | 300 | 	ret += (unsigned long)cpu_addr & ~PAGE_MASK; | 
 | 301 |  | 
 | 302 | 	DBGA2("pci_map_single: [%p,%lx] np %ld -> sg %lx from %p\n", | 
 | 303 | 	      cpu_addr, size, npages, ret, __builtin_return_address(0)); | 
 | 304 |  | 
 | 305 | 	return ret; | 
 | 306 | } | 
 | 307 |  | 
 | 308 | dma_addr_t | 
 | 309 | pci_map_single(struct pci_dev *pdev, void *cpu_addr, size_t size, int dir) | 
 | 310 | { | 
 | 311 | 	int dac_allowed;  | 
 | 312 |  | 
 | 313 | 	if (dir == PCI_DMA_NONE) | 
 | 314 | 		BUG(); | 
 | 315 |  | 
 | 316 | 	dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;  | 
 | 317 | 	return pci_map_single_1(pdev, cpu_addr, size, dac_allowed); | 
 | 318 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 319 | EXPORT_SYMBOL(pci_map_single); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 320 |  | 
 | 321 | dma_addr_t | 
 | 322 | pci_map_page(struct pci_dev *pdev, struct page *page, unsigned long offset, | 
 | 323 | 	     size_t size, int dir) | 
 | 324 | { | 
 | 325 | 	int dac_allowed; | 
 | 326 |  | 
 | 327 | 	if (dir == PCI_DMA_NONE) | 
 | 328 | 		BUG(); | 
 | 329 |  | 
 | 330 | 	dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;  | 
 | 331 | 	return pci_map_single_1(pdev, (char *)page_address(page) + offset,  | 
 | 332 | 				size, dac_allowed); | 
 | 333 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 334 | EXPORT_SYMBOL(pci_map_page); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 335 |  | 
 | 336 | /* Unmap a single streaming mode DMA translation.  The DMA_ADDR and | 
 | 337 |    SIZE must match what was provided for in a previous pci_map_single | 
 | 338 |    call.  All other usages are undefined.  After this call, reads by | 
 | 339 |    the cpu to the buffer are guaranteed to see whatever the device | 
 | 340 |    wrote there.  */ | 
 | 341 |  | 
 | 342 | void | 
 | 343 | pci_unmap_single(struct pci_dev *pdev, dma_addr_t dma_addr, size_t size, | 
 | 344 | 		 int direction) | 
 | 345 | { | 
 | 346 | 	unsigned long flags; | 
 | 347 | 	struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose; | 
 | 348 | 	struct pci_iommu_arena *arena; | 
 | 349 | 	long dma_ofs, npages; | 
 | 350 |  | 
 | 351 | 	if (direction == PCI_DMA_NONE) | 
 | 352 | 		BUG(); | 
 | 353 |  | 
 | 354 | 	if (dma_addr >= __direct_map_base | 
 | 355 | 	    && dma_addr < __direct_map_base + __direct_map_size) { | 
 | 356 | 		/* Nothing to do.  */ | 
 | 357 |  | 
 | 358 | 		DBGA2("pci_unmap_single: direct [%lx,%lx] from %p\n", | 
 | 359 | 		      dma_addr, size, __builtin_return_address(0)); | 
 | 360 |  | 
 | 361 | 		return; | 
 | 362 | 	} | 
 | 363 |  | 
 | 364 | 	if (dma_addr > 0xffffffff) { | 
 | 365 | 		DBGA2("pci64_unmap_single: DAC [%lx,%lx] from %p\n", | 
 | 366 | 		      dma_addr, size, __builtin_return_address(0)); | 
 | 367 | 		return; | 
 | 368 | 	} | 
 | 369 |  | 
 | 370 | 	arena = hose->sg_pci; | 
 | 371 | 	if (!arena || dma_addr < arena->dma_base) | 
 | 372 | 		arena = hose->sg_isa; | 
 | 373 |  | 
 | 374 | 	dma_ofs = (dma_addr - arena->dma_base) >> PAGE_SHIFT; | 
 | 375 | 	if (dma_ofs * PAGE_SIZE >= arena->size) { | 
 | 376 | 		printk(KERN_ERR "Bogus pci_unmap_single: dma_addr %lx " | 
 | 377 | 		       " base %lx size %x\n", dma_addr, arena->dma_base, | 
 | 378 | 		       arena->size); | 
 | 379 | 		return; | 
 | 380 | 		BUG(); | 
 | 381 | 	} | 
 | 382 |  | 
| Joerg Roedel | eb117d3 | 2008-10-15 22:02:13 -0700 | [diff] [blame] | 383 | 	npages = iommu_num_pages(dma_addr, size, PAGE_SIZE); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 384 |  | 
 | 385 | 	spin_lock_irqsave(&arena->lock, flags); | 
 | 386 |  | 
 | 387 | 	iommu_arena_free(arena, dma_ofs, npages); | 
 | 388 |  | 
 | 389 |         /* If we're freeing ptes above the `next_entry' pointer (they | 
 | 390 |            may have snuck back into the TLB since the last wrap flush), | 
 | 391 |            we need to flush the TLB before reallocating the latter.  */ | 
 | 392 | 	if (dma_ofs >= arena->next_entry) | 
 | 393 | 		alpha_mv.mv_pci_tbi(hose, dma_addr, dma_addr + size - 1); | 
 | 394 |  | 
 | 395 | 	spin_unlock_irqrestore(&arena->lock, flags); | 
 | 396 |  | 
 | 397 | 	DBGA2("pci_unmap_single: sg [%lx,%lx] np %ld from %p\n", | 
 | 398 | 	      dma_addr, size, npages, __builtin_return_address(0)); | 
 | 399 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 400 | EXPORT_SYMBOL(pci_unmap_single); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 401 |  | 
 | 402 | void | 
 | 403 | pci_unmap_page(struct pci_dev *pdev, dma_addr_t dma_addr, | 
 | 404 | 	       size_t size, int direction) | 
 | 405 | { | 
 | 406 | 	pci_unmap_single(pdev, dma_addr, size, direction); | 
 | 407 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 408 | EXPORT_SYMBOL(pci_unmap_page); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 409 |  | 
 | 410 | /* Allocate and map kernel buffer using consistent mode DMA for PCI | 
 | 411 |    device.  Returns non-NULL cpu-view pointer to the buffer if | 
 | 412 |    successful and sets *DMA_ADDRP to the pci side dma address as well, | 
 | 413 |    else DMA_ADDRP is undefined.  */ | 
 | 414 |  | 
 | 415 | void * | 
| Ivan Kokshaysky | c143d43 | 2008-04-02 13:04:43 -0700 | [diff] [blame] | 416 | __pci_alloc_consistent(struct pci_dev *pdev, size_t size, | 
 | 417 | 		       dma_addr_t *dma_addrp, gfp_t gfp) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 418 | { | 
 | 419 | 	void *cpu_addr; | 
 | 420 | 	long order = get_order(size); | 
| Ivan Kokshaysky | c143d43 | 2008-04-02 13:04:43 -0700 | [diff] [blame] | 421 |  | 
 | 422 | 	gfp &= ~GFP_DMA; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 423 |  | 
 | 424 | try_again: | 
 | 425 | 	cpu_addr = (void *)__get_free_pages(gfp, order); | 
 | 426 | 	if (! cpu_addr) { | 
 | 427 | 		printk(KERN_INFO "pci_alloc_consistent: " | 
 | 428 | 		       "get_free_pages failed from %p\n", | 
 | 429 | 			__builtin_return_address(0)); | 
 | 430 | 		/* ??? Really atomic allocation?  Otherwise we could play | 
 | 431 | 		   with vmalloc and sg if we can't find contiguous memory.  */ | 
 | 432 | 		return NULL; | 
 | 433 | 	} | 
 | 434 | 	memset(cpu_addr, 0, size); | 
 | 435 |  | 
 | 436 | 	*dma_addrp = pci_map_single_1(pdev, cpu_addr, size, 0); | 
 | 437 | 	if (*dma_addrp == 0) { | 
 | 438 | 		free_pages((unsigned long)cpu_addr, order); | 
 | 439 | 		if (alpha_mv.mv_pci_tbi || (gfp & GFP_DMA)) | 
 | 440 | 			return NULL; | 
 | 441 | 		/* The address doesn't fit required mask and we | 
 | 442 | 		   do not have iommu. Try again with GFP_DMA. */ | 
 | 443 | 		gfp |= GFP_DMA; | 
 | 444 | 		goto try_again; | 
 | 445 | 	} | 
 | 446 | 		 | 
 | 447 | 	DBGA2("pci_alloc_consistent: %lx -> [%p,%x] from %p\n", | 
 | 448 | 	      size, cpu_addr, *dma_addrp, __builtin_return_address(0)); | 
 | 449 |  | 
 | 450 | 	return cpu_addr; | 
 | 451 | } | 
| Ivan Kokshaysky | c143d43 | 2008-04-02 13:04:43 -0700 | [diff] [blame] | 452 | EXPORT_SYMBOL(__pci_alloc_consistent); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 453 |  | 
 | 454 | /* Free and unmap a consistent DMA buffer.  CPU_ADDR and DMA_ADDR must | 
 | 455 |    be values that were returned from pci_alloc_consistent.  SIZE must | 
 | 456 |    be the same as what as passed into pci_alloc_consistent. | 
 | 457 |    References to the memory and mappings associated with CPU_ADDR or | 
 | 458 |    DMA_ADDR past this call are illegal.  */ | 
 | 459 |  | 
 | 460 | void | 
 | 461 | pci_free_consistent(struct pci_dev *pdev, size_t size, void *cpu_addr, | 
 | 462 | 		    dma_addr_t dma_addr) | 
 | 463 | { | 
 | 464 | 	pci_unmap_single(pdev, dma_addr, size, PCI_DMA_BIDIRECTIONAL); | 
 | 465 | 	free_pages((unsigned long)cpu_addr, get_order(size)); | 
 | 466 |  | 
 | 467 | 	DBGA2("pci_free_consistent: [%x,%lx] from %p\n", | 
 | 468 | 	      dma_addr, size, __builtin_return_address(0)); | 
 | 469 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 470 | EXPORT_SYMBOL(pci_free_consistent); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 471 |  | 
 | 472 | /* Classify the elements of the scatterlist.  Write dma_address | 
 | 473 |    of each element with: | 
 | 474 | 	0   : Followers all physically adjacent. | 
 | 475 | 	1   : Followers all virtually adjacent. | 
 | 476 | 	-1  : Not leader, physically adjacent to previous. | 
 | 477 | 	-2  : Not leader, virtually adjacent to previous. | 
 | 478 |    Write dma_length of each leader with the combined lengths of | 
 | 479 |    the mergable followers.  */ | 
 | 480 |  | 
| Jens Axboe | 58b053e | 2007-10-22 20:02:46 +0200 | [diff] [blame] | 481 | #define SG_ENT_VIRT_ADDRESS(SG) (sg_virt((SG))) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 482 | #define SG_ENT_PHYS_ADDRESS(SG) __pa(SG_ENT_VIRT_ADDRESS(SG)) | 
 | 483 |  | 
 | 484 | static void | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 485 | sg_classify(struct device *dev, struct scatterlist *sg, struct scatterlist *end, | 
 | 486 | 	    int virt_ok) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 487 | { | 
 | 488 | 	unsigned long next_paddr; | 
 | 489 | 	struct scatterlist *leader; | 
 | 490 | 	long leader_flag, leader_length; | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 491 | 	unsigned int max_seg_size; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 492 |  | 
 | 493 | 	leader = sg; | 
 | 494 | 	leader_flag = 0; | 
 | 495 | 	leader_length = leader->length; | 
 | 496 | 	next_paddr = SG_ENT_PHYS_ADDRESS(leader) + leader_length; | 
 | 497 |  | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 498 | 	/* we will not marge sg without device. */ | 
 | 499 | 	max_seg_size = dev ? dma_get_max_seg_size(dev) : 0; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 500 | 	for (++sg; sg < end; ++sg) { | 
 | 501 | 		unsigned long addr, len; | 
 | 502 | 		addr = SG_ENT_PHYS_ADDRESS(sg); | 
 | 503 | 		len = sg->length; | 
 | 504 |  | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 505 | 		if (leader_length + len > max_seg_size) | 
 | 506 | 			goto new_segment; | 
 | 507 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 508 | 		if (next_paddr == addr) { | 
 | 509 | 			sg->dma_address = -1; | 
 | 510 | 			leader_length += len; | 
 | 511 | 		} else if (((next_paddr | addr) & ~PAGE_MASK) == 0 && virt_ok) { | 
 | 512 | 			sg->dma_address = -2; | 
 | 513 | 			leader_flag = 1; | 
 | 514 | 			leader_length += len; | 
 | 515 | 		} else { | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 516 | new_segment: | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 517 | 			leader->dma_address = leader_flag; | 
 | 518 | 			leader->dma_length = leader_length; | 
 | 519 | 			leader = sg; | 
 | 520 | 			leader_flag = 0; | 
 | 521 | 			leader_length = len; | 
 | 522 | 		} | 
 | 523 |  | 
 | 524 | 		next_paddr = addr + len; | 
 | 525 | 	} | 
 | 526 |  | 
 | 527 | 	leader->dma_address = leader_flag; | 
 | 528 | 	leader->dma_length = leader_length; | 
 | 529 | } | 
 | 530 |  | 
 | 531 | /* Given a scatterlist leader, choose an allocation method and fill | 
 | 532 |    in the blanks.  */ | 
 | 533 |  | 
 | 534 | static int | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 535 | sg_fill(struct device *dev, struct scatterlist *leader, struct scatterlist *end, | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 536 | 	struct scatterlist *out, struct pci_iommu_arena *arena, | 
 | 537 | 	dma_addr_t max_dma, int dac_allowed) | 
 | 538 | { | 
 | 539 | 	unsigned long paddr = SG_ENT_PHYS_ADDRESS(leader); | 
 | 540 | 	long size = leader->dma_length; | 
 | 541 | 	struct scatterlist *sg; | 
 | 542 | 	unsigned long *ptes; | 
 | 543 | 	long npages, dma_ofs, i; | 
 | 544 |  | 
 | 545 | #if !DEBUG_NODIRECT | 
 | 546 | 	/* If everything is physically contiguous, and the addresses | 
 | 547 | 	   fall into the direct-map window, use it.  */ | 
 | 548 | 	if (leader->dma_address == 0 | 
 | 549 | 	    && paddr + size + __direct_map_base - 1 <= max_dma | 
 | 550 | 	    && paddr + size <= __direct_map_size) { | 
 | 551 | 		out->dma_address = paddr + __direct_map_base; | 
 | 552 | 		out->dma_length = size; | 
 | 553 |  | 
 | 554 | 		DBGA("    sg_fill: [%p,%lx] -> direct %lx\n", | 
 | 555 | 		     __va(paddr), size, out->dma_address); | 
 | 556 |  | 
 | 557 | 		return 0; | 
 | 558 | 	} | 
 | 559 | #endif | 
 | 560 |  | 
 | 561 | 	/* If physically contiguous and DAC is available, use it.  */ | 
 | 562 | 	if (leader->dma_address == 0 && dac_allowed) { | 
 | 563 | 		out->dma_address = paddr + alpha_mv.pci_dac_offset; | 
 | 564 | 		out->dma_length = size; | 
 | 565 |  | 
 | 566 | 		DBGA("    sg_fill: [%p,%lx] -> DAC %lx\n", | 
 | 567 | 		     __va(paddr), size, out->dma_address); | 
 | 568 |  | 
 | 569 | 		return 0; | 
 | 570 | 	} | 
 | 571 |  | 
 | 572 | 	/* Otherwise, we'll use the iommu to make the pages virtually | 
 | 573 | 	   contiguous.  */ | 
 | 574 |  | 
 | 575 | 	paddr &= ~PAGE_MASK; | 
| Joerg Roedel | eb117d3 | 2008-10-15 22:02:13 -0700 | [diff] [blame] | 576 | 	npages = iommu_num_pages(paddr, size, PAGE_SIZE); | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 577 | 	dma_ofs = iommu_arena_alloc(dev, arena, npages, 0); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 578 | 	if (dma_ofs < 0) { | 
 | 579 | 		/* If we attempted a direct map above but failed, die.  */ | 
 | 580 | 		if (leader->dma_address == 0) | 
 | 581 | 			return -1; | 
 | 582 |  | 
 | 583 | 		/* Otherwise, break up the remaining virtually contiguous | 
 | 584 | 		   hunks into individual direct maps and retry.  */ | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 585 | 		sg_classify(dev, leader, end, 0); | 
 | 586 | 		return sg_fill(dev, leader, end, out, arena, max_dma, dac_allowed); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 587 | 	} | 
 | 588 |  | 
 | 589 | 	out->dma_address = arena->dma_base + dma_ofs*PAGE_SIZE + paddr; | 
 | 590 | 	out->dma_length = size; | 
 | 591 |  | 
 | 592 | 	DBGA("    sg_fill: [%p,%lx] -> sg %lx np %ld\n", | 
 | 593 | 	     __va(paddr), size, out->dma_address, npages); | 
 | 594 |  | 
 | 595 | 	/* All virtually contiguous.  We need to find the length of each | 
 | 596 | 	   physically contiguous subsegment to fill in the ptes.  */ | 
 | 597 | 	ptes = &arena->ptes[dma_ofs]; | 
 | 598 | 	sg = leader; | 
 | 599 | 	do { | 
 | 600 | #if DEBUG_ALLOC > 0 | 
 | 601 | 		struct scatterlist *last_sg = sg; | 
 | 602 | #endif | 
 | 603 |  | 
 | 604 | 		size = sg->length; | 
 | 605 | 		paddr = SG_ENT_PHYS_ADDRESS(sg); | 
 | 606 |  | 
 | 607 | 		while (sg+1 < end && (int) sg[1].dma_address == -1) { | 
 | 608 | 			size += sg[1].length; | 
 | 609 | 			sg++; | 
 | 610 | 		} | 
 | 611 |  | 
| Joerg Roedel | eb117d3 | 2008-10-15 22:02:13 -0700 | [diff] [blame] | 612 | 		npages = iommu_num_pages(paddr, size, PAGE_SIZE); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 613 |  | 
 | 614 | 		paddr &= PAGE_MASK; | 
 | 615 | 		for (i = 0; i < npages; ++i, paddr += PAGE_SIZE) | 
 | 616 | 			*ptes++ = mk_iommu_pte(paddr); | 
 | 617 |  | 
 | 618 | #if DEBUG_ALLOC > 0 | 
 | 619 | 		DBGA("    (%ld) [%p,%x] np %ld\n", | 
 | 620 | 		     last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg), | 
 | 621 | 		     last_sg->length, npages); | 
 | 622 | 		while (++last_sg <= sg) { | 
 | 623 | 			DBGA("        (%ld) [%p,%x] cont\n", | 
 | 624 | 			     last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg), | 
 | 625 | 			     last_sg->length); | 
 | 626 | 		} | 
 | 627 | #endif | 
 | 628 | 	} while (++sg < end && (int) sg->dma_address < 0); | 
 | 629 |  | 
 | 630 | 	return 1; | 
 | 631 | } | 
 | 632 |  | 
 | 633 | int | 
 | 634 | pci_map_sg(struct pci_dev *pdev, struct scatterlist *sg, int nents, | 
 | 635 | 	   int direction) | 
 | 636 | { | 
 | 637 | 	struct scatterlist *start, *end, *out; | 
 | 638 | 	struct pci_controller *hose; | 
 | 639 | 	struct pci_iommu_arena *arena; | 
 | 640 | 	dma_addr_t max_dma; | 
 | 641 | 	int dac_allowed; | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 642 | 	struct device *dev; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 643 |  | 
 | 644 | 	if (direction == PCI_DMA_NONE) | 
 | 645 | 		BUG(); | 
 | 646 |  | 
 | 647 | 	dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0; | 
 | 648 |  | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 649 | 	dev = pdev ? &pdev->dev : NULL; | 
 | 650 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 651 | 	/* Fast path single entry scatterlists.  */ | 
 | 652 | 	if (nents == 1) { | 
 | 653 | 		sg->dma_length = sg->length; | 
 | 654 | 		sg->dma_address | 
 | 655 | 		  = pci_map_single_1(pdev, SG_ENT_VIRT_ADDRESS(sg), | 
 | 656 | 				     sg->length, dac_allowed); | 
 | 657 | 		return sg->dma_address != 0; | 
 | 658 | 	} | 
 | 659 |  | 
 | 660 | 	start = sg; | 
 | 661 | 	end = sg + nents; | 
 | 662 |  | 
 | 663 | 	/* First, prepare information about the entries.  */ | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 664 | 	sg_classify(dev, sg, end, alpha_mv.mv_pci_tbi != 0); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 665 |  | 
 | 666 | 	/* Second, figure out where we're going to map things.  */ | 
 | 667 | 	if (alpha_mv.mv_pci_tbi) { | 
 | 668 | 		hose = pdev ? pdev->sysdata : pci_isa_hose; | 
 | 669 | 		max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK; | 
 | 670 | 		arena = hose->sg_pci; | 
 | 671 | 		if (!arena || arena->dma_base + arena->size - 1 > max_dma) | 
 | 672 | 			arena = hose->sg_isa; | 
 | 673 | 	} else { | 
 | 674 | 		max_dma = -1; | 
 | 675 | 		arena = NULL; | 
 | 676 | 		hose = NULL; | 
 | 677 | 	} | 
 | 678 |  | 
 | 679 | 	/* Third, iterate over the scatterlist leaders and allocate | 
 | 680 | 	   dma space as needed.  */ | 
 | 681 | 	for (out = sg; sg < end; ++sg) { | 
 | 682 | 		if ((int) sg->dma_address < 0) | 
 | 683 | 			continue; | 
| FUJITA Tomonori | 7c53664 | 2008-02-04 22:27:58 -0800 | [diff] [blame] | 684 | 		if (sg_fill(dev, sg, end, out, arena, max_dma, dac_allowed) < 0) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 685 | 			goto error; | 
 | 686 | 		out++; | 
 | 687 | 	} | 
 | 688 |  | 
 | 689 | 	/* Mark the end of the list for pci_unmap_sg.  */ | 
 | 690 | 	if (out < end) | 
 | 691 | 		out->dma_length = 0; | 
 | 692 |  | 
 | 693 | 	if (out - start == 0) | 
 | 694 | 		printk(KERN_WARNING "pci_map_sg failed: no entries?\n"); | 
 | 695 | 	DBGA("pci_map_sg: %ld entries\n", out - start); | 
 | 696 |  | 
 | 697 | 	return out - start; | 
 | 698 |  | 
 | 699 |  error: | 
 | 700 | 	printk(KERN_WARNING "pci_map_sg failed: " | 
 | 701 | 	       "could not allocate dma page tables\n"); | 
 | 702 |  | 
 | 703 | 	/* Some allocation failed while mapping the scatterlist | 
 | 704 | 	   entries.  Unmap them now.  */ | 
 | 705 | 	if (out > start) | 
 | 706 | 		pci_unmap_sg(pdev, start, out - start, direction); | 
 | 707 | 	return 0; | 
 | 708 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 709 | EXPORT_SYMBOL(pci_map_sg); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 710 |  | 
 | 711 | /* Unmap a set of streaming mode DMA translations.  Again, cpu read | 
 | 712 |    rules concerning calls here are the same as for pci_unmap_single() | 
 | 713 |    above.  */ | 
 | 714 |  | 
 | 715 | void | 
 | 716 | pci_unmap_sg(struct pci_dev *pdev, struct scatterlist *sg, int nents, | 
 | 717 | 	     int direction) | 
 | 718 | { | 
 | 719 | 	unsigned long flags; | 
 | 720 | 	struct pci_controller *hose; | 
 | 721 | 	struct pci_iommu_arena *arena; | 
 | 722 | 	struct scatterlist *end; | 
 | 723 | 	dma_addr_t max_dma; | 
 | 724 | 	dma_addr_t fbeg, fend; | 
 | 725 |  | 
 | 726 | 	if (direction == PCI_DMA_NONE) | 
 | 727 | 		BUG(); | 
 | 728 |  | 
 | 729 | 	if (! alpha_mv.mv_pci_tbi) | 
 | 730 | 		return; | 
 | 731 |  | 
 | 732 | 	hose = pdev ? pdev->sysdata : pci_isa_hose; | 
 | 733 | 	max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK; | 
 | 734 | 	arena = hose->sg_pci; | 
 | 735 | 	if (!arena || arena->dma_base + arena->size - 1 > max_dma) | 
 | 736 | 		arena = hose->sg_isa; | 
 | 737 |  | 
 | 738 | 	fbeg = -1, fend = 0; | 
 | 739 |  | 
 | 740 | 	spin_lock_irqsave(&arena->lock, flags); | 
 | 741 |  | 
 | 742 | 	for (end = sg + nents; sg < end; ++sg) { | 
 | 743 | 		dma64_addr_t addr; | 
 | 744 | 		size_t size; | 
 | 745 | 		long npages, ofs; | 
 | 746 | 		dma_addr_t tend; | 
 | 747 |  | 
 | 748 | 		addr = sg->dma_address; | 
 | 749 | 		size = sg->dma_length; | 
 | 750 | 		if (!size) | 
 | 751 | 			break; | 
 | 752 |  | 
 | 753 | 		if (addr > 0xffffffff) { | 
 | 754 | 			/* It's a DAC address -- nothing to do.  */ | 
 | 755 | 			DBGA("    (%ld) DAC [%lx,%lx]\n", | 
 | 756 | 			      sg - end + nents, addr, size); | 
 | 757 | 			continue; | 
 | 758 | 		} | 
 | 759 |  | 
 | 760 | 		if (addr >= __direct_map_base | 
 | 761 | 		    && addr < __direct_map_base + __direct_map_size) { | 
 | 762 | 			/* Nothing to do.  */ | 
 | 763 | 			DBGA("    (%ld) direct [%lx,%lx]\n", | 
 | 764 | 			      sg - end + nents, addr, size); | 
 | 765 | 			continue; | 
 | 766 | 		} | 
 | 767 |  | 
 | 768 | 		DBGA("    (%ld) sg [%lx,%lx]\n", | 
 | 769 | 		     sg - end + nents, addr, size); | 
 | 770 |  | 
| Joerg Roedel | eb117d3 | 2008-10-15 22:02:13 -0700 | [diff] [blame] | 771 | 		npages = iommu_num_pages(addr, size, PAGE_SIZE); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 772 | 		ofs = (addr - arena->dma_base) >> PAGE_SHIFT; | 
 | 773 | 		iommu_arena_free(arena, ofs, npages); | 
 | 774 |  | 
 | 775 | 		tend = addr + size - 1; | 
 | 776 | 		if (fbeg > addr) fbeg = addr; | 
 | 777 | 		if (fend < tend) fend = tend; | 
 | 778 | 	} | 
 | 779 |  | 
 | 780 |         /* If we're freeing ptes above the `next_entry' pointer (they | 
 | 781 |            may have snuck back into the TLB since the last wrap flush), | 
 | 782 |            we need to flush the TLB before reallocating the latter.  */ | 
 | 783 | 	if ((fend - arena->dma_base) >> PAGE_SHIFT >= arena->next_entry) | 
 | 784 | 		alpha_mv.mv_pci_tbi(hose, fbeg, fend); | 
 | 785 |  | 
 | 786 | 	spin_unlock_irqrestore(&arena->lock, flags); | 
 | 787 |  | 
 | 788 | 	DBGA("pci_unmap_sg: %ld entries\n", nents - (end - sg)); | 
 | 789 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 790 | EXPORT_SYMBOL(pci_unmap_sg); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 791 |  | 
 | 792 |  | 
 | 793 | /* Return whether the given PCI device DMA address mask can be | 
 | 794 |    supported properly.  */ | 
 | 795 |  | 
 | 796 | int | 
 | 797 | pci_dma_supported(struct pci_dev *pdev, u64 mask) | 
 | 798 | { | 
 | 799 | 	struct pci_controller *hose; | 
 | 800 | 	struct pci_iommu_arena *arena; | 
 | 801 |  | 
 | 802 | 	/* If there exists a direct map, and the mask fits either | 
 | 803 | 	   the entire direct mapped space or the total system memory as | 
 | 804 | 	   shifted by the map base */ | 
 | 805 | 	if (__direct_map_size != 0 | 
 | 806 | 	    && (__direct_map_base + __direct_map_size - 1 <= mask || | 
 | 807 | 		__direct_map_base + (max_low_pfn << PAGE_SHIFT) - 1 <= mask)) | 
 | 808 | 		return 1; | 
 | 809 |  | 
 | 810 | 	/* Check that we have a scatter-gather arena that fits.  */ | 
 | 811 | 	hose = pdev ? pdev->sysdata : pci_isa_hose; | 
 | 812 | 	arena = hose->sg_isa; | 
 | 813 | 	if (arena && arena->dma_base + arena->size - 1 <= mask) | 
 | 814 | 		return 1; | 
 | 815 | 	arena = hose->sg_pci; | 
 | 816 | 	if (arena && arena->dma_base + arena->size - 1 <= mask) | 
 | 817 | 		return 1; | 
 | 818 |  | 
 | 819 | 	/* As last resort try ZONE_DMA.  */ | 
 | 820 | 	if (!__direct_map_base && MAX_DMA_ADDRESS - IDENT_ADDR - 1 <= mask) | 
 | 821 | 		return 1; | 
 | 822 |  | 
 | 823 | 	return 0; | 
 | 824 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 825 | EXPORT_SYMBOL(pci_dma_supported); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 826 |  | 
 | 827 |  | 
 | 828 | /* | 
 | 829 |  * AGP GART extensions to the IOMMU | 
 | 830 |  */ | 
 | 831 | int | 
 | 832 | iommu_reserve(struct pci_iommu_arena *arena, long pg_count, long align_mask)  | 
 | 833 | { | 
 | 834 | 	unsigned long flags; | 
 | 835 | 	unsigned long *ptes; | 
 | 836 | 	long i, p; | 
 | 837 |  | 
 | 838 | 	if (!arena) return -EINVAL; | 
 | 839 |  | 
 | 840 | 	spin_lock_irqsave(&arena->lock, flags); | 
 | 841 |  | 
 | 842 | 	/* Search for N empty ptes.  */ | 
 | 843 | 	ptes = arena->ptes; | 
| FUJITA Tomonori | cf54014 | 2008-03-04 14:28:57 -0800 | [diff] [blame] | 844 | 	p = iommu_arena_find_pages(NULL, arena, pg_count, align_mask); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 845 | 	if (p < 0) { | 
 | 846 | 		spin_unlock_irqrestore(&arena->lock, flags); | 
 | 847 | 		return -1; | 
 | 848 | 	} | 
 | 849 |  | 
 | 850 | 	/* Success.  Mark them all reserved (ie not zero and invalid) | 
 | 851 | 	   for the iommu tlb that could load them from under us. | 
 | 852 | 	   They will be filled in with valid bits by _bind() */ | 
 | 853 | 	for (i = 0; i < pg_count; ++i) | 
 | 854 | 		ptes[p+i] = IOMMU_RESERVED_PTE; | 
 | 855 |  | 
 | 856 | 	arena->next_entry = p + pg_count; | 
 | 857 | 	spin_unlock_irqrestore(&arena->lock, flags); | 
 | 858 |  | 
 | 859 | 	return p; | 
 | 860 | } | 
 | 861 |  | 
 | 862 | int  | 
 | 863 | iommu_release(struct pci_iommu_arena *arena, long pg_start, long pg_count) | 
 | 864 | { | 
 | 865 | 	unsigned long *ptes; | 
 | 866 | 	long i; | 
 | 867 |  | 
 | 868 | 	if (!arena) return -EINVAL; | 
 | 869 |  | 
 | 870 | 	ptes = arena->ptes; | 
 | 871 |  | 
 | 872 | 	/* Make sure they're all reserved first... */ | 
 | 873 | 	for(i = pg_start; i < pg_start + pg_count; i++) | 
 | 874 | 		if (ptes[i] != IOMMU_RESERVED_PTE) | 
 | 875 | 			return -EBUSY; | 
 | 876 |  | 
 | 877 | 	iommu_arena_free(arena, pg_start, pg_count); | 
 | 878 | 	return 0; | 
 | 879 | } | 
 | 880 |  | 
 | 881 | int | 
 | 882 | iommu_bind(struct pci_iommu_arena *arena, long pg_start, long pg_count,  | 
 | 883 | 	   unsigned long *physaddrs) | 
 | 884 | { | 
 | 885 | 	unsigned long flags; | 
 | 886 | 	unsigned long *ptes; | 
 | 887 | 	long i, j; | 
 | 888 |  | 
 | 889 | 	if (!arena) return -EINVAL; | 
 | 890 | 	 | 
 | 891 | 	spin_lock_irqsave(&arena->lock, flags); | 
 | 892 |  | 
 | 893 | 	ptes = arena->ptes; | 
 | 894 |  | 
 | 895 | 	for(j = pg_start; j < pg_start + pg_count; j++) { | 
 | 896 | 		if (ptes[j] != IOMMU_RESERVED_PTE) { | 
 | 897 | 			spin_unlock_irqrestore(&arena->lock, flags); | 
 | 898 | 			return -EBUSY; | 
 | 899 | 		} | 
 | 900 | 	} | 
 | 901 | 		 | 
 | 902 | 	for(i = 0, j = pg_start; i < pg_count; i++, j++) | 
 | 903 | 		ptes[j] = mk_iommu_pte(physaddrs[i]); | 
 | 904 |  | 
 | 905 | 	spin_unlock_irqrestore(&arena->lock, flags); | 
 | 906 |  | 
 | 907 | 	return 0; | 
 | 908 | } | 
 | 909 |  | 
 | 910 | int | 
 | 911 | iommu_unbind(struct pci_iommu_arena *arena, long pg_start, long pg_count) | 
 | 912 | { | 
 | 913 | 	unsigned long *p; | 
 | 914 | 	long i; | 
 | 915 |  | 
 | 916 | 	if (!arena) return -EINVAL; | 
 | 917 |  | 
 | 918 | 	p = arena->ptes + pg_start; | 
 | 919 | 	for(i = 0; i < pg_count; i++) | 
 | 920 | 		p[i] = IOMMU_RESERVED_PTE; | 
 | 921 |  | 
 | 922 | 	return 0; | 
 | 923 | } | 
 | 924 |  | 
 | 925 | /* True if the machine supports DAC addressing, and DEV can | 
 | 926 |    make use of it given MASK.  */ | 
 | 927 |  | 
| Jan Beulich | caa5171 | 2007-07-09 11:55:51 -0700 | [diff] [blame] | 928 | static int | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 929 | pci_dac_dma_supported(struct pci_dev *dev, u64 mask) | 
 | 930 | { | 
 | 931 | 	dma64_addr_t dac_offset = alpha_mv.pci_dac_offset; | 
 | 932 | 	int ok = 1; | 
 | 933 |  | 
 | 934 | 	/* If this is not set, the machine doesn't support DAC at all.  */ | 
 | 935 | 	if (dac_offset == 0) | 
 | 936 | 		ok = 0; | 
 | 937 |  | 
 | 938 | 	/* The device has to be able to address our DAC bit.  */ | 
 | 939 | 	if ((dac_offset & dev->dma_mask) != dac_offset) | 
 | 940 | 		ok = 0; | 
 | 941 |  | 
 | 942 | 	/* If both conditions above are met, we are fine. */ | 
 | 943 | 	DBGA("pci_dac_dma_supported %s from %p\n", | 
 | 944 | 	     ok ? "yes" : "no", __builtin_return_address(0)); | 
 | 945 |  | 
 | 946 | 	return ok; | 
 | 947 | } | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 948 |  | 
 | 949 | /* Helper for generic DMA-mapping functions. */ | 
 | 950 |  | 
 | 951 | struct pci_dev * | 
 | 952 | alpha_gendev_to_pci(struct device *dev) | 
 | 953 | { | 
 | 954 | 	if (dev && dev->bus == &pci_bus_type) | 
 | 955 | 		return to_pci_dev(dev); | 
 | 956 |  | 
 | 957 | 	/* Assume that non-PCI devices asking for DMA are either ISA or EISA, | 
 | 958 | 	   BUG() otherwise. */ | 
 | 959 | 	BUG_ON(!isa_bridge); | 
 | 960 |  | 
 | 961 | 	/* Assume non-busmaster ISA DMA when dma_mask is not set (the ISA | 
 | 962 | 	   bridge is bus master then). */ | 
 | 963 | 	if (!dev || !dev->dma_mask || !*dev->dma_mask) | 
 | 964 | 		return isa_bridge; | 
 | 965 |  | 
 | 966 | 	/* For EISA bus masters, return isa_bridge (it might have smaller | 
 | 967 | 	   dma_mask due to wiring limitations). */ | 
 | 968 | 	if (*dev->dma_mask >= isa_bridge->dma_mask) | 
 | 969 | 		return isa_bridge; | 
 | 970 |  | 
 | 971 | 	/* This assumes ISA bus master with dma_mask 0xffffff. */ | 
 | 972 | 	return NULL; | 
 | 973 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 974 | EXPORT_SYMBOL(alpha_gendev_to_pci); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 975 |  | 
 | 976 | int | 
 | 977 | dma_set_mask(struct device *dev, u64 mask) | 
 | 978 | { | 
 | 979 | 	if (!dev->dma_mask || | 
 | 980 | 	    !pci_dma_supported(alpha_gendev_to_pci(dev), mask)) | 
 | 981 | 		return -EIO; | 
 | 982 |  | 
 | 983 | 	*dev->dma_mask = mask; | 
 | 984 |  | 
 | 985 | 	return 0; | 
 | 986 | } | 
| Al Viro | cff52da | 2006-10-11 17:40:22 +0100 | [diff] [blame] | 987 | EXPORT_SYMBOL(dma_set_mask); |