// SPDX-License-Identifier: GPL-2.0
/*
 *	linux/arch/alpha/kernel/pci_iommu.c
 */

#include <linux/kernel.h>
#include <linux/mm.h>
#include <linux/pci.h>
#include <linux/gfp.h>
#include <linux/memblock.h>
#include <linux/export.h>
#include <linux/scatterlist.h>
#include <linux/log2.h>
#include <linux/dma-map-ops.h>
#include <linux/iommu-helper.h>

#include <asm/io.h>
#include <asm/hwrpb.h>

#include "proto.h"
#include "pci_impl.h"


#define DEBUG_ALLOC 0
#if DEBUG_ALLOC > 0
# define DBGA(args...)		printk(KERN_DEBUG args)
#else
# define DBGA(args...)
#endif
#if DEBUG_ALLOC > 1
# define DBGA2(args...)		printk(KERN_DEBUG args)
#else
# define DBGA2(args...)
#endif

#define DEBUG_NODIRECT 0

#define ISA_DMA_MASK		0x00ffffff

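/* Build a scatter-gather PTE for the IOMMU window: the page frame
   number goes in bits 1 and up, with the valid bit in bit 0.  Callers
   pass a page-aligned physical address.  */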
static inline unsigned long
mk_iommu_pte(unsigned long paddr)
{
	return (paddr >> (PAGE_SHIFT-1)) | 1;
}

/* Return the minimum of MAX and the first power of two not smaller
   than main memory.  */

unsigned long
size_for_memory(unsigned long max)
{
	unsigned long mem = max_low_pfn << PAGE_SHIFT;
	if (mem < max)
		max = roundup_pow_of_two(mem);
	return max;
}

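/* Set up a translation arena covering a WINDOW_SIZE byte DMA window
   at bus address BASE: one scatter-gather PTE (an unsigned long) per
   IOMMU page, with the PTE table aligned as the hardware requires.  */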
struct pci_iommu_arena * __init
iommu_arena_new_node(int nid, struct pci_controller *hose, dma_addr_t base,
		     unsigned long window_size, unsigned long align)
{
	unsigned long mem_size;
	struct pci_iommu_arena *arena;

	mem_size = window_size / (PAGE_SIZE / sizeof(unsigned long));

	/* Note that the TLB lookup logic uses bitwise concatenation,
	   not addition, so the required arena alignment is based on
	   the size of the window.  Retain the align parameter so that
	   particular systems can over-align the arena.  */
	if (align < mem_size)
		align = mem_size;

	arena = memblock_alloc(sizeof(*arena), SMP_CACHE_BYTES);
	if (!arena)
		panic("%s: Failed to allocate %zu bytes\n", __func__,
		      sizeof(*arena));
	arena->ptes = memblock_alloc(mem_size, align);
	if (!arena->ptes)
		panic("%s: Failed to allocate %lu bytes align=0x%lx\n",
		      __func__, mem_size, align);

	spin_lock_init(&arena->lock);
	arena->hose = hose;
	arena->dma_base = base;
	arena->size = window_size;
	arena->next_entry = 0;

	/* Align allocations to a multiple of a page size.  Not needed
	   unless there are chip bugs.  */
	arena->align_entry = 1;

	return arena;
}

struct pci_iommu_arena * __init
iommu_arena_new(struct pci_controller *hose, dma_addr_t base,
		unsigned long window_size, unsigned long align)
{
	return iommu_arena_new_node(0, hose, base, window_size, align);
}

/* Must be called with the arena lock held */
static long
iommu_arena_find_pages(struct device *dev, struct pci_iommu_arena *arena,
		       long n, long mask)
{
	unsigned long *ptes;
	long i, p, nent;
	int pass = 0;
	unsigned long base;
	unsigned long boundary_size;

	base = arena->dma_base >> PAGE_SHIFT;
	boundary_size = dma_get_seg_boundary_nr_pages(dev, PAGE_SHIFT);

	/* Search forward for the first mask-aligned sequence of N free ptes */
	ptes = arena->ptes;
	nent = arena->size >> PAGE_SHIFT;
	p = ALIGN(arena->next_entry, mask + 1);
	i = 0;

again:
	while (i < n && p+i < nent) {
		if (!i && iommu_is_span_boundary(p, n, base, boundary_size)) {
			p = ALIGN(p + 1, mask + 1);
			goto again;
		}

		if (ptes[p+i]) {
			p = ALIGN(p + i + 1, mask + 1);
			i = 0;
		} else {
			i = i + 1;
		}
	}

	if (i < n) {
		if (pass < 1) {
			/*
			 * Reached the end.  Flush the TLB and restart
			 * the search from the beginning.
			 */
			alpha_mv.mv_pci_tbi(arena->hose, 0, -1);

			pass++;
			p = 0;
			i = 0;
			goto again;
		} else
			return -1;
	}

	/* Success. It's the responsibility of the caller to mark them
	   in use before releasing the lock */
	return p;
}

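/* Allocate N consecutive entries from the arena, aligned as requested.
   Returns the index of the first entry, or -1 if no run of N free
   entries can be found even after a TLB flush and rescan.  */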
static long
iommu_arena_alloc(struct device *dev, struct pci_iommu_arena *arena, long n,
		  unsigned int align)
{
	unsigned long flags;
	unsigned long *ptes;
	long i, p, mask;

	spin_lock_irqsave(&arena->lock, flags);

	/* Search for N empty ptes */
	ptes = arena->ptes;
	mask = max(align, arena->align_entry) - 1;
	p = iommu_arena_find_pages(dev, arena, n, mask);
	if (p < 0) {
		spin_unlock_irqrestore(&arena->lock, flags);
		return -1;
	}

	/* Success.  Mark them all in use, i.e. not zero and invalid
	   for the iommu tlb that could load them from under us.
	   The chip-specific bits will fill this in with something
	   kosher when we return.  */
	for (i = 0; i < n; ++i)
		ptes[p+i] = IOMMU_INVALID_PTE;

	arena->next_entry = p + n;
	spin_unlock_irqrestore(&arena->lock, flags);

	return p;
}

static void
iommu_arena_free(struct pci_iommu_arena *arena, long ofs, long n)
{
	unsigned long *p;
	long i;

	p = arena->ptes + ofs;
	for (i = 0; i < n; ++i)
		p[i] = 0;
}

/*
 * True if the machine supports DAC addressing, and DEV can
 * make use of it given MASK.
 */
static int pci_dac_dma_supported(struct pci_dev *dev, u64 mask)
{
	dma_addr_t dac_offset = alpha_mv.pci_dac_offset;
	int ok = 1;

	/* If this is not set, the machine doesn't support DAC at all.  */
	if (dac_offset == 0)
		ok = 0;

	/* The device has to be able to address our DAC bit.  */
	if ((dac_offset & dev->dma_mask) != dac_offset)
		ok = 0;

	/* If both conditions above are met, we are fine. */
	DBGA("pci_dac_dma_supported %s from %ps\n",
	     ok ? "yes" : "no", __builtin_return_address(0));

	return ok;
}

/* Map a single buffer of the indicated size for PCI DMA in streaming
   mode.  The 32-bit PCI bus mastering address to use is returned.
   Once the device is given the dma address, the device owns this memory
   until either pci_unmap_single or pci_dma_sync_single is performed.  */

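/* Strategy: try the direct-map window first, then DAC addressing if
   the caller allowed it, and finally allocate scatter-gather ptes from
   the controller's sg arena.  Drivers reach this path through the
   dma_map_ops at the bottom of this file; e.g. dma_map_single() ends
   up in alpha_pci_map_page(), which calls here.  */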
static dma_addr_t
pci_map_single_1(struct pci_dev *pdev, void *cpu_addr, size_t size,
		 int dac_allowed)
{
	struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose;
	dma_addr_t max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
	struct pci_iommu_arena *arena;
	long npages, dma_ofs, i;
	unsigned long paddr;
	dma_addr_t ret;
	unsigned int align = 0;
	struct device *dev = pdev ? &pdev->dev : NULL;

	paddr = __pa(cpu_addr);

#if !DEBUG_NODIRECT
	/* First check to see if we can use the direct map window.  */
	if (paddr + size + __direct_map_base - 1 <= max_dma
	    && paddr + size <= __direct_map_size) {
		ret = paddr + __direct_map_base;

		DBGA2("pci_map_single: [%p,%zx] -> direct %llx from %ps\n",
		      cpu_addr, size, ret, __builtin_return_address(0));

		return ret;
	}
#endif

	/* Next, use DAC if selected earlier.  */
	if (dac_allowed) {
		ret = paddr + alpha_mv.pci_dac_offset;

		DBGA2("pci_map_single: [%p,%zx] -> DAC %llx from %ps\n",
		      cpu_addr, size, ret, __builtin_return_address(0));

		return ret;
	}

	/* If the machine doesn't define a pci_tbi routine, we have to
	   assume it doesn't support sg mapping, and, since we tried to
	   use direct_map above, it now must be considered an error. */
	if (! alpha_mv.mv_pci_tbi) {
		printk_once(KERN_WARNING "pci_map_single: no HW sg\n");
		return DMA_MAPPING_ERROR;
	}

	arena = hose->sg_pci;
	if (!arena || arena->dma_base + arena->size - 1 > max_dma)
		arena = hose->sg_isa;

	npages = iommu_num_pages(paddr, size, PAGE_SIZE);

	/* Force allocation to 64KB boundary for ISA bridges. */
	if (pdev && pdev == isa_bridge)
		align = 8;
	dma_ofs = iommu_arena_alloc(dev, arena, npages, align);
	if (dma_ofs < 0) {
		printk(KERN_WARNING "pci_map_single failed: "
		       "could not allocate dma page tables\n");
		return DMA_MAPPING_ERROR;
	}

	paddr &= PAGE_MASK;
	for (i = 0; i < npages; ++i, paddr += PAGE_SIZE)
		arena->ptes[i + dma_ofs] = mk_iommu_pte(paddr);

	ret = arena->dma_base + dma_ofs * PAGE_SIZE;
	ret += (unsigned long)cpu_addr & ~PAGE_MASK;

	DBGA2("pci_map_single: [%p,%zx] np %ld -> sg %llx from %ps\n",
	      cpu_addr, size, npages, ret, __builtin_return_address(0));

	return ret;
}

/* Helper for generic DMA-mapping functions. */
static struct pci_dev *alpha_gendev_to_pci(struct device *dev)
{
	if (dev && dev_is_pci(dev))
		return to_pci_dev(dev);

	/* Assume that non-PCI devices asking for DMA are either ISA or EISA,
	   BUG() otherwise. */
	BUG_ON(!isa_bridge);

	/* Assume non-busmaster ISA DMA when dma_mask is not set (the ISA
	   bridge is bus master then). */
	if (!dev || !dev->dma_mask || !*dev->dma_mask)
		return isa_bridge;

	/* For EISA bus masters, return isa_bridge (it might have smaller
	   dma_mask due to wiring limitations). */
	if (*dev->dma_mask >= isa_bridge->dma_mask)
		return isa_bridge;

	/* This assumes ISA bus master with dma_mask 0xffffff. */
	return NULL;
}

static dma_addr_t alpha_pci_map_page(struct device *dev, struct page *page,
				     unsigned long offset, size_t size,
				     enum dma_data_direction dir,
				     unsigned long attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	int dac_allowed;

	BUG_ON(dir == DMA_NONE);

	dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;
	return pci_map_single_1(pdev, (char *)page_address(page) + offset,
				size, dac_allowed);
}

/* Unmap a single streaming mode DMA translation.  The DMA_ADDR and
   SIZE must match what was provided in a previous pci_map_single
   call.  All other usages are undefined.  After this call, reads by
   the cpu to the buffer are guaranteed to see whatever the device
   wrote there.  */

static void alpha_pci_unmap_page(struct device *dev, dma_addr_t dma_addr,
				 size_t size, enum dma_data_direction dir,
				 unsigned long attrs)
{
	unsigned long flags;
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose;
	struct pci_iommu_arena *arena;
	long dma_ofs, npages;

	BUG_ON(dir == DMA_NONE);

	if (dma_addr >= __direct_map_base
	    && dma_addr < __direct_map_base + __direct_map_size) {
		/* Nothing to do.  */

		DBGA2("pci_unmap_single: direct [%llx,%zx] from %ps\n",
		      dma_addr, size, __builtin_return_address(0));

		return;
	}

	if (dma_addr > 0xffffffff) {
		DBGA2("pci64_unmap_single: DAC [%llx,%zx] from %ps\n",
		      dma_addr, size, __builtin_return_address(0));
		return;
	}

	arena = hose->sg_pci;
	if (!arena || dma_addr < arena->dma_base)
		arena = hose->sg_isa;

	dma_ofs = (dma_addr - arena->dma_base) >> PAGE_SHIFT;
	if (dma_ofs * PAGE_SIZE >= arena->size) {
		printk(KERN_ERR "Bogus pci_unmap_single: dma_addr %llx"
		       " base %llx size %x\n",
		       dma_addr, arena->dma_base, arena->size);
		return;
		BUG();
	}

	npages = iommu_num_pages(dma_addr, size, PAGE_SIZE);

	spin_lock_irqsave(&arena->lock, flags);

	iommu_arena_free(arena, dma_ofs, npages);

	/* If we're freeing ptes above the `next_entry' pointer (they
	   may have snuck back into the TLB since the last wrap flush),
	   we need to flush the TLB before reallocating the latter.  */
	if (dma_ofs >= arena->next_entry)
		alpha_mv.mv_pci_tbi(hose, dma_addr, dma_addr + size - 1);

	spin_unlock_irqrestore(&arena->lock, flags);

	DBGA2("pci_unmap_single: sg [%llx,%zx] np %ld from %ps\n",
	      dma_addr, size, npages, __builtin_return_address(0));
}

/* Allocate and map kernel buffer using consistent mode DMA for PCI
   device.  Returns non-NULL cpu-view pointer to the buffer if
   successful and sets *DMA_ADDRP to the pci side dma address as well,
   else DMA_ADDRP is undefined.  */

static void *alpha_pci_alloc_coherent(struct device *dev, size_t size,
				      dma_addr_t *dma_addrp, gfp_t gfp,
				      unsigned long attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	void *cpu_addr;
	long order = get_order(size);

	gfp &= ~GFP_DMA;

try_again:
	cpu_addr = (void *)__get_free_pages(gfp | __GFP_ZERO, order);
	if (! cpu_addr) {
		printk(KERN_INFO "pci_alloc_consistent: "
		       "get_free_pages failed from %ps\n",
			__builtin_return_address(0));
		/* ??? Really atomic allocation?  Otherwise we could play
		   with vmalloc and sg if we can't find contiguous memory.  */
		return NULL;
	}
	memset(cpu_addr, 0, size);

	*dma_addrp = pci_map_single_1(pdev, cpu_addr, size, 0);
	if (*dma_addrp == DMA_MAPPING_ERROR) {
		free_pages((unsigned long)cpu_addr, order);
		if (alpha_mv.mv_pci_tbi || (gfp & GFP_DMA))
			return NULL;
		/* The address doesn't fit required mask and we
		   do not have iommu. Try again with GFP_DMA. */
		gfp |= GFP_DMA;
		goto try_again;
	}

	DBGA2("pci_alloc_consistent: %zx -> [%p,%llx] from %ps\n",
	      size, cpu_addr, *dma_addrp, __builtin_return_address(0));

	return cpu_addr;
}

/* Free and unmap a consistent DMA buffer.  CPU_ADDR and DMA_ADDR must
   be values that were returned from pci_alloc_consistent.  SIZE must
   be the same as what was passed into pci_alloc_consistent.
   References to the memory and mappings associated with CPU_ADDR or
   DMA_ADDR past this call are illegal.  */

static void alpha_pci_free_coherent(struct device *dev, size_t size,
				    void *cpu_addr, dma_addr_t dma_addr,
				    unsigned long attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	dma_unmap_single(&pdev->dev, dma_addr, size, DMA_BIDIRECTIONAL);
	free_pages((unsigned long)cpu_addr, get_order(size));

	DBGA2("pci_free_consistent: [%llx,%zx] from %ps\n",
	      dma_addr, size, __builtin_return_address(0));
}

/* Classify the elements of the scatterlist.  Write dma_address
   of each element with:
	0   : Followers all physically adjacent.
	1   : Followers all virtually adjacent.
	-1  : Not leader, physically adjacent to previous.
	-2  : Not leader, virtually adjacent to previous.
   Write dma_length of each leader with the combined lengths of
   the mergeable followers.  */

#define SG_ENT_VIRT_ADDRESS(SG) (sg_virt((SG)))
#define SG_ENT_PHYS_ADDRESS(SG) __pa(SG_ENT_VIRT_ADDRESS(SG))

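/* For example, three physically adjacent entries are marked 0, -1, -1
   and the leader's dma_length covers all three.  An entry that is not
   physically contiguous but starts on a page boundary while the
   previous one ends on a page boundary is marked -2, and its leader's
   dma_address becomes 1 (virtually mergeable via the IOMMU).  Merging
   also stops at the device's maximum segment size.  */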
static void
sg_classify(struct device *dev, struct scatterlist *sg, struct scatterlist *end,
	    int virt_ok)
{
	unsigned long next_paddr;
	struct scatterlist *leader;
	long leader_flag, leader_length;
	unsigned int max_seg_size;

	leader = sg;
	leader_flag = 0;
	leader_length = leader->length;
	next_paddr = SG_ENT_PHYS_ADDRESS(leader) + leader_length;

	/* We will not merge sg entries without a device.  */
	max_seg_size = dev ? dma_get_max_seg_size(dev) : 0;
	for (++sg; sg < end; ++sg) {
		unsigned long addr, len;
		addr = SG_ENT_PHYS_ADDRESS(sg);
		len = sg->length;

		if (leader_length + len > max_seg_size)
			goto new_segment;

		if (next_paddr == addr) {
			sg->dma_address = -1;
			leader_length += len;
		} else if (((next_paddr | addr) & ~PAGE_MASK) == 0 && virt_ok) {
			sg->dma_address = -2;
			leader_flag = 1;
			leader_length += len;
		} else {
new_segment:
			leader->dma_address = leader_flag;
			leader->dma_length = leader_length;
			leader = sg;
			leader_flag = 0;
			leader_length = len;
		}

		next_paddr = addr + len;
	}

	leader->dma_address = leader_flag;
	leader->dma_length = leader_length;
}

/* Given a scatterlist leader, choose an allocation method and fill
   in the blanks.  */

static int
sg_fill(struct device *dev, struct scatterlist *leader, struct scatterlist *end,
	struct scatterlist *out, struct pci_iommu_arena *arena,
	dma_addr_t max_dma, int dac_allowed)
{
	unsigned long paddr = SG_ENT_PHYS_ADDRESS(leader);
	long size = leader->dma_length;
	struct scatterlist *sg;
	unsigned long *ptes;
	long npages, dma_ofs, i;

#if !DEBUG_NODIRECT
	/* If everything is physically contiguous, and the addresses
	   fall into the direct-map window, use it.  */
	if (leader->dma_address == 0
	    && paddr + size + __direct_map_base - 1 <= max_dma
	    && paddr + size <= __direct_map_size) {
		out->dma_address = paddr + __direct_map_base;
		out->dma_length = size;

		DBGA("    sg_fill: [%p,%lx] -> direct %llx\n",
		     __va(paddr), size, out->dma_address);

		return 0;
	}
#endif

	/* If physically contiguous and DAC is available, use it.  */
	if (leader->dma_address == 0 && dac_allowed) {
		out->dma_address = paddr + alpha_mv.pci_dac_offset;
		out->dma_length = size;

		DBGA("    sg_fill: [%p,%lx] -> DAC %llx\n",
		     __va(paddr), size, out->dma_address);

		return 0;
	}

	/* Otherwise, we'll use the iommu to make the pages virtually
	   contiguous.  */

	paddr &= ~PAGE_MASK;
	npages = iommu_num_pages(paddr, size, PAGE_SIZE);
	dma_ofs = iommu_arena_alloc(dev, arena, npages, 0);
	if (dma_ofs < 0) {
		/* If we attempted a direct map above but failed, give up.  */
		if (leader->dma_address == 0)
			return -1;

		/* Otherwise, break up the remaining virtually contiguous
		   hunks into individual direct maps and retry.  */
		sg_classify(dev, leader, end, 0);
		return sg_fill(dev, leader, end, out, arena, max_dma, dac_allowed);
	}

	out->dma_address = arena->dma_base + dma_ofs*PAGE_SIZE + paddr;
	out->dma_length = size;

	DBGA("    sg_fill: [%p,%lx] -> sg %llx np %ld\n",
	     __va(paddr), size, out->dma_address, npages);

	/* All virtually contiguous.  We need to find the length of each
	   physically contiguous subsegment to fill in the ptes.  */
	ptes = &arena->ptes[dma_ofs];
	sg = leader;
	do {
#if DEBUG_ALLOC > 0
		struct scatterlist *last_sg = sg;
#endif

		size = sg->length;
		paddr = SG_ENT_PHYS_ADDRESS(sg);

		while (sg+1 < end && (int) sg[1].dma_address == -1) {
			size += sg[1].length;
			sg = sg_next(sg);
		}

		npages = iommu_num_pages(paddr, size, PAGE_SIZE);

		paddr &= PAGE_MASK;
		for (i = 0; i < npages; ++i, paddr += PAGE_SIZE)
			*ptes++ = mk_iommu_pte(paddr);

#if DEBUG_ALLOC > 0
		DBGA("    (%ld) [%p,%x] np %ld\n",
		     last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg),
		     last_sg->length, npages);
		while (++last_sg <= sg) {
			DBGA("        (%ld) [%p,%x] cont\n",
			     last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg),
			     last_sg->length);
		}
#endif
	} while (++sg < end && (int) sg->dma_address < 0);

	return 1;
}

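/* Map a scatterlist in three passes: classify the entries into
   mergeable runs, pick the arena that fits the device's dma_mask,
   then have sg_fill() map each run leader (direct, DAC, or through
   the IOMMU).  Followers were already folded into their leader's
   dma_length by sg_classify().  */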
static int alpha_pci_map_sg(struct device *dev, struct scatterlist *sg,
			    int nents, enum dma_data_direction dir,
			    unsigned long attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	struct scatterlist *start, *end, *out;
	struct pci_controller *hose;
	struct pci_iommu_arena *arena;
	dma_addr_t max_dma;
	int dac_allowed;

	BUG_ON(dir == DMA_NONE);

	dac_allowed = dev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;

	/* Fast path single entry scatterlists.  */
	if (nents == 1) {
		sg->dma_length = sg->length;
		sg->dma_address
		  = pci_map_single_1(pdev, SG_ENT_VIRT_ADDRESS(sg),
				     sg->length, dac_allowed);
		if (sg->dma_address == DMA_MAPPING_ERROR)
			return -EIO;
		return 1;
	}

	start = sg;
	end = sg + nents;

	/* First, prepare information about the entries.  */
	sg_classify(dev, sg, end, alpha_mv.mv_pci_tbi != 0);

	/* Second, figure out where we're going to map things.  */
	if (alpha_mv.mv_pci_tbi) {
		hose = pdev ? pdev->sysdata : pci_isa_hose;
		max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
		arena = hose->sg_pci;
		if (!arena || arena->dma_base + arena->size - 1 > max_dma)
			arena = hose->sg_isa;
	} else {
		max_dma = -1;
		arena = NULL;
		hose = NULL;
	}

	/* Third, iterate over the scatterlist leaders and allocate
	   dma space as needed.  */
	for (out = sg; sg < end; ++sg) {
		if ((int) sg->dma_address < 0)
			continue;
		if (sg_fill(dev, sg, end, out, arena, max_dma, dac_allowed) < 0)
			goto error;
		out++;
	}

	/* Mark the end of the list for pci_unmap_sg.  */
	if (out < end)
		out->dma_length = 0;

	if (out - start == 0) {
		printk(KERN_WARNING "pci_map_sg failed: no entries?\n");
		return -ENOMEM;
	}
	DBGA("pci_map_sg: %ld entries\n", out - start);

	return out - start;

 error:
	printk(KERN_WARNING "pci_map_sg failed: "
	       "could not allocate dma page tables\n");

	/* Some allocation failed while mapping the scatterlist
	   entries.  Unmap them now.  */
	if (out > start)
		dma_unmap_sg(&pdev->dev, start, out - start, dir);
	return -ENOMEM;
}

/* Unmap a set of streaming mode DMA translations.  Again, cpu read
   rules concerning calls here are the same as for pci_unmap_single()
   above.  */

static void alpha_pci_unmap_sg(struct device *dev, struct scatterlist *sg,
			       int nents, enum dma_data_direction dir,
			       unsigned long attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	unsigned long flags;
	struct pci_controller *hose;
	struct pci_iommu_arena *arena;
	struct scatterlist *end;
	dma_addr_t max_dma;
	dma_addr_t fbeg, fend;

	BUG_ON(dir == DMA_NONE);

	if (! alpha_mv.mv_pci_tbi)
		return;

	hose = pdev ? pdev->sysdata : pci_isa_hose;
	max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
	arena = hose->sg_pci;
	if (!arena || arena->dma_base + arena->size - 1 > max_dma)
		arena = hose->sg_isa;

	fbeg = -1, fend = 0;

	spin_lock_irqsave(&arena->lock, flags);

	for (end = sg + nents; sg < end; ++sg) {
		dma_addr_t addr;
		size_t size;
		long npages, ofs;
		dma_addr_t tend;

		addr = sg->dma_address;
		size = sg->dma_length;
		if (!size)
			break;

		if (addr > 0xffffffff) {
			/* It's a DAC address -- nothing to do.  */
			DBGA("    (%ld) DAC [%llx,%zx]\n",
			      sg - end + nents, addr, size);
			continue;
		}

		if (addr >= __direct_map_base
		    && addr < __direct_map_base + __direct_map_size) {
			/* Nothing to do.  */
			DBGA("    (%ld) direct [%llx,%zx]\n",
			      sg - end + nents, addr, size);
			continue;
		}

		DBGA("    (%ld) sg [%llx,%zx]\n",
		     sg - end + nents, addr, size);

		npages = iommu_num_pages(addr, size, PAGE_SIZE);
		ofs = (addr - arena->dma_base) >> PAGE_SHIFT;
		iommu_arena_free(arena, ofs, npages);

		tend = addr + size - 1;
		if (fbeg > addr) fbeg = addr;
		if (fend < tend) fend = tend;
	}

	/* If we're freeing ptes above the `next_entry' pointer (they
	   may have snuck back into the TLB since the last wrap flush),
	   we need to flush the TLB before reallocating the latter.  */
	if ((fend - arena->dma_base) >> PAGE_SHIFT >= arena->next_entry)
		alpha_mv.mv_pci_tbi(hose, fbeg, fend);

	spin_unlock_irqrestore(&arena->lock, flags);

	DBGA("pci_unmap_sg: %ld entries\n", nents - (end - sg));
}

/* Return whether the given PCI device DMA address mask can be
   supported properly.  */

static int alpha_pci_supported(struct device *dev, u64 mask)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	struct pci_controller *hose;
	struct pci_iommu_arena *arena;

	/* If there exists a direct map, check that the mask covers either
	   the entire direct mapped space or the total system memory as
	   shifted by the map base.  */
	if (__direct_map_size != 0
	    && (__direct_map_base + __direct_map_size - 1 <= mask ||
		__direct_map_base + (max_low_pfn << PAGE_SHIFT) - 1 <= mask))
		return 1;

	/* Check that we have a scatter-gather arena that fits.  */
	hose = pdev ? pdev->sysdata : pci_isa_hose;
	arena = hose->sg_isa;
	if (arena && arena->dma_base + arena->size - 1 <= mask)
		return 1;
	arena = hose->sg_pci;
	if (arena && arena->dma_base + arena->size - 1 <= mask)
		return 1;

	/* As a last resort try ZONE_DMA.  */
	if (!__direct_map_base && MAX_DMA_ADDRESS - IDENT_ADDR - 1 <= mask)
		return 1;

	return 0;
}


/*
 * AGP GART extensions to the IOMMU
 */
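/* Reserve PG_COUNT consecutive arena entries for a GART aperture.
   The entries are filled with IOMMU_RESERVED_PTE, so they are neither
   free nor valid; iommu_bind() installs the real page translations
   later, and iommu_unbind()/iommu_release() tear them down.  */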
int
iommu_reserve(struct pci_iommu_arena *arena, long pg_count, long align_mask)
{
	unsigned long flags;
	unsigned long *ptes;
	long i, p;

	if (!arena) return -EINVAL;

	spin_lock_irqsave(&arena->lock, flags);

	/* Search for N empty ptes.  */
	ptes = arena->ptes;
	p = iommu_arena_find_pages(NULL, arena, pg_count, align_mask);
	if (p < 0) {
		spin_unlock_irqrestore(&arena->lock, flags);
		return -1;
	}

	/* Success.  Mark them all reserved (i.e. not zero and invalid)
	   for the iommu tlb that could load them from under us.
	   They will be filled in with valid bits by _bind().  */
	for (i = 0; i < pg_count; ++i)
		ptes[p+i] = IOMMU_RESERVED_PTE;

	arena->next_entry = p + pg_count;
	spin_unlock_irqrestore(&arena->lock, flags);

	return p;
}

int
iommu_release(struct pci_iommu_arena *arena, long pg_start, long pg_count)
{
	unsigned long *ptes;
	long i;

	if (!arena) return -EINVAL;

	ptes = arena->ptes;

	/* Make sure they're all reserved first... */
	for (i = pg_start; i < pg_start + pg_count; i++)
		if (ptes[i] != IOMMU_RESERVED_PTE)
			return -EBUSY;

	iommu_arena_free(arena, pg_start, pg_count);
	return 0;
}

int
iommu_bind(struct pci_iommu_arena *arena, long pg_start, long pg_count,
	   struct page **pages)
{
	unsigned long flags;
	unsigned long *ptes;
	long i, j;

	if (!arena) return -EINVAL;

	spin_lock_irqsave(&arena->lock, flags);

	ptes = arena->ptes;

	for (j = pg_start; j < pg_start + pg_count; j++) {
		if (ptes[j] != IOMMU_RESERVED_PTE) {
			spin_unlock_irqrestore(&arena->lock, flags);
			return -EBUSY;
		}
	}

	for (i = 0, j = pg_start; i < pg_count; i++, j++)
		ptes[j] = mk_iommu_pte(page_to_phys(pages[i]));

	spin_unlock_irqrestore(&arena->lock, flags);

	return 0;
}

int
iommu_unbind(struct pci_iommu_arena *arena, long pg_start, long pg_count)
{
	unsigned long *p;
	long i;

	if (!arena) return -EINVAL;

	p = arena->ptes + pg_start;
	for (i = 0; i < pg_count; i++)
		p[i] = IOMMU_RESERVED_PTE;

	return 0;
}

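/* DMA operations used for every PCI device on Alpha; non-PCI (ISA and
   EISA) devices are routed through the ISA bridge by
   alpha_gendev_to_pci() above.  */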
const struct dma_map_ops alpha_pci_ops = {
	.alloc			= alpha_pci_alloc_coherent,
	.free			= alpha_pci_free_coherent,
	.map_page		= alpha_pci_map_page,
	.unmap_page		= alpha_pci_unmap_page,
	.map_sg			= alpha_pci_map_sg,
	.unmap_sg		= alpha_pci_unmap_sg,
	.dma_supported		= alpha_pci_supported,
	.mmap			= dma_common_mmap,
	.get_sgtable		= dma_common_get_sgtable,
	.alloc_pages_op		= dma_common_alloc_pages,
	.free_pages		= dma_common_free_pages,
};
EXPORT_SYMBOL(alpha_pci_ops);