/*
 *	linux/arch/alpha/kernel/pci_iommu.c
 */

#include <linux/kernel.h>
#include <linux/mm.h>
#include <linux/pci.h>
#include <linux/gfp.h>
#include <linux/bootmem.h>
#include <linux/export.h>
#include <linux/scatterlist.h>
#include <linux/log2.h>
#include <linux/dma-mapping.h>
#include <linux/iommu-helper.h>

#include <asm/io.h>
#include <asm/hwrpb.h>

#include "proto.h"
#include "pci_impl.h"


#define DEBUG_ALLOC 0
#if DEBUG_ALLOC > 0
# define DBGA(args...)		printk(KERN_DEBUG args)
#else
# define DBGA(args...)
#endif
#if DEBUG_ALLOC > 1
# define DBGA2(args...)		printk(KERN_DEBUG args)
#else
# define DBGA2(args...)
#endif

#define DEBUG_NODIRECT 0

#define ISA_DMA_MASK		0x00ffffff

static inline unsigned long
mk_iommu_pte(unsigned long paddr)
{
	return (paddr >> (PAGE_SHIFT-1)) | 1;
}
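
/*
 * Worked example of the encoding above, assuming Alpha's 8KB pages
 * (PAGE_SHIFT == 13): a page-aligned physical address 0x12340000 gives
 *
 *	mk_iommu_pte(0x12340000) == (0x12340000 >> 12) | 1 == 0x12341
 *
 * so the page frame number sits in bits 1 and up, with bit 0 as the valid
 * bit that the scatter-gather TLB checks; the frame is recovered as
 * (pte & ~1UL) << (PAGE_SHIFT - 1).  This is also why IOMMU_INVALID_PTE
 * can be "non-zero but invalid": its valid bit is clear.
 */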

/* Return the minimum of MAX or the first power of two larger
   than main memory.  */

unsigned long
size_for_memory(unsigned long max)
{
	unsigned long mem = max_low_pfn << PAGE_SHIFT;
	if (mem < max)
		max = roundup_pow_of_two(mem);
	return max;
}
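
/*
 * For example, with 768MB of main memory, size_for_memory(1UL << 32)
 * returns roundup_pow_of_two(0x30000000) == 0x40000000: a 1GB window
 * already covers all of memory, so the offered 4GB maximum is trimmed.
 */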

struct pci_iommu_arena * __init
iommu_arena_new_node(int nid, struct pci_controller *hose, dma_addr_t base,
		     unsigned long window_size, unsigned long align)
{
	unsigned long mem_size;
	struct pci_iommu_arena *arena;

	mem_size = window_size / (PAGE_SIZE / sizeof(unsigned long));

	/* Note that the TLB lookup logic uses bitwise concatenation,
	   not addition, so the required arena alignment is based on
	   the size of the window.  Retain the align parameter so that
	   particular systems can over-align the arena.  */
	if (align < mem_size)
		align = mem_size;


#ifdef CONFIG_DISCONTIGMEM

	arena = alloc_bootmem_node(NODE_DATA(nid), sizeof(*arena));
	if (!NODE_DATA(nid) || !arena) {
		printk("%s: couldn't allocate arena from node %d\n"
		       "    falling back to system-wide allocation\n",
		       __func__, nid);
		arena = alloc_bootmem(sizeof(*arena));
	}

	arena->ptes = __alloc_bootmem_node(NODE_DATA(nid), mem_size, align, 0);
	if (!NODE_DATA(nid) || !arena->ptes) {
		printk("%s: couldn't allocate arena ptes from node %d\n"
		       "    falling back to system-wide allocation\n",
		       __func__, nid);
		arena->ptes = __alloc_bootmem(mem_size, align, 0);
	}

#else /* CONFIG_DISCONTIGMEM */

	arena = alloc_bootmem(sizeof(*arena));
	arena->ptes = __alloc_bootmem(mem_size, align, 0);

#endif /* CONFIG_DISCONTIGMEM */

	spin_lock_init(&arena->lock);
	arena->hose = hose;
	arena->dma_base = base;
	arena->size = window_size;
	arena->next_entry = 0;

	/* Align allocations to a multiple of a page size.  Not needed
	   unless there are chip bugs.  */
	arena->align_entry = 1;

	return arena;
}

struct pci_iommu_arena * __init
iommu_arena_new(struct pci_controller *hose, dma_addr_t base,
		unsigned long window_size, unsigned long align)
{
	return iommu_arena_new_node(0, hose, base, window_size, align);
}
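
/*
 * Illustrative sketch of how platform init code consumes these
 * constructors (hypothetical function and window values, kept out of
 * the build): after creating the arenas, chip-specific code must still
 * program the window base/mask registers and point the hardware at
 * virt_to_phys(arena->ptes).
 */
#if 0
static void __init example_init_arch(void)
{
	struct pci_controller *hose = hose_head;

	/* An ISA-reachable 8MB window, and a 128MB window for
	   32-bit PCI masters.  */
	hose->sg_isa = iommu_arena_new(hose, 0x00800000, 0x00800000, 0);
	hose->sg_pci = iommu_arena_new(hose, 0x40000000, 0x08000000, 0);
}
#endif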

/* Must be called with the arena lock held */
static long
iommu_arena_find_pages(struct device *dev, struct pci_iommu_arena *arena,
		       long n, long mask)
{
	unsigned long *ptes;
	long i, p, nent;
	int pass = 0;
	unsigned long base;
	unsigned long boundary_size;

	base = arena->dma_base >> PAGE_SHIFT;
	if (dev) {
		boundary_size = dma_get_seg_boundary(dev) + 1;
		boundary_size >>= PAGE_SHIFT;
	} else {
		boundary_size = 1UL << (32 - PAGE_SHIFT);
	}

	/* Search forward for the first mask-aligned sequence of N free ptes */
	ptes = arena->ptes;
	nent = arena->size >> PAGE_SHIFT;
	p = ALIGN(arena->next_entry, mask + 1);
	i = 0;

again:
	while (i < n && p+i < nent) {
		if (!i && iommu_is_span_boundary(p, n, base, boundary_size)) {
			p = ALIGN(p + 1, mask + 1);
			goto again;
		}

		if (ptes[p+i])
			p = ALIGN(p + i + 1, mask + 1), i = 0;
		else
			i = i + 1;
	}

	if (i < n) {
		if (pass < 1) {
			/*
			 * Reached the end.  Flush the TLB and restart
			 * the search from the beginning.
			 */
			alpha_mv.mv_pci_tbi(arena->hose, 0, -1);

			pass++;
			p = 0;
			i = 0;
			goto again;
		} else
			return -1;
	}

	/* Success. It's the responsibility of the caller to mark them
	   in use before releasing the lock */
	return p;
}

static long
iommu_arena_alloc(struct device *dev, struct pci_iommu_arena *arena, long n,
		  unsigned int align)
{
	unsigned long flags;
	unsigned long *ptes;
	long i, p, mask;

	spin_lock_irqsave(&arena->lock, flags);

	/* Search for N empty ptes */
	ptes = arena->ptes;
	mask = max(align, arena->align_entry) - 1;
	p = iommu_arena_find_pages(dev, arena, n, mask);
	if (p < 0) {
		spin_unlock_irqrestore(&arena->lock, flags);
		return -1;
	}

	/* Success.  Mark them all in use, ie not zero and invalid
	   for the iommu tlb that could load them from under us.
	   The chip specific bits will fill this in with something
	   kosher when we return.  */
	for (i = 0; i < n; ++i)
		ptes[p+i] = IOMMU_INVALID_PTE;

	arena->next_entry = p + n;
	spin_unlock_irqrestore(&arena->lock, flags);

	return p;
}

static void
iommu_arena_free(struct pci_iommu_arena *arena, long ofs, long n)
{
	unsigned long *p;
	long i;

	p = arena->ptes + ofs;
	for (i = 0; i < n; ++i)
		p[i] = 0;
}
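
/*
 * Note the asymmetry: iommu_arena_alloc() takes the arena lock itself,
 * while iommu_arena_free() only clears the ptes and leaves locking and
 * any TLB invalidate to the caller.  A minimal sketch of the pattern
 * the unmap paths below use:
 */
#if 0
	spin_lock_irqsave(&arena->lock, flags);
	iommu_arena_free(arena, dma_ofs, npages);
	if (dma_ofs >= arena->next_entry)	/* may still be in the TLB */
		alpha_mv.mv_pci_tbi(hose, dma_addr, dma_addr + size - 1);
	spin_unlock_irqrestore(&arena->lock, flags);
#endif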

/*
 * True if the machine supports DAC addressing, and DEV can
 * make use of it given MASK.
 */
static int pci_dac_dma_supported(struct pci_dev *dev, u64 mask)
{
	dma_addr_t dac_offset = alpha_mv.pci_dac_offset;
	int ok = 1;

	/* If this is not set, the machine doesn't support DAC at all.  */
	if (dac_offset == 0)
		ok = 0;

	/* The device has to be able to address our DAC bit.  */
	if ((dac_offset & dev->dma_mask) != dac_offset)
		ok = 0;

	/* If both conditions above are met, we are fine. */
	DBGA("pci_dac_dma_supported %s from %pf\n",
	     ok ? "yes" : "no", __builtin_return_address(0));

	return ok;
}

/* Map a single buffer of the indicated size for PCI DMA in streaming
   mode.  The 32-bit PCI bus mastering address to use is returned.
   Once the device is given the dma address, the device owns this memory
   until either pci_unmap_single or pci_dma_sync_single is performed.  */

static dma_addr_t
pci_map_single_1(struct pci_dev *pdev, void *cpu_addr, size_t size,
		 int dac_allowed)
{
	struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose;
	dma_addr_t max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
	struct pci_iommu_arena *arena;
	long npages, dma_ofs, i;
	unsigned long paddr;
	dma_addr_t ret;
	unsigned int align = 0;
	struct device *dev = pdev ? &pdev->dev : NULL;

	paddr = __pa(cpu_addr);

#if !DEBUG_NODIRECT
	/* First check to see if we can use the direct map window.  */
	if (paddr + size + __direct_map_base - 1 <= max_dma
	    && paddr + size <= __direct_map_size) {
		ret = paddr + __direct_map_base;

		DBGA2("pci_map_single: [%p,%zx] -> direct %llx from %pf\n",
		      cpu_addr, size, ret, __builtin_return_address(0));

		return ret;
	}
#endif

	/* Next, use DAC if selected earlier.  */
	if (dac_allowed) {
		ret = paddr + alpha_mv.pci_dac_offset;

		DBGA2("pci_map_single: [%p,%zx] -> DAC %llx from %pf\n",
		      cpu_addr, size, ret, __builtin_return_address(0));

		return ret;
	}

	/* If the machine doesn't define a pci_tbi routine, we have to
	   assume it doesn't support sg mapping, and, since we tried to
	   use direct_map above, it now must be considered an error. */
	if (! alpha_mv.mv_pci_tbi) {
		printk_once(KERN_WARNING "pci_map_single: no HW sg\n");
		return 0;
	}

	arena = hose->sg_pci;
	if (!arena || arena->dma_base + arena->size - 1 > max_dma)
		arena = hose->sg_isa;

	npages = iommu_num_pages(paddr, size, PAGE_SIZE);

	/* Force allocation to 64KB boundary for ISA bridges. */
	if (pdev && pdev == isa_bridge)
		align = 8;
	dma_ofs = iommu_arena_alloc(dev, arena, npages, align);
	if (dma_ofs < 0) {
		printk(KERN_WARNING "pci_map_single failed: "
		       "could not allocate dma page tables\n");
		return 0;
	}

	paddr &= PAGE_MASK;
	for (i = 0; i < npages; ++i, paddr += PAGE_SIZE)
		arena->ptes[i + dma_ofs] = mk_iommu_pte(paddr);

	ret = arena->dma_base + dma_ofs * PAGE_SIZE;
	ret += (unsigned long)cpu_addr & ~PAGE_MASK;

	DBGA2("pci_map_single: [%p,%zx] np %ld -> sg %llx from %pf\n",
	      cpu_addr, size, npages, ret, __builtin_return_address(0));

	return ret;
}
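
/*
 * A minimal sketch of the driver-side usage that lands here through
 * alpha_pci_map_page() (hypothetical driver code, error paths trimmed):
 */
#if 0
static int example_tx(struct pci_dev *pdev, void *buf, size_t len)
{
	dma_addr_t bus_addr;

	bus_addr = pci_map_single(pdev, buf, len, PCI_DMA_TODEVICE);
	if (pci_dma_mapping_error(pdev, bus_addr))
		return -ENOMEM;		/* pci_map_single_1 returned 0 */

	/* ... hand bus_addr to the device and wait for completion ... */

	pci_unmap_single(pdev, bus_addr, len, PCI_DMA_TODEVICE);
	return 0;
}
#endif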

/* Helper for generic DMA-mapping functions. */
static struct pci_dev *alpha_gendev_to_pci(struct device *dev)
{
	if (dev && dev->bus == &pci_bus_type)
		return to_pci_dev(dev);

	/* Assume that non-PCI devices asking for DMA are either ISA or EISA,
	   BUG() otherwise. */
	BUG_ON(!isa_bridge);

	/* Assume non-busmaster ISA DMA when dma_mask is not set (the ISA
	   bridge is bus master then). */
	if (!dev || !dev->dma_mask || !*dev->dma_mask)
		return isa_bridge;

	/* For EISA bus masters, return isa_bridge (it might have smaller
	   dma_mask due to wiring limitations). */
	if (*dev->dma_mask >= isa_bridge->dma_mask)
		return isa_bridge;

	/* This assumes ISA bus master with dma_mask 0xffffff. */
	return NULL;
}

static dma_addr_t alpha_pci_map_page(struct device *dev, struct page *page,
				     unsigned long offset, size_t size,
				     enum dma_data_direction dir,
				     struct dma_attrs *attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	int dac_allowed;

	if (dir == PCI_DMA_NONE)
		BUG();

	dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;
	return pci_map_single_1(pdev, (char *)page_address(page) + offset,
				size, dac_allowed);
}

/* Unmap a single streaming mode DMA translation.  The DMA_ADDR and
   SIZE must match what was provided for in a previous pci_map_single
   call.  All other usages are undefined.  After this call, reads by
   the cpu to the buffer are guaranteed to see whatever the device
   wrote there.  */

static void alpha_pci_unmap_page(struct device *dev, dma_addr_t dma_addr,
				 size_t size, enum dma_data_direction dir,
				 struct dma_attrs *attrs)
{
	unsigned long flags;
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	struct pci_controller *hose = pdev ? pdev->sysdata : pci_isa_hose;
	struct pci_iommu_arena *arena;
	long dma_ofs, npages;

	if (dir == PCI_DMA_NONE)
		BUG();

	if (dma_addr >= __direct_map_base
	    && dma_addr < __direct_map_base + __direct_map_size) {
		/* Nothing to do.  */

		DBGA2("pci_unmap_single: direct [%llx,%zx] from %pf\n",
		      dma_addr, size, __builtin_return_address(0));

		return;
	}

	if (dma_addr > 0xffffffff) {
		DBGA2("pci64_unmap_single: DAC [%llx,%zx] from %pf\n",
		      dma_addr, size, __builtin_return_address(0));
		return;
	}

	arena = hose->sg_pci;
	if (!arena || dma_addr < arena->dma_base)
		arena = hose->sg_isa;

	dma_ofs = (dma_addr - arena->dma_base) >> PAGE_SHIFT;
	if (dma_ofs * PAGE_SIZE >= arena->size) {
		printk(KERN_ERR "Bogus pci_unmap_single: dma_addr %llx "
		       " base %llx size %x\n",
		       dma_addr, arena->dma_base, arena->size);
		return;
	}

	npages = iommu_num_pages(dma_addr, size, PAGE_SIZE);

	spin_lock_irqsave(&arena->lock, flags);

	iommu_arena_free(arena, dma_ofs, npages);

	/* If we're freeing ptes above the `next_entry' pointer (they
	   may have snuck back into the TLB since the last wrap flush),
	   we need to flush the TLB before reallocating the latter.  */
	if (dma_ofs >= arena->next_entry)
		alpha_mv.mv_pci_tbi(hose, dma_addr, dma_addr + size - 1);

	spin_unlock_irqrestore(&arena->lock, flags);

	DBGA2("pci_unmap_single: sg [%llx,%zx] np %ld from %pf\n",
	      dma_addr, size, npages, __builtin_return_address(0));
}

/* Allocate and map kernel buffer using consistent mode DMA for PCI
   device.  Returns non-NULL cpu-view pointer to the buffer if
   successful and sets *DMA_ADDRP to the pci side dma address as well,
   else DMA_ADDRP is undefined.  */

static void *alpha_pci_alloc_coherent(struct device *dev, size_t size,
				      dma_addr_t *dma_addrp, gfp_t gfp,
				      struct dma_attrs *attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	void *cpu_addr;
	long order = get_order(size);

	gfp &= ~GFP_DMA;

try_again:
	cpu_addr = (void *)__get_free_pages(gfp, order);
	if (! cpu_addr) {
		printk(KERN_INFO "pci_alloc_consistent: "
		       "get_free_pages failed from %pf\n",
		       __builtin_return_address(0));
		/* ??? Really atomic allocation?  Otherwise we could play
		   with vmalloc and sg if we can't find contiguous memory.  */
		return NULL;
	}
	memset(cpu_addr, 0, size);

	*dma_addrp = pci_map_single_1(pdev, cpu_addr, size, 0);
	if (*dma_addrp == 0) {
		free_pages((unsigned long)cpu_addr, order);
		if (alpha_mv.mv_pci_tbi || (gfp & GFP_DMA))
			return NULL;
		/* The address doesn't fit required mask and we
		   do not have iommu. Try again with GFP_DMA. */
		gfp |= GFP_DMA;
		goto try_again;
	}

	DBGA2("pci_alloc_consistent: %zx -> [%p,%llx] from %pf\n",
	      size, cpu_addr, *dma_addrp, __builtin_return_address(0));

	return cpu_addr;
}

/* Free and unmap a consistent DMA buffer.  CPU_ADDR and DMA_ADDR must
   be values that were returned from pci_alloc_consistent.  SIZE must
   be the same as what was passed into pci_alloc_consistent.
   References to the memory and mappings associated with CPU_ADDR or
   DMA_ADDR past this call are illegal.  */

static void alpha_pci_free_coherent(struct device *dev, size_t size,
				    void *cpu_addr, dma_addr_t dma_addr,
				    struct dma_attrs *attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	pci_unmap_single(pdev, dma_addr, size, PCI_DMA_BIDIRECTIONAL);
	free_pages((unsigned long)cpu_addr, get_order(size));

	DBGA2("pci_free_consistent: [%llx,%zx] from %pf\n",
	      dma_addr, size, __builtin_return_address(0));
}
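
/*
 * Sketch of the consistent-DMA pairing (hypothetical driver code;
 * RING_BYTES is a made-up size): the handle returned through
 * *dma_addrp above is what gets programmed into the device.
 */
#if 0
	void *ring;
	dma_addr_t ring_dma;

	ring = pci_alloc_consistent(pdev, RING_BYTES, &ring_dma);
	if (!ring)
		return -ENOMEM;
	/* ... the CPU uses "ring", the device uses ring_dma ... */
	pci_free_consistent(pdev, RING_BYTES, ring, ring_dma);
#endif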

/* Classify the elements of the scatterlist.  Write dma_address
   of each element with:
	0   : Followers all physically adjacent.
	1   : Followers all virtually adjacent.
	-1  : Not leader, physically adjacent to previous.
	-2  : Not leader, virtually adjacent to previous.
   Write dma_length of each leader with the combined lengths of
   the mergable followers.  */

#define SG_ENT_VIRT_ADDRESS(SG) (sg_virt((SG)))
#define SG_ENT_PHYS_ADDRESS(SG) __pa(SG_ENT_VIRT_ADDRESS(SG))

static void
sg_classify(struct device *dev, struct scatterlist *sg, struct scatterlist *end,
	    int virt_ok)
{
	unsigned long next_paddr;
	struct scatterlist *leader;
	long leader_flag, leader_length;
	unsigned int max_seg_size;

	leader = sg;
	leader_flag = 0;
	leader_length = leader->length;
	next_paddr = SG_ENT_PHYS_ADDRESS(leader) + leader_length;
	/* we will not merge sg without device. */
	max_seg_size = dev ? dma_get_max_seg_size(dev) : 0;
	for (++sg; sg < end; ++sg) {
		unsigned long addr, len;
		addr = SG_ENT_PHYS_ADDRESS(sg);
		len = sg->length;

		if (leader_length + len > max_seg_size)
			goto new_segment;

		if (next_paddr == addr) {
			sg->dma_address = -1;
			leader_length += len;
		} else if (((next_paddr | addr) & ~PAGE_MASK) == 0 && virt_ok) {
			sg->dma_address = -2;
			leader_flag = 1;
			leader_length += len;
		} else {
new_segment:
			leader->dma_address = leader_flag;
			leader->dma_length = leader_length;
			leader = sg;
			leader_flag = 0;
			leader_length = len;
		}

		next_paddr = addr + len;
	}

	leader->dma_address = leader_flag;
	leader->dma_length = leader_length;
}
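
/*
 * Worked example, again assuming 8KB pages.  Given three entries
 *
 *	sg[0]: paddr 0x100000, length 0x2000
 *	sg[1]: paddr 0x102000, length 0x2000  (starts where sg[0] ends)
 *	sg[2]: paddr 0x200000, length 0x1000  (discontiguous, page-aligned)
 *
 * a call with virt_ok set classifies them as
 *
 *	sg[0].dma_address = 1   (leader; a follower is only virtually adjacent)
 *	sg[0].dma_length  = 0x5000
 *	sg[1].dma_address = -1  (physically adjacent to its predecessor)
 *	sg[2].dma_address = -2  (virtually adjacent: both ends page-aligned)
 *
 * With virt_ok clear, sg[2] would instead start a new leader.
 */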

/* Given a scatterlist leader, choose an allocation method and fill
   in the blanks.  */

static int
sg_fill(struct device *dev, struct scatterlist *leader, struct scatterlist *end,
	struct scatterlist *out, struct pci_iommu_arena *arena,
	dma_addr_t max_dma, int dac_allowed)
{
	unsigned long paddr = SG_ENT_PHYS_ADDRESS(leader);
	long size = leader->dma_length;
	struct scatterlist *sg;
	unsigned long *ptes;
	long npages, dma_ofs, i;

#if !DEBUG_NODIRECT
	/* If everything is physically contiguous, and the addresses
	   fall into the direct-map window, use it.  */
	if (leader->dma_address == 0
	    && paddr + size + __direct_map_base - 1 <= max_dma
	    && paddr + size <= __direct_map_size) {
		out->dma_address = paddr + __direct_map_base;
		out->dma_length = size;

		DBGA("    sg_fill: [%p,%lx] -> direct %llx\n",
		     __va(paddr), size, out->dma_address);

		return 0;
	}
#endif

	/* If physically contiguous and DAC is available, use it.  */
	if (leader->dma_address == 0 && dac_allowed) {
		out->dma_address = paddr + alpha_mv.pci_dac_offset;
		out->dma_length = size;

		DBGA("    sg_fill: [%p,%lx] -> DAC %llx\n",
		     __va(paddr), size, out->dma_address);

		return 0;
	}

	/* Otherwise, we'll use the iommu to make the pages virtually
	   contiguous.  */

	paddr &= ~PAGE_MASK;
	npages = iommu_num_pages(paddr, size, PAGE_SIZE);
	dma_ofs = iommu_arena_alloc(dev, arena, npages, 0);
	if (dma_ofs < 0) {
		/* If we attempted a direct map above but failed, die.  */
		if (leader->dma_address == 0)
			return -1;

		/* Otherwise, break up the remaining virtually contiguous
		   hunks into individual direct maps and retry.  */
		sg_classify(dev, leader, end, 0);
		return sg_fill(dev, leader, end, out, arena, max_dma, dac_allowed);
	}

	out->dma_address = arena->dma_base + dma_ofs*PAGE_SIZE + paddr;
	out->dma_length = size;

	DBGA("    sg_fill: [%p,%lx] -> sg %llx np %ld\n",
	     __va(paddr), size, out->dma_address, npages);

	/* All virtually contiguous.  We need to find the length of each
	   physically contiguous subsegment to fill in the ptes.  */
	ptes = &arena->ptes[dma_ofs];
	sg = leader;
	do {
#if DEBUG_ALLOC > 0
		struct scatterlist *last_sg = sg;
#endif

		size = sg->length;
		paddr = SG_ENT_PHYS_ADDRESS(sg);

		while (sg+1 < end && (int) sg[1].dma_address == -1) {
			size += sg[1].length;
			sg++;
		}

		npages = iommu_num_pages(paddr, size, PAGE_SIZE);

		paddr &= PAGE_MASK;
		for (i = 0; i < npages; ++i, paddr += PAGE_SIZE)
			*ptes++ = mk_iommu_pte(paddr);

#if DEBUG_ALLOC > 0
		DBGA("    (%ld) [%p,%x] np %ld\n",
		     last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg),
		     last_sg->length, npages);
		while (++last_sg <= sg) {
			DBGA("        (%ld) [%p,%x] cont\n",
			     last_sg - leader, SG_ENT_VIRT_ADDRESS(last_sg),
			     last_sg->length);
		}
#endif
	} while (++sg < end && (int) sg->dma_address < 0);

	return 1;
}

static int alpha_pci_map_sg(struct device *dev, struct scatterlist *sg,
			    int nents, enum dma_data_direction dir,
			    struct dma_attrs *attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	struct scatterlist *start, *end, *out;
	struct pci_controller *hose;
	struct pci_iommu_arena *arena;
	dma_addr_t max_dma;
	int dac_allowed;

	if (dir == PCI_DMA_NONE)
		BUG();

	dac_allowed = pdev ? pci_dac_dma_supported(pdev, pdev->dma_mask) : 0;

	/* Fast path single entry scatterlists.  */
	if (nents == 1) {
		sg->dma_length = sg->length;
		sg->dma_address
		  = pci_map_single_1(pdev, SG_ENT_VIRT_ADDRESS(sg),
				     sg->length, dac_allowed);
		return sg->dma_address != 0;
	}

	start = sg;
	end = sg + nents;

	/* First, prepare information about the entries.  */
	sg_classify(dev, sg, end, alpha_mv.mv_pci_tbi != 0);

	/* Second, figure out where we're going to map things.  */
	if (alpha_mv.mv_pci_tbi) {
		hose = pdev ? pdev->sysdata : pci_isa_hose;
		max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
		arena = hose->sg_pci;
		if (!arena || arena->dma_base + arena->size - 1 > max_dma)
			arena = hose->sg_isa;
	} else {
		max_dma = -1;
		arena = NULL;
		hose = NULL;
	}

	/* Third, iterate over the scatterlist leaders and allocate
	   dma space as needed.  */
	for (out = sg; sg < end; ++sg) {
		if ((int) sg->dma_address < 0)
			continue;
		if (sg_fill(dev, sg, end, out, arena, max_dma, dac_allowed) < 0)
			goto error;
		out++;
	}

	/* Mark the end of the list for pci_unmap_sg.  */
	if (out < end)
		out->dma_length = 0;

	if (out - start == 0)
		printk(KERN_WARNING "pci_map_sg failed: no entries?\n");
	DBGA("pci_map_sg: %ld entries\n", out - start);

	return out - start;

 error:
	printk(KERN_WARNING "pci_map_sg failed: "
	       "could not allocate dma page tables\n");

	/* Some allocation failed while mapping the scatterlist
	   entries.  Unmap them now.  */
	if (out > start)
		pci_unmap_sg(pdev, start, out - start, dir);
	return 0;
}
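
/*
 * Sketch of the scatterlist usage that reaches this code (hypothetical
 * driver; write_descriptor() is a stand-in for device-specific setup).
 * The returned count may be smaller than nents after merging, but the
 * unmap must still be called with the original nents:
 */
#if 0
	struct scatterlist *s;
	int i, n;

	n = pci_map_sg(pdev, sglist, nents, PCI_DMA_TODEVICE);
	if (n == 0)
		return -ENOMEM;
	for_each_sg(sglist, s, n, i)
		write_descriptor(sg_dma_address(s), sg_dma_len(s));
	/* ... after the I/O completes ... */
	pci_unmap_sg(pdev, sglist, nents, PCI_DMA_TODEVICE);
#endif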

/* Unmap a set of streaming mode DMA translations.  Again, cpu read
   rules concerning calls here are the same as for pci_unmap_single()
   above.  */

static void alpha_pci_unmap_sg(struct device *dev, struct scatterlist *sg,
			       int nents, enum dma_data_direction dir,
			       struct dma_attrs *attrs)
{
	struct pci_dev *pdev = alpha_gendev_to_pci(dev);
	unsigned long flags;
	struct pci_controller *hose;
	struct pci_iommu_arena *arena;
	struct scatterlist *end;
	dma_addr_t max_dma;
	dma_addr_t fbeg, fend;

	if (dir == PCI_DMA_NONE)
		BUG();

	if (! alpha_mv.mv_pci_tbi)
		return;

	hose = pdev ? pdev->sysdata : pci_isa_hose;
	max_dma = pdev ? pdev->dma_mask : ISA_DMA_MASK;
	arena = hose->sg_pci;
	if (!arena || arena->dma_base + arena->size - 1 > max_dma)
		arena = hose->sg_isa;

	fbeg = -1, fend = 0;

	spin_lock_irqsave(&arena->lock, flags);

	for (end = sg + nents; sg < end; ++sg) {
		dma_addr_t addr;
		size_t size;
		long npages, ofs;
		dma_addr_t tend;

		addr = sg->dma_address;
		size = sg->dma_length;
		if (!size)
			break;

		if (addr > 0xffffffff) {
			/* It's a DAC address -- nothing to do.  */
			DBGA("    (%ld) DAC [%llx,%zx]\n",
			     sg - end + nents, addr, size);
			continue;
		}

		if (addr >= __direct_map_base
		    && addr < __direct_map_base + __direct_map_size) {
			/* Nothing to do.  */
			DBGA("    (%ld) direct [%llx,%zx]\n",
			     sg - end + nents, addr, size);
			continue;
		}

		DBGA("    (%ld) sg [%llx,%zx]\n",
		     sg - end + nents, addr, size);

		npages = iommu_num_pages(addr, size, PAGE_SIZE);
		ofs = (addr - arena->dma_base) >> PAGE_SHIFT;
		iommu_arena_free(arena, ofs, npages);

		tend = addr + size - 1;
		if (fbeg > addr) fbeg = addr;
		if (fend < tend) fend = tend;
	}

	/* If we're freeing ptes above the `next_entry' pointer (they
	   may have snuck back into the TLB since the last wrap flush),
	   we need to flush the TLB before reallocating the latter.  */
	if ((fend - arena->dma_base) >> PAGE_SHIFT >= arena->next_entry)
		alpha_mv.mv_pci_tbi(hose, fbeg, fend);

	spin_unlock_irqrestore(&arena->lock, flags);

	DBGA("pci_unmap_sg: %ld entries\n", nents - (end - sg));
}
809 
810 /* Return whether the given PCI device DMA address mask can be
811  supported properly. */
812 
813 static int alpha_pci_supported(struct device *dev, u64 mask)
814 {
815  struct pci_dev *pdev = alpha_gendev_to_pci(dev);
816  struct pci_controller *hose;
817  struct pci_iommu_arena *arena;
818 
	/* If there exists a direct map, and the mask fits either
	   the entire direct mapped space or the total system memory as
	   shifted by the map base, then the direct map will work.  */
	if (__direct_map_size != 0
	    && (__direct_map_base + __direct_map_size - 1 <= mask ||
		__direct_map_base + (max_low_pfn << PAGE_SHIFT) - 1 <= mask))
		return 1;

	/* Check that we have a scatter-gather arena that fits.  */
	hose = pdev ? pdev->sysdata : pci_isa_hose;
	arena = hose->sg_isa;
	if (arena && arena->dma_base + arena->size - 1 <= mask)
		return 1;
	arena = hose->sg_pci;
	if (arena && arena->dma_base + arena->size - 1 <= mask)
		return 1;

	/* As last resort try ZONE_DMA.  */
	if (!__direct_map_base && MAX_DMA_ADDRESS - IDENT_ADDR - 1 <= mask)
		return 1;

	return 0;
}
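
/*
 * This backs dma_set_mask()/pci_set_dma_mask() on Alpha.  A typical
 * probe-time negotiation (hypothetical driver) that exercises the
 * checks above:
 */
#if 0
	int use_dac;

	if (!pci_set_dma_mask(pdev, DMA_BIT_MASK(64)))
		use_dac = 1;		/* wide addressing is usable */
	else if (!pci_set_dma_mask(pdev, DMA_BIT_MASK(32)))
		use_dac = 0;		/* direct map or sg arena */
	else
		return -EIO;		/* not even 32 bits work */
#endif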


/*
 * AGP GART extensions to the IOMMU
 */
int
iommu_reserve(struct pci_iommu_arena *arena, long pg_count, long align_mask)
{
	unsigned long flags;
	unsigned long *ptes;
	long i, p;

	if (!arena) return -EINVAL;

	spin_lock_irqsave(&arena->lock, flags);

	/* Search for N empty ptes.  */
	ptes = arena->ptes;
	p = iommu_arena_find_pages(NULL, arena, pg_count, align_mask);
	if (p < 0) {
		spin_unlock_irqrestore(&arena->lock, flags);
		return -1;
	}

	/* Success.  Mark them all reserved (ie not zero and invalid)
	   for the iommu tlb that could load them from under us.
	   They will be filled in with valid bits by _bind() */
	for (i = 0; i < pg_count; ++i)
		ptes[p+i] = IOMMU_RESERVED_PTE;

	arena->next_entry = p + pg_count;
	spin_unlock_irqrestore(&arena->lock, flags);

	return p;
}

int
iommu_release(struct pci_iommu_arena *arena, long pg_start, long pg_count)
{
	unsigned long *ptes;
	long i;

	if (!arena) return -EINVAL;

	ptes = arena->ptes;

	/* Make sure they're all reserved first... */
	for(i = pg_start; i < pg_start + pg_count; i++)
		if (ptes[i] != IOMMU_RESERVED_PTE)
			return -EBUSY;

	iommu_arena_free(arena, pg_start, pg_count);
	return 0;
}

int
iommu_bind(struct pci_iommu_arena *arena, long pg_start, long pg_count,
	   struct page **pages)
{
	unsigned long flags;
	unsigned long *ptes;
	long i, j;

	if (!arena) return -EINVAL;

	spin_lock_irqsave(&arena->lock, flags);

	ptes = arena->ptes;

	for(j = pg_start; j < pg_start + pg_count; j++) {
		if (ptes[j] != IOMMU_RESERVED_PTE) {
			spin_unlock_irqrestore(&arena->lock, flags);
			return -EBUSY;
		}
	}

	for(i = 0, j = pg_start; i < pg_count; i++, j++)
		ptes[j] = mk_iommu_pte(page_to_phys(pages[i]));

	spin_unlock_irqrestore(&arena->lock, flags);

	return 0;
}

int
iommu_unbind(struct pci_iommu_arena *arena, long pg_start, long pg_count)
{
	unsigned long *p;
	long i;

	if (!arena) return -EINVAL;

	p = arena->ptes + pg_start;
	for(i = 0; i < pg_count; i++)
		p[i] = IOMMU_RESERVED_PTE;

	return 0;
}
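
/*
 * Sketch of the reserve/bind lifecycle as an AGP GART backend would
 * drive it (hypothetical caller; "pages" comes from the GART driver):
 */
#if 0
	long ofs = iommu_reserve(arena, pg_count, align_mask);
	if (ofs < 0)
		return -ENOMEM;
	if (iommu_bind(arena, ofs, pg_count, pages))
		return -EBUSY;
	/* aperture at arena->dma_base + ofs*PAGE_SIZE is now live */
	iommu_unbind(arena, ofs, pg_count);	/* back to IOMMU_RESERVED_PTE */
	iommu_release(arena, ofs, pg_count);	/* and finally free again */
#endif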

static int alpha_pci_mapping_error(struct device *dev, dma_addr_t dma_addr)
{
	return dma_addr == 0;
}

static int alpha_pci_set_mask(struct device *dev, u64 mask)
{
	if (!dev->dma_mask ||
	    !pci_dma_supported(alpha_gendev_to_pci(dev), mask))
		return -EIO;

	*dev->dma_mask = mask;
	return 0;
}

struct dma_map_ops alpha_pci_ops = {
	.alloc			= alpha_pci_alloc_coherent,
	.free			= alpha_pci_free_coherent,
	.map_page		= alpha_pci_map_page,
	.unmap_page		= alpha_pci_unmap_page,
	.map_sg			= alpha_pci_map_sg,
	.unmap_sg		= alpha_pci_unmap_sg,
	.mapping_error		= alpha_pci_mapping_error,
	.dma_supported		= alpha_pci_supported,
	.set_dma_mask		= alpha_pci_set_mask,
};

struct dma_map_ops *dma_ops = &alpha_pci_ops;
EXPORT_SYMBOL(dma_ops);