[PATCH] x86_64: fix boot hang caused by CALGARY_IOMMU_ENABLED_BY_DEFAULT
[deliverable/linux.git] / arch / x86_64 / kernel / pci-calgary.c
CommitLineData
e465058d
JM
1/*
2 * Derived from arch/powerpc/kernel/iommu.c
3 *
aa0a9f37 4 * Copyright (C) IBM Corporation, 2006
d8d2bedf 5 * Copyright (C) 2006 Jon Mason <jdmason@kudzu.us>
e465058d 6 *
d8d2bedf 7 * Author: Jon Mason <jdmason@kudzu.us>
aa0a9f37
MBY
8 * Author: Muli Ben-Yehuda <muli@il.ibm.com>
9
e465058d
JM
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 */
24
e465058d
JM
25#include <linux/kernel.h>
26#include <linux/init.h>
27#include <linux/types.h>
28#include <linux/slab.h>
29#include <linux/mm.h>
30#include <linux/spinlock.h>
31#include <linux/string.h>
32#include <linux/dma-mapping.h>
33#include <linux/init.h>
34#include <linux/bitops.h>
35#include <linux/pci_ids.h>
36#include <linux/pci.h>
37#include <linux/delay.h>
38#include <asm/proto.h>
39#include <asm/calgary.h>
40#include <asm/tce.h>
41#include <asm/pci-direct.h>
42#include <asm/system.h>
43#include <asm/dma.h>
b34e90b8 44#include <asm/rio.h>
e465058d 45
bff6547b
MBY
46#ifdef CONFIG_CALGARY_IOMMU_ENABLED_BY_DEFAULT
47int use_calgary __read_mostly = 1;
48#else
49int use_calgary __read_mostly = 0;
50#endif /* CONFIG_CALGARY_DEFAULT_ENABLED */
51
e465058d
JM
52#define PCI_DEVICE_ID_IBM_CALGARY 0x02a1
53#define PCI_VENDOR_DEVICE_ID_CALGARY \
54 (PCI_VENDOR_ID_IBM | PCI_DEVICE_ID_IBM_CALGARY << 16)
55
56/* we need these for register space address calculation */
57#define START_ADDRESS 0xfe000000
58#define CHASSIS_BASE 0
59#define ONE_BASED_CHASSIS_NUM 1
60
61/* register offsets inside the host bridge space */
cb01fc72
MBY
62#define CALGARY_CONFIG_REG 0x0108
63#define PHB_CSR_OFFSET 0x0110 /* Channel Status */
e465058d
JM
64#define PHB_PLSSR_OFFSET 0x0120
65#define PHB_CONFIG_RW_OFFSET 0x0160
66#define PHB_IOBASE_BAR_LOW 0x0170
67#define PHB_IOBASE_BAR_HIGH 0x0180
68#define PHB_MEM_1_LOW 0x0190
69#define PHB_MEM_1_HIGH 0x01A0
70#define PHB_IO_ADDR_SIZE 0x01B0
71#define PHB_MEM_1_SIZE 0x01C0
72#define PHB_MEM_ST_OFFSET 0x01D0
73#define PHB_AER_OFFSET 0x0200
74#define PHB_CONFIG_0_HIGH 0x0220
75#define PHB_CONFIG_0_LOW 0x0230
76#define PHB_CONFIG_0_END 0x0240
77#define PHB_MEM_2_LOW 0x02B0
78#define PHB_MEM_2_HIGH 0x02C0
79#define PHB_MEM_2_SIZE_HIGH 0x02D0
80#define PHB_MEM_2_SIZE_LOW 0x02E0
81#define PHB_DOSHOLE_OFFSET 0x08E0
82
83/* PHB_CONFIG_RW */
84#define PHB_TCE_ENABLE 0x20000000
85#define PHB_SLOT_DISABLE 0x1C000000
86#define PHB_DAC_DISABLE 0x01000000
87#define PHB_MEM2_ENABLE 0x00400000
88#define PHB_MCSR_ENABLE 0x00100000
89/* TAR (Table Address Register) */
90#define TAR_SW_BITS 0x0000ffffffff800fUL
91#define TAR_VALID 0x0000000000000008UL
92/* CSR (Channel/DMA Status Register) */
93#define CSR_AGENT_MASK 0xffe0ffff
cb01fc72
MBY
94/* CCR (Calgary Configuration Register) */
95#define CCR_2SEC_TIMEOUT 0x000000000000000EUL
e465058d
JM
96
97#define MAX_NUM_OF_PHBS 8 /* how many PHBs in total? */
d2105b10 98#define MAX_NUM_CHASSIS 8 /* max number of chassis */
4ea8a5d8
MBY
99/* MAX_PHB_BUS_NUM is the maximal possible dev->bus->number */
100#define MAX_PHB_BUS_NUM (MAX_NUM_OF_PHBS * MAX_NUM_CHASSIS * 2)
e465058d
JM
101#define PHBS_PER_CALGARY 4
102
103/* register offsets in Calgary's internal register space */
104static const unsigned long tar_offsets[] = {
105 0x0580 /* TAR0 */,
106 0x0588 /* TAR1 */,
107 0x0590 /* TAR2 */,
108 0x0598 /* TAR3 */
109};
110
111static const unsigned long split_queue_offsets[] = {
112 0x4870 /* SPLIT QUEUE 0 */,
113 0x5870 /* SPLIT QUEUE 1 */,
114 0x6870 /* SPLIT QUEUE 2 */,
115 0x7870 /* SPLIT QUEUE 3 */
116};
117
118static const unsigned long phb_offsets[] = {
119 0x8000 /* PHB0 */,
120 0x9000 /* PHB1 */,
121 0xA000 /* PHB2 */,
122 0xB000 /* PHB3 */
123};
124
b34e90b8
LV
125/* PHB debug registers */
126
127static const unsigned long phb_debug_offsets[] = {
128 0x4000 /* PHB 0 DEBUG */,
129 0x5000 /* PHB 1 DEBUG */,
130 0x6000 /* PHB 2 DEBUG */,
131 0x7000 /* PHB 3 DEBUG */
132};
133
134/*
135 * STUFF register for each debug PHB,
136 * byte 1 = start bus number, byte 2 = end bus number
137 */
138
139#define PHB_DEBUG_STUFF_OFFSET 0x0020
140
e465058d
JM
141unsigned int specified_table_size = TCE_TABLE_SIZE_UNSPECIFIED;
142static int translate_empty_slots __read_mostly = 0;
143static int calgary_detected __read_mostly = 0;
144
b34e90b8
LV
145static struct rio_table_hdr *rio_table_hdr __initdata;
146static struct scal_detail *scal_devs[MAX_NUMNODES] __initdata;
eae93755 147static struct rio_detail *rio_devs[MAX_NUMNODES * 4] __initdata;
b34e90b8 148
f38db651
MBY
149struct calgary_bus_info {
150 void *tce_space;
0577f148 151 unsigned char translation_disabled;
f38db651 152 signed char phbid;
b34e90b8 153 void __iomem *bbar;
f38db651
MBY
154};
155
156static struct calgary_bus_info bus_info[MAX_PHB_BUS_NUM] = { { NULL, 0, 0 }, };
e465058d
JM
157
158static void tce_cache_blast(struct iommu_table *tbl);
159
160/* enable this to stress test the chip's TCE cache */
161#ifdef CONFIG_IOMMU_DEBUG
de684652
MBY
162int debugging __read_mostly = 1;
163
796e4390
MBY
164static inline unsigned long verify_bit_range(unsigned long* bitmap,
165 int expected, unsigned long start, unsigned long end)
166{
167 unsigned long idx = start;
168
169 BUG_ON(start >= end);
170
171 while (idx < end) {
172 if (!!test_bit(idx, bitmap) != expected)
173 return idx;
174 ++idx;
175 }
176
177 /* all bits have the expected value */
178 return ~0UL;
179}
de684652
MBY
180#else /* debugging is disabled */
181int debugging __read_mostly = 0;
182
796e4390
MBY
183static inline unsigned long verify_bit_range(unsigned long* bitmap,
184 int expected, unsigned long start, unsigned long end)
185{
186 return ~0UL;
187}
de684652 188#endif /* CONFIG_IOMMU_DEBUG */
e465058d
JM
189
190static inline unsigned int num_dma_pages(unsigned long dma, unsigned int dmalen)
191{
192 unsigned int npages;
193
194 npages = PAGE_ALIGN(dma + dmalen) - (dma & PAGE_MASK);
195 npages >>= PAGE_SHIFT;
196
197 return npages;
198}
199
200static inline int translate_phb(struct pci_dev* dev)
201{
f38db651 202 int disabled = bus_info[dev->bus->number].translation_disabled;
e465058d
JM
203 return !disabled;
204}
205
206static void iommu_range_reserve(struct iommu_table *tbl,
207 unsigned long start_addr, unsigned int npages)
208{
209 unsigned long index;
210 unsigned long end;
796e4390 211 unsigned long badbit;
e465058d
JM
212
213 index = start_addr >> PAGE_SHIFT;
214
215 /* bail out if we're asked to reserve a region we don't cover */
216 if (index >= tbl->it_size)
217 return;
218
219 end = index + npages;
220 if (end > tbl->it_size) /* don't go off the table */
221 end = tbl->it_size;
222
796e4390
MBY
223 badbit = verify_bit_range(tbl->it_map, 0, index, end);
224 if (badbit != ~0UL) {
225 if (printk_ratelimit())
e465058d
JM
226 printk(KERN_ERR "Calgary: entry already allocated at "
227 "0x%lx tbl %p dma 0x%lx npages %u\n",
796e4390 228 badbit, tbl, start_addr, npages);
e465058d 229 }
796e4390
MBY
230
231 set_bit_string(tbl->it_map, index, npages);
e465058d
JM
232}
233
234static unsigned long iommu_range_alloc(struct iommu_table *tbl,
235 unsigned int npages)
236{
237 unsigned long offset;
238
239 BUG_ON(npages == 0);
240
241 offset = find_next_zero_string(tbl->it_map, tbl->it_hint,
242 tbl->it_size, npages);
243 if (offset == ~0UL) {
244 tce_cache_blast(tbl);
245 offset = find_next_zero_string(tbl->it_map, 0,
246 tbl->it_size, npages);
247 if (offset == ~0UL) {
248 printk(KERN_WARNING "Calgary: IOMMU full.\n");
249 if (panic_on_overflow)
250 panic("Calgary: fix the allocator.\n");
251 else
252 return bad_dma_address;
253 }
254 }
255
256 set_bit_string(tbl->it_map, offset, npages);
257 tbl->it_hint = offset + npages;
258 BUG_ON(tbl->it_hint > tbl->it_size);
259
260 return offset;
261}
262
263static dma_addr_t iommu_alloc(struct iommu_table *tbl, void *vaddr,
264 unsigned int npages, int direction)
265{
266 unsigned long entry, flags;
267 dma_addr_t ret = bad_dma_address;
268
269 spin_lock_irqsave(&tbl->it_lock, flags);
270
271 entry = iommu_range_alloc(tbl, npages);
272
273 if (unlikely(entry == bad_dma_address))
274 goto error;
275
276 /* set the return dma address */
277 ret = (entry << PAGE_SHIFT) | ((unsigned long)vaddr & ~PAGE_MASK);
278
279 /* put the TCEs in the HW table */
280 tce_build(tbl, entry, npages, (unsigned long)vaddr & PAGE_MASK,
281 direction);
282
283 spin_unlock_irqrestore(&tbl->it_lock, flags);
284
285 return ret;
286
287error:
288 spin_unlock_irqrestore(&tbl->it_lock, flags);
289 printk(KERN_WARNING "Calgary: failed to allocate %u pages in "
290 "iommu %p\n", npages, tbl);
291 return bad_dma_address;
292}
293
294static void __iommu_free(struct iommu_table *tbl, dma_addr_t dma_addr,
295 unsigned int npages)
296{
297 unsigned long entry;
796e4390 298 unsigned long badbit;
e465058d
JM
299
300 entry = dma_addr >> PAGE_SHIFT;
301
302 BUG_ON(entry + npages > tbl->it_size);
303
304 tce_free(tbl, entry, npages);
305
796e4390
MBY
306 badbit = verify_bit_range(tbl->it_map, 1, entry, entry + npages);
307 if (badbit != ~0UL) {
308 if (printk_ratelimit())
e465058d
JM
309 printk(KERN_ERR "Calgary: bit is off at 0x%lx "
310 "tbl %p dma 0x%Lx entry 0x%lx npages %u\n",
796e4390 311 badbit, tbl, dma_addr, entry, npages);
e465058d
JM
312 }
313
314 __clear_bit_string(tbl->it_map, entry, npages);
e465058d
JM
315}
316
317static void iommu_free(struct iommu_table *tbl, dma_addr_t dma_addr,
318 unsigned int npages)
319{
320 unsigned long flags;
321
322 spin_lock_irqsave(&tbl->it_lock, flags);
323
324 __iommu_free(tbl, dma_addr, npages);
325
326 spin_unlock_irqrestore(&tbl->it_lock, flags);
327}
328
329static void __calgary_unmap_sg(struct iommu_table *tbl,
330 struct scatterlist *sglist, int nelems, int direction)
331{
332 while (nelems--) {
333 unsigned int npages;
334 dma_addr_t dma = sglist->dma_address;
335 unsigned int dmalen = sglist->dma_length;
336
337 if (dmalen == 0)
338 break;
339
340 npages = num_dma_pages(dma, dmalen);
341 __iommu_free(tbl, dma, npages);
342 sglist++;
343 }
344}
345
346void calgary_unmap_sg(struct device *dev, struct scatterlist *sglist,
347 int nelems, int direction)
348{
349 unsigned long flags;
350 struct iommu_table *tbl = to_pci_dev(dev)->bus->self->sysdata;
351
352 if (!translate_phb(to_pci_dev(dev)))
353 return;
354
355 spin_lock_irqsave(&tbl->it_lock, flags);
356
357 __calgary_unmap_sg(tbl, sglist, nelems, direction);
358
359 spin_unlock_irqrestore(&tbl->it_lock, flags);
360}
361
362static int calgary_nontranslate_map_sg(struct device* dev,
363 struct scatterlist *sg, int nelems, int direction)
364{
365 int i;
366
367 for (i = 0; i < nelems; i++ ) {
368 struct scatterlist *s = &sg[i];
369 BUG_ON(!s->page);
370 s->dma_address = virt_to_bus(page_address(s->page) +s->offset);
371 s->dma_length = s->length;
372 }
373 return nelems;
374}
375
376int calgary_map_sg(struct device *dev, struct scatterlist *sg,
377 int nelems, int direction)
378{
379 struct iommu_table *tbl = to_pci_dev(dev)->bus->self->sysdata;
380 unsigned long flags;
381 unsigned long vaddr;
382 unsigned int npages;
383 unsigned long entry;
384 int i;
385
386 if (!translate_phb(to_pci_dev(dev)))
387 return calgary_nontranslate_map_sg(dev, sg, nelems, direction);
388
389 spin_lock_irqsave(&tbl->it_lock, flags);
390
391 for (i = 0; i < nelems; i++ ) {
392 struct scatterlist *s = &sg[i];
393 BUG_ON(!s->page);
394
395 vaddr = (unsigned long)page_address(s->page) + s->offset;
396 npages = num_dma_pages(vaddr, s->length);
397
398 entry = iommu_range_alloc(tbl, npages);
399 if (entry == bad_dma_address) {
400 /* makes sure unmap knows to stop */
401 s->dma_length = 0;
402 goto error;
403 }
404
405 s->dma_address = (entry << PAGE_SHIFT) | s->offset;
406
407 /* insert into HW table */
408 tce_build(tbl, entry, npages, vaddr & PAGE_MASK,
409 direction);
410
411 s->dma_length = s->length;
412 }
413
414 spin_unlock_irqrestore(&tbl->it_lock, flags);
415
416 return nelems;
417error:
418 __calgary_unmap_sg(tbl, sg, nelems, direction);
419 for (i = 0; i < nelems; i++) {
420 sg[i].dma_address = bad_dma_address;
421 sg[i].dma_length = 0;
422 }
423 spin_unlock_irqrestore(&tbl->it_lock, flags);
424 return 0;
425}
426
427dma_addr_t calgary_map_single(struct device *dev, void *vaddr,
428 size_t size, int direction)
429{
430 dma_addr_t dma_handle = bad_dma_address;
431 unsigned long uaddr;
432 unsigned int npages;
433 struct iommu_table *tbl = to_pci_dev(dev)->bus->self->sysdata;
434
435 uaddr = (unsigned long)vaddr;
436 npages = num_dma_pages(uaddr, size);
437
438 if (translate_phb(to_pci_dev(dev)))
439 dma_handle = iommu_alloc(tbl, vaddr, npages, direction);
440 else
441 dma_handle = virt_to_bus(vaddr);
442
443 return dma_handle;
444}
445
446void calgary_unmap_single(struct device *dev, dma_addr_t dma_handle,
447 size_t size, int direction)
448{
449 struct iommu_table *tbl = to_pci_dev(dev)->bus->self->sysdata;
450 unsigned int npages;
451
452 if (!translate_phb(to_pci_dev(dev)))
453 return;
454
455 npages = num_dma_pages(dma_handle, size);
456 iommu_free(tbl, dma_handle, npages);
457}
458
459void* calgary_alloc_coherent(struct device *dev, size_t size,
460 dma_addr_t *dma_handle, gfp_t flag)
461{
462 void *ret = NULL;
463 dma_addr_t mapping;
464 unsigned int npages, order;
465 struct iommu_table *tbl;
466
467 tbl = to_pci_dev(dev)->bus->self->sysdata;
468
469 size = PAGE_ALIGN(size); /* size rounded up to full pages */
470 npages = size >> PAGE_SHIFT;
471 order = get_order(size);
472
473 /* alloc enough pages (and possibly more) */
474 ret = (void *)__get_free_pages(flag, order);
475 if (!ret)
476 goto error;
477 memset(ret, 0, size);
478
479 if (translate_phb(to_pci_dev(dev))) {
480 /* set up tces to cover the allocated range */
481 mapping = iommu_alloc(tbl, ret, npages, DMA_BIDIRECTIONAL);
482 if (mapping == bad_dma_address)
483 goto free;
484
485 *dma_handle = mapping;
486 } else /* non translated slot */
487 *dma_handle = virt_to_bus(ret);
488
489 return ret;
490
491free:
492 free_pages((unsigned long)ret, get_order(size));
493 ret = NULL;
494error:
495 return ret;
496}
497
498static struct dma_mapping_ops calgary_dma_ops = {
499 .alloc_coherent = calgary_alloc_coherent,
500 .map_single = calgary_map_single,
501 .unmap_single = calgary_unmap_single,
502 .map_sg = calgary_map_sg,
503 .unmap_sg = calgary_unmap_sg,
504};
505
b34e90b8
LV
506static inline void __iomem * busno_to_bbar(unsigned char num)
507{
508 return bus_info[num].bbar;
509}
510
e465058d
JM
511static inline int busno_to_phbid(unsigned char num)
512{
f38db651 513 return bus_info[num].phbid;
e465058d
JM
514}
515
516static inline unsigned long split_queue_offset(unsigned char num)
517{
518 size_t idx = busno_to_phbid(num);
519
520 return split_queue_offsets[idx];
521}
522
523static inline unsigned long tar_offset(unsigned char num)
524{
525 size_t idx = busno_to_phbid(num);
526
527 return tar_offsets[idx];
528}
529
530static inline unsigned long phb_offset(unsigned char num)
531{
532 size_t idx = busno_to_phbid(num);
533
534 return phb_offsets[idx];
535}
536
537static inline void __iomem* calgary_reg(void __iomem *bar, unsigned long offset)
538{
539 unsigned long target = ((unsigned long)bar) | offset;
540 return (void __iomem*)target;
541}
542
543static void tce_cache_blast(struct iommu_table *tbl)
544{
545 u64 val;
546 u32 aer;
547 int i = 0;
548 void __iomem *bbar = tbl->bbar;
549 void __iomem *target;
550
551 /* disable arbitration on the bus */
552 target = calgary_reg(bbar, phb_offset(tbl->it_busno) | PHB_AER_OFFSET);
553 aer = readl(target);
554 writel(0, target);
555
556 /* read plssr to ensure it got there */
557 target = calgary_reg(bbar, phb_offset(tbl->it_busno) | PHB_PLSSR_OFFSET);
558 val = readl(target);
559
560 /* poll split queues until all DMA activity is done */
561 target = calgary_reg(bbar, split_queue_offset(tbl->it_busno));
562 do {
563 val = readq(target);
564 i++;
565 } while ((val & 0xff) != 0xff && i < 100);
566 if (i == 100)
567 printk(KERN_WARNING "Calgary: PCI bus not quiesced, "
568 "continuing anyway\n");
569
570 /* invalidate TCE cache */
571 target = calgary_reg(bbar, tar_offset(tbl->it_busno));
572 writeq(tbl->tar_val, target);
573
574 /* enable arbitration */
575 target = calgary_reg(bbar, phb_offset(tbl->it_busno) | PHB_AER_OFFSET);
576 writel(aer, target);
577 (void)readl(target); /* flush */
578}
579
580static void __init calgary_reserve_mem_region(struct pci_dev *dev, u64 start,
581 u64 limit)
582{
583 unsigned int numpages;
584
585 limit = limit | 0xfffff;
586 limit++;
587
588 numpages = ((limit - start) >> PAGE_SHIFT);
589 iommu_range_reserve(dev->sysdata, start, numpages);
590}
591
592static void __init calgary_reserve_peripheral_mem_1(struct pci_dev *dev)
593{
594 void __iomem *target;
595 u64 low, high, sizelow;
596 u64 start, limit;
597 struct iommu_table *tbl = dev->sysdata;
598 unsigned char busnum = dev->bus->number;
599 void __iomem *bbar = tbl->bbar;
600
601 /* peripheral MEM_1 region */
602 target = calgary_reg(bbar, phb_offset(busnum) | PHB_MEM_1_LOW);
603 low = be32_to_cpu(readl(target));
604 target = calgary_reg(bbar, phb_offset(busnum) | PHB_MEM_1_HIGH);
605 high = be32_to_cpu(readl(target));
606 target = calgary_reg(bbar, phb_offset(busnum) | PHB_MEM_1_SIZE);
607 sizelow = be32_to_cpu(readl(target));
608
609 start = (high << 32) | low;
610 limit = sizelow;
611
612 calgary_reserve_mem_region(dev, start, limit);
613}
614
615static void __init calgary_reserve_peripheral_mem_2(struct pci_dev *dev)
616{
617 void __iomem *target;
618 u32 val32;
619 u64 low, high, sizelow, sizehigh;
620 u64 start, limit;
621 struct iommu_table *tbl = dev->sysdata;
622 unsigned char busnum = dev->bus->number;
623 void __iomem *bbar = tbl->bbar;
624
625 /* is it enabled? */
626 target = calgary_reg(bbar, phb_offset(busnum) | PHB_CONFIG_RW_OFFSET);
627 val32 = be32_to_cpu(readl(target));
628 if (!(val32 & PHB_MEM2_ENABLE))
629 return;
630
631 target = calgary_reg(bbar, phb_offset(busnum) | PHB_MEM_2_LOW);
632 low = be32_to_cpu(readl(target));
633 target = calgary_reg(bbar, phb_offset(busnum) | PHB_MEM_2_HIGH);
634 high = be32_to_cpu(readl(target));
635 target = calgary_reg(bbar, phb_offset(busnum) | PHB_MEM_2_SIZE_LOW);
636 sizelow = be32_to_cpu(readl(target));
637 target = calgary_reg(bbar, phb_offset(busnum) | PHB_MEM_2_SIZE_HIGH);
638 sizehigh = be32_to_cpu(readl(target));
639
640 start = (high << 32) | low;
641 limit = (sizehigh << 32) | sizelow;
642
643 calgary_reserve_mem_region(dev, start, limit);
644}
645
646/*
647 * some regions of the IO address space do not get translated, so we
648 * must not give devices IO addresses in those regions. The regions
649 * are the 640KB-1MB region and the two PCI peripheral memory holes.
650 * Reserve all of them in the IOMMU bitmap to avoid giving them out
651 * later.
652 */
653static void __init calgary_reserve_regions(struct pci_dev *dev)
654{
655 unsigned int npages;
e465058d
JM
656 u64 start;
657 struct iommu_table *tbl = dev->sysdata;
658
e465058d
JM
659 /* reserve bad_dma_address in case it's a legal address */
660 iommu_range_reserve(tbl, bad_dma_address, 1);
661
662 /* avoid the BIOS/VGA first 640KB-1MB region */
663 start = (640 * 1024);
664 npages = ((1024 - 640) * 1024) >> PAGE_SHIFT;
665 iommu_range_reserve(tbl, start, npages);
666
667 /* reserve the two PCI peripheral memory regions in IO space */
668 calgary_reserve_peripheral_mem_1(dev);
669 calgary_reserve_peripheral_mem_2(dev);
670}
671
672static int __init calgary_setup_tar(struct pci_dev *dev, void __iomem *bbar)
673{
674 u64 val64;
675 u64 table_phys;
676 void __iomem *target;
677 int ret;
678 struct iommu_table *tbl;
679
680 /* build TCE tables for each PHB */
681 ret = build_tce_table(dev, bbar);
682 if (ret)
683 return ret;
684
f38db651
MBY
685 tbl = dev->sysdata;
686 tbl->it_base = (unsigned long)bus_info[dev->bus->number].tce_space;
687 tce_free(tbl, 0, tbl->it_size);
688
e465058d
JM
689 calgary_reserve_regions(dev);
690
691 /* set TARs for each PHB */
692 target = calgary_reg(bbar, tar_offset(dev->bus->number));
693 val64 = be64_to_cpu(readq(target));
694
695 /* zero out all TAR bits under sw control */
696 val64 &= ~TAR_SW_BITS;
697
698 tbl = dev->sysdata;
699 table_phys = (u64)__pa(tbl->it_base);
700 val64 |= table_phys;
701
702 BUG_ON(specified_table_size > TCE_TABLE_SIZE_8M);
703 val64 |= (u64) specified_table_size;
704
705 tbl->tar_val = cpu_to_be64(val64);
706 writeq(tbl->tar_val, target);
707 readq(target); /* flush */
708
709 return 0;
710}
711
b8f4fe66 712static void __init calgary_free_bus(struct pci_dev *dev)
e465058d
JM
713{
714 u64 val64;
715 struct iommu_table *tbl = dev->sysdata;
716 void __iomem *target;
b8f4fe66 717 unsigned int bitmapsz;
e465058d
JM
718
719 target = calgary_reg(tbl->bbar, tar_offset(dev->bus->number));
720 val64 = be64_to_cpu(readq(target));
721 val64 &= ~TAR_SW_BITS;
722 writeq(cpu_to_be64(val64), target);
723 readq(target); /* flush */
724
b8f4fe66
MBY
725 bitmapsz = tbl->it_size / BITS_PER_BYTE;
726 free_pages((unsigned long)tbl->it_map, get_order(bitmapsz));
727 tbl->it_map = NULL;
728
e465058d
JM
729 kfree(tbl);
730 dev->sysdata = NULL;
b8f4fe66
MBY
731
732 /* Can't free bootmem allocated memory after system is up :-( */
733 bus_info[dev->bus->number].tce_space = NULL;
e465058d
JM
734}
735
736static void calgary_watchdog(unsigned long data)
737{
738 struct pci_dev *dev = (struct pci_dev *)data;
739 struct iommu_table *tbl = dev->sysdata;
740 void __iomem *bbar = tbl->bbar;
741 u32 val32;
742 void __iomem *target;
743
744 target = calgary_reg(bbar, phb_offset(tbl->it_busno) | PHB_CSR_OFFSET);
745 val32 = be32_to_cpu(readl(target));
746
747 /* If no error, the agent ID in the CSR is not valid */
748 if (val32 & CSR_AGENT_MASK) {
70d666d6 749 printk(KERN_EMERG "calgary_watchdog: DMA error on PHB %#x, "
e465058d
JM
750 "CSR = %#x\n", dev->bus->number, val32);
751 writel(0, target);
752
753 /* Disable bus that caused the error */
754 target = calgary_reg(bbar, phb_offset(tbl->it_busno) |
755 PHB_CONFIG_RW_OFFSET);
756 val32 = be32_to_cpu(readl(target));
757 val32 |= PHB_SLOT_DISABLE;
758 writel(cpu_to_be32(val32), target);
759 readl(target); /* flush */
760 } else {
761 /* Reset the timer */
762 mod_timer(&tbl->watchdog_timer, jiffies + 2 * HZ);
763 }
764}
765
cb01fc72
MBY
766static void __init calgary_increase_split_completion_timeout(void __iomem *bbar,
767 unsigned char busnum)
768{
769 u64 val64;
770 void __iomem *target;
58db8548 771 unsigned int phb_shift = ~0; /* silence gcc */
cb01fc72
MBY
772 u64 mask;
773
774 switch (busno_to_phbid(busnum)) {
775 case 0: phb_shift = (63 - 19);
776 break;
777 case 1: phb_shift = (63 - 23);
778 break;
779 case 2: phb_shift = (63 - 27);
780 break;
781 case 3: phb_shift = (63 - 35);
782 break;
783 default:
784 BUG_ON(busno_to_phbid(busnum));
785 }
786
787 target = calgary_reg(bbar, CALGARY_CONFIG_REG);
788 val64 = be64_to_cpu(readq(target));
789
790 /* zero out this PHB's timer bits */
791 mask = ~(0xFUL << phb_shift);
792 val64 &= mask;
793 val64 |= (CCR_2SEC_TIMEOUT << phb_shift);
794 writeq(cpu_to_be64(val64), target);
795 readq(target); /* flush */
796}
797
e465058d
JM
798static void __init calgary_enable_translation(struct pci_dev *dev)
799{
800 u32 val32;
801 unsigned char busnum;
802 void __iomem *target;
803 void __iomem *bbar;
804 struct iommu_table *tbl;
805
806 busnum = dev->bus->number;
807 tbl = dev->sysdata;
808 bbar = tbl->bbar;
809
810 /* enable TCE in PHB Config Register */
811 target = calgary_reg(bbar, phb_offset(busnum) | PHB_CONFIG_RW_OFFSET);
812 val32 = be32_to_cpu(readl(target));
813 val32 |= PHB_TCE_ENABLE | PHB_DAC_DISABLE | PHB_MCSR_ENABLE;
814
70d666d6 815 printk(KERN_INFO "Calgary: enabling translation on PHB %#x\n", busnum);
e465058d
JM
816 printk(KERN_INFO "Calgary: errant DMAs will now be prevented on this "
817 "bus.\n");
818
819 writel(cpu_to_be32(val32), target);
820 readl(target); /* flush */
821
cb01fc72
MBY
822 /*
823 * Give split completion a longer timeout on bus 1 for aic94xx
824 * http://bugzilla.kernel.org/show_bug.cgi?id=7180
825 */
826 if (busnum == 1)
827 calgary_increase_split_completion_timeout(bbar, busnum);
828
e465058d
JM
829 init_timer(&tbl->watchdog_timer);
830 tbl->watchdog_timer.function = &calgary_watchdog;
831 tbl->watchdog_timer.data = (unsigned long)dev;
832 mod_timer(&tbl->watchdog_timer, jiffies);
833}
834
835static void __init calgary_disable_translation(struct pci_dev *dev)
836{
837 u32 val32;
838 unsigned char busnum;
839 void __iomem *target;
840 void __iomem *bbar;
841 struct iommu_table *tbl;
842
843 busnum = dev->bus->number;
844 tbl = dev->sysdata;
845 bbar = tbl->bbar;
846
847 /* disable TCE in PHB Config Register */
848 target = calgary_reg(bbar, phb_offset(busnum) | PHB_CONFIG_RW_OFFSET);
849 val32 = be32_to_cpu(readl(target));
850 val32 &= ~(PHB_TCE_ENABLE | PHB_DAC_DISABLE | PHB_MCSR_ENABLE);
851
70d666d6 852 printk(KERN_INFO "Calgary: disabling translation on PHB %#x!\n", busnum);
e465058d
JM
853 writel(cpu_to_be32(val32), target);
854 readl(target); /* flush */
855
856 del_timer_sync(&tbl->watchdog_timer);
857}
858
a4fc520a 859static void __init calgary_init_one_nontraslated(struct pci_dev *dev)
e465058d 860{
871b1700 861 pci_dev_get(dev);
e465058d
JM
862 dev->sysdata = NULL;
863 dev->bus->self = dev;
e465058d
JM
864}
865
866static int __init calgary_init_one(struct pci_dev *dev)
867{
e465058d
JM
868 void __iomem *bbar;
869 int ret;
870
dedc9937
JM
871 BUG_ON(dev->bus->number >= MAX_PHB_BUS_NUM);
872
eae93755 873 bbar = busno_to_bbar(dev->bus->number);
e465058d
JM
874 ret = calgary_setup_tar(dev, bbar);
875 if (ret)
eae93755 876 goto done;
e465058d 877
871b1700 878 pci_dev_get(dev);
e465058d
JM
879 dev->bus->self = dev;
880 calgary_enable_translation(dev);
881
882 return 0;
883
e465058d
JM
884done:
885 return ret;
886}
887
eae93755 888static int __init calgary_locate_bbars(void)
e465058d 889{
eae93755
MBY
890 int ret;
891 int rioidx, phb, bus;
b34e90b8
LV
892 void __iomem *bbar;
893 void __iomem *target;
eae93755 894 unsigned long offset;
b34e90b8
LV
895 u8 start_bus, end_bus;
896 u32 val;
897
eae93755
MBY
898 ret = -ENODATA;
899 for (rioidx = 0; rioidx < rio_table_hdr->num_rio_dev; rioidx++) {
900 struct rio_detail *rio = rio_devs[rioidx];
b34e90b8 901
eae93755 902 if ((rio->type != COMPAT_CALGARY) && (rio->type != ALT_CALGARY))
b34e90b8
LV
903 continue;
904
905 /* map entire 1MB of Calgary config space */
eae93755
MBY
906 bbar = ioremap_nocache(rio->BBAR, 1024 * 1024);
907 if (!bbar)
908 goto error;
b34e90b8
LV
909
910 for (phb = 0; phb < PHBS_PER_CALGARY; phb++) {
eae93755
MBY
911 offset = phb_debug_offsets[phb] | PHB_DEBUG_STUFF_OFFSET;
912 target = calgary_reg(bbar, offset);
b34e90b8 913
b34e90b8
LV
914 val = be32_to_cpu(readl(target));
915 start_bus = (u8)((val & 0x00FF0000) >> 16);
eae93755 916 end_bus = (u8)((val & 0x0000FF00) >> 8);
b34e90b8
LV
917 for (bus = start_bus; bus <= end_bus; bus++) {
918 bus_info[bus].bbar = bbar;
919 bus_info[bus].phbid = phb;
920 }
921 }
922 }
923
eae93755
MBY
924 return 0;
925
926error:
927 /* scan bus_info and iounmap any bbars we previously ioremap'd */
928 for (bus = 0; bus < ARRAY_SIZE(bus_info); bus++)
929 if (bus_info[bus].bbar)
930 iounmap(bus_info[bus].bbar);
931
932 return ret;
933}
934
935static int __init calgary_init(void)
936{
937 int ret;
938 struct pci_dev *dev = NULL;
939
940 ret = calgary_locate_bbars();
941 if (ret)
942 return ret;
e465058d 943
dedc9937 944 do {
e465058d
JM
945 dev = pci_get_device(PCI_VENDOR_ID_IBM,
946 PCI_DEVICE_ID_IBM_CALGARY,
947 dev);
948 if (!dev)
949 break;
950 if (!translate_phb(dev)) {
951 calgary_init_one_nontraslated(dev);
952 continue;
953 }
871b1700 954 if (!bus_info[dev->bus->number].tce_space && !translate_empty_slots)
e465058d 955 continue;
871b1700 956
e465058d
JM
957 ret = calgary_init_one(dev);
958 if (ret)
959 goto error;
dedc9937 960 } while (1);
e465058d
JM
961
962 return ret;
963
964error:
dedc9937 965 do {
7cd8b686 966 dev = pci_get_device_reverse(PCI_VENDOR_ID_IBM,
e465058d
JM
967 PCI_DEVICE_ID_IBM_CALGARY,
968 dev);
9f2dc46d
MBY
969 if (!dev)
970 break;
e465058d
JM
971 if (!translate_phb(dev)) {
972 pci_dev_put(dev);
973 continue;
974 }
f38db651 975 if (!bus_info[dev->bus->number].tce_space && !translate_empty_slots)
e465058d 976 continue;
871b1700 977
e465058d 978 calgary_disable_translation(dev);
b8f4fe66 979 calgary_free_bus(dev);
871b1700 980 pci_dev_put(dev); /* Undo calgary_init_one()'s pci_dev_get() */
dedc9937 981 } while (1);
e465058d
JM
982
983 return ret;
984}
985
986static inline int __init determine_tce_table_size(u64 ram)
987{
988 int ret;
989
990 if (specified_table_size != TCE_TABLE_SIZE_UNSPECIFIED)
991 return specified_table_size;
992
993 /*
994 * Table sizes are from 0 to 7 (TCE_TABLE_SIZE_64K to
995 * TCE_TABLE_SIZE_8M). Table size 0 has 8K entries and each
996 * larger table size has twice as many entries, so shift the
997 * max ram address by 13 to divide by 8K and then look at the
998 * order of the result to choose between 0-7.
999 */
1000 ret = get_order(ram >> 13);
1001 if (ret > TCE_TABLE_SIZE_8M)
1002 ret = TCE_TABLE_SIZE_8M;
1003
1004 return ret;
1005}
1006
b34e90b8
LV
1007static int __init build_detail_arrays(void)
1008{
1009 unsigned long ptr;
1010 int i, scal_detail_size, rio_detail_size;
1011
1012 if (rio_table_hdr->num_scal_dev > MAX_NUMNODES){
1013 printk(KERN_WARNING
eae93755 1014 "Calgary: MAX_NUMNODES too low! Defined as %d, "
b34e90b8
LV
1015 "but system has %d nodes.\n",
1016 MAX_NUMNODES, rio_table_hdr->num_scal_dev);
1017 return -ENODEV;
1018 }
1019
1020 switch (rio_table_hdr->version){
b34e90b8
LV
1021 case 2:
1022 scal_detail_size = 11;
1023 rio_detail_size = 13;
1024 break;
1025 case 3:
1026 scal_detail_size = 12;
1027 rio_detail_size = 15;
1028 break;
eae93755
MBY
1029 default:
1030 printk(KERN_WARNING
1031 "Calgary: Invalid Rio Grande Table Version: %d\n",
1032 rio_table_hdr->version);
1033 return -EPROTO;
b34e90b8
LV
1034 }
1035
1036 ptr = ((unsigned long)rio_table_hdr) + 3;
1037 for (i = 0; i < rio_table_hdr->num_scal_dev;
1038 i++, ptr += scal_detail_size)
1039 scal_devs[i] = (struct scal_detail *)ptr;
1040
1041 for (i = 0; i < rio_table_hdr->num_rio_dev;
1042 i++, ptr += rio_detail_size)
1043 rio_devs[i] = (struct rio_detail *)ptr;
1044
1045 return 0;
1046}
1047
e465058d
JM
1048void __init detect_calgary(void)
1049{
1050 u32 val;
d2105b10 1051 int bus;
e465058d 1052 void *tbl;
d2105b10 1053 int calgary_found = 0;
b34e90b8
LV
1054 unsigned long ptr;
1055 int offset;
eae93755 1056 int ret;
e465058d
JM
1057
1058 /*
1059 * if the user specified iommu=off or iommu=soft or we found
1060 * another HW IOMMU already, bail out.
1061 */
1062 if (swiotlb || no_iommu || iommu_detected)
1063 return;
1064
bff6547b
MBY
1065 if (!use_calgary)
1066 return;
1067
0637a70a
AK
1068 if (!early_pci_allowed())
1069 return;
1070
b34e90b8
LV
1071 ptr = (unsigned long)phys_to_virt(get_bios_ebda());
1072
1073 rio_table_hdr = NULL;
1074 offset = 0x180;
1075 while (offset) {
1076 /* The block id is stored in the 2nd word */
1077 if (*((unsigned short *)(ptr + offset + 2)) == 0x4752){
1078 /* set the pointer past the offset & block id */
eae93755 1079 rio_table_hdr = (struct rio_table_hdr *)(ptr + offset + 4);
b34e90b8
LV
1080 break;
1081 }
1082 /* The next offset is stored in the 1st word. 0 means no more */
1083 offset = *((unsigned short *)(ptr + offset));
1084 }
eae93755 1085 if (!rio_table_hdr) {
b34e90b8
LV
1086 printk(KERN_ERR "Calgary: Unable to locate "
1087 "Rio Grande Table in EBDA - bailing!\n");
1088 return;
1089 }
1090
eae93755
MBY
1091 ret = build_detail_arrays();
1092 if (ret) {
1093 printk(KERN_ERR "Calgary: build_detail_arrays ret %d\n", ret);
b34e90b8 1094 return;
eae93755 1095 }
b34e90b8 1096
e465058d
JM
1097 specified_table_size = determine_tce_table_size(end_pfn * PAGE_SIZE);
1098
d2105b10
JM
1099 for (bus = 0; bus < MAX_PHB_BUS_NUM; bus++) {
1100 int dev;
f38db651 1101 struct calgary_bus_info *info = &bus_info[bus];
d2105b10 1102
e465058d
JM
1103 if (read_pci_config(bus, 0, 0, 0) != PCI_VENDOR_DEVICE_ID_CALGARY)
1104 continue;
d2105b10 1105
f38db651 1106 if (info->translation_disabled)
e465058d 1107 continue;
f38db651 1108
e465058d 1109 /*
d2105b10
JM
1110 * Scan the slots of the PCI bus to see if there is a device present.
1111 * The parent bus will be the zero-ith device, so start at 1.
e465058d 1112 */
d2105b10
JM
1113 for (dev = 1; dev < 8; dev++) {
1114 val = read_pci_config(bus, dev, 0, 0);
1115 if (val != 0xffffffff || translate_empty_slots) {
1116 tbl = alloc_tce_table();
1117 if (!tbl)
1118 goto cleanup;
f38db651 1119 info->tce_space = tbl;
d2105b10
JM
1120 calgary_found = 1;
1121 break;
1122 }
1123 }
e465058d
JM
1124 }
1125
d2105b10 1126 if (calgary_found) {
e465058d
JM
1127 iommu_detected = 1;
1128 calgary_detected = 1;
de684652
MBY
1129 printk(KERN_INFO "PCI-DMA: Calgary IOMMU detected.\n");
1130 printk(KERN_INFO "PCI-DMA: Calgary TCE table spec is %d, "
1131 "CONFIG_IOMMU_DEBUG is %s.\n", specified_table_size,
1132 debugging ? "enabled" : "disabled");
e465058d
JM
1133 }
1134 return;
1135
1136cleanup:
f38db651
MBY
1137 for (--bus; bus >= 0; --bus) {
1138 struct calgary_bus_info *info = &bus_info[bus];
1139
1140 if (info->tce_space)
1141 free_tce_table(info->tce_space);
1142 }
e465058d
JM
1143}
1144
1145int __init calgary_iommu_init(void)
1146{
1147 int ret;
1148
1149 if (no_iommu || swiotlb)
1150 return -ENODEV;
1151
1152 if (!calgary_detected)
1153 return -ENODEV;
1154
1155 /* ok, we're trying to use Calgary - let's roll */
1156 printk(KERN_INFO "PCI-DMA: Using Calgary IOMMU\n");
1157
1158 ret = calgary_init();
1159 if (ret) {
1160 printk(KERN_ERR "PCI-DMA: Calgary init failed %d, "
1161 "falling back to no_iommu\n", ret);
1162 if (end_pfn > MAX_DMA32_PFN)
1163 printk(KERN_ERR "WARNING more than 4GB of memory, "
1164 "32bit PCI may malfunction.\n");
1165 return ret;
1166 }
1167
1168 force_iommu = 1;
1169 dma_ops = &calgary_dma_ops;
1170
1171 return 0;
1172}
1173
1174static int __init calgary_parse_options(char *p)
1175{
1176 unsigned int bridge;
1177 size_t len;
1178 char* endp;
1179
1180 while (*p) {
1181 if (!strncmp(p, "64k", 3))
1182 specified_table_size = TCE_TABLE_SIZE_64K;
1183 else if (!strncmp(p, "128k", 4))
1184 specified_table_size = TCE_TABLE_SIZE_128K;
1185 else if (!strncmp(p, "256k", 4))
1186 specified_table_size = TCE_TABLE_SIZE_256K;
1187 else if (!strncmp(p, "512k", 4))
1188 specified_table_size = TCE_TABLE_SIZE_512K;
1189 else if (!strncmp(p, "1M", 2))
1190 specified_table_size = TCE_TABLE_SIZE_1M;
1191 else if (!strncmp(p, "2M", 2))
1192 specified_table_size = TCE_TABLE_SIZE_2M;
1193 else if (!strncmp(p, "4M", 2))
1194 specified_table_size = TCE_TABLE_SIZE_4M;
1195 else if (!strncmp(p, "8M", 2))
1196 specified_table_size = TCE_TABLE_SIZE_8M;
1197
1198 len = strlen("translate_empty_slots");
1199 if (!strncmp(p, "translate_empty_slots", len))
1200 translate_empty_slots = 1;
1201
1202 len = strlen("disable");
1203 if (!strncmp(p, "disable", len)) {
1204 p += len;
1205 if (*p == '=')
1206 ++p;
1207 if (*p == '\0')
1208 break;
1209 bridge = simple_strtol(p, &endp, 0);
1210 if (p == endp)
1211 break;
1212
d2105b10 1213 if (bridge < MAX_PHB_BUS_NUM) {
e465058d 1214 printk(KERN_INFO "Calgary: disabling "
70d666d6 1215 "translation for PHB %#x\n", bridge);
f38db651 1216 bus_info[bridge].translation_disabled = 1;
e465058d
JM
1217 }
1218 }
1219
1220 p = strpbrk(p, ",");
1221 if (!p)
1222 break;
1223
1224 p++; /* skip ',' */
1225 }
1226 return 1;
1227}
1228__setup("calgary=", calgary_parse_options);
This page took 0.178516 seconds and 5 git commands to generate.