162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * arch/powerpc/sysdev/dart_iommu.c 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Copyright (C) 2004 Olof Johansson <olof@lixom.net>, IBM Corporation 662306a36Sopenharmony_ci * Copyright (C) 2005 Benjamin Herrenschmidt <benh@kernel.crashing.org>, 762306a36Sopenharmony_ci * IBM Corporation 862306a36Sopenharmony_ci * 962306a36Sopenharmony_ci * Based on pSeries_iommu.c: 1062306a36Sopenharmony_ci * Copyright (C) 2001 Mike Corrigan & Dave Engebretsen, IBM Corporation 1162306a36Sopenharmony_ci * Copyright (C) 2004 Olof Johansson <olof@lixom.net>, IBM Corporation 1262306a36Sopenharmony_ci * 1362306a36Sopenharmony_ci * Dynamic DMA mapping support, Apple U3, U4 & IBM CPC925 "DART" iommu. 1462306a36Sopenharmony_ci */ 1562306a36Sopenharmony_ci 1662306a36Sopenharmony_ci#include <linux/init.h> 1762306a36Sopenharmony_ci#include <linux/types.h> 1862306a36Sopenharmony_ci#include <linux/mm.h> 1962306a36Sopenharmony_ci#include <linux/spinlock.h> 2062306a36Sopenharmony_ci#include <linux/string.h> 2162306a36Sopenharmony_ci#include <linux/pci.h> 2262306a36Sopenharmony_ci#include <linux/dma-mapping.h> 2362306a36Sopenharmony_ci#include <linux/vmalloc.h> 2462306a36Sopenharmony_ci#include <linux/suspend.h> 2562306a36Sopenharmony_ci#include <linux/memblock.h> 2662306a36Sopenharmony_ci#include <linux/gfp.h> 2762306a36Sopenharmony_ci#include <linux/kmemleak.h> 2862306a36Sopenharmony_ci#include <linux/of_address.h> 2962306a36Sopenharmony_ci#include <asm/io.h> 3062306a36Sopenharmony_ci#include <asm/iommu.h> 3162306a36Sopenharmony_ci#include <asm/pci-bridge.h> 3262306a36Sopenharmony_ci#include <asm/machdep.h> 3362306a36Sopenharmony_ci#include <asm/cacheflush.h> 3462306a36Sopenharmony_ci#include <asm/ppc-pci.h> 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_ci#include "dart.h" 3762306a36Sopenharmony_ci 3862306a36Sopenharmony_ci/* DART table address and size */ 3962306a36Sopenharmony_cistatic u32 *dart_tablebase; 4062306a36Sopenharmony_cistatic unsigned long dart_tablesize; 4162306a36Sopenharmony_ci 4262306a36Sopenharmony_ci/* Mapped base address for the dart */ 4362306a36Sopenharmony_cistatic unsigned int __iomem *dart; 4462306a36Sopenharmony_ci 4562306a36Sopenharmony_ci/* Dummy val that entries are set to when unused */ 4662306a36Sopenharmony_cistatic unsigned int dart_emptyval; 4762306a36Sopenharmony_ci 4862306a36Sopenharmony_cistatic struct iommu_table iommu_table_dart; 4962306a36Sopenharmony_cistatic int iommu_table_dart_inited; 5062306a36Sopenharmony_cistatic int dart_dirty; 5162306a36Sopenharmony_cistatic int dart_is_u4; 5262306a36Sopenharmony_ci 5362306a36Sopenharmony_ci#define DART_U4_BYPASS_BASE 0x8000000000ull 5462306a36Sopenharmony_ci 5562306a36Sopenharmony_ci#define DBG(...) 5662306a36Sopenharmony_ci 5762306a36Sopenharmony_cistatic DEFINE_SPINLOCK(invalidate_lock); 5862306a36Sopenharmony_ci 5962306a36Sopenharmony_cistatic inline void dart_tlb_invalidate_all(void) 6062306a36Sopenharmony_ci{ 6162306a36Sopenharmony_ci unsigned long l = 0; 6262306a36Sopenharmony_ci unsigned int reg, inv_bit; 6362306a36Sopenharmony_ci unsigned long limit; 6462306a36Sopenharmony_ci unsigned long flags; 6562306a36Sopenharmony_ci 6662306a36Sopenharmony_ci spin_lock_irqsave(&invalidate_lock, flags); 6762306a36Sopenharmony_ci 6862306a36Sopenharmony_ci DBG("dart: flush\n"); 6962306a36Sopenharmony_ci 7062306a36Sopenharmony_ci /* To invalidate the DART, set the DARTCNTL_FLUSHTLB bit in the 7162306a36Sopenharmony_ci * control register and wait for it to clear. 7262306a36Sopenharmony_ci * 7362306a36Sopenharmony_ci * Gotcha: Sometimes, the DART won't detect that the bit gets 7462306a36Sopenharmony_ci * set. If so, clear it and set it again. 7562306a36Sopenharmony_ci */ 7662306a36Sopenharmony_ci 7762306a36Sopenharmony_ci limit = 0; 7862306a36Sopenharmony_ci 7962306a36Sopenharmony_ci inv_bit = dart_is_u4 ? DART_CNTL_U4_FLUSHTLB : DART_CNTL_U3_FLUSHTLB; 8062306a36Sopenharmony_ciretry: 8162306a36Sopenharmony_ci l = 0; 8262306a36Sopenharmony_ci reg = DART_IN(DART_CNTL); 8362306a36Sopenharmony_ci reg |= inv_bit; 8462306a36Sopenharmony_ci DART_OUT(DART_CNTL, reg); 8562306a36Sopenharmony_ci 8662306a36Sopenharmony_ci while ((DART_IN(DART_CNTL) & inv_bit) && l < (1L << limit)) 8762306a36Sopenharmony_ci l++; 8862306a36Sopenharmony_ci if (l == (1L << limit)) { 8962306a36Sopenharmony_ci if (limit < 4) { 9062306a36Sopenharmony_ci limit++; 9162306a36Sopenharmony_ci reg = DART_IN(DART_CNTL); 9262306a36Sopenharmony_ci reg &= ~inv_bit; 9362306a36Sopenharmony_ci DART_OUT(DART_CNTL, reg); 9462306a36Sopenharmony_ci goto retry; 9562306a36Sopenharmony_ci } else 9662306a36Sopenharmony_ci panic("DART: TLB did not flush after waiting a long " 9762306a36Sopenharmony_ci "time. Buggy U3 ?"); 9862306a36Sopenharmony_ci } 9962306a36Sopenharmony_ci 10062306a36Sopenharmony_ci spin_unlock_irqrestore(&invalidate_lock, flags); 10162306a36Sopenharmony_ci} 10262306a36Sopenharmony_ci 10362306a36Sopenharmony_cistatic inline void dart_tlb_invalidate_one(unsigned long bus_rpn) 10462306a36Sopenharmony_ci{ 10562306a36Sopenharmony_ci unsigned int reg; 10662306a36Sopenharmony_ci unsigned int l, limit; 10762306a36Sopenharmony_ci unsigned long flags; 10862306a36Sopenharmony_ci 10962306a36Sopenharmony_ci spin_lock_irqsave(&invalidate_lock, flags); 11062306a36Sopenharmony_ci 11162306a36Sopenharmony_ci reg = DART_CNTL_U4_ENABLE | DART_CNTL_U4_IONE | 11262306a36Sopenharmony_ci (bus_rpn & DART_CNTL_U4_IONE_MASK); 11362306a36Sopenharmony_ci DART_OUT(DART_CNTL, reg); 11462306a36Sopenharmony_ci 11562306a36Sopenharmony_ci limit = 0; 11662306a36Sopenharmony_ciwait_more: 11762306a36Sopenharmony_ci l = 0; 11862306a36Sopenharmony_ci while ((DART_IN(DART_CNTL) & DART_CNTL_U4_IONE) && l < (1L << limit)) { 11962306a36Sopenharmony_ci rmb(); 12062306a36Sopenharmony_ci l++; 12162306a36Sopenharmony_ci } 12262306a36Sopenharmony_ci 12362306a36Sopenharmony_ci if (l == (1L << limit)) { 12462306a36Sopenharmony_ci if (limit < 4) { 12562306a36Sopenharmony_ci limit++; 12662306a36Sopenharmony_ci goto wait_more; 12762306a36Sopenharmony_ci } else 12862306a36Sopenharmony_ci panic("DART: TLB did not flush after waiting a long " 12962306a36Sopenharmony_ci "time. Buggy U4 ?"); 13062306a36Sopenharmony_ci } 13162306a36Sopenharmony_ci 13262306a36Sopenharmony_ci spin_unlock_irqrestore(&invalidate_lock, flags); 13362306a36Sopenharmony_ci} 13462306a36Sopenharmony_ci 13562306a36Sopenharmony_cistatic void dart_cache_sync(unsigned int *base, unsigned int count) 13662306a36Sopenharmony_ci{ 13762306a36Sopenharmony_ci /* 13862306a36Sopenharmony_ci * We add 1 to the number of entries to flush, following a 13962306a36Sopenharmony_ci * comment in Darwin indicating that the memory controller 14062306a36Sopenharmony_ci * can prefetch unmapped memory under some circumstances. 14162306a36Sopenharmony_ci */ 14262306a36Sopenharmony_ci unsigned long start = (unsigned long)base; 14362306a36Sopenharmony_ci unsigned long end = start + (count + 1) * sizeof(unsigned int); 14462306a36Sopenharmony_ci unsigned int tmp; 14562306a36Sopenharmony_ci 14662306a36Sopenharmony_ci /* Perform a standard cache flush */ 14762306a36Sopenharmony_ci flush_dcache_range(start, end); 14862306a36Sopenharmony_ci 14962306a36Sopenharmony_ci /* 15062306a36Sopenharmony_ci * Perform the sequence described in the CPC925 manual to 15162306a36Sopenharmony_ci * ensure all the data gets to a point the cache incoherent 15262306a36Sopenharmony_ci * DART hardware will see. 15362306a36Sopenharmony_ci */ 15462306a36Sopenharmony_ci asm volatile(" sync;" 15562306a36Sopenharmony_ci " isync;" 15662306a36Sopenharmony_ci " dcbf 0,%1;" 15762306a36Sopenharmony_ci " sync;" 15862306a36Sopenharmony_ci " isync;" 15962306a36Sopenharmony_ci " lwz %0,0(%1);" 16062306a36Sopenharmony_ci " isync" : "=r" (tmp) : "r" (end) : "memory"); 16162306a36Sopenharmony_ci} 16262306a36Sopenharmony_ci 16362306a36Sopenharmony_cistatic void dart_flush(struct iommu_table *tbl) 16462306a36Sopenharmony_ci{ 16562306a36Sopenharmony_ci mb(); 16662306a36Sopenharmony_ci if (dart_dirty) { 16762306a36Sopenharmony_ci dart_tlb_invalidate_all(); 16862306a36Sopenharmony_ci dart_dirty = 0; 16962306a36Sopenharmony_ci } 17062306a36Sopenharmony_ci} 17162306a36Sopenharmony_ci 17262306a36Sopenharmony_cistatic int dart_build(struct iommu_table *tbl, long index, 17362306a36Sopenharmony_ci long npages, unsigned long uaddr, 17462306a36Sopenharmony_ci enum dma_data_direction direction, 17562306a36Sopenharmony_ci unsigned long attrs) 17662306a36Sopenharmony_ci{ 17762306a36Sopenharmony_ci unsigned int *dp, *orig_dp; 17862306a36Sopenharmony_ci unsigned int rpn; 17962306a36Sopenharmony_ci long l; 18062306a36Sopenharmony_ci 18162306a36Sopenharmony_ci DBG("dart: build at: %lx, %lx, addr: %x\n", index, npages, uaddr); 18262306a36Sopenharmony_ci 18362306a36Sopenharmony_ci orig_dp = dp = ((unsigned int*)tbl->it_base) + index; 18462306a36Sopenharmony_ci 18562306a36Sopenharmony_ci /* On U3, all memory is contiguous, so we can move this 18662306a36Sopenharmony_ci * out of the loop. 18762306a36Sopenharmony_ci */ 18862306a36Sopenharmony_ci l = npages; 18962306a36Sopenharmony_ci while (l--) { 19062306a36Sopenharmony_ci rpn = __pa(uaddr) >> DART_PAGE_SHIFT; 19162306a36Sopenharmony_ci 19262306a36Sopenharmony_ci *(dp++) = DARTMAP_VALID | (rpn & DARTMAP_RPNMASK); 19362306a36Sopenharmony_ci 19462306a36Sopenharmony_ci uaddr += DART_PAGE_SIZE; 19562306a36Sopenharmony_ci } 19662306a36Sopenharmony_ci dart_cache_sync(orig_dp, npages); 19762306a36Sopenharmony_ci 19862306a36Sopenharmony_ci if (dart_is_u4) { 19962306a36Sopenharmony_ci rpn = index; 20062306a36Sopenharmony_ci while (npages--) 20162306a36Sopenharmony_ci dart_tlb_invalidate_one(rpn++); 20262306a36Sopenharmony_ci } else { 20362306a36Sopenharmony_ci dart_dirty = 1; 20462306a36Sopenharmony_ci } 20562306a36Sopenharmony_ci return 0; 20662306a36Sopenharmony_ci} 20762306a36Sopenharmony_ci 20862306a36Sopenharmony_ci 20962306a36Sopenharmony_cistatic void dart_free(struct iommu_table *tbl, long index, long npages) 21062306a36Sopenharmony_ci{ 21162306a36Sopenharmony_ci unsigned int *dp, *orig_dp; 21262306a36Sopenharmony_ci long orig_npages = npages; 21362306a36Sopenharmony_ci 21462306a36Sopenharmony_ci /* We don't worry about flushing the TLB cache. The only drawback of 21562306a36Sopenharmony_ci * not doing it is that we won't catch buggy device drivers doing 21662306a36Sopenharmony_ci * bad DMAs, but then no 32-bit architecture ever does either. 21762306a36Sopenharmony_ci */ 21862306a36Sopenharmony_ci 21962306a36Sopenharmony_ci DBG("dart: free at: %lx, %lx\n", index, npages); 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ci orig_dp = dp = ((unsigned int *)tbl->it_base) + index; 22262306a36Sopenharmony_ci 22362306a36Sopenharmony_ci while (npages--) 22462306a36Sopenharmony_ci *(dp++) = dart_emptyval; 22562306a36Sopenharmony_ci 22662306a36Sopenharmony_ci dart_cache_sync(orig_dp, orig_npages); 22762306a36Sopenharmony_ci} 22862306a36Sopenharmony_ci 22962306a36Sopenharmony_cistatic void __init allocate_dart(void) 23062306a36Sopenharmony_ci{ 23162306a36Sopenharmony_ci unsigned long tmp; 23262306a36Sopenharmony_ci 23362306a36Sopenharmony_ci /* 512 pages (2MB) is max DART tablesize. */ 23462306a36Sopenharmony_ci dart_tablesize = 1UL << 21; 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci /* 23762306a36Sopenharmony_ci * 16MB (1 << 24) alignment. We allocate a full 16Mb chuck since we 23862306a36Sopenharmony_ci * will blow up an entire large page anyway in the kernel mapping. 23962306a36Sopenharmony_ci */ 24062306a36Sopenharmony_ci dart_tablebase = memblock_alloc_try_nid_raw(SZ_16M, SZ_16M, 24162306a36Sopenharmony_ci MEMBLOCK_LOW_LIMIT, SZ_2G, 24262306a36Sopenharmony_ci NUMA_NO_NODE); 24362306a36Sopenharmony_ci if (!dart_tablebase) 24462306a36Sopenharmony_ci panic("Failed to allocate 16MB below 2GB for DART table\n"); 24562306a36Sopenharmony_ci 24662306a36Sopenharmony_ci /* There is no point scanning the DART space for leaks*/ 24762306a36Sopenharmony_ci kmemleak_no_scan((void *)dart_tablebase); 24862306a36Sopenharmony_ci 24962306a36Sopenharmony_ci /* Allocate a spare page to map all invalid DART pages. We need to do 25062306a36Sopenharmony_ci * that to work around what looks like a problem with the HT bridge 25162306a36Sopenharmony_ci * prefetching into invalid pages and corrupting data 25262306a36Sopenharmony_ci */ 25362306a36Sopenharmony_ci tmp = memblock_phys_alloc(DART_PAGE_SIZE, DART_PAGE_SIZE); 25462306a36Sopenharmony_ci if (!tmp) 25562306a36Sopenharmony_ci panic("DART: table allocation failed\n"); 25662306a36Sopenharmony_ci 25762306a36Sopenharmony_ci dart_emptyval = DARTMAP_VALID | ((tmp >> DART_PAGE_SHIFT) & 25862306a36Sopenharmony_ci DARTMAP_RPNMASK); 25962306a36Sopenharmony_ci 26062306a36Sopenharmony_ci printk(KERN_INFO "DART table allocated at: %p\n", dart_tablebase); 26162306a36Sopenharmony_ci} 26262306a36Sopenharmony_ci 26362306a36Sopenharmony_cistatic int __init dart_init(struct device_node *dart_node) 26462306a36Sopenharmony_ci{ 26562306a36Sopenharmony_ci unsigned int i; 26662306a36Sopenharmony_ci unsigned long base, size; 26762306a36Sopenharmony_ci struct resource r; 26862306a36Sopenharmony_ci 26962306a36Sopenharmony_ci /* IOMMU disabled by the user ? bail out */ 27062306a36Sopenharmony_ci if (iommu_is_off) 27162306a36Sopenharmony_ci return -ENODEV; 27262306a36Sopenharmony_ci 27362306a36Sopenharmony_ci /* 27462306a36Sopenharmony_ci * Only use the DART if the machine has more than 1GB of RAM 27562306a36Sopenharmony_ci * or if requested with iommu=on on cmdline. 27662306a36Sopenharmony_ci * 27762306a36Sopenharmony_ci * 1GB of RAM is picked as limit because some default devices 27862306a36Sopenharmony_ci * (i.e. Airport Extreme) have 30 bit address range limits. 27962306a36Sopenharmony_ci */ 28062306a36Sopenharmony_ci 28162306a36Sopenharmony_ci if (!iommu_force_on && memblock_end_of_DRAM() <= 0x40000000ull) 28262306a36Sopenharmony_ci return -ENODEV; 28362306a36Sopenharmony_ci 28462306a36Sopenharmony_ci /* Get DART registers */ 28562306a36Sopenharmony_ci if (of_address_to_resource(dart_node, 0, &r)) 28662306a36Sopenharmony_ci panic("DART: can't get register base ! "); 28762306a36Sopenharmony_ci 28862306a36Sopenharmony_ci /* Map in DART registers */ 28962306a36Sopenharmony_ci dart = ioremap(r.start, resource_size(&r)); 29062306a36Sopenharmony_ci if (dart == NULL) 29162306a36Sopenharmony_ci panic("DART: Cannot map registers!"); 29262306a36Sopenharmony_ci 29362306a36Sopenharmony_ci /* Allocate the DART and dummy page */ 29462306a36Sopenharmony_ci allocate_dart(); 29562306a36Sopenharmony_ci 29662306a36Sopenharmony_ci /* Fill initial table */ 29762306a36Sopenharmony_ci for (i = 0; i < dart_tablesize/4; i++) 29862306a36Sopenharmony_ci dart_tablebase[i] = dart_emptyval; 29962306a36Sopenharmony_ci 30062306a36Sopenharmony_ci /* Push to memory */ 30162306a36Sopenharmony_ci dart_cache_sync(dart_tablebase, dart_tablesize / sizeof(u32)); 30262306a36Sopenharmony_ci 30362306a36Sopenharmony_ci /* Initialize DART with table base and enable it. */ 30462306a36Sopenharmony_ci base = ((unsigned long)dart_tablebase) >> DART_PAGE_SHIFT; 30562306a36Sopenharmony_ci size = dart_tablesize >> DART_PAGE_SHIFT; 30662306a36Sopenharmony_ci if (dart_is_u4) { 30762306a36Sopenharmony_ci size &= DART_SIZE_U4_SIZE_MASK; 30862306a36Sopenharmony_ci DART_OUT(DART_BASE_U4, base); 30962306a36Sopenharmony_ci DART_OUT(DART_SIZE_U4, size); 31062306a36Sopenharmony_ci DART_OUT(DART_CNTL, DART_CNTL_U4_ENABLE); 31162306a36Sopenharmony_ci } else { 31262306a36Sopenharmony_ci size &= DART_CNTL_U3_SIZE_MASK; 31362306a36Sopenharmony_ci DART_OUT(DART_CNTL, 31462306a36Sopenharmony_ci DART_CNTL_U3_ENABLE | 31562306a36Sopenharmony_ci (base << DART_CNTL_U3_BASE_SHIFT) | 31662306a36Sopenharmony_ci (size << DART_CNTL_U3_SIZE_SHIFT)); 31762306a36Sopenharmony_ci } 31862306a36Sopenharmony_ci 31962306a36Sopenharmony_ci /* Invalidate DART to get rid of possible stale TLBs */ 32062306a36Sopenharmony_ci dart_tlb_invalidate_all(); 32162306a36Sopenharmony_ci 32262306a36Sopenharmony_ci printk(KERN_INFO "DART IOMMU initialized for %s type chipset\n", 32362306a36Sopenharmony_ci dart_is_u4 ? "U4" : "U3"); 32462306a36Sopenharmony_ci 32562306a36Sopenharmony_ci return 0; 32662306a36Sopenharmony_ci} 32762306a36Sopenharmony_ci 32862306a36Sopenharmony_cistatic struct iommu_table_ops iommu_dart_ops = { 32962306a36Sopenharmony_ci .set = dart_build, 33062306a36Sopenharmony_ci .clear = dart_free, 33162306a36Sopenharmony_ci .flush = dart_flush, 33262306a36Sopenharmony_ci}; 33362306a36Sopenharmony_ci 33462306a36Sopenharmony_cistatic void iommu_table_dart_setup(void) 33562306a36Sopenharmony_ci{ 33662306a36Sopenharmony_ci iommu_table_dart.it_busno = 0; 33762306a36Sopenharmony_ci iommu_table_dart.it_offset = 0; 33862306a36Sopenharmony_ci /* it_size is in number of entries */ 33962306a36Sopenharmony_ci iommu_table_dart.it_size = dart_tablesize / sizeof(u32); 34062306a36Sopenharmony_ci iommu_table_dart.it_page_shift = IOMMU_PAGE_SHIFT_4K; 34162306a36Sopenharmony_ci 34262306a36Sopenharmony_ci /* Initialize the common IOMMU code */ 34362306a36Sopenharmony_ci iommu_table_dart.it_base = (unsigned long)dart_tablebase; 34462306a36Sopenharmony_ci iommu_table_dart.it_index = 0; 34562306a36Sopenharmony_ci iommu_table_dart.it_blocksize = 1; 34662306a36Sopenharmony_ci iommu_table_dart.it_ops = &iommu_dart_ops; 34762306a36Sopenharmony_ci if (!iommu_init_table(&iommu_table_dart, -1, 0, 0)) 34862306a36Sopenharmony_ci panic("Failed to initialize iommu table"); 34962306a36Sopenharmony_ci 35062306a36Sopenharmony_ci /* Reserve the last page of the DART to avoid possible prefetch 35162306a36Sopenharmony_ci * past the DART mapped area 35262306a36Sopenharmony_ci */ 35362306a36Sopenharmony_ci set_bit(iommu_table_dart.it_size - 1, iommu_table_dart.it_map); 35462306a36Sopenharmony_ci} 35562306a36Sopenharmony_ci 35662306a36Sopenharmony_cistatic void pci_dma_bus_setup_dart(struct pci_bus *bus) 35762306a36Sopenharmony_ci{ 35862306a36Sopenharmony_ci if (!iommu_table_dart_inited) { 35962306a36Sopenharmony_ci iommu_table_dart_inited = 1; 36062306a36Sopenharmony_ci iommu_table_dart_setup(); 36162306a36Sopenharmony_ci } 36262306a36Sopenharmony_ci} 36362306a36Sopenharmony_ci 36462306a36Sopenharmony_cistatic bool dart_device_on_pcie(struct device *dev) 36562306a36Sopenharmony_ci{ 36662306a36Sopenharmony_ci struct device_node *np = of_node_get(dev->of_node); 36762306a36Sopenharmony_ci 36862306a36Sopenharmony_ci while(np) { 36962306a36Sopenharmony_ci if (of_device_is_compatible(np, "U4-pcie") || 37062306a36Sopenharmony_ci of_device_is_compatible(np, "u4-pcie")) { 37162306a36Sopenharmony_ci of_node_put(np); 37262306a36Sopenharmony_ci return true; 37362306a36Sopenharmony_ci } 37462306a36Sopenharmony_ci np = of_get_next_parent(np); 37562306a36Sopenharmony_ci } 37662306a36Sopenharmony_ci return false; 37762306a36Sopenharmony_ci} 37862306a36Sopenharmony_ci 37962306a36Sopenharmony_cistatic void pci_dma_dev_setup_dart(struct pci_dev *dev) 38062306a36Sopenharmony_ci{ 38162306a36Sopenharmony_ci if (dart_is_u4 && dart_device_on_pcie(&dev->dev)) 38262306a36Sopenharmony_ci dev->dev.archdata.dma_offset = DART_U4_BYPASS_BASE; 38362306a36Sopenharmony_ci set_iommu_table_base(&dev->dev, &iommu_table_dart); 38462306a36Sopenharmony_ci} 38562306a36Sopenharmony_ci 38662306a36Sopenharmony_cistatic bool iommu_bypass_supported_dart(struct pci_dev *dev, u64 mask) 38762306a36Sopenharmony_ci{ 38862306a36Sopenharmony_ci return dart_is_u4 && 38962306a36Sopenharmony_ci dart_device_on_pcie(&dev->dev) && 39062306a36Sopenharmony_ci mask >= DMA_BIT_MASK(40); 39162306a36Sopenharmony_ci} 39262306a36Sopenharmony_ci 39362306a36Sopenharmony_civoid __init iommu_init_early_dart(struct pci_controller_ops *controller_ops) 39462306a36Sopenharmony_ci{ 39562306a36Sopenharmony_ci struct device_node *dn; 39662306a36Sopenharmony_ci 39762306a36Sopenharmony_ci /* Find the DART in the device-tree */ 39862306a36Sopenharmony_ci dn = of_find_compatible_node(NULL, "dart", "u3-dart"); 39962306a36Sopenharmony_ci if (dn == NULL) { 40062306a36Sopenharmony_ci dn = of_find_compatible_node(NULL, "dart", "u4-dart"); 40162306a36Sopenharmony_ci if (dn == NULL) 40262306a36Sopenharmony_ci return; /* use default direct_dma_ops */ 40362306a36Sopenharmony_ci dart_is_u4 = 1; 40462306a36Sopenharmony_ci } 40562306a36Sopenharmony_ci 40662306a36Sopenharmony_ci /* Initialize the DART HW */ 40762306a36Sopenharmony_ci if (dart_init(dn) != 0) { 40862306a36Sopenharmony_ci of_node_put(dn); 40962306a36Sopenharmony_ci return; 41062306a36Sopenharmony_ci } 41162306a36Sopenharmony_ci /* 41262306a36Sopenharmony_ci * U4 supports a DART bypass, we use it for 64-bit capable devices to 41362306a36Sopenharmony_ci * improve performance. However, that only works for devices connected 41462306a36Sopenharmony_ci * to the U4 own PCIe interface, not bridged through hypertransport. 41562306a36Sopenharmony_ci * We need the device to support at least 40 bits of addresses. 41662306a36Sopenharmony_ci */ 41762306a36Sopenharmony_ci controller_ops->dma_dev_setup = pci_dma_dev_setup_dart; 41862306a36Sopenharmony_ci controller_ops->dma_bus_setup = pci_dma_bus_setup_dart; 41962306a36Sopenharmony_ci controller_ops->iommu_bypass_supported = iommu_bypass_supported_dart; 42062306a36Sopenharmony_ci 42162306a36Sopenharmony_ci /* Setup pci_dma ops */ 42262306a36Sopenharmony_ci set_pci_dma_ops(&dma_iommu_ops); 42362306a36Sopenharmony_ci of_node_put(dn); 42462306a36Sopenharmony_ci} 42562306a36Sopenharmony_ci 42662306a36Sopenharmony_ci#ifdef CONFIG_PM 42762306a36Sopenharmony_cistatic void iommu_dart_restore(void) 42862306a36Sopenharmony_ci{ 42962306a36Sopenharmony_ci dart_cache_sync(dart_tablebase, dart_tablesize / sizeof(u32)); 43062306a36Sopenharmony_ci dart_tlb_invalidate_all(); 43162306a36Sopenharmony_ci} 43262306a36Sopenharmony_ci 43362306a36Sopenharmony_cistatic int __init iommu_init_late_dart(void) 43462306a36Sopenharmony_ci{ 43562306a36Sopenharmony_ci if (!dart_tablebase) 43662306a36Sopenharmony_ci return 0; 43762306a36Sopenharmony_ci 43862306a36Sopenharmony_ci ppc_md.iommu_restore = iommu_dart_restore; 43962306a36Sopenharmony_ci 44062306a36Sopenharmony_ci return 0; 44162306a36Sopenharmony_ci} 44262306a36Sopenharmony_ci 44362306a36Sopenharmony_cilate_initcall(iommu_init_late_dart); 44462306a36Sopenharmony_ci#endif /* CONFIG_PM */ 445