162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Copyright © 2006-2009, Intel Corporation. 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Author: Anil S Keshavamurthy <anil.s.keshavamurthy@intel.com> 662306a36Sopenharmony_ci */ 762306a36Sopenharmony_ci 862306a36Sopenharmony_ci#include <linux/iova.h> 962306a36Sopenharmony_ci#include <linux/module.h> 1062306a36Sopenharmony_ci#include <linux/slab.h> 1162306a36Sopenharmony_ci#include <linux/smp.h> 1262306a36Sopenharmony_ci#include <linux/bitops.h> 1362306a36Sopenharmony_ci#include <linux/cpu.h> 1462306a36Sopenharmony_ci 1562306a36Sopenharmony_ci/* The anchor node sits above the top of the usable address space */ 1662306a36Sopenharmony_ci#define IOVA_ANCHOR ~0UL 1762306a36Sopenharmony_ci 1862306a36Sopenharmony_ci#define IOVA_RANGE_CACHE_MAX_SIZE 6 /* log of max cached IOVA range size (in pages) */ 1962306a36Sopenharmony_ci 2062306a36Sopenharmony_cistatic bool iova_rcache_insert(struct iova_domain *iovad, 2162306a36Sopenharmony_ci unsigned long pfn, 2262306a36Sopenharmony_ci unsigned long size); 2362306a36Sopenharmony_cistatic unsigned long iova_rcache_get(struct iova_domain *iovad, 2462306a36Sopenharmony_ci unsigned long size, 2562306a36Sopenharmony_ci unsigned long limit_pfn); 2662306a36Sopenharmony_cistatic void free_cpu_cached_iovas(unsigned int cpu, struct iova_domain *iovad); 2762306a36Sopenharmony_cistatic void free_iova_rcaches(struct iova_domain *iovad); 2862306a36Sopenharmony_ci 2962306a36Sopenharmony_ciunsigned long iova_rcache_range(void) 3062306a36Sopenharmony_ci{ 3162306a36Sopenharmony_ci return PAGE_SIZE << (IOVA_RANGE_CACHE_MAX_SIZE - 1); 3262306a36Sopenharmony_ci} 3362306a36Sopenharmony_ci 3462306a36Sopenharmony_cistatic int iova_cpuhp_dead(unsigned int cpu, struct hlist_node *node) 3562306a36Sopenharmony_ci{ 3662306a36Sopenharmony_ci struct iova_domain *iovad; 3762306a36Sopenharmony_ci 3862306a36Sopenharmony_ci iovad = hlist_entry_safe(node, struct iova_domain, cpuhp_dead); 3962306a36Sopenharmony_ci 4062306a36Sopenharmony_ci free_cpu_cached_iovas(cpu, iovad); 4162306a36Sopenharmony_ci return 0; 4262306a36Sopenharmony_ci} 4362306a36Sopenharmony_ci 4462306a36Sopenharmony_cistatic void free_global_cached_iovas(struct iova_domain *iovad); 4562306a36Sopenharmony_ci 4662306a36Sopenharmony_cistatic struct iova *to_iova(struct rb_node *node) 4762306a36Sopenharmony_ci{ 4862306a36Sopenharmony_ci return rb_entry(node, struct iova, node); 4962306a36Sopenharmony_ci} 5062306a36Sopenharmony_ci 5162306a36Sopenharmony_civoid 5262306a36Sopenharmony_ciinit_iova_domain(struct iova_domain *iovad, unsigned long granule, 5362306a36Sopenharmony_ci unsigned long start_pfn) 5462306a36Sopenharmony_ci{ 5562306a36Sopenharmony_ci /* 5662306a36Sopenharmony_ci * IOVA granularity will normally be equal to the smallest 5762306a36Sopenharmony_ci * supported IOMMU page size; both *must* be capable of 5862306a36Sopenharmony_ci * representing individual CPU pages exactly. 5962306a36Sopenharmony_ci */ 6062306a36Sopenharmony_ci BUG_ON((granule > PAGE_SIZE) || !is_power_of_2(granule)); 6162306a36Sopenharmony_ci 6262306a36Sopenharmony_ci spin_lock_init(&iovad->iova_rbtree_lock); 6362306a36Sopenharmony_ci iovad->rbroot = RB_ROOT; 6462306a36Sopenharmony_ci iovad->cached_node = &iovad->anchor.node; 6562306a36Sopenharmony_ci iovad->cached32_node = &iovad->anchor.node; 6662306a36Sopenharmony_ci iovad->granule = granule; 6762306a36Sopenharmony_ci iovad->start_pfn = start_pfn; 6862306a36Sopenharmony_ci iovad->dma_32bit_pfn = 1UL << (32 - iova_shift(iovad)); 6962306a36Sopenharmony_ci iovad->max32_alloc_size = iovad->dma_32bit_pfn; 7062306a36Sopenharmony_ci iovad->anchor.pfn_lo = iovad->anchor.pfn_hi = IOVA_ANCHOR; 7162306a36Sopenharmony_ci rb_link_node(&iovad->anchor.node, NULL, &iovad->rbroot.rb_node); 7262306a36Sopenharmony_ci rb_insert_color(&iovad->anchor.node, &iovad->rbroot); 7362306a36Sopenharmony_ci} 7462306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(init_iova_domain); 7562306a36Sopenharmony_ci 7662306a36Sopenharmony_cistatic struct rb_node * 7762306a36Sopenharmony_ci__get_cached_rbnode(struct iova_domain *iovad, unsigned long limit_pfn) 7862306a36Sopenharmony_ci{ 7962306a36Sopenharmony_ci if (limit_pfn <= iovad->dma_32bit_pfn) 8062306a36Sopenharmony_ci return iovad->cached32_node; 8162306a36Sopenharmony_ci 8262306a36Sopenharmony_ci return iovad->cached_node; 8362306a36Sopenharmony_ci} 8462306a36Sopenharmony_ci 8562306a36Sopenharmony_cistatic void 8662306a36Sopenharmony_ci__cached_rbnode_insert_update(struct iova_domain *iovad, struct iova *new) 8762306a36Sopenharmony_ci{ 8862306a36Sopenharmony_ci if (new->pfn_hi < iovad->dma_32bit_pfn) 8962306a36Sopenharmony_ci iovad->cached32_node = &new->node; 9062306a36Sopenharmony_ci else 9162306a36Sopenharmony_ci iovad->cached_node = &new->node; 9262306a36Sopenharmony_ci} 9362306a36Sopenharmony_ci 9462306a36Sopenharmony_cistatic void 9562306a36Sopenharmony_ci__cached_rbnode_delete_update(struct iova_domain *iovad, struct iova *free) 9662306a36Sopenharmony_ci{ 9762306a36Sopenharmony_ci struct iova *cached_iova; 9862306a36Sopenharmony_ci 9962306a36Sopenharmony_ci cached_iova = to_iova(iovad->cached32_node); 10062306a36Sopenharmony_ci if (free == cached_iova || 10162306a36Sopenharmony_ci (free->pfn_hi < iovad->dma_32bit_pfn && 10262306a36Sopenharmony_ci free->pfn_lo >= cached_iova->pfn_lo)) 10362306a36Sopenharmony_ci iovad->cached32_node = rb_next(&free->node); 10462306a36Sopenharmony_ci 10562306a36Sopenharmony_ci if (free->pfn_lo < iovad->dma_32bit_pfn) 10662306a36Sopenharmony_ci iovad->max32_alloc_size = iovad->dma_32bit_pfn; 10762306a36Sopenharmony_ci 10862306a36Sopenharmony_ci cached_iova = to_iova(iovad->cached_node); 10962306a36Sopenharmony_ci if (free->pfn_lo >= cached_iova->pfn_lo) 11062306a36Sopenharmony_ci iovad->cached_node = rb_next(&free->node); 11162306a36Sopenharmony_ci} 11262306a36Sopenharmony_ci 11362306a36Sopenharmony_cistatic struct rb_node *iova_find_limit(struct iova_domain *iovad, unsigned long limit_pfn) 11462306a36Sopenharmony_ci{ 11562306a36Sopenharmony_ci struct rb_node *node, *next; 11662306a36Sopenharmony_ci /* 11762306a36Sopenharmony_ci * Ideally what we'd like to judge here is whether limit_pfn is close 11862306a36Sopenharmony_ci * enough to the highest-allocated IOVA that starting the allocation 11962306a36Sopenharmony_ci * walk from the anchor node will be quicker than this initial work to 12062306a36Sopenharmony_ci * find an exact starting point (especially if that ends up being the 12162306a36Sopenharmony_ci * anchor node anyway). This is an incredibly crude approximation which 12262306a36Sopenharmony_ci * only really helps the most likely case, but is at least trivially easy. 12362306a36Sopenharmony_ci */ 12462306a36Sopenharmony_ci if (limit_pfn > iovad->dma_32bit_pfn) 12562306a36Sopenharmony_ci return &iovad->anchor.node; 12662306a36Sopenharmony_ci 12762306a36Sopenharmony_ci node = iovad->rbroot.rb_node; 12862306a36Sopenharmony_ci while (to_iova(node)->pfn_hi < limit_pfn) 12962306a36Sopenharmony_ci node = node->rb_right; 13062306a36Sopenharmony_ci 13162306a36Sopenharmony_cisearch_left: 13262306a36Sopenharmony_ci while (node->rb_left && to_iova(node->rb_left)->pfn_lo >= limit_pfn) 13362306a36Sopenharmony_ci node = node->rb_left; 13462306a36Sopenharmony_ci 13562306a36Sopenharmony_ci if (!node->rb_left) 13662306a36Sopenharmony_ci return node; 13762306a36Sopenharmony_ci 13862306a36Sopenharmony_ci next = node->rb_left; 13962306a36Sopenharmony_ci while (next->rb_right) { 14062306a36Sopenharmony_ci next = next->rb_right; 14162306a36Sopenharmony_ci if (to_iova(next)->pfn_lo >= limit_pfn) { 14262306a36Sopenharmony_ci node = next; 14362306a36Sopenharmony_ci goto search_left; 14462306a36Sopenharmony_ci } 14562306a36Sopenharmony_ci } 14662306a36Sopenharmony_ci 14762306a36Sopenharmony_ci return node; 14862306a36Sopenharmony_ci} 14962306a36Sopenharmony_ci 15062306a36Sopenharmony_ci/* Insert the iova into domain rbtree by holding writer lock */ 15162306a36Sopenharmony_cistatic void 15262306a36Sopenharmony_ciiova_insert_rbtree(struct rb_root *root, struct iova *iova, 15362306a36Sopenharmony_ci struct rb_node *start) 15462306a36Sopenharmony_ci{ 15562306a36Sopenharmony_ci struct rb_node **new, *parent = NULL; 15662306a36Sopenharmony_ci 15762306a36Sopenharmony_ci new = (start) ? &start : &(root->rb_node); 15862306a36Sopenharmony_ci /* Figure out where to put new node */ 15962306a36Sopenharmony_ci while (*new) { 16062306a36Sopenharmony_ci struct iova *this = to_iova(*new); 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_ci parent = *new; 16362306a36Sopenharmony_ci 16462306a36Sopenharmony_ci if (iova->pfn_lo < this->pfn_lo) 16562306a36Sopenharmony_ci new = &((*new)->rb_left); 16662306a36Sopenharmony_ci else if (iova->pfn_lo > this->pfn_lo) 16762306a36Sopenharmony_ci new = &((*new)->rb_right); 16862306a36Sopenharmony_ci else { 16962306a36Sopenharmony_ci WARN_ON(1); /* this should not happen */ 17062306a36Sopenharmony_ci return; 17162306a36Sopenharmony_ci } 17262306a36Sopenharmony_ci } 17362306a36Sopenharmony_ci /* Add new node and rebalance tree. */ 17462306a36Sopenharmony_ci rb_link_node(&iova->node, parent, new); 17562306a36Sopenharmony_ci rb_insert_color(&iova->node, root); 17662306a36Sopenharmony_ci} 17762306a36Sopenharmony_ci 17862306a36Sopenharmony_cistatic int __alloc_and_insert_iova_range(struct iova_domain *iovad, 17962306a36Sopenharmony_ci unsigned long size, unsigned long limit_pfn, 18062306a36Sopenharmony_ci struct iova *new, bool size_aligned) 18162306a36Sopenharmony_ci{ 18262306a36Sopenharmony_ci struct rb_node *curr, *prev; 18362306a36Sopenharmony_ci struct iova *curr_iova; 18462306a36Sopenharmony_ci unsigned long flags; 18562306a36Sopenharmony_ci unsigned long new_pfn, retry_pfn; 18662306a36Sopenharmony_ci unsigned long align_mask = ~0UL; 18762306a36Sopenharmony_ci unsigned long high_pfn = limit_pfn, low_pfn = iovad->start_pfn; 18862306a36Sopenharmony_ci 18962306a36Sopenharmony_ci if (size_aligned) 19062306a36Sopenharmony_ci align_mask <<= fls_long(size - 1); 19162306a36Sopenharmony_ci 19262306a36Sopenharmony_ci /* Walk the tree backwards */ 19362306a36Sopenharmony_ci spin_lock_irqsave(&iovad->iova_rbtree_lock, flags); 19462306a36Sopenharmony_ci if (limit_pfn <= iovad->dma_32bit_pfn && 19562306a36Sopenharmony_ci size >= iovad->max32_alloc_size) 19662306a36Sopenharmony_ci goto iova32_full; 19762306a36Sopenharmony_ci 19862306a36Sopenharmony_ci curr = __get_cached_rbnode(iovad, limit_pfn); 19962306a36Sopenharmony_ci curr_iova = to_iova(curr); 20062306a36Sopenharmony_ci retry_pfn = curr_iova->pfn_hi; 20162306a36Sopenharmony_ci 20262306a36Sopenharmony_ciretry: 20362306a36Sopenharmony_ci do { 20462306a36Sopenharmony_ci high_pfn = min(high_pfn, curr_iova->pfn_lo); 20562306a36Sopenharmony_ci new_pfn = (high_pfn - size) & align_mask; 20662306a36Sopenharmony_ci prev = curr; 20762306a36Sopenharmony_ci curr = rb_prev(curr); 20862306a36Sopenharmony_ci curr_iova = to_iova(curr); 20962306a36Sopenharmony_ci } while (curr && new_pfn <= curr_iova->pfn_hi && new_pfn >= low_pfn); 21062306a36Sopenharmony_ci 21162306a36Sopenharmony_ci if (high_pfn < size || new_pfn < low_pfn) { 21262306a36Sopenharmony_ci if (low_pfn == iovad->start_pfn && retry_pfn < limit_pfn) { 21362306a36Sopenharmony_ci high_pfn = limit_pfn; 21462306a36Sopenharmony_ci low_pfn = retry_pfn + 1; 21562306a36Sopenharmony_ci curr = iova_find_limit(iovad, limit_pfn); 21662306a36Sopenharmony_ci curr_iova = to_iova(curr); 21762306a36Sopenharmony_ci goto retry; 21862306a36Sopenharmony_ci } 21962306a36Sopenharmony_ci iovad->max32_alloc_size = size; 22062306a36Sopenharmony_ci goto iova32_full; 22162306a36Sopenharmony_ci } 22262306a36Sopenharmony_ci 22362306a36Sopenharmony_ci /* pfn_lo will point to size aligned address if size_aligned is set */ 22462306a36Sopenharmony_ci new->pfn_lo = new_pfn; 22562306a36Sopenharmony_ci new->pfn_hi = new->pfn_lo + size - 1; 22662306a36Sopenharmony_ci 22762306a36Sopenharmony_ci /* If we have 'prev', it's a valid place to start the insertion. */ 22862306a36Sopenharmony_ci iova_insert_rbtree(&iovad->rbroot, new, prev); 22962306a36Sopenharmony_ci __cached_rbnode_insert_update(iovad, new); 23062306a36Sopenharmony_ci 23162306a36Sopenharmony_ci spin_unlock_irqrestore(&iovad->iova_rbtree_lock, flags); 23262306a36Sopenharmony_ci return 0; 23362306a36Sopenharmony_ci 23462306a36Sopenharmony_ciiova32_full: 23562306a36Sopenharmony_ci spin_unlock_irqrestore(&iovad->iova_rbtree_lock, flags); 23662306a36Sopenharmony_ci return -ENOMEM; 23762306a36Sopenharmony_ci} 23862306a36Sopenharmony_ci 23962306a36Sopenharmony_cistatic struct kmem_cache *iova_cache; 24062306a36Sopenharmony_cistatic unsigned int iova_cache_users; 24162306a36Sopenharmony_cistatic DEFINE_MUTEX(iova_cache_mutex); 24262306a36Sopenharmony_ci 24362306a36Sopenharmony_cistatic struct iova *alloc_iova_mem(void) 24462306a36Sopenharmony_ci{ 24562306a36Sopenharmony_ci return kmem_cache_zalloc(iova_cache, GFP_ATOMIC | __GFP_NOWARN); 24662306a36Sopenharmony_ci} 24762306a36Sopenharmony_ci 24862306a36Sopenharmony_cistatic void free_iova_mem(struct iova *iova) 24962306a36Sopenharmony_ci{ 25062306a36Sopenharmony_ci if (iova->pfn_lo != IOVA_ANCHOR) 25162306a36Sopenharmony_ci kmem_cache_free(iova_cache, iova); 25262306a36Sopenharmony_ci} 25362306a36Sopenharmony_ci 25462306a36Sopenharmony_ciint iova_cache_get(void) 25562306a36Sopenharmony_ci{ 25662306a36Sopenharmony_ci mutex_lock(&iova_cache_mutex); 25762306a36Sopenharmony_ci if (!iova_cache_users) { 25862306a36Sopenharmony_ci int ret; 25962306a36Sopenharmony_ci 26062306a36Sopenharmony_ci ret = cpuhp_setup_state_multi(CPUHP_IOMMU_IOVA_DEAD, "iommu/iova:dead", NULL, 26162306a36Sopenharmony_ci iova_cpuhp_dead); 26262306a36Sopenharmony_ci if (ret) { 26362306a36Sopenharmony_ci mutex_unlock(&iova_cache_mutex); 26462306a36Sopenharmony_ci pr_err("Couldn't register cpuhp handler\n"); 26562306a36Sopenharmony_ci return ret; 26662306a36Sopenharmony_ci } 26762306a36Sopenharmony_ci 26862306a36Sopenharmony_ci iova_cache = kmem_cache_create( 26962306a36Sopenharmony_ci "iommu_iova", sizeof(struct iova), 0, 27062306a36Sopenharmony_ci SLAB_HWCACHE_ALIGN, NULL); 27162306a36Sopenharmony_ci if (!iova_cache) { 27262306a36Sopenharmony_ci cpuhp_remove_multi_state(CPUHP_IOMMU_IOVA_DEAD); 27362306a36Sopenharmony_ci mutex_unlock(&iova_cache_mutex); 27462306a36Sopenharmony_ci pr_err("Couldn't create iova cache\n"); 27562306a36Sopenharmony_ci return -ENOMEM; 27662306a36Sopenharmony_ci } 27762306a36Sopenharmony_ci } 27862306a36Sopenharmony_ci 27962306a36Sopenharmony_ci iova_cache_users++; 28062306a36Sopenharmony_ci mutex_unlock(&iova_cache_mutex); 28162306a36Sopenharmony_ci 28262306a36Sopenharmony_ci return 0; 28362306a36Sopenharmony_ci} 28462306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(iova_cache_get); 28562306a36Sopenharmony_ci 28662306a36Sopenharmony_civoid iova_cache_put(void) 28762306a36Sopenharmony_ci{ 28862306a36Sopenharmony_ci mutex_lock(&iova_cache_mutex); 28962306a36Sopenharmony_ci if (WARN_ON(!iova_cache_users)) { 29062306a36Sopenharmony_ci mutex_unlock(&iova_cache_mutex); 29162306a36Sopenharmony_ci return; 29262306a36Sopenharmony_ci } 29362306a36Sopenharmony_ci iova_cache_users--; 29462306a36Sopenharmony_ci if (!iova_cache_users) { 29562306a36Sopenharmony_ci cpuhp_remove_multi_state(CPUHP_IOMMU_IOVA_DEAD); 29662306a36Sopenharmony_ci kmem_cache_destroy(iova_cache); 29762306a36Sopenharmony_ci } 29862306a36Sopenharmony_ci mutex_unlock(&iova_cache_mutex); 29962306a36Sopenharmony_ci} 30062306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(iova_cache_put); 30162306a36Sopenharmony_ci 30262306a36Sopenharmony_ci/** 30362306a36Sopenharmony_ci * alloc_iova - allocates an iova 30462306a36Sopenharmony_ci * @iovad: - iova domain in question 30562306a36Sopenharmony_ci * @size: - size of page frames to allocate 30662306a36Sopenharmony_ci * @limit_pfn: - max limit address 30762306a36Sopenharmony_ci * @size_aligned: - set if size_aligned address range is required 30862306a36Sopenharmony_ci * This function allocates an iova in the range iovad->start_pfn to limit_pfn, 30962306a36Sopenharmony_ci * searching top-down from limit_pfn to iovad->start_pfn. If the size_aligned 31062306a36Sopenharmony_ci * flag is set then the allocated address iova->pfn_lo will be naturally 31162306a36Sopenharmony_ci * aligned on roundup_power_of_two(size). 31262306a36Sopenharmony_ci */ 31362306a36Sopenharmony_cistruct iova * 31462306a36Sopenharmony_cialloc_iova(struct iova_domain *iovad, unsigned long size, 31562306a36Sopenharmony_ci unsigned long limit_pfn, 31662306a36Sopenharmony_ci bool size_aligned) 31762306a36Sopenharmony_ci{ 31862306a36Sopenharmony_ci struct iova *new_iova; 31962306a36Sopenharmony_ci int ret; 32062306a36Sopenharmony_ci 32162306a36Sopenharmony_ci new_iova = alloc_iova_mem(); 32262306a36Sopenharmony_ci if (!new_iova) 32362306a36Sopenharmony_ci return NULL; 32462306a36Sopenharmony_ci 32562306a36Sopenharmony_ci ret = __alloc_and_insert_iova_range(iovad, size, limit_pfn + 1, 32662306a36Sopenharmony_ci new_iova, size_aligned); 32762306a36Sopenharmony_ci 32862306a36Sopenharmony_ci if (ret) { 32962306a36Sopenharmony_ci free_iova_mem(new_iova); 33062306a36Sopenharmony_ci return NULL; 33162306a36Sopenharmony_ci } 33262306a36Sopenharmony_ci 33362306a36Sopenharmony_ci return new_iova; 33462306a36Sopenharmony_ci} 33562306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(alloc_iova); 33662306a36Sopenharmony_ci 33762306a36Sopenharmony_cistatic struct iova * 33862306a36Sopenharmony_ciprivate_find_iova(struct iova_domain *iovad, unsigned long pfn) 33962306a36Sopenharmony_ci{ 34062306a36Sopenharmony_ci struct rb_node *node = iovad->rbroot.rb_node; 34162306a36Sopenharmony_ci 34262306a36Sopenharmony_ci assert_spin_locked(&iovad->iova_rbtree_lock); 34362306a36Sopenharmony_ci 34462306a36Sopenharmony_ci while (node) { 34562306a36Sopenharmony_ci struct iova *iova = to_iova(node); 34662306a36Sopenharmony_ci 34762306a36Sopenharmony_ci if (pfn < iova->pfn_lo) 34862306a36Sopenharmony_ci node = node->rb_left; 34962306a36Sopenharmony_ci else if (pfn > iova->pfn_hi) 35062306a36Sopenharmony_ci node = node->rb_right; 35162306a36Sopenharmony_ci else 35262306a36Sopenharmony_ci return iova; /* pfn falls within iova's range */ 35362306a36Sopenharmony_ci } 35462306a36Sopenharmony_ci 35562306a36Sopenharmony_ci return NULL; 35662306a36Sopenharmony_ci} 35762306a36Sopenharmony_ci 35862306a36Sopenharmony_cistatic void remove_iova(struct iova_domain *iovad, struct iova *iova) 35962306a36Sopenharmony_ci{ 36062306a36Sopenharmony_ci assert_spin_locked(&iovad->iova_rbtree_lock); 36162306a36Sopenharmony_ci __cached_rbnode_delete_update(iovad, iova); 36262306a36Sopenharmony_ci rb_erase(&iova->node, &iovad->rbroot); 36362306a36Sopenharmony_ci} 36462306a36Sopenharmony_ci 36562306a36Sopenharmony_ci/** 36662306a36Sopenharmony_ci * find_iova - finds an iova for a given pfn 36762306a36Sopenharmony_ci * @iovad: - iova domain in question. 36862306a36Sopenharmony_ci * @pfn: - page frame number 36962306a36Sopenharmony_ci * This function finds and returns an iova belonging to the 37062306a36Sopenharmony_ci * given domain which matches the given pfn. 37162306a36Sopenharmony_ci */ 37262306a36Sopenharmony_cistruct iova *find_iova(struct iova_domain *iovad, unsigned long pfn) 37362306a36Sopenharmony_ci{ 37462306a36Sopenharmony_ci unsigned long flags; 37562306a36Sopenharmony_ci struct iova *iova; 37662306a36Sopenharmony_ci 37762306a36Sopenharmony_ci /* Take the lock so that no other thread is manipulating the rbtree */ 37862306a36Sopenharmony_ci spin_lock_irqsave(&iovad->iova_rbtree_lock, flags); 37962306a36Sopenharmony_ci iova = private_find_iova(iovad, pfn); 38062306a36Sopenharmony_ci spin_unlock_irqrestore(&iovad->iova_rbtree_lock, flags); 38162306a36Sopenharmony_ci return iova; 38262306a36Sopenharmony_ci} 38362306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(find_iova); 38462306a36Sopenharmony_ci 38562306a36Sopenharmony_ci/** 38662306a36Sopenharmony_ci * __free_iova - frees the given iova 38762306a36Sopenharmony_ci * @iovad: iova domain in question. 38862306a36Sopenharmony_ci * @iova: iova in question. 38962306a36Sopenharmony_ci * Frees the given iova belonging to the giving domain 39062306a36Sopenharmony_ci */ 39162306a36Sopenharmony_civoid 39262306a36Sopenharmony_ci__free_iova(struct iova_domain *iovad, struct iova *iova) 39362306a36Sopenharmony_ci{ 39462306a36Sopenharmony_ci unsigned long flags; 39562306a36Sopenharmony_ci 39662306a36Sopenharmony_ci spin_lock_irqsave(&iovad->iova_rbtree_lock, flags); 39762306a36Sopenharmony_ci remove_iova(iovad, iova); 39862306a36Sopenharmony_ci spin_unlock_irqrestore(&iovad->iova_rbtree_lock, flags); 39962306a36Sopenharmony_ci free_iova_mem(iova); 40062306a36Sopenharmony_ci} 40162306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(__free_iova); 40262306a36Sopenharmony_ci 40362306a36Sopenharmony_ci/** 40462306a36Sopenharmony_ci * free_iova - finds and frees the iova for a given pfn 40562306a36Sopenharmony_ci * @iovad: - iova domain in question. 40662306a36Sopenharmony_ci * @pfn: - pfn that is allocated previously 40762306a36Sopenharmony_ci * This functions finds an iova for a given pfn and then 40862306a36Sopenharmony_ci * frees the iova from that domain. 40962306a36Sopenharmony_ci */ 41062306a36Sopenharmony_civoid 41162306a36Sopenharmony_cifree_iova(struct iova_domain *iovad, unsigned long pfn) 41262306a36Sopenharmony_ci{ 41362306a36Sopenharmony_ci unsigned long flags; 41462306a36Sopenharmony_ci struct iova *iova; 41562306a36Sopenharmony_ci 41662306a36Sopenharmony_ci spin_lock_irqsave(&iovad->iova_rbtree_lock, flags); 41762306a36Sopenharmony_ci iova = private_find_iova(iovad, pfn); 41862306a36Sopenharmony_ci if (!iova) { 41962306a36Sopenharmony_ci spin_unlock_irqrestore(&iovad->iova_rbtree_lock, flags); 42062306a36Sopenharmony_ci return; 42162306a36Sopenharmony_ci } 42262306a36Sopenharmony_ci remove_iova(iovad, iova); 42362306a36Sopenharmony_ci spin_unlock_irqrestore(&iovad->iova_rbtree_lock, flags); 42462306a36Sopenharmony_ci free_iova_mem(iova); 42562306a36Sopenharmony_ci} 42662306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(free_iova); 42762306a36Sopenharmony_ci 42862306a36Sopenharmony_ci/** 42962306a36Sopenharmony_ci * alloc_iova_fast - allocates an iova from rcache 43062306a36Sopenharmony_ci * @iovad: - iova domain in question 43162306a36Sopenharmony_ci * @size: - size of page frames to allocate 43262306a36Sopenharmony_ci * @limit_pfn: - max limit address 43362306a36Sopenharmony_ci * @flush_rcache: - set to flush rcache on regular allocation failure 43462306a36Sopenharmony_ci * This function tries to satisfy an iova allocation from the rcache, 43562306a36Sopenharmony_ci * and falls back to regular allocation on failure. If regular allocation 43662306a36Sopenharmony_ci * fails too and the flush_rcache flag is set then the rcache will be flushed. 43762306a36Sopenharmony_ci*/ 43862306a36Sopenharmony_ciunsigned long 43962306a36Sopenharmony_cialloc_iova_fast(struct iova_domain *iovad, unsigned long size, 44062306a36Sopenharmony_ci unsigned long limit_pfn, bool flush_rcache) 44162306a36Sopenharmony_ci{ 44262306a36Sopenharmony_ci unsigned long iova_pfn; 44362306a36Sopenharmony_ci struct iova *new_iova; 44462306a36Sopenharmony_ci 44562306a36Sopenharmony_ci /* 44662306a36Sopenharmony_ci * Freeing non-power-of-two-sized allocations back into the IOVA caches 44762306a36Sopenharmony_ci * will come back to bite us badly, so we have to waste a bit of space 44862306a36Sopenharmony_ci * rounding up anything cacheable to make sure that can't happen. The 44962306a36Sopenharmony_ci * order of the unadjusted size will still match upon freeing. 45062306a36Sopenharmony_ci */ 45162306a36Sopenharmony_ci if (size < (1 << (IOVA_RANGE_CACHE_MAX_SIZE - 1))) 45262306a36Sopenharmony_ci size = roundup_pow_of_two(size); 45362306a36Sopenharmony_ci 45462306a36Sopenharmony_ci iova_pfn = iova_rcache_get(iovad, size, limit_pfn + 1); 45562306a36Sopenharmony_ci if (iova_pfn) 45662306a36Sopenharmony_ci return iova_pfn; 45762306a36Sopenharmony_ci 45862306a36Sopenharmony_ciretry: 45962306a36Sopenharmony_ci new_iova = alloc_iova(iovad, size, limit_pfn, true); 46062306a36Sopenharmony_ci if (!new_iova) { 46162306a36Sopenharmony_ci unsigned int cpu; 46262306a36Sopenharmony_ci 46362306a36Sopenharmony_ci if (!flush_rcache) 46462306a36Sopenharmony_ci return 0; 46562306a36Sopenharmony_ci 46662306a36Sopenharmony_ci /* Try replenishing IOVAs by flushing rcache. */ 46762306a36Sopenharmony_ci flush_rcache = false; 46862306a36Sopenharmony_ci for_each_online_cpu(cpu) 46962306a36Sopenharmony_ci free_cpu_cached_iovas(cpu, iovad); 47062306a36Sopenharmony_ci free_global_cached_iovas(iovad); 47162306a36Sopenharmony_ci goto retry; 47262306a36Sopenharmony_ci } 47362306a36Sopenharmony_ci 47462306a36Sopenharmony_ci return new_iova->pfn_lo; 47562306a36Sopenharmony_ci} 47662306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(alloc_iova_fast); 47762306a36Sopenharmony_ci 47862306a36Sopenharmony_ci/** 47962306a36Sopenharmony_ci * free_iova_fast - free iova pfn range into rcache 48062306a36Sopenharmony_ci * @iovad: - iova domain in question. 48162306a36Sopenharmony_ci * @pfn: - pfn that is allocated previously 48262306a36Sopenharmony_ci * @size: - # of pages in range 48362306a36Sopenharmony_ci * This functions frees an iova range by trying to put it into the rcache, 48462306a36Sopenharmony_ci * falling back to regular iova deallocation via free_iova() if this fails. 48562306a36Sopenharmony_ci */ 48662306a36Sopenharmony_civoid 48762306a36Sopenharmony_cifree_iova_fast(struct iova_domain *iovad, unsigned long pfn, unsigned long size) 48862306a36Sopenharmony_ci{ 48962306a36Sopenharmony_ci if (iova_rcache_insert(iovad, pfn, size)) 49062306a36Sopenharmony_ci return; 49162306a36Sopenharmony_ci 49262306a36Sopenharmony_ci free_iova(iovad, pfn); 49362306a36Sopenharmony_ci} 49462306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(free_iova_fast); 49562306a36Sopenharmony_ci 49662306a36Sopenharmony_cistatic void iova_domain_free_rcaches(struct iova_domain *iovad) 49762306a36Sopenharmony_ci{ 49862306a36Sopenharmony_ci cpuhp_state_remove_instance_nocalls(CPUHP_IOMMU_IOVA_DEAD, 49962306a36Sopenharmony_ci &iovad->cpuhp_dead); 50062306a36Sopenharmony_ci free_iova_rcaches(iovad); 50162306a36Sopenharmony_ci} 50262306a36Sopenharmony_ci 50362306a36Sopenharmony_ci/** 50462306a36Sopenharmony_ci * put_iova_domain - destroys the iova domain 50562306a36Sopenharmony_ci * @iovad: - iova domain in question. 50662306a36Sopenharmony_ci * All the iova's in that domain are destroyed. 50762306a36Sopenharmony_ci */ 50862306a36Sopenharmony_civoid put_iova_domain(struct iova_domain *iovad) 50962306a36Sopenharmony_ci{ 51062306a36Sopenharmony_ci struct iova *iova, *tmp; 51162306a36Sopenharmony_ci 51262306a36Sopenharmony_ci if (iovad->rcaches) 51362306a36Sopenharmony_ci iova_domain_free_rcaches(iovad); 51462306a36Sopenharmony_ci 51562306a36Sopenharmony_ci rbtree_postorder_for_each_entry_safe(iova, tmp, &iovad->rbroot, node) 51662306a36Sopenharmony_ci free_iova_mem(iova); 51762306a36Sopenharmony_ci} 51862306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(put_iova_domain); 51962306a36Sopenharmony_ci 52062306a36Sopenharmony_cistatic int 52162306a36Sopenharmony_ci__is_range_overlap(struct rb_node *node, 52262306a36Sopenharmony_ci unsigned long pfn_lo, unsigned long pfn_hi) 52362306a36Sopenharmony_ci{ 52462306a36Sopenharmony_ci struct iova *iova = to_iova(node); 52562306a36Sopenharmony_ci 52662306a36Sopenharmony_ci if ((pfn_lo <= iova->pfn_hi) && (pfn_hi >= iova->pfn_lo)) 52762306a36Sopenharmony_ci return 1; 52862306a36Sopenharmony_ci return 0; 52962306a36Sopenharmony_ci} 53062306a36Sopenharmony_ci 53162306a36Sopenharmony_cistatic inline struct iova * 53262306a36Sopenharmony_cialloc_and_init_iova(unsigned long pfn_lo, unsigned long pfn_hi) 53362306a36Sopenharmony_ci{ 53462306a36Sopenharmony_ci struct iova *iova; 53562306a36Sopenharmony_ci 53662306a36Sopenharmony_ci iova = alloc_iova_mem(); 53762306a36Sopenharmony_ci if (iova) { 53862306a36Sopenharmony_ci iova->pfn_lo = pfn_lo; 53962306a36Sopenharmony_ci iova->pfn_hi = pfn_hi; 54062306a36Sopenharmony_ci } 54162306a36Sopenharmony_ci 54262306a36Sopenharmony_ci return iova; 54362306a36Sopenharmony_ci} 54462306a36Sopenharmony_ci 54562306a36Sopenharmony_cistatic struct iova * 54662306a36Sopenharmony_ci__insert_new_range(struct iova_domain *iovad, 54762306a36Sopenharmony_ci unsigned long pfn_lo, unsigned long pfn_hi) 54862306a36Sopenharmony_ci{ 54962306a36Sopenharmony_ci struct iova *iova; 55062306a36Sopenharmony_ci 55162306a36Sopenharmony_ci iova = alloc_and_init_iova(pfn_lo, pfn_hi); 55262306a36Sopenharmony_ci if (iova) 55362306a36Sopenharmony_ci iova_insert_rbtree(&iovad->rbroot, iova, NULL); 55462306a36Sopenharmony_ci 55562306a36Sopenharmony_ci return iova; 55662306a36Sopenharmony_ci} 55762306a36Sopenharmony_ci 55862306a36Sopenharmony_cistatic void 55962306a36Sopenharmony_ci__adjust_overlap_range(struct iova *iova, 56062306a36Sopenharmony_ci unsigned long *pfn_lo, unsigned long *pfn_hi) 56162306a36Sopenharmony_ci{ 56262306a36Sopenharmony_ci if (*pfn_lo < iova->pfn_lo) 56362306a36Sopenharmony_ci iova->pfn_lo = *pfn_lo; 56462306a36Sopenharmony_ci if (*pfn_hi > iova->pfn_hi) 56562306a36Sopenharmony_ci *pfn_lo = iova->pfn_hi + 1; 56662306a36Sopenharmony_ci} 56762306a36Sopenharmony_ci 56862306a36Sopenharmony_ci/** 56962306a36Sopenharmony_ci * reserve_iova - reserves an iova in the given range 57062306a36Sopenharmony_ci * @iovad: - iova domain pointer 57162306a36Sopenharmony_ci * @pfn_lo: - lower page frame address 57262306a36Sopenharmony_ci * @pfn_hi:- higher pfn adderss 57362306a36Sopenharmony_ci * This function allocates reserves the address range from pfn_lo to pfn_hi so 57462306a36Sopenharmony_ci * that this address is not dished out as part of alloc_iova. 57562306a36Sopenharmony_ci */ 57662306a36Sopenharmony_cistruct iova * 57762306a36Sopenharmony_cireserve_iova(struct iova_domain *iovad, 57862306a36Sopenharmony_ci unsigned long pfn_lo, unsigned long pfn_hi) 57962306a36Sopenharmony_ci{ 58062306a36Sopenharmony_ci struct rb_node *node; 58162306a36Sopenharmony_ci unsigned long flags; 58262306a36Sopenharmony_ci struct iova *iova; 58362306a36Sopenharmony_ci unsigned int overlap = 0; 58462306a36Sopenharmony_ci 58562306a36Sopenharmony_ci /* Don't allow nonsensical pfns */ 58662306a36Sopenharmony_ci if (WARN_ON((pfn_hi | pfn_lo) > (ULLONG_MAX >> iova_shift(iovad)))) 58762306a36Sopenharmony_ci return NULL; 58862306a36Sopenharmony_ci 58962306a36Sopenharmony_ci spin_lock_irqsave(&iovad->iova_rbtree_lock, flags); 59062306a36Sopenharmony_ci for (node = rb_first(&iovad->rbroot); node; node = rb_next(node)) { 59162306a36Sopenharmony_ci if (__is_range_overlap(node, pfn_lo, pfn_hi)) { 59262306a36Sopenharmony_ci iova = to_iova(node); 59362306a36Sopenharmony_ci __adjust_overlap_range(iova, &pfn_lo, &pfn_hi); 59462306a36Sopenharmony_ci if ((pfn_lo >= iova->pfn_lo) && 59562306a36Sopenharmony_ci (pfn_hi <= iova->pfn_hi)) 59662306a36Sopenharmony_ci goto finish; 59762306a36Sopenharmony_ci overlap = 1; 59862306a36Sopenharmony_ci 59962306a36Sopenharmony_ci } else if (overlap) 60062306a36Sopenharmony_ci break; 60162306a36Sopenharmony_ci } 60262306a36Sopenharmony_ci 60362306a36Sopenharmony_ci /* We are here either because this is the first reserver node 60462306a36Sopenharmony_ci * or need to insert remaining non overlap addr range 60562306a36Sopenharmony_ci */ 60662306a36Sopenharmony_ci iova = __insert_new_range(iovad, pfn_lo, pfn_hi); 60762306a36Sopenharmony_cifinish: 60862306a36Sopenharmony_ci 60962306a36Sopenharmony_ci spin_unlock_irqrestore(&iovad->iova_rbtree_lock, flags); 61062306a36Sopenharmony_ci return iova; 61162306a36Sopenharmony_ci} 61262306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(reserve_iova); 61362306a36Sopenharmony_ci 61462306a36Sopenharmony_ci/* 61562306a36Sopenharmony_ci * Magazine caches for IOVA ranges. For an introduction to magazines, 61662306a36Sopenharmony_ci * see the USENIX 2001 paper "Magazines and Vmem: Extending the Slab 61762306a36Sopenharmony_ci * Allocator to Many CPUs and Arbitrary Resources" by Bonwick and Adams. 61862306a36Sopenharmony_ci * For simplicity, we use a static magazine size and don't implement the 61962306a36Sopenharmony_ci * dynamic size tuning described in the paper. 62062306a36Sopenharmony_ci */ 62162306a36Sopenharmony_ci 62262306a36Sopenharmony_ci/* 62362306a36Sopenharmony_ci * As kmalloc's buffer size is fixed to power of 2, 127 is chosen to 62462306a36Sopenharmony_ci * assure size of 'iova_magazine' to be 1024 bytes, so that no memory 62562306a36Sopenharmony_ci * will be wasted. 62662306a36Sopenharmony_ci */ 62762306a36Sopenharmony_ci#define IOVA_MAG_SIZE 127 62862306a36Sopenharmony_ci#define MAX_GLOBAL_MAGS 32 /* magazines per bin */ 62962306a36Sopenharmony_ci 63062306a36Sopenharmony_cistruct iova_magazine { 63162306a36Sopenharmony_ci unsigned long size; 63262306a36Sopenharmony_ci unsigned long pfns[IOVA_MAG_SIZE]; 63362306a36Sopenharmony_ci}; 63462306a36Sopenharmony_ci 63562306a36Sopenharmony_cistruct iova_cpu_rcache { 63662306a36Sopenharmony_ci spinlock_t lock; 63762306a36Sopenharmony_ci struct iova_magazine *loaded; 63862306a36Sopenharmony_ci struct iova_magazine *prev; 63962306a36Sopenharmony_ci}; 64062306a36Sopenharmony_ci 64162306a36Sopenharmony_cistruct iova_rcache { 64262306a36Sopenharmony_ci spinlock_t lock; 64362306a36Sopenharmony_ci unsigned long depot_size; 64462306a36Sopenharmony_ci struct iova_magazine *depot[MAX_GLOBAL_MAGS]; 64562306a36Sopenharmony_ci struct iova_cpu_rcache __percpu *cpu_rcaches; 64662306a36Sopenharmony_ci}; 64762306a36Sopenharmony_ci 64862306a36Sopenharmony_cistatic struct iova_magazine *iova_magazine_alloc(gfp_t flags) 64962306a36Sopenharmony_ci{ 65062306a36Sopenharmony_ci struct iova_magazine *mag; 65162306a36Sopenharmony_ci 65262306a36Sopenharmony_ci mag = kmalloc(sizeof(*mag), flags); 65362306a36Sopenharmony_ci if (mag) 65462306a36Sopenharmony_ci mag->size = 0; 65562306a36Sopenharmony_ci 65662306a36Sopenharmony_ci return mag; 65762306a36Sopenharmony_ci} 65862306a36Sopenharmony_ci 65962306a36Sopenharmony_cistatic void iova_magazine_free(struct iova_magazine *mag) 66062306a36Sopenharmony_ci{ 66162306a36Sopenharmony_ci kfree(mag); 66262306a36Sopenharmony_ci} 66362306a36Sopenharmony_ci 66462306a36Sopenharmony_cistatic void 66562306a36Sopenharmony_ciiova_magazine_free_pfns(struct iova_magazine *mag, struct iova_domain *iovad) 66662306a36Sopenharmony_ci{ 66762306a36Sopenharmony_ci unsigned long flags; 66862306a36Sopenharmony_ci int i; 66962306a36Sopenharmony_ci 67062306a36Sopenharmony_ci spin_lock_irqsave(&iovad->iova_rbtree_lock, flags); 67162306a36Sopenharmony_ci 67262306a36Sopenharmony_ci for (i = 0 ; i < mag->size; ++i) { 67362306a36Sopenharmony_ci struct iova *iova = private_find_iova(iovad, mag->pfns[i]); 67462306a36Sopenharmony_ci 67562306a36Sopenharmony_ci if (WARN_ON(!iova)) 67662306a36Sopenharmony_ci continue; 67762306a36Sopenharmony_ci 67862306a36Sopenharmony_ci remove_iova(iovad, iova); 67962306a36Sopenharmony_ci free_iova_mem(iova); 68062306a36Sopenharmony_ci } 68162306a36Sopenharmony_ci 68262306a36Sopenharmony_ci spin_unlock_irqrestore(&iovad->iova_rbtree_lock, flags); 68362306a36Sopenharmony_ci 68462306a36Sopenharmony_ci mag->size = 0; 68562306a36Sopenharmony_ci} 68662306a36Sopenharmony_ci 68762306a36Sopenharmony_cistatic bool iova_magazine_full(struct iova_magazine *mag) 68862306a36Sopenharmony_ci{ 68962306a36Sopenharmony_ci return mag->size == IOVA_MAG_SIZE; 69062306a36Sopenharmony_ci} 69162306a36Sopenharmony_ci 69262306a36Sopenharmony_cistatic bool iova_magazine_empty(struct iova_magazine *mag) 69362306a36Sopenharmony_ci{ 69462306a36Sopenharmony_ci return mag->size == 0; 69562306a36Sopenharmony_ci} 69662306a36Sopenharmony_ci 69762306a36Sopenharmony_cistatic unsigned long iova_magazine_pop(struct iova_magazine *mag, 69862306a36Sopenharmony_ci unsigned long limit_pfn) 69962306a36Sopenharmony_ci{ 70062306a36Sopenharmony_ci int i; 70162306a36Sopenharmony_ci unsigned long pfn; 70262306a36Sopenharmony_ci 70362306a36Sopenharmony_ci /* Only fall back to the rbtree if we have no suitable pfns at all */ 70462306a36Sopenharmony_ci for (i = mag->size - 1; mag->pfns[i] > limit_pfn; i--) 70562306a36Sopenharmony_ci if (i == 0) 70662306a36Sopenharmony_ci return 0; 70762306a36Sopenharmony_ci 70862306a36Sopenharmony_ci /* Swap it to pop it */ 70962306a36Sopenharmony_ci pfn = mag->pfns[i]; 71062306a36Sopenharmony_ci mag->pfns[i] = mag->pfns[--mag->size]; 71162306a36Sopenharmony_ci 71262306a36Sopenharmony_ci return pfn; 71362306a36Sopenharmony_ci} 71462306a36Sopenharmony_ci 71562306a36Sopenharmony_cistatic void iova_magazine_push(struct iova_magazine *mag, unsigned long pfn) 71662306a36Sopenharmony_ci{ 71762306a36Sopenharmony_ci mag->pfns[mag->size++] = pfn; 71862306a36Sopenharmony_ci} 71962306a36Sopenharmony_ci 72062306a36Sopenharmony_ciint iova_domain_init_rcaches(struct iova_domain *iovad) 72162306a36Sopenharmony_ci{ 72262306a36Sopenharmony_ci unsigned int cpu; 72362306a36Sopenharmony_ci int i, ret; 72462306a36Sopenharmony_ci 72562306a36Sopenharmony_ci iovad->rcaches = kcalloc(IOVA_RANGE_CACHE_MAX_SIZE, 72662306a36Sopenharmony_ci sizeof(struct iova_rcache), 72762306a36Sopenharmony_ci GFP_KERNEL); 72862306a36Sopenharmony_ci if (!iovad->rcaches) 72962306a36Sopenharmony_ci return -ENOMEM; 73062306a36Sopenharmony_ci 73162306a36Sopenharmony_ci for (i = 0; i < IOVA_RANGE_CACHE_MAX_SIZE; ++i) { 73262306a36Sopenharmony_ci struct iova_cpu_rcache *cpu_rcache; 73362306a36Sopenharmony_ci struct iova_rcache *rcache; 73462306a36Sopenharmony_ci 73562306a36Sopenharmony_ci rcache = &iovad->rcaches[i]; 73662306a36Sopenharmony_ci spin_lock_init(&rcache->lock); 73762306a36Sopenharmony_ci rcache->depot_size = 0; 73862306a36Sopenharmony_ci rcache->cpu_rcaches = __alloc_percpu(sizeof(*cpu_rcache), 73962306a36Sopenharmony_ci cache_line_size()); 74062306a36Sopenharmony_ci if (!rcache->cpu_rcaches) { 74162306a36Sopenharmony_ci ret = -ENOMEM; 74262306a36Sopenharmony_ci goto out_err; 74362306a36Sopenharmony_ci } 74462306a36Sopenharmony_ci for_each_possible_cpu(cpu) { 74562306a36Sopenharmony_ci cpu_rcache = per_cpu_ptr(rcache->cpu_rcaches, cpu); 74662306a36Sopenharmony_ci 74762306a36Sopenharmony_ci spin_lock_init(&cpu_rcache->lock); 74862306a36Sopenharmony_ci cpu_rcache->loaded = iova_magazine_alloc(GFP_KERNEL); 74962306a36Sopenharmony_ci cpu_rcache->prev = iova_magazine_alloc(GFP_KERNEL); 75062306a36Sopenharmony_ci if (!cpu_rcache->loaded || !cpu_rcache->prev) { 75162306a36Sopenharmony_ci ret = -ENOMEM; 75262306a36Sopenharmony_ci goto out_err; 75362306a36Sopenharmony_ci } 75462306a36Sopenharmony_ci } 75562306a36Sopenharmony_ci } 75662306a36Sopenharmony_ci 75762306a36Sopenharmony_ci ret = cpuhp_state_add_instance_nocalls(CPUHP_IOMMU_IOVA_DEAD, 75862306a36Sopenharmony_ci &iovad->cpuhp_dead); 75962306a36Sopenharmony_ci if (ret) 76062306a36Sopenharmony_ci goto out_err; 76162306a36Sopenharmony_ci return 0; 76262306a36Sopenharmony_ci 76362306a36Sopenharmony_ciout_err: 76462306a36Sopenharmony_ci free_iova_rcaches(iovad); 76562306a36Sopenharmony_ci return ret; 76662306a36Sopenharmony_ci} 76762306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(iova_domain_init_rcaches); 76862306a36Sopenharmony_ci 76962306a36Sopenharmony_ci/* 77062306a36Sopenharmony_ci * Try inserting IOVA range starting with 'iova_pfn' into 'rcache', and 77162306a36Sopenharmony_ci * return true on success. Can fail if rcache is full and we can't free 77262306a36Sopenharmony_ci * space, and free_iova() (our only caller) will then return the IOVA 77362306a36Sopenharmony_ci * range to the rbtree instead. 77462306a36Sopenharmony_ci */ 77562306a36Sopenharmony_cistatic bool __iova_rcache_insert(struct iova_domain *iovad, 77662306a36Sopenharmony_ci struct iova_rcache *rcache, 77762306a36Sopenharmony_ci unsigned long iova_pfn) 77862306a36Sopenharmony_ci{ 77962306a36Sopenharmony_ci struct iova_magazine *mag_to_free = NULL; 78062306a36Sopenharmony_ci struct iova_cpu_rcache *cpu_rcache; 78162306a36Sopenharmony_ci bool can_insert = false; 78262306a36Sopenharmony_ci unsigned long flags; 78362306a36Sopenharmony_ci 78462306a36Sopenharmony_ci cpu_rcache = raw_cpu_ptr(rcache->cpu_rcaches); 78562306a36Sopenharmony_ci spin_lock_irqsave(&cpu_rcache->lock, flags); 78662306a36Sopenharmony_ci 78762306a36Sopenharmony_ci if (!iova_magazine_full(cpu_rcache->loaded)) { 78862306a36Sopenharmony_ci can_insert = true; 78962306a36Sopenharmony_ci } else if (!iova_magazine_full(cpu_rcache->prev)) { 79062306a36Sopenharmony_ci swap(cpu_rcache->prev, cpu_rcache->loaded); 79162306a36Sopenharmony_ci can_insert = true; 79262306a36Sopenharmony_ci } else { 79362306a36Sopenharmony_ci struct iova_magazine *new_mag = iova_magazine_alloc(GFP_ATOMIC); 79462306a36Sopenharmony_ci 79562306a36Sopenharmony_ci if (new_mag) { 79662306a36Sopenharmony_ci spin_lock(&rcache->lock); 79762306a36Sopenharmony_ci if (rcache->depot_size < MAX_GLOBAL_MAGS) { 79862306a36Sopenharmony_ci rcache->depot[rcache->depot_size++] = 79962306a36Sopenharmony_ci cpu_rcache->loaded; 80062306a36Sopenharmony_ci } else { 80162306a36Sopenharmony_ci mag_to_free = cpu_rcache->loaded; 80262306a36Sopenharmony_ci } 80362306a36Sopenharmony_ci spin_unlock(&rcache->lock); 80462306a36Sopenharmony_ci 80562306a36Sopenharmony_ci cpu_rcache->loaded = new_mag; 80662306a36Sopenharmony_ci can_insert = true; 80762306a36Sopenharmony_ci } 80862306a36Sopenharmony_ci } 80962306a36Sopenharmony_ci 81062306a36Sopenharmony_ci if (can_insert) 81162306a36Sopenharmony_ci iova_magazine_push(cpu_rcache->loaded, iova_pfn); 81262306a36Sopenharmony_ci 81362306a36Sopenharmony_ci spin_unlock_irqrestore(&cpu_rcache->lock, flags); 81462306a36Sopenharmony_ci 81562306a36Sopenharmony_ci if (mag_to_free) { 81662306a36Sopenharmony_ci iova_magazine_free_pfns(mag_to_free, iovad); 81762306a36Sopenharmony_ci iova_magazine_free(mag_to_free); 81862306a36Sopenharmony_ci } 81962306a36Sopenharmony_ci 82062306a36Sopenharmony_ci return can_insert; 82162306a36Sopenharmony_ci} 82262306a36Sopenharmony_ci 82362306a36Sopenharmony_cistatic bool iova_rcache_insert(struct iova_domain *iovad, unsigned long pfn, 82462306a36Sopenharmony_ci unsigned long size) 82562306a36Sopenharmony_ci{ 82662306a36Sopenharmony_ci unsigned int log_size = order_base_2(size); 82762306a36Sopenharmony_ci 82862306a36Sopenharmony_ci if (log_size >= IOVA_RANGE_CACHE_MAX_SIZE) 82962306a36Sopenharmony_ci return false; 83062306a36Sopenharmony_ci 83162306a36Sopenharmony_ci return __iova_rcache_insert(iovad, &iovad->rcaches[log_size], pfn); 83262306a36Sopenharmony_ci} 83362306a36Sopenharmony_ci 83462306a36Sopenharmony_ci/* 83562306a36Sopenharmony_ci * Caller wants to allocate a new IOVA range from 'rcache'. If we can 83662306a36Sopenharmony_ci * satisfy the request, return a matching non-NULL range and remove 83762306a36Sopenharmony_ci * it from the 'rcache'. 83862306a36Sopenharmony_ci */ 83962306a36Sopenharmony_cistatic unsigned long __iova_rcache_get(struct iova_rcache *rcache, 84062306a36Sopenharmony_ci unsigned long limit_pfn) 84162306a36Sopenharmony_ci{ 84262306a36Sopenharmony_ci struct iova_cpu_rcache *cpu_rcache; 84362306a36Sopenharmony_ci unsigned long iova_pfn = 0; 84462306a36Sopenharmony_ci bool has_pfn = false; 84562306a36Sopenharmony_ci unsigned long flags; 84662306a36Sopenharmony_ci 84762306a36Sopenharmony_ci cpu_rcache = raw_cpu_ptr(rcache->cpu_rcaches); 84862306a36Sopenharmony_ci spin_lock_irqsave(&cpu_rcache->lock, flags); 84962306a36Sopenharmony_ci 85062306a36Sopenharmony_ci if (!iova_magazine_empty(cpu_rcache->loaded)) { 85162306a36Sopenharmony_ci has_pfn = true; 85262306a36Sopenharmony_ci } else if (!iova_magazine_empty(cpu_rcache->prev)) { 85362306a36Sopenharmony_ci swap(cpu_rcache->prev, cpu_rcache->loaded); 85462306a36Sopenharmony_ci has_pfn = true; 85562306a36Sopenharmony_ci } else { 85662306a36Sopenharmony_ci spin_lock(&rcache->lock); 85762306a36Sopenharmony_ci if (rcache->depot_size > 0) { 85862306a36Sopenharmony_ci iova_magazine_free(cpu_rcache->loaded); 85962306a36Sopenharmony_ci cpu_rcache->loaded = rcache->depot[--rcache->depot_size]; 86062306a36Sopenharmony_ci has_pfn = true; 86162306a36Sopenharmony_ci } 86262306a36Sopenharmony_ci spin_unlock(&rcache->lock); 86362306a36Sopenharmony_ci } 86462306a36Sopenharmony_ci 86562306a36Sopenharmony_ci if (has_pfn) 86662306a36Sopenharmony_ci iova_pfn = iova_magazine_pop(cpu_rcache->loaded, limit_pfn); 86762306a36Sopenharmony_ci 86862306a36Sopenharmony_ci spin_unlock_irqrestore(&cpu_rcache->lock, flags); 86962306a36Sopenharmony_ci 87062306a36Sopenharmony_ci return iova_pfn; 87162306a36Sopenharmony_ci} 87262306a36Sopenharmony_ci 87362306a36Sopenharmony_ci/* 87462306a36Sopenharmony_ci * Try to satisfy IOVA allocation range from rcache. Fail if requested 87562306a36Sopenharmony_ci * size is too big or the DMA limit we are given isn't satisfied by the 87662306a36Sopenharmony_ci * top element in the magazine. 87762306a36Sopenharmony_ci */ 87862306a36Sopenharmony_cistatic unsigned long iova_rcache_get(struct iova_domain *iovad, 87962306a36Sopenharmony_ci unsigned long size, 88062306a36Sopenharmony_ci unsigned long limit_pfn) 88162306a36Sopenharmony_ci{ 88262306a36Sopenharmony_ci unsigned int log_size = order_base_2(size); 88362306a36Sopenharmony_ci 88462306a36Sopenharmony_ci if (log_size >= IOVA_RANGE_CACHE_MAX_SIZE) 88562306a36Sopenharmony_ci return 0; 88662306a36Sopenharmony_ci 88762306a36Sopenharmony_ci return __iova_rcache_get(&iovad->rcaches[log_size], limit_pfn - size); 88862306a36Sopenharmony_ci} 88962306a36Sopenharmony_ci 89062306a36Sopenharmony_ci/* 89162306a36Sopenharmony_ci * free rcache data structures. 89262306a36Sopenharmony_ci */ 89362306a36Sopenharmony_cistatic void free_iova_rcaches(struct iova_domain *iovad) 89462306a36Sopenharmony_ci{ 89562306a36Sopenharmony_ci struct iova_rcache *rcache; 89662306a36Sopenharmony_ci struct iova_cpu_rcache *cpu_rcache; 89762306a36Sopenharmony_ci unsigned int cpu; 89862306a36Sopenharmony_ci int i, j; 89962306a36Sopenharmony_ci 90062306a36Sopenharmony_ci for (i = 0; i < IOVA_RANGE_CACHE_MAX_SIZE; ++i) { 90162306a36Sopenharmony_ci rcache = &iovad->rcaches[i]; 90262306a36Sopenharmony_ci if (!rcache->cpu_rcaches) 90362306a36Sopenharmony_ci break; 90462306a36Sopenharmony_ci for_each_possible_cpu(cpu) { 90562306a36Sopenharmony_ci cpu_rcache = per_cpu_ptr(rcache->cpu_rcaches, cpu); 90662306a36Sopenharmony_ci iova_magazine_free(cpu_rcache->loaded); 90762306a36Sopenharmony_ci iova_magazine_free(cpu_rcache->prev); 90862306a36Sopenharmony_ci } 90962306a36Sopenharmony_ci free_percpu(rcache->cpu_rcaches); 91062306a36Sopenharmony_ci for (j = 0; j < rcache->depot_size; ++j) 91162306a36Sopenharmony_ci iova_magazine_free(rcache->depot[j]); 91262306a36Sopenharmony_ci } 91362306a36Sopenharmony_ci 91462306a36Sopenharmony_ci kfree(iovad->rcaches); 91562306a36Sopenharmony_ci iovad->rcaches = NULL; 91662306a36Sopenharmony_ci} 91762306a36Sopenharmony_ci 91862306a36Sopenharmony_ci/* 91962306a36Sopenharmony_ci * free all the IOVA ranges cached by a cpu (used when cpu is unplugged) 92062306a36Sopenharmony_ci */ 92162306a36Sopenharmony_cistatic void free_cpu_cached_iovas(unsigned int cpu, struct iova_domain *iovad) 92262306a36Sopenharmony_ci{ 92362306a36Sopenharmony_ci struct iova_cpu_rcache *cpu_rcache; 92462306a36Sopenharmony_ci struct iova_rcache *rcache; 92562306a36Sopenharmony_ci unsigned long flags; 92662306a36Sopenharmony_ci int i; 92762306a36Sopenharmony_ci 92862306a36Sopenharmony_ci for (i = 0; i < IOVA_RANGE_CACHE_MAX_SIZE; ++i) { 92962306a36Sopenharmony_ci rcache = &iovad->rcaches[i]; 93062306a36Sopenharmony_ci cpu_rcache = per_cpu_ptr(rcache->cpu_rcaches, cpu); 93162306a36Sopenharmony_ci spin_lock_irqsave(&cpu_rcache->lock, flags); 93262306a36Sopenharmony_ci iova_magazine_free_pfns(cpu_rcache->loaded, iovad); 93362306a36Sopenharmony_ci iova_magazine_free_pfns(cpu_rcache->prev, iovad); 93462306a36Sopenharmony_ci spin_unlock_irqrestore(&cpu_rcache->lock, flags); 93562306a36Sopenharmony_ci } 93662306a36Sopenharmony_ci} 93762306a36Sopenharmony_ci 93862306a36Sopenharmony_ci/* 93962306a36Sopenharmony_ci * free all the IOVA ranges of global cache 94062306a36Sopenharmony_ci */ 94162306a36Sopenharmony_cistatic void free_global_cached_iovas(struct iova_domain *iovad) 94262306a36Sopenharmony_ci{ 94362306a36Sopenharmony_ci struct iova_rcache *rcache; 94462306a36Sopenharmony_ci unsigned long flags; 94562306a36Sopenharmony_ci int i, j; 94662306a36Sopenharmony_ci 94762306a36Sopenharmony_ci for (i = 0; i < IOVA_RANGE_CACHE_MAX_SIZE; ++i) { 94862306a36Sopenharmony_ci rcache = &iovad->rcaches[i]; 94962306a36Sopenharmony_ci spin_lock_irqsave(&rcache->lock, flags); 95062306a36Sopenharmony_ci for (j = 0; j < rcache->depot_size; ++j) { 95162306a36Sopenharmony_ci iova_magazine_free_pfns(rcache->depot[j], iovad); 95262306a36Sopenharmony_ci iova_magazine_free(rcache->depot[j]); 95362306a36Sopenharmony_ci } 95462306a36Sopenharmony_ci rcache->depot_size = 0; 95562306a36Sopenharmony_ci spin_unlock_irqrestore(&rcache->lock, flags); 95662306a36Sopenharmony_ci } 95762306a36Sopenharmony_ci} 95862306a36Sopenharmony_ciMODULE_AUTHOR("Anil S Keshavamurthy <anil.s.keshavamurthy@intel.com>"); 95962306a36Sopenharmony_ciMODULE_LICENSE("GPL"); 960