162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * dma-fence-util: misc functions for dma_fence objects 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Copyright (C) 2022 Advanced Micro Devices, Inc. 662306a36Sopenharmony_ci * Authors: 762306a36Sopenharmony_ci * Christian König <christian.koenig@amd.com> 862306a36Sopenharmony_ci */ 962306a36Sopenharmony_ci 1062306a36Sopenharmony_ci#include <linux/dma-fence.h> 1162306a36Sopenharmony_ci#include <linux/dma-fence-array.h> 1262306a36Sopenharmony_ci#include <linux/dma-fence-chain.h> 1362306a36Sopenharmony_ci#include <linux/dma-fence-unwrap.h> 1462306a36Sopenharmony_ci#include <linux/slab.h> 1562306a36Sopenharmony_ci 1662306a36Sopenharmony_ci/* Internal helper to start new array iteration, don't use directly */ 1762306a36Sopenharmony_cistatic struct dma_fence * 1862306a36Sopenharmony_ci__dma_fence_unwrap_array(struct dma_fence_unwrap *cursor) 1962306a36Sopenharmony_ci{ 2062306a36Sopenharmony_ci cursor->array = dma_fence_chain_contained(cursor->chain); 2162306a36Sopenharmony_ci cursor->index = 0; 2262306a36Sopenharmony_ci return dma_fence_array_first(cursor->array); 2362306a36Sopenharmony_ci} 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_ci/** 2662306a36Sopenharmony_ci * dma_fence_unwrap_first - return the first fence from fence containers 2762306a36Sopenharmony_ci * @head: the entrypoint into the containers 2862306a36Sopenharmony_ci * @cursor: current position inside the containers 2962306a36Sopenharmony_ci * 3062306a36Sopenharmony_ci * Unwraps potential dma_fence_chain/dma_fence_array containers and return the 3162306a36Sopenharmony_ci * first fence. 3262306a36Sopenharmony_ci */ 3362306a36Sopenharmony_cistruct dma_fence *dma_fence_unwrap_first(struct dma_fence *head, 3462306a36Sopenharmony_ci struct dma_fence_unwrap *cursor) 3562306a36Sopenharmony_ci{ 3662306a36Sopenharmony_ci cursor->chain = dma_fence_get(head); 3762306a36Sopenharmony_ci return __dma_fence_unwrap_array(cursor); 3862306a36Sopenharmony_ci} 3962306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(dma_fence_unwrap_first); 4062306a36Sopenharmony_ci 4162306a36Sopenharmony_ci/** 4262306a36Sopenharmony_ci * dma_fence_unwrap_next - return the next fence from a fence containers 4362306a36Sopenharmony_ci * @cursor: current position inside the containers 4462306a36Sopenharmony_ci * 4562306a36Sopenharmony_ci * Continue unwrapping the dma_fence_chain/dma_fence_array containers and return 4662306a36Sopenharmony_ci * the next fence from them. 4762306a36Sopenharmony_ci */ 4862306a36Sopenharmony_cistruct dma_fence *dma_fence_unwrap_next(struct dma_fence_unwrap *cursor) 4962306a36Sopenharmony_ci{ 5062306a36Sopenharmony_ci struct dma_fence *tmp; 5162306a36Sopenharmony_ci 5262306a36Sopenharmony_ci ++cursor->index; 5362306a36Sopenharmony_ci tmp = dma_fence_array_next(cursor->array, cursor->index); 5462306a36Sopenharmony_ci if (tmp) 5562306a36Sopenharmony_ci return tmp; 5662306a36Sopenharmony_ci 5762306a36Sopenharmony_ci cursor->chain = dma_fence_chain_walk(cursor->chain); 5862306a36Sopenharmony_ci return __dma_fence_unwrap_array(cursor); 5962306a36Sopenharmony_ci} 6062306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(dma_fence_unwrap_next); 6162306a36Sopenharmony_ci 6262306a36Sopenharmony_ci/* Implementation for the dma_fence_merge() marco, don't use directly */ 6362306a36Sopenharmony_cistruct dma_fence *__dma_fence_unwrap_merge(unsigned int num_fences, 6462306a36Sopenharmony_ci struct dma_fence **fences, 6562306a36Sopenharmony_ci struct dma_fence_unwrap *iter) 6662306a36Sopenharmony_ci{ 6762306a36Sopenharmony_ci struct dma_fence_array *result; 6862306a36Sopenharmony_ci struct dma_fence *tmp, **array; 6962306a36Sopenharmony_ci ktime_t timestamp; 7062306a36Sopenharmony_ci unsigned int i; 7162306a36Sopenharmony_ci size_t count; 7262306a36Sopenharmony_ci 7362306a36Sopenharmony_ci count = 0; 7462306a36Sopenharmony_ci timestamp = ns_to_ktime(0); 7562306a36Sopenharmony_ci for (i = 0; i < num_fences; ++i) { 7662306a36Sopenharmony_ci dma_fence_unwrap_for_each(tmp, &iter[i], fences[i]) { 7762306a36Sopenharmony_ci if (!dma_fence_is_signaled(tmp)) { 7862306a36Sopenharmony_ci ++count; 7962306a36Sopenharmony_ci } else { 8062306a36Sopenharmony_ci ktime_t t = dma_fence_timestamp(tmp); 8162306a36Sopenharmony_ci 8262306a36Sopenharmony_ci if (ktime_after(t, timestamp)) 8362306a36Sopenharmony_ci timestamp = t; 8462306a36Sopenharmony_ci } 8562306a36Sopenharmony_ci } 8662306a36Sopenharmony_ci } 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_ci /* 8962306a36Sopenharmony_ci * If we couldn't find a pending fence just return a private signaled 9062306a36Sopenharmony_ci * fence with the timestamp of the last signaled one. 9162306a36Sopenharmony_ci */ 9262306a36Sopenharmony_ci if (count == 0) 9362306a36Sopenharmony_ci return dma_fence_allocate_private_stub(timestamp); 9462306a36Sopenharmony_ci 9562306a36Sopenharmony_ci array = kmalloc_array(count, sizeof(*array), GFP_KERNEL); 9662306a36Sopenharmony_ci if (!array) 9762306a36Sopenharmony_ci return NULL; 9862306a36Sopenharmony_ci 9962306a36Sopenharmony_ci /* 10062306a36Sopenharmony_ci * This trashes the input fence array and uses it as position for the 10162306a36Sopenharmony_ci * following merge loop. This works because the dma_fence_merge() 10262306a36Sopenharmony_ci * wrapper macro is creating this temporary array on the stack together 10362306a36Sopenharmony_ci * with the iterators. 10462306a36Sopenharmony_ci */ 10562306a36Sopenharmony_ci for (i = 0; i < num_fences; ++i) 10662306a36Sopenharmony_ci fences[i] = dma_fence_unwrap_first(fences[i], &iter[i]); 10762306a36Sopenharmony_ci 10862306a36Sopenharmony_ci count = 0; 10962306a36Sopenharmony_ci do { 11062306a36Sopenharmony_ci unsigned int sel; 11162306a36Sopenharmony_ci 11262306a36Sopenharmony_cirestart: 11362306a36Sopenharmony_ci tmp = NULL; 11462306a36Sopenharmony_ci for (i = 0; i < num_fences; ++i) { 11562306a36Sopenharmony_ci struct dma_fence *next; 11662306a36Sopenharmony_ci 11762306a36Sopenharmony_ci while (fences[i] && dma_fence_is_signaled(fences[i])) 11862306a36Sopenharmony_ci fences[i] = dma_fence_unwrap_next(&iter[i]); 11962306a36Sopenharmony_ci 12062306a36Sopenharmony_ci next = fences[i]; 12162306a36Sopenharmony_ci if (!next) 12262306a36Sopenharmony_ci continue; 12362306a36Sopenharmony_ci 12462306a36Sopenharmony_ci /* 12562306a36Sopenharmony_ci * We can't guarantee that inpute fences are ordered by 12662306a36Sopenharmony_ci * context, but it is still quite likely when this 12762306a36Sopenharmony_ci * function is used multiple times. So attempt to order 12862306a36Sopenharmony_ci * the fences by context as we pass over them and merge 12962306a36Sopenharmony_ci * fences with the same context. 13062306a36Sopenharmony_ci */ 13162306a36Sopenharmony_ci if (!tmp || tmp->context > next->context) { 13262306a36Sopenharmony_ci tmp = next; 13362306a36Sopenharmony_ci sel = i; 13462306a36Sopenharmony_ci 13562306a36Sopenharmony_ci } else if (tmp->context < next->context) { 13662306a36Sopenharmony_ci continue; 13762306a36Sopenharmony_ci 13862306a36Sopenharmony_ci } else if (dma_fence_is_later(tmp, next)) { 13962306a36Sopenharmony_ci fences[i] = dma_fence_unwrap_next(&iter[i]); 14062306a36Sopenharmony_ci goto restart; 14162306a36Sopenharmony_ci } else { 14262306a36Sopenharmony_ci fences[sel] = dma_fence_unwrap_next(&iter[sel]); 14362306a36Sopenharmony_ci goto restart; 14462306a36Sopenharmony_ci } 14562306a36Sopenharmony_ci } 14662306a36Sopenharmony_ci 14762306a36Sopenharmony_ci if (tmp) { 14862306a36Sopenharmony_ci array[count++] = dma_fence_get(tmp); 14962306a36Sopenharmony_ci fences[sel] = dma_fence_unwrap_next(&iter[sel]); 15062306a36Sopenharmony_ci } 15162306a36Sopenharmony_ci } while (tmp); 15262306a36Sopenharmony_ci 15362306a36Sopenharmony_ci if (count == 0) { 15462306a36Sopenharmony_ci tmp = dma_fence_allocate_private_stub(ktime_get()); 15562306a36Sopenharmony_ci goto return_tmp; 15662306a36Sopenharmony_ci } 15762306a36Sopenharmony_ci 15862306a36Sopenharmony_ci if (count == 1) { 15962306a36Sopenharmony_ci tmp = array[0]; 16062306a36Sopenharmony_ci goto return_tmp; 16162306a36Sopenharmony_ci } 16262306a36Sopenharmony_ci 16362306a36Sopenharmony_ci result = dma_fence_array_create(count, array, 16462306a36Sopenharmony_ci dma_fence_context_alloc(1), 16562306a36Sopenharmony_ci 1, false); 16662306a36Sopenharmony_ci if (!result) { 16762306a36Sopenharmony_ci tmp = NULL; 16862306a36Sopenharmony_ci goto return_tmp; 16962306a36Sopenharmony_ci } 17062306a36Sopenharmony_ci return &result->base; 17162306a36Sopenharmony_ci 17262306a36Sopenharmony_cireturn_tmp: 17362306a36Sopenharmony_ci kfree(array); 17462306a36Sopenharmony_ci return tmp; 17562306a36Sopenharmony_ci} 17662306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(__dma_fence_unwrap_merge); 177