162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * dma-fence-util: misc functions for dma_fence objects
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Copyright (C) 2022 Advanced Micro Devices, Inc.
662306a36Sopenharmony_ci * Authors:
762306a36Sopenharmony_ci *	Christian König <christian.koenig@amd.com>
862306a36Sopenharmony_ci */
962306a36Sopenharmony_ci
1062306a36Sopenharmony_ci#include <linux/dma-fence.h>
1162306a36Sopenharmony_ci#include <linux/dma-fence-array.h>
1262306a36Sopenharmony_ci#include <linux/dma-fence-chain.h>
1362306a36Sopenharmony_ci#include <linux/dma-fence-unwrap.h>
1462306a36Sopenharmony_ci#include <linux/slab.h>
1562306a36Sopenharmony_ci
1662306a36Sopenharmony_ci/* Internal helper to start new array iteration, don't use directly */
1762306a36Sopenharmony_cistatic struct dma_fence *
1862306a36Sopenharmony_ci__dma_fence_unwrap_array(struct dma_fence_unwrap *cursor)
1962306a36Sopenharmony_ci{
2062306a36Sopenharmony_ci	cursor->array = dma_fence_chain_contained(cursor->chain);
2162306a36Sopenharmony_ci	cursor->index = 0;
2262306a36Sopenharmony_ci	return dma_fence_array_first(cursor->array);
2362306a36Sopenharmony_ci}
2462306a36Sopenharmony_ci
2562306a36Sopenharmony_ci/**
2662306a36Sopenharmony_ci * dma_fence_unwrap_first - return the first fence from fence containers
2762306a36Sopenharmony_ci * @head: the entrypoint into the containers
2862306a36Sopenharmony_ci * @cursor: current position inside the containers
2962306a36Sopenharmony_ci *
3062306a36Sopenharmony_ci * Unwraps potential dma_fence_chain/dma_fence_array containers and return the
3162306a36Sopenharmony_ci * first fence.
3262306a36Sopenharmony_ci */
3362306a36Sopenharmony_cistruct dma_fence *dma_fence_unwrap_first(struct dma_fence *head,
3462306a36Sopenharmony_ci					 struct dma_fence_unwrap *cursor)
3562306a36Sopenharmony_ci{
3662306a36Sopenharmony_ci	cursor->chain = dma_fence_get(head);
3762306a36Sopenharmony_ci	return __dma_fence_unwrap_array(cursor);
3862306a36Sopenharmony_ci}
3962306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(dma_fence_unwrap_first);
4062306a36Sopenharmony_ci
4162306a36Sopenharmony_ci/**
4262306a36Sopenharmony_ci * dma_fence_unwrap_next - return the next fence from a fence containers
4362306a36Sopenharmony_ci * @cursor: current position inside the containers
4462306a36Sopenharmony_ci *
4562306a36Sopenharmony_ci * Continue unwrapping the dma_fence_chain/dma_fence_array containers and return
4662306a36Sopenharmony_ci * the next fence from them.
4762306a36Sopenharmony_ci */
4862306a36Sopenharmony_cistruct dma_fence *dma_fence_unwrap_next(struct dma_fence_unwrap *cursor)
4962306a36Sopenharmony_ci{
5062306a36Sopenharmony_ci	struct dma_fence *tmp;
5162306a36Sopenharmony_ci
5262306a36Sopenharmony_ci	++cursor->index;
5362306a36Sopenharmony_ci	tmp = dma_fence_array_next(cursor->array, cursor->index);
5462306a36Sopenharmony_ci	if (tmp)
5562306a36Sopenharmony_ci		return tmp;
5662306a36Sopenharmony_ci
5762306a36Sopenharmony_ci	cursor->chain = dma_fence_chain_walk(cursor->chain);
5862306a36Sopenharmony_ci	return __dma_fence_unwrap_array(cursor);
5962306a36Sopenharmony_ci}
6062306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(dma_fence_unwrap_next);
6162306a36Sopenharmony_ci
6262306a36Sopenharmony_ci/* Implementation for the dma_fence_merge() marco, don't use directly */
6362306a36Sopenharmony_cistruct dma_fence *__dma_fence_unwrap_merge(unsigned int num_fences,
6462306a36Sopenharmony_ci					   struct dma_fence **fences,
6562306a36Sopenharmony_ci					   struct dma_fence_unwrap *iter)
6662306a36Sopenharmony_ci{
6762306a36Sopenharmony_ci	struct dma_fence_array *result;
6862306a36Sopenharmony_ci	struct dma_fence *tmp, **array;
6962306a36Sopenharmony_ci	ktime_t timestamp;
7062306a36Sopenharmony_ci	unsigned int i;
7162306a36Sopenharmony_ci	size_t count;
7262306a36Sopenharmony_ci
7362306a36Sopenharmony_ci	count = 0;
7462306a36Sopenharmony_ci	timestamp = ns_to_ktime(0);
7562306a36Sopenharmony_ci	for (i = 0; i < num_fences; ++i) {
7662306a36Sopenharmony_ci		dma_fence_unwrap_for_each(tmp, &iter[i], fences[i]) {
7762306a36Sopenharmony_ci			if (!dma_fence_is_signaled(tmp)) {
7862306a36Sopenharmony_ci				++count;
7962306a36Sopenharmony_ci			} else {
8062306a36Sopenharmony_ci				ktime_t t = dma_fence_timestamp(tmp);
8162306a36Sopenharmony_ci
8262306a36Sopenharmony_ci				if (ktime_after(t, timestamp))
8362306a36Sopenharmony_ci					timestamp = t;
8462306a36Sopenharmony_ci			}
8562306a36Sopenharmony_ci		}
8662306a36Sopenharmony_ci	}
8762306a36Sopenharmony_ci
8862306a36Sopenharmony_ci	/*
8962306a36Sopenharmony_ci	 * If we couldn't find a pending fence just return a private signaled
9062306a36Sopenharmony_ci	 * fence with the timestamp of the last signaled one.
9162306a36Sopenharmony_ci	 */
9262306a36Sopenharmony_ci	if (count == 0)
9362306a36Sopenharmony_ci		return dma_fence_allocate_private_stub(timestamp);
9462306a36Sopenharmony_ci
9562306a36Sopenharmony_ci	array = kmalloc_array(count, sizeof(*array), GFP_KERNEL);
9662306a36Sopenharmony_ci	if (!array)
9762306a36Sopenharmony_ci		return NULL;
9862306a36Sopenharmony_ci
9962306a36Sopenharmony_ci	/*
10062306a36Sopenharmony_ci	 * This trashes the input fence array and uses it as position for the
10162306a36Sopenharmony_ci	 * following merge loop. This works because the dma_fence_merge()
10262306a36Sopenharmony_ci	 * wrapper macro is creating this temporary array on the stack together
10362306a36Sopenharmony_ci	 * with the iterators.
10462306a36Sopenharmony_ci	 */
10562306a36Sopenharmony_ci	for (i = 0; i < num_fences; ++i)
10662306a36Sopenharmony_ci		fences[i] = dma_fence_unwrap_first(fences[i], &iter[i]);
10762306a36Sopenharmony_ci
10862306a36Sopenharmony_ci	count = 0;
10962306a36Sopenharmony_ci	do {
11062306a36Sopenharmony_ci		unsigned int sel;
11162306a36Sopenharmony_ci
11262306a36Sopenharmony_cirestart:
11362306a36Sopenharmony_ci		tmp = NULL;
11462306a36Sopenharmony_ci		for (i = 0; i < num_fences; ++i) {
11562306a36Sopenharmony_ci			struct dma_fence *next;
11662306a36Sopenharmony_ci
11762306a36Sopenharmony_ci			while (fences[i] && dma_fence_is_signaled(fences[i]))
11862306a36Sopenharmony_ci				fences[i] = dma_fence_unwrap_next(&iter[i]);
11962306a36Sopenharmony_ci
12062306a36Sopenharmony_ci			next = fences[i];
12162306a36Sopenharmony_ci			if (!next)
12262306a36Sopenharmony_ci				continue;
12362306a36Sopenharmony_ci
12462306a36Sopenharmony_ci			/*
12562306a36Sopenharmony_ci			 * We can't guarantee that inpute fences are ordered by
12662306a36Sopenharmony_ci			 * context, but it is still quite likely when this
12762306a36Sopenharmony_ci			 * function is used multiple times. So attempt to order
12862306a36Sopenharmony_ci			 * the fences by context as we pass over them and merge
12962306a36Sopenharmony_ci			 * fences with the same context.
13062306a36Sopenharmony_ci			 */
13162306a36Sopenharmony_ci			if (!tmp || tmp->context > next->context) {
13262306a36Sopenharmony_ci				tmp = next;
13362306a36Sopenharmony_ci				sel = i;
13462306a36Sopenharmony_ci
13562306a36Sopenharmony_ci			} else if (tmp->context < next->context) {
13662306a36Sopenharmony_ci				continue;
13762306a36Sopenharmony_ci
13862306a36Sopenharmony_ci			} else if (dma_fence_is_later(tmp, next)) {
13962306a36Sopenharmony_ci				fences[i] = dma_fence_unwrap_next(&iter[i]);
14062306a36Sopenharmony_ci				goto restart;
14162306a36Sopenharmony_ci			} else {
14262306a36Sopenharmony_ci				fences[sel] = dma_fence_unwrap_next(&iter[sel]);
14362306a36Sopenharmony_ci				goto restart;
14462306a36Sopenharmony_ci			}
14562306a36Sopenharmony_ci		}
14662306a36Sopenharmony_ci
14762306a36Sopenharmony_ci		if (tmp) {
14862306a36Sopenharmony_ci			array[count++] = dma_fence_get(tmp);
14962306a36Sopenharmony_ci			fences[sel] = dma_fence_unwrap_next(&iter[sel]);
15062306a36Sopenharmony_ci		}
15162306a36Sopenharmony_ci	} while (tmp);
15262306a36Sopenharmony_ci
15362306a36Sopenharmony_ci	if (count == 0) {
15462306a36Sopenharmony_ci		tmp = dma_fence_allocate_private_stub(ktime_get());
15562306a36Sopenharmony_ci		goto return_tmp;
15662306a36Sopenharmony_ci	}
15762306a36Sopenharmony_ci
15862306a36Sopenharmony_ci	if (count == 1) {
15962306a36Sopenharmony_ci		tmp = array[0];
16062306a36Sopenharmony_ci		goto return_tmp;
16162306a36Sopenharmony_ci	}
16262306a36Sopenharmony_ci
16362306a36Sopenharmony_ci	result = dma_fence_array_create(count, array,
16462306a36Sopenharmony_ci					dma_fence_context_alloc(1),
16562306a36Sopenharmony_ci					1, false);
16662306a36Sopenharmony_ci	if (!result) {
16762306a36Sopenharmony_ci		tmp = NULL;
16862306a36Sopenharmony_ci		goto return_tmp;
16962306a36Sopenharmony_ci	}
17062306a36Sopenharmony_ci	return &result->base;
17162306a36Sopenharmony_ci
17262306a36Sopenharmony_cireturn_tmp:
17362306a36Sopenharmony_ci	kfree(array);
17462306a36Sopenharmony_ci	return tmp;
17562306a36Sopenharmony_ci}
17662306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(__dma_fence_unwrap_merge);
177