162306a36Sopenharmony_ci/* SPDX-License-Identifier: GPL-2.0 */
262306a36Sopenharmony_ci
362306a36Sopenharmony_ci/*
462306a36Sopenharmony_ci * 'Generic' ticket-lock implementation.
562306a36Sopenharmony_ci *
662306a36Sopenharmony_ci * It relies on atomic_fetch_add() having well defined forward progress
762306a36Sopenharmony_ci * guarantees under contention. If your architecture cannot provide this, stick
862306a36Sopenharmony_ci * to a test-and-set lock.
962306a36Sopenharmony_ci *
1062306a36Sopenharmony_ci * It also relies on atomic_fetch_add() being safe vs smp_store_release() on a
1162306a36Sopenharmony_ci * sub-word of the value. This is generally true for anything LL/SC although
1262306a36Sopenharmony_ci * you'd be hard pressed to find anything useful in architecture specifications
1362306a36Sopenharmony_ci * about this. If your architecture cannot do this you might be better off with
1462306a36Sopenharmony_ci * a test-and-set.
1562306a36Sopenharmony_ci *
1662306a36Sopenharmony_ci * It further assumes atomic_*_release() + atomic_*_acquire() is RCpc and hence
1762306a36Sopenharmony_ci * uses atomic_fetch_add() which is RCsc to create an RCsc hot path, along with
1862306a36Sopenharmony_ci * a full fence after the spin to upgrade the otherwise-RCpc
1962306a36Sopenharmony_ci * atomic_cond_read_acquire().
2062306a36Sopenharmony_ci *
2162306a36Sopenharmony_ci * The implementation uses smp_cond_load_acquire() to spin, so if the
2262306a36Sopenharmony_ci * architecture has WFE like instructions to sleep instead of poll for word
2362306a36Sopenharmony_ci * modifications be sure to implement that (see ARM64 for example).
2462306a36Sopenharmony_ci *
2562306a36Sopenharmony_ci */
2662306a36Sopenharmony_ci
2762306a36Sopenharmony_ci#ifndef __ASM_GENERIC_SPINLOCK_H
2862306a36Sopenharmony_ci#define __ASM_GENERIC_SPINLOCK_H
2962306a36Sopenharmony_ci
3062306a36Sopenharmony_ci#include <linux/atomic.h>
3162306a36Sopenharmony_ci#include <asm-generic/spinlock_types.h>
3262306a36Sopenharmony_ci
3362306a36Sopenharmony_cistatic __always_inline void arch_spin_lock(arch_spinlock_t *lock)
3462306a36Sopenharmony_ci{
3562306a36Sopenharmony_ci	u32 val = atomic_fetch_add(1<<16, lock);
3662306a36Sopenharmony_ci	u16 ticket = val >> 16;
3762306a36Sopenharmony_ci
3862306a36Sopenharmony_ci	if (ticket == (u16)val)
3962306a36Sopenharmony_ci		return;
4062306a36Sopenharmony_ci
4162306a36Sopenharmony_ci	/*
4262306a36Sopenharmony_ci	 * atomic_cond_read_acquire() is RCpc, but rather than defining a
4362306a36Sopenharmony_ci	 * custom cond_read_rcsc() here we just emit a full fence.  We only
4462306a36Sopenharmony_ci	 * need the prior reads before subsequent writes ordering from
4562306a36Sopenharmony_ci	 * smb_mb(), but as atomic_cond_read_acquire() just emits reads and we
4662306a36Sopenharmony_ci	 * have no outstanding writes due to the atomic_fetch_add() the extra
4762306a36Sopenharmony_ci	 * orderings are free.
4862306a36Sopenharmony_ci	 */
4962306a36Sopenharmony_ci	atomic_cond_read_acquire(lock, ticket == (u16)VAL);
5062306a36Sopenharmony_ci	smp_mb();
5162306a36Sopenharmony_ci}
5262306a36Sopenharmony_ci
5362306a36Sopenharmony_cistatic __always_inline bool arch_spin_trylock(arch_spinlock_t *lock)
5462306a36Sopenharmony_ci{
5562306a36Sopenharmony_ci	u32 old = atomic_read(lock);
5662306a36Sopenharmony_ci
5762306a36Sopenharmony_ci	if ((old >> 16) != (old & 0xffff))
5862306a36Sopenharmony_ci		return false;
5962306a36Sopenharmony_ci
6062306a36Sopenharmony_ci	return atomic_try_cmpxchg(lock, &old, old + (1<<16)); /* SC, for RCsc */
6162306a36Sopenharmony_ci}
6262306a36Sopenharmony_ci
6362306a36Sopenharmony_cistatic __always_inline void arch_spin_unlock(arch_spinlock_t *lock)
6462306a36Sopenharmony_ci{
6562306a36Sopenharmony_ci	u16 *ptr = (u16 *)lock + IS_ENABLED(CONFIG_CPU_BIG_ENDIAN);
6662306a36Sopenharmony_ci	u32 val = atomic_read(lock);
6762306a36Sopenharmony_ci
6862306a36Sopenharmony_ci	smp_store_release(ptr, (u16)val + 1);
6962306a36Sopenharmony_ci}
7062306a36Sopenharmony_ci
7162306a36Sopenharmony_cistatic __always_inline int arch_spin_is_locked(arch_spinlock_t *lock)
7262306a36Sopenharmony_ci{
7362306a36Sopenharmony_ci	u32 val = atomic_read(lock);
7462306a36Sopenharmony_ci
7562306a36Sopenharmony_ci	return ((val >> 16) != (val & 0xffff));
7662306a36Sopenharmony_ci}
7762306a36Sopenharmony_ci
7862306a36Sopenharmony_cistatic __always_inline int arch_spin_is_contended(arch_spinlock_t *lock)
7962306a36Sopenharmony_ci{
8062306a36Sopenharmony_ci	u32 val = atomic_read(lock);
8162306a36Sopenharmony_ci
8262306a36Sopenharmony_ci	return (s16)((val >> 16) - (val & 0xffff)) > 1;
8362306a36Sopenharmony_ci}
8462306a36Sopenharmony_ci
8562306a36Sopenharmony_cistatic __always_inline int arch_spin_value_unlocked(arch_spinlock_t lock)
8662306a36Sopenharmony_ci{
8762306a36Sopenharmony_ci	return !arch_spin_is_locked(&lock);
8862306a36Sopenharmony_ci}
8962306a36Sopenharmony_ci
9062306a36Sopenharmony_ci#include <asm/qrwlock.h>
9162306a36Sopenharmony_ci
9262306a36Sopenharmony_ci#endif /* __ASM_GENERIC_SPINLOCK_H */
93