162306a36Sopenharmony_ci/* SPDX-License-Identifier: GPL-2.0 */ 262306a36Sopenharmony_ci 362306a36Sopenharmony_ci/* 462306a36Sopenharmony_ci * 'Generic' ticket-lock implementation. 562306a36Sopenharmony_ci * 662306a36Sopenharmony_ci * It relies on atomic_fetch_add() having well defined forward progress 762306a36Sopenharmony_ci * guarantees under contention. If your architecture cannot provide this, stick 862306a36Sopenharmony_ci * to a test-and-set lock. 962306a36Sopenharmony_ci * 1062306a36Sopenharmony_ci * It also relies on atomic_fetch_add() being safe vs smp_store_release() on a 1162306a36Sopenharmony_ci * sub-word of the value. This is generally true for anything LL/SC although 1262306a36Sopenharmony_ci * you'd be hard pressed to find anything useful in architecture specifications 1362306a36Sopenharmony_ci * about this. If your architecture cannot do this you might be better off with 1462306a36Sopenharmony_ci * a test-and-set. 1562306a36Sopenharmony_ci * 1662306a36Sopenharmony_ci * It further assumes atomic_*_release() + atomic_*_acquire() is RCpc and hence 1762306a36Sopenharmony_ci * uses atomic_fetch_add() which is RCsc to create an RCsc hot path, along with 1862306a36Sopenharmony_ci * a full fence after the spin to upgrade the otherwise-RCpc 1962306a36Sopenharmony_ci * atomic_cond_read_acquire(). 2062306a36Sopenharmony_ci * 2162306a36Sopenharmony_ci * The implementation uses smp_cond_load_acquire() to spin, so if the 2262306a36Sopenharmony_ci * architecture has WFE like instructions to sleep instead of poll for word 2362306a36Sopenharmony_ci * modifications be sure to implement that (see ARM64 for example). 2462306a36Sopenharmony_ci * 2562306a36Sopenharmony_ci */ 2662306a36Sopenharmony_ci 2762306a36Sopenharmony_ci#ifndef __ASM_GENERIC_SPINLOCK_H 2862306a36Sopenharmony_ci#define __ASM_GENERIC_SPINLOCK_H 2962306a36Sopenharmony_ci 3062306a36Sopenharmony_ci#include <linux/atomic.h> 3162306a36Sopenharmony_ci#include <asm-generic/spinlock_types.h> 3262306a36Sopenharmony_ci 3362306a36Sopenharmony_cistatic __always_inline void arch_spin_lock(arch_spinlock_t *lock) 3462306a36Sopenharmony_ci{ 3562306a36Sopenharmony_ci u32 val = atomic_fetch_add(1<<16, lock); 3662306a36Sopenharmony_ci u16 ticket = val >> 16; 3762306a36Sopenharmony_ci 3862306a36Sopenharmony_ci if (ticket == (u16)val) 3962306a36Sopenharmony_ci return; 4062306a36Sopenharmony_ci 4162306a36Sopenharmony_ci /* 4262306a36Sopenharmony_ci * atomic_cond_read_acquire() is RCpc, but rather than defining a 4362306a36Sopenharmony_ci * custom cond_read_rcsc() here we just emit a full fence. We only 4462306a36Sopenharmony_ci * need the prior reads before subsequent writes ordering from 4562306a36Sopenharmony_ci * smb_mb(), but as atomic_cond_read_acquire() just emits reads and we 4662306a36Sopenharmony_ci * have no outstanding writes due to the atomic_fetch_add() the extra 4762306a36Sopenharmony_ci * orderings are free. 4862306a36Sopenharmony_ci */ 4962306a36Sopenharmony_ci atomic_cond_read_acquire(lock, ticket == (u16)VAL); 5062306a36Sopenharmony_ci smp_mb(); 5162306a36Sopenharmony_ci} 5262306a36Sopenharmony_ci 5362306a36Sopenharmony_cistatic __always_inline bool arch_spin_trylock(arch_spinlock_t *lock) 5462306a36Sopenharmony_ci{ 5562306a36Sopenharmony_ci u32 old = atomic_read(lock); 5662306a36Sopenharmony_ci 5762306a36Sopenharmony_ci if ((old >> 16) != (old & 0xffff)) 5862306a36Sopenharmony_ci return false; 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_ci return atomic_try_cmpxchg(lock, &old, old + (1<<16)); /* SC, for RCsc */ 6162306a36Sopenharmony_ci} 6262306a36Sopenharmony_ci 6362306a36Sopenharmony_cistatic __always_inline void arch_spin_unlock(arch_spinlock_t *lock) 6462306a36Sopenharmony_ci{ 6562306a36Sopenharmony_ci u16 *ptr = (u16 *)lock + IS_ENABLED(CONFIG_CPU_BIG_ENDIAN); 6662306a36Sopenharmony_ci u32 val = atomic_read(lock); 6762306a36Sopenharmony_ci 6862306a36Sopenharmony_ci smp_store_release(ptr, (u16)val + 1); 6962306a36Sopenharmony_ci} 7062306a36Sopenharmony_ci 7162306a36Sopenharmony_cistatic __always_inline int arch_spin_is_locked(arch_spinlock_t *lock) 7262306a36Sopenharmony_ci{ 7362306a36Sopenharmony_ci u32 val = atomic_read(lock); 7462306a36Sopenharmony_ci 7562306a36Sopenharmony_ci return ((val >> 16) != (val & 0xffff)); 7662306a36Sopenharmony_ci} 7762306a36Sopenharmony_ci 7862306a36Sopenharmony_cistatic __always_inline int arch_spin_is_contended(arch_spinlock_t *lock) 7962306a36Sopenharmony_ci{ 8062306a36Sopenharmony_ci u32 val = atomic_read(lock); 8162306a36Sopenharmony_ci 8262306a36Sopenharmony_ci return (s16)((val >> 16) - (val & 0xffff)) > 1; 8362306a36Sopenharmony_ci} 8462306a36Sopenharmony_ci 8562306a36Sopenharmony_cistatic __always_inline int arch_spin_value_unlocked(arch_spinlock_t lock) 8662306a36Sopenharmony_ci{ 8762306a36Sopenharmony_ci return !arch_spin_is_locked(&lock); 8862306a36Sopenharmony_ci} 8962306a36Sopenharmony_ci 9062306a36Sopenharmony_ci#include <asm/qrwlock.h> 9162306a36Sopenharmony_ci 9262306a36Sopenharmony_ci#endif /* __ASM_GENERIC_SPINLOCK_H */ 93