mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2025-01-14 20:06:34 +07:00
3f6aa0b113
The sparc32 version of arch_write_unlock() is just a plain assignment. Unfortunately this allows the compiler to schedule side-effects in a protected region to occur after the HW-level unlock, which is broken. E.g., the following trivial test case gets miscompiled: #include <linux/spinlock.h> rwlock_t lock; int counter; void foo(void) { write_lock(&lock); ++counter; write_unlock(&lock); } Fixed by adding a compiler memory barrier to arch_write_unlock(). The sparc64 version combines the barrier and assignment into a single asm(), and implements the operation as a static inline, so that's what I did too. Compile-tested with sparc32_defconfig + CONFIG_SMP=y. Signed-off-by: Mikael Pettersson <mikpe@it.uu.se> Signed-off-by: David S. Miller <davem@davemloft.net>
201 lines
4.7 KiB
C
201 lines
4.7 KiB
C
/* spinlock.h: 32-bit Sparc spinlock support.
|
|
*
|
|
* Copyright (C) 1997 David S. Miller (davem@caip.rutgers.edu)
|
|
*/
|
|
|
|
#ifndef __SPARC_SPINLOCK_H
|
|
#define __SPARC_SPINLOCK_H
|
|
|
|
#ifndef __ASSEMBLY__
|
|
|
|
#include <asm/psr.h>
|
|
#include <asm/processor.h> /* for cpu_relax */
|
|
|
|
#define arch_spin_is_locked(lock) (*((volatile unsigned char *)(lock)) != 0)
|
|
|
|
#define arch_spin_unlock_wait(lock) \
|
|
do { while (arch_spin_is_locked(lock)) cpu_relax(); } while (0)
|
|
|
|
static inline void arch_spin_lock(arch_spinlock_t *lock)
|
|
{
|
|
__asm__ __volatile__(
|
|
"\n1:\n\t"
|
|
"ldstub [%0], %%g2\n\t"
|
|
"orcc %%g2, 0x0, %%g0\n\t"
|
|
"bne,a 2f\n\t"
|
|
" ldub [%0], %%g2\n\t"
|
|
".subsection 2\n"
|
|
"2:\n\t"
|
|
"orcc %%g2, 0x0, %%g0\n\t"
|
|
"bne,a 2b\n\t"
|
|
" ldub [%0], %%g2\n\t"
|
|
"b,a 1b\n\t"
|
|
".previous\n"
|
|
: /* no outputs */
|
|
: "r" (lock)
|
|
: "g2", "memory", "cc");
|
|
}
|
|
|
|
static inline int arch_spin_trylock(arch_spinlock_t *lock)
|
|
{
|
|
unsigned int result;
|
|
__asm__ __volatile__("ldstub [%1], %0"
|
|
: "=r" (result)
|
|
: "r" (lock)
|
|
: "memory");
|
|
return (result == 0);
|
|
}
|
|
|
|
static inline void arch_spin_unlock(arch_spinlock_t *lock)
|
|
{
|
|
__asm__ __volatile__("stb %%g0, [%0]" : : "r" (lock) : "memory");
|
|
}
|
|
|
|
/* Read-write spinlocks, allowing multiple readers
|
|
* but only one writer.
|
|
*
|
|
* NOTE! it is quite common to have readers in interrupts
|
|
* but no interrupt writers. For those circumstances we
|
|
* can "mix" irq-safe locks - any writer needs to get a
|
|
* irq-safe write-lock, but readers can get non-irqsafe
|
|
* read-locks.
|
|
*
|
|
* XXX This might create some problems with my dual spinlock
|
|
* XXX scheme, deadlocks etc. -DaveM
|
|
*
|
|
* Sort of like atomic_t's on Sparc, but even more clever.
|
|
*
|
|
* ------------------------------------
|
|
* | 24-bit counter | wlock | arch_rwlock_t
|
|
* ------------------------------------
|
|
* 31 8 7 0
|
|
*
|
|
* wlock signifies the one writer is in or somebody is updating
|
|
* counter. For a writer, if he successfully acquires the wlock,
|
|
* but counter is non-zero, he has to release the lock and wait,
|
|
* till both counter and wlock are zero.
|
|
*
|
|
* Unfortunately this scheme limits us to ~16,000,000 cpus.
|
|
*/
|
|
static inline void __arch_read_lock(arch_rwlock_t *rw)
|
|
{
|
|
register arch_rwlock_t *lp asm("g1");
|
|
lp = rw;
|
|
__asm__ __volatile__(
|
|
"mov %%o7, %%g4\n\t"
|
|
"call ___rw_read_enter\n\t"
|
|
" ldstub [%%g1 + 3], %%g2\n"
|
|
: /* no outputs */
|
|
: "r" (lp)
|
|
: "g2", "g4", "memory", "cc");
|
|
}
|
|
|
|
#define arch_read_lock(lock) \
|
|
do { unsigned long flags; \
|
|
local_irq_save(flags); \
|
|
__arch_read_lock(lock); \
|
|
local_irq_restore(flags); \
|
|
} while(0)
|
|
|
|
static inline void __arch_read_unlock(arch_rwlock_t *rw)
|
|
{
|
|
register arch_rwlock_t *lp asm("g1");
|
|
lp = rw;
|
|
__asm__ __volatile__(
|
|
"mov %%o7, %%g4\n\t"
|
|
"call ___rw_read_exit\n\t"
|
|
" ldstub [%%g1 + 3], %%g2\n"
|
|
: /* no outputs */
|
|
: "r" (lp)
|
|
: "g2", "g4", "memory", "cc");
|
|
}
|
|
|
|
#define arch_read_unlock(lock) \
|
|
do { unsigned long flags; \
|
|
local_irq_save(flags); \
|
|
__arch_read_unlock(lock); \
|
|
local_irq_restore(flags); \
|
|
} while(0)
|
|
|
|
static inline void arch_write_lock(arch_rwlock_t *rw)
|
|
{
|
|
register arch_rwlock_t *lp asm("g1");
|
|
lp = rw;
|
|
__asm__ __volatile__(
|
|
"mov %%o7, %%g4\n\t"
|
|
"call ___rw_write_enter\n\t"
|
|
" ldstub [%%g1 + 3], %%g2\n"
|
|
: /* no outputs */
|
|
: "r" (lp)
|
|
: "g2", "g4", "memory", "cc");
|
|
*(volatile __u32 *)&lp->lock = ~0U;
|
|
}
|
|
|
|
static void inline arch_write_unlock(arch_rwlock_t *lock)
|
|
{
|
|
__asm__ __volatile__(
|
|
" st %%g0, [%0]"
|
|
: /* no outputs */
|
|
: "r" (lock)
|
|
: "memory");
|
|
}
|
|
|
|
static inline int arch_write_trylock(arch_rwlock_t *rw)
|
|
{
|
|
unsigned int val;
|
|
|
|
__asm__ __volatile__("ldstub [%1 + 3], %0"
|
|
: "=r" (val)
|
|
: "r" (&rw->lock)
|
|
: "memory");
|
|
|
|
if (val == 0) {
|
|
val = rw->lock & ~0xff;
|
|
if (val)
|
|
((volatile u8*)&rw->lock)[3] = 0;
|
|
else
|
|
*(volatile u32*)&rw->lock = ~0U;
|
|
}
|
|
|
|
return (val == 0);
|
|
}
|
|
|
|
static inline int __arch_read_trylock(arch_rwlock_t *rw)
|
|
{
|
|
register arch_rwlock_t *lp asm("g1");
|
|
register int res asm("o0");
|
|
lp = rw;
|
|
__asm__ __volatile__(
|
|
"mov %%o7, %%g4\n\t"
|
|
"call ___rw_read_try\n\t"
|
|
" ldstub [%%g1 + 3], %%g2\n"
|
|
: "=r" (res)
|
|
: "r" (lp)
|
|
: "g2", "g4", "memory", "cc");
|
|
return res;
|
|
}
|
|
|
|
#define arch_read_trylock(lock) \
|
|
({ unsigned long flags; \
|
|
int res; \
|
|
local_irq_save(flags); \
|
|
res = __arch_read_trylock(lock); \
|
|
local_irq_restore(flags); \
|
|
res; \
|
|
})
|
|
|
|
#define arch_spin_lock_flags(lock, flags) arch_spin_lock(lock)
|
|
#define arch_read_lock_flags(rw, flags) arch_read_lock(rw)
|
|
#define arch_write_lock_flags(rw, flags) arch_write_lock(rw)
|
|
|
|
#define arch_spin_relax(lock) cpu_relax()
|
|
#define arch_read_relax(lock) cpu_relax()
|
|
#define arch_write_relax(lock) cpu_relax()
|
|
|
|
#define arch_read_can_lock(rw) (!((rw)->lock & 0xff))
|
|
#define arch_write_can_lock(rw) (!(rw)->lock)
|
|
|
|
#endif /* !(__ASSEMBLY__) */
|
|
|
|
#endif /* __SPARC_SPINLOCK_H */
|