3fcbb8260a
In 4.19-rc1, Eugeniy reported weird boot and IO errors on ARC HSDK | INFO: task syslogd:77 blocked for more than 10 seconds. | Not tainted 4.19.0-rc1-00007-gf213acea4e88 #40 | "echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this | message. | syslogd D 0 77 76 0x00000000 | | Stack Trace: | __switch_to+0x0/0xac | __schedule+0x1b2/0x730 | io_schedule+0x5c/0xc0 | __lock_page+0x98/0xdc | find_lock_entry+0x38/0x100 | shmem_getpage_gfp.isra.3+0x82/0xbfc | shmem_fault+0x46/0x138 | handle_mm_fault+0x5bc/0x924 | do_page_fault+0x100/0x2b8 | ret_from_exception+0x0/0x8 He bisected to84c6591103
("locking/atomics, asm-generic/bitops/lock.h: Rewrite using atomic_fetch_*()") This commit however only unmasked the real issue introduced by commit4aef66c8ae
("locking/atomic, arch/arc: Fix build") which missed the retry-if-scond-failed branch in atomic_fetch_##op() macros. The bisected commit started using atomic_fetch_##op() macros for building the rest of atomics. Fixes:4aef66c8ae
("locking/atomic, arch/arc: Fix build") Reported-by: Eugeniy Paltsev <paltsev@synopsys.com> Acked-by: Peter Zijlstra (Intel) <peterz@infradead.org> Signed-off-by: Will Deacon <will.deacon@arm.com> Signed-off-by: Vineet Gupta <vgupta@synopsys.com> [vgupta: wrote changelog]
563 lines
13 KiB
C
563 lines
13 KiB
C
/*
|
|
* Copyright (C) 2004, 2007-2010, 2011-2012 Synopsys, Inc. (www.synopsys.com)
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License version 2 as
|
|
* published by the Free Software Foundation.
|
|
*/
|
|
|
|
#ifndef _ASM_ARC_ATOMIC_H
|
|
#define _ASM_ARC_ATOMIC_H
|
|
|
|
#ifndef __ASSEMBLY__
|
|
|
|
#include <linux/types.h>
|
|
#include <linux/compiler.h>
|
|
#include <asm/cmpxchg.h>
|
|
#include <asm/barrier.h>
|
|
#include <asm/smp.h>
|
|
|
|
#define ATOMIC_INIT(i) { (i) }
|
|
|
|
#ifndef CONFIG_ARC_PLAT_EZNPS
|
|
|
|
#define atomic_read(v) READ_ONCE((v)->counter)
|
|
|
|
#ifdef CONFIG_ARC_HAS_LLSC
|
|
|
|
#define atomic_set(v, i) WRITE_ONCE(((v)->counter), (i))
|
|
|
|
#define ATOMIC_OP(op, c_op, asm_op) \
|
|
static inline void atomic_##op(int i, atomic_t *v) \
|
|
{ \
|
|
unsigned int val; \
|
|
\
|
|
__asm__ __volatile__( \
|
|
"1: llock %[val], [%[ctr]] \n" \
|
|
" " #asm_op " %[val], %[val], %[i] \n" \
|
|
" scond %[val], [%[ctr]] \n" \
|
|
" bnz 1b \n" \
|
|
: [val] "=&r" (val) /* Early clobber to prevent reg reuse */ \
|
|
: [ctr] "r" (&v->counter), /* Not "m": llock only supports reg direct addr mode */ \
|
|
[i] "ir" (i) \
|
|
: "cc"); \
|
|
} \
|
|
|
|
#define ATOMIC_OP_RETURN(op, c_op, asm_op) \
|
|
static inline int atomic_##op##_return(int i, atomic_t *v) \
|
|
{ \
|
|
unsigned int val; \
|
|
\
|
|
/* \
|
|
* Explicit full memory barrier needed before/after as \
|
|
* LLOCK/SCOND thmeselves don't provide any such semantics \
|
|
*/ \
|
|
smp_mb(); \
|
|
\
|
|
__asm__ __volatile__( \
|
|
"1: llock %[val], [%[ctr]] \n" \
|
|
" " #asm_op " %[val], %[val], %[i] \n" \
|
|
" scond %[val], [%[ctr]] \n" \
|
|
" bnz 1b \n" \
|
|
: [val] "=&r" (val) \
|
|
: [ctr] "r" (&v->counter), \
|
|
[i] "ir" (i) \
|
|
: "cc"); \
|
|
\
|
|
smp_mb(); \
|
|
\
|
|
return val; \
|
|
}
|
|
|
|
#define ATOMIC_FETCH_OP(op, c_op, asm_op) \
|
|
static inline int atomic_fetch_##op(int i, atomic_t *v) \
|
|
{ \
|
|
unsigned int val, orig; \
|
|
\
|
|
/* \
|
|
* Explicit full memory barrier needed before/after as \
|
|
* LLOCK/SCOND thmeselves don't provide any such semantics \
|
|
*/ \
|
|
smp_mb(); \
|
|
\
|
|
__asm__ __volatile__( \
|
|
"1: llock %[orig], [%[ctr]] \n" \
|
|
" " #asm_op " %[val], %[orig], %[i] \n" \
|
|
" scond %[val], [%[ctr]] \n" \
|
|
" bnz 1b \n" \
|
|
: [val] "=&r" (val), \
|
|
[orig] "=&r" (orig) \
|
|
: [ctr] "r" (&v->counter), \
|
|
[i] "ir" (i) \
|
|
: "cc"); \
|
|
\
|
|
smp_mb(); \
|
|
\
|
|
return orig; \
|
|
}
|
|
|
|
#else /* !CONFIG_ARC_HAS_LLSC */
|
|
|
|
#ifndef CONFIG_SMP
|
|
|
|
/* violating atomic_xxx API locking protocol in UP for optimization sake */
|
|
#define atomic_set(v, i) WRITE_ONCE(((v)->counter), (i))
|
|
|
|
#else
|
|
|
|
static inline void atomic_set(atomic_t *v, int i)
|
|
{
|
|
/*
|
|
* Independent of hardware support, all of the atomic_xxx() APIs need
|
|
* to follow the same locking rules to make sure that a "hardware"
|
|
* atomic insn (e.g. LD) doesn't clobber an "emulated" atomic insn
|
|
* sequence
|
|
*
|
|
* Thus atomic_set() despite being 1 insn (and seemingly atomic)
|
|
* requires the locking.
|
|
*/
|
|
unsigned long flags;
|
|
|
|
atomic_ops_lock(flags);
|
|
WRITE_ONCE(v->counter, i);
|
|
atomic_ops_unlock(flags);
|
|
}
|
|
|
|
#define atomic_set_release(v, i) atomic_set((v), (i))
|
|
|
|
#endif
|
|
|
|
/*
|
|
* Non hardware assisted Atomic-R-M-W
|
|
* Locking would change to irq-disabling only (UP) and spinlocks (SMP)
|
|
*/
|
|
|
|
#define ATOMIC_OP(op, c_op, asm_op) \
|
|
static inline void atomic_##op(int i, atomic_t *v) \
|
|
{ \
|
|
unsigned long flags; \
|
|
\
|
|
atomic_ops_lock(flags); \
|
|
v->counter c_op i; \
|
|
atomic_ops_unlock(flags); \
|
|
}
|
|
|
|
#define ATOMIC_OP_RETURN(op, c_op, asm_op) \
|
|
static inline int atomic_##op##_return(int i, atomic_t *v) \
|
|
{ \
|
|
unsigned long flags; \
|
|
unsigned long temp; \
|
|
\
|
|
/* \
|
|
* spin lock/unlock provides the needed smp_mb() before/after \
|
|
*/ \
|
|
atomic_ops_lock(flags); \
|
|
temp = v->counter; \
|
|
temp c_op i; \
|
|
v->counter = temp; \
|
|
atomic_ops_unlock(flags); \
|
|
\
|
|
return temp; \
|
|
}
|
|
|
|
#define ATOMIC_FETCH_OP(op, c_op, asm_op) \
|
|
static inline int atomic_fetch_##op(int i, atomic_t *v) \
|
|
{ \
|
|
unsigned long flags; \
|
|
unsigned long orig; \
|
|
\
|
|
/* \
|
|
* spin lock/unlock provides the needed smp_mb() before/after \
|
|
*/ \
|
|
atomic_ops_lock(flags); \
|
|
orig = v->counter; \
|
|
v->counter c_op i; \
|
|
atomic_ops_unlock(flags); \
|
|
\
|
|
return orig; \
|
|
}
|
|
|
|
#endif /* !CONFIG_ARC_HAS_LLSC */
|
|
|
|
#define ATOMIC_OPS(op, c_op, asm_op) \
|
|
ATOMIC_OP(op, c_op, asm_op) \
|
|
ATOMIC_OP_RETURN(op, c_op, asm_op) \
|
|
ATOMIC_FETCH_OP(op, c_op, asm_op)
|
|
|
|
ATOMIC_OPS(add, +=, add)
|
|
ATOMIC_OPS(sub, -=, sub)
|
|
|
|
#define atomic_andnot atomic_andnot
|
|
#define atomic_fetch_andnot atomic_fetch_andnot
|
|
|
|
#undef ATOMIC_OPS
|
|
#define ATOMIC_OPS(op, c_op, asm_op) \
|
|
ATOMIC_OP(op, c_op, asm_op) \
|
|
ATOMIC_FETCH_OP(op, c_op, asm_op)
|
|
|
|
ATOMIC_OPS(and, &=, and)
|
|
ATOMIC_OPS(andnot, &= ~, bic)
|
|
ATOMIC_OPS(or, |=, or)
|
|
ATOMIC_OPS(xor, ^=, xor)
|
|
|
|
#else /* CONFIG_ARC_PLAT_EZNPS */
|
|
|
|
static inline int atomic_read(const atomic_t *v)
|
|
{
|
|
int temp;
|
|
|
|
__asm__ __volatile__(
|
|
" ld.di %0, [%1]"
|
|
: "=r"(temp)
|
|
: "r"(&v->counter)
|
|
: "memory");
|
|
return temp;
|
|
}
|
|
|
|
static inline void atomic_set(atomic_t *v, int i)
|
|
{
|
|
__asm__ __volatile__(
|
|
" st.di %0,[%1]"
|
|
:
|
|
: "r"(i), "r"(&v->counter)
|
|
: "memory");
|
|
}
|
|
|
|
#define ATOMIC_OP(op, c_op, asm_op) \
|
|
static inline void atomic_##op(int i, atomic_t *v) \
|
|
{ \
|
|
__asm__ __volatile__( \
|
|
" mov r2, %0\n" \
|
|
" mov r3, %1\n" \
|
|
" .word %2\n" \
|
|
: \
|
|
: "r"(i), "r"(&v->counter), "i"(asm_op) \
|
|
: "r2", "r3", "memory"); \
|
|
} \
|
|
|
|
#define ATOMIC_OP_RETURN(op, c_op, asm_op) \
|
|
static inline int atomic_##op##_return(int i, atomic_t *v) \
|
|
{ \
|
|
unsigned int temp = i; \
|
|
\
|
|
/* Explicit full memory barrier needed before/after */ \
|
|
smp_mb(); \
|
|
\
|
|
__asm__ __volatile__( \
|
|
" mov r2, %0\n" \
|
|
" mov r3, %1\n" \
|
|
" .word %2\n" \
|
|
" mov %0, r2" \
|
|
: "+r"(temp) \
|
|
: "r"(&v->counter), "i"(asm_op) \
|
|
: "r2", "r3", "memory"); \
|
|
\
|
|
smp_mb(); \
|
|
\
|
|
temp c_op i; \
|
|
\
|
|
return temp; \
|
|
}
|
|
|
|
#define ATOMIC_FETCH_OP(op, c_op, asm_op) \
|
|
static inline int atomic_fetch_##op(int i, atomic_t *v) \
|
|
{ \
|
|
unsigned int temp = i; \
|
|
\
|
|
/* Explicit full memory barrier needed before/after */ \
|
|
smp_mb(); \
|
|
\
|
|
__asm__ __volatile__( \
|
|
" mov r2, %0\n" \
|
|
" mov r3, %1\n" \
|
|
" .word %2\n" \
|
|
" mov %0, r2" \
|
|
: "+r"(temp) \
|
|
: "r"(&v->counter), "i"(asm_op) \
|
|
: "r2", "r3", "memory"); \
|
|
\
|
|
smp_mb(); \
|
|
\
|
|
return temp; \
|
|
}
|
|
|
|
#define ATOMIC_OPS(op, c_op, asm_op) \
|
|
ATOMIC_OP(op, c_op, asm_op) \
|
|
ATOMIC_OP_RETURN(op, c_op, asm_op) \
|
|
ATOMIC_FETCH_OP(op, c_op, asm_op)
|
|
|
|
ATOMIC_OPS(add, +=, CTOP_INST_AADD_DI_R2_R2_R3)
|
|
#define atomic_sub(i, v) atomic_add(-(i), (v))
|
|
#define atomic_sub_return(i, v) atomic_add_return(-(i), (v))
|
|
#define atomic_fetch_sub(i, v) atomic_fetch_add(-(i), (v))
|
|
|
|
#undef ATOMIC_OPS
|
|
#define ATOMIC_OPS(op, c_op, asm_op) \
|
|
ATOMIC_OP(op, c_op, asm_op) \
|
|
ATOMIC_FETCH_OP(op, c_op, asm_op)
|
|
|
|
ATOMIC_OPS(and, &=, CTOP_INST_AAND_DI_R2_R2_R3)
|
|
ATOMIC_OPS(or, |=, CTOP_INST_AOR_DI_R2_R2_R3)
|
|
ATOMIC_OPS(xor, ^=, CTOP_INST_AXOR_DI_R2_R2_R3)
|
|
|
|
#endif /* CONFIG_ARC_PLAT_EZNPS */
|
|
|
|
#undef ATOMIC_OPS
|
|
#undef ATOMIC_FETCH_OP
|
|
#undef ATOMIC_OP_RETURN
|
|
#undef ATOMIC_OP
|
|
|
|
#ifdef CONFIG_GENERIC_ATOMIC64
|
|
|
|
#include <asm-generic/atomic64.h>
|
|
|
|
#else /* Kconfig ensures this is only enabled with needed h/w assist */
|
|
|
|
/*
|
|
* ARCv2 supports 64-bit exclusive load (LLOCKD) / store (SCONDD)
|
|
* - The address HAS to be 64-bit aligned
|
|
* - There are 2 semantics involved here:
|
|
* = exclusive implies no interim update between load/store to same addr
|
|
* = both words are observed/updated together: this is guaranteed even
|
|
* for regular 64-bit load (LDD) / store (STD). Thus atomic64_set()
|
|
* is NOT required to use LLOCKD+SCONDD, STD suffices
|
|
*/
|
|
|
|
typedef struct {
|
|
aligned_u64 counter;
|
|
} atomic64_t;
|
|
|
|
#define ATOMIC64_INIT(a) { (a) }
|
|
|
|
static inline long long atomic64_read(const atomic64_t *v)
|
|
{
|
|
unsigned long long val;
|
|
|
|
__asm__ __volatile__(
|
|
" ldd %0, [%1] \n"
|
|
: "=r"(val)
|
|
: "r"(&v->counter));
|
|
|
|
return val;
|
|
}
|
|
|
|
static inline void atomic64_set(atomic64_t *v, long long a)
|
|
{
|
|
/*
|
|
* This could have been a simple assignment in "C" but would need
|
|
* explicit volatile. Otherwise gcc optimizers could elide the store
|
|
* which borked atomic64 self-test
|
|
* In the inline asm version, memory clobber needed for exact same
|
|
* reason, to tell gcc about the store.
|
|
*
|
|
* This however is not needed for sibling atomic64_add() etc since both
|
|
* load/store are explicitly done in inline asm. As long as API is used
|
|
* for each access, gcc has no way to optimize away any load/store
|
|
*/
|
|
__asm__ __volatile__(
|
|
" std %0, [%1] \n"
|
|
:
|
|
: "r"(a), "r"(&v->counter)
|
|
: "memory");
|
|
}
|
|
|
|
#define ATOMIC64_OP(op, op1, op2) \
|
|
static inline void atomic64_##op(long long a, atomic64_t *v) \
|
|
{ \
|
|
unsigned long long val; \
|
|
\
|
|
__asm__ __volatile__( \
|
|
"1: \n" \
|
|
" llockd %0, [%1] \n" \
|
|
" " #op1 " %L0, %L0, %L2 \n" \
|
|
" " #op2 " %H0, %H0, %H2 \n" \
|
|
" scondd %0, [%1] \n" \
|
|
" bnz 1b \n" \
|
|
: "=&r"(val) \
|
|
: "r"(&v->counter), "ir"(a) \
|
|
: "cc"); \
|
|
} \
|
|
|
|
#define ATOMIC64_OP_RETURN(op, op1, op2) \
|
|
static inline long long atomic64_##op##_return(long long a, atomic64_t *v) \
|
|
{ \
|
|
unsigned long long val; \
|
|
\
|
|
smp_mb(); \
|
|
\
|
|
__asm__ __volatile__( \
|
|
"1: \n" \
|
|
" llockd %0, [%1] \n" \
|
|
" " #op1 " %L0, %L0, %L2 \n" \
|
|
" " #op2 " %H0, %H0, %H2 \n" \
|
|
" scondd %0, [%1] \n" \
|
|
" bnz 1b \n" \
|
|
: [val] "=&r"(val) \
|
|
: "r"(&v->counter), "ir"(a) \
|
|
: "cc"); /* memory clobber comes from smp_mb() */ \
|
|
\
|
|
smp_mb(); \
|
|
\
|
|
return val; \
|
|
}
|
|
|
|
#define ATOMIC64_FETCH_OP(op, op1, op2) \
|
|
static inline long long atomic64_fetch_##op(long long a, atomic64_t *v) \
|
|
{ \
|
|
unsigned long long val, orig; \
|
|
\
|
|
smp_mb(); \
|
|
\
|
|
__asm__ __volatile__( \
|
|
"1: \n" \
|
|
" llockd %0, [%2] \n" \
|
|
" " #op1 " %L1, %L0, %L3 \n" \
|
|
" " #op2 " %H1, %H0, %H3 \n" \
|
|
" scondd %1, [%2] \n" \
|
|
" bnz 1b \n" \
|
|
: "=&r"(orig), "=&r"(val) \
|
|
: "r"(&v->counter), "ir"(a) \
|
|
: "cc"); /* memory clobber comes from smp_mb() */ \
|
|
\
|
|
smp_mb(); \
|
|
\
|
|
return orig; \
|
|
}
|
|
|
|
#define ATOMIC64_OPS(op, op1, op2) \
|
|
ATOMIC64_OP(op, op1, op2) \
|
|
ATOMIC64_OP_RETURN(op, op1, op2) \
|
|
ATOMIC64_FETCH_OP(op, op1, op2)
|
|
|
|
#define atomic64_andnot atomic64_andnot
|
|
#define atomic64_fetch_andnot atomic64_fetch_andnot
|
|
|
|
ATOMIC64_OPS(add, add.f, adc)
|
|
ATOMIC64_OPS(sub, sub.f, sbc)
|
|
ATOMIC64_OPS(and, and, and)
|
|
ATOMIC64_OPS(andnot, bic, bic)
|
|
ATOMIC64_OPS(or, or, or)
|
|
ATOMIC64_OPS(xor, xor, xor)
|
|
|
|
#undef ATOMIC64_OPS
|
|
#undef ATOMIC64_FETCH_OP
|
|
#undef ATOMIC64_OP_RETURN
|
|
#undef ATOMIC64_OP
|
|
|
|
static inline long long
|
|
atomic64_cmpxchg(atomic64_t *ptr, long long expected, long long new)
|
|
{
|
|
long long prev;
|
|
|
|
smp_mb();
|
|
|
|
__asm__ __volatile__(
|
|
"1: llockd %0, [%1] \n"
|
|
" brne %L0, %L2, 2f \n"
|
|
" brne %H0, %H2, 2f \n"
|
|
" scondd %3, [%1] \n"
|
|
" bnz 1b \n"
|
|
"2: \n"
|
|
: "=&r"(prev)
|
|
: "r"(ptr), "ir"(expected), "r"(new)
|
|
: "cc"); /* memory clobber comes from smp_mb() */
|
|
|
|
smp_mb();
|
|
|
|
return prev;
|
|
}
|
|
|
|
static inline long long atomic64_xchg(atomic64_t *ptr, long long new)
|
|
{
|
|
long long prev;
|
|
|
|
smp_mb();
|
|
|
|
__asm__ __volatile__(
|
|
"1: llockd %0, [%1] \n"
|
|
" scondd %2, [%1] \n"
|
|
" bnz 1b \n"
|
|
"2: \n"
|
|
: "=&r"(prev)
|
|
: "r"(ptr), "r"(new)
|
|
: "cc"); /* memory clobber comes from smp_mb() */
|
|
|
|
smp_mb();
|
|
|
|
return prev;
|
|
}
|
|
|
|
/**
|
|
* atomic64_dec_if_positive - decrement by 1 if old value positive
|
|
* @v: pointer of type atomic64_t
|
|
*
|
|
* The function returns the old value of *v minus 1, even if
|
|
* the atomic variable, v, was not decremented.
|
|
*/
|
|
|
|
static inline long long atomic64_dec_if_positive(atomic64_t *v)
|
|
{
|
|
long long val;
|
|
|
|
smp_mb();
|
|
|
|
__asm__ __volatile__(
|
|
"1: llockd %0, [%1] \n"
|
|
" sub.f %L0, %L0, 1 # w0 - 1, set C on borrow\n"
|
|
" sub.c %H0, %H0, 1 # if C set, w1 - 1\n"
|
|
" brlt %H0, 0, 2f \n"
|
|
" scondd %0, [%1] \n"
|
|
" bnz 1b \n"
|
|
"2: \n"
|
|
: "=&r"(val)
|
|
: "r"(&v->counter)
|
|
: "cc"); /* memory clobber comes from smp_mb() */
|
|
|
|
smp_mb();
|
|
|
|
return val;
|
|
}
|
|
#define atomic64_dec_if_positive atomic64_dec_if_positive
|
|
|
|
/**
|
|
* atomic64_fetch_add_unless - add unless the number is a given value
|
|
* @v: pointer of type atomic64_t
|
|
* @a: the amount to add to v...
|
|
* @u: ...unless v is equal to u.
|
|
*
|
|
* Atomically adds @a to @v, if it was not @u.
|
|
* Returns the old value of @v
|
|
*/
|
|
static inline long long atomic64_fetch_add_unless(atomic64_t *v, long long a,
|
|
long long u)
|
|
{
|
|
long long old, temp;
|
|
|
|
smp_mb();
|
|
|
|
__asm__ __volatile__(
|
|
"1: llockd %0, [%2] \n"
|
|
" brne %L0, %L4, 2f # continue to add since v != u \n"
|
|
" breq.d %H0, %H4, 3f # return since v == u \n"
|
|
"2: \n"
|
|
" add.f %L1, %L0, %L3 \n"
|
|
" adc %H1, %H0, %H3 \n"
|
|
" scondd %1, [%2] \n"
|
|
" bnz 1b \n"
|
|
"3: \n"
|
|
: "=&r"(old), "=&r" (temp)
|
|
: "r"(&v->counter), "r"(a), "r"(u)
|
|
: "cc"); /* memory clobber comes from smp_mb() */
|
|
|
|
smp_mb();
|
|
|
|
return old;
|
|
}
|
|
#define atomic64_fetch_add_unless atomic64_fetch_add_unless
|
|
|
|
#endif /* !CONFIG_GENERIC_ATOMIC64 */
|
|
|
|
#endif /* !__ASSEMBLY__ */
|
|
|
|
#endif
|