On Mon, Oct 26, 2015 at 05:50:52PM +0800, Boqun Feng wrote:
> This patch fixes two problems to make value-returning atomics and
> {cmp}xchg fully ordered on PPC.
> 
> According to memory-barriers.txt:
> 
> > Any atomic operation that modifies some state in memory and returns
> > information about the state (old or new) implies an SMP-conditional
> > general memory barrier (smp_mb()) on each side of the actual
> > operation ...
> 
> which means these operations should be fully ordered. However on PPC,
> PPC_ATOMIC_ENTRY_BARRIER is the barrier before the actual operation,
> which is currently "lwsync" if SMP=y. The leading "lwsync" can not
> guarantee fully ordered atomics, according to Paul Mckenney:
> 
> https://lkml.org/lkml/2015/10/14/970
> 
> To fix this, we define PPC_ATOMIC_ENTRY_BARRIER as "sync" to guarantee
> the fully-ordered semantics.
> 
> This also makes futex atomics fully ordered, which can avoid possible
> memory ordering problems if userspace code relies on futex system call
> for fully ordered semantics.
> 
> Another thing to fix is that xchg, cmpxchg and their atomic{64}_
> versions are currently RELEASE+ACQUIRE, which are not fully ordered.
> 
> So also replace PPC_RELEASE_BARRIER and PPC_ACQUIRE_BARRIER with
> PPC_ATOMIC_ENTRY_BARRIER and PPC_ATOMIC_EXIT_BARRIER in
> __{cmp,}xchg_{u32,u64} respectively to guarantee fully ordered semantics
> of atomic{,64}_{cmp,}xchg() and {cmp,}xchg(), as a complement of commit
> b97021f85517 ("powerpc: Fix atomic_xxx_return barrier semantics").
> 
> Cc: <sta...@vger.kernel.org> # 3.4+

Hmm.. I use the same Cc tag as v4, seems my git(2.6.2) send-email has a
weird behavior of composing Cc address?

I will resend this one soon, sorry ;-(

Regards,
Boqun

> Signed-off-by: Boqun Feng <boqun.f...@gmail.com>
> ---
> 
> Michael, I also change PPC_ATOMIC_ENTRY_BARRIER as "sync" if SMP=y in this
> version , which is different from the previous one, so request for a new ack.
> Thank you ;-)
> 
>  arch/powerpc/include/asm/cmpxchg.h | 16 ++++++++--------
>  arch/powerpc/include/asm/synch.h   |  2 +-
>  2 files changed, 9 insertions(+), 9 deletions(-)
> 
> diff --git a/arch/powerpc/include/asm/cmpxchg.h 
> b/arch/powerpc/include/asm/cmpxchg.h
> index ad6263c..d1a8d93 100644
> --- a/arch/powerpc/include/asm/cmpxchg.h
> +++ b/arch/powerpc/include/asm/cmpxchg.h
> @@ -18,12 +18,12 @@ __xchg_u32(volatile void *p, unsigned long val)
>       unsigned long prev;
>  
>       __asm__ __volatile__(
> -     PPC_RELEASE_BARRIER
> +     PPC_ATOMIC_ENTRY_BARRIER
>  "1:  lwarx   %0,0,%2 \n"
>       PPC405_ERR77(0,%2)
>  "    stwcx.  %3,0,%2 \n\
>       bne-    1b"
> -     PPC_ACQUIRE_BARRIER
> +     PPC_ATOMIC_EXIT_BARRIER
>       : "=&r" (prev), "+m" (*(volatile unsigned int *)p)
>       : "r" (p), "r" (val)
>       : "cc", "memory");
> @@ -61,12 +61,12 @@ __xchg_u64(volatile void *p, unsigned long val)
>       unsigned long prev;
>  
>       __asm__ __volatile__(
> -     PPC_RELEASE_BARRIER
> +     PPC_ATOMIC_ENTRY_BARRIER
>  "1:  ldarx   %0,0,%2 \n"
>       PPC405_ERR77(0,%2)
>  "    stdcx.  %3,0,%2 \n\
>       bne-    1b"
> -     PPC_ACQUIRE_BARRIER
> +     PPC_ATOMIC_EXIT_BARRIER
>       : "=&r" (prev), "+m" (*(volatile unsigned long *)p)
>       : "r" (p), "r" (val)
>       : "cc", "memory");
> @@ -151,14 +151,14 @@ __cmpxchg_u32(volatile unsigned int *p, unsigned long 
> old, unsigned long new)
>       unsigned int prev;
>  
>       __asm__ __volatile__ (
> -     PPC_RELEASE_BARRIER
> +     PPC_ATOMIC_ENTRY_BARRIER
>  "1:  lwarx   %0,0,%2         # __cmpxchg_u32\n\
>       cmpw    0,%0,%3\n\
>       bne-    2f\n"
>       PPC405_ERR77(0,%2)
>  "    stwcx.  %4,0,%2\n\
>       bne-    1b"
> -     PPC_ACQUIRE_BARRIER
> +     PPC_ATOMIC_EXIT_BARRIER
>       "\n\
>  2:"
>       : "=&r" (prev), "+m" (*p)
> @@ -197,13 +197,13 @@ __cmpxchg_u64(volatile unsigned long *p, unsigned long 
> old, unsigned long new)
>       unsigned long prev;
>  
>       __asm__ __volatile__ (
> -     PPC_RELEASE_BARRIER
> +     PPC_ATOMIC_ENTRY_BARRIER
>  "1:  ldarx   %0,0,%2         # __cmpxchg_u64\n\
>       cmpd    0,%0,%3\n\
>       bne-    2f\n\
>       stdcx.  %4,0,%2\n\
>       bne-    1b"
> -     PPC_ACQUIRE_BARRIER
> +     PPC_ATOMIC_EXIT_BARRIER
>       "\n\
>  2:"
>       : "=&r" (prev), "+m" (*p)
> diff --git a/arch/powerpc/include/asm/synch.h 
> b/arch/powerpc/include/asm/synch.h
> index e682a71..c508686 100644
> --- a/arch/powerpc/include/asm/synch.h
> +++ b/arch/powerpc/include/asm/synch.h
> @@ -44,7 +44,7 @@ static inline void isync(void)
>       MAKE_LWSYNC_SECTION_ENTRY(97, __lwsync_fixup);
>  #define PPC_ACQUIRE_BARRIER   "\n" stringify_in_c(__PPC_ACQUIRE_BARRIER)
>  #define PPC_RELEASE_BARRIER   stringify_in_c(LWSYNC) "\n"
> -#define PPC_ATOMIC_ENTRY_BARRIER "\n" stringify_in_c(LWSYNC) "\n"
> +#define PPC_ATOMIC_ENTRY_BARRIER "\n" stringify_in_c(sync) "\n"
>  #define PPC_ATOMIC_EXIT_BARRIER       "\n" stringify_in_c(sync) "\n"
>  #else
>  #define PPC_ACQUIRE_BARRIER
> -- 
> 2.6.2
> 

Attachment: signature.asc
Description: PGP signature

_______________________________________________
Linuxppc-dev mailing list
Linuxppc-dev@lists.ozlabs.org
https://lists.ozlabs.org/listinfo/linuxppc-dev

Reply via email to