arm64: atomics: fix use of acquire + release for full barrier semantics

author Will Deacon <will.deacon@arm.com>

Tue, 4 Feb 2014 12:29:12 +0000 (12:29 +0000)

committer Catalin Marinas <catalin.marinas@arm.com>

Fri, 7 Feb 2014 16:45:43 +0000 (16:45 +0000)
author Will Deacon <will.deacon@arm.com>
Tue, 4 Feb 2014 12:29:12 +0000 (12:29 +0000)
committer Catalin Marinas <catalin.marinas@arm.com>
Fri, 7 Feb 2014 16:45:43 +0000 (16:45 +0000)
diff --git a/arch/arm64/include/asm/atomic.h b/arch/arm64/include/asm/atomic.h

index 01de5aaa3edc112a42548a1b3906e4353bcce949..e32893e005d4763bbc59620bcc6178b9fabf08ff 100644 (file)
--- a/arch/arm64/include/asm/atomic.h
+++ b/arch/arm64/include/asm/atomic.h
@@ -64,7 +64,7 @@ static inline int atomic_add_return(int i, atomic_t *v)
         int result;
  
         asm volatile("// atomic_add_return\n"
-"1:    ldaxr   %w0, %2\n"
+"1:    ldxr    %w0, %2\n"
  "      add     %w0, %w0, %w3\n"
  "      stlxr   %w1, %w0, %2\n"
  "      cbnz    %w1, 1b"
@@ -72,6 +72,7 @@ static inline int atomic_add_return(int i, atomic_t *v)
         : "Ir" (i)
         : "cc", "memory");
  
+       smp_mb();
         return result;
  }
  
@@ -96,7 +97,7 @@ static inline int atomic_sub_return(int i, atomic_t *v)
         int result;
  
         asm volatile("// atomic_sub_return\n"
-"1:    ldaxr   %w0, %2\n"
+"1:    ldxr    %w0, %2\n"
  "      sub     %w0, %w0, %w3\n"
  "      stlxr   %w1, %w0, %2\n"
  "      cbnz    %w1, 1b"
@@ -104,6 +105,7 @@ static inline int atomic_sub_return(int i, atomic_t *v)
         : "Ir" (i)
         : "cc", "memory");
  
+       smp_mb();
         return result;
  }
  
@@ -112,17 +114,20 @@ static inline int atomic_cmpxchg(atomic_t *ptr, int old, int new)
         unsigned long tmp;
         int oldval;
  
+       smp_mb();
+
         asm volatile("// atomic_cmpxchg\n"
-"1:    ldaxr   %w1, %2\n"
+"1:    ldxr    %w1, %2\n"
  "      cmp     %w1, %w3\n"
  "      b.ne    2f\n"
-"      stlxr   %w0, %w4, %2\n"
+"      stxr    %w0, %w4, %2\n"
  "      cbnz    %w0, 1b\n"
  "2:"
         : "=&r" (tmp), "=&r" (oldval), "+Q" (ptr->counter)
         : "Ir" (old), "r" (new)
         : "cc", "memory");
  
+       smp_mb();
         return oldval;
  }
  
@@ -183,7 +188,7 @@ static inline long atomic64_add_return(long i, atomic64_t *v)
         unsigned long tmp;
  
         asm volatile("// atomic64_add_return\n"
-"1:    ldaxr   %0, %2\n"
+"1:    ldxr    %0, %2\n"
  "      add     %0, %0, %3\n"
  "      stlxr   %w1, %0, %2\n"
  "      cbnz    %w1, 1b"
@@ -191,6 +196,7 @@ static inline long atomic64_add_return(long i, atomic64_t *v)
         : "Ir" (i)
         : "cc", "memory");
  
+       smp_mb();
         return result;
  }
  
@@ -215,7 +221,7 @@ static inline long atomic64_sub_return(long i, atomic64_t *v)
         unsigned long tmp;
  
         asm volatile("// atomic64_sub_return\n"
-"1:    ldaxr   %0, %2\n"
+"1:    ldxr    %0, %2\n"
  "      sub     %0, %0, %3\n"
  "      stlxr   %w1, %0, %2\n"
  "      cbnz    %w1, 1b"
@@ -223,6 +229,7 @@ static inline long atomic64_sub_return(long i, atomic64_t *v)
         : "Ir" (i)
         : "cc", "memory");
  
+       smp_mb();
         return result;
  }
  
@@ -231,17 +238,20 @@ static inline long atomic64_cmpxchg(atomic64_t *ptr, long old, long new)
         long oldval;
         unsigned long res;
  
+       smp_mb();
+
         asm volatile("// atomic64_cmpxchg\n"
-"1:    ldaxr   %1, %2\n"
+"1:    ldxr    %1, %2\n"
  "      cmp     %1, %3\n"
  "      b.ne    2f\n"
-"      stlxr   %w0, %4, %2\n"
+"      stxr    %w0, %4, %2\n"
  "      cbnz    %w0, 1b\n"
  "2:"
         : "=&r" (res), "=&r" (oldval), "+Q" (ptr->counter)
         : "Ir" (old), "r" (new)
         : "cc", "memory");
  
+       smp_mb();
         return oldval;
  }
  
@@ -253,11 +263,12 @@ static inline long atomic64_dec_if_positive(atomic64_t *v)
         unsigned long tmp;
  
         asm volatile("// atomic64_dec_if_positive\n"
-"1:    ldaxr   %0, %2\n"
+"1:    ldxr    %0, %2\n"
  "      subs    %0, %0, #1\n"
  "      b.mi    2f\n"
  "      stlxr   %w1, %0, %2\n"
  "      cbnz    %w1, 1b\n"
+"      dmb     ish\n"
  "2:"
         : "=&r" (result), "=&r" (tmp), "+Q" (v->counter)
         :
diff --git a/arch/arm64/include/asm/cmpxchg.h b/arch/arm64/include/asm/cmpxchg.h

index 56166d7f4a258867d817804c4c17145952895a20..189390ce865334bb1417950400e12273edb3450a 100644 (file)
--- a/arch/arm64/include/asm/cmpxchg.h
+++ b/arch/arm64/include/asm/cmpxchg.h
@@ -29,7 +29,7 @@ static inline unsigned long __xchg(unsigned long x, volatile void *ptr, int size
         switch (size) {
         case 1:
                 asm volatile("//        __xchg1\n"
-               "1:     ldaxrb  %w0, %2\n"
+               "1:     ldxrb   %w0, %2\n"
                 "       stlxrb  %w1, %w3, %2\n"
                 "       cbnz    %w1, 1b\n"
                         : "=&r" (ret), "=&r" (tmp), "+Q" (*(u8 *)ptr)
@@ -38,7 +38,7 @@ static inline unsigned long __xchg(unsigned long x, volatile void *ptr, int size
                 break;
         case 2:
                 asm volatile("//        __xchg2\n"
-               "1:     ldaxrh  %w0, %2\n"
+               "1:     ldxrh   %w0, %2\n"
                 "       stlxrh  %w1, %w3, %2\n"
                 "       cbnz    %w1, 1b\n"
                         : "=&r" (ret), "=&r" (tmp), "+Q" (*(u16 *)ptr)
@@ -47,7 +47,7 @@ static inline unsigned long __xchg(unsigned long x, volatile void *ptr, int size
                 break;
         case 4:
                 asm volatile("//        __xchg4\n"
-               "1:     ldaxr   %w0, %2\n"
+               "1:     ldxr    %w0, %2\n"
                 "       stlxr   %w1, %w3, %2\n"
                 "       cbnz    %w1, 1b\n"
                         : "=&r" (ret), "=&r" (tmp), "+Q" (*(u32 *)ptr)
@@ -56,7 +56,7 @@ static inline unsigned long __xchg(unsigned long x, volatile void *ptr, int size
                 break;
         case 8:
                 asm volatile("//        __xchg8\n"
-               "1:     ldaxr   %0, %2\n"
+               "1:     ldxr    %0, %2\n"
                 "       stlxr   %w1, %3, %2\n"
                 "       cbnz    %w1, 1b\n"
                         : "=&r" (ret), "=&r" (tmp), "+Q" (*(u64 *)ptr)
@@ -67,6 +67,7 @@ static inline unsigned long __xchg(unsigned long x, volatile void *ptr, int size
                 BUILD_BUG();
         }
  
+       smp_mb();
         return ret;
  }
  
diff --git a/arch/arm64/include/asm/futex.h b/arch/arm64/include/asm/futex.h

index 78cc3aba5d69e9ff976be9226cd975860b0a31a0..572193d0005d7597cfcc15456df72f8efa3712f7 100644 (file)
--- a/arch/arm64/include/asm/futex.h
+++ b/arch/arm64/include/asm/futex.h
@@ -24,10 +24,11 @@
  
  #define __futex_atomic_op(insn, ret, oldval, uaddr, tmp, oparg)                \
         asm volatile(                                                   \
-"1:    ldaxr   %w1, %2\n"                                              \
+"1:    ldxr    %w1, %2\n"                                              \
         insn "\n"                                                       \
  "2:    stlxr   %w3, %w0, %2\n"                                         \
  "      cbnz    %w3, 1b\n"                                              \
+"      dmb     ish\n"                                                  \
  "3:\n"                                                                 \
  "      .pushsection .fixup,\"ax\"\n"                                   \
  "      .align  2\n"                                                    \
@@ -111,11 +112,12 @@ futex_atomic_cmpxchg_inatomic(u32 *uval, u32 __user *uaddr,
                 return -EFAULT;
  
         asm volatile("// futex_atomic_cmpxchg_inatomic\n"
-"1:    ldaxr   %w1, %2\n"
+"1:    ldxr    %w1, %2\n"
  "      sub     %w3, %w1, %w4\n"
  "      cbnz    %w3, 3f\n"
  "2:    stlxr   %w3, %w5, %2\n"
  "      cbnz    %w3, 1b\n"
+"      dmb     ish\n"
  "3:\n"
  "      .pushsection .fixup,\"ax\"\n"
  "4:    mov     %w0, %w6\n"
diff --git a/arch/arm64/kernel/kuser32.S b/arch/arm64/kernel/kuser32.S

index 63c48ffdf230125dedea62d631b3067f4d7a28e1..7787208e8cc6af3a4ff55226fb85ef6b8f8d30ba 100644 (file)
--- a/arch/arm64/kernel/kuser32.S
+++ b/arch/arm64/kernel/kuser32.S
@@ -38,12 +38,13 @@ __kuser_cmpxchg64:                  // 0xffff0f60
         .inst   0xe92d00f0              //      push            {r4, r5, r6, r7}
         .inst   0xe1c040d0              //      ldrd            r4, r5, [r0]
         .inst   0xe1c160d0              //      ldrd            r6, r7, [r1]
-       .inst   0xe1b20e9f              // 1:   ldaexd          r0, r1, [r2]
+       .inst   0xe1b20f9f              // 1:   ldrexd          r0, r1, [r2]
         .inst   0xe0303004              //      eors            r3, r0, r4
         .inst   0x00313005              //      eoreqs          r3, r1, r5
         .inst   0x01a23e96              //      stlexdeq        r3, r6, [r2]
         .inst   0x03330001              //      teqeq           r3, #1
         .inst   0x0afffff9              //      beq             1b
+       .inst   0xf57ff05b              //      dmb             ish
         .inst   0xe2730000              //      rsbs            r0, r3, #0
         .inst   0xe8bd00f0              //      pop             {r4, r5, r6, r7}
         .inst   0xe12fff1e              //      bx              lr
@@ -55,11 +56,12 @@ __kuser_memory_barrier:                     // 0xffff0fa0
  
         .align  5
  __kuser_cmpxchg:                       // 0xffff0fc0
-       .inst   0xe1923e9f              // 1:   ldaex           r3, [r2]
+       .inst   0xe1923f9f              // 1:   ldrex           r3, [r2]
         .inst   0xe0533000              //      subs            r3, r3, r0
         .inst   0x01823e91              //      stlexeq         r3, r1, [r2]
         .inst   0x03330001              //      teqeq           r3, #1
         .inst   0x0afffffa              //      beq             1b
+       .inst   0xf57ff05b              //      dmb             ish
         .inst   0xe2730000              //      rsbs            r0, r3, #0
         .inst   0xe12fff1e              //      bx              lr
  
diff --git a/arch/arm64/lib/bitops.S b/arch/arm64/lib/bitops.S

index e5db797790d3265c5418d749b7537c494ddeb250..7dac371cc9a2f8c817d895d1be0103db9a009ec9 100644 (file)
--- a/arch/arm64/lib/bitops.S
+++ b/arch/arm64/lib/bitops.S
@@ -46,11 +46,12 @@ ENTRY(      \name   )
         mov     x2, #1
         add     x1, x1, x0, lsr #3      // Get word offset
         lsl     x4, x2, x3              // Create mask
-1:     ldaxr   x2, [x1]
+1:     ldxr    x2, [x1]
         lsr     x0, x2, x3              // Save old value of bit
         \instr  x2, x2, x4              // toggle bit
         stlxr   w5, x2, [x1]
         cbnz    w5, 1b
+       dmb     ish
         and     x0, x0, #1
  3:     ret
  ENDPROC(\name  )
author	Will Deacon <will.deacon@arm.com>
	Tue, 4 Feb 2014 12:29:12 +0000 (12:29 +0000)
committer	Catalin Marinas <catalin.marinas@arm.com>
	Fri, 7 Feb 2014 16:45:43 +0000 (16:45 +0000)
arch/arm64/include/asm/atomic.h		patch \| blob \| history
arch/arm64/include/asm/cmpxchg.h		patch \| blob \| history
arch/arm64/include/asm/futex.h		patch \| blob \| history
arch/arm64/kernel/kuser32.S		patch \| blob \| history
arch/arm64/lib/bitops.S		patch \| blob \| history