riscv: atomic: Optimize dec_if_positive functions
authorGuo Ren <guoren@linux.alibaba.com>
Thu, 5 May 2022 03:55:23 +0000 (11:55 +0800)
committerPalmer Dabbelt <palmer@rivosinc.com>
Sat, 21 May 2022 17:31:46 +0000 (10:31 -0700)
Current implementation wastes another register to pass the
argument, but we only need addi to calculate the result. Optimize
the code with minimize the usage of registers.

Signed-off-by: Guo Ren <guoren@linux.alibaba.com>
Signed-off-by: Guo Ren <guoren@kernel.org>
Link: https://lore.kernel.org/r/20220505035526.2974382-3-guoren@kernel.org
Signed-off-by: Palmer Dabbelt <palmer@rivosinc.com>
arch/riscv/include/asm/atomic.h

index ac9bdf4fc4044b0b784836e40dd6b4e9aab9f294..f3c6a6eac02a58715fddafbd0688c54f8f834ad4 100644 (file)
@@ -310,47 +310,47 @@ ATOMIC_OPS()
 #undef ATOMIC_OPS
 #undef ATOMIC_OP
 
-static __always_inline int arch_atomic_sub_if_positive(atomic_t *v, int offset)
+static __always_inline int arch_atomic_dec_if_positive(atomic_t *v)
 {
        int prev, rc;
 
        __asm__ __volatile__ (
                "0:     lr.w     %[p],  %[c]\n"
-               "       sub      %[rc], %[p], %[o]\n"
+               "       addi     %[rc], %[p], -1\n"
                "       bltz     %[rc], 1f\n"
                "       sc.w.rl  %[rc], %[rc], %[c]\n"
                "       bnez     %[rc], 0b\n"
                "       fence    rw, rw\n"
                "1:\n"
                : [p]"=&r" (prev), [rc]"=&r" (rc), [c]"+A" (v->counter)
-               : [o]"r" (offset)
+               :
                : "memory");
-       return prev - offset;
+       return prev - 1;
 }
 
-#define arch_atomic_dec_if_positive(v) arch_atomic_sub_if_positive(v, 1)
+#define arch_atomic_dec_if_positive arch_atomic_dec_if_positive
 
 #ifndef CONFIG_GENERIC_ATOMIC64
-static __always_inline s64 arch_atomic64_sub_if_positive(atomic64_t *v, s64 offset)
+static __always_inline s64 arch_atomic64_dec_if_positive(atomic64_t *v)
 {
        s64 prev;
        long rc;
 
        __asm__ __volatile__ (
                "0:     lr.d     %[p],  %[c]\n"
-               "       sub      %[rc], %[p], %[o]\n"
+               "       addi      %[rc], %[p], -1\n"
                "       bltz     %[rc], 1f\n"
                "       sc.d.rl  %[rc], %[rc], %[c]\n"
                "       bnez     %[rc], 0b\n"
                "       fence    rw, rw\n"
                "1:\n"
                : [p]"=&r" (prev), [rc]"=&r" (rc), [c]"+A" (v->counter)
-               : [o]"r" (offset)
+               :
                : "memory");
-       return prev - offset;
+       return prev - 1;
 }
 
-#define arch_atomic64_dec_if_positive(v)       arch_atomic64_sub_if_positive(v, 1)
+#define arch_atomic64_dec_if_positive  arch_atomic64_dec_if_positive
 #endif
 
 #endif /* _ASM_RISCV_ATOMIC_H */