Message ID | 1588669355-38741-1-git-send-email-zhangshaokun@hisilicon.com (mailing list archive)
---|---
State | New, archived
Series | arm64: atomics: Fix the issue on xchg when switch to atomic instruction
On Tue, May 05, 2020 at 05:02:35PM +0800, Shaokun Zhang wrote:
> From: Yuqi Jin <jinyuqi@huawei.com>
>
> Since commit addfc38672c7 ("arm64: atomics: avoid out-of-line ll/sc atomics"),
> it has provided inline implementations of both LSE and ll/sc and used a static
> key to select between them, which allows the compiler to generate better
> atomics code.
> However, xchg still uses the original method which would fail to switch to
> the atomic instruction correctly, Let's fix this issue.

Please can you elaborate on the failure mode? The current code looks alright
to me, so I'm clearly missing something. What's broken?

Will
Hi Will,

On 2020/5/5 17:15, Will Deacon wrote:
> On Tue, May 05, 2020 at 05:02:35PM +0800, Shaokun Zhang wrote:
>> From: Yuqi Jin <jinyuqi@huawei.com>
>>
>> Since commit addfc38672c7 ("arm64: atomics: avoid out-of-line ll/sc atomics"),
>> it has provided inline implementations of both LSE and ll/sc and used a static
>> key to select between them, which allows the compiler to generate better
>> atomics code.
>> However, xchg still uses the original method which would fail to switch to
>> the atomic instruction correctly, Let's fix this issue.
>
> Please can you elaborate on the failure mode? The current code looks alright

When enable CONFIG_ARM64_LSE_ATOMICS, xchg is failed to switch to swp instruction
or dynamic replacement instructions are not seen.

We do some tests on the copy of xchg_tail,:
u32 xchg_tail_my(struct qspinlock *lock, u32 tail)
{
        return (u32)xchg_relaxed(&lock->tail,
                                 tail >> _Q_TAIL_OFFSET) << _Q_TAIL_OFFSET;
}
and the asm code is as follows:

ffff80001015b050 <xchg_tail_my>:
ffff80001015b050:       a9be7bfd        stp     x29, x30, [sp, #-32]!
ffff80001015b054:       910003fd        mov     x29, sp
ffff80001015b058:       a90153f3        stp     x19, x20, [sp, #16]
ffff80001015b05c:       2a0103f3        mov     w19, w1
ffff80001015b060:       aa0003f4        mov     x20, x0
ffff80001015b064:       aa1e03e0        mov     x0, x30
ffff80001015b068:       97fd07ee        bl      ffff80001009d020 <_mcount>
ffff80001015b06c:       53107e61        lsr     w1, w19, #16
ffff80001015b070:       91000a83        add     x3, x20, #0x2
ffff80001015b074:       f9800071        prfm    pstl1strm, [x3]
ffff80001015b078:       485f7c60        ldxrh   w0, [x3]
ffff80001015b07c:       48027c61        stxrh   w2, w1, [x3]
ffff80001015b080:       35ffffc2        cbnz    w2, ffff80001015b078 <xchg_tail_my+0x28>
ffff80001015b084:       53103c00        lsl     w0, w0, #16
ffff80001015b088:       a94153f3        ldp     x19, x20, [sp, #16]
ffff80001015b08c:       a8c27bfd        ldp     x29, x30, [sp], #32
ffff80001015b090:       d65f03c0        ret

> to me, so I'm clearly missing something. What's broken?
>

I'm not sure whether the ARM64_LSE_ATOMIC_INSN could works correctly after the
commit addfc38672c7. If we implement xchg using __lse_ll_sc_body like cmpxchg_case,
xchg works ok.

What's more, I am wondering why xchg still uses the dynamic replacement mode,
but cmpxchg uses another mode. ;-)

Thanks,
Shaokun

> Will
>
> .
>
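For readers following the thread: the __lse_ll_sc_body() helper mentioned above is the static-key dispatch that commit addfc38672c7 added in arch/arm64/include/asm/lse.h. The sketch below is a paraphrase of how that selection works in kernels of that era, written out for context only; it is not code quoted from this thread and the exact form may differ from any particular tree.

/* Paraphrased sketch of the static-key dispatch (assumed, not verbatim). */
extern struct static_key_false arm64_const_caps_ready;
extern struct static_key_false cpu_hwcap_keys[ARM64_NCAPS];

static inline bool system_uses_lse_atomics(void)
{
	return static_branch_likely(&arm64_const_caps_ready) &&
	       static_branch_likely(&cpu_hwcap_keys[ARM64_HAS_LSE_ATOMICS]);
}

/*
 * Each atomic op has an __lse_*() and an __ll_sc_*() inline implementation;
 * the condition below collapses to a static branch once the CPU capabilities
 * have been finalised.
 */
#define __lse_ll_sc_body(op, ...)					\
({									\
	system_uses_lse_atomics() ?					\
		__lse_##op(__VA_ARGS__) :				\
		__ll_sc_##op(__VA_ARGS__);				\
})

This is why the cmpxchg_case family needs no instruction patching: the compiler emits both implementations and the static branch selects one at run time.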
On Wed, May 06, 2020 at 03:00:39PM +0800, Shaokun Zhang wrote:
> On 2020/5/5 17:15, Will Deacon wrote:
> > On Tue, May 05, 2020 at 05:02:35PM +0800, Shaokun Zhang wrote:
> >> From: Yuqi Jin <jinyuqi@huawei.com>
> >>
> >> Since commit addfc38672c7 ("arm64: atomics: avoid out-of-line ll/sc atomics"),
> >> it has provided inline implementations of both LSE and ll/sc and used a static
> >> key to select between them, which allows the compiler to generate better
> >> atomics code.
> >> However, xchg still uses the original method which would fail to switch to
> >> the atomic instruction correctly, Let's fix this issue.
> >
> > Please can you elaborate on the failure mode? The current code looks alright
>
> When enable CONFIG_ARM64_LSE_ATOMICS, xchg is failed to switch to swp instruction
> or dynamic replacement instructions are not seen.
>
> We do some tests on the copy of xchg_tail,:
> u32 xchg_tail_my(struct qspinlock *lock, u32 tail)
> {
>         return (u32)xchg_relaxed(&lock->tail,
>                                  tail >> _Q_TAIL_OFFSET) << _Q_TAIL_OFFSET;
> }
> and the asm code is as follows:
>
> ffff80001015b050 <xchg_tail_my>:
> ffff80001015b050:       a9be7bfd        stp     x29, x30, [sp, #-32]!
> ffff80001015b054:       910003fd        mov     x29, sp
> ffff80001015b058:       a90153f3        stp     x19, x20, [sp, #16]
> ffff80001015b05c:       2a0103f3        mov     w19, w1
> ffff80001015b060:       aa0003f4        mov     x20, x0
> ffff80001015b064:       aa1e03e0        mov     x0, x30
> ffff80001015b068:       97fd07ee        bl      ffff80001009d020 <_mcount>
> ffff80001015b06c:       53107e61        lsr     w1, w19, #16
> ffff80001015b070:       91000a83        add     x3, x20, #0x2
> ffff80001015b074:       f9800071        prfm    pstl1strm, [x3]
> ffff80001015b078:       485f7c60        ldxrh   w0, [x3]
> ffff80001015b07c:       48027c61        stxrh   w2, w1, [x3]
> ffff80001015b080:       35ffffc2        cbnz    w2, ffff80001015b078 <xchg_tail_my+0x28>
> ffff80001015b084:       53103c00        lsl     w0, w0, #16
> ffff80001015b088:       a94153f3        ldp     x19, x20, [sp, #16]
> ffff80001015b08c:       a8c27bfd        ldp     x29, x30, [sp], #32
> ffff80001015b090:       d65f03c0        ret

This should get patched at runtime, but you're saying that's not happening?

> > to me, so I'm clearly missing something. What's broken?
> >
>
> I'm not sure whether the ARM64_LSE_ATOMIC_INSN could works correctly after the
> commit addfc38672c7. If we implement xchg using __lse_ll_sc_body like cmpxchg_case,
> xchg works ok.
>
> What's more, I am wondering why xchg still uses the dynamic replacement mode,
> but cmpxchg uses another mode. ;-)

There's a trade-off involving the number of clobbered registers and the
number of instructions, which made a bit more sense when we used to branch
out-of-line. We also do the direct patching for the pcpu atomics.

Will
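The runtime patching referred to here is the arm64 alternatives mechanism: the object code always contains the LL/SC sequence (which is what the objdump output above shows), and the boot-time alternatives pass rewrites it in place on CPUs that implement LSE. The pre-__lse_ll_sc_body xchg path reaches it through ARM64_LSE_ATOMIC_INSN; the following is a rough paraphrase of that wrapper from arch/arm64/include/asm/lse.h of the same era, not code from this thread:

/*
 * Paraphrased sketch (assumed, not verbatim).  ALTERNATIVE() records both
 * sequences; at boot the kernel overwrites the first with the second when
 * the ARM64_HAS_LSE_ATOMICS capability is present, so a static disassembly
 * of the object file alone cannot show the swp instruction.
 */
#define ARM64_LSE_ATOMIC_INSN(llsc, lse)				\
	ALTERNATIVE(llsc, __LSE_PREAMBLE lse, ARM64_HAS_LSE_ATOMICS)

Because the two alternatives need to occupy the same amount of space, the LSE side of the old __XCHG_CASE (visible in the removed hunk of the patch at the bottom of this page) pads its single swp with __nops(3); that padding is what the later messages in the thread come back to.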
Hi Will, Apologies for my noise, you are right and it's my mistake. On 2020/5/6 15:53, Will Deacon wrote: > On Wed, May 06, 2020 at 03:00:39PM +0800, Shaokun Zhang wrote: >> On 2020/5/5 17:15, Will Deacon wrote: >>> On Tue, May 05, 2020 at 05:02:35PM +0800, Shaokun Zhang wrote: >>>> From: Yuqi Jin <jinyuqi@huawei.com> >>>> >>>> Since commit addfc38672c7 ("arm64: atomics: avoid out-of-line ll/sc atomics"), >>>> it has provided inline implementations of both LSE and ll/sc and used a static >>>> key to select between them, which allows the compiler to generate better >>>> atomics code. >>>> However, xchg still uses the original method which would fail to switch to >>>> the atomic instruction correctly, Let's fix this issue. >>> >>> Please can you elaborate on the failure mode? The current code looks alright >> >> When enable CONFIG_ARM64_LSE_ATOMICS, xchg is failed to switch to swp instruction >> or dynamic replacement instructions are not seen. >> >> We do some tests on the copy of xchg_tail,: >> u32 xchg_tail_my(struct qspinlock *lock, u32 tail) >> { >> return (u32)xchg_relaxed(&lock->tail, >> tail >> _Q_TAIL_OFFSET) << _Q_TAIL_OFFSET; >> } >> and the asm code is as follows: >> >> ffff80001015b050 <xchg_tail_my>: >> ffff80001015b050: a9be7bfd stp x29, x30, [sp, #-32]! >> ffff80001015b054: 910003fd mov x29, sp >> ffff80001015b058: a90153f3 stp x19, x20, [sp, #16] >> ffff80001015b05c: 2a0103f3 mov w19, w1 >> ffff80001015b060: aa0003f4 mov x20, x0 >> ffff80001015b064: aa1e03e0 mov x0, x30 >> ffff80001015b068: 97fd07ee bl ffff80001009d020 <_mcount> >> ffff80001015b06c: 53107e61 lsr w1, w19, #16 >> ffff80001015b070: 91000a83 add x3, x20, #0x2 >> ffff80001015b074: f9800071 prfm pstl1strm, [x3] >> ffff80001015b078: 485f7c60 ldxrh w0, [x3] >> ffff80001015b07c: 48027c61 stxrh w2, w1, [x3] >> ffff80001015b080: 35ffffc2 cbnz w2, ffff80001015b078 <xchg_tail_my+0x28> >> ffff80001015b084: 53103c00 lsl w0, w0, #16 >> ffff80001015b088: a94153f3 ldp x19, x20, [sp, #16] >> ffff80001015b08c: a8c27bfd ldp x29, x30, [sp], #32 >> ffff80001015b090: d65f03c0 ret > > This should get patched at runtime, but you're saying that's not happening? > My mistake, I didn't check the runtime carefully. >>> to me, so I'm clearly missing something. What's broken? >>> >> >> I'm not sure whether the ARM64_LSE_ATOMIC_INSN could works correctly after the >> commit addfc38672c7. If we implement xchg using __lse_ll_sc_body like cmpxchg_case, >> xchg works ok. >> >> What's more, I am wondering why xchg still uses the dynamic replacement mode, >> but cmpxchg uses another mode. ;-) > > There's a trade-off involving the number of clobbered registers and the > number of instructions, which made a bit more sense when we used to branch > out-of-line. We also do the direct patching for the pcpu atomics. > Thanks your explanation, got it and I did check pcpu atomics before. Thanks, Shaokun > Will > > . >
On Wed, May 06, 2020 at 06:39:16PM +0800, Shaokun Zhang wrote: > Apologies for my noise, you are right and it's my mistake. No need to apologise, but thanks for letting me know. > On 2020/5/6 15:53, Will Deacon wrote: > > On Wed, May 06, 2020 at 03:00:39PM +0800, Shaokun Zhang wrote: > >> On 2020/5/5 17:15, Will Deacon wrote: > >>> On Tue, May 05, 2020 at 05:02:35PM +0800, Shaokun Zhang wrote: > >>>> From: Yuqi Jin <jinyuqi@huawei.com> > >>>> > >>>> Since commit addfc38672c7 ("arm64: atomics: avoid out-of-line ll/sc atomics"), > >>>> it has provided inline implementations of both LSE and ll/sc and used a static > >>>> key to select between them, which allows the compiler to generate better > >>>> atomics code. > >>>> However, xchg still uses the original method which would fail to switch to > >>>> the atomic instruction correctly, Let's fix this issue. > >>> > >>> Please can you elaborate on the failure mode? The current code looks alright > >> > >> When enable CONFIG_ARM64_LSE_ATOMICS, xchg is failed to switch to swp instruction > >> or dynamic replacement instructions are not seen. > >> > >> We do some tests on the copy of xchg_tail,: > >> u32 xchg_tail_my(struct qspinlock *lock, u32 tail) > >> { > >> return (u32)xchg_relaxed(&lock->tail, > >> tail >> _Q_TAIL_OFFSET) << _Q_TAIL_OFFSET; > >> } > >> and the asm code is as follows: > >> > >> ffff80001015b050 <xchg_tail_my>: > >> ffff80001015b050: a9be7bfd stp x29, x30, [sp, #-32]! > >> ffff80001015b054: 910003fd mov x29, sp > >> ffff80001015b058: a90153f3 stp x19, x20, [sp, #16] > >> ffff80001015b05c: 2a0103f3 mov w19, w1 > >> ffff80001015b060: aa0003f4 mov x20, x0 > >> ffff80001015b064: aa1e03e0 mov x0, x30 > >> ffff80001015b068: 97fd07ee bl ffff80001009d020 <_mcount> > >> ffff80001015b06c: 53107e61 lsr w1, w19, #16 > >> ffff80001015b070: 91000a83 add x3, x20, #0x2 > >> ffff80001015b074: f9800071 prfm pstl1strm, [x3] > >> ffff80001015b078: 485f7c60 ldxrh w0, [x3] > >> ffff80001015b07c: 48027c61 stxrh w2, w1, [x3] > >> ffff80001015b080: 35ffffc2 cbnz w2, ffff80001015b078 <xchg_tail_my+0x28> > >> ffff80001015b084: 53103c00 lsl w0, w0, #16 > >> ffff80001015b088: a94153f3 ldp x19, x20, [sp, #16] > >> ffff80001015b08c: a8c27bfd ldp x29, x30, [sp], #32 > >> ffff80001015b090: d65f03c0 ret > > > > This should get patched at runtime, but you're saying that's not happening? > > > > My mistake, I didn't check the runtime carefully. Good to hear there's not a bug, but if you see a performance benefit from using the static-key for xchg() then I'd obviously be open to changing it over as well. Thanks, Will
Hi Will, On 2020/5/6 18:44, Will Deacon wrote: > On Wed, May 06, 2020 at 06:39:16PM +0800, Shaokun Zhang wrote: >> Apologies for my noise, you are right and it's my mistake. > > No need to apologise, but thanks for letting me know. > >> On 2020/5/6 15:53, Will Deacon wrote: >>> On Wed, May 06, 2020 at 03:00:39PM +0800, Shaokun Zhang wrote: >>>> On 2020/5/5 17:15, Will Deacon wrote: >>>>> On Tue, May 05, 2020 at 05:02:35PM +0800, Shaokun Zhang wrote: >>>>>> From: Yuqi Jin <jinyuqi@huawei.com> >>>>>> >>>>>> Since commit addfc38672c7 ("arm64: atomics: avoid out-of-line ll/sc atomics"), >>>>>> it has provided inline implementations of both LSE and ll/sc and used a static >>>>>> key to select between them, which allows the compiler to generate better >>>>>> atomics code. >>>>>> However, xchg still uses the original method which would fail to switch to >>>>>> the atomic instruction correctly, Let's fix this issue. >>>>> >>>>> Please can you elaborate on the failure mode? The current code looks alright >>>> >>>> When enable CONFIG_ARM64_LSE_ATOMICS, xchg is failed to switch to swp instruction >>>> or dynamic replacement instructions are not seen. >>>> >>>> We do some tests on the copy of xchg_tail,: >>>> u32 xchg_tail_my(struct qspinlock *lock, u32 tail) >>>> { >>>> return (u32)xchg_relaxed(&lock->tail, >>>> tail >> _Q_TAIL_OFFSET) << _Q_TAIL_OFFSET; >>>> } >>>> and the asm code is as follows: >>>> >>>> ffff80001015b050 <xchg_tail_my>: >>>> ffff80001015b050: a9be7bfd stp x29, x30, [sp, #-32]! >>>> ffff80001015b054: 910003fd mov x29, sp >>>> ffff80001015b058: a90153f3 stp x19, x20, [sp, #16] >>>> ffff80001015b05c: 2a0103f3 mov w19, w1 >>>> ffff80001015b060: aa0003f4 mov x20, x0 >>>> ffff80001015b064: aa1e03e0 mov x0, x30 >>>> ffff80001015b068: 97fd07ee bl ffff80001009d020 <_mcount> >>>> ffff80001015b06c: 53107e61 lsr w1, w19, #16 >>>> ffff80001015b070: 91000a83 add x3, x20, #0x2 >>>> ffff80001015b074: f9800071 prfm pstl1strm, [x3] >>>> ffff80001015b078: 485f7c60 ldxrh w0, [x3] >>>> ffff80001015b07c: 48027c61 stxrh w2, w1, [x3] >>>> ffff80001015b080: 35ffffc2 cbnz w2, ffff80001015b078 <xchg_tail_my+0x28> >>>> ffff80001015b084: 53103c00 lsl w0, w0, #16 >>>> ffff80001015b088: a94153f3 ldp x19, x20, [sp, #16] >>>> ffff80001015b08c: a8c27bfd ldp x29, x30, [sp], #32 >>>> ffff80001015b090: d65f03c0 ret >>> >>> This should get patched at runtime, but you're saying that's not happening? >>> >> >> My mistake, I didn't check the runtime carefully. > > Good to hear there's not a bug, but if you see a performance benefit from > using the static-key for xchg() then I'd obviously be open to changing it Thanks your reply, if I follow the two methods correctly, static-key will not consume '__nops(3)', others are the same. I will run some tests to check the performance ;-) Thanks, Shaokun > over as well. > > Thanks, > > Will > > . >
Hi Will,

On 2020/5/6 19:30, Shaokun Zhang wrote:
> Hi Will,
>
> On 2020/5/6 18:44, Will Deacon wrote:
>> On Wed, May 06, 2020 at 06:39:16PM +0800, Shaokun Zhang wrote:
>>> Apologies for my noise, you are right and it's my mistake.
>>
>> No need to apologise, but thanks for letting me know.
>>
>>> On 2020/5/6 15:53, Will Deacon wrote:
>>>> On Wed, May 06, 2020 at 03:00:39PM +0800, Shaokun Zhang wrote:
>>>>> On 2020/5/5 17:15, Will Deacon wrote:
>>>>>> On Tue, May 05, 2020 at 05:02:35PM +0800, Shaokun Zhang wrote:
>>>>>>> From: Yuqi Jin <jinyuqi@huawei.com>
>>>>>>>
>>>>>>> Since commit addfc38672c7 ("arm64: atomics: avoid out-of-line ll/sc atomics"),
>>>>>>> it has provided inline implementations of both LSE and ll/sc and used a static
>>>>>>> key to select between them, which allows the compiler to generate better
>>>>>>> atomics code.
>>>>>>> However, xchg still uses the original method which would fail to switch to
>>>>>>> the atomic instruction correctly, Let's fix this issue.
>>>>>>
>>>>>> Please can you elaborate on the failure mode? The current code looks alright
>>>>>
>>>>> When enable CONFIG_ARM64_LSE_ATOMICS, xchg is failed to switch to swp instruction
>>>>> or dynamic replacement instructions are not seen.
>>>>>
>>>>> We do some tests on the copy of xchg_tail,:
>>>>> u32 xchg_tail_my(struct qspinlock *lock, u32 tail)
>>>>> {
>>>>>         return (u32)xchg_relaxed(&lock->tail,
>>>>>                                  tail >> _Q_TAIL_OFFSET) << _Q_TAIL_OFFSET;
>>>>> }
>>>>> and the asm code is as follows:
>>>>>
>>>>> ffff80001015b050 <xchg_tail_my>:
>>>>> ffff80001015b050:       a9be7bfd        stp     x29, x30, [sp, #-32]!
>>>>> ffff80001015b054:       910003fd        mov     x29, sp
>>>>> ffff80001015b058:       a90153f3        stp     x19, x20, [sp, #16]
>>>>> ffff80001015b05c:       2a0103f3        mov     w19, w1
>>>>> ffff80001015b060:       aa0003f4        mov     x20, x0
>>>>> ffff80001015b064:       aa1e03e0        mov     x0, x30
>>>>> ffff80001015b068:       97fd07ee        bl      ffff80001009d020 <_mcount>
>>>>> ffff80001015b06c:       53107e61        lsr     w1, w19, #16
>>>>> ffff80001015b070:       91000a83        add     x3, x20, #0x2
>>>>> ffff80001015b074:       f9800071        prfm    pstl1strm, [x3]
>>>>> ffff80001015b078:       485f7c60        ldxrh   w0, [x3]
>>>>> ffff80001015b07c:       48027c61        stxrh   w2, w1, [x3]
>>>>> ffff80001015b080:       35ffffc2        cbnz    w2, ffff80001015b078 <xchg_tail_my+0x28>
>>>>> ffff80001015b084:       53103c00        lsl     w0, w0, #16
>>>>> ffff80001015b088:       a94153f3        ldp     x19, x20, [sp, #16]
>>>>> ffff80001015b08c:       a8c27bfd        ldp     x29, x30, [sp], #32
>>>>> ffff80001015b090:       d65f03c0        ret
>>>>
>>>> This should get patched at runtime, but you're saying that's not happening?
>>>>
>>>
>>> My mistake, I didn't check the runtime carefully.
>>
>> Good to hear there's not a bug, but if you see a performance benefit from
>> using the static-key for xchg() then I'd obviously be open to changing it
>
> Thanks your reply, if I follow the two methods correctly, static-key will
> not consume '__nops(3)', others are the same.
>
> I will run some tests to check the performance ;-)
>

We compare the two methods on Huawei Kunpeng920 and the throughput per second
as follows:

one core  |without delay| 200ns delay|
--------------------------------------
static-key|  55294942   |  3937156   |
--------------------------------------
runtime   |  54706282   |  3918188   |
--------------------------------------

If we run this test using 32-cores, the result is almost the same.

Test code is followed:
	if(delay_o) {
		while (get_cycles() <= (time_temp + t_cnt)) {
			(void)atomic64_xchg(&wk_in->num, 1);
			myndelay(delay_o);
			(void)atomic64_xchg(&wk_in->num, 2);
			myndelay(delay_o);
			w_cnt+=2;
		}
	} else {
		while (get_cycles() <= (time_temp + t_cnt)){
			(void)atomic64_xchg(&wk_in->num, 1);
			(void)atomic64_xchg(&wk_in->num, 2);
			w_cnt+=2;
		}
	}

Thanks,
Shaokun

> Thanks,
> Shaokun
>
>
>> over as well.
>>
>> Thanks,
>>
>> Will
>>
>> .
>>
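The fragment above depends on symbols that are not shown in the thread (wk_in, time_temp, t_cnt, w_cnt and myndelay()). A self-contained sketch of the same measurement loop, using hypothetical names for those pieces and standard kernel helpers, could look like this:

#include <linux/atomic.h>
#include <linux/delay.h>
#include <linux/timex.h>
#include <linux/types.h>

/*
 * Hypothetical helper: run the same xchg ping-pong as the test above for
 * 'duration' cycles and return the number of exchanges performed.
 * 'delay_ns' corresponds to the 200ns column in the table; 0 means no delay.
 */
static u64 xchg_throughput(atomic64_t *v, cycles_t duration, unsigned int delay_ns)
{
	cycles_t start = get_cycles();
	u64 count = 0;

	while (get_cycles() <= start + duration) {
		(void)atomic64_xchg(v, 1);
		if (delay_ns)
			ndelay(delay_ns);
		(void)atomic64_xchg(v, 2);
		if (delay_ns)
			ndelay(delay_ns);
		count += 2;
	}
	return count;
}

Going by the numbers in the table, the static-key variant comes out roughly 1% ahead of the runtime-patched one in the no-delay case on this machine.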
Hi Will, On 2020/5/7 15:54, Shaokun Zhang wrote: > Hi Will, > > On 2020/5/6 19:30, Shaokun Zhang wrote: >> Hi Will, >> >> On 2020/5/6 18:44, Will Deacon wrote: >>> On Wed, May 06, 2020 at 06:39:16PM +0800, Shaokun Zhang wrote: >>>> Apologies for my noise, you are right and it's my mistake. >>> >>> No need to apologise, but thanks for letting me know. >>> >>>> On 2020/5/6 15:53, Will Deacon wrote: >>>>> On Wed, May 06, 2020 at 03:00:39PM +0800, Shaokun Zhang wrote: >>>>>> On 2020/5/5 17:15, Will Deacon wrote: >>>>>>> On Tue, May 05, 2020 at 05:02:35PM +0800, Shaokun Zhang wrote: >>>>>>>> From: Yuqi Jin <jinyuqi@huawei.com> >>>>>>>> >>>>>>>> Since commit addfc38672c7 ("arm64: atomics: avoid out-of-line ll/sc atomics"), >>>>>>>> it has provided inline implementations of both LSE and ll/sc and used a static >>>>>>>> key to select between them, which allows the compiler to generate better >>>>>>>> atomics code. >>>>>>>> However, xchg still uses the original method which would fail to switch to >>>>>>>> the atomic instruction correctly, Let's fix this issue. >>>>>>> >>>>>>> Please can you elaborate on the failure mode? The current code looks alright >>>>>> >>>>>> When enable CONFIG_ARM64_LSE_ATOMICS, xchg is failed to switch to swp instruction >>>>>> or dynamic replacement instructions are not seen. >>>>>> >>>>>> We do some tests on the copy of xchg_tail,: >>>>>> u32 xchg_tail_my(struct qspinlock *lock, u32 tail) >>>>>> { >>>>>> return (u32)xchg_relaxed(&lock->tail, >>>>>> tail >> _Q_TAIL_OFFSET) << _Q_TAIL_OFFSET; >>>>>> } >>>>>> and the asm code is as follows: >>>>>> >>>>>> ffff80001015b050 <xchg_tail_my>: >>>>>> ffff80001015b050: a9be7bfd stp x29, x30, [sp, #-32]! >>>>>> ffff80001015b054: 910003fd mov x29, sp >>>>>> ffff80001015b058: a90153f3 stp x19, x20, [sp, #16] >>>>>> ffff80001015b05c: 2a0103f3 mov w19, w1 >>>>>> ffff80001015b060: aa0003f4 mov x20, x0 >>>>>> ffff80001015b064: aa1e03e0 mov x0, x30 >>>>>> ffff80001015b068: 97fd07ee bl ffff80001009d020 <_mcount> >>>>>> ffff80001015b06c: 53107e61 lsr w1, w19, #16 >>>>>> ffff80001015b070: 91000a83 add x3, x20, #0x2 >>>>>> ffff80001015b074: f9800071 prfm pstl1strm, [x3] >>>>>> ffff80001015b078: 485f7c60 ldxrh w0, [x3] >>>>>> ffff80001015b07c: 48027c61 stxrh w2, w1, [x3] >>>>>> ffff80001015b080: 35ffffc2 cbnz w2, ffff80001015b078 <xchg_tail_my+0x28> >>>>>> ffff80001015b084: 53103c00 lsl w0, w0, #16 >>>>>> ffff80001015b088: a94153f3 ldp x19, x20, [sp, #16] >>>>>> ffff80001015b08c: a8c27bfd ldp x29, x30, [sp], #32 >>>>>> ffff80001015b090: d65f03c0 ret >>>>> >>>>> This should get patched at runtime, but you're saying that's not happening? >>>>> >>>> >>>> My mistake, I didn't check the runtime carefully. >>> >>> Good to hear there's not a bug, but if you see a performance benefit from >>> using the static-key for xchg() then I'd obviously be open to changing it >> >> Thanks your reply, if I follow the two methods correctly, static-key will >> not consume '__nops(3)', others are the same. >> >> I will run some tests to check the performance ;-) >> > > We compare the two methods on Huawei Kunpeng920 and the throughput per second > as follows: > > one core |without delay| 200ns delay| > -------------------------------------- > static-key| 55294942 | 3937156 | > -------------------------------------- > runtime | 54706282 | 3918188 | > -------------------------------------- > Are you happy to pick up this patch since it has some benefits for single core? ;-) Thanks, Shaokun > If we run this test using 32-cores, the result is almost the same. 
> Test code is followed: > if(delay_o) { > while (get_cycles() <= (time_temp + t_cnt)) { > (void)atomic64_xchg(&wk_in->num, 1); > myndelay(delay_o); > (void)atomic64_xchg(&wk_in->num, 2); > myndelay(delay_o); > w_cnt+=2; > } > } else { > while (get_cycles() <= (time_temp + t_cnt)){ > (void)atomic64_xchg(&wk_in->num, 1); > (void)atomic64_xchg(&wk_in->num, 2); > w_cnt+=2; > } > } > > Thanks, > Shaokun > >> Thanks, >> Shaokun >> >> >>> over as well. >>> >>> Thanks, >>> >>> Will >>> >>> . >>>
On Mon, May 25, 2020 at 05:27:30PM +0800, Shaokun Zhang wrote:
> On 2020/5/7 15:54, Shaokun Zhang wrote:
> > On 2020/5/6 19:30, Shaokun Zhang wrote:
> >> On 2020/5/6 18:44, Will Deacon wrote:
> >>> Good to hear there's not a bug, but if you see a performance benefit from
> >>> using the static-key for xchg() then I'd obviously be open to changing it
> >>
> >> Thanks your reply, if I follow the two methods correctly, static-key will
> >> not consume '__nops(3)', others are the same.
> >>
> >> I will run some tests to check the performance ;-)
> >>
> >
> > We compare the two methods on Huawei Kunpeng920 and the throughput per second
> > as follows:
> >
> > one core  |without delay| 200ns delay|
> > --------------------------------------
> > static-key|  55294942   |  3937156   |
> > --------------------------------------
> > runtime   |  54706282   |  3918188   |
> > --------------------------------------
> >
> Are you happy to pick up this patch since it has some benefits for single core? ;-)

Is it really worth it? I don't think so.

Will
diff --git a/arch/arm64/include/asm/atomic_ll_sc.h b/arch/arm64/include/asm/atomic_ll_sc.h
index 13869b76b58c..73fcb71ccb91 100644
--- a/arch/arm64/include/asm/atomic_ll_sc.h
+++ b/arch/arm64/include/asm/atomic_ll_sc.h
@@ -348,6 +348,47 @@ __CMPXCHG_DBL( , , , )
 __CMPXCHG_DBL(_mb, dmb ish, l, "memory")
 
 #undef __CMPXCHG_DBL
+
+#define __XCHG_CASE(w, sfx, name, sz, mb, nop_lse, acq, acq_lse, rel, cl)	\
+static inline u##sz __ll_sc__xchg_case_##name##sz(u##sz x, volatile void *ptr)	\
+{									\
+	u##sz ret;							\
+	unsigned long tmp;						\
+									\
+	asm volatile(							\
+	__LL_SC_FALLBACK(						\
+	"	prfm	pstl1strm, %2\n"				\
+	"1:	ld" #acq "xr" #sfx "\t%" #w "0, %2\n"			\
+	"	st" #rel "xr" #sfx "\t%w1, %" #w "3, %2\n"		\
+	"	cbnz	%w1, 1b\n"					\
+	"	" #mb "\n"						\
+	"2:")								\
+	: "=&r" (ret), "=&r" (tmp), "+Q" (*(u##sz *)ptr)		\
+	: "r" (x)							\
+	: cl);								\
+									\
+	return ret;							\
+}
+
+__XCHG_CASE(w, b,     ,  8,        ,    ,  ,  ,  ,         )
+__XCHG_CASE(w, h,     , 16,        ,    ,  ,  ,  ,         )
+__XCHG_CASE(w,  ,     , 32,        ,    ,  ,  ,  ,         )
+__XCHG_CASE( ,  ,     , 64,        ,    ,  ,  ,  ,         )
+__XCHG_CASE(w, b, acq_,  8,        ,    , a, a,  , "memory")
+__XCHG_CASE(w, h, acq_, 16,        ,    , a, a,  , "memory")
+__XCHG_CASE(w,  , acq_, 32,        ,    , a, a,  , "memory")
+__XCHG_CASE( ,  , acq_, 64,        ,    , a, a,  , "memory")
+__XCHG_CASE(w, b, rel_,  8,        ,    ,  ,  , l, "memory")
+__XCHG_CASE(w, h, rel_, 16,        ,    ,  ,  , l, "memory")
+__XCHG_CASE(w,  , rel_, 32,        ,    ,  ,  , l, "memory")
+__XCHG_CASE( ,  , rel_, 64,        ,    ,  ,  , l, "memory")
+__XCHG_CASE(w, b,  mb_,  8, dmb ish, nop,  , a, l, "memory")
+__XCHG_CASE(w, h,  mb_, 16, dmb ish, nop,  , a, l, "memory")
+__XCHG_CASE(w,  ,  mb_, 32, dmb ish, nop,  , a, l, "memory")
+__XCHG_CASE( ,  ,  mb_, 64, dmb ish, nop,  , a, l, "memory")
+
+#undef __XCHG_CASE
+
 #undef K
 
 #endif	/* __ASM_ATOMIC_LL_SC_H */
diff --git a/arch/arm64/include/asm/atomic_lse.h b/arch/arm64/include/asm/atomic_lse.h
index da3280f639cd..ddb2c212faa3 100644
--- a/arch/arm64/include/asm/atomic_lse.h
+++ b/arch/arm64/include/asm/atomic_lse.h
@@ -416,4 +416,39 @@ __CMPXCHG_DBL(_mb, al, "memory")
 
 #undef __CMPXCHG_DBL
 
+#define __XCHG_CASE(w, sfx, name, sz, mb, nop_lse, acq, acq_lse, rel, cl)	\
+static __always_inline u##sz __lse__xchg_case_##name##sz(u##sz x, volatile void *ptr)	\
+{									\
+	u##sz ret;							\
+	unsigned long tmp;						\
+									\
+	asm volatile(							\
+	__LSE_PREAMBLE							\
+	"	swp" #acq_lse #rel #sfx "\t%" #w "3, %" #w "0, %2\n"	\
+	: "=&r" (ret), "=&r" (tmp), "+Q" (*(u##sz *)ptr)		\
+	: "r" (x)							\
+	: cl);								\
+									\
+	return ret;							\
+}
+
+__XCHG_CASE(w, b,     ,  8,        ,    ,  ,  ,  ,         )
+__XCHG_CASE(w, h,     , 16,        ,    ,  ,  ,  ,         )
+__XCHG_CASE(w,  ,     , 32,        ,    ,  ,  ,  ,         )
+__XCHG_CASE( ,  ,     , 64,        ,    ,  ,  ,  ,         )
+__XCHG_CASE(w, b, acq_,  8,        ,    , a, a,  , "memory")
+__XCHG_CASE(w, h, acq_, 16,        ,    , a, a,  , "memory")
+__XCHG_CASE(w,  , acq_, 32,        ,    , a, a,  , "memory")
+__XCHG_CASE( ,  , acq_, 64,        ,    , a, a,  , "memory")
+__XCHG_CASE(w, b, rel_,  8,        ,    ,  ,  , l, "memory")
+__XCHG_CASE(w, h, rel_, 16,        ,    ,  ,  , l, "memory")
+__XCHG_CASE(w,  , rel_, 32,        ,    ,  ,  , l, "memory")
+__XCHG_CASE( ,  , rel_, 64,        ,    ,  ,  , l, "memory")
+__XCHG_CASE(w, b,  mb_,  8, dmb ish, nop,  , a, l, "memory")
+__XCHG_CASE(w, h,  mb_, 16, dmb ish, nop,  , a, l, "memory")
+__XCHG_CASE(w,  ,  mb_, 32, dmb ish, nop,  , a, l, "memory")
+__XCHG_CASE( ,  ,  mb_, 64, dmb ish, nop,  , a, l, "memory")
+
+#undef __XCHG_CASE
+
 #endif	/* __ASM_ATOMIC_LSE_H */
diff --git a/arch/arm64/include/asm/cmpxchg.h b/arch/arm64/include/asm/cmpxchg.h
index f9bef42c1411..084028518417 100644
--- a/arch/arm64/include/asm/cmpxchg.h
+++ b/arch/arm64/include/asm/cmpxchg.h
@@ -13,73 +13,25 @@
 #include <asm/barrier.h>
 #include <asm/lse.h>
 
-/*
- * We need separate acquire parameters for ll/sc and lse, since the full
- * barrier case is generated as release+dmb for the former and
- * acquire+release for the latter.
- */
-#define __XCHG_CASE(w, sfx, name, sz, mb, nop_lse, acq, acq_lse, rel, cl)	\
-static inline u##sz __xchg_case_##name##sz(u##sz x, volatile void *ptr)	\
-{									\
-	u##sz ret;							\
-	unsigned long tmp;						\
-									\
-	asm volatile(ARM64_LSE_ATOMIC_INSN(				\
-	/* LL/SC */							\
-	"	prfm	pstl1strm, %2\n"				\
-	"1:	ld" #acq "xr" #sfx "\t%" #w "0, %2\n"			\
-	"	st" #rel "xr" #sfx "\t%w1, %" #w "3, %2\n"		\
-	"	cbnz	%w1, 1b\n"					\
-	"	" #mb,							\
-	/* LSE atomics */						\
-	"	swp" #acq_lse #rel #sfx "\t%" #w "3, %" #w "0, %2\n"	\
-		__nops(3)						\
-	"	" #nop_lse)						\
-	: "=&r" (ret), "=&r" (tmp), "+Q" (*(u##sz *)ptr)		\
-	: "r" (x)							\
-	: cl);								\
-									\
-	return ret;							\
-}
-
-__XCHG_CASE(w, b,     ,  8,        ,    ,  ,  ,  ,         )
-__XCHG_CASE(w, h,     , 16,        ,    ,  ,  ,  ,         )
-__XCHG_CASE(w,  ,     , 32,        ,    ,  ,  ,  ,         )
-__XCHG_CASE( ,  ,     , 64,        ,    ,  ,  ,  ,         )
-__XCHG_CASE(w, b, acq_,  8,        ,    , a, a,  , "memory")
-__XCHG_CASE(w, h, acq_, 16,        ,    , a, a,  , "memory")
-__XCHG_CASE(w,  , acq_, 32,        ,    , a, a,  , "memory")
-__XCHG_CASE( ,  , acq_, 64,        ,    , a, a,  , "memory")
-__XCHG_CASE(w, b, rel_,  8,        ,    ,  ,  , l, "memory")
-__XCHG_CASE(w, h, rel_, 16,        ,    ,  ,  , l, "memory")
-__XCHG_CASE(w,  , rel_, 32,        ,    ,  ,  , l, "memory")
-__XCHG_CASE( ,  , rel_, 64,        ,    ,  ,  , l, "memory")
-__XCHG_CASE(w, b,  mb_,  8, dmb ish, nop,  , a, l, "memory")
-__XCHG_CASE(w, h,  mb_, 16, dmb ish, nop,  , a, l, "memory")
-__XCHG_CASE(w,  ,  mb_, 32, dmb ish, nop,  , a, l, "memory")
-__XCHG_CASE( ,  ,  mb_, 64, dmb ish, nop,  , a, l, "memory")
-
-#undef __XCHG_CASE
-
 #define __XCHG_GEN(sfx)							\
-static __always_inline unsigned long __xchg##sfx(unsigned long x,	\
-					volatile void *ptr,		\
-					int size)			\
-{									\
-	switch (size) {							\
-	case 1:								\
-		return __xchg_case##sfx##_8(x, ptr);			\
-	case 2:								\
-		return __xchg_case##sfx##_16(x, ptr);			\
-	case 4:								\
-		return __xchg_case##sfx##_32(x, ptr);			\
-	case 8:								\
-		return __xchg_case##sfx##_64(x, ptr);			\
-	default:							\
-		BUILD_BUG();						\
-	}								\
+static __always_inline unsigned long __xchg##sfx(unsigned long x,	\
+						 volatile void *ptr,	\
+						 int size)		\
+{									\
+	switch (size) {							\
+	case 1:								\
+		return __lse_ll_sc_body(_xchg_case##sfx##_8, x, ptr);	\
+	case 2:								\
+		return __lse_ll_sc_body(_xchg_case##sfx##_16, x, ptr);	\
+	case 4:								\
+		return __lse_ll_sc_body(_xchg_case##sfx##_32, x, ptr);	\
+	case 8:								\
+		return __lse_ll_sc_body(_xchg_case##sfx##_64, x, ptr);	\
+	default:							\
+		BUILD_BUG();						\
+	}								\
 									\
-	unreachable();							\
+	unreachable();							\
 }
 
 __XCHG_GEN()