mirror of
https://github.com/RPCSX/llvm.git
synced 2024-12-16 00:16:50 +00:00
16a661561f
ARM counterpart to r248291: In the comparison failure block of a cmpxchg expansion, the initial ldrex/ldxr will not be followed by a matching strex/stxr. On ARM/AArch64, this unnecessarily ties up the execution monitor, which might have a negative performance impact on some uarchs. Instead, release the monitor in the failure block. The clrex instruction was designed for this: use it. Also see ARMARM v8-A B2.10.2: "Exclusive access instructions and Shareable memory locations". Differential Revision: http://reviews.llvm.org/D13033 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@248294 91177308-0d34-0410-b5e6-96231b3b80d8
19 lines
495 B
LLVM
19 lines
495 B
LLVM
; RUN: llc < %s -mtriple=armv7-apple-darwin -verify-machineinstrs | FileCheck %s -check-prefix=ARM
|
|
; RUN: llc < %s -mtriple=thumbv7-apple-darwin -verify-machineinstrs | FileCheck %s -check-prefix=T2
|
|
; rdar://8964854
|
|
|
|
define i8 @t(i8* %a, i8 %b, i8 %c) nounwind {
|
|
; ARM-LABEL: t:
|
|
; ARM: ldrexb
|
|
; ARM: strexb
|
|
; ARM: clrex
|
|
|
|
; T2-LABEL: t:
|
|
; T2: strexb
|
|
; T2: ldrexb
|
|
; T2: clrex
|
|
%tmp0 = cmpxchg i8* %a, i8 %b, i8 %c monotonic monotonic
|
|
%tmp1 = extractvalue { i8, i1 } %tmp0, 0
|
|
ret i8 %tmp1
|
|
}
|