mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-12 15:30:56 +00:00
85af3e7445
Use volatile store to protect the generated PTX from DCE. Patch by Jingyue Wu. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@206763 91177308-0d34-0410-b5e6-96231b3b80d8
19 lines
796 B
LLVM
19 lines
796 B
LLVM
; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s --check-prefix=PTX32
|
|
; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 | FileCheck %s --check-prefix=PTX64
|
|
|
|
; Ensure we access the local stack properly
; The file is compiled once with -march=nvptx and once with -march=nvptx64;
; each llc output is matched by FileCheck against the directives carrying the
; prefix named on that command line (PTX32 or PTX64 respectively).
|
|
|
|
; 32-bit expectations, matched in order: the __local_depot symbol is moved into
; a u32 register, cvta.local.u32 writes %SP from a register, the argument is
; loaded from foo_param_0, and it is written with st.volatile.u32 to [%SP+0].
; PTX32: mov.u32 %r{{[0-9]+}}, __local_depot{{[0-9]+}};
|
|
; PTX32: cvta.local.u32 %SP, %r{{[0-9]+}};
|
|
; PTX32: ld.param.u32 %r{{[0-9]+}}, [foo_param_0];
|
|
; PTX32: st.volatile.u32 [%SP+0], %r{{[0-9]+}};
|
|
; 64-bit expectations: the same sequence, except that the depot move and
; cvta.local use u64 with %rl registers. The parameter load and the volatile
; store are still u32 because the stored value is an i32.
; PTX64: mov.u64 %rl{{[0-9]+}}, __local_depot{{[0-9]+}};
|
|
; PTX64: cvta.local.u64 %SP, %rl{{[0-9]+}};
|
|
; PTX64: ld.param.u32 %r{{[0-9]+}}, [foo_param_0];
|
|
; PTX64: st.volatile.u32 [%SP+0], %r{{[0-9]+}};
|
|
; Test input: takes one i32 argument, writes it to a stack slot, and returns.
; Nothing ever reads the slot back.
define void @foo(i32 %a) {
|
|
; Single 4-byte-aligned i32 stack object; the checks above expect it to be
; addressed as [%SP+0].
%local = alloca i32, align 4
|
|
; The store is volatile so that it is not eliminated as dead code; this keeps
; the stack access present in the generated PTX (emitted as st.volatile.u32).
store volatile i32 %a, i32* %local
|
|
ret void
|
|
}
|