mirror of
https://github.com/RPCSX/llvm.git
synced 2025-01-26 22:45:05 +00:00
874371d11b
This commit changes the interface of the vld[1234], vld[234]lane, vst[1234], and vst[234]lane ARM NEON intrinsics and associates an address space with the pointer that these intrinsics take. This changes, e.g., <2 x i32> @llvm.arm.neon.vld1.v2i32(i8*, i32) to <2 x i32> @llvm.arm.neon.vld1.v2i32.p0i8(i8*, i32). This change ensures that address spaces are fully taken into account in the ARM target during lowering of interleaved loads and stores. Differential Revision: http://reviews.llvm.org/D12985 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@248887 91177308-0d34-0410-b5e6-96231b3b80d8
26 lines
966 B
LLVM
26 lines
966 B
LLVM
; Test driver line: llc reads this file on stdin with -O0 and
; -mcpu=cortex-a8, and its output is piped to FileCheck, which is given this
; same file as the source of its check directives.
; NOTE(review): -O0 is presumably what selects the fast register allocator
; that the comment further down refers to - confirm.
; RUN: llc < %s -O0 -mcpu=cortex-a8 | FileCheck %s
|
|
; Module-level data layout string, passed through verbatim to the backend.
target datalayout = "e-p:32:32:32-i1:8:32-i8:8:32-i16:16:32-i32:32:32-i64:32:32-f32:32:32-f64:32:32-v64:32:64-v128:32:128-a0:0:32-n32"
|
|
; Target triple: thumbv7 architecture, apple vendor, darwin10 OS.
target triple = "thumbv7-apple-darwin10"
|
|
|
|
; This tests the fast register allocator's handling of partial redefines:
|
|
;
|
|
; %reg1028:dsub_0<def>, %reg1028:dsub_1<def> = VLD1q64 %reg1025...
|
|
; %reg1030:dsub_1<def> = COPY %reg1028:dsub_0<kill>
|
|
;
|
|
; %reg1028 gets allocated %Q0, and if %reg1030 is reloaded for the partial
|
|
; redef, it cannot also get %Q0.
|
|
|
|
; CHECK: vld1.64 {d16, d17}, [r{{.}}]
|
|
; CHECK-NOT: vld1.64 {d16, d17}
|
|
; CHECK: vmov.f64
|
|
|
|
; @test - IR reproducer for the partial-redefine pattern described in the
; comment block above.
;
; A <2 x i64> value is loaded from %arg via the NEON vld1 intrinsic. The
; shufflevector then builds a new vector from <undef, %loaded>: mask index 1
; picks lane 1 of the undef operand, and mask index 2 picks lane 0 of the
; loaded value, placing it in lane 1 of the result. That result is stored
; through an undef pointer and the function returns undef.
; NOTE(review): the undef pointer and return value presumably exist only to
; keep the reproducer minimal - confirm.
define i32 @test(i8* %arg) nounwind {
entry:
  %loaded = call <2 x i64> @llvm.arm.neon.vld1.v2i64.p0i8(i8* %arg, i32 1)
  %lo_into_hi = shufflevector <2 x i64> undef, <2 x i64> %loaded, <2 x i32> <i32 1, i32 2>
  store <2 x i64> %lo_into_hi, <2 x i64>* undef, align 16
  ret i32 undef
}
|
|
|
|
; Declaration of the NEON vld1 intrinsic called by @test: it takes an i8* and
; an i32 and returns <2 x i64>, and is marked nounwind readonly.
; NOTE(review): the ".p0i8" name suffix presumably encodes the pointer
; operand's type and address space, and the i32 operand is presumably the
; alignment - confirm against the intrinsic's documentation.
declare <2 x i64> @llvm.arm.neon.vld1.v2i64.p0i8(i8*, i32) nounwind readonly
|