; Mirror of https://github.com/RPCS3/llvm-mirror.git
; (synced 2025-01-10 13:51:37 +00:00), revision 82c85585f9.
; Commit message (beginning truncated in this copy):
;   "... aligned address. Based on patch by David Peixotto. Also use
;   vld1.64 / vst1.64 with 128-bit alignment to take advantage of alignment
;   hints. rdar://12090772, rdar://12238782 llvm-svn: 164089"
; File info: 334 lines, 7.7 KiB, LLVM.
; RUN: llc < %s -march=arm -mcpu=cortex-a9 | FileCheck %s

; Shared input vector. Every test function in this file loads it with
; "align 16", applies one <4 x float> math intrinsic and stores the result
; through its pointer argument.
@A = global <4 x float> <float 0., float 1., float 2., float 3.>

; test_sqrt: load the <4 x float> global @A, apply llvm.sqrt.v4f32 and store
; the result through %X.
; The directives below expect the address to be built in r1 with a movw/movt
; pair, a vld1.64 load carrying the :128 alignment hint, four scalar
; vsqrt.f32 instructions, and a vst1.64 store of the result.
define void @test_sqrt(<4 x float>* %X) nounwind {

; CHECK: test_sqrt:

; CHECK: movw r1, :lower16:{{.*}}
; CHECK: movt r1, :upper16:{{.*}}
; CHECK: vld1.64 {{.*}}, [r1, :128]
; CHECK: vsqrt.f32 {{s[0-9]+}}, {{s[0-9]+}}
; CHECK: vsqrt.f32 {{s[0-9]+}}, {{s[0-9]+}}
; CHECK: vsqrt.f32 {{s[0-9]+}}, {{s[0-9]+}}
; CHECK: vsqrt.f32 {{s[0-9]+}}, {{s[0-9]+}}
; CHECK: vst1.64 {{.*}}

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.sqrt.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.sqrt.v4f32(<4 x float>) nounwind readonly

; test_cos: load the <4 x float> global @A, apply llvm.cos.v4f32 and store the
; result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; cosf", and finally a vst1.64 store.
define void @test_cos(<4 x float>* %X) nounwind {

; CHECK: test_cos:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}cosf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}cosf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}cosf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}cosf

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.cos.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.cos.v4f32(<4 x float>) nounwind readonly

; test_exp: load the <4 x float> global @A, apply llvm.exp.v4f32 and store the
; result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; expf", and finally a vst1.64 store.
define void @test_exp(<4 x float>* %X) nounwind {

; CHECK: test_exp:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}expf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}expf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}expf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}expf

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.exp.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.exp.v4f32(<4 x float>) nounwind readonly

; test_exp2: load the <4 x float> global @A, apply llvm.exp2.v4f32 and store
; the result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; exp2f", and finally a vst1.64 store.
define void @test_exp2(<4 x float>* %X) nounwind {

; CHECK: test_exp2:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}exp2f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}exp2f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}exp2f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}exp2f

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.exp2.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.exp2.v4f32(<4 x float>) nounwind readonly

; test_log10: load the <4 x float> global @A, apply llvm.log10.v4f32 and store
; the result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; log10f", and finally a vst1.64 store.
define void @test_log10(<4 x float>* %X) nounwind {

; CHECK: test_log10:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}log10f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}log10f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}log10f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}log10f

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.log10.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.log10.v4f32(<4 x float>) nounwind readonly

; test_log: load the <4 x float> global @A, apply llvm.log.v4f32 and store the
; result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; logf", and finally a vst1.64 store.
define void @test_log(<4 x float>* %X) nounwind {

; CHECK: test_log:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}logf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}logf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}logf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}logf

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.log.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.log.v4f32(<4 x float>) nounwind readonly

; test_log2: load the <4 x float> global @A, apply llvm.log2.v4f32 and store
; the result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; log2f", and finally a vst1.64 store.
define void @test_log2(<4 x float>* %X) nounwind {

; CHECK: test_log2:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}log2f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}log2f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}log2f

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}log2f

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.log2.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.log2.v4f32(<4 x float>) nounwind readonly

; test_pow: load the <4 x float> global @A, raise it to the constant vector
; <2.0, 2.0, 2.0, 2.0> with llvm.pow.v4f32 and store the result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; powf", and finally a vst1.64 store.
define void @test_pow(<4 x float>* %X) nounwind {

; CHECK: test_pow:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}powf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}powf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}powf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}powf

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.pow.v4f32(<4 x float> %0, <4 x float> <float 2., float 2., float 2., float 2.>)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.pow.v4f32(<4 x float>, <4 x float>) nounwind readonly

; test_powi: load the <4 x float> global @A, apply llvm.powi.v4f32 with the
; integer exponent 2 and store the result through %X.
; Unlike the library-call tests in this file, the directives below look for a
; vmul.f32 between the load and the store: a movw/movt pair into one register
; (captured as reg0), a vld1.64 load with the :128 alignment hint, a vmul.f32,
; and a vst1.64 store.
define void @test_powi(<4 x float>* %X) nounwind {

; CHECK: test_powi:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64 {{.*}}, :128
; CHECK: vmul.f32 {{.*}}

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.powi.v4f32(<4 x float> %0, i32 2)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.powi.v4f32(<4 x float>, i32) nounwind readonly

; test_sin: load the <4 x float> global @A, apply llvm.sin.v4f32 and store the
; result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; sinf", and finally a vst1.64 store.
define void @test_sin(<4 x float>* %X) nounwind {

; CHECK: test_sin:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}sinf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}sinf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}sinf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}sinf

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.sin.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.sin.v4f32(<4 x float>) nounwind readonly

; test_floor: load the <4 x float> global @A, apply llvm.floor.v4f32 and store
; the result through %X.
; The directives below expect a movw/movt pair into one register (captured as
; reg0), a vld1.64 load, four rounds of "move a value into r0, then bl to
; floorf", and finally a vst1.64 store.
define void @test_floor(<4 x float>* %X) nounwind {

; CHECK: test_floor:

; CHECK: movw [[reg0:r[0-9]+]], :lower16:{{.*}}
; CHECK: movt [[reg0]], :upper16:{{.*}}
; CHECK: vld1.64

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}floorf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}floorf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}floorf

; CHECK: {{v?mov(.32)?}} r0,
; CHECK: bl {{.*}}floorf

; CHECK: vst1.64

L.entry:
  %0 = load <4 x float>* @A, align 16
  %1 = call <4 x float> @llvm.floor.v4f32(<4 x float> %0)
  store <4 x float> %1, <4 x float>* %X, align 16
  ret void
}

declare <4 x float> @llvm.floor.v4f32(<4 x float>) nounwind readonly