llvm/test/CodeGen/ARM/a15-mla.ll

; RUN: llc -mtriple=arm-eabi -float-abi=hard -mcpu=cortex-a15 -mattr=+neon,+neonfp %s -o - \
; RUN:  | FileCheck %s

; This test checks that the VMLxForwarting feature is disabled for A15.
; CHECK: fun_a:
define <4 x i32> @fun_a(<4 x i32> %x, <4 x i32> %y) nounwind{
  %1 = add <4 x i32> %x, %y
; CHECK-NOT: vmul
; CHECK: vmla
  %2 = mul <4 x i32> %1, %1
  %3 = add <4 x i32> %y, %2
  ret <4 x i32> %3
}

; This tests checks that VMLA FP patterns can be matched in instruction selection when targeting
; Cortex-A15.
; CHECK: fun_b:
define <4 x float> @fun_b(<4 x float> %x, <4 x float> %y, <4 x float> %z) nounwind{
; CHECK: vmla.f32
  %t = fmul <4 x float> %x, %y
  %r = fadd <4 x float> %t, %z
  ret <4 x float> %r
}

; This tests checks that FP VMLA instructions are not expanded into separate multiply/addition
; operations when targeting Cortex-A15.
; CHECK: fun_c:
define <4 x float> @fun_c(<4 x float> %x, <4 x float> %y, <4 x float> %z, <4 x float> %u, <4 x float> %v) nounwind{
; CHECK: vmla.f32
  %t1 = fmul <4 x float> %x, %y
  %r1 = fadd <4 x float> %t1, %z
; CHECK: vmla.f32
  %t2 = fmul <4 x float> %u, %v
  %r2 = fadd <4 x float> %t2, %r1
  ret <4 x float> %r2
}
ARM: fixup more tests to specify the target more explicitly This changes the tests that were targeting ARM EABI to explicitly specify the environment rather than relying on the default. This breaks with the new Windows on ARM support when running the tests on Windows where the default environment is no longer EABI. Take the opportunity to avoid a pointless redirect (helps when trying to debug with providing a command line invocation which can be copy and pasted) and removing a few greps in favour of FileCheck. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@205541 91177308-0d34-0410-b5e6-96231b3b80d8 2014-04-03 16:01:44 +00:00			`; RUN: llc -mtriple=arm-eabi -float-abi=hard -mcpu=cortex-a15 -mattr=+neon,+neonfp %s -o - \`
			`; RUN: \| FileCheck %s`
Removed the VMLxForwarding feature for the Cortex-A15 target. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@164030 91177308-0d34-0410-b5e6-96231b3b80d8 2012-09-17 14:10:54 +00:00
			`; This test checks that the VMLxForwarting feature is disabled for A15.`
Allow generation of vmla.f32 instructions when targeting Cortex-A15. The patch also adds the VFP4 feature to Cortex-A15 and fixes the DontUseFusedMAC predicate so that we can still generate vmla.f32 instructions on non-darwin targets with VFP4. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@187349 91177308-0d34-0410-b5e6-96231b3b80d8 2013-07-29 09:25:50 +00:00			`; CHECK: fun_a:`
Removed the VMLxForwarding feature for the Cortex-A15 target. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@164030 91177308-0d34-0410-b5e6-96231b3b80d8 2012-09-17 14:10:54 +00:00			`define <4 x i32> @fun_a(<4 x i32> %x, <4 x i32> %y) nounwind{`
			`%1 = add <4 x i32> %x, %y`
			`; CHECK-NOT: vmul`
			`; CHECK: vmla`
			`%2 = mul <4 x i32> %1, %1`
			`%3 = add <4 x i32> %y, %2`
			`ret <4 x i32> %3`
			`}`
Allow generation of vmla.f32 instructions when targeting Cortex-A15. The patch also adds the VFP4 feature to Cortex-A15 and fixes the DontUseFusedMAC predicate so that we can still generate vmla.f32 instructions on non-darwin targets with VFP4. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@187349 91177308-0d34-0410-b5e6-96231b3b80d8 2013-07-29 09:25:50 +00:00
			`; This tests checks that VMLA FP patterns can be matched in instruction selection when targeting`
			`; Cortex-A15.`
			`; CHECK: fun_b:`
			`define <4 x float> @fun_b(<4 x float> %x, <4 x float> %y, <4 x float> %z) nounwind{`
			`; CHECK: vmla.f32`
			`%t = fmul <4 x float> %x, %y`
			`%r = fadd <4 x float> %t, %z`
			`ret <4 x float> %r`
			`}`

			`; This tests checks that FP VMLA instructions are not expanded into separate multiply/addition`
			`; operations when targeting Cortex-A15.`
			`; CHECK: fun_c:`
			`define <4 x float> @fun_c(<4 x float> %x, <4 x float> %y, <4 x float> %z, <4 x float> %u, <4 x float> %v) nounwind{`
			`; CHECK: vmla.f32`
			`%t1 = fmul <4 x float> %x, %y`
			`%r1 = fadd <4 x float> %t1, %z`
			`; CHECK: vmla.f32`
			`%t2 = fmul <4 x float> %u, %v`
			`%r2 = fadd <4 x float> %t2, %r1`
			`ret <4 x float> %r2`
			`}`