llvm/test/CodeGen/AArch64/sibling-call.ll

; RUN: llc -verify-machineinstrs < %s -mtriple=aarch64-none-linux-gnu | FileCheck %s

declare void @callee_stack0()
declare void @callee_stack8([8 x i32], i64)
declare void @callee_stack16([8 x i32], i64, i64)

define void @caller_to0_from0() nounwind {
; CHECK: caller_to0_from0:
; CHECK-NEXT: // BB
  tail call void @callee_stack0()
  ret void
; CHECK-NEXT: b callee_stack0
}

define void @caller_to0_from8([8 x i32], i64) nounwind{
; CHECK: caller_to0_from8:
; CHECK-NEXT: // BB

  tail call void @callee_stack0()
  ret void
; CHECK-NEXT: b callee_stack0
}

define void @caller_to8_from0() {
; CHECK: caller_to8_from0:

; Caller isn't going to clean up any extra stack we allocate, so it
; can't be a tail call.
  tail call void @callee_stack8([8 x i32] undef, i64 42)
  ret void
; CHECK: bl callee_stack8
}

define void @caller_to8_from8([8 x i32], i64 %a) {
; CHECK: caller_to8_from8:
; CHECK-NOT: sub sp, sp,

; This should reuse our stack area for the 42
  tail call void @callee_stack8([8 x i32] undef, i64 42)
  ret void
; CHECK: str {{x[0-9]+}}, [sp]
; CHECK-NEXT: b callee_stack8
}

define void @caller_to16_from8([8 x i32], i64 %a) {
; CHECK: caller_to16_from8:

; Shouldn't be a tail call: we can't use SP+8 because our caller might
; have something there. This may sound obvious but implementation does
; some funky aligning.
  tail call void @callee_stack16([8 x i32] undef, i64 undef, i64 undef)
; CHECK: bl callee_stack16
  ret void
}

define void @caller_to8_from24([8 x i32], i64 %a, i64 %b, i64 %c) {
; CHECK: caller_to8_from24:
; CHECK-NOT: sub sp, sp

; Reuse our area, putting "42" at incoming sp
  tail call void @callee_stack8([8 x i32] undef, i64 42)
  ret void
; CHECK: str {{x[0-9]+}}, [sp]
; CHECK-NEXT: b callee_stack8
}

define void @caller_to16_from16([8 x i32], i64 %a, i64 %b) {
; CHECK: caller_to16_from16:
; CHECK-NOT: sub sp, sp,

; Here we want to make sure that both loads happen before the stores:
; otherwise either %a or %b will be wrongly clobbered.
  tail call void @callee_stack16([8 x i32] undef, i64 %b, i64 %a)
  ret void

; CHECK: ldr x0,
; CHECK: ldr x1,
; CHECK: str x1,
; CHECK: str x0,

; CHECK-NOT: add sp, sp,
; CHECK: b callee_stack16
}

@func = global void(i32)* null

define void @indirect_tail() {
; CHECK: indirect_tail:
; CHECK-NOT: sub sp, sp

  %fptr = load void(i32)** @func
  tail call void %fptr(i32 42)
  ret void
; CHECK: movz w0, #42
; CHECK: ldr [[FPTR:x[1-9]+]], [{{x[0-9]+}}, #:lo12:func]
; CHECK: br [[FPTR]]
}
Add explicit triples to AArch64 tests Only Linux is supported at the moment, and other platforms quickly fault. As a result these tests would fail on non-Linux hosts. It may be worth making the tests more generic again as more platforms are supported. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@174170 91177308-0d34-0410-b5e6-96231b3b80d8 2013-02-01 11:40:47 +00:00			`; RUN: llc -verify-machineinstrs < %s -mtriple=aarch64-none-linux-gnu \| FileCheck %s`
Add AArch64 as an experimental target. This patch adds support for AArch64 (ARM's 64-bit architecture) to LLVM in the "experimental" category. Currently, it won't be built unless requested explicitly. This initial commit should have support for: + Assembly of all scalar (i.e. non-NEON, non-Crypto) instructions (except the late addition CRC instructions). + CodeGen features required for C++03 and C99. + Compilation for the "small" memory model: code+static data < 4GB. + Absolute and position-independent code. + GNU-style (i.e. "__thread") TLS. + Debugging information. The principal omission, currently, is performance tuning. This patch excludes the NEON support also reviewed due to an outbreak of batshit insanity in our legal department. That will be committed soon bringing the changes to precisely what has been approved. Further reviews would be gratefully received. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@174054 91177308-0d34-0410-b5e6-96231b3b80d8 2013-01-31 12:12:40 +00:00
			`declare void @callee_stack0()`
			`declare void @callee_stack8([8 x i32], i64)`
			`declare void @callee_stack16([8 x i32], i64, i64)`

			`define void @caller_to0_from0() nounwind {`
			`; CHECK: caller_to0_from0:`
			`; CHECK-NEXT: // BB`
			`tail call void @callee_stack0()`
			`ret void`
			`; CHECK-NEXT: b callee_stack0`
			`}`

			`define void @caller_to0_from8([8 x i32], i64) nounwind{`
			`; CHECK: caller_to0_from8:`
			`; CHECK-NEXT: // BB`

			`tail call void @callee_stack0()`
			`ret void`
			`; CHECK-NEXT: b callee_stack0`
			`}`

			`define void @caller_to8_from0() {`
			`; CHECK: caller_to8_from0:`

			`; Caller isn't going to clean up any extra stack we allocate, so it`
			`; can't be a tail call.`
			`tail call void @callee_stack8([8 x i32] undef, i64 42)`
			`ret void`
			`; CHECK: bl callee_stack8`
			`}`

			`define void @caller_to8_from8([8 x i32], i64 %a) {`
			`; CHECK: caller_to8_from8:`
			`; CHECK-NOT: sub sp, sp,`

			`; This should reuse our stack area for the 42`
			`tail call void @callee_stack8([8 x i32] undef, i64 42)`
			`ret void`
			`; CHECK: str {{x[0-9]+}}, [sp]`
			`; CHECK-NEXT: b callee_stack8`
			`}`

			`define void @caller_to16_from8([8 x i32], i64 %a) {`
			`; CHECK: caller_to16_from8:`

			`; Shouldn't be a tail call: we can't use SP+8 because our caller might`
			`; have something there. This may sound obvious but implementation does`
			`; some funky aligning.`
			`tail call void @callee_stack16([8 x i32] undef, i64 undef, i64 undef)`
			`; CHECK: bl callee_stack16`
			`ret void`
			`}`

			`define void @caller_to8_from24([8 x i32], i64 %a, i64 %b, i64 %c) {`
			`; CHECK: caller_to8_from24:`
			`; CHECK-NOT: sub sp, sp`

			`; Reuse our area, putting "42" at incoming sp`
			`tail call void @callee_stack8([8 x i32] undef, i64 42)`
			`ret void`
			`; CHECK: str {{x[0-9]+}}, [sp]`
			`; CHECK-NEXT: b callee_stack8`
			`}`

			`define void @caller_to16_from16([8 x i32], i64 %a, i64 %b) {`
			`; CHECK: caller_to16_from16:`
			`; CHECK-NOT: sub sp, sp,`

			`; Here we want to make sure that both loads happen before the stores:`
			`; otherwise either %a or %b will be wrongly clobbered.`
			`tail call void @callee_stack16([8 x i32] undef, i64 %b, i64 %a)`
			`ret void`

			`; CHECK: ldr x0,`
			`; CHECK: ldr x1,`
			`; CHECK: str x1,`
			`; CHECK: str x0,`

			`; CHECK-NOT: add sp, sp,`
			`; CHECK: b callee_stack16`
			`}`

			`@func = global void(i32)* null`

			`define void @indirect_tail() {`
			`; CHECK: indirect_tail:`
			`; CHECK-NOT: sub sp, sp`

			`%fptr = load void(i32)** @func`
			`tail call void %fptr(i32 42)`
			`ret void`
			`; CHECK: movz w0, #42`
			`; CHECK: ldr [[FPTR:x[1-9]+]], [{{x[0-9]+}}, #:lo12:func]`
			`; CHECK: br [[FPTR]]`
			`}`