llvm/test/CodeGen/X86/hipe-prologue.ll
Hans Wennborg b667d698ac [X86] Enable call frame optimization ("mov to push") not only for optsize (PR26325)
The size savings are significant, and from what I can tell, both ICC and GCC do this.

Differential Revision: http://reviews.llvm.org/D18573

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@264966 91177308-0d34-0410-b5e6-96231b3b80d8
2016-03-30 23:38:01 +00:00

68 lines
2.1 KiB
LLVM

; RUN: llc < %s -mcpu=generic -mtriple=i686-linux -verify-machineinstrs | FileCheck %s -check-prefix=X32-Linux
; RUN: llc < %s -mtriple=x86_64-linux-gnu -verify-machineinstrs | FileCheck %s -check-prefix=X64-Linux
; The HiPE compiler (i.e., the native code compiler of the Erlang/OTP system)
; adds a custom assembly prologue in order to efficiently manipulate the stack
; at runtime.
; Just to prevent the alloca from being optimized away.
declare void @dummy_use(i32*, i32)
define {i32, i32} @test_basic(i32 %hp, i32 %p) {
; X32-Linux-LABEL: test_basic:
; X32-Linux-NOT: calll inc_stack_0
; X64-Linux-LABEL: test_basic:
; X64-Linux-NOT: callq inc_stack_0
%mem = alloca i32, i32 10
call void @dummy_use (i32* %mem, i32 10)
%1 = insertvalue {i32, i32} undef, i32 %hp, 0
%2 = insertvalue {i32, i32} %1, i32 %p, 1
ret {i32, i32} %1
}
define cc 11 {i32, i32} @test_basic_hipecc(i32 %hp, i32 %p) {
; X32-Linux-LABEL: test_basic_hipecc:
; X32-Linux: leal -140(%esp), %ebx
; X32-Linux-NEXT: cmpl 76(%ebp), %ebx
; X32-Linux-NEXT: jb .LBB1_1
; X32-Linux: ret
; X32-Linux: .LBB1_1:
; X32-Linux-NEXT: calll inc_stack_0
; X64-Linux-LABEL: test_basic_hipecc:
; X64-Linux: leaq -232(%rsp), %r14
; X64-Linux-NEXT: cmpq 144(%rbp), %r14
; X64-Linux-NEXT: jb .LBB1_1
; X64-Linux: ret
; X64-Linux: .LBB1_1:
; X64-Linux-NEXT: callq inc_stack_0
%mem = alloca i32, i32 10
call void @dummy_use (i32* %mem, i32 10)
%1 = insertvalue {i32, i32} undef, i32 %hp, 0
%2 = insertvalue {i32, i32} %1, i32 %p, 1
ret {i32, i32} %2
}
define cc 11 {i32,i32,i32} @test_nocall_hipecc(i32 %hp,i32 %p,i32 %x,i32 %y) {
; X32-Linux-LABEL: test_nocall_hipecc:
; X32-Linux-NOT: calll inc_stack_0
; X64-Linux-LABEL: test_nocall_hipecc:
; X64-Linux-NOT: callq inc_stack_0
%1 = add i32 %x, %y
%2 = mul i32 42, %1
%3 = sub i32 24, %2
%4 = insertvalue {i32, i32, i32} undef, i32 %hp, 0
%5 = insertvalue {i32, i32, i32} %4, i32 %p, 1
%6 = insertvalue {i32, i32, i32} %5, i32 %p, 2
ret {i32, i32, i32} %6
}