mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-26 12:50:30 +00:00
e45131dbf7
Summary: If LTOUnit splitting is disabled, the module summary analysis computes the summary information necessary to perform single implementation devirtualization during the thin link with the index and no IR. The information collected from the regular LTO IR in the current hybrid WPD algorithm is summarized, including: 1) For vtable definitions, record the function pointers and their offset within the vtable initializer (subsumes the information collected from IR by tryFindVirtualCallTargets). 2) A record for each type metadata summarizing the vtable definitions decorated with that metadata (subsumes the TypeIdentifierMap collected from IR). Also added are the necessary bitcode records, and the corresponding assembly support. The follow-on index-based WPD patch is D55153. Depends on D53890. Reviewers: pcc Subscribers: mehdi_amini, Prazek, inglorion, eraman, steven_wu, dexonsmith, arphaman, llvm-commits Differential Revision: https://reviews.llvm.org/D54815 llvm-svn: 364960
147 lines
6.4 KiB
LLVM
147 lines
6.4 KiB
LLVM
; REQUIRES: x86-registered-target
|
|
|
|
; Test devirtualization through the thin link and backend.
|
|
|
|
; Generate split module with summary for hybrid Thin/Regular LTO WPD.
|
|
; RUN: opt -thinlto-bc -thinlto-split-lto-unit -o %t.o %s
|
|
|
|
; Check that we have module flag showing splitting enabled, and that we don't
|
|
; generate summary information needed for index-based WPD.
|
|
; RUN: llvm-modextract -b -n=0 %t.o -o %t.o.0
|
|
; RUN: llvm-dis -o - %t.o.0 | FileCheck %s --check-prefix=ENABLESPLITFLAG --implicit-check-not=vTableFuncs --implicit-check-not=typeidCompatibleVTable
|
|
; RUN: llvm-modextract -b -n=1 %t.o -o %t.o.1
|
|
; RUN: llvm-dis -o - %t.o.1 | FileCheck %s --check-prefix=ENABLESPLITFLAG --implicit-check-not=vTableFuncs --implicit-check-not=typeidCompatibleVTable
|
|
; ENABLESPLITFLAG: !{i32 1, !"EnableSplitLTOUnit", i32 1}
|
|
|
|
; Generate unsplit module with summary for ThinLTO index-based WPD.
|
|
; RUN: opt -thinlto-bc -o %t2.o %s
|
|
|
|
; Check that the module flag is 0 when splitting is not enabled for ThinLTO,
|
|
; and that we generate summary information needed for index-based WPD.
|
|
; RUN: llvm-dis -o - %t2.o | FileCheck %s --check-prefix=NOENABLESPLITFLAG
|
|
; NOENABLESPLITFLAG-DAG: !{i32 1, !"EnableSplitLTOUnit", i32 0}
|
|
; NOENABLESPLITFLAG-DAG: [[An:\^[0-9]+]] = gv: (name: "_ZN1A1nEi")
|
|
; NOENABLESPLITFLAG-DAG: [[Bf:\^[0-9]+]] = gv: (name: "_ZN1B1fEi")
|
|
; NOENABLESPLITFLAG-DAG: [[Cf:\^[0-9]+]] = gv: (name: "_ZN1C1fEi")
|
|
; NOENABLESPLITFLAG-DAG: [[Dm:\^[0-9]+]] = gv: (name: "_ZN1D1mEi")
|
|
; NOENABLESPLITFLAG-DAG: [[B:\^[0-9]+]] = gv: (name: "_ZTV1B", {{.*}} vTableFuncs: ((virtFunc: [[Bf]], offset: 16), (virtFunc: [[An]], offset: 24)), refs: ([[Bf]], [[An]])
|
|
; NOENABLESPLITFLAG-DAG: [[C:\^[0-9]+]] = gv: (name: "_ZTV1C", {{.*}} vTableFuncs: ((virtFunc: [[Cf]], offset: 16), (virtFunc: [[An]], offset: 24)), refs: ([[An]], [[Cf]])
|
|
; NOENABLESPLITFLAG-DAG: [[D:\^[0-9]+]] = gv: (name: "_ZTV1D", {{.*}} vTableFuncs: ((virtFunc: [[Dm]], offset: 16)), refs: ([[Dm]])
|
|
; NOENABLESPLITFLAG-DAG: typeidCompatibleVTable: (name: "_ZTS1A", summary: ((offset: 16, [[B]]), (offset: 16, [[C]])))
|
|
; NOENABLESPLITFLAG-DAG: typeidCompatibleVTable: (name: "_ZTS1B", summary: ((offset: 16, [[B]])))
|
|
; NOENABLESPLITFLAG-DAG: typeidCompatibleVTable: (name: "_ZTS1C", summary: ((offset: 16, [[C]])))
|
|
; Type Id on _ZTV1D should have been promoted
|
|
; NOENABLESPLITFLAG-DAG: typeidCompatibleVTable: (name: "1${{.*}}", summary: ((offset: 16, [[D]])))
|
|
|
|
; TODO: Test index-based WPD on %t2.o once implemented.
|
|
|
|
; Legacy PM
|
|
; RUN: llvm-lto2 run %t.o -save-temps -pass-remarks=. \
|
|
; RUN: -o %t3 \
|
|
; RUN: -r=%t.o,test,px \
|
|
; RUN: -r=%t.o,_ZN1A1nEi,p \
|
|
; RUN: -r=%t.o,_ZN1B1fEi,p \
|
|
; RUN: -r=%t.o,_ZN1C1fEi,p \
|
|
; RUN: -r=%t.o,_ZN1D1mEi,p \
|
|
; RUN: -r=%t.o,_ZTV1B, \
|
|
; RUN: -r=%t.o,_ZTV1C, \
|
|
; RUN: -r=%t.o,_ZTV1D, \
|
|
; RUN: -r=%t.o,_ZN1A1nEi, \
|
|
; RUN: -r=%t.o,_ZN1B1fEi, \
|
|
; RUN: -r=%t.o,_ZN1C1fEi, \
|
|
; RUN: -r=%t.o,_ZN1D1mEi, \
|
|
; RUN: -r=%t.o,_ZTV1B,px \
|
|
; RUN: -r=%t.o,_ZTV1C,px \
|
|
; RUN: -r=%t.o,_ZTV1D,px 2>&1 | FileCheck %s --check-prefix=REMARK
|
|
; RUN: llvm-dis %t3.1.4.opt.bc -o - | FileCheck %s --check-prefix=CHECK-IR
|
|
|
|
; New PM
|
|
; RUN: llvm-lto2 run %t.o -save-temps -use-new-pm -pass-remarks=. \
|
|
; RUN: -o %t3 \
|
|
; RUN: -r=%t.o,test,px \
|
|
; RUN: -r=%t.o,_ZN1A1nEi,p \
|
|
; RUN: -r=%t.o,_ZN1B1fEi,p \
|
|
; RUN: -r=%t.o,_ZN1C1fEi,p \
|
|
; RUN: -r=%t.o,_ZN1D1mEi,p \
|
|
; RUN: -r=%t.o,_ZTV1B, \
|
|
; RUN: -r=%t.o,_ZTV1C, \
|
|
; RUN: -r=%t.o,_ZTV1D, \
|
|
; RUN: -r=%t.o,_ZN1A1nEi, \
|
|
; RUN: -r=%t.o,_ZN1B1fEi, \
|
|
; RUN: -r=%t.o,_ZN1C1fEi, \
|
|
; RUN: -r=%t.o,_ZN1D1mEi, \
|
|
; RUN: -r=%t.o,_ZTV1B,px \
|
|
; RUN: -r=%t.o,_ZTV1C,px \
|
|
; RUN: -r=%t.o,_ZTV1D,px 2>&1 | FileCheck %s --check-prefix=REMARK
|
|
; RUN: llvm-dis %t3.1.4.opt.bc -o - | FileCheck %s --check-prefix=CHECK-IR
|
|
|
|
; REMARK-DAG: single-impl: devirtualized a call to _ZN1A1nEi
|
|
; REMARK-DAG: single-impl: devirtualized a call to _ZN1D1mEi
|
|
|
|
; Target configuration for the module under test.
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-grtev4-linux-gnu"

; Object layouts. @test loads the first field of A and D as the vtable
; pointer. B and C each wrap a single A; D does not embed A.
%struct.A = type { i32 (...)** }
%struct.B = type { %struct.A }
%struct.C = type { %struct.A }
%struct.D = type { i32 (...)** }

; Vtables. The first two slots are null/undef placeholders, so the first
; function pointer sits at byte offset 16, the offset used by the !type
; annotations below and by the summary checks at the top of the file.
;   @_ZTV1B: f = @_ZN1B1fEi, n = @_ZN1A1nEi   (type ids !0 and !1)
;   @_ZTV1C: f = @_ZN1C1fEi, n = @_ZN1A1nEi   (type ids !0 and !2)
;   @_ZTV1D: m = @_ZN1D1mEi                   (type id !3)
@_ZTV1B = constant { [4 x i8*] } { [4 x i8*] [i8* null, i8* undef, i8* bitcast (i32 (%struct.B*, i32)* @_ZN1B1fEi to i8*), i8* bitcast (i32 (%struct.A*, i32)* @_ZN1A1nEi to i8*)] }, !type !0, !type !1
@_ZTV1C = constant { [4 x i8*] } { [4 x i8*] [i8* null, i8* undef, i8* bitcast (i32 (%struct.C*, i32)* @_ZN1C1fEi to i8*), i8* bitcast (i32 (%struct.A*, i32)* @_ZN1A1nEi to i8*)] }, !type !0, !type !2
@_ZTV1D = constant { [3 x i8*] } { [3 x i8*] [i8* null, i8* undef, i8* bitcast (i32 (%struct.D*, i32)* @_ZN1D1mEi to i8*)] }, !type !3
|
|
|
|
|
|
; @test makes three indirect calls through loaded vtable pointers:
;   1. slot 1 of %obj's vtable  - @_ZN1A1nEi in both @_ZTV1B and @_ZTV1C, so
;      the optimized IR is expected to call it directly;
;   2. slot 0 of %obj's vtable  - @_ZN1B1fEi vs @_ZN1C1fEi, so the call is
;      expected to stay indirect;
;   3. slot 0 of %obj2's vtable - only @_ZN1D1mEi (from @_ZTV1D), so the call
;      is expected to become direct.
; Value names (%call, %call3, %fptr22, %call4) are matched by the IR checks
; below and must not be renamed.
; CHECK-IR-LABEL: define i32 @test
define i32 @test(%struct.A* %obj, %struct.D* %obj2, i32 %a) {
entry:
  ; Load %obj's vtable pointer and assume it is compatible with "_ZTS1A".
  %0 = bitcast %struct.A* %obj to i8***
  %vtable = load i8**, i8*** %0
  %1 = bitcast i8** %vtable to i8*
  %p = call i1 @llvm.type.test(i8* %1, metadata !"_ZTS1A")
  call void @llvm.assume(i1 %p)
  ; Slot 1 relative to the loaded vtable pointer.
  %fptrptr = getelementptr i8*, i8** %vtable, i32 1
  %2 = bitcast i8** %fptrptr to i32 (%struct.A*, i32)**
  %fptr1 = load i32 (%struct.A*, i32)*, i32 (%struct.A*, i32)** %2, align 8

  ; Check that the call was devirtualized.
  ; CHECK-IR: %call = tail call i32 @_ZN1A1nEi
  %call = tail call i32 %fptr1(%struct.A* nonnull %obj, i32 %a)

  ; Slot 0 relative to the same vtable pointer.
  %3 = bitcast i8** %vtable to i32 (%struct.A*, i32)**
  %fptr22 = load i32 (%struct.A*, i32)*, i32 (%struct.A*, i32)** %3, align 8

  ; We still have to call it as virtual.
  ; CHECK-IR: %call3 = tail call i32 %fptr22
  %call3 = tail call i32 %fptr22(%struct.A* nonnull %obj, i32 %call)

  ; Load %obj2's vtable pointer and assume it is compatible with the distinct
  ; type id !4.
  %4 = bitcast %struct.D* %obj2 to i8***
  %vtable2 = load i8**, i8*** %4
  %5 = bitcast i8** %vtable2 to i8*
  %p2 = call i1 @llvm.type.test(i8* %5, metadata !4)
  call void @llvm.assume(i1 %p2)

  ; Slot 0 of %obj2's vtable.
  %6 = bitcast i8** %vtable2 to i32 (%struct.D*, i32)**
  %fptr33 = load i32 (%struct.D*, i32)*, i32 (%struct.D*, i32)** %6, align 8

  ; Check that the call was devirtualized.
  ; CHECK-IR: %call4 = tail call i32 @_ZN1D1mEi
  %call4 = tail call i32 %fptr33(%struct.D* nonnull %obj2, i32 %call3)
  ret i32 %call4
}
; CHECK-IR-LABEL: ret i32
; CHECK-IR-LABEL: }
|
|
|
|
; Intrinsics used by @test for the type-test / assume sequence.
declare i1 @llvm.type.test(i8*, metadata)
declare void @llvm.assume(i1)

; Virtual functions referenced from the vtable initializers. Only declarations
; are provided in this module.
declare i32 @_ZN1B1fEi(%struct.B* %this, i32 %a)
declare i32 @_ZN1A1nEi(%struct.A* %this, i32 %a)
declare i32 @_ZN1C1fEi(%struct.C* %this, i32 %a)
declare i32 @_ZN1D1mEi(%struct.D* %this, i32 %a)
|
|
|
|
; Type metadata attached to the vtables via !type: (byte offset, type id).
; !0 is shared by @_ZTV1B and @_ZTV1C; !1 and !2 are specific to each of them.
!0 = !{i64 16, !"_ZTS1A"}
!1 = !{i64 16, !"_ZTS1B"}
!2 = !{i64 16, !"_ZTS1C"}
; @_ZTV1D uses a distinct, unnamed type id (!4). The summary checks at the top
; of the file expect it to show up under a promoted name.
!3 = !{i64 16, !4}
!4 = distinct !{}
|