mirror of
https://github.com/RPCS3/llvm.git
synced 2025-05-17 02:46:00 +00:00

Move the register stackification and coloring passes to run very late, after PEI, tail duplication, and most other passes. This means that all code emitted and expanded by those passes is now exposed to these passes. This also eliminates the need for prologue/epilogue code to be manually stackified, which significantly simplifies the code. This does require running LiveIntervals a second time. It's useful to think of these late passes not as late optimization passes, but as a domain-specific compression algorithm based on knowledge of liveness information. It's used to compress the code after all conventional optimizations are complete, which is why it uses LiveIntervals at a phase when actual optimization passes don't typically need it. Differential Revision: http://reviews.llvm.org/D20075 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@269012 91177308-0d34-0410-b5e6-96231b3b80d8
217 lines
8.8 KiB
C++
217 lines
8.8 KiB
C++
//===-- WebAssemblyFrameLowering.cpp - WebAssembly Frame Lowering ----------==//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
///
|
|
/// \file
|
|
/// \brief This file contains the WebAssembly implementation of
|
|
/// TargetFrameLowering class.
|
|
///
|
|
/// On WebAssembly, there aren't a lot of things to do here. There are no
|
|
/// callee-saved registers to save, and no spill slots.
|
|
///
|
|
/// The stack grows downward.
|
|
///
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "WebAssemblyFrameLowering.h"
|
|
#include "MCTargetDesc/WebAssemblyMCTargetDesc.h"
|
|
#include "WebAssemblyInstrInfo.h"
|
|
#include "WebAssemblyMachineFunctionInfo.h"
|
|
#include "WebAssemblySubtarget.h"
|
|
#include "WebAssemblyTargetMachine.h"
|
|
#include "llvm/CodeGen/MachineFrameInfo.h"
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
|
#include "llvm/CodeGen/MachineModuleInfo.h"
|
|
#include "llvm/CodeGen/MachineRegisterInfo.h"
|
|
#include "llvm/Support/Debug.h"
|
|
using namespace llvm;
|
|
|
|
#define DEBUG_TYPE "wasm-frame-info"
|
|
|
|
// TODO: wasm64
|
|
// TODO: Emit TargetOpcode::CFI_INSTRUCTION instructions
|
|
|
|
/// Return true if the specified function should have a dedicated frame pointer
|
|
/// register.
|
|
bool WebAssemblyFrameLowering::hasFP(const MachineFunction &MF) const {
|
|
const MachineFrameInfo *MFI = MF.getFrameInfo();
|
|
const auto *RegInfo =
|
|
MF.getSubtarget<WebAssemblySubtarget>().getRegisterInfo();
|
|
return MFI->isFrameAddressTaken() || MFI->hasVarSizedObjects() ||
|
|
MFI->hasStackMap() || MFI->hasPatchPoint() ||
|
|
RegInfo->needsStackRealignment(MF);
|
|
}
|
|
|
|
/// Under normal circumstances, when a frame pointer is not required, we reserve
|
|
/// argument space for call sites in the function immediately on entry to the
|
|
/// current function. This eliminates the need for add/sub sp brackets around
|
|
/// call sites. Returns true if the call frame is included as part of the stack
|
|
/// frame.
|
|
bool WebAssemblyFrameLowering::hasReservedCallFrame(
|
|
const MachineFunction &MF) const {
|
|
return !MF.getFrameInfo()->hasVarSizedObjects();
|
|
}
|
|
|
|
|
|
/// Returns true if this function needs a local user-space stack pointer.
|
|
/// Unlike a machine stack pointer, the wasm user stack pointer is a global
|
|
/// variable, so it is loaded into a register in the prolog.
|
|
bool WebAssemblyFrameLowering::needsSP(const MachineFunction &MF,
|
|
const MachineFrameInfo &MFI) const {
|
|
return MFI.getStackSize() || MFI.adjustsStack() || hasFP(MF);
|
|
}
|
|
|
|
/// Returns true if the local user-space stack pointer needs to be written back
|
|
/// to memory by this function (this is not meaningful if needsSP is false). If
|
|
/// false, the stack red zone can be used and only a local SP is needed.
|
|
bool WebAssemblyFrameLowering::needsSPWriteback(
|
|
const MachineFunction &MF, const MachineFrameInfo &MFI) const {
|
|
assert(needsSP(MF, MFI));
|
|
return MFI.getStackSize() > RedZoneSize || MFI.hasCalls() ||
|
|
MF.getFunction()->hasFnAttribute(Attribute::NoRedZone);
|
|
}
|
|
|
|
static void writeSPToMemory(unsigned SrcReg, MachineFunction &MF,
|
|
MachineBasicBlock &MBB,
|
|
MachineBasicBlock::iterator &InsertAddr,
|
|
MachineBasicBlock::iterator &InsertStore,
|
|
DebugLoc DL) {
|
|
auto *SPSymbol = MF.createExternalSymbolName("__stack_pointer");
|
|
MachineRegisterInfo &MRI = MF.getRegInfo();
|
|
const TargetRegisterClass *PtrRC =
|
|
MRI.getTargetRegisterInfo()->getPointerRegClass(MF);
|
|
unsigned SPAddr = MRI.createVirtualRegister(PtrRC);
|
|
unsigned Discard = MRI.createVirtualRegister(PtrRC);
|
|
const auto *TII = MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo();
|
|
|
|
BuildMI(MBB, InsertAddr, DL, TII->get(WebAssembly::CONST_I32), SPAddr)
|
|
.addExternalSymbol(SPSymbol);
|
|
auto *MMO = new MachineMemOperand(MachinePointerInfo(),
|
|
MachineMemOperand::MOStore, 4, 4);
|
|
BuildMI(MBB, InsertStore, DL, TII->get(WebAssembly::STORE_I32),
|
|
Discard)
|
|
.addImm(0)
|
|
.addReg(SPAddr)
|
|
.addImm(2) // p2align
|
|
.addReg(SrcReg)
|
|
.addMemOperand(MMO);
|
|
}
|
|
|
|
MachineBasicBlock::iterator
|
|
WebAssemblyFrameLowering::eliminateCallFramePseudoInstr(
|
|
MachineFunction &MF, MachineBasicBlock &MBB,
|
|
MachineBasicBlock::iterator I) const {
|
|
assert(!I->getOperand(0).getImm() && hasFP(MF) &&
|
|
"Call frame pseudos should only be used for dynamic stack adjustment");
|
|
const auto *TII = MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo();
|
|
if (I->getOpcode() == TII->getCallFrameDestroyOpcode() &&
|
|
needsSPWriteback(MF, *MF.getFrameInfo())) {
|
|
DebugLoc DL = I->getDebugLoc();
|
|
writeSPToMemory(WebAssembly::SP32, MF, MBB, I, I, DL);
|
|
}
|
|
return MBB.erase(I);
|
|
}
|
|
|
|
void WebAssemblyFrameLowering::emitPrologue(MachineFunction &MF,
|
|
MachineBasicBlock &MBB) const {
|
|
// TODO: Do ".setMIFlag(MachineInstr::FrameSetup)" on emitted instructions
|
|
auto *MFI = MF.getFrameInfo();
|
|
assert(MFI->getCalleeSavedInfo().empty() &&
|
|
"WebAssembly should not have callee-saved registers");
|
|
|
|
if (!needsSP(MF, *MFI)) return;
|
|
uint64_t StackSize = MFI->getStackSize();
|
|
|
|
const auto *TII = MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo();
|
|
auto &MRI = MF.getRegInfo();
|
|
|
|
auto InsertPt = MBB.begin();
|
|
DebugLoc DL;
|
|
|
|
const TargetRegisterClass *PtrRC =
|
|
MRI.getTargetRegisterInfo()->getPointerRegClass(MF);
|
|
unsigned SPAddr = MRI.createVirtualRegister(PtrRC);
|
|
unsigned SPReg = MRI.createVirtualRegister(PtrRC);
|
|
auto *SPSymbol = MF.createExternalSymbolName("__stack_pointer");
|
|
BuildMI(MBB, InsertPt, DL, TII->get(WebAssembly::CONST_I32), SPAddr)
|
|
.addExternalSymbol(SPSymbol);
|
|
// This MachinePointerInfo should reference __stack_pointer as well but
|
|
// doesn't because MachinePointerInfo() takes a GV which we don't have for
|
|
// __stack_pointer. TODO: check if PseudoSourceValue::ExternalSymbolCallEntry
|
|
// is appropriate instead. (likewise for EmitEpologue below)
|
|
auto *LoadMMO = new MachineMemOperand(MachinePointerInfo(),
|
|
MachineMemOperand::MOLoad, 4, 4);
|
|
// Load the SP value.
|
|
BuildMI(MBB, InsertPt, DL, TII->get(WebAssembly::LOAD_I32),
|
|
StackSize ? SPReg : (unsigned)WebAssembly::SP32)
|
|
.addImm(0) // offset
|
|
.addReg(SPAddr) // addr
|
|
.addImm(2) // p2align
|
|
.addMemOperand(LoadMMO);
|
|
|
|
if (StackSize) {
|
|
// Subtract the frame size
|
|
unsigned OffsetReg = MRI.createVirtualRegister(PtrRC);
|
|
BuildMI(MBB, InsertPt, DL, TII->get(WebAssembly::CONST_I32), OffsetReg)
|
|
.addImm(StackSize);
|
|
BuildMI(MBB, InsertPt, DL, TII->get(WebAssembly::SUB_I32),
|
|
WebAssembly::SP32)
|
|
.addReg(SPReg)
|
|
.addReg(OffsetReg);
|
|
}
|
|
if (hasFP(MF)) {
|
|
// Unlike most conventional targets (where FP points to the saved FP),
|
|
// FP points to the bottom of the fixed-size locals, so we can use positive
|
|
// offsets in load/store instructions.
|
|
BuildMI(MBB, InsertPt, DL, TII->get(WebAssembly::COPY),
|
|
WebAssembly::FP32)
|
|
.addReg(WebAssembly::SP32);
|
|
}
|
|
if (StackSize && needsSPWriteback(MF, *MFI)) {
|
|
writeSPToMemory(WebAssembly::SP32, MF, MBB, InsertPt, InsertPt, DL);
|
|
}
|
|
}
|
|
|
|
void WebAssemblyFrameLowering::emitEpilogue(MachineFunction &MF,
|
|
MachineBasicBlock &MBB) const {
|
|
auto *MFI = MF.getFrameInfo();
|
|
uint64_t StackSize = MFI->getStackSize();
|
|
if (!needsSP(MF, *MFI) || !needsSPWriteback(MF, *MFI)) return;
|
|
const auto *TII = MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo();
|
|
auto &MRI = MF.getRegInfo();
|
|
auto InsertPt = MBB.getFirstTerminator();
|
|
DebugLoc DL;
|
|
|
|
if (InsertPt != MBB.end())
|
|
DL = InsertPt->getDebugLoc();
|
|
|
|
// Restore the stack pointer. If we had fixed-size locals, add the offset
|
|
// subtracted in the prolog.
|
|
unsigned SPReg = 0;
|
|
MachineBasicBlock::iterator InsertAddr = InsertPt;
|
|
if (StackSize) {
|
|
const TargetRegisterClass *PtrRC =
|
|
MRI.getTargetRegisterInfo()->getPointerRegClass(MF);
|
|
unsigned OffsetReg = MRI.createVirtualRegister(PtrRC);
|
|
InsertAddr =
|
|
BuildMI(MBB, InsertPt, DL, TII->get(WebAssembly::CONST_I32), OffsetReg)
|
|
.addImm(StackSize);
|
|
// In the epilog we don't need to write the result back to the SP32 physreg
|
|
// because it won't be used again. We can use a stackified register instead.
|
|
SPReg = MRI.createVirtualRegister(PtrRC);
|
|
BuildMI(MBB, InsertPt, DL, TII->get(WebAssembly::ADD_I32), SPReg)
|
|
.addReg(hasFP(MF) ? WebAssembly::FP32 : WebAssembly::SP32)
|
|
.addReg(OffsetReg);
|
|
} else {
|
|
SPReg = hasFP(MF) ? WebAssembly::FP32 : WebAssembly::SP32;
|
|
}
|
|
|
|
writeSPToMemory(SPReg, MF, MBB, InsertAddr, InsertPt, DL);
|
|
}
|