mirror of
https://github.com/RPCSX/llvm.git
synced 2025-01-25 05:34:59 +00:00
9e24ab7252
This patch adds a pass for doing PowerPC peephole optimizations at the MI level while the code is still in SSA form. This allows for easy modifications to the instructions while depending on a subsequent pass of DCE. Both passes are very fast due to the characteristics of SSA. At this time, the only peepholes added are for cleaning up various redundancies involving the XXPERMDI instruction. However, I would expect this will be a useful place to add more peepholes for inefficiencies generated during instruction selection. The pass is placed after VSX swap optimization, as it is best to let that pass remove unnecessary swaps before performing any remaining clean-ups. The utility of these clean-ups are demonstrated by changes to four existing test cases, all of which now have tighter expected code generation. I've also added Eric Schweiz's bugpoint-reduced test from PR25157, for which we now generate tight code. One other test started failing for me, and I've fixed it (test/Transforms/PlaceSafepoints/finite-loops.ll) as well; this is not related to my changes, and I'm not sure why it works before and not after. The problem is that the CHECK-NOT: of "statepoint" from test1 fails because of the "statepoint" in test2, and so forth. Adding a CHECK-LABEL in between keeps the different occurrences of that string properly scoped. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@252651 91177308-0d34-0410-b5e6-96231b3b80d8
105 lines
3.4 KiB
C++
105 lines
3.4 KiB
C++
//===-- PPC.h - Top-level interface for PowerPC Target ----------*- C++ -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file contains the entry points for global functions defined in the LLVM
|
|
// PowerPC back-end.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_LIB_TARGET_POWERPC_PPC_H
|
|
#define LLVM_LIB_TARGET_POWERPC_PPC_H
|
|
|
|
#include "MCTargetDesc/PPCMCTargetDesc.h"
|
|
#include <string>
|
|
|
|
// GCC #defines PPC on Linux but we use it as our namespace name
|
|
#undef PPC
|
|
|
|
namespace llvm {
|
|
class PPCTargetMachine;
|
|
class PassRegistry;
|
|
class FunctionPass;
|
|
class ImmutablePass;
|
|
class MachineInstr;
|
|
class AsmPrinter;
|
|
class MCInst;
|
|
|
|
FunctionPass *createPPCCTRLoops(PPCTargetMachine &TM);
|
|
#ifndef NDEBUG
|
|
FunctionPass *createPPCCTRLoopsVerify();
|
|
#endif
|
|
FunctionPass *createPPCLoopDataPrefetchPass();
|
|
FunctionPass *createPPCLoopPreIncPrepPass(PPCTargetMachine &TM);
|
|
FunctionPass *createPPCTOCRegDepsPass();
|
|
FunctionPass *createPPCEarlyReturnPass();
|
|
FunctionPass *createPPCVSXCopyPass();
|
|
FunctionPass *createPPCVSXFMAMutatePass();
|
|
FunctionPass *createPPCVSXSwapRemovalPass();
|
|
FunctionPass *createPPCMIPeepholePass();
|
|
FunctionPass *createPPCBranchSelectionPass();
|
|
FunctionPass *createPPCISelDag(PPCTargetMachine &TM);
|
|
FunctionPass *createPPCTLSDynamicCallPass();
|
|
void LowerPPCMachineInstrToMCInst(const MachineInstr *MI, MCInst &OutMI,
|
|
AsmPrinter &AP, bool isDarwin);
|
|
|
|
void initializePPCVSXFMAMutatePass(PassRegistry&);
|
|
extern char &PPCVSXFMAMutateID;
|
|
|
|
namespace PPCII {
|
|
|
|
/// Target Operand Flag enum.
|
|
enum TOF {
|
|
//===------------------------------------------------------------------===//
|
|
// PPC Specific MachineOperand flags.
|
|
MO_NO_FLAG,
|
|
|
|
/// MO_PLT_OR_STUB - On a symbol operand "FOO", this indicates that the
|
|
/// reference is actually to the "FOO$stub" or "FOO@plt" symbol. This is
|
|
/// used for calls and jumps to external functions on Tiger and earlier, and
|
|
/// for PIC calls on Linux and ELF systems.
|
|
MO_PLT_OR_STUB = 1,
|
|
|
|
/// MO_PIC_FLAG - If this bit is set, the symbol reference is relative to
|
|
/// the function's picbase, e.g. lo16(symbol-picbase).
|
|
MO_PIC_FLAG = 2,
|
|
|
|
/// MO_NLP_FLAG - If this bit is set, the symbol reference is actually to
|
|
/// the non_lazy_ptr for the global, e.g. lo16(symbol$non_lazy_ptr-picbase).
|
|
MO_NLP_FLAG = 4,
|
|
|
|
/// MO_NLP_HIDDEN_FLAG - If this bit is set, the symbol reference is to a
|
|
/// symbol with hidden visibility. This causes a different kind of
|
|
/// non-lazy-pointer to be generated.
|
|
MO_NLP_HIDDEN_FLAG = 8,
|
|
|
|
/// The next are not flags but distinct values.
|
|
MO_ACCESS_MASK = 0xf0,
|
|
|
|
/// MO_LO, MO_HA - lo16(symbol) and ha16(symbol)
|
|
MO_LO = 1 << 4,
|
|
MO_HA = 2 << 4,
|
|
|
|
MO_TPREL_LO = 4 << 4,
|
|
MO_TPREL_HA = 3 << 4,
|
|
|
|
/// These values identify relocations on immediates folded
|
|
/// into memory operations.
|
|
MO_DTPREL_LO = 5 << 4,
|
|
MO_TLSLD_LO = 6 << 4,
|
|
MO_TOC_LO = 7 << 4,
|
|
|
|
// Symbol for VK_PPC_TLS fixup attached to an ADD instruction
|
|
MO_TLS = 8 << 4
|
|
};
|
|
} // end namespace PPCII
|
|
|
|
} // end namespace llvm;
|
|
|
|
#endif
|