mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-08 13:00:50 +00:00
c0b0c677a1
Only implemented for R600 so far. SI is missing implementations of a few callbacks used by the Indirect Addressing pass and needs code to handle frame indices. At the moment R600 only supports array sizes of 16 dwords or less. Register packing of vector types is currently disabled, which means that a vec4 is stored in T0_X, T1_X, T2_X, T3_X, rather than T0_XYZW. In order to correctly pack registers in all cases, we will need to implement an analysis pass for R600 that determines the correct vector width for each array. v2: - Add support for i8 zext load from stack. - Coding style fixes v3: - Don't reserve registers for indirect addressing when it isn't being used. - Fix bug caused by LLVM limiting the number of SubRegIndex declarations. v4: - Fix 64-bit defines git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@174525 91177308-0d34-0410-b5e6-96231b3b80d8
146 lines
4.7 KiB
C++
146 lines
4.7 KiB
C++
//===-- AMDGPUISelLowering.h - AMDGPU Lowering Interface --------*- C++ -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
/// \file
|
|
/// \brief Interface definition of the TargetLowering class that is common
|
|
/// to all AMD GPUs.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef AMDGPUISELLOWERING_H
|
|
#define AMDGPUISELLOWERING_H
|
|
|
|
#include "llvm/Target/TargetLowering.h"
|
|
|
|
namespace llvm {
|
|
|
|
class MachineRegisterInfo;
|
|
|
|
class AMDGPUTargetLowering : public TargetLowering {
|
|
private:
|
|
SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const;
|
|
|
|
protected:
|
|
|
|
/// \brief Helper function that adds Reg to the LiveIn list of the DAG's
|
|
/// MachineFunction.
|
|
///
|
|
/// \returns a RegisterSDNode representing Reg.
|
|
SDValue CreateLiveInRegister(SelectionDAG &DAG, const TargetRegisterClass *RC,
|
|
unsigned Reg, EVT VT) const;
|
|
|
|
bool isHWTrueValue(SDValue Op) const;
|
|
bool isHWFalseValue(SDValue Op) const;
|
|
|
|
public:
|
|
AMDGPUTargetLowering(TargetMachine &TM);
|
|
|
|
virtual SDValue LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv,
|
|
bool isVarArg,
|
|
const SmallVectorImpl<ISD::InputArg> &Ins,
|
|
DebugLoc DL, SelectionDAG &DAG,
|
|
SmallVectorImpl<SDValue> &InVals) const;
|
|
|
|
virtual SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv,
|
|
bool isVarArg,
|
|
const SmallVectorImpl<ISD::OutputArg> &Outs,
|
|
const SmallVectorImpl<SDValue> &OutVals,
|
|
DebugLoc DL, SelectionDAG &DAG) const;
|
|
|
|
virtual SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerIntrinsicIABS(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerIntrinsicLRP(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerMinMax(SDValue Op, SelectionDAG &DAG) const;
|
|
virtual const char* getTargetNodeName(unsigned Opcode) const;
|
|
|
|
// Functions defined in AMDILISelLowering.cpp
|
|
public:
|
|
|
|
/// \brief Determine which of the bits specified in \p Mask are known to be
|
|
/// either zero or one and return them in the \p KnownZero and \p KnownOne
|
|
/// bitsets.
|
|
virtual void computeMaskedBitsForTargetNode(const SDValue Op,
|
|
APInt &KnownZero,
|
|
APInt &KnownOne,
|
|
const SelectionDAG &DAG,
|
|
unsigned Depth = 0) const;
|
|
|
|
virtual bool getTgtMemIntrinsic(IntrinsicInfo &Info,
|
|
const CallInst &I, unsigned Intrinsic) const;
|
|
|
|
/// We want to mark f32/f64 floating point values as legal.
|
|
bool isFPImmLegal(const APFloat &Imm, EVT VT) const;
|
|
|
|
/// We don't want to shrink f64/f32 constants.
|
|
bool ShouldShrinkFPConstant(EVT VT) const;
|
|
|
|
private:
|
|
void InitAMDILLowering();
|
|
SDValue LowerSREM(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSREM8(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSREM16(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSREM32(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSREM64(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSDIV(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSDIV24(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSDIV32(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSDIV64(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerSIGN_EXTEND_INREG(SDValue Op, SelectionDAG &DAG) const;
|
|
EVT genIntType(uint32_t size = 32, uint32_t numEle = 1) const;
|
|
SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG) const;
|
|
SDValue LowerFP_ROUND(SDValue Op, SelectionDAG &DAG) const;
|
|
};
|
|
|
|
namespace AMDGPUISD {
|
|
|
|
enum {
|
|
// AMDIL ISD Opcodes
|
|
FIRST_NUMBER = ISD::BUILTIN_OP_END,
|
|
MAD, // 32bit Fused Multiply Add instruction
|
|
CALL, // Function call based on a single integer
|
|
UMUL, // 32bit unsigned multiplication
|
|
DIV_INF, // Divide with infinity returned on zero divisor
|
|
RET_FLAG,
|
|
BRANCH_COND,
|
|
// End AMDIL ISD Opcodes
|
|
BITALIGN,
|
|
DWORDADDR,
|
|
FRACT,
|
|
FMAX,
|
|
SMAX,
|
|
UMAX,
|
|
FMIN,
|
|
SMIN,
|
|
UMIN,
|
|
URECIP,
|
|
EXPORT,
|
|
CONST_ADDRESS,
|
|
REGISTER_LOAD,
|
|
REGISTER_STORE,
|
|
LAST_AMDGPU_ISD_NUMBER
|
|
};
|
|
|
|
|
|
} // End namespace AMDGPUISD
|
|
|
|
namespace SIISD {
|
|
|
|
enum {
|
|
SI_FIRST = AMDGPUISD::LAST_AMDGPU_ISD_NUMBER,
|
|
VCC_AND,
|
|
VCC_BITCAST
|
|
};
|
|
|
|
} // End namespace SIISD
|
|
|
|
} // End namespace llvm
|
|
|
|
#endif // AMDGPUISELLOWERING_H
|