2002-10-25 22:55:53 +00:00
|
|
|
//===-- InstSelectSimple.cpp - A simple instruction selector for x86 ------===//
|
2003-10-20 19:43:21 +00:00
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file was developed by the LLVM research group and is distributed under
|
|
|
|
// the University of Illinois Open Source License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
2002-10-25 22:55:53 +00:00
|
|
|
//
|
2003-01-13 00:32:26 +00:00
|
|
|
// This file defines a simple peephole instruction selector for the x86 target
|
2002-10-25 22:55:53 +00:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "X86.h"
|
2002-11-17 21:11:55 +00:00
|
|
|
#include "X86InstrBuilder.h"
|
2003-10-23 16:22:08 +00:00
|
|
|
#include "X86InstrInfo.h"
|
|
|
|
#include "llvm/Constants.h"
|
|
|
|
#include "llvm/DerivedTypes.h"
|
2002-10-25 22:55:53 +00:00
|
|
|
#include "llvm/Function.h"
|
2003-05-13 20:21:19 +00:00
|
|
|
#include "llvm/Instructions.h"
|
2003-12-28 09:47:19 +00:00
|
|
|
#include "llvm/IntrinsicLowering.h"
|
2003-10-23 16:22:08 +00:00
|
|
|
#include "llvm/Pass.h"
|
|
|
|
#include "llvm/CodeGen/MachineConstantPool.h"
|
|
|
|
#include "llvm/CodeGen/MachineFrameInfo.h"
|
2002-10-29 17:43:55 +00:00
|
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
2002-12-25 05:13:53 +00:00
|
|
|
#include "llvm/CodeGen/SSARegMap.h"
|
2002-11-20 00:58:23 +00:00
|
|
|
#include "llvm/Target/MRegisterInfo.h"
|
2003-10-23 16:22:08 +00:00
|
|
|
#include "llvm/Target/TargetMachine.h"
|
2004-02-22 07:04:00 +00:00
|
|
|
#include "llvm/Support/GetElementPtrTypeIterator.h"
|
2003-05-13 20:21:19 +00:00
|
|
|
#include "llvm/Support/InstVisitor.h"
|
2004-01-30 22:13:44 +00:00
|
|
|
#include "llvm/Support/CFG.h"
|
2004-02-22 19:47:26 +00:00
|
|
|
#include "Support/Statistic.h"
|
2003-12-28 09:47:19 +00:00
|
|
|
using namespace llvm;
|
2003-11-11 22:41:34 +00:00
|
|
|
|
2004-02-22 19:47:26 +00:00
|
|
|
namespace {
|
|
|
|
Statistic<>
|
|
|
|
NumFPKill("x86-codegen", "Number of FP_REG_KILL instructions added");
|
|
|
|
}
|
2004-01-30 22:13:44 +00:00
|
|
|
|
2002-10-25 22:55:53 +00:00
|
|
|
namespace {
|
2002-10-29 22:37:54 +00:00
|
|
|
struct ISel : public FunctionPass, InstVisitor<ISel> {
|
|
|
|
TargetMachine &TM;
|
2003-05-08 19:44:13 +00:00
|
|
|
MachineFunction *F; // The function we are compiling into
|
|
|
|
MachineBasicBlock *BB; // The current MBB we are compiling
|
|
|
|
int VarArgsFrameIndex; // FrameIndex for start of varargs area
|
2004-02-15 01:04:03 +00:00
|
|
|
int ReturnAddressIndex; // FrameIndex for the return address
|
2002-10-25 22:55:53 +00:00
|
|
|
|
|
|
|
std::map<Value*, unsigned> RegMap; // Mapping between Val's and SSA Regs
|
|
|
|
|
2002-12-13 10:09:43 +00:00
|
|
|
// MBBMap - Mapping between LLVM BB -> Machine BB
|
|
|
|
std::map<const BasicBlock*, MachineBasicBlock*> MBBMap;
|
|
|
|
|
2003-12-28 21:23:38 +00:00
|
|
|
ISel(TargetMachine &tm) : TM(tm), F(0), BB(0) {}
|
2002-10-25 22:55:53 +00:00
|
|
|
|
|
|
|
/// runOnFunction - Top level implementation of instruction selection for
|
|
|
|
/// the entire function.
|
|
|
|
///
|
2002-10-29 22:37:54 +00:00
|
|
|
bool runOnFunction(Function &Fn) {
|
2003-12-28 09:47:19 +00:00
|
|
|
// First pass over the function, lower any unknown intrinsic functions
|
|
|
|
// with the IntrinsicLowering class.
|
|
|
|
LowerUnknownIntrinsicFunctionCalls(Fn);
|
|
|
|
|
2002-10-29 23:40:58 +00:00
|
|
|
F = &MachineFunction::construct(&Fn, TM);
|
2002-12-13 10:09:43 +00:00
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
// Create all of the machine basic blocks for the function...
|
2002-12-13 10:09:43 +00:00
|
|
|
for (Function::iterator I = Fn.begin(), E = Fn.end(); I != E; ++I)
|
|
|
|
F->getBasicBlockList().push_back(MBBMap[I] = new MachineBasicBlock(I));
|
|
|
|
|
2002-12-16 22:54:46 +00:00
|
|
|
BB = &F->front();
|
2003-05-06 21:32:22 +00:00
|
|
|
|
2004-02-15 01:04:03 +00:00
|
|
|
// Set up a frame object for the return address. This is used by the
|
|
|
|
// llvm.returnaddress & llvm.frameaddress intrinisics.
|
|
|
|
ReturnAddressIndex = F->getFrameInfo()->CreateFixedObject(4, -4);
|
|
|
|
|
2003-05-06 21:32:22 +00:00
|
|
|
// Copy incoming arguments off of the stack...
|
2002-12-28 20:24:02 +00:00
|
|
|
LoadArgumentsToVirtualRegs(Fn);
|
2002-12-16 22:54:46 +00:00
|
|
|
|
2002-12-13 10:09:43 +00:00
|
|
|
// Instruction select everything except PHI nodes
|
2002-10-29 22:37:54 +00:00
|
|
|
visit(Fn);
|
2002-12-13 10:09:43 +00:00
|
|
|
|
|
|
|
// Select the PHI nodes
|
|
|
|
SelectPHINodes();
|
|
|
|
|
2004-02-22 19:47:26 +00:00
|
|
|
// Insert the FP_REG_KILL instructions into blocks that need them.
|
|
|
|
InsertFPRegKills();
|
|
|
|
|
2002-10-25 22:55:53 +00:00
|
|
|
RegMap.clear();
|
2002-12-13 10:09:43 +00:00
|
|
|
MBBMap.clear();
|
2002-10-29 22:37:54 +00:00
|
|
|
F = 0;
|
2003-07-26 23:05:37 +00:00
|
|
|
// We always build a machine code representation for the function
|
|
|
|
return true;
|
2002-10-25 22:55:53 +00:00
|
|
|
}
|
|
|
|
|
2002-12-15 21:13:40 +00:00
|
|
|
virtual const char *getPassName() const {
|
|
|
|
return "X86 Simple Instruction Selection";
|
|
|
|
}
|
|
|
|
|
2002-10-25 22:55:53 +00:00
|
|
|
/// visitBasicBlock - This method is called when we are visiting a new basic
|
2002-10-29 20:48:56 +00:00
|
|
|
/// block. This simply creates a new MachineBasicBlock to emit code into
|
|
|
|
/// and adds it to the current MachineFunction. Subsequent visit* for
|
|
|
|
/// instructions will be invoked for all instructions in the basic block.
|
2002-10-25 22:55:53 +00:00
|
|
|
///
|
|
|
|
void visitBasicBlock(BasicBlock &LLVM_BB) {
|
2002-12-13 10:09:43 +00:00
|
|
|
BB = MBBMap[&LLVM_BB];
|
2002-10-25 22:55:53 +00:00
|
|
|
}
|
|
|
|
|
2003-12-28 09:47:19 +00:00
|
|
|
/// LowerUnknownIntrinsicFunctionCalls - This performs a prepass over the
|
|
|
|
/// function, lowering any calls to unknown intrinsic functions into the
|
|
|
|
/// equivalent LLVM code.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2003-12-28 09:47:19 +00:00
|
|
|
void LowerUnknownIntrinsicFunctionCalls(Function &F);
|
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
/// LoadArgumentsToVirtualRegs - Load all of the arguments to this function
|
|
|
|
/// from the stack into virtual registers.
|
|
|
|
///
|
|
|
|
void LoadArgumentsToVirtualRegs(Function &F);
|
2002-12-13 10:09:43 +00:00
|
|
|
|
|
|
|
/// SelectPHINodes - Insert machine code to generate phis. This is tricky
|
|
|
|
/// because we have to generate our sources into the source basic blocks,
|
|
|
|
/// not the current one.
|
|
|
|
///
|
|
|
|
void SelectPHINodes();
|
|
|
|
|
2004-02-22 19:47:26 +00:00
|
|
|
/// InsertFPRegKills - Insert FP_REG_KILL instructions into basic blocks
|
|
|
|
/// that need them. This only occurs due to the floating point stackifier
|
|
|
|
/// not being aggressive enough to handle arbitrary global stackification.
|
|
|
|
///
|
|
|
|
void InsertFPRegKills();
|
|
|
|
|
2002-10-25 22:55:53 +00:00
|
|
|
// Visitation methods for various instructions. These methods simply emit
|
|
|
|
// fixed X86 code for each instruction.
|
|
|
|
//
|
2002-11-22 11:07:01 +00:00
|
|
|
|
|
|
|
// Control flow operators
|
2002-10-25 22:55:53 +00:00
|
|
|
void visitReturnInst(ReturnInst &RI);
|
2002-11-02 19:27:56 +00:00
|
|
|
void visitBranchInst(BranchInst &BI);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
struct ValueRecord {
|
2003-08-04 02:12:48 +00:00
|
|
|
Value *Val;
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned Reg;
|
|
|
|
const Type *Ty;
|
2003-08-04 02:12:48 +00:00
|
|
|
ValueRecord(unsigned R, const Type *T) : Val(0), Reg(R), Ty(T) {}
|
|
|
|
ValueRecord(Value *V) : Val(V), Reg(0), Ty(V->getType()) {}
|
2003-01-13 00:32:26 +00:00
|
|
|
};
|
|
|
|
void doCall(const ValueRecord &Ret, MachineInstr *CallMI,
|
2003-10-23 16:22:08 +00:00
|
|
|
const std::vector<ValueRecord> &Args);
|
2002-11-22 11:07:01 +00:00
|
|
|
void visitCallInst(CallInst &I);
|
2003-11-11 22:41:34 +00:00
|
|
|
void visitIntrinsicCall(Intrinsic::ID ID, CallInst &I);
|
2002-11-02 20:04:26 +00:00
|
|
|
|
|
|
|
// Arithmetic operators
|
2002-11-02 20:54:46 +00:00
|
|
|
void visitSimpleBinary(BinaryOperator &B, unsigned OpcodeClass);
|
2002-11-02 20:13:22 +00:00
|
|
|
void visitAdd(BinaryOperator &B) { visitSimpleBinary(B, 0); }
|
|
|
|
void visitSub(BinaryOperator &B) { visitSimpleBinary(B, 1); }
|
2004-02-23 03:10:10 +00:00
|
|
|
void doMultiply(MachineBasicBlock *MBB, MachineBasicBlock::iterator MBBI,
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned DestReg, const Type *DestTy,
|
2003-10-23 16:22:08 +00:00
|
|
|
unsigned Op0Reg, unsigned Op1Reg);
|
2003-10-19 21:09:10 +00:00
|
|
|
void doMultiplyConst(MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator MBBI,
|
2003-10-19 21:09:10 +00:00
|
|
|
unsigned DestReg, const Type *DestTy,
|
|
|
|
unsigned Op0Reg, unsigned Op1Val);
|
2002-11-02 20:28:58 +00:00
|
|
|
void visitMul(BinaryOperator &B);
|
2002-11-02 20:04:26 +00:00
|
|
|
|
2002-11-02 20:54:46 +00:00
|
|
|
void visitDiv(BinaryOperator &B) { visitDivRem(B); }
|
|
|
|
void visitRem(BinaryOperator &B) { visitDivRem(B); }
|
|
|
|
void visitDivRem(BinaryOperator &B);
|
|
|
|
|
2002-11-02 20:04:26 +00:00
|
|
|
// Bitwise operators
|
2002-11-02 20:13:22 +00:00
|
|
|
void visitAnd(BinaryOperator &B) { visitSimpleBinary(B, 2); }
|
|
|
|
void visitOr (BinaryOperator &B) { visitSimpleBinary(B, 3); }
|
|
|
|
void visitXor(BinaryOperator &B) { visitSimpleBinary(B, 4); }
|
2002-11-02 20:04:26 +00:00
|
|
|
|
2003-01-16 16:43:00 +00:00
|
|
|
// Comparison operators...
|
|
|
|
void visitSetCondInst(SetCondInst &I);
|
2003-10-19 21:09:10 +00:00
|
|
|
unsigned EmitComparison(unsigned OpNum, Value *Op0, Value *Op1,
|
|
|
|
MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator MBBI);
|
2004-03-30 21:22:00 +00:00
|
|
|
void visitSelectInst(SelectInst &SI);
|
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
|
2002-11-17 21:11:55 +00:00
|
|
|
// Memory Instructions
|
|
|
|
void visitLoadInst(LoadInst &I);
|
|
|
|
void visitStoreInst(StoreInst &I);
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
void visitGetElementPtrInst(GetElementPtrInst &I);
|
|
|
|
void visitAllocaInst(AllocaInst &I);
|
2003-01-13 00:32:26 +00:00
|
|
|
void visitMallocInst(MallocInst &I);
|
|
|
|
void visitFreeInst(FreeInst &I);
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
|
2002-11-02 20:04:26 +00:00
|
|
|
// Other operators
|
2002-10-31 23:03:59 +00:00
|
|
|
void visitShiftInst(ShiftInst &I);
|
2002-12-13 10:09:43 +00:00
|
|
|
void visitPHINode(PHINode &I) {} // PHI nodes handled by second pass
|
2002-11-22 11:07:01 +00:00
|
|
|
void visitCastInst(CastInst &I);
|
2003-10-18 05:56:40 +00:00
|
|
|
void visitVANextInst(VANextInst &I);
|
|
|
|
void visitVAArgInst(VAArgInst &I);
|
2002-10-25 22:55:53 +00:00
|
|
|
|
|
|
|
void visitInstruction(Instruction &I) {
|
|
|
|
std::cerr << "Cannot instruction select: " << I;
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
2002-12-13 07:56:18 +00:00
|
|
|
/// promote32 - Make a value 32-bits wide, and put it somewhere.
|
2003-01-13 00:32:26 +00:00
|
|
|
///
|
|
|
|
void promote32(unsigned targetReg, const ValueRecord &VR);
|
|
|
|
|
2004-03-08 01:18:36 +00:00
|
|
|
/// getAddressingMode - Get the addressing mode to use to address the
|
|
|
|
/// specified value. The returned value should be used with addFullAddress.
|
|
|
|
void getAddressingMode(Value *Addr, unsigned &BaseReg, unsigned &Scale,
|
|
|
|
unsigned &IndexReg, unsigned &Disp);
|
|
|
|
|
|
|
|
|
|
|
|
/// getGEPIndex - This is used to fold GEP instructions into X86 addressing
|
|
|
|
/// expressions.
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
void getGEPIndex(MachineBasicBlock *MBB, MachineBasicBlock::iterator IP,
|
|
|
|
std::vector<Value*> &GEPOps,
|
|
|
|
std::vector<const Type*> &GEPTypes, unsigned &BaseReg,
|
|
|
|
unsigned &Scale, unsigned &IndexReg, unsigned &Disp);
|
|
|
|
|
|
|
|
/// isGEPFoldable - Return true if the specified GEP can be completely
|
|
|
|
/// folded into the addressing mode of a load/store or lea instruction.
|
|
|
|
bool isGEPFoldable(MachineBasicBlock *MBB,
|
|
|
|
Value *Src, User::op_iterator IdxBegin,
|
|
|
|
User::op_iterator IdxEnd, unsigned &BaseReg,
|
|
|
|
unsigned &Scale, unsigned &IndexReg, unsigned &Disp);
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
/// emitGEPOperation - Common code shared between visitGetElementPtrInst and
|
|
|
|
/// constant expression GEP support.
|
|
|
|
///
|
2004-02-22 17:05:38 +00:00
|
|
|
void emitGEPOperation(MachineBasicBlock *BB, MachineBasicBlock::iterator IP,
|
2002-12-13 10:09:43 +00:00
|
|
|
Value *Src, User::op_iterator IdxBegin,
|
2002-12-13 06:56:29 +00:00
|
|
|
User::op_iterator IdxEnd, unsigned TargetReg);
|
|
|
|
|
2003-04-23 17:22:12 +00:00
|
|
|
/// emitCastOperation - Common code shared between visitCastInst and
|
|
|
|
/// constant expression cast support.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2004-02-23 03:10:10 +00:00
|
|
|
void emitCastOperation(MachineBasicBlock *BB,MachineBasicBlock::iterator IP,
|
2003-04-23 17:22:12 +00:00
|
|
|
Value *Src, const Type *DestTy, unsigned TargetReg);
|
|
|
|
|
2003-05-08 20:49:25 +00:00
|
|
|
/// emitSimpleBinaryOperation - Common code shared between visitSimpleBinary
|
|
|
|
/// and constant expression support.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2003-05-08 20:49:25 +00:00
|
|
|
void emitSimpleBinaryOperation(MachineBasicBlock *BB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-05-08 20:49:25 +00:00
|
|
|
Value *Op0, Value *Op1,
|
|
|
|
unsigned OperatorClass, unsigned TargetReg);
|
|
|
|
|
2003-10-23 17:21:43 +00:00
|
|
|
void emitDivRemOperation(MachineBasicBlock *BB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-10-23 17:21:43 +00:00
|
|
|
unsigned Op0Reg, unsigned Op1Reg, bool isDiv,
|
|
|
|
const Type *Ty, unsigned TargetReg);
|
|
|
|
|
2003-08-24 19:19:47 +00:00
|
|
|
/// emitSetCCOperation - Common code shared between visitSetCondInst and
|
|
|
|
/// constant expression support.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2003-08-24 19:19:47 +00:00
|
|
|
void emitSetCCOperation(MachineBasicBlock *BB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-08-24 19:19:47 +00:00
|
|
|
Value *Op0, Value *Op1, unsigned Opcode,
|
|
|
|
unsigned TargetReg);
|
2003-11-22 05:18:35 +00:00
|
|
|
|
|
|
|
/// emitShiftOperation - Common code shared between visitShiftInst and
|
|
|
|
/// constant expression support.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2003-11-22 06:49:41 +00:00
|
|
|
void emitShiftOperation(MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-11-22 06:49:41 +00:00
|
|
|
Value *Op, Value *ShiftAmount, bool isLeftShift,
|
|
|
|
const Type *ResultTy, unsigned DestReg);
|
|
|
|
|
2004-03-30 21:22:00 +00:00
|
|
|
/// emitSelectOperation - Common code shared between visitSelectInst and the
|
|
|
|
/// constant expression support.
|
|
|
|
void emitSelectOperation(MachineBasicBlock *MBB,
|
|
|
|
MachineBasicBlock::iterator IP,
|
|
|
|
Value *Cond, Value *TrueVal, Value *FalseVal,
|
|
|
|
unsigned DestReg);
|
2003-08-24 19:19:47 +00:00
|
|
|
|
2002-10-27 21:16:59 +00:00
|
|
|
/// copyConstantToRegister - Output the instructions required to put the
|
|
|
|
/// specified constant into the specified register.
|
|
|
|
///
|
2002-12-16 19:32:50 +00:00
|
|
|
void copyConstantToRegister(MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator MBBI,
|
2002-12-16 19:32:50 +00:00
|
|
|
Constant *C, unsigned Reg);
|
2002-10-27 21:16:59 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
/// makeAnotherReg - This method returns the next register number we haven't
|
|
|
|
/// yet used.
|
|
|
|
///
|
|
|
|
/// Long values are handled somewhat specially. They are always allocated
|
|
|
|
/// as pairs of 32 bit integer values. The register number returned is the
|
|
|
|
/// lower 32 bits of the long value, and the regNum+1 is the upper 32 bits
|
|
|
|
/// of the long value.
|
|
|
|
///
|
2002-12-13 06:56:29 +00:00
|
|
|
unsigned makeAnotherReg(const Type *Ty) {
|
2003-07-30 05:33:48 +00:00
|
|
|
assert(dynamic_cast<const X86RegisterInfo*>(TM.getRegisterInfo()) &&
|
|
|
|
"Current target doesn't have X86 reg info??");
|
|
|
|
const X86RegisterInfo *MRI =
|
|
|
|
static_cast<const X86RegisterInfo*>(TM.getRegisterInfo());
|
2003-01-13 00:32:26 +00:00
|
|
|
if (Ty == Type::LongTy || Ty == Type::ULongTy) {
|
2003-10-23 16:22:08 +00:00
|
|
|
const TargetRegisterClass *RC = MRI->getRegClassForType(Type::IntTy);
|
|
|
|
// Create the lower part
|
|
|
|
F->getSSARegMap()->createVirtualRegister(RC);
|
|
|
|
// Create the upper part.
|
|
|
|
return F->getSSARegMap()->createVirtualRegister(RC)-1;
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
|
2002-12-13 06:56:29 +00:00
|
|
|
// Add the mapping of regnumber => reg class to MachineFunction
|
2003-07-30 05:33:48 +00:00
|
|
|
const TargetRegisterClass *RC = MRI->getRegClassForType(Ty);
|
2003-01-13 00:32:26 +00:00
|
|
|
return F->getSSARegMap()->createVirtualRegister(RC);
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
}
|
|
|
|
|
2002-10-25 22:55:53 +00:00
|
|
|
/// getReg - This method turns an LLVM value into a register number. This
|
|
|
|
/// is guaranteed to produce the same register number for a particular value
|
|
|
|
/// every time it is queried.
|
|
|
|
///
|
|
|
|
unsigned getReg(Value &V) { return getReg(&V); } // Allow references
|
2002-12-13 10:50:40 +00:00
|
|
|
unsigned getReg(Value *V) {
|
|
|
|
// Just append to the end of the current bb.
|
|
|
|
MachineBasicBlock::iterator It = BB->end();
|
|
|
|
return getReg(V, BB, It);
|
|
|
|
}
|
2002-12-13 11:22:48 +00:00
|
|
|
unsigned getReg(Value *V, MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IPt) {
|
2002-10-25 22:55:53 +00:00
|
|
|
unsigned &Reg = RegMap[V];
|
2002-11-20 00:58:23 +00:00
|
|
|
if (Reg == 0) {
|
2002-12-13 06:56:29 +00:00
|
|
|
Reg = makeAnotherReg(V->getType());
|
2002-11-20 00:58:23 +00:00
|
|
|
RegMap[V] = Reg;
|
|
|
|
}
|
2002-10-25 22:55:53 +00:00
|
|
|
|
2002-10-27 21:23:43 +00:00
|
|
|
// If this operand is a constant, emit the code to copy the constant into
|
|
|
|
// the register here...
|
|
|
|
//
|
2002-12-04 06:45:19 +00:00
|
|
|
if (Constant *C = dyn_cast<Constant>(V)) {
|
2002-12-16 19:32:50 +00:00
|
|
|
copyConstantToRegister(MBB, IPt, C, Reg);
|
2002-12-16 22:54:46 +00:00
|
|
|
RegMap.erase(V); // Assign a new name to this constant if ref'd again
|
2002-12-04 06:45:19 +00:00
|
|
|
} else if (GlobalValue *GV = dyn_cast<GlobalValue>(V)) {
|
|
|
|
// Move the address of the global into the register
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IPt, X86::MOV32ri, 1, Reg).addGlobalAddress(GV);
|
2002-12-16 22:54:46 +00:00
|
|
|
RegMap.erase(V); // Assign a new name to this address if ref'd again
|
2002-12-04 06:45:19 +00:00
|
|
|
}
|
2002-10-27 21:16:59 +00:00
|
|
|
|
2002-10-25 22:55:53 +00:00
|
|
|
return Reg;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2002-11-17 20:07:45 +00:00
|
|
|
/// TypeClass - Used by the X86 backend to group LLVM types by their basic X86
|
|
|
|
/// Representation.
|
|
|
|
///
|
|
|
|
enum TypeClass {
|
2002-12-25 05:13:53 +00:00
|
|
|
cByte, cShort, cInt, cFP, cLong
|
2002-11-17 20:07:45 +00:00
|
|
|
};
|
|
|
|
|
2002-11-02 01:15:18 +00:00
|
|
|
/// getClass - Turn a primitive type into a "class" number which is based on the
|
|
|
|
/// size of the type, and whether or not it is floating point.
|
|
|
|
///
|
2002-11-17 20:07:45 +00:00
|
|
|
static inline TypeClass getClass(const Type *Ty) {
|
2002-11-02 01:15:18 +00:00
|
|
|
switch (Ty->getPrimitiveID()) {
|
|
|
|
case Type::SByteTyID:
|
2002-11-17 20:07:45 +00:00
|
|
|
case Type::UByteTyID: return cByte; // Byte operands are class #0
|
2002-11-02 01:15:18 +00:00
|
|
|
case Type::ShortTyID:
|
2002-11-17 20:07:45 +00:00
|
|
|
case Type::UShortTyID: return cShort; // Short operands are class #1
|
2002-11-02 01:15:18 +00:00
|
|
|
case Type::IntTyID:
|
|
|
|
case Type::UIntTyID:
|
2002-11-17 20:07:45 +00:00
|
|
|
case Type::PointerTyID: return cInt; // Int's and pointers are class #2
|
2002-11-02 01:15:18 +00:00
|
|
|
|
2002-12-25 05:13:53 +00:00
|
|
|
case Type::FloatTyID:
|
|
|
|
case Type::DoubleTyID: return cFP; // Floating Point is #3
|
2003-01-13 00:32:26 +00:00
|
|
|
|
2002-11-02 01:15:18 +00:00
|
|
|
case Type::LongTyID:
|
2003-01-13 00:32:26 +00:00
|
|
|
case Type::ULongTyID: return cLong; // Longs are class #4
|
2002-11-02 01:15:18 +00:00
|
|
|
default:
|
|
|
|
assert(0 && "Invalid type to getClass!");
|
2002-11-17 20:07:45 +00:00
|
|
|
return cByte; // not reached
|
2002-11-02 01:15:18 +00:00
|
|
|
}
|
|
|
|
}
|
2002-10-27 21:16:59 +00:00
|
|
|
|
2002-12-15 08:02:15 +00:00
|
|
|
// getClassB - Just like getClass, but treat boolean values as bytes.
|
|
|
|
static inline TypeClass getClassB(const Type *Ty) {
|
|
|
|
if (Ty == Type::BoolTy) return cByte;
|
|
|
|
return getClass(Ty);
|
|
|
|
}
|
|
|
|
|
2002-11-17 21:56:38 +00:00
|
|
|
|
2002-10-27 21:16:59 +00:00
|
|
|
/// copyConstantToRegister - Output the instructions required to put the
|
|
|
|
/// specified constant into the specified register.
|
|
|
|
///
|
2002-12-16 19:32:50 +00:00
|
|
|
void ISel::copyConstantToRegister(MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2002-12-16 19:32:50 +00:00
|
|
|
Constant *C, unsigned R) {
|
2002-12-13 06:56:29 +00:00
|
|
|
if (ConstantExpr *CE = dyn_cast<ConstantExpr>(C)) {
|
2003-05-08 20:49:25 +00:00
|
|
|
unsigned Class = 0;
|
|
|
|
switch (CE->getOpcode()) {
|
|
|
|
case Instruction::GetElementPtr:
|
2002-12-16 04:23:29 +00:00
|
|
|
emitGEPOperation(MBB, IP, CE->getOperand(0),
|
2002-12-13 10:09:43 +00:00
|
|
|
CE->op_begin()+1, CE->op_end(), R);
|
2002-12-13 06:56:29 +00:00
|
|
|
return;
|
2003-05-08 20:49:25 +00:00
|
|
|
case Instruction::Cast:
|
2003-04-23 17:22:12 +00:00
|
|
|
emitCastOperation(MBB, IP, CE->getOperand(0), CE->getType(), R);
|
2003-04-21 21:33:44 +00:00
|
|
|
return;
|
2002-12-13 06:56:29 +00:00
|
|
|
|
2003-05-08 20:49:25 +00:00
|
|
|
case Instruction::Xor: ++Class; // FALL THROUGH
|
|
|
|
case Instruction::Or: ++Class; // FALL THROUGH
|
|
|
|
case Instruction::And: ++Class; // FALL THROUGH
|
|
|
|
case Instruction::Sub: ++Class; // FALL THROUGH
|
|
|
|
case Instruction::Add:
|
|
|
|
emitSimpleBinaryOperation(MBB, IP, CE->getOperand(0), CE->getOperand(1),
|
|
|
|
Class, R);
|
|
|
|
return;
|
|
|
|
|
2003-10-23 17:21:43 +00:00
|
|
|
case Instruction::Mul: {
|
|
|
|
unsigned Op0Reg = getReg(CE->getOperand(0), MBB, IP);
|
|
|
|
unsigned Op1Reg = getReg(CE->getOperand(1), MBB, IP);
|
|
|
|
doMultiply(MBB, IP, R, CE->getType(), Op0Reg, Op1Reg);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
case Instruction::Div:
|
|
|
|
case Instruction::Rem: {
|
|
|
|
unsigned Op0Reg = getReg(CE->getOperand(0), MBB, IP);
|
|
|
|
unsigned Op1Reg = getReg(CE->getOperand(1), MBB, IP);
|
|
|
|
emitDivRemOperation(MBB, IP, Op0Reg, Op1Reg,
|
|
|
|
CE->getOpcode() == Instruction::Div,
|
|
|
|
CE->getType(), R);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2003-08-24 19:19:47 +00:00
|
|
|
case Instruction::SetNE:
|
|
|
|
case Instruction::SetEQ:
|
|
|
|
case Instruction::SetLT:
|
|
|
|
case Instruction::SetGT:
|
|
|
|
case Instruction::SetLE:
|
|
|
|
case Instruction::SetGE:
|
|
|
|
emitSetCCOperation(MBB, IP, CE->getOperand(0), CE->getOperand(1),
|
|
|
|
CE->getOpcode(), R);
|
|
|
|
return;
|
|
|
|
|
2003-11-22 05:18:35 +00:00
|
|
|
case Instruction::Shl:
|
|
|
|
case Instruction::Shr:
|
|
|
|
emitShiftOperation(MBB, IP, CE->getOperand(0), CE->getOperand(1),
|
2003-11-22 06:49:41 +00:00
|
|
|
CE->getOpcode() == Instruction::Shl, CE->getType(), R);
|
|
|
|
return;
|
2003-11-22 05:18:35 +00:00
|
|
|
|
2004-03-30 21:22:00 +00:00
|
|
|
case Instruction::Select:
|
|
|
|
emitSelectOperation(MBB, IP, CE->getOperand(0), CE->getOperand(1),
|
|
|
|
CE->getOperand(2), R);
|
|
|
|
return;
|
|
|
|
|
2003-05-08 20:49:25 +00:00
|
|
|
default:
|
|
|
|
std::cerr << "Offending expr: " << C << "\n";
|
2003-10-19 21:09:10 +00:00
|
|
|
assert(0 && "Constant expression not yet handled!\n");
|
2003-05-08 20:49:25 +00:00
|
|
|
}
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
}
|
2002-10-27 21:16:59 +00:00
|
|
|
|
2002-11-02 01:15:18 +00:00
|
|
|
if (C->getType()->isIntegral()) {
|
2002-12-15 08:02:15 +00:00
|
|
|
unsigned Class = getClassB(C->getType());
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
if (Class == cLong) {
|
|
|
|
// Copy the value into the register pair.
|
2003-07-23 15:22:26 +00:00
|
|
|
uint64_t Val = cast<ConstantInt>(C)->getRawValue();
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32ri, 1, R).addImm(Val & 0xFFFFFFFF);
|
|
|
|
BuildMI(*MBB, IP, X86::MOV32ri, 1, R+1).addImm(Val >> 32);
|
2003-01-13 00:32:26 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2002-12-25 05:13:53 +00:00
|
|
|
assert(Class <= cInt && "Type not handled yet!");
|
2002-11-02 01:15:18 +00:00
|
|
|
|
|
|
|
static const unsigned IntegralOpcodeTab[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::MOV8ri, X86::MOV16ri, X86::MOV32ri
|
2002-11-02 01:15:18 +00:00
|
|
|
};
|
|
|
|
|
2002-12-15 08:02:15 +00:00
|
|
|
if (C->getType() == Type::BoolTy) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV8ri, 1, R).addImm(C == ConstantBool::True);
|
2002-11-02 01:15:18 +00:00
|
|
|
} else {
|
2003-07-23 15:22:26 +00:00
|
|
|
ConstantInt *CI = cast<ConstantInt>(C);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, IntegralOpcodeTab[Class],1,R).addImm(CI->getRawValue());
|
2002-11-02 01:15:18 +00:00
|
|
|
}
|
2002-12-25 05:13:53 +00:00
|
|
|
} else if (ConstantFP *CFP = dyn_cast<ConstantFP>(C)) {
|
2004-02-02 18:56:30 +00:00
|
|
|
if (CFP->isExactlyValue(+0.0))
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, X86::FLD0, 0, R);
|
2004-02-02 18:56:30 +00:00
|
|
|
else if (CFP->isExactlyValue(+1.0))
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, X86::FLD1, 0, R);
|
2002-12-25 05:13:53 +00:00
|
|
|
else {
|
2003-01-13 00:32:26 +00:00
|
|
|
// Otherwise we need to spill the constant to memory...
|
|
|
|
MachineConstantPool *CP = F->getConstantPool();
|
|
|
|
unsigned CPI = CP->getConstantPoolIndex(CFP);
|
2003-10-20 04:11:23 +00:00
|
|
|
const Type *Ty = CFP->getType();
|
|
|
|
|
|
|
|
assert(Ty == Type::FloatTy || Ty == Type::DoubleTy && "Unknown FP type!");
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
unsigned LoadOpcode = Ty == Type::FloatTy ? X86::FLD32m : X86::FLD64m;
|
2004-02-29 07:22:16 +00:00
|
|
|
addConstantPoolReference(BuildMI(*MBB, IP, LoadOpcode, 4, R), CPI);
|
2002-12-25 05:13:53 +00:00
|
|
|
}
|
|
|
|
|
2002-12-13 10:50:40 +00:00
|
|
|
} else if (isa<ConstantPointerNull>(C)) {
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
// Copy zero (null pointer) to the register.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32ri, 1, R).addImm(0);
|
2002-12-13 06:56:29 +00:00
|
|
|
} else if (ConstantPointerRef *CPR = dyn_cast<ConstantPointerRef>(C)) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32ri, 1, R).addGlobalAddress(CPR->getValue());
|
2002-11-02 01:15:18 +00:00
|
|
|
} else {
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
std::cerr << "Offending constant: " << C << "\n";
|
2002-11-02 01:15:18 +00:00
|
|
|
assert(0 && "Type not handled yet!");
|
2002-10-27 21:16:59 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
/// LoadArgumentsToVirtualRegs - Load all of the arguments to this function from
|
|
|
|
/// the stack into virtual registers.
|
|
|
|
///
|
|
|
|
void ISel::LoadArgumentsToVirtualRegs(Function &Fn) {
|
|
|
|
// Emit instructions to load the arguments... On entry to a function on the
|
|
|
|
// X86, the stack frame looks like this:
|
|
|
|
//
|
|
|
|
// [ESP] -- return address
|
2003-01-13 00:32:26 +00:00
|
|
|
// [ESP + 4] -- first argument (leftmost lexically)
|
|
|
|
// [ESP + 8] -- second argument, if first argument is four bytes in size
|
2002-12-28 20:24:02 +00:00
|
|
|
// ...
|
|
|
|
//
|
2003-01-16 02:20:12 +00:00
|
|
|
unsigned ArgOffset = 0; // Frame mechanisms handle retaddr slot
|
2002-12-28 21:08:28 +00:00
|
|
|
MachineFrameInfo *MFI = F->getFrameInfo();
|
2002-12-28 20:24:02 +00:00
|
|
|
|
|
|
|
for (Function::aiterator I = Fn.abegin(), E = Fn.aend(); I != E; ++I) {
|
|
|
|
unsigned Reg = getReg(*I);
|
|
|
|
|
|
|
|
int FI; // Frame object index
|
|
|
|
switch (getClassB(I->getType())) {
|
|
|
|
case cByte:
|
2002-12-28 21:08:28 +00:00
|
|
|
FI = MFI->CreateFixedObject(1, ArgOffset);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(BB, X86::MOV8rm, 4, Reg), FI);
|
2002-12-28 20:24:02 +00:00
|
|
|
break;
|
|
|
|
case cShort:
|
2002-12-28 21:08:28 +00:00
|
|
|
FI = MFI->CreateFixedObject(2, ArgOffset);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(BB, X86::MOV16rm, 4, Reg), FI);
|
2002-12-28 20:24:02 +00:00
|
|
|
break;
|
|
|
|
case cInt:
|
2002-12-28 21:08:28 +00:00
|
|
|
FI = MFI->CreateFixedObject(4, ArgOffset);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(BB, X86::MOV32rm, 4, Reg), FI);
|
2002-12-28 20:24:02 +00:00
|
|
|
break;
|
2003-01-13 00:32:26 +00:00
|
|
|
case cLong:
|
|
|
|
FI = MFI->CreateFixedObject(8, ArgOffset);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(BB, X86::MOV32rm, 4, Reg), FI);
|
|
|
|
addFrameReference(BuildMI(BB, X86::MOV32rm, 4, Reg+1), FI, 4);
|
2003-01-13 00:32:26 +00:00
|
|
|
ArgOffset += 4; // longs require 4 additional bytes
|
|
|
|
break;
|
2002-12-28 20:24:02 +00:00
|
|
|
case cFP:
|
|
|
|
unsigned Opcode;
|
|
|
|
if (I->getType() == Type::FloatTy) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
Opcode = X86::FLD32m;
|
2003-10-23 16:22:08 +00:00
|
|
|
FI = MFI->CreateFixedObject(4, ArgOffset);
|
2002-12-28 20:24:02 +00:00
|
|
|
} else {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
Opcode = X86::FLD64m;
|
2003-10-23 16:22:08 +00:00
|
|
|
FI = MFI->CreateFixedObject(8, ArgOffset);
|
|
|
|
ArgOffset += 4; // doubles require 4 additional bytes
|
2002-12-28 20:24:02 +00:00
|
|
|
}
|
|
|
|
addFrameReference(BuildMI(BB, Opcode, 4, Reg), FI);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
assert(0 && "Unhandled argument type!");
|
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
ArgOffset += 4; // Each argument takes at least 4 bytes on the stack...
|
2002-12-28 20:24:02 +00:00
|
|
|
}
|
2003-05-08 19:44:13 +00:00
|
|
|
|
|
|
|
// If the function takes variable number of arguments, add a frame offset for
|
|
|
|
// the start of the first vararg value... this is used to expand
|
|
|
|
// llvm.va_start.
|
|
|
|
if (Fn.getFunctionType()->isVarArg())
|
|
|
|
VarArgsFrameIndex = MFI->CreateFixedObject(1, ArgOffset);
|
2002-12-28 20:24:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-12-13 10:09:43 +00:00
|
|
|
/// SelectPHINodes - Insert machine code to generate phis. This is tricky
|
|
|
|
/// because we have to generate our sources into the source basic blocks, not
|
|
|
|
/// the current one.
|
|
|
|
///
|
|
|
|
void ISel::SelectPHINodes() {
|
2003-01-14 22:00:31 +00:00
|
|
|
const TargetInstrInfo &TII = TM.getInstrInfo();
|
2002-12-13 10:09:43 +00:00
|
|
|
const Function &LF = *F->getFunction(); // The LLVM function...
|
|
|
|
for (Function::const_iterator I = LF.begin(), E = LF.end(); I != E; ++I) {
|
|
|
|
const BasicBlock *BB = I;
|
2004-02-29 07:10:16 +00:00
|
|
|
MachineBasicBlock &MBB = *MBBMap[I];
|
2002-12-13 10:09:43 +00:00
|
|
|
|
|
|
|
// Loop over all of the PHI nodes in the LLVM basic block...
|
2004-02-29 07:10:16 +00:00
|
|
|
MachineBasicBlock::iterator PHIInsertPoint = MBB.begin();
|
2002-12-13 10:09:43 +00:00
|
|
|
for (BasicBlock::const_iterator I = BB->begin();
|
2003-10-19 00:26:11 +00:00
|
|
|
PHINode *PN = const_cast<PHINode*>(dyn_cast<PHINode>(I)); ++I) {
|
2003-01-13 00:32:26 +00:00
|
|
|
|
2002-12-13 10:09:43 +00:00
|
|
|
// Create a new machine instr PHI node, and insert it.
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned PHIReg = getReg(*PN);
|
2004-02-29 07:10:16 +00:00
|
|
|
MachineInstr *PhiMI = BuildMI(MBB, PHIInsertPoint,
|
|
|
|
X86::PHI, PN->getNumOperands(), PHIReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
MachineInstr *LongPhiMI = 0;
|
2004-02-29 07:10:16 +00:00
|
|
|
if (PN->getType() == Type::LongTy || PN->getType() == Type::ULongTy)
|
|
|
|
LongPhiMI = BuildMI(MBB, PHIInsertPoint,
|
|
|
|
X86::PHI, PN->getNumOperands(), PHIReg+1);
|
2002-12-13 10:09:43 +00:00
|
|
|
|
2003-05-12 14:22:21 +00:00
|
|
|
// PHIValues - Map of blocks to incoming virtual registers. We use this
|
|
|
|
// so that we only initialize one incoming value for a particular block,
|
|
|
|
// even if the block has multiple entries in the PHI node.
|
|
|
|
//
|
|
|
|
std::map<MachineBasicBlock*, unsigned> PHIValues;
|
|
|
|
|
2002-12-13 10:09:43 +00:00
|
|
|
for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) {
|
|
|
|
MachineBasicBlock *PredMBB = MBBMap[PN->getIncomingBlock(i)];
|
2003-05-12 14:22:21 +00:00
|
|
|
unsigned ValReg;
|
|
|
|
std::map<MachineBasicBlock*, unsigned>::iterator EntryIt =
|
|
|
|
PHIValues.lower_bound(PredMBB);
|
|
|
|
|
|
|
|
if (EntryIt != PHIValues.end() && EntryIt->first == PredMBB) {
|
|
|
|
// We already inserted an initialization of the register for this
|
|
|
|
// predecessor. Recycle it.
|
|
|
|
ValReg = EntryIt->second;
|
|
|
|
|
|
|
|
} else {
|
2003-10-19 00:26:11 +00:00
|
|
|
// Get the incoming value into a virtual register.
|
2003-05-12 14:22:21 +00:00
|
|
|
//
|
2003-10-19 00:26:11 +00:00
|
|
|
Value *Val = PN->getIncomingValue(i);
|
|
|
|
|
|
|
|
// If this is a constant or GlobalValue, we may have to insert code
|
|
|
|
// into the basic block to compute it into a virtual register.
|
|
|
|
if (isa<Constant>(Val) || isa<GlobalValue>(Val)) {
|
2004-03-30 19:10:12 +00:00
|
|
|
if (isa<ConstantExpr>(Val)) {
|
|
|
|
// Because we don't want to clobber any values which might be in
|
|
|
|
// physical registers with the computation of this constant (which
|
|
|
|
// might be arbitrarily complex if it is a constant expression),
|
|
|
|
// just insert the computation at the top of the basic block.
|
|
|
|
MachineBasicBlock::iterator PI = PredMBB->begin();
|
|
|
|
|
|
|
|
// Skip over any PHI nodes though!
|
|
|
|
while (PI != PredMBB->end() && PI->getOpcode() == X86::PHI)
|
|
|
|
++PI;
|
|
|
|
|
|
|
|
ValReg = getReg(Val, PredMBB, PI);
|
|
|
|
} else {
|
|
|
|
// Simple constants get emitted at the end of the basic block,
|
|
|
|
// before any terminator instructions. We "know" that the code to
|
|
|
|
// move a constant into a register will never clobber any flags.
|
|
|
|
ValReg = getReg(Val, PredMBB, PredMBB->getFirstTerminator());
|
|
|
|
}
|
2003-10-19 00:26:11 +00:00
|
|
|
} else {
|
|
|
|
ValReg = getReg(Val);
|
|
|
|
}
|
2003-05-12 14:22:21 +00:00
|
|
|
|
|
|
|
// Remember that we inserted a value for this PHI for this predecessor
|
|
|
|
PHIValues.insert(EntryIt, std::make_pair(PredMBB, ValReg));
|
|
|
|
}
|
2002-12-13 10:09:43 +00:00
|
|
|
|
2003-10-23 16:22:08 +00:00
|
|
|
PhiMI->addRegOperand(ValReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
PhiMI->addMachineBasicBlockOperand(PredMBB);
|
2003-10-23 16:22:08 +00:00
|
|
|
if (LongPhiMI) {
|
|
|
|
LongPhiMI->addRegOperand(ValReg+1);
|
|
|
|
LongPhiMI->addMachineBasicBlockOperand(PredMBB);
|
|
|
|
}
|
2002-12-13 10:09:43 +00:00
|
|
|
}
|
2004-02-29 07:10:16 +00:00
|
|
|
|
|
|
|
// Now that we emitted all of the incoming values for the PHI node, make
|
|
|
|
// sure to reposition the InsertPoint after the PHI that we just added.
|
|
|
|
// This is needed because we might have inserted a constant into this
|
|
|
|
// block, right after the PHI's which is before the old insert point!
|
|
|
|
PHIInsertPoint = LongPhiMI ? LongPhiMI : PhiMI;
|
|
|
|
++PHIInsertPoint;
|
2002-12-13 10:09:43 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2004-02-22 19:47:26 +00:00
|
|
|
/// RequiresFPRegKill - The floating point stackifier pass cannot insert
|
|
|
|
/// compensation code on critical edges. As such, it requires that we kill all
|
|
|
|
/// FP registers on the exit from any blocks that either ARE critical edges, or
|
|
|
|
/// branch to a block that has incoming critical edges.
|
|
|
|
///
|
|
|
|
/// Note that this kill instruction will eventually be eliminated when
|
|
|
|
/// restrictions in the stackifier are relaxed.
|
|
|
|
///
|
|
|
|
static bool RequiresFPRegKill(const BasicBlock *BB) {
|
|
|
|
#if 0
|
|
|
|
for (succ_const_iterator SI = succ_begin(BB), E = succ_end(BB); SI!=E; ++SI) {
|
|
|
|
const BasicBlock *Succ = *SI;
|
|
|
|
pred_const_iterator PI = pred_begin(Succ), PE = pred_end(Succ);
|
|
|
|
++PI; // Block have at least one predecessory
|
|
|
|
if (PI != PE) { // If it has exactly one, this isn't crit edge
|
|
|
|
// If this block has more than one predecessor, check all of the
|
|
|
|
// predecessors to see if they have multiple successors. If so, then the
|
|
|
|
// block we are analyzing needs an FPRegKill.
|
|
|
|
for (PI = pred_begin(Succ); PI != PE; ++PI) {
|
|
|
|
const BasicBlock *Pred = *PI;
|
|
|
|
succ_const_iterator SI2 = succ_begin(Pred);
|
|
|
|
++SI2; // There must be at least one successor of this block.
|
|
|
|
if (SI2 != succ_end(Pred))
|
|
|
|
return true; // Yes, we must insert the kill on this edge.
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// If we got this far, there is no need to insert the kill instruction.
|
|
|
|
return false;
|
|
|
|
#else
|
|
|
|
return true;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
// InsertFPRegKills - Insert FP_REG_KILL instructions into basic blocks that
|
|
|
|
// need them. This only occurs due to the floating point stackifier not being
|
|
|
|
// aggressive enough to handle arbitrary global stackification.
|
|
|
|
//
|
|
|
|
// Currently we insert an FP_REG_KILL instruction into each block that uses or
|
|
|
|
// defines a floating point virtual register.
|
|
|
|
//
|
|
|
|
// When the global register allocators (like linear scan) finally update live
|
|
|
|
// variable analysis, we can keep floating point values in registers across
|
|
|
|
// portions of the CFG that do not involve critical edges. This will be a big
|
|
|
|
// win, but we are waiting on the global allocators before we can do this.
|
|
|
|
//
|
|
|
|
// With a bit of work, the floating point stackifier pass can be enhanced to
|
|
|
|
// break critical edges as needed (to make a place to put compensation code),
|
|
|
|
// but this will require some infrastructure improvements as well.
|
|
|
|
//
|
|
|
|
void ISel::InsertFPRegKills() {
|
|
|
|
SSARegMap &RegMap = *F->getSSARegMap();
|
|
|
|
|
|
|
|
for (MachineFunction::iterator BB = F->begin(), E = F->end(); BB != E; ++BB) {
|
|
|
|
for (MachineBasicBlock::iterator I = BB->begin(), E = BB->end(); I!=E; ++I)
|
2004-02-26 22:00:20 +00:00
|
|
|
for (unsigned i = 0, e = I->getNumOperands(); i != e; ++i) {
|
|
|
|
MachineOperand& MO = I->getOperand(i);
|
|
|
|
if (MO.isRegister() && MO.getReg()) {
|
|
|
|
unsigned Reg = MO.getReg();
|
2004-02-22 19:47:26 +00:00
|
|
|
if (MRegisterInfo::isVirtualRegister(Reg))
|
2004-02-23 07:29:45 +00:00
|
|
|
if (RegMap.getRegClass(Reg)->getSize() == 10)
|
|
|
|
goto UsesFPReg;
|
|
|
|
}
|
2004-02-26 22:00:20 +00:00
|
|
|
}
|
2004-02-23 07:29:45 +00:00
|
|
|
// If we haven't found an FP register use or def in this basic block, check
|
|
|
|
// to see if any of our successors has an FP PHI node, which will cause a
|
|
|
|
// copy to be inserted into this block.
|
2004-02-23 07:42:19 +00:00
|
|
|
for (succ_const_iterator SI = succ_begin(BB->getBasicBlock()),
|
|
|
|
E = succ_end(BB->getBasicBlock()); SI != E; ++SI) {
|
|
|
|
MachineBasicBlock *SBB = MBBMap[*SI];
|
|
|
|
for (MachineBasicBlock::iterator I = SBB->begin();
|
|
|
|
I != SBB->end() && I->getOpcode() == X86::PHI; ++I) {
|
|
|
|
if (RegMap.getRegClass(I->getOperand(0).getReg())->getSize() == 10)
|
|
|
|
goto UsesFPReg;
|
2004-02-22 19:47:26 +00:00
|
|
|
}
|
2004-02-23 07:42:19 +00:00
|
|
|
}
|
2004-02-23 07:29:45 +00:00
|
|
|
continue;
|
|
|
|
UsesFPReg:
|
|
|
|
// Okay, this block uses an FP register. If the block has successors (ie,
|
|
|
|
// it's not an unwind/return), insert the FP_REG_KILL instruction.
|
|
|
|
if (BB->getBasicBlock()->getTerminator()->getNumSuccessors() &&
|
|
|
|
RequiresFPRegKill(BB->getBasicBlock())) {
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, BB->getFirstTerminator(), X86::FP_REG_KILL, 0);
|
2004-02-23 07:29:45 +00:00
|
|
|
++NumFPKill;
|
2004-02-22 19:47:26 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2004-03-30 22:39:09 +00:00
|
|
|
// canFoldSetCCIntoBranchOrSelect - Return the setcc instruction if we can fold
|
|
|
|
// it into the conditional branch or select instruction which is the only user
|
|
|
|
// of the cc instruction. This is the case if the conditional branch is the
|
|
|
|
// only user of the setcc, and if the setcc is in the same basic block as the
|
|
|
|
// conditional branch. We also don't handle long arguments below, so we reject
|
|
|
|
// them here as well.
|
2003-01-16 16:43:00 +00:00
|
|
|
//
|
2004-03-30 22:39:09 +00:00
|
|
|
static SetCondInst *canFoldSetCCIntoBranchOrSelect(Value *V) {
|
2003-01-16 16:43:00 +00:00
|
|
|
if (SetCondInst *SCI = dyn_cast<SetCondInst>(V))
|
2004-03-30 22:39:09 +00:00
|
|
|
if (SCI->hasOneUse()) {
|
|
|
|
Instruction *User = cast<Instruction>(SCI->use_back());
|
|
|
|
if ((isa<BranchInst>(User) || isa<SelectInst>(User)) &&
|
|
|
|
SCI->getParent() == User->getParent() &&
|
|
|
|
getClassB(SCI->getOperand(0)->getType()) != cLong)
|
2003-01-16 16:43:00 +00:00
|
|
|
return SCI;
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
2002-12-13 10:09:43 +00:00
|
|
|
|
2003-01-16 16:43:00 +00:00
|
|
|
// Return a fixed numbering for setcc instructions which does not depend on the
|
|
|
|
// order of the opcodes.
|
|
|
|
//
|
|
|
|
static unsigned getSetCCNumber(unsigned Opcode) {
|
|
|
|
switch(Opcode) {
|
|
|
|
default: assert(0 && "Unknown setcc instruction!");
|
|
|
|
case Instruction::SetEQ: return 0;
|
|
|
|
case Instruction::SetNE: return 1;
|
|
|
|
case Instruction::SetLT: return 2;
|
2003-01-16 18:07:23 +00:00
|
|
|
case Instruction::SetGE: return 3;
|
|
|
|
case Instruction::SetGT: return 4;
|
|
|
|
case Instruction::SetLE: return 5;
|
2003-01-16 16:43:00 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// LLVM -> X86 signed X86 unsigned
|
|
|
|
// ----- ---------- ------------
|
|
|
|
// seteq -> sete sete
|
|
|
|
// setne -> setne setne
|
|
|
|
// setlt -> setl setb
|
2003-01-16 18:07:23 +00:00
|
|
|
// setge -> setge setae
|
2003-01-16 16:43:00 +00:00
|
|
|
// setgt -> setg seta
|
|
|
|
// setle -> setle setbe
|
2003-10-19 21:09:10 +00:00
|
|
|
// ----
|
|
|
|
// sets // Used by comparison with 0 optimization
|
|
|
|
// setns
|
|
|
|
static const unsigned SetCCOpcodeTab[2][8] = {
|
|
|
|
{ X86::SETEr, X86::SETNEr, X86::SETBr, X86::SETAEr, X86::SETAr, X86::SETBEr,
|
|
|
|
0, 0 },
|
|
|
|
{ X86::SETEr, X86::SETNEr, X86::SETLr, X86::SETGEr, X86::SETGr, X86::SETLEr,
|
|
|
|
X86::SETSr, X86::SETNSr },
|
2003-01-16 16:43:00 +00:00
|
|
|
};
|
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
// EmitComparison - This function emits a comparison of the two operands,
|
|
|
|
// returning the extended setcc code to use.
|
|
|
|
unsigned ISel::EmitComparison(unsigned OpNum, Value *Op0, Value *Op1,
|
|
|
|
MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP) {
|
2002-11-07 17:59:21 +00:00
|
|
|
// The arguments are already supposed to be of the same type.
|
2003-01-16 16:43:00 +00:00
|
|
|
const Type *CompTy = Op0->getType();
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned Class = getClassB(CompTy);
|
2003-08-24 19:19:47 +00:00
|
|
|
unsigned Op0r = getReg(Op0, MBB, IP);
|
2003-06-05 19:30:30 +00:00
|
|
|
|
|
|
|
// Special case handling of: cmp R, i
|
|
|
|
if (Class == cByte || Class == cShort || Class == cInt)
|
|
|
|
if (ConstantInt *CI = dyn_cast<ConstantInt>(Op1)) {
|
2003-07-23 15:22:26 +00:00
|
|
|
uint64_t Op1v = cast<ConstantInt>(CI)->getRawValue();
|
|
|
|
|
2003-06-05 19:30:30 +00:00
|
|
|
// Mask off any upper bits of the constant, if there are any...
|
|
|
|
Op1v &= (1ULL << (8 << Class)) - 1;
|
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
// If this is a comparison against zero, emit more efficient code. We
|
|
|
|
// can't handle unsigned comparisons against zero unless they are == or
|
|
|
|
// !=. These should have been strength reduced already anyway.
|
|
|
|
if (Op1v == 0 && (CompTy->isSigned() || OpNum < 2)) {
|
|
|
|
static const unsigned TESTTab[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::TEST8rr, X86::TEST16rr, X86::TEST32rr
|
2003-10-19 21:09:10 +00:00
|
|
|
};
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, TESTTab[Class], 2).addReg(Op0r).addReg(Op0r);
|
2003-10-19 21:09:10 +00:00
|
|
|
|
|
|
|
if (OpNum == 2) return 6; // Map jl -> js
|
|
|
|
if (OpNum == 3) return 7; // Map jg -> jns
|
|
|
|
return OpNum;
|
2003-06-05 19:30:30 +00:00
|
|
|
}
|
2003-10-19 21:09:10 +00:00
|
|
|
|
|
|
|
static const unsigned CMPTab[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::CMP8ri, X86::CMP16ri, X86::CMP32ri
|
2003-10-19 21:09:10 +00:00
|
|
|
};
|
|
|
|
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, CMPTab[Class], 2).addReg(Op0r).addImm(Op1v);
|
2003-10-19 21:09:10 +00:00
|
|
|
return OpNum;
|
2003-06-05 19:30:30 +00:00
|
|
|
}
|
|
|
|
|
2004-02-03 18:54:04 +00:00
|
|
|
// Special case handling of comparison against +/- 0.0
|
|
|
|
if (ConstantFP *CFP = dyn_cast<ConstantFP>(Op1))
|
|
|
|
if (CFP->isExactlyValue(+0.0) || CFP->isExactlyValue(-0.0)) {
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, X86::FTST, 1).addReg(Op0r);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::FNSTSW8r, 0);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SAHF, 1);
|
2004-02-03 18:54:04 +00:00
|
|
|
return OpNum;
|
|
|
|
}
|
|
|
|
|
2003-08-24 19:19:47 +00:00
|
|
|
unsigned Op1r = getReg(Op1, MBB, IP);
|
2002-11-21 15:52:38 +00:00
|
|
|
switch (Class) {
|
2003-01-13 00:32:26 +00:00
|
|
|
default: assert(0 && "Unknown type class!");
|
2002-11-21 15:52:38 +00:00
|
|
|
// Emit: cmp <var1>, <var2> (do the comparison). We can
|
|
|
|
// compare 8-bit with 8-bit, 16-bit with 16-bit, 32-bit with
|
|
|
|
// 32-bit.
|
|
|
|
case cByte:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMP8rr, 2).addReg(Op0r).addReg(Op1r);
|
2002-11-21 15:52:38 +00:00
|
|
|
break;
|
|
|
|
case cShort:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMP16rr, 2).addReg(Op0r).addReg(Op1r);
|
2002-11-21 15:52:38 +00:00
|
|
|
break;
|
|
|
|
case cInt:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMP32rr, 2).addReg(Op0r).addReg(Op1r);
|
2002-11-21 15:52:38 +00:00
|
|
|
break;
|
2003-01-13 00:32:26 +00:00
|
|
|
case cFP:
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, X86::FpUCOM, 2).addReg(Op0r).addReg(Op1r);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::FNSTSW8r, 0);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SAHF, 1);
|
2002-11-21 15:52:38 +00:00
|
|
|
break;
|
2003-01-13 00:32:26 +00:00
|
|
|
|
2002-11-21 15:52:38 +00:00
|
|
|
case cLong:
|
2003-01-13 00:32:26 +00:00
|
|
|
if (OpNum < 2) { // seteq, setne
|
|
|
|
unsigned LoTmp = makeAnotherReg(Type::IntTy);
|
|
|
|
unsigned HiTmp = makeAnotherReg(Type::IntTy);
|
|
|
|
unsigned FinalTmp = makeAnotherReg(Type::IntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::XOR32rr, 2, LoTmp).addReg(Op0r).addReg(Op1r);
|
|
|
|
BuildMI(*MBB, IP, X86::XOR32rr, 2, HiTmp).addReg(Op0r+1).addReg(Op1r+1);
|
|
|
|
BuildMI(*MBB, IP, X86::OR32rr, 2, FinalTmp).addReg(LoTmp).addReg(HiTmp);
|
2003-01-13 00:32:26 +00:00
|
|
|
break; // Allow the sete or setne to be generated from flags set by OR
|
|
|
|
} else {
|
|
|
|
// Emit a sequence of code which compares the high and low parts once
|
|
|
|
// each, then uses a conditional move to handle the overflow case. For
|
|
|
|
// example, a setlt for long would generate code like this:
|
|
|
|
//
|
|
|
|
// AL = lo(op1) < lo(op2) // Signedness depends on operands
|
|
|
|
// BL = hi(op1) < hi(op2) // Always unsigned comparison
|
|
|
|
// dest = hi(op1) == hi(op2) ? AL : BL;
|
|
|
|
//
|
2002-11-21 15:52:38 +00:00
|
|
|
|
2003-01-16 16:43:00 +00:00
|
|
|
// FIXME: This would be much better if we had hierarchical register
|
2003-01-13 00:32:26 +00:00
|
|
|
// classes! Until then, hardcode registers so that we can deal with their
|
|
|
|
// aliases (because we don't have conditional byte moves).
|
|
|
|
//
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMP32rr, 2).addReg(Op0r).addReg(Op1r);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, SetCCOpcodeTab[0][OpNum], 0, X86::AL);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMP32rr, 2).addReg(Op0r+1).addReg(Op1r+1);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, SetCCOpcodeTab[CompTy->isSigned()][OpNum], 0, X86::BL);
|
|
|
|
BuildMI(*MBB, IP, X86::IMPLICIT_DEF, 0, X86::BH);
|
|
|
|
BuildMI(*MBB, IP, X86::IMPLICIT_DEF, 0, X86::AH);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMOVE16rr, 2, X86::BX).addReg(X86::BX)
|
2004-02-29 07:22:16 +00:00
|
|
|
.addReg(X86::AX);
|
2003-01-16 16:43:00 +00:00
|
|
|
// NOTE: visitSetCondInst knows that the value is dumped into the BL
|
|
|
|
// register at this point for long values...
|
2003-10-19 21:09:10 +00:00
|
|
|
return OpNum;
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
2002-11-21 15:52:38 +00:00
|
|
|
}
|
2003-10-19 21:09:10 +00:00
|
|
|
return OpNum;
|
2003-01-16 16:43:00 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// SetCC instructions - Here we just emit boilerplate code to set a byte-sized
|
|
|
|
/// register, then move it to wherever the result should be.
|
|
|
|
///
|
|
|
|
void ISel::visitSetCondInst(SetCondInst &I) {
|
2004-03-30 22:39:09 +00:00
|
|
|
if (canFoldSetCCIntoBranchOrSelect(&I))
|
|
|
|
return; // Fold this into a branch or select.
|
2003-01-16 16:43:00 +00:00
|
|
|
|
|
|
|
unsigned DestReg = getReg(I);
|
2003-08-24 19:19:47 +00:00
|
|
|
MachineBasicBlock::iterator MII = BB->end();
|
|
|
|
emitSetCCOperation(BB, MII, I.getOperand(0), I.getOperand(1), I.getOpcode(),
|
|
|
|
DestReg);
|
|
|
|
}
|
2002-11-21 15:52:38 +00:00
|
|
|
|
2003-08-24 19:19:47 +00:00
|
|
|
/// emitSetCCOperation - Common code shared between visitSetCondInst and
|
|
|
|
/// constant expression support.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2003-08-24 19:19:47 +00:00
|
|
|
void ISel::emitSetCCOperation(MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-08-24 19:19:47 +00:00
|
|
|
Value *Op0, Value *Op1, unsigned Opcode,
|
|
|
|
unsigned TargetReg) {
|
|
|
|
unsigned OpNum = getSetCCNumber(Opcode);
|
2003-10-19 21:09:10 +00:00
|
|
|
OpNum = EmitComparison(OpNum, Op0, Op1, MBB, IP);
|
2003-08-24 19:19:47 +00:00
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
const Type *CompTy = Op0->getType();
|
|
|
|
unsigned CompClass = getClassB(CompTy);
|
|
|
|
bool isSigned = CompTy->isSigned() && CompClass != cFP;
|
|
|
|
|
|
|
|
if (CompClass != cLong || OpNum < 2) {
|
2003-01-16 16:43:00 +00:00
|
|
|
// Handle normal comparisons with a setcc instruction...
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, SetCCOpcodeTab[isSigned][OpNum], 0, TargetReg);
|
2003-01-16 16:43:00 +00:00
|
|
|
} else {
|
|
|
|
// Handle long comparisons by copying the value which is already in BL into
|
|
|
|
// the register we want...
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV8rr, 1, TargetReg).addReg(X86::BL);
|
2003-01-16 16:43:00 +00:00
|
|
|
}
|
2002-11-07 17:59:21 +00:00
|
|
|
}
|
2002-11-02 19:45:49 +00:00
|
|
|
|
2004-03-30 21:22:00 +00:00
|
|
|
void ISel::visitSelectInst(SelectInst &SI) {
|
|
|
|
unsigned DestReg = getReg(SI);
|
|
|
|
MachineBasicBlock::iterator MII = BB->end();
|
|
|
|
emitSelectOperation(BB, MII, SI.getCondition(), SI.getTrueValue(),
|
|
|
|
SI.getFalseValue(), DestReg);
|
|
|
|
}
|
|
|
|
|
|
|
|
/// emitSelect - Common code shared between visitSelectInst and the constant
|
|
|
|
/// expression support.
|
|
|
|
void ISel::emitSelectOperation(MachineBasicBlock *MBB,
|
|
|
|
MachineBasicBlock::iterator IP,
|
|
|
|
Value *Cond, Value *TrueVal, Value *FalseVal,
|
|
|
|
unsigned DestReg) {
|
|
|
|
unsigned SelectClass = getClassB(TrueVal->getType());
|
|
|
|
|
|
|
|
// We don't support 8-bit conditional moves. If we have incoming constants,
|
|
|
|
// transform them into 16-bit constants to avoid having a run-time conversion.
|
|
|
|
if (SelectClass == cByte) {
|
|
|
|
if (Constant *T = dyn_cast<Constant>(TrueVal))
|
|
|
|
TrueVal = ConstantExpr::getCast(T, Type::ShortTy);
|
|
|
|
if (Constant *F = dyn_cast<Constant>(FalseVal))
|
|
|
|
FalseVal = ConstantExpr::getCast(F, Type::ShortTy);
|
|
|
|
}
|
|
|
|
|
2004-03-30 22:39:09 +00:00
|
|
|
|
|
|
|
unsigned Opcode;
|
|
|
|
if (SetCondInst *SCI = canFoldSetCCIntoBranchOrSelect(Cond)) {
|
|
|
|
// We successfully folded the setcc into the select instruction.
|
|
|
|
|
|
|
|
unsigned OpNum = getSetCCNumber(SCI->getOpcode());
|
|
|
|
OpNum = EmitComparison(OpNum, SCI->getOperand(0), SCI->getOperand(1), MBB,
|
|
|
|
IP);
|
|
|
|
|
|
|
|
const Type *CompTy = SCI->getOperand(0)->getType();
|
|
|
|
bool isSigned = CompTy->isSigned() && getClassB(CompTy) != cFP;
|
|
|
|
|
|
|
|
// LLVM -> X86 signed X86 unsigned
|
|
|
|
// ----- ---------- ------------
|
|
|
|
// seteq -> cmovNE cmovNE
|
|
|
|
// setne -> cmovE cmovE
|
|
|
|
// setlt -> cmovGE cmovAE
|
|
|
|
// setge -> cmovL cmovB
|
|
|
|
// setgt -> cmovLE cmovBE
|
|
|
|
// setle -> cmovG cmovA
|
|
|
|
// ----
|
|
|
|
// cmovNS // Used by comparison with 0 optimization
|
|
|
|
// cmovS
|
|
|
|
|
|
|
|
switch (SelectClass) {
|
|
|
|
default:
|
|
|
|
case cFP:
|
|
|
|
assert(0 && "We don't support floating point selects yet, they should "
|
|
|
|
"have been lowered!");
|
|
|
|
case cByte:
|
|
|
|
case cShort: {
|
|
|
|
static const unsigned OpcodeTab[2][8] = {
|
|
|
|
{ X86::CMOVNE16rr, X86::CMOVE16rr, X86::CMOVAE16rr, X86::CMOVB16rr,
|
|
|
|
X86::CMOVBE16rr, X86::CMOVA16rr, 0, 0 },
|
|
|
|
{ X86::CMOVNE16rr, X86::CMOVE16rr, X86::CMOVGE16rr, X86::CMOVL16rr,
|
|
|
|
X86::CMOVLE16rr, X86::CMOVG16rr, X86::CMOVNS16rr, X86::CMOVS16rr },
|
|
|
|
};
|
|
|
|
Opcode = OpcodeTab[isSigned][OpNum];
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case cInt:
|
|
|
|
case cLong: {
|
|
|
|
static const unsigned OpcodeTab[2][8] = {
|
|
|
|
{ X86::CMOVNE32rr, X86::CMOVE32rr, X86::CMOVAE32rr, X86::CMOVB32rr,
|
|
|
|
X86::CMOVBE32rr, X86::CMOVA32rr, 0, 0 },
|
|
|
|
{ X86::CMOVNE32rr, X86::CMOVE32rr, X86::CMOVGE32rr, X86::CMOVL32rr,
|
|
|
|
X86::CMOVLE32rr, X86::CMOVG32rr, X86::CMOVNS32rr, X86::CMOVS32rr },
|
|
|
|
};
|
|
|
|
Opcode = OpcodeTab[isSigned][OpNum];
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// Get the value being branched on, and use it to set the condition codes.
|
|
|
|
unsigned CondReg = getReg(Cond, MBB, IP);
|
|
|
|
BuildMI(*MBB, IP, X86::CMP8ri, 2).addReg(CondReg).addImm(0);
|
|
|
|
switch (SelectClass) {
|
|
|
|
default:
|
|
|
|
case cFP:
|
|
|
|
assert(0 && "We don't support floating point selects yet, they should "
|
|
|
|
"have been lowered!");
|
|
|
|
case cByte:
|
|
|
|
case cShort:
|
|
|
|
Opcode = X86::CMOVE16rr;
|
|
|
|
break;
|
|
|
|
case cInt:
|
|
|
|
case cLong:
|
|
|
|
Opcode = X86::CMOVE32rr;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2004-03-30 21:22:00 +00:00
|
|
|
|
|
|
|
unsigned TrueReg = getReg(TrueVal, MBB, IP);
|
|
|
|
unsigned FalseReg = getReg(FalseVal, MBB, IP);
|
|
|
|
unsigned RealDestReg = DestReg;
|
|
|
|
|
|
|
|
|
|
|
|
// Annoyingly enough, X86 doesn't HAVE 8-bit conditional moves. Because of
|
|
|
|
// this, we have to promote the incoming values to 16 bits, perform a 16-bit
|
|
|
|
// cmove, then truncate the result.
|
|
|
|
if (SelectClass == cByte) {
|
|
|
|
DestReg = makeAnotherReg(Type::ShortTy);
|
|
|
|
if (getClassB(TrueVal->getType()) == cByte) {
|
|
|
|
// Promote the true value, by storing it into AL, and reading from AX.
|
|
|
|
BuildMI(*MBB, IP, X86::MOV8rr, 1, X86::AL).addReg(TrueReg);
|
|
|
|
BuildMI(*MBB, IP, X86::MOV8ri, 1, X86::AH).addImm(0);
|
|
|
|
TrueReg = makeAnotherReg(Type::ShortTy);
|
|
|
|
BuildMI(*MBB, IP, X86::MOV16rr, 1, TrueReg).addReg(X86::AX);
|
|
|
|
}
|
|
|
|
if (getClassB(FalseVal->getType()) == cByte) {
|
|
|
|
// Promote the true value, by storing it into CL, and reading from CX.
|
|
|
|
BuildMI(*MBB, IP, X86::MOV8rr, 1, X86::CL).addReg(FalseReg);
|
|
|
|
BuildMI(*MBB, IP, X86::MOV8ri, 1, X86::CH).addImm(0);
|
|
|
|
FalseReg = makeAnotherReg(Type::ShortTy);
|
|
|
|
BuildMI(*MBB, IP, X86::MOV16rr, 1, FalseReg).addReg(X86::CX);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
BuildMI(*MBB, IP, Opcode, 2, DestReg).addReg(TrueReg).addReg(FalseReg);
|
|
|
|
|
|
|
|
switch (SelectClass) {
|
|
|
|
case cByte:
|
|
|
|
// We did the computation with 16-bit registers. Truncate back to our
|
|
|
|
// result by copying into AX then copying out AL.
|
|
|
|
BuildMI(*MBB, IP, X86::MOV16rr, 1, X86::AX).addReg(DestReg);
|
|
|
|
BuildMI(*MBB, IP, X86::MOV8rr, 1, RealDestReg).addReg(X86::AL);
|
|
|
|
break;
|
|
|
|
case cLong:
|
|
|
|
// Move the upper half of the value as well.
|
|
|
|
BuildMI(*MBB, IP, Opcode, 2,DestReg+1).addReg(TrueReg+1).addReg(FalseReg+1);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2003-08-24 19:19:47 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
2002-11-30 11:57:28 +00:00
|
|
|
/// promote32 - Emit instructions to turn a narrow operand into a 32-bit-wide
|
|
|
|
/// operand, in the specified target register.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2003-01-13 00:32:26 +00:00
|
|
|
void ISel::promote32(unsigned targetReg, const ValueRecord &VR) {
|
|
|
|
bool isUnsigned = VR.Ty->isUnsigned();
|
2003-08-04 02:12:48 +00:00
|
|
|
|
|
|
|
// Make sure we have the register number for this value...
|
|
|
|
unsigned Reg = VR.Val ? getReg(VR.Val) : VR.Reg;
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
switch (getClassB(VR.Ty)) {
|
2002-12-25 05:13:53 +00:00
|
|
|
case cByte:
|
|
|
|
// Extend value into target register (8->32)
|
|
|
|
if (isUnsigned)
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOVZX32rr8, 1, targetReg).addReg(Reg);
|
2002-12-25 05:13:53 +00:00
|
|
|
else
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOVSX32rr8, 1, targetReg).addReg(Reg);
|
2002-12-25 05:13:53 +00:00
|
|
|
break;
|
|
|
|
case cShort:
|
|
|
|
// Extend value into target register (16->32)
|
|
|
|
if (isUnsigned)
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOVZX32rr16, 1, targetReg).addReg(Reg);
|
2002-12-25 05:13:53 +00:00
|
|
|
else
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOVSX32rr16, 1, targetReg).addReg(Reg);
|
2002-12-25 05:13:53 +00:00
|
|
|
break;
|
|
|
|
case cInt:
|
|
|
|
// Move value into target register (32->32)
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, targetReg).addReg(Reg);
|
2002-12-25 05:13:53 +00:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
assert(0 && "Unpromotable operand class in promote32");
|
|
|
|
}
|
2002-11-30 11:57:28 +00:00
|
|
|
}
|
2002-10-27 21:16:59 +00:00
|
|
|
|
2002-10-25 22:55:53 +00:00
|
|
|
/// 'ret' instruction - Here we are interested in meeting the x86 ABI. As such,
|
|
|
|
/// we have the following possibilities:
|
|
|
|
///
|
|
|
|
/// ret void: No return value, simply emit a 'ret' instruction
|
|
|
|
/// ret sbyte, ubyte : Extend value into EAX and return
|
|
|
|
/// ret short, ushort: Extend value into EAX and return
|
|
|
|
/// ret int, uint : Move value into EAX and return
|
|
|
|
/// ret pointer : Move value into EAX and return
|
2002-11-17 21:56:38 +00:00
|
|
|
/// ret long, ulong : Move value into EAX/EDX and return
|
|
|
|
/// ret float/double : Top of FP stack
|
2002-10-25 22:55:53 +00:00
|
|
|
///
|
2003-01-13 00:32:26 +00:00
|
|
|
void ISel::visitReturnInst(ReturnInst &I) {
|
2002-12-25 05:13:53 +00:00
|
|
|
if (I.getNumOperands() == 0) {
|
|
|
|
BuildMI(BB, X86::RET, 0); // Just emit a 'ret' instruction
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
Value *RetVal = I.getOperand(0);
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned RetReg = getReg(RetVal);
|
|
|
|
switch (getClassB(RetVal->getType())) {
|
2002-12-25 05:13:53 +00:00
|
|
|
case cByte: // integral return values: extend or move into EAX and return
|
|
|
|
case cShort:
|
|
|
|
case cInt:
|
2003-01-13 00:32:26 +00:00
|
|
|
promote32(X86::EAX, ValueRecord(RetReg, RetVal->getType()));
|
2003-05-06 21:32:22 +00:00
|
|
|
// Declare that EAX is live on exit
|
2003-05-07 19:21:28 +00:00
|
|
|
BuildMI(BB, X86::IMPLICIT_USE, 2).addReg(X86::EAX).addReg(X86::ESP);
|
2002-12-25 05:13:53 +00:00
|
|
|
break;
|
|
|
|
case cFP: // Floats & Doubles: Return in ST(0)
|
2003-01-13 00:32:26 +00:00
|
|
|
BuildMI(BB, X86::FpSETRESULT, 1).addReg(RetReg);
|
2003-05-06 21:32:22 +00:00
|
|
|
// Declare that top-of-stack is live on exit
|
2003-05-07 19:21:28 +00:00
|
|
|
BuildMI(BB, X86::IMPLICIT_USE, 2).addReg(X86::ST0).addReg(X86::ESP);
|
2002-12-25 05:13:53 +00:00
|
|
|
break;
|
|
|
|
case cLong:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, X86::EAX).addReg(RetReg);
|
|
|
|
BuildMI(BB, X86::MOV32rr, 1, X86::EDX).addReg(RetReg+1);
|
2003-05-06 21:32:22 +00:00
|
|
|
// Declare that EAX & EDX are live on exit
|
2003-10-23 16:22:08 +00:00
|
|
|
BuildMI(BB, X86::IMPLICIT_USE, 3).addReg(X86::EAX).addReg(X86::EDX)
|
|
|
|
.addReg(X86::ESP);
|
2003-01-13 00:32:26 +00:00
|
|
|
break;
|
2002-12-25 05:13:53 +00:00
|
|
|
default:
|
2003-01-13 00:32:26 +00:00
|
|
|
visitInstruction(I);
|
2002-12-25 05:13:53 +00:00
|
|
|
}
|
2002-11-17 20:07:45 +00:00
|
|
|
// Emit a 'ret' instruction
|
2002-12-25 05:13:53 +00:00
|
|
|
BuildMI(BB, X86::RET, 0);
|
2002-10-25 22:55:53 +00:00
|
|
|
}
|
|
|
|
|
2003-01-16 18:07:23 +00:00
|
|
|
// getBlockAfter - Return the basic block which occurs lexically after the
|
|
|
|
// specified one.
|
|
|
|
static inline BasicBlock *getBlockAfter(BasicBlock *BB) {
|
|
|
|
Function::iterator I = BB; ++I; // Get iterator to next block
|
|
|
|
return I != BB->getParent()->end() ? &*I : 0;
|
|
|
|
}
|
|
|
|
|
2002-11-02 19:45:49 +00:00
|
|
|
/// visitBranchInst - Handle conditional and unconditional branches here. Note
|
|
|
|
/// that since code layout is frozen at this point, that if we are trying to
|
|
|
|
/// jump to a block that is the immediate successor of the current block, we can
|
2003-01-16 16:43:00 +00:00
|
|
|
/// just make a fall-through (but we don't currently).
|
2002-11-02 19:45:49 +00:00
|
|
|
///
|
2002-12-25 05:13:53 +00:00
|
|
|
void ISel::visitBranchInst(BranchInst &BI) {
|
2003-01-16 18:07:23 +00:00
|
|
|
BasicBlock *NextBB = getBlockAfter(BI.getParent()); // BB after current one
|
|
|
|
|
|
|
|
if (!BI.isConditional()) { // Unconditional branch?
|
2004-01-30 22:13:44 +00:00
|
|
|
if (BI.getSuccessor(0) != NextBB)
|
2003-01-16 18:07:23 +00:00
|
|
|
BuildMI(BB, X86::JMP, 1).addPCDisp(BI.getSuccessor(0));
|
2003-01-16 16:43:00 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// See if we can fold the setcc into the branch itself...
|
2004-03-30 22:39:09 +00:00
|
|
|
SetCondInst *SCI = canFoldSetCCIntoBranchOrSelect(BI.getCondition());
|
2003-01-16 16:43:00 +00:00
|
|
|
if (SCI == 0) {
|
|
|
|
// Nope, cannot fold setcc into this branch. Emit a branch on a condition
|
|
|
|
// computed some other way...
|
2002-12-28 20:24:02 +00:00
|
|
|
unsigned condReg = getReg(BI.getCondition());
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::CMP8ri, 2).addReg(condReg).addImm(0);
|
2003-01-16 18:07:23 +00:00
|
|
|
if (BI.getSuccessor(1) == NextBB) {
|
|
|
|
if (BI.getSuccessor(0) != NextBB)
|
|
|
|
BuildMI(BB, X86::JNE, 1).addPCDisp(BI.getSuccessor(0));
|
|
|
|
} else {
|
|
|
|
BuildMI(BB, X86::JE, 1).addPCDisp(BI.getSuccessor(1));
|
|
|
|
|
|
|
|
if (BI.getSuccessor(0) != NextBB)
|
|
|
|
BuildMI(BB, X86::JMP, 1).addPCDisp(BI.getSuccessor(0));
|
|
|
|
}
|
2003-01-16 16:43:00 +00:00
|
|
|
return;
|
2002-12-25 05:13:53 +00:00
|
|
|
}
|
2003-01-16 16:43:00 +00:00
|
|
|
|
|
|
|
unsigned OpNum = getSetCCNumber(SCI->getOpcode());
|
2003-08-24 19:19:47 +00:00
|
|
|
MachineBasicBlock::iterator MII = BB->end();
|
2003-10-23 16:22:08 +00:00
|
|
|
OpNum = EmitComparison(OpNum, SCI->getOperand(0), SCI->getOperand(1), BB,MII);
|
2003-10-19 21:09:10 +00:00
|
|
|
|
|
|
|
const Type *CompTy = SCI->getOperand(0)->getType();
|
|
|
|
bool isSigned = CompTy->isSigned() && getClassB(CompTy) != cFP;
|
2003-01-16 16:43:00 +00:00
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
|
2003-01-16 16:43:00 +00:00
|
|
|
// LLVM -> X86 signed X86 unsigned
|
|
|
|
// ----- ---------- ------------
|
|
|
|
// seteq -> je je
|
|
|
|
// setne -> jne jne
|
|
|
|
// setlt -> jl jb
|
2003-01-16 18:07:23 +00:00
|
|
|
// setge -> jge jae
|
2003-01-16 16:43:00 +00:00
|
|
|
// setgt -> jg ja
|
|
|
|
// setle -> jle jbe
|
2003-10-19 21:09:10 +00:00
|
|
|
// ----
|
|
|
|
// js // Used by comparison with 0 optimization
|
|
|
|
// jns
|
|
|
|
|
|
|
|
static const unsigned OpcodeTab[2][8] = {
|
|
|
|
{ X86::JE, X86::JNE, X86::JB, X86::JAE, X86::JA, X86::JBE, 0, 0 },
|
|
|
|
{ X86::JE, X86::JNE, X86::JL, X86::JGE, X86::JG, X86::JLE,
|
|
|
|
X86::JS, X86::JNS },
|
2003-01-16 16:43:00 +00:00
|
|
|
};
|
|
|
|
|
2003-01-16 18:07:23 +00:00
|
|
|
if (BI.getSuccessor(0) != NextBB) {
|
|
|
|
BuildMI(BB, OpcodeTab[isSigned][OpNum], 1).addPCDisp(BI.getSuccessor(0));
|
|
|
|
if (BI.getSuccessor(1) != NextBB)
|
|
|
|
BuildMI(BB, X86::JMP, 1).addPCDisp(BI.getSuccessor(1));
|
|
|
|
} else {
|
|
|
|
// Change to the inverse condition...
|
|
|
|
if (BI.getSuccessor(1) != NextBB) {
|
|
|
|
OpNum ^= 1;
|
|
|
|
BuildMI(BB, OpcodeTab[isSigned][OpNum], 1).addPCDisp(BI.getSuccessor(1));
|
|
|
|
}
|
|
|
|
}
|
2002-11-02 19:27:56 +00:00
|
|
|
}
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
/// doCall - This emits an abstract call instruction, setting up the arguments
|
|
|
|
/// and the return value as appropriate. For the actual function call itself,
|
|
|
|
/// it inserts the specified CallMI instruction into the stream.
|
|
|
|
///
|
|
|
|
void ISel::doCall(const ValueRecord &Ret, MachineInstr *CallMI,
|
2003-10-23 16:22:08 +00:00
|
|
|
const std::vector<ValueRecord> &Args) {
|
2003-01-13 00:32:26 +00:00
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
// Count how many bytes are to be pushed on the stack...
|
|
|
|
unsigned NumBytes = 0;
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
if (!Args.empty()) {
|
|
|
|
for (unsigned i = 0, e = Args.size(); i != e; ++i)
|
|
|
|
switch (getClassB(Args[i].Ty)) {
|
2002-12-28 20:24:02 +00:00
|
|
|
case cByte: case cShort: case cInt:
|
2003-10-23 16:22:08 +00:00
|
|
|
NumBytes += 4; break;
|
2002-12-28 20:24:02 +00:00
|
|
|
case cLong:
|
2003-10-23 16:22:08 +00:00
|
|
|
NumBytes += 8; break;
|
2002-12-28 20:24:02 +00:00
|
|
|
case cFP:
|
2003-10-23 16:22:08 +00:00
|
|
|
NumBytes += Args[i].Ty == Type::FloatTy ? 4 : 8;
|
|
|
|
break;
|
2002-12-28 20:24:02 +00:00
|
|
|
default: assert(0 && "Unknown class!");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Adjust the stack pointer for the new arguments...
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(BB, X86::ADJCALLSTACKDOWN, 1).addImm(NumBytes);
|
2002-12-28 20:24:02 +00:00
|
|
|
|
|
|
|
// Arguments go on the stack in reverse order, as specified by the ABI.
|
|
|
|
unsigned ArgOffset = 0;
|
2003-01-13 00:32:26 +00:00
|
|
|
for (unsigned i = 0, e = Args.size(); i != e; ++i) {
|
Fix a minor code-quality issue. When passing 8 and 16-bit integer constants
to function calls, we would emit dead code, like this:
int Y(int, short, double);
int X() {
Y(4, 123, 4);
}
--- Old
X:
sub %ESP, 20
mov %EAX, 4
mov DWORD PTR [%ESP], %EAX
*** mov %AX, 123
mov %AX, 123
movsx %EAX, %AX
mov DWORD PTR [%ESP + 4], %EAX
fld QWORD PTR [.CPIX_0]
fstp QWORD PTR [%ESP + 8]
call Y
mov %EAX, 0
# IMPLICIT_USE %EAX %ESP
add %ESP, 20
ret
Now we emit:
X:
sub %ESP, 20
mov %EAX, 4
mov DWORD PTR [%ESP], %EAX
mov %AX, 123
movsx %EAX, %AX
mov DWORD PTR [%ESP + 4], %EAX
fld QWORD PTR [.CPIX_0]
fstp QWORD PTR [%ESP + 8]
call Y
mov %EAX, 0
# IMPLICIT_USE %EAX %ESP
add %ESP, 20
ret
Next up, eliminate the mov AX and movsx entirely!
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@12026 91177308-0d34-0410-b5e6-96231b3b80d8
2004-03-01 02:34:08 +00:00
|
|
|
unsigned ArgReg;
|
2003-01-13 00:32:26 +00:00
|
|
|
switch (getClassB(Args[i].Ty)) {
|
2002-12-28 20:24:02 +00:00
|
|
|
case cByte:
|
2004-03-01 02:42:43 +00:00
|
|
|
case cShort:
|
|
|
|
if (Args[i].Val && isa<ConstantInt>(Args[i].Val)) {
|
|
|
|
// Zero/Sign extend constant, then stuff into memory.
|
|
|
|
ConstantInt *Val = cast<ConstantInt>(Args[i].Val);
|
|
|
|
Val = cast<ConstantInt>(ConstantExpr::getCast(Val, Type::IntTy));
|
|
|
|
addRegOffset(BuildMI(BB, X86::MOV32mi, 5), X86::ESP, ArgOffset)
|
|
|
|
.addImm(Val->getRawValue() & 0xFFFFFFFF);
|
|
|
|
} else {
|
|
|
|
// Promote arg to 32 bits wide into a temporary register...
|
|
|
|
ArgReg = makeAnotherReg(Type::UIntTy);
|
|
|
|
promote32(ArgReg, Args[i]);
|
|
|
|
addRegOffset(BuildMI(BB, X86::MOV32mr, 5),
|
|
|
|
X86::ESP, ArgOffset).addReg(ArgReg);
|
|
|
|
}
|
2003-10-23 16:22:08 +00:00
|
|
|
break;
|
2002-12-28 20:24:02 +00:00
|
|
|
case cInt:
|
2004-03-01 02:42:43 +00:00
|
|
|
if (Args[i].Val && isa<ConstantInt>(Args[i].Val)) {
|
|
|
|
unsigned Val = cast<ConstantInt>(Args[i].Val)->getRawValue();
|
|
|
|
addRegOffset(BuildMI(BB, X86::MOV32mi, 5),
|
|
|
|
X86::ESP, ArgOffset).addImm(Val);
|
|
|
|
} else {
|
|
|
|
ArgReg = Args[i].Val ? getReg(Args[i].Val) : Args[i].Reg;
|
|
|
|
addRegOffset(BuildMI(BB, X86::MOV32mr, 5),
|
|
|
|
X86::ESP, ArgOffset).addReg(ArgReg);
|
|
|
|
}
|
2003-10-23 16:22:08 +00:00
|
|
|
break;
|
2003-01-13 00:32:26 +00:00
|
|
|
case cLong:
|
Fix a minor code-quality issue. When passing 8 and 16-bit integer constants
to function calls, we would emit dead code, like this:
int Y(int, short, double);
int X() {
Y(4, 123, 4);
}
--- Old
X:
sub %ESP, 20
mov %EAX, 4
mov DWORD PTR [%ESP], %EAX
*** mov %AX, 123
mov %AX, 123
movsx %EAX, %AX
mov DWORD PTR [%ESP + 4], %EAX
fld QWORD PTR [.CPIX_0]
fstp QWORD PTR [%ESP + 8]
call Y
mov %EAX, 0
# IMPLICIT_USE %EAX %ESP
add %ESP, 20
ret
Now we emit:
X:
sub %ESP, 20
mov %EAX, 4
mov DWORD PTR [%ESP], %EAX
mov %AX, 123
movsx %EAX, %AX
mov DWORD PTR [%ESP + 4], %EAX
fld QWORD PTR [.CPIX_0]
fstp QWORD PTR [%ESP + 8]
call Y
mov %EAX, 0
# IMPLICIT_USE %EAX %ESP
add %ESP, 20
ret
Next up, eliminate the mov AX and movsx entirely!
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@12026 91177308-0d34-0410-b5e6-96231b3b80d8
2004-03-01 02:34:08 +00:00
|
|
|
ArgReg = Args[i].Val ? getReg(Args[i].Val) : Args[i].Reg;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addRegOffset(BuildMI(BB, X86::MOV32mr, 5),
|
2003-10-23 16:22:08 +00:00
|
|
|
X86::ESP, ArgOffset).addReg(ArgReg);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addRegOffset(BuildMI(BB, X86::MOV32mr, 5),
|
2003-10-23 16:22:08 +00:00
|
|
|
X86::ESP, ArgOffset+4).addReg(ArgReg+1);
|
|
|
|
ArgOffset += 4; // 8 byte entry, not 4.
|
|
|
|
break;
|
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
case cFP:
|
Fix a minor code-quality issue. When passing 8 and 16-bit integer constants
to function calls, we would emit dead code, like this:
int Y(int, short, double);
int X() {
Y(4, 123, 4);
}
--- Old
X:
sub %ESP, 20
mov %EAX, 4
mov DWORD PTR [%ESP], %EAX
*** mov %AX, 123
mov %AX, 123
movsx %EAX, %AX
mov DWORD PTR [%ESP + 4], %EAX
fld QWORD PTR [.CPIX_0]
fstp QWORD PTR [%ESP + 8]
call Y
mov %EAX, 0
# IMPLICIT_USE %EAX %ESP
add %ESP, 20
ret
Now we emit:
X:
sub %ESP, 20
mov %EAX, 4
mov DWORD PTR [%ESP], %EAX
mov %AX, 123
movsx %EAX, %AX
mov DWORD PTR [%ESP + 4], %EAX
fld QWORD PTR [.CPIX_0]
fstp QWORD PTR [%ESP + 8]
call Y
mov %EAX, 0
# IMPLICIT_USE %EAX %ESP
add %ESP, 20
ret
Next up, eliminate the mov AX and movsx entirely!
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@12026 91177308-0d34-0410-b5e6-96231b3b80d8
2004-03-01 02:34:08 +00:00
|
|
|
ArgReg = Args[i].Val ? getReg(Args[i].Val) : Args[i].Reg;
|
2003-10-23 16:22:08 +00:00
|
|
|
if (Args[i].Ty == Type::FloatTy) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addRegOffset(BuildMI(BB, X86::FST32m, 5),
|
2003-10-23 16:22:08 +00:00
|
|
|
X86::ESP, ArgOffset).addReg(ArgReg);
|
|
|
|
} else {
|
|
|
|
assert(Args[i].Ty == Type::DoubleTy && "Unknown FP type!");
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addRegOffset(BuildMI(BB, X86::FST64m, 5),
|
2003-10-23 16:22:08 +00:00
|
|
|
X86::ESP, ArgOffset).addReg(ArgReg);
|
|
|
|
ArgOffset += 4; // 8 byte entry, not 4.
|
|
|
|
}
|
|
|
|
break;
|
2002-12-28 20:24:02 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
default: assert(0 && "Unknown class!");
|
2002-12-28 20:24:02 +00:00
|
|
|
}
|
|
|
|
ArgOffset += 4;
|
2002-11-29 12:01:58 +00:00
|
|
|
}
|
2002-12-13 14:13:27 +00:00
|
|
|
} else {
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(BB, X86::ADJCALLSTACKDOWN, 1).addImm(0);
|
2002-12-13 14:13:27 +00:00
|
|
|
}
|
2002-12-04 19:22:53 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
BB->push_back(CallMI);
|
|
|
|
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(BB, X86::ADJCALLSTACKUP, 1).addImm(NumBytes);
|
2002-12-04 23:45:28 +00:00
|
|
|
|
|
|
|
// If there is a return value, scavenge the result from the location the call
|
|
|
|
// leaves it in...
|
|
|
|
//
|
2003-01-13 00:32:26 +00:00
|
|
|
if (Ret.Ty != Type::VoidTy) {
|
|
|
|
unsigned DestClass = getClassB(Ret.Ty);
|
|
|
|
switch (DestClass) {
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
case cByte:
|
|
|
|
case cShort:
|
|
|
|
case cInt: {
|
|
|
|
// Integral results are in %eax, or the appropriate portion
|
|
|
|
// thereof.
|
|
|
|
static const unsigned regRegMove[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::MOV8rr, X86::MOV16rr, X86::MOV32rr
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
};
|
|
|
|
static const unsigned AReg[] = { X86::AL, X86::AX, X86::EAX };
|
2003-01-13 00:32:26 +00:00
|
|
|
BuildMI(BB, regRegMove[DestClass], 1, Ret.Reg).addReg(AReg[DestClass]);
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
break;
|
|
|
|
}
|
2002-12-25 05:13:53 +00:00
|
|
|
case cFP: // Floating-point return values live in %ST(0)
|
2003-01-13 00:32:26 +00:00
|
|
|
BuildMI(BB, X86::FpGETRESULT, 1, Ret.Reg);
|
2002-12-04 23:50:28 +00:00
|
|
|
break;
|
2003-01-13 00:32:26 +00:00
|
|
|
case cLong: // Long values are left in EDX:EAX
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, Ret.Reg).addReg(X86::EAX);
|
|
|
|
BuildMI(BB, X86::MOV32rr, 1, Ret.Reg+1).addReg(X86::EDX);
|
2003-01-13 00:32:26 +00:00
|
|
|
break;
|
|
|
|
default: assert(0 && "Unknown class!");
|
2002-12-04 23:50:28 +00:00
|
|
|
}
|
2002-12-04 23:45:28 +00:00
|
|
|
}
|
2002-11-22 11:07:01 +00:00
|
|
|
}
|
2002-11-02 19:27:56 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
/// visitCallInst - Push args on stack and do a procedure call instruction.
|
|
|
|
void ISel::visitCallInst(CallInst &CI) {
|
|
|
|
MachineInstr *TheCall;
|
|
|
|
if (Function *F = CI.getCalledFunction()) {
|
2003-05-08 19:44:13 +00:00
|
|
|
// Is it an intrinsic function call?
|
2003-11-11 22:41:34 +00:00
|
|
|
if (Intrinsic::ID ID = (Intrinsic::ID)F->getIntrinsicID()) {
|
2003-05-08 19:44:13 +00:00
|
|
|
visitIntrinsicCall(ID, CI); // Special intrinsics are not handled here
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
// Emit a CALL instruction with PC-relative displacement.
|
|
|
|
TheCall = BuildMI(X86::CALLpcrel32, 1).addGlobalAddress(F, true);
|
|
|
|
} else { // Emit an indirect call...
|
|
|
|
unsigned Reg = getReg(CI.getCalledValue());
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
TheCall = BuildMI(X86::CALL32r, 1).addReg(Reg);
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
std::vector<ValueRecord> Args;
|
|
|
|
for (unsigned i = 1, e = CI.getNumOperands(); i != e; ++i)
|
2003-08-04 02:12:48 +00:00
|
|
|
Args.push_back(ValueRecord(CI.getOperand(i)));
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
unsigned DestReg = CI.getType() != Type::VoidTy ? getReg(CI) : 0;
|
|
|
|
doCall(ValueRecord(DestReg, CI.getType()), TheCall, Args);
|
2003-10-23 16:22:08 +00:00
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
|
2003-08-28 21:23:43 +00:00
|
|
|
|
2003-12-28 09:47:19 +00:00
|
|
|
/// LowerUnknownIntrinsicFunctionCalls - This performs a prepass over the
|
|
|
|
/// function, lowering any calls to unknown intrinsic functions into the
|
|
|
|
/// equivalent LLVM code.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2003-12-28 09:47:19 +00:00
|
|
|
void ISel::LowerUnknownIntrinsicFunctionCalls(Function &F) {
|
|
|
|
for (Function::iterator BB = F.begin(), E = F.end(); BB != E; ++BB)
|
|
|
|
for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; )
|
|
|
|
if (CallInst *CI = dyn_cast<CallInst>(I++))
|
|
|
|
if (Function *F = CI->getCalledFunction())
|
|
|
|
switch (F->getIntrinsicID()) {
|
2003-12-28 09:53:23 +00:00
|
|
|
case Intrinsic::not_intrinsic:
|
2004-03-13 00:24:00 +00:00
|
|
|
case Intrinsic::vastart:
|
|
|
|
case Intrinsic::vacopy:
|
|
|
|
case Intrinsic::vaend:
|
2004-02-15 01:04:03 +00:00
|
|
|
case Intrinsic::returnaddress:
|
|
|
|
case Intrinsic::frameaddress:
|
2004-02-12 17:53:22 +00:00
|
|
|
case Intrinsic::memcpy:
|
2004-02-14 04:46:05 +00:00
|
|
|
case Intrinsic::memset:
|
2003-12-28 09:47:19 +00:00
|
|
|
// We directly implement these intrinsics
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// All other intrinsic calls we must lower.
|
|
|
|
Instruction *Before = CI->getPrev();
|
2003-12-28 21:23:38 +00:00
|
|
|
TM.getIntrinsicLowering().LowerIntrinsicCall(CI);
|
2003-12-28 09:47:19 +00:00
|
|
|
if (Before) { // Move iterator to instruction after call
|
|
|
|
I = Before; ++I;
|
|
|
|
} else {
|
|
|
|
I = BB->begin();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2003-11-11 22:41:34 +00:00
|
|
|
void ISel::visitIntrinsicCall(Intrinsic::ID ID, CallInst &CI) {
|
2003-05-08 19:44:13 +00:00
|
|
|
unsigned TmpReg1, TmpReg2;
|
|
|
|
switch (ID) {
|
2004-03-13 00:24:52 +00:00
|
|
|
case Intrinsic::vastart:
|
2003-05-08 19:44:13 +00:00
|
|
|
// Get the address of the first vararg value...
|
2003-10-18 05:56:40 +00:00
|
|
|
TmpReg1 = getReg(CI);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(BB, X86::LEA32r, 5, TmpReg1), VarArgsFrameIndex);
|
2003-05-08 19:44:13 +00:00
|
|
|
return;
|
|
|
|
|
2004-03-13 00:24:52 +00:00
|
|
|
case Intrinsic::vacopy:
|
2003-10-18 05:56:40 +00:00
|
|
|
TmpReg1 = getReg(CI);
|
|
|
|
TmpReg2 = getReg(CI.getOperand(1));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, TmpReg1).addReg(TmpReg2);
|
2003-05-08 19:44:13 +00:00
|
|
|
return;
|
2004-03-13 00:24:52 +00:00
|
|
|
case Intrinsic::vaend: return; // Noop on X86
|
2003-05-08 19:44:13 +00:00
|
|
|
|
2004-02-15 01:04:03 +00:00
|
|
|
case Intrinsic::returnaddress:
|
|
|
|
case Intrinsic::frameaddress:
|
|
|
|
TmpReg1 = getReg(CI);
|
|
|
|
if (cast<Constant>(CI.getOperand(1))->isNullValue()) {
|
|
|
|
if (ID == Intrinsic::returnaddress) {
|
|
|
|
// Just load the return address
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(BB, X86::MOV32rm, 4, TmpReg1),
|
2004-02-15 01:04:03 +00:00
|
|
|
ReturnAddressIndex);
|
|
|
|
} else {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(BB, X86::LEA32r, 4, TmpReg1),
|
2004-02-15 01:04:03 +00:00
|
|
|
ReturnAddressIndex, -4);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// Values other than zero are not implemented yet.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32ri, 1, TmpReg1).addImm(0);
|
2004-02-15 01:04:03 +00:00
|
|
|
}
|
|
|
|
return;
|
|
|
|
|
2004-02-12 17:53:22 +00:00
|
|
|
case Intrinsic::memcpy: {
|
|
|
|
assert(CI.getNumOperands() == 5 && "Illegal llvm.memcpy call!");
|
|
|
|
unsigned Align = 1;
|
|
|
|
if (ConstantInt *AlignC = dyn_cast<ConstantInt>(CI.getOperand(4))) {
|
|
|
|
Align = AlignC->getRawValue();
|
|
|
|
if (Align == 0) Align = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Turn the byte code into # iterations
|
|
|
|
unsigned CountReg;
|
2004-02-14 04:46:05 +00:00
|
|
|
unsigned Opcode;
|
2004-02-12 17:53:22 +00:00
|
|
|
switch (Align & 3) {
|
|
|
|
case 2: // WORD aligned
|
2004-02-13 23:36:47 +00:00
|
|
|
if (ConstantInt *I = dyn_cast<ConstantInt>(CI.getOperand(3))) {
|
|
|
|
CountReg = getReg(ConstantUInt::get(Type::UIntTy, I->getRawValue()/2));
|
|
|
|
} else {
|
|
|
|
CountReg = makeAnotherReg(Type::IntTy);
|
2004-02-26 01:20:02 +00:00
|
|
|
unsigned ByteReg = getReg(CI.getOperand(3));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::SHR32ri, 2, CountReg).addReg(ByteReg).addImm(1);
|
2004-02-13 23:36:47 +00:00
|
|
|
}
|
2004-02-14 04:46:05 +00:00
|
|
|
Opcode = X86::REP_MOVSW;
|
2004-02-12 17:53:22 +00:00
|
|
|
break;
|
|
|
|
case 0: // DWORD aligned
|
2004-02-13 23:36:47 +00:00
|
|
|
if (ConstantInt *I = dyn_cast<ConstantInt>(CI.getOperand(3))) {
|
|
|
|
CountReg = getReg(ConstantUInt::get(Type::UIntTy, I->getRawValue()/4));
|
|
|
|
} else {
|
|
|
|
CountReg = makeAnotherReg(Type::IntTy);
|
2004-02-26 01:20:02 +00:00
|
|
|
unsigned ByteReg = getReg(CI.getOperand(3));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::SHR32ri, 2, CountReg).addReg(ByteReg).addImm(2);
|
2004-02-13 23:36:47 +00:00
|
|
|
}
|
2004-02-14 04:46:05 +00:00
|
|
|
Opcode = X86::REP_MOVSD;
|
2004-02-12 17:53:22 +00:00
|
|
|
break;
|
2004-02-26 01:20:02 +00:00
|
|
|
default: // BYTE aligned
|
2004-02-13 23:36:47 +00:00
|
|
|
CountReg = getReg(CI.getOperand(3));
|
2004-02-14 04:46:05 +00:00
|
|
|
Opcode = X86::REP_MOVSB;
|
2004-02-12 17:53:22 +00:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
// No matter what the alignment is, we put the source in ESI, the
|
|
|
|
// destination in EDI, and the count in ECX.
|
|
|
|
TmpReg1 = getReg(CI.getOperand(1));
|
|
|
|
TmpReg2 = getReg(CI.getOperand(2));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, X86::ECX).addReg(CountReg);
|
|
|
|
BuildMI(BB, X86::MOV32rr, 1, X86::EDI).addReg(TmpReg1);
|
|
|
|
BuildMI(BB, X86::MOV32rr, 1, X86::ESI).addReg(TmpReg2);
|
2004-02-14 04:46:05 +00:00
|
|
|
BuildMI(BB, Opcode, 0);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
case Intrinsic::memset: {
|
|
|
|
assert(CI.getNumOperands() == 5 && "Illegal llvm.memset call!");
|
|
|
|
unsigned Align = 1;
|
|
|
|
if (ConstantInt *AlignC = dyn_cast<ConstantInt>(CI.getOperand(4))) {
|
|
|
|
Align = AlignC->getRawValue();
|
|
|
|
if (Align == 0) Align = 1;
|
|
|
|
}
|
2004-02-12 17:53:22 +00:00
|
|
|
|
2004-02-14 04:46:05 +00:00
|
|
|
// Turn the byte code into # iterations
|
|
|
|
unsigned CountReg;
|
|
|
|
unsigned Opcode;
|
|
|
|
if (ConstantInt *ValC = dyn_cast<ConstantInt>(CI.getOperand(2))) {
|
|
|
|
unsigned Val = ValC->getRawValue() & 255;
|
|
|
|
|
|
|
|
// If the value is a constant, then we can potentially use larger copies.
|
|
|
|
switch (Align & 3) {
|
|
|
|
case 2: // WORD aligned
|
|
|
|
if (ConstantInt *I = dyn_cast<ConstantInt>(CI.getOperand(3))) {
|
2004-02-14 06:00:36 +00:00
|
|
|
CountReg =getReg(ConstantUInt::get(Type::UIntTy, I->getRawValue()/2));
|
2004-02-14 04:46:05 +00:00
|
|
|
} else {
|
|
|
|
CountReg = makeAnotherReg(Type::IntTy);
|
2004-02-26 01:20:02 +00:00
|
|
|
unsigned ByteReg = getReg(CI.getOperand(3));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::SHR32ri, 2, CountReg).addReg(ByteReg).addImm(1);
|
2004-02-14 04:46:05 +00:00
|
|
|
}
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV16ri, 1, X86::AX).addImm((Val << 8) | Val);
|
2004-02-14 04:46:05 +00:00
|
|
|
Opcode = X86::REP_STOSW;
|
|
|
|
break;
|
|
|
|
case 0: // DWORD aligned
|
|
|
|
if (ConstantInt *I = dyn_cast<ConstantInt>(CI.getOperand(3))) {
|
2004-02-14 06:00:36 +00:00
|
|
|
CountReg =getReg(ConstantUInt::get(Type::UIntTy, I->getRawValue()/4));
|
2004-02-14 04:46:05 +00:00
|
|
|
} else {
|
|
|
|
CountReg = makeAnotherReg(Type::IntTy);
|
2004-02-26 01:20:02 +00:00
|
|
|
unsigned ByteReg = getReg(CI.getOperand(3));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::SHR32ri, 2, CountReg).addReg(ByteReg).addImm(2);
|
2004-02-14 04:46:05 +00:00
|
|
|
}
|
|
|
|
Val = (Val << 8) | Val;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32ri, 1, X86::EAX).addImm((Val << 16) | Val);
|
2004-02-14 04:46:05 +00:00
|
|
|
Opcode = X86::REP_STOSD;
|
|
|
|
break;
|
2004-02-26 01:20:02 +00:00
|
|
|
default: // BYTE aligned
|
2004-02-14 04:46:05 +00:00
|
|
|
CountReg = getReg(CI.getOperand(3));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV8ri, 1, X86::AL).addImm(Val);
|
2004-02-14 04:46:05 +00:00
|
|
|
Opcode = X86::REP_STOSB;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// If it's not a constant value we are storing, just fall back. We could
|
|
|
|
// try to be clever to form 16 bit and 32 bit values, but we don't yet.
|
|
|
|
unsigned ValReg = getReg(CI.getOperand(2));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV8rr, 1, X86::AL).addReg(ValReg);
|
2004-02-14 04:46:05 +00:00
|
|
|
CountReg = getReg(CI.getOperand(3));
|
|
|
|
Opcode = X86::REP_STOSB;
|
2004-02-12 17:53:22 +00:00
|
|
|
}
|
|
|
|
|
2004-02-14 04:46:05 +00:00
|
|
|
// No matter what the alignment is, we put the source in ESI, the
|
|
|
|
// destination in EDI, and the count in ECX.
|
|
|
|
TmpReg1 = getReg(CI.getOperand(1));
|
|
|
|
//TmpReg2 = getReg(CI.getOperand(2));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, X86::ECX).addReg(CountReg);
|
|
|
|
BuildMI(BB, X86::MOV32rr, 1, X86::EDI).addReg(TmpReg1);
|
2004-02-14 04:46:05 +00:00
|
|
|
BuildMI(BB, Opcode, 0);
|
2004-02-12 17:53:22 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2003-12-28 09:47:19 +00:00
|
|
|
default: assert(0 && "Error: unknown intrinsics should have been lowered!");
|
2003-05-08 19:44:13 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
Implement folding explicit load instructions into binary operations. For a
testcase like this:
int %test(int* %P, int %A) {
%Pv = load int* %P
%B = add int %A, %Pv
ret int %B
}
We now generate:
test:
mov %ECX, DWORD PTR [%ESP + 4]
mov %EAX, DWORD PTR [%ESP + 8]
add %EAX, DWORD PTR [%ECX]
ret
Instead of:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
mov %EAX, DWORD PTR [%EAX]
add %EAX, %ECX
ret
... saving one instruction, and often a register. Note that there are a lot
of other instructions that could use this, but they aren't handled. I'm not
really interested in adding them, but mul/div and all of the FP instructions
could be supported as well if someone wanted to add them.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@12204 91177308-0d34-0410-b5e6-96231b3b80d8
2004-03-08 01:58:35 +00:00
|
|
|
static bool isSafeToFoldLoadIntoInstruction(LoadInst &LI, Instruction &User) {
|
|
|
|
if (LI.getParent() != User.getParent())
|
|
|
|
return false;
|
|
|
|
BasicBlock::iterator It = &LI;
|
|
|
|
// Check all of the instructions between the load and the user. We should
|
|
|
|
// really use alias analysis here, but for now we just do something simple.
|
|
|
|
for (++It; It != BasicBlock::iterator(&User); ++It) {
|
|
|
|
switch (It->getOpcode()) {
|
2004-03-18 06:29:54 +00:00
|
|
|
case Instruction::Free:
|
Implement folding explicit load instructions into binary operations. For a
testcase like this:
int %test(int* %P, int %A) {
%Pv = load int* %P
%B = add int %A, %Pv
ret int %B
}
We now generate:
test:
mov %ECX, DWORD PTR [%ESP + 4]
mov %EAX, DWORD PTR [%ESP + 8]
add %EAX, DWORD PTR [%ECX]
ret
Instead of:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
mov %EAX, DWORD PTR [%EAX]
add %EAX, %ECX
ret
... saving one instruction, and often a register. Note that there are a lot
of other instructions that could use this, but they aren't handled. I'm not
really interested in adding them, but mul/div and all of the FP instructions
could be supported as well if someone wanted to add them.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@12204 91177308-0d34-0410-b5e6-96231b3b80d8
2004-03-08 01:58:35 +00:00
|
|
|
case Instruction::Store:
|
|
|
|
case Instruction::Call:
|
|
|
|
case Instruction::Invoke:
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2003-05-08 19:44:13 +00:00
|
|
|
|
2003-05-08 20:49:25 +00:00
|
|
|
/// visitSimpleBinary - Implement simple binary operators for integral types...
|
|
|
|
/// OperatorClass is one of: 0 for Add, 1 for Sub, 2 for And, 3 for Or, 4 for
|
|
|
|
/// Xor.
|
2004-03-01 23:53:11 +00:00
|
|
|
///
|
2003-05-08 20:49:25 +00:00
|
|
|
void ISel::visitSimpleBinary(BinaryOperator &B, unsigned OperatorClass) {
|
|
|
|
unsigned DestReg = getReg(B);
|
|
|
|
MachineBasicBlock::iterator MI = BB->end();
|
2004-03-08 01:18:36 +00:00
|
|
|
Value *Op0 = B.getOperand(0), *Op1 = B.getOperand(1);
|
|
|
|
|
Implement folding explicit load instructions into binary operations. For a
testcase like this:
int %test(int* %P, int %A) {
%Pv = load int* %P
%B = add int %A, %Pv
ret int %B
}
We now generate:
test:
mov %ECX, DWORD PTR [%ESP + 4]
mov %EAX, DWORD PTR [%ESP + 8]
add %EAX, DWORD PTR [%ECX]
ret
Instead of:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
mov %EAX, DWORD PTR [%EAX]
add %EAX, %ECX
ret
... saving one instruction, and often a register. Note that there are a lot
of other instructions that could use this, but they aren't handled. I'm not
really interested in adding them, but mul/div and all of the FP instructions
could be supported as well if someone wanted to add them.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@12204 91177308-0d34-0410-b5e6-96231b3b80d8
2004-03-08 01:58:35 +00:00
|
|
|
// Special case: op Reg, load [mem]
|
|
|
|
if (isa<LoadInst>(Op0) && !isa<LoadInst>(Op1))
|
|
|
|
if (!B.swapOperands())
|
|
|
|
std::swap(Op0, Op1); // Make sure any loads are in the RHS.
|
|
|
|
|
|
|
|
unsigned Class = getClassB(B.getType());
|
|
|
|
if (isa<LoadInst>(Op1) && Class < cFP &&
|
|
|
|
isSafeToFoldLoadIntoInstruction(*cast<LoadInst>(Op1), B)) {
|
|
|
|
|
|
|
|
static const unsigned OpcodeTab[][3] = {
|
|
|
|
// Arithmetic operators
|
|
|
|
{ X86::ADD8rm, X86::ADD16rm, X86::ADD32rm }, // ADD
|
|
|
|
{ X86::SUB8rm, X86::SUB16rm, X86::SUB32rm }, // SUB
|
|
|
|
|
|
|
|
// Bitwise operators
|
|
|
|
{ X86::AND8rm, X86::AND16rm, X86::AND32rm }, // AND
|
|
|
|
{ X86:: OR8rm, X86:: OR16rm, X86:: OR32rm }, // OR
|
|
|
|
{ X86::XOR8rm, X86::XOR16rm, X86::XOR32rm }, // XOR
|
|
|
|
};
|
|
|
|
|
|
|
|
assert(Class < cFP && "General code handles 64-bit integer types!");
|
|
|
|
unsigned Opcode = OpcodeTab[OperatorClass][Class];
|
|
|
|
|
|
|
|
unsigned BaseReg, Scale, IndexReg, Disp;
|
|
|
|
getAddressingMode(cast<LoadInst>(Op1)->getOperand(0), BaseReg,
|
|
|
|
Scale, IndexReg, Disp);
|
|
|
|
|
|
|
|
unsigned Op0r = getReg(Op0);
|
|
|
|
addFullAddress(BuildMI(BB, Opcode, 2, DestReg).addReg(Op0r),
|
|
|
|
BaseReg, Scale, IndexReg, Disp);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2004-03-08 01:18:36 +00:00
|
|
|
emitSimpleBinaryOperation(BB, MI, Op0, Op1, OperatorClass, DestReg);
|
2003-05-08 20:49:25 +00:00
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
/// emitSimpleBinaryOperation - Implement simple binary operators for integral
|
|
|
|
/// types... OperatorClass is one of: 0 for Add, 1 for Sub, 2 for And, 3 for
|
|
|
|
/// Or, 4 for Xor.
|
2002-11-02 20:13:22 +00:00
|
|
|
///
|
2003-05-08 20:49:25 +00:00
|
|
|
/// emitSimpleBinaryOperation - Common code shared between visitSimpleBinary
|
|
|
|
/// and constant expression support.
|
2003-10-19 21:09:10 +00:00
|
|
|
///
|
|
|
|
void ISel::emitSimpleBinaryOperation(MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-05-08 20:49:25 +00:00
|
|
|
Value *Op0, Value *Op1,
|
2003-10-19 21:09:10 +00:00
|
|
|
unsigned OperatorClass, unsigned DestReg) {
|
2003-05-08 20:49:25 +00:00
|
|
|
unsigned Class = getClassB(Op0->getType());
|
2003-10-19 21:09:10 +00:00
|
|
|
|
|
|
|
// sub 0, X -> neg X
|
|
|
|
if (OperatorClass == 1 && Class != cLong)
|
2004-02-02 18:56:30 +00:00
|
|
|
if (ConstantInt *CI = dyn_cast<ConstantInt>(Op0)) {
|
2003-10-19 21:09:10 +00:00
|
|
|
if (CI->isNullValue()) {
|
|
|
|
unsigned op1Reg = getReg(Op1, MBB, IP);
|
|
|
|
switch (Class) {
|
|
|
|
default: assert(0 && "Unknown class for this function!");
|
|
|
|
case cByte:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::NEG8r, 1, DestReg).addReg(op1Reg);
|
2003-10-19 21:09:10 +00:00
|
|
|
return;
|
|
|
|
case cShort:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::NEG16r, 1, DestReg).addReg(op1Reg);
|
2003-10-19 21:09:10 +00:00
|
|
|
return;
|
|
|
|
case cInt:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::NEG32r, 1, DestReg).addReg(op1Reg);
|
2003-10-19 21:09:10 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2004-02-02 19:31:38 +00:00
|
|
|
} else if (ConstantFP *CFP = dyn_cast<ConstantFP>(Op0))
|
|
|
|
if (CFP->isExactlyValue(-0.0)) {
|
|
|
|
// -0.0 - X === -X
|
|
|
|
unsigned op1Reg = getReg(Op1, MBB, IP);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, X86::FCHS, 1, DestReg).addReg(op1Reg);
|
2004-02-02 19:31:38 +00:00
|
|
|
return;
|
|
|
|
}
|
2003-10-19 21:09:10 +00:00
|
|
|
|
2004-03-08 01:18:36 +00:00
|
|
|
// Special case: op Reg, <const>
|
|
|
|
if (Class != cLong && isa<ConstantInt>(Op1)) {
|
|
|
|
ConstantInt *Op1C = cast<ConstantInt>(Op1);
|
|
|
|
unsigned Op0r = getReg(Op0, MBB, IP);
|
|
|
|
|
|
|
|
// xor X, -1 -> not X
|
|
|
|
if (OperatorClass == 4 && Op1C->isAllOnesValue()) {
|
|
|
|
static unsigned const NOTTab[] = { X86::NOT8r, X86::NOT16r, X86::NOT32r };
|
|
|
|
BuildMI(*MBB, IP, NOTTab[Class], 1, DestReg).addReg(Op0r);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// add X, -1 -> dec X
|
|
|
|
if (OperatorClass == 0 && Op1C->isAllOnesValue()) {
|
|
|
|
static unsigned const DECTab[] = { X86::DEC8r, X86::DEC16r, X86::DEC32r };
|
|
|
|
BuildMI(*MBB, IP, DECTab[Class], 1, DestReg).addReg(Op0r);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// add X, 1 -> inc X
|
|
|
|
if (OperatorClass == 0 && Op1C->equalsInt(1)) {
|
|
|
|
static unsigned const DECTab[] = { X86::INC8r, X86::INC16r, X86::INC32r };
|
|
|
|
BuildMI(*MBB, IP, DECTab[Class], 1, DestReg).addReg(Op0r);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const unsigned OpcodeTab[][3] = {
|
2003-06-05 18:28:55 +00:00
|
|
|
// Arithmetic operators
|
2004-03-08 01:18:36 +00:00
|
|
|
{ X86::ADD8ri, X86::ADD16ri, X86::ADD32ri }, // ADD
|
|
|
|
{ X86::SUB8ri, X86::SUB16ri, X86::SUB32ri }, // SUB
|
|
|
|
|
2003-06-05 18:28:55 +00:00
|
|
|
// Bitwise operators
|
2004-03-08 01:18:36 +00:00
|
|
|
{ X86::AND8ri, X86::AND16ri, X86::AND32ri }, // AND
|
|
|
|
{ X86:: OR8ri, X86:: OR16ri, X86:: OR32ri }, // OR
|
|
|
|
{ X86::XOR8ri, X86::XOR16ri, X86::XOR32ri }, // XOR
|
2003-06-05 18:28:55 +00:00
|
|
|
};
|
2004-03-08 01:18:36 +00:00
|
|
|
|
|
|
|
assert(Class < cFP && "General code handles 64-bit integer types!");
|
2003-06-05 18:28:55 +00:00
|
|
|
unsigned Opcode = OpcodeTab[OperatorClass][Class];
|
2002-11-02 20:13:22 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
|
2004-03-08 01:18:36 +00:00
|
|
|
uint64_t Op1v = cast<ConstantInt>(Op1C)->getRawValue();
|
|
|
|
BuildMI(*MBB, IP, Opcode, 5, DestReg).addReg(Op0r).addImm(Op1v);
|
2003-10-19 21:09:10 +00:00
|
|
|
return;
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
2003-10-19 21:09:10 +00:00
|
|
|
|
2004-03-08 01:18:36 +00:00
|
|
|
// Finally, handle the general case now.
|
|
|
|
static const unsigned OpcodeTab[][4] = {
|
2003-10-19 21:09:10 +00:00
|
|
|
// Arithmetic operators
|
2004-03-08 01:18:36 +00:00
|
|
|
{ X86::ADD8rr, X86::ADD16rr, X86::ADD32rr, X86::FpADD }, // ADD
|
|
|
|
{ X86::SUB8rr, X86::SUB16rr, X86::SUB32rr, X86::FpSUB }, // SUB
|
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
// Bitwise operators
|
2004-03-08 01:18:36 +00:00
|
|
|
{ X86::AND8rr, X86::AND16rr, X86::AND32rr, 0 }, // AND
|
|
|
|
{ X86:: OR8rr, X86:: OR16rr, X86:: OR32rr, 0 }, // OR
|
|
|
|
{ X86::XOR8rr, X86::XOR16rr, X86::XOR32rr, 0 }, // XOR
|
2003-10-19 21:09:10 +00:00
|
|
|
};
|
2004-03-08 01:18:36 +00:00
|
|
|
|
|
|
|
bool isLong = false;
|
|
|
|
if (Class == cLong) {
|
|
|
|
isLong = true;
|
|
|
|
Class = cInt; // Bottom 32 bits are handled just like ints
|
|
|
|
}
|
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
unsigned Opcode = OpcodeTab[OperatorClass][Class];
|
2004-03-08 01:18:36 +00:00
|
|
|
assert(Opcode && "Floating point arguments to logical inst?");
|
|
|
|
unsigned Op0r = getReg(Op0, MBB, IP);
|
|
|
|
unsigned Op1r = getReg(Op1, MBB, IP);
|
|
|
|
BuildMI(*MBB, IP, Opcode, 2, DestReg).addReg(Op0r).addReg(Op1r);
|
|
|
|
|
|
|
|
if (isLong) { // Handle the upper 32 bits of long values...
|
|
|
|
static const unsigned TopTab[] = {
|
|
|
|
X86::ADC32rr, X86::SBB32rr, X86::AND32rr, X86::OR32rr, X86::XOR32rr
|
|
|
|
};
|
|
|
|
BuildMI(*MBB, IP, TopTab[OperatorClass], 2,
|
|
|
|
DestReg+1).addReg(Op0r+1).addReg(Op1r+1);
|
|
|
|
}
|
2002-11-02 20:04:26 +00:00
|
|
|
}
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
/// doMultiply - Emit appropriate instructions to multiply together the
|
|
|
|
/// registers op0Reg and op1Reg, and put the result in DestReg. The type of the
|
|
|
|
/// result should be given as DestTy.
|
|
|
|
///
|
2004-02-23 03:10:10 +00:00
|
|
|
void ISel::doMultiply(MachineBasicBlock *MBB, MachineBasicBlock::iterator MBBI,
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned DestReg, const Type *DestTy,
|
2002-12-16 19:32:50 +00:00
|
|
|
unsigned op0Reg, unsigned op1Reg) {
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned Class = getClass(DestTy);
|
2002-12-25 05:13:53 +00:00
|
|
|
switch (Class) {
|
|
|
|
case cFP: // Floating point multiply
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, MBBI, X86::FpMUL, 2, DestReg).addReg(op0Reg).addReg(op1Reg);
|
2002-12-25 05:13:53 +00:00
|
|
|
return;
|
2003-06-21 17:16:58 +00:00
|
|
|
case cInt:
|
|
|
|
case cShort:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, MBBI, Class == cInt ? X86::IMUL32rr:X86::IMUL16rr, 2, DestReg)
|
2003-06-21 17:16:58 +00:00
|
|
|
.addReg(op0Reg).addReg(op1Reg);
|
|
|
|
return;
|
|
|
|
case cByte:
|
|
|
|
// Must use the MUL instruction, which forces use of AL...
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, MBBI, X86::MOV8rr, 1, X86::AL).addReg(op0Reg);
|
|
|
|
BuildMI(*MBB, MBBI, X86::MUL8r, 1).addReg(op1Reg);
|
|
|
|
BuildMI(*MBB, MBBI, X86::MOV8rr, 1, DestReg).addReg(X86::AL);
|
2003-06-21 17:16:58 +00:00
|
|
|
return;
|
2002-12-25 05:13:53 +00:00
|
|
|
default:
|
2003-01-13 00:32:26 +00:00
|
|
|
case cLong: assert(0 && "doMultiply cannot operate on LONG values!");
|
2002-12-25 05:13:53 +00:00
|
|
|
}
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
}
|
|
|
|
|
2003-10-19 21:09:10 +00:00
|
|
|
// ExactLog2 - This function solves for (Val == 1 << (N-1)) and returns N. It
|
|
|
|
// returns zero when the input is not exactly a power of two.
|
|
|
|
static unsigned ExactLog2(unsigned Val) {
|
|
|
|
if (Val == 0) return 0;
|
|
|
|
unsigned Count = 0;
|
|
|
|
while (Val != 1) {
|
|
|
|
if (Val & 1) return 0;
|
|
|
|
Val >>= 1;
|
|
|
|
++Count;
|
|
|
|
}
|
|
|
|
return Count+1;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ISel::doMultiplyConst(MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-10-19 21:09:10 +00:00
|
|
|
unsigned DestReg, const Type *DestTy,
|
|
|
|
unsigned op0Reg, unsigned ConstRHS) {
|
|
|
|
unsigned Class = getClass(DestTy);
|
|
|
|
|
|
|
|
// If the element size is exactly a power of 2, use a shift to get it.
|
|
|
|
if (unsigned Shift = ExactLog2(ConstRHS)) {
|
|
|
|
switch (Class) {
|
|
|
|
default: assert(0 && "Unknown class for this function!");
|
|
|
|
case cByte:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SHL32ri,2, DestReg).addReg(op0Reg).addImm(Shift-1);
|
2003-10-19 21:09:10 +00:00
|
|
|
return;
|
|
|
|
case cShort:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SHL32ri,2, DestReg).addReg(op0Reg).addImm(Shift-1);
|
2003-10-19 21:09:10 +00:00
|
|
|
return;
|
|
|
|
case cInt:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SHL32ri,2, DestReg).addReg(op0Reg).addImm(Shift-1);
|
2003-10-19 21:09:10 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2003-10-20 03:42:58 +00:00
|
|
|
|
|
|
|
if (Class == cShort) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::IMUL16rri,2,DestReg).addReg(op0Reg).addImm(ConstRHS);
|
2003-10-20 03:42:58 +00:00
|
|
|
return;
|
|
|
|
} else if (Class == cInt) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::IMUL32rri,2,DestReg).addReg(op0Reg).addImm(ConstRHS);
|
2003-10-20 03:42:58 +00:00
|
|
|
return;
|
|
|
|
}
|
2003-10-19 21:09:10 +00:00
|
|
|
|
|
|
|
// Most general case, emit a normal multiply...
|
2004-02-17 06:16:44 +00:00
|
|
|
static const unsigned MOVriTab[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::MOV8ri, X86::MOV16ri, X86::MOV32ri
|
2003-10-19 21:09:10 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
unsigned TmpReg = makeAnotherReg(DestTy);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, MOVriTab[Class], 1, TmpReg).addImm(ConstRHS);
|
2003-10-19 21:09:10 +00:00
|
|
|
|
|
|
|
// Emit a MUL to multiply the register holding the index by
|
|
|
|
// elementSize, putting the result in OffsetReg.
|
|
|
|
doMultiply(MBB, IP, DestReg, DestTy, op0Reg, TmpReg);
|
|
|
|
}
|
|
|
|
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
/// visitMul - Multiplies are not simple binary operators because they must deal
|
|
|
|
/// with the EAX register explicitly.
|
|
|
|
///
|
|
|
|
void ISel::visitMul(BinaryOperator &I) {
|
2002-12-13 13:07:42 +00:00
|
|
|
unsigned Op0Reg = getReg(I.getOperand(0));
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned DestReg = getReg(I);
|
|
|
|
|
|
|
|
// Simple scalar multiply?
|
|
|
|
if (I.getType() != Type::LongTy && I.getType() != Type::ULongTy) {
|
2003-10-19 21:09:10 +00:00
|
|
|
if (ConstantInt *CI = dyn_cast<ConstantInt>(I.getOperand(1))) {
|
|
|
|
unsigned Val = (unsigned)CI->getRawValue(); // Cannot be 64-bit constant
|
|
|
|
MachineBasicBlock::iterator MBBI = BB->end();
|
|
|
|
doMultiplyConst(BB, MBBI, DestReg, I.getType(), Op0Reg, Val);
|
|
|
|
} else {
|
|
|
|
unsigned Op1Reg = getReg(I.getOperand(1));
|
|
|
|
MachineBasicBlock::iterator MBBI = BB->end();
|
|
|
|
doMultiply(BB, MBBI, DestReg, I.getType(), Op0Reg, Op1Reg);
|
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
} else {
|
2003-10-19 21:09:10 +00:00
|
|
|
unsigned Op1Reg = getReg(I.getOperand(1));
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
// Long value. We have to do things the hard way...
|
|
|
|
// Multiply the two low parts... capturing carry into EDX
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, X86::EAX).addReg(Op0Reg);
|
|
|
|
BuildMI(BB, X86::MUL32r, 1).addReg(Op1Reg); // AL*BL
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
unsigned OverflowReg = makeAnotherReg(Type::UIntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, DestReg).addReg(X86::EAX); // AL*BL
|
|
|
|
BuildMI(BB, X86::MOV32rr, 1, OverflowReg).addReg(X86::EDX); // AL*BL >> 32
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
MachineBasicBlock::iterator MBBI = BB->end();
|
2003-06-21 18:15:27 +00:00
|
|
|
unsigned AHBLReg = makeAnotherReg(Type::UIntTy); // AH*BL
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, MBBI, X86::IMUL32rr,2,AHBLReg).addReg(Op0Reg+1).addReg(Op1Reg);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
unsigned AHBLplusOverflowReg = makeAnotherReg(Type::UIntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, MBBI, X86::ADD32rr, 2, // AH*BL+(AL*BL >> 32)
|
2003-10-23 16:22:08 +00:00
|
|
|
AHBLplusOverflowReg).addReg(AHBLReg).addReg(OverflowReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
MBBI = BB->end();
|
2003-06-21 18:15:27 +00:00
|
|
|
unsigned ALBHReg = makeAnotherReg(Type::UIntTy); // AL*BH
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, MBBI, X86::IMUL32rr,2,ALBHReg).addReg(Op0Reg).addReg(Op1Reg+1);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, MBBI, X86::ADD32rr, 2, // AL*BH + AH*BL + (AL*BL >> 32)
|
2003-10-23 16:22:08 +00:00
|
|
|
DestReg+1).addReg(AHBLplusOverflowReg).addReg(ALBHReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
2002-11-02 20:54:46 +00:00
|
|
|
}
|
|
|
|
|
2002-11-17 21:56:38 +00:00
|
|
|
|
2002-11-02 20:54:46 +00:00
|
|
|
/// visitDivRem - Handle division and remainder instructions... these
|
|
|
|
/// instruction both require the same instructions to be generated, they just
|
|
|
|
/// select the result from a different register. Note that both of these
|
|
|
|
/// instructions work differently for signed and unsigned operands.
|
|
|
|
///
|
|
|
|
void ISel::visitDivRem(BinaryOperator &I) {
|
2003-10-23 17:21:43 +00:00
|
|
|
unsigned Op0Reg = getReg(I.getOperand(0));
|
|
|
|
unsigned Op1Reg = getReg(I.getOperand(1));
|
|
|
|
unsigned ResultReg = getReg(I);
|
|
|
|
|
|
|
|
MachineBasicBlock::iterator IP = BB->end();
|
|
|
|
emitDivRemOperation(BB, IP, Op0Reg, Op1Reg, I.getOpcode() == Instruction::Div,
|
|
|
|
I.getType(), ResultReg);
|
|
|
|
}
|
2002-12-25 05:13:53 +00:00
|
|
|
|
2003-10-23 17:21:43 +00:00
|
|
|
void ISel::emitDivRemOperation(MachineBasicBlock *BB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-10-23 17:21:43 +00:00
|
|
|
unsigned Op0Reg, unsigned Op1Reg, bool isDiv,
|
|
|
|
const Type *Ty, unsigned ResultReg) {
|
|
|
|
unsigned Class = getClass(Ty);
|
2002-12-25 05:13:53 +00:00
|
|
|
switch (Class) {
|
2003-01-13 00:32:26 +00:00
|
|
|
case cFP: // Floating point divide
|
2003-10-23 17:21:43 +00:00
|
|
|
if (isDiv) {
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, X86::FpDIV, 2, ResultReg).addReg(Op0Reg).addReg(Op1Reg);
|
2003-08-04 02:12:48 +00:00
|
|
|
} else { // Floating point remainder...
|
2003-01-13 00:32:26 +00:00
|
|
|
MachineInstr *TheCall =
|
2003-10-23 16:22:08 +00:00
|
|
|
BuildMI(X86::CALLpcrel32, 1).addExternalSymbol("fmod", true);
|
2003-01-13 00:32:26 +00:00
|
|
|
std::vector<ValueRecord> Args;
|
2003-10-23 17:21:43 +00:00
|
|
|
Args.push_back(ValueRecord(Op0Reg, Type::DoubleTy));
|
|
|
|
Args.push_back(ValueRecord(Op1Reg, Type::DoubleTy));
|
2003-01-13 00:32:26 +00:00
|
|
|
doCall(ValueRecord(ResultReg, Type::DoubleTy), TheCall, Args);
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
case cLong: {
|
|
|
|
static const char *FnName[] =
|
|
|
|
{ "__moddi3", "__divdi3", "__umoddi3", "__udivdi3" };
|
|
|
|
|
2003-10-23 17:21:43 +00:00
|
|
|
unsigned NameIdx = Ty->isUnsigned()*2 + isDiv;
|
2003-01-13 00:32:26 +00:00
|
|
|
MachineInstr *TheCall =
|
|
|
|
BuildMI(X86::CALLpcrel32, 1).addExternalSymbol(FnName[NameIdx], true);
|
|
|
|
|
|
|
|
std::vector<ValueRecord> Args;
|
2003-10-23 17:21:43 +00:00
|
|
|
Args.push_back(ValueRecord(Op0Reg, Type::LongTy));
|
|
|
|
Args.push_back(ValueRecord(Op1Reg, Type::LongTy));
|
2003-01-13 00:32:26 +00:00
|
|
|
doCall(ValueRecord(ResultReg, Type::LongTy), TheCall, Args);
|
2002-12-25 05:13:53 +00:00
|
|
|
return;
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
case cByte: case cShort: case cInt:
|
2003-10-10 17:57:28 +00:00
|
|
|
break; // Small integrals, handled below...
|
2003-01-13 00:32:26 +00:00
|
|
|
default: assert(0 && "Unknown class!");
|
2002-12-25 05:13:53 +00:00
|
|
|
}
|
2002-11-02 20:54:46 +00:00
|
|
|
|
|
|
|
static const unsigned Regs[] ={ X86::AL , X86::AX , X86::EAX };
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
static const unsigned MovOpcode[]={ X86::MOV8rr, X86::MOV16rr, X86::MOV32rr };
|
|
|
|
static const unsigned SarOpcode[]={ X86::SAR8ri, X86::SAR16ri, X86::SAR32ri };
|
|
|
|
static const unsigned ClrOpcode[]={ X86::MOV8ri, X86::MOV16ri, X86::MOV32ri };
|
2002-11-02 20:54:46 +00:00
|
|
|
static const unsigned ExtRegs[] ={ X86::AH , X86::DX , X86::EDX };
|
|
|
|
|
|
|
|
static const unsigned DivOpcode[][4] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
{ X86::DIV8r , X86::DIV16r , X86::DIV32r , 0 }, // Unsigned division
|
|
|
|
{ X86::IDIV8r, X86::IDIV16r, X86::IDIV32r, 0 }, // Signed division
|
2002-11-02 20:54:46 +00:00
|
|
|
};
|
2002-11-02 20:28:58 +00:00
|
|
|
|
2003-10-23 17:21:43 +00:00
|
|
|
bool isSigned = Ty->isSigned();
|
2002-11-02 20:54:46 +00:00
|
|
|
unsigned Reg = Regs[Class];
|
|
|
|
unsigned ExtReg = ExtRegs[Class];
|
|
|
|
|
|
|
|
// Put the first operand into one of the A registers...
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, MovOpcode[Class], 1, Reg).addReg(Op0Reg);
|
2002-11-02 20:54:46 +00:00
|
|
|
|
|
|
|
if (isSigned) {
|
|
|
|
// Emit a sign extension instruction...
|
2003-10-23 17:21:43 +00:00
|
|
|
unsigned ShiftResult = makeAnotherReg(Ty);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, SarOpcode[Class], 2,ShiftResult).addReg(Op0Reg).addImm(31);
|
|
|
|
BuildMI(*BB, IP, MovOpcode[Class], 1, ExtReg).addReg(ShiftResult);
|
2002-11-02 20:54:46 +00:00
|
|
|
} else {
|
2004-01-12 07:22:45 +00:00
|
|
|
// If unsigned, emit a zeroing instruction... (reg = 0)
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, ClrOpcode[Class], 2, ExtReg).addImm(0);
|
2002-11-02 20:54:46 +00:00
|
|
|
}
|
|
|
|
|
2002-11-17 21:56:38 +00:00
|
|
|
// Emit the appropriate divide or remainder instruction...
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, DivOpcode[isSigned][Class], 1).addReg(Op1Reg);
|
2002-11-17 21:56:38 +00:00
|
|
|
|
2002-11-02 20:54:46 +00:00
|
|
|
// Figure out which register we want to pick the result out of...
|
2003-10-23 17:21:43 +00:00
|
|
|
unsigned DestReg = isDiv ? Reg : ExtReg;
|
2002-11-02 20:54:46 +00:00
|
|
|
|
|
|
|
// Put the result into the destination register...
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, MovOpcode[Class], 1, ResultReg).addReg(DestReg);
|
2002-11-02 20:28:58 +00:00
|
|
|
}
|
2002-11-02 20:04:26 +00:00
|
|
|
|
2002-11-17 21:56:38 +00:00
|
|
|
|
2002-10-31 23:03:59 +00:00
|
|
|
/// Shift instructions: 'shl', 'sar', 'shr' - Some special cases here
|
|
|
|
/// for constant immediate shift values, and for constant immediate
|
|
|
|
/// shift values equal to 1. Even the general case is sort of special,
|
|
|
|
/// because the shift amount has to be in CL, not just any old register.
|
|
|
|
///
|
2003-01-13 00:32:26 +00:00
|
|
|
void ISel::visitShiftInst(ShiftInst &I) {
|
2003-11-22 06:49:41 +00:00
|
|
|
MachineBasicBlock::iterator IP = BB->end ();
|
|
|
|
emitShiftOperation (BB, IP, I.getOperand (0), I.getOperand (1),
|
|
|
|
I.getOpcode () == Instruction::Shl, I.getType (),
|
|
|
|
getReg (I));
|
|
|
|
}
|
|
|
|
|
|
|
|
/// emitShiftOperation - Common code shared between visitShiftInst and
|
|
|
|
/// constant expression support.
|
|
|
|
void ISel::emitShiftOperation(MachineBasicBlock *MBB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-11-22 06:49:41 +00:00
|
|
|
Value *Op, Value *ShiftAmount, bool isLeftShift,
|
|
|
|
const Type *ResultTy, unsigned DestReg) {
|
|
|
|
unsigned SrcReg = getReg (Op, MBB, IP);
|
|
|
|
bool isSigned = ResultTy->isSigned ();
|
|
|
|
unsigned Class = getClass (ResultTy);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
static const unsigned ConstantOperand[][4] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
{ X86::SHR8ri, X86::SHR16ri, X86::SHR32ri, X86::SHRD32rri8 }, // SHR
|
|
|
|
{ X86::SAR8ri, X86::SAR16ri, X86::SAR32ri, X86::SHRD32rri8 }, // SAR
|
|
|
|
{ X86::SHL8ri, X86::SHL16ri, X86::SHL32ri, X86::SHLD32rri8 }, // SHL
|
|
|
|
{ X86::SHL8ri, X86::SHL16ri, X86::SHL32ri, X86::SHLD32rri8 }, // SAL = SHL
|
2003-01-13 00:32:26 +00:00
|
|
|
};
|
2002-11-02 01:15:18 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
static const unsigned NonConstantOperand[][4] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
{ X86::SHR8rCL, X86::SHR16rCL, X86::SHR32rCL }, // SHR
|
|
|
|
{ X86::SAR8rCL, X86::SAR16rCL, X86::SAR32rCL }, // SAR
|
|
|
|
{ X86::SHL8rCL, X86::SHL16rCL, X86::SHL32rCL }, // SHL
|
|
|
|
{ X86::SHL8rCL, X86::SHL16rCL, X86::SHL32rCL }, // SAL = SHL
|
2003-01-13 00:32:26 +00:00
|
|
|
};
|
2002-11-02 01:15:18 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
// Longs, as usual, are handled specially...
|
|
|
|
if (Class == cLong) {
|
|
|
|
// If we have a constant shift, we can generate much more efficient code
|
|
|
|
// than otherwise...
|
|
|
|
//
|
2003-11-22 06:49:41 +00:00
|
|
|
if (ConstantUInt *CUI = dyn_cast<ConstantUInt>(ShiftAmount)) {
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned Amount = CUI->getValue();
|
|
|
|
if (Amount < 32) {
|
2003-10-23 16:22:08 +00:00
|
|
|
const unsigned *Opc = ConstantOperand[isLeftShift*2+isSigned];
|
|
|
|
if (isLeftShift) {
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, Opc[3], 3,
|
|
|
|
DestReg+1).addReg(SrcReg+1).addReg(SrcReg).addImm(Amount);
|
|
|
|
BuildMI(*MBB, IP, Opc[2], 2, DestReg).addReg(SrcReg).addImm(Amount);
|
2003-10-23 16:22:08 +00:00
|
|
|
} else {
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, Opc[3], 3,
|
|
|
|
DestReg).addReg(SrcReg ).addReg(SrcReg+1).addImm(Amount);
|
|
|
|
BuildMI(*MBB, IP, Opc[2],2,DestReg+1).addReg(SrcReg+1).addImm(Amount);
|
2003-10-23 16:22:08 +00:00
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
} else { // Shifting more than 32 bits
|
2003-10-23 16:22:08 +00:00
|
|
|
Amount -= 32;
|
|
|
|
if (isLeftShift) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SHL32ri, 2,
|
2004-02-29 07:22:16 +00:00
|
|
|
DestReg + 1).addReg(SrcReg).addImm(Amount);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32ri, 1,
|
2004-02-29 07:22:16 +00:00
|
|
|
DestReg).addImm(0);
|
2003-10-23 16:22:08 +00:00
|
|
|
} else {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
unsigned Opcode = isSigned ? X86::SAR32ri : X86::SHR32ri;
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, Opcode, 2, DestReg).addReg(SrcReg+1).addImm(Amount);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32ri, 1, DestReg+1).addImm(0);
|
2003-10-23 16:22:08 +00:00
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
} else {
|
2003-06-01 01:56:54 +00:00
|
|
|
unsigned TmpReg = makeAnotherReg(Type::IntTy);
|
|
|
|
|
|
|
|
if (!isLeftShift && isSigned) {
|
|
|
|
// If this is a SHR of a Long, then we need to do funny sign extension
|
|
|
|
// stuff. TmpReg gets the value to use as the high-part if we are
|
|
|
|
// shifting more than 32 bits.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SAR32ri, 2, TmpReg).addReg(SrcReg).addImm(31);
|
2003-06-01 01:56:54 +00:00
|
|
|
} else {
|
|
|
|
// Other shifts use a fixed zero value if the shift is more than 32
|
|
|
|
// bits.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32ri, 1, TmpReg).addImm(0);
|
2003-06-01 01:56:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Initialize CL with the shift amount...
|
2003-11-22 06:49:41 +00:00
|
|
|
unsigned ShiftAmountReg = getReg(ShiftAmount, MBB, IP);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV8rr, 1, X86::CL).addReg(ShiftAmountReg);
|
2003-06-01 01:56:54 +00:00
|
|
|
|
|
|
|
unsigned TmpReg2 = makeAnotherReg(Type::IntTy);
|
|
|
|
unsigned TmpReg3 = makeAnotherReg(Type::IntTy);
|
|
|
|
if (isLeftShift) {
|
|
|
|
// TmpReg2 = shld inHi, inLo
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SHLD32rrCL,2,TmpReg2).addReg(SrcReg+1)
|
2004-02-29 07:22:16 +00:00
|
|
|
.addReg(SrcReg);
|
2003-06-01 01:56:54 +00:00
|
|
|
// TmpReg3 = shl inLo, CL
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SHL32rCL, 1, TmpReg3).addReg(SrcReg);
|
2003-06-01 01:56:54 +00:00
|
|
|
|
|
|
|
// Set the flags to indicate whether the shift was by more than 32 bits.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::TEST8ri, 2).addReg(X86::CL).addImm(32);
|
2003-06-01 01:56:54 +00:00
|
|
|
|
|
|
|
// DestHi = (>32) ? TmpReg3 : TmpReg2;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMOVNE32rr, 2,
|
2003-06-01 01:56:54 +00:00
|
|
|
DestReg+1).addReg(TmpReg2).addReg(TmpReg3);
|
|
|
|
// DestLo = (>32) ? TmpReg : TmpReg3;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMOVNE32rr, 2,
|
2003-11-22 06:49:41 +00:00
|
|
|
DestReg).addReg(TmpReg3).addReg(TmpReg);
|
2003-06-01 01:56:54 +00:00
|
|
|
} else {
|
|
|
|
// TmpReg2 = shrd inLo, inHi
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::SHRD32rrCL,2,TmpReg2).addReg(SrcReg)
|
2004-02-29 07:22:16 +00:00
|
|
|
.addReg(SrcReg+1);
|
2003-06-01 01:56:54 +00:00
|
|
|
// TmpReg3 = s[ah]r inHi, CL
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, isSigned ? X86::SAR32rCL : X86::SHR32rCL, 1, TmpReg3)
|
2003-06-01 01:56:54 +00:00
|
|
|
.addReg(SrcReg+1);
|
|
|
|
|
|
|
|
// Set the flags to indicate whether the shift was by more than 32 bits.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::TEST8ri, 2).addReg(X86::CL).addImm(32);
|
2003-06-01 01:56:54 +00:00
|
|
|
|
|
|
|
// DestLo = (>32) ? TmpReg3 : TmpReg2;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMOVNE32rr, 2,
|
2003-06-01 01:56:54 +00:00
|
|
|
DestReg).addReg(TmpReg2).addReg(TmpReg3);
|
|
|
|
|
|
|
|
// DestHi = (>32) ? TmpReg : TmpReg3;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::CMOVNE32rr, 2,
|
2003-06-01 01:56:54 +00:00
|
|
|
DestReg+1).addReg(TmpReg3).addReg(TmpReg);
|
|
|
|
}
|
2002-10-31 23:03:59 +00:00
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
return;
|
|
|
|
}
|
2002-11-02 01:41:55 +00:00
|
|
|
|
2003-11-22 06:49:41 +00:00
|
|
|
if (ConstantUInt *CUI = dyn_cast<ConstantUInt>(ShiftAmount)) {
|
2003-01-13 00:32:26 +00:00
|
|
|
// The shift amount is constant, guaranteed to be a ubyte. Get its value.
|
|
|
|
assert(CUI->getType() == Type::UByteTy && "Shift amount not a ubyte?");
|
2002-11-02 01:15:18 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
const unsigned *Opc = ConstantOperand[isLeftShift*2+isSigned];
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, Opc[Class], 2,
|
|
|
|
DestReg).addReg(SrcReg).addImm(CUI->getValue());
|
2003-01-13 00:32:26 +00:00
|
|
|
} else { // The shift amount is non-constant.
|
2003-11-22 06:49:41 +00:00
|
|
|
unsigned ShiftAmountReg = getReg (ShiftAmount, MBB, IP);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV8rr, 1, X86::CL).addReg(ShiftAmountReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
const unsigned *Opc = NonConstantOperand[isLeftShift*2+isSigned];
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*MBB, IP, Opc[Class], 1, DestReg).addReg(SrcReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
}
|
2002-11-02 01:15:18 +00:00
|
|
|
|
|
|
|
|
2004-03-08 01:18:36 +00:00
|
|
|
void ISel::getAddressingMode(Value *Addr, unsigned &BaseReg, unsigned &Scale,
|
|
|
|
unsigned &IndexReg, unsigned &Disp) {
|
|
|
|
BaseReg = 0; Scale = 1; IndexReg = 0; Disp = 0;
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
if (GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(Addr)) {
|
|
|
|
if (isGEPFoldable(BB, GEP->getOperand(0), GEP->op_begin()+1, GEP->op_end(),
|
|
|
|
BaseReg, Scale, IndexReg, Disp))
|
2004-03-08 01:18:36 +00:00
|
|
|
return;
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
} else if (ConstantExpr *CE = dyn_cast<ConstantExpr>(Addr)) {
|
|
|
|
if (CE->getOpcode() == Instruction::GetElementPtr)
|
|
|
|
if (isGEPFoldable(BB, CE->getOperand(0), CE->op_begin()+1, CE->op_end(),
|
|
|
|
BaseReg, Scale, IndexReg, Disp))
|
2004-03-08 01:18:36 +00:00
|
|
|
return;
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
}
|
2002-12-24 00:03:11 +00:00
|
|
|
|
2004-03-08 01:18:36 +00:00
|
|
|
// If it's not foldable, reset addr mode.
|
|
|
|
BaseReg = getReg(Addr);
|
|
|
|
Scale = 1; IndexReg = 0; Disp = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// visitLoadInst - Implement LLVM load instructions in terms of the x86 'mov'
|
|
|
|
/// instruction. The load and store instructions are the only place where we
|
|
|
|
/// need to worry about the memory layout of the target machine.
|
|
|
|
///
|
|
|
|
void ISel::visitLoadInst(LoadInst &I) {
|
Implement folding explicit load instructions into binary operations. For a
testcase like this:
int %test(int* %P, int %A) {
%Pv = load int* %P
%B = add int %A, %Pv
ret int %B
}
We now generate:
test:
mov %ECX, DWORD PTR [%ESP + 4]
mov %EAX, DWORD PTR [%ESP + 8]
add %EAX, DWORD PTR [%ECX]
ret
Instead of:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
mov %EAX, DWORD PTR [%EAX]
add %EAX, %ECX
ret
... saving one instruction, and often a register. Note that there are a lot
of other instructions that could use this, but they aren't handled. I'm not
really interested in adding them, but mul/div and all of the FP instructions
could be supported as well if someone wanted to add them.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@12204 91177308-0d34-0410-b5e6-96231b3b80d8
2004-03-08 01:58:35 +00:00
|
|
|
// Check to see if this load instruction is going to be folded into a binary
|
|
|
|
// instruction, like add. If so, we don't want to emit it. Wouldn't a real
|
|
|
|
// pattern matching instruction selector be nice?
|
|
|
|
if (I.hasOneUse() && getClassB(I.getType()) < cFP) {
|
|
|
|
Instruction *User = cast<Instruction>(I.use_back());
|
|
|
|
switch (User->getOpcode()) {
|
|
|
|
default: User = 0; break;
|
|
|
|
case Instruction::Add:
|
|
|
|
case Instruction::Sub:
|
|
|
|
case Instruction::And:
|
|
|
|
case Instruction::Or:
|
|
|
|
case Instruction::Xor:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (User) {
|
|
|
|
// Okay, we found a user. If the load is the first operand and there is
|
|
|
|
// no second operand load, reverse the operand ordering. Note that this
|
|
|
|
// can fail for a subtract (ie, no change will be made).
|
|
|
|
if (!isa<LoadInst>(User->getOperand(1)))
|
|
|
|
cast<BinaryOperator>(User)->swapOperands();
|
|
|
|
|
|
|
|
// Okay, now that everything is set up, if this load is used by the second
|
|
|
|
// operand, and if there are no instructions that invalidate the load
|
|
|
|
// before the binary operator, eliminate the load.
|
|
|
|
if (User->getOperand(1) == &I &&
|
|
|
|
isSafeToFoldLoadIntoInstruction(I, *User))
|
|
|
|
return; // Eliminate the load!
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2004-03-08 01:18:36 +00:00
|
|
|
unsigned DestReg = getReg(I);
|
|
|
|
unsigned BaseReg = 0, Scale = 1, IndexReg = 0, Disp = 0;
|
|
|
|
getAddressingMode(I.getOperand(0), BaseReg, Scale, IndexReg, Disp);
|
2003-10-20 04:48:06 +00:00
|
|
|
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
unsigned Class = getClassB(I.getType());
|
2003-10-20 04:48:06 +00:00
|
|
|
if (Class == cLong) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFullAddress(BuildMI(BB, X86::MOV32rm, 4, DestReg),
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFullAddress(BuildMI(BB, X86::MOV32rm, 4, DestReg+1),
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp+4);
|
2002-12-25 05:13:53 +00:00
|
|
|
return;
|
|
|
|
}
|
2002-12-24 00:03:11 +00:00
|
|
|
|
2003-10-20 04:48:06 +00:00
|
|
|
static const unsigned Opcodes[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::MOV8rm, X86::MOV16rm, X86::MOV32rm, X86::FLD32m
|
2003-01-13 00:32:26 +00:00
|
|
|
};
|
2003-10-20 04:48:06 +00:00
|
|
|
unsigned Opcode = Opcodes[Class];
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
if (I.getType() == Type::DoubleTy) Opcode = X86::FLD64m;
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
addFullAddress(BuildMI(BB, Opcode, 4, DestReg),
|
|
|
|
BaseReg, Scale, IndexReg, Disp);
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
|
2002-11-17 21:11:55 +00:00
|
|
|
/// visitStoreInst - Implement LLVM store instructions in terms of the x86 'mov'
|
|
|
|
/// instruction.
|
|
|
|
///
|
|
|
|
void ISel::visitStoreInst(StoreInst &I) {
|
2004-03-08 01:18:36 +00:00
|
|
|
unsigned BaseReg, Scale, IndexReg, Disp;
|
|
|
|
getAddressingMode(I.getOperand(1), BaseReg, Scale, IndexReg, Disp);
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
|
2003-10-20 04:11:23 +00:00
|
|
|
const Type *ValTy = I.getOperand(0)->getType();
|
|
|
|
unsigned Class = getClassB(ValTy);
|
2003-10-20 04:48:06 +00:00
|
|
|
|
2004-02-25 02:56:58 +00:00
|
|
|
if (ConstantInt *CI = dyn_cast<ConstantInt>(I.getOperand(0))) {
|
|
|
|
uint64_t Val = CI->getRawValue();
|
|
|
|
if (Class == cLong) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFullAddress(BuildMI(BB, X86::MOV32mi, 5),
|
2004-02-29 07:22:16 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp).addImm(Val & ~0U);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFullAddress(BuildMI(BB, X86::MOV32mi, 5),
|
2004-02-29 07:22:16 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp+4).addImm(Val>>32);
|
2004-02-25 02:56:58 +00:00
|
|
|
} else {
|
|
|
|
static const unsigned Opcodes[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::MOV8mi, X86::MOV16mi, X86::MOV32mi
|
2004-02-25 02:56:58 +00:00
|
|
|
};
|
|
|
|
unsigned Opcode = Opcodes[Class];
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
addFullAddress(BuildMI(BB, Opcode, 5),
|
2004-02-29 07:22:16 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp).addImm(Val);
|
2004-02-25 02:56:58 +00:00
|
|
|
}
|
|
|
|
} else if (ConstantBool *CB = dyn_cast<ConstantBool>(I.getOperand(0))) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFullAddress(BuildMI(BB, X86::MOV8mi, 5),
|
2004-02-29 07:22:16 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp).addImm(CB->getValue());
|
2004-02-25 02:56:58 +00:00
|
|
|
} else {
|
|
|
|
if (Class == cLong) {
|
|
|
|
unsigned ValReg = getReg(I.getOperand(0));
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFullAddress(BuildMI(BB, X86::MOV32mr, 5),
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp).addReg(ValReg);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFullAddress(BuildMI(BB, X86::MOV32mr, 5),
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp+4).addReg(ValReg+1);
|
2004-02-25 02:56:58 +00:00
|
|
|
} else {
|
|
|
|
unsigned ValReg = getReg(I.getOperand(0));
|
|
|
|
static const unsigned Opcodes[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::MOV8mr, X86::MOV16mr, X86::MOV32mr, X86::FST32m
|
2004-02-25 02:56:58 +00:00
|
|
|
};
|
|
|
|
unsigned Opcode = Opcodes[Class];
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
if (ValTy == Type::DoubleTy) Opcode = X86::FST64m;
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
addFullAddress(BuildMI(BB, Opcode, 1+4),
|
|
|
|
BaseReg, Scale, IndexReg, Disp).addReg(ValReg);
|
2004-02-25 02:56:58 +00:00
|
|
|
}
|
2002-12-25 05:13:53 +00:00
|
|
|
}
|
2002-11-17 21:11:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2004-03-01 23:53:11 +00:00
|
|
|
/// visitCastInst - Here we have various kinds of copying with or without sign
|
|
|
|
/// extension going on.
|
|
|
|
///
|
2003-01-13 00:32:26 +00:00
|
|
|
void ISel::visitCastInst(CastInst &CI) {
|
2003-06-21 16:01:24 +00:00
|
|
|
Value *Op = CI.getOperand(0);
|
|
|
|
// If this is a cast from a 32-bit integer to a Long type, and the only uses
|
|
|
|
// of the case are GEP instructions, then the cast does not need to be
|
|
|
|
// generated explicitly, it will be folded into the GEP.
|
|
|
|
if (CI.getType() == Type::LongTy &&
|
|
|
|
(Op->getType() == Type::IntTy || Op->getType() == Type::UIntTy)) {
|
|
|
|
bool AllUsesAreGEPs = true;
|
|
|
|
for (Value::use_iterator I = CI.use_begin(), E = CI.use_end(); I != E; ++I)
|
|
|
|
if (!isa<GetElementPtrInst>(*I)) {
|
|
|
|
AllUsesAreGEPs = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
// No need to codegen this cast if all users are getelementptr instrs...
|
|
|
|
if (AllUsesAreGEPs) return;
|
|
|
|
}
|
|
|
|
|
2003-04-23 17:22:12 +00:00
|
|
|
unsigned DestReg = getReg(CI);
|
|
|
|
MachineBasicBlock::iterator MI = BB->end();
|
2003-06-21 16:01:24 +00:00
|
|
|
emitCastOperation(BB, MI, Op, CI.getType(), DestReg);
|
2003-04-23 17:22:12 +00:00
|
|
|
}
|
|
|
|
|
2004-03-01 23:53:11 +00:00
|
|
|
/// emitCastOperation - Common code shared between visitCastInst and constant
|
|
|
|
/// expression cast support.
|
|
|
|
///
|
2003-04-23 17:22:12 +00:00
|
|
|
void ISel::emitCastOperation(MachineBasicBlock *BB,
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2003-04-23 17:22:12 +00:00
|
|
|
Value *Src, const Type *DestTy,
|
|
|
|
unsigned DestReg) {
|
2003-04-23 17:57:48 +00:00
|
|
|
unsigned SrcReg = getReg(Src, BB, IP);
|
2003-01-13 00:32:26 +00:00
|
|
|
const Type *SrcTy = Src->getType();
|
|
|
|
unsigned SrcClass = getClassB(SrcTy);
|
|
|
|
unsigned DestClass = getClassB(DestTy);
|
|
|
|
|
|
|
|
// Implement casts to bool by using compare on the operand followed by set if
|
|
|
|
// not zero on the result.
|
|
|
|
if (DestTy == Type::BoolTy) {
|
2003-06-01 03:38:24 +00:00
|
|
|
switch (SrcClass) {
|
|
|
|
case cByte:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::TEST8rr, 2).addReg(SrcReg).addReg(SrcReg);
|
2003-06-01 03:38:24 +00:00
|
|
|
break;
|
|
|
|
case cShort:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::TEST16rr, 2).addReg(SrcReg).addReg(SrcReg);
|
2003-06-01 03:38:24 +00:00
|
|
|
break;
|
|
|
|
case cInt:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::TEST32rr, 2).addReg(SrcReg).addReg(SrcReg);
|
2003-06-01 03:38:24 +00:00
|
|
|
break;
|
|
|
|
case cLong: {
|
|
|
|
unsigned TmpReg = makeAnotherReg(Type::IntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::OR32rr, 2, TmpReg).addReg(SrcReg).addReg(SrcReg+1);
|
2003-06-01 03:38:24 +00:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
case cFP:
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, X86::FTST, 1).addReg(SrcReg);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::FNSTSW8r, 0);
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, X86::SAHF, 1);
|
2004-02-23 03:21:41 +00:00
|
|
|
break;
|
2003-06-01 03:38:24 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// If the zero flag is not set, then the value is true, set the byte to
|
|
|
|
// true.
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, X86::SETNEr, 1, DestReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
return;
|
|
|
|
}
|
2002-12-13 11:31:59 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
static const unsigned RegRegMove[] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
X86::MOV8rr, X86::MOV16rr, X86::MOV32rr, X86::FpMOV, X86::MOV32rr
|
2002-12-06 10:49:33 +00:00
|
|
|
};
|
2002-12-25 05:13:53 +00:00
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
// Implement casts between values of the same type class (as determined by
|
|
|
|
// getClass) by using a register-to-register move.
|
|
|
|
if (SrcClass == DestClass) {
|
|
|
|
if (SrcClass <= cInt || (SrcClass == cFP && SrcTy == DestTy)) {
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, RegRegMove[SrcClass], 1, DestReg).addReg(SrcReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
} else if (SrcClass == cFP) {
|
|
|
|
if (SrcTy == Type::FloatTy) { // double -> float
|
2003-10-23 16:22:08 +00:00
|
|
|
assert(DestTy == Type::DoubleTy && "Unknown cFP member!");
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, X86::FpMOV, 1, DestReg).addReg(SrcReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
} else { // float -> double
|
2003-10-23 16:22:08 +00:00
|
|
|
assert(SrcTy == Type::DoubleTy && DestTy == Type::FloatTy &&
|
|
|
|
"Unknown cFP member!");
|
|
|
|
// Truncate from double to float by storing to memory as short, then
|
|
|
|
// reading it back.
|
|
|
|
unsigned FltAlign = TM.getTargetData().getFloatAlignment();
|
2003-01-13 00:32:26 +00:00
|
|
|
int FrameIdx = F->getFrameInfo()->CreateStackObject(4, FltAlign);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::FST32m, 5), FrameIdx).addReg(SrcReg);
|
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::FLD32m, 5, DestReg), FrameIdx);
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
} else if (SrcClass == cLong) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::MOV32rr, 1, DestReg).addReg(SrcReg);
|
|
|
|
BuildMI(*BB, IP, X86::MOV32rr, 1, DestReg+1).addReg(SrcReg+1);
|
2003-01-13 00:32:26 +00:00
|
|
|
} else {
|
2003-05-12 20:16:58 +00:00
|
|
|
assert(0 && "Cannot handle this type of cast instruction!");
|
2003-04-23 17:22:12 +00:00
|
|
|
abort();
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
2002-12-25 05:13:53 +00:00
|
|
|
return;
|
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
// Handle cast of SMALLER int to LARGER int using a move with sign extension
|
|
|
|
// or zero extension, depending on whether the source type was signed.
|
|
|
|
if (SrcClass <= cInt && (DestClass <= cInt || DestClass == cLong) &&
|
|
|
|
SrcClass < DestClass) {
|
|
|
|
bool isLong = DestClass == cLong;
|
|
|
|
if (isLong) DestClass = cInt;
|
|
|
|
|
|
|
|
static const unsigned Opc[][4] = {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
{ X86::MOVSX16rr8, X86::MOVSX32rr8, X86::MOVSX32rr16, X86::MOV32rr }, // s
|
|
|
|
{ X86::MOVZX16rr8, X86::MOVZX32rr8, X86::MOVZX32rr16, X86::MOV32rr } // u
|
2003-01-13 00:32:26 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
bool isUnsigned = SrcTy->isUnsigned();
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, Opc[isUnsigned][SrcClass + DestClass - 1], 1,
|
2003-04-23 17:22:12 +00:00
|
|
|
DestReg).addReg(SrcReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
if (isLong) { // Handle upper 32 bits as appropriate...
|
|
|
|
if (isUnsigned) // Zero out top bits...
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::MOV32ri, 1, DestReg+1).addImm(0);
|
2003-01-13 00:32:26 +00:00
|
|
|
else // Sign extend bottom half...
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::SAR32ri, 2, DestReg+1).addReg(DestReg).addImm(31);
|
2002-12-06 10:49:33 +00:00
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Special case long -> int ...
|
|
|
|
if (SrcClass == cLong && DestClass == cInt) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::MOV32rr, 1, DestReg).addReg(SrcReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Handle cast of LARGER int to SMALLER int using a move to EAX followed by a
|
|
|
|
// move out of AX or AL.
|
|
|
|
if ((SrcClass <= cInt || SrcClass == cLong) && DestClass <= cInt
|
|
|
|
&& SrcClass > DestClass) {
|
|
|
|
static const unsigned AReg[] = { X86::AL, X86::AX, X86::EAX, 0, X86::EAX };
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, RegRegMove[SrcClass], 1, AReg[SrcClass]).addReg(SrcReg);
|
|
|
|
BuildMI(*BB, IP, RegRegMove[DestClass], 1, DestReg).addReg(AReg[DestClass]);
|
2003-01-13 00:32:26 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Handle casts from integer to floating point now...
|
|
|
|
if (DestClass == cFP) {
|
2003-05-12 20:36:13 +00:00
|
|
|
// Promote the integer to a type supported by FLD. We do this because there
|
|
|
|
// are no unsigned FLD instructions, so we must promote an unsigned value to
|
|
|
|
// a larger signed value, then use FLD on the larger value.
|
|
|
|
//
|
|
|
|
const Type *PromoteType = 0;
|
|
|
|
unsigned PromoteOpcode;
|
2004-02-23 03:10:10 +00:00
|
|
|
unsigned RealDestReg = DestReg;
|
2003-05-12 20:36:13 +00:00
|
|
|
switch (SrcTy->getPrimitiveID()) {
|
|
|
|
case Type::BoolTyID:
|
|
|
|
case Type::SByteTyID:
|
|
|
|
// We don't have the facilities for directly loading byte sized data from
|
|
|
|
// memory (even signed). Promote it to 16 bits.
|
|
|
|
PromoteType = Type::ShortTy;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
PromoteOpcode = X86::MOVSX16rr8;
|
2003-05-12 20:36:13 +00:00
|
|
|
break;
|
|
|
|
case Type::UByteTyID:
|
|
|
|
PromoteType = Type::ShortTy;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
PromoteOpcode = X86::MOVZX16rr8;
|
2003-05-12 20:36:13 +00:00
|
|
|
break;
|
|
|
|
case Type::UShortTyID:
|
|
|
|
PromoteType = Type::IntTy;
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
PromoteOpcode = X86::MOVZX32rr16;
|
2003-05-12 20:36:13 +00:00
|
|
|
break;
|
|
|
|
case Type::UIntTyID: {
|
|
|
|
// Make a 64 bit temporary... and zero out the top of it...
|
|
|
|
unsigned TmpReg = makeAnotherReg(Type::LongTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::MOV32rr, 1, TmpReg).addReg(SrcReg);
|
|
|
|
BuildMI(*BB, IP, X86::MOV32ri, 1, TmpReg+1).addImm(0);
|
2003-05-12 20:36:13 +00:00
|
|
|
SrcTy = Type::LongTy;
|
|
|
|
SrcClass = cLong;
|
|
|
|
SrcReg = TmpReg;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Type::ULongTyID:
|
2004-02-23 03:10:10 +00:00
|
|
|
// Don't fild into the read destination.
|
|
|
|
DestReg = makeAnotherReg(Type::DoubleTy);
|
|
|
|
break;
|
2003-05-12 20:36:13 +00:00
|
|
|
default: // No promotion needed...
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (PromoteType) {
|
|
|
|
unsigned TmpReg = makeAnotherReg(PromoteType);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
unsigned Opc = SrcTy->isSigned() ? X86::MOVSX16rr8 : X86::MOVZX16rr8;
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, Opc, 1, TmpReg).addReg(SrcReg);
|
2003-05-12 20:36:13 +00:00
|
|
|
SrcTy = PromoteType;
|
|
|
|
SrcClass = getClass(PromoteType);
|
2003-01-13 00:32:26 +00:00
|
|
|
SrcReg = TmpReg;
|
2002-12-06 10:49:33 +00:00
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
// Spill the integer to memory and reload it from there...
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
int FrameIdx =
|
|
|
|
F->getFrameInfo()->CreateStackObject(SrcTy, TM.getTargetData());
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
if (SrcClass == cLong) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::MOV32mr, 5),
|
2004-02-29 07:22:16 +00:00
|
|
|
FrameIdx).addReg(SrcReg);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::MOV32mr, 5),
|
2003-10-23 16:22:08 +00:00
|
|
|
FrameIdx, 4).addReg(SrcReg+1);
|
2003-01-13 00:32:26 +00:00
|
|
|
} else {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
static const unsigned Op1[] = { X86::MOV8mr, X86::MOV16mr, X86::MOV32mr };
|
2004-02-29 07:22:16 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, Op1[SrcClass], 5),
|
|
|
|
FrameIdx).addReg(SrcReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static const unsigned Op2[] =
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
{ 0/*byte*/, X86::FILD16m, X86::FILD32m, 0/*FP*/, X86::FILD64m };
|
2004-02-29 07:22:16 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, Op2[SrcClass], 5, DestReg), FrameIdx);
|
2004-02-23 03:10:10 +00:00
|
|
|
|
|
|
|
// We need special handling for unsigned 64-bit integer sources. If the
|
|
|
|
// input number has the "sign bit" set, then we loaded it incorrectly as a
|
|
|
|
// negative 64-bit number. In this case, add an offset value.
|
|
|
|
if (SrcTy == Type::ULongTy) {
|
|
|
|
// Emit a test instruction to see if the dynamic input value was signed.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::TEST32rr, 2).addReg(SrcReg+1).addReg(SrcReg+1);
|
2004-02-23 03:10:10 +00:00
|
|
|
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
// If the sign bit is set, get a pointer to an offset, otherwise get a
|
|
|
|
// pointer to a zero.
|
2004-02-23 03:10:10 +00:00
|
|
|
MachineConstantPool *CP = F->getConstantPool();
|
|
|
|
unsigned Zero = makeAnotherReg(Type::IntTy);
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
Constant *Null = Constant::getNullValue(Type::UIntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addConstantPoolReference(BuildMI(*BB, IP, X86::LEA32r, 5, Zero),
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
CP->getConstantPoolIndex(Null));
|
2004-02-23 03:10:10 +00:00
|
|
|
unsigned Offset = makeAnotherReg(Type::IntTy);
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
Constant *OffsetCst = ConstantUInt::get(Type::UIntTy, 0x5f800000);
|
|
|
|
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addConstantPoolReference(BuildMI(*BB, IP, X86::LEA32r, 5, Offset),
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
CP->getConstantPoolIndex(OffsetCst));
|
2004-02-23 03:10:10 +00:00
|
|
|
unsigned Addr = makeAnotherReg(Type::IntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*BB, IP, X86::CMOVS32rr, 2, Addr).addReg(Zero).addReg(Offset);
|
2004-02-23 03:10:10 +00:00
|
|
|
|
|
|
|
// Load the constant for an add. FIXME: this could make an 'fadd' that
|
|
|
|
// reads directly from memory, but we don't support these yet.
|
|
|
|
unsigned ConstReg = makeAnotherReg(Type::DoubleTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addDirectMem(BuildMI(*BB, IP, X86::FLD32m, 4, ConstReg), Addr);
|
2004-02-23 03:10:10 +00:00
|
|
|
|
2004-02-29 07:22:16 +00:00
|
|
|
BuildMI(*BB, IP, X86::FpADD, 2, RealDestReg)
|
|
|
|
.addReg(ConstReg).addReg(DestReg);
|
2004-02-23 03:10:10 +00:00
|
|
|
}
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Handle casts from floating point to integer now...
|
|
|
|
if (SrcClass == cFP) {
|
|
|
|
// Change the floating point control register to use "round towards zero"
|
|
|
|
// mode when truncating to an integer value.
|
|
|
|
//
|
|
|
|
int CWFrameIdx = F->getFrameInfo()->CreateStackObject(2, 2);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::FNSTCW16m, 4), CWFrameIdx);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
// Load the old value of the high byte of the control word...
|
|
|
|
unsigned HighPartOfCW = makeAnotherReg(Type::UByteTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::MOV8rm, 4, HighPartOfCW),
|
2004-02-29 07:22:16 +00:00
|
|
|
CWFrameIdx, 1);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
// Set the high part to be round to zero...
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::MOV8mi, 5),
|
2004-02-29 07:22:16 +00:00
|
|
|
CWFrameIdx, 1).addImm(12);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
// Reload the modified control word now...
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::FLDCW16m, 4), CWFrameIdx);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
// Restore the memory image of control word to original value
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::MOV8mr, 5),
|
2003-10-23 16:22:08 +00:00
|
|
|
CWFrameIdx, 1).addReg(HighPartOfCW);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
// We don't have the facilities for directly storing byte sized data to
|
|
|
|
// memory. Promote it to 16 bits. We also must promote unsigned values to
|
|
|
|
// larger classes because we only have signed FP stores.
|
|
|
|
unsigned StoreClass = DestClass;
|
|
|
|
const Type *StoreTy = DestTy;
|
|
|
|
if (StoreClass == cByte || DestTy->isUnsigned())
|
|
|
|
switch (StoreClass) {
|
|
|
|
case cByte: StoreTy = Type::ShortTy; StoreClass = cShort; break;
|
|
|
|
case cShort: StoreTy = Type::IntTy; StoreClass = cInt; break;
|
|
|
|
case cInt: StoreTy = Type::LongTy; StoreClass = cLong; break;
|
2003-07-18 20:23:43 +00:00
|
|
|
// The following treatment of cLong may not be perfectly right,
|
|
|
|
// but it survives chains of casts of the form
|
|
|
|
// double->ulong->double.
|
|
|
|
case cLong: StoreTy = Type::LongTy; StoreClass = cLong; break;
|
2003-01-13 00:32:26 +00:00
|
|
|
default: assert(0 && "Unknown store class!");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Spill the integer to memory and reload it from there...
|
|
|
|
int FrameIdx =
|
|
|
|
F->getFrameInfo()->CreateStackObject(StoreTy, TM.getTargetData());
|
|
|
|
|
|
|
|
static const unsigned Op1[] =
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
{ 0, X86::FIST16m, X86::FIST32m, 0, X86::FISTP64m };
|
2004-02-29 07:22:16 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, Op1[StoreClass], 5),
|
|
|
|
FrameIdx).addReg(SrcReg);
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
if (DestClass == cLong) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::MOV32rm, 4, DestReg), FrameIdx);
|
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::MOV32rm, 4, DestReg+1),
|
2004-02-29 07:22:16 +00:00
|
|
|
FrameIdx, 4);
|
2003-01-13 00:32:26 +00:00
|
|
|
} else {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
static const unsigned Op2[] = { X86::MOV8rm, X86::MOV16rm, X86::MOV32rm };
|
2004-02-29 07:22:16 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, Op2[DestClass], 4, DestReg), FrameIdx);
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Reload the original control word now...
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(*BB, IP, X86::FLDCW16m, 4), CWFrameIdx);
|
2003-01-13 00:32:26 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2002-12-06 10:49:33 +00:00
|
|
|
// Anything we haven't handled already, we can't (yet) handle at all.
|
2003-05-12 20:16:58 +00:00
|
|
|
assert(0 && "Unhandled cast instruction!");
|
2003-04-23 17:22:12 +00:00
|
|
|
abort();
|
2002-11-22 11:07:01 +00:00
|
|
|
}
|
2002-10-31 23:03:59 +00:00
|
|
|
|
2003-10-18 05:56:40 +00:00
|
|
|
/// visitVANextInst - Implement the va_next instruction...
|
2003-05-08 19:44:13 +00:00
|
|
|
///
|
2003-10-18 05:56:40 +00:00
|
|
|
void ISel::visitVANextInst(VANextInst &I) {
|
|
|
|
unsigned VAList = getReg(I.getOperand(0));
|
2003-05-08 19:44:13 +00:00
|
|
|
unsigned DestReg = getReg(I);
|
|
|
|
|
|
|
|
unsigned Size;
|
2003-10-18 05:56:40 +00:00
|
|
|
switch (I.getArgType()->getPrimitiveID()) {
|
2003-05-08 19:44:13 +00:00
|
|
|
default:
|
|
|
|
std::cerr << I;
|
2003-10-18 05:56:40 +00:00
|
|
|
assert(0 && "Error: bad type for va_next instruction!");
|
2003-05-08 19:44:13 +00:00
|
|
|
return;
|
|
|
|
case Type::PointerTyID:
|
|
|
|
case Type::UIntTyID:
|
|
|
|
case Type::IntTyID:
|
|
|
|
Size = 4;
|
|
|
|
break;
|
|
|
|
case Type::ULongTyID:
|
|
|
|
case Type::LongTyID:
|
2003-10-18 05:56:40 +00:00
|
|
|
case Type::DoubleTyID:
|
2003-05-08 19:44:13 +00:00
|
|
|
Size = 8;
|
2003-10-18 05:56:40 +00:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Increment the VAList pointer...
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::ADD32ri, 2, DestReg).addReg(VAList).addImm(Size);
|
2003-10-18 05:56:40 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ISel::visitVAArgInst(VAArgInst &I) {
|
|
|
|
unsigned VAList = getReg(I.getOperand(0));
|
|
|
|
unsigned DestReg = getReg(I);
|
|
|
|
|
|
|
|
switch (I.getType()->getPrimitiveID()) {
|
|
|
|
default:
|
|
|
|
std::cerr << I;
|
|
|
|
assert(0 && "Error: bad type for va_next instruction!");
|
|
|
|
return;
|
|
|
|
case Type::PointerTyID:
|
|
|
|
case Type::UIntTyID:
|
|
|
|
case Type::IntTyID:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addDirectMem(BuildMI(BB, X86::MOV32rm, 4, DestReg), VAList);
|
2003-10-18 05:56:40 +00:00
|
|
|
break;
|
|
|
|
case Type::ULongTyID:
|
|
|
|
case Type::LongTyID:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addDirectMem(BuildMI(BB, X86::MOV32rm, 4, DestReg), VAList);
|
|
|
|
addRegOffset(BuildMI(BB, X86::MOV32rm, 4, DestReg+1), VAList, 4);
|
2003-05-08 19:44:13 +00:00
|
|
|
break;
|
|
|
|
case Type::DoubleTyID:
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addDirectMem(BuildMI(BB, X86::FLD64m, 4, DestReg), VAList);
|
2003-05-08 19:44:13 +00:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2004-03-01 23:53:11 +00:00
|
|
|
/// visitGetElementPtrInst - instruction-select GEP instructions
|
|
|
|
///
|
2003-01-13 00:32:26 +00:00
|
|
|
void ISel::visitGetElementPtrInst(GetElementPtrInst &I) {
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
// If this GEP instruction will be folded into all of its users, we don't need
|
|
|
|
// to explicitly calculate it!
|
|
|
|
unsigned A, B, C, D;
|
|
|
|
if (isGEPFoldable(0, I.getOperand(0), I.op_begin()+1, I.op_end(), A,B,C,D)) {
|
|
|
|
// Check all of the users of the instruction to see if they are loads and
|
|
|
|
// stores.
|
|
|
|
bool AllWillFold = true;
|
|
|
|
for (Value::use_iterator UI = I.use_begin(), E = I.use_end(); UI != E; ++UI)
|
|
|
|
if (cast<Instruction>(*UI)->getOpcode() != Instruction::Load)
|
|
|
|
if (cast<Instruction>(*UI)->getOpcode() != Instruction::Store ||
|
|
|
|
cast<Instruction>(*UI)->getOperand(0) == &I) {
|
|
|
|
AllWillFold = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
// If the instruction is foldable, and will be folded into all users, don't
|
|
|
|
// emit it!
|
|
|
|
if (AllWillFold) return;
|
|
|
|
}
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
unsigned outputReg = getReg(I);
|
2004-02-22 17:05:38 +00:00
|
|
|
emitGEPOperation(BB, BB->end(), I.getOperand(0),
|
2002-12-16 04:23:29 +00:00
|
|
|
I.op_begin()+1, I.op_end(), outputReg);
|
2002-12-13 06:56:29 +00:00
|
|
|
}
|
|
|
|
|
2004-02-25 03:45:50 +00:00
|
|
|
/// getGEPIndex - Inspect the getelementptr operands specified with GEPOps and
|
|
|
|
/// GEPTypes (the derived types being stepped through at each level). On return
|
|
|
|
/// from this function, if some indexes of the instruction are representable as
|
|
|
|
/// an X86 lea instruction, the machine operands are put into the Ops
|
|
|
|
/// instruction and the consumed indexes are poped from the GEPOps/GEPTypes
|
|
|
|
/// lists. Otherwise, GEPOps.size() is returned. If this returns a an
|
|
|
|
/// addressing mode that only partially consumes the input, the BaseReg input of
|
|
|
|
/// the addressing mode must be left free.
|
|
|
|
///
|
|
|
|
/// Note that there is one fewer entry in GEPTypes than there is in GEPOps.
|
|
|
|
///
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
void ISel::getGEPIndex(MachineBasicBlock *MBB, MachineBasicBlock::iterator IP,
|
|
|
|
std::vector<Value*> &GEPOps,
|
|
|
|
std::vector<const Type*> &GEPTypes, unsigned &BaseReg,
|
|
|
|
unsigned &Scale, unsigned &IndexReg, unsigned &Disp) {
|
|
|
|
const TargetData &TD = TM.getTargetData();
|
|
|
|
|
2004-02-25 03:45:50 +00:00
|
|
|
// Clear out the state we are working with...
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
BaseReg = 0; // No base register
|
|
|
|
Scale = 1; // Unit scale
|
|
|
|
IndexReg = 0; // No index register
|
|
|
|
Disp = 0; // No displacement
|
|
|
|
|
2004-02-25 03:45:50 +00:00
|
|
|
// While there are GEP indexes that can be folded into the current address,
|
|
|
|
// keep processing them.
|
|
|
|
while (!GEPTypes.empty()) {
|
|
|
|
if (const StructType *StTy = dyn_cast<StructType>(GEPTypes.back())) {
|
|
|
|
// It's a struct access. CUI is the index into the structure,
|
|
|
|
// which names the field. This index must have unsigned type.
|
|
|
|
const ConstantUInt *CUI = cast<ConstantUInt>(GEPOps.back());
|
|
|
|
|
|
|
|
// Use the TargetData structure to pick out what the layout of the
|
|
|
|
// structure is in memory. Since the structure index must be constant, we
|
|
|
|
// can get its value and use it to find the right byte offset from the
|
|
|
|
// StructLayout class's list of structure member offsets.
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
Disp += TD.getStructLayout(StTy)->MemberOffsets[CUI->getValue()];
|
2004-02-25 03:45:50 +00:00
|
|
|
GEPOps.pop_back(); // Consume a GEP operand
|
|
|
|
GEPTypes.pop_back();
|
|
|
|
} else {
|
|
|
|
// It's an array or pointer access: [ArraySize x ElementType].
|
|
|
|
const SequentialType *SqTy = cast<SequentialType>(GEPTypes.back());
|
|
|
|
Value *idx = GEPOps.back();
|
|
|
|
|
|
|
|
// idx is the index into the array. Unlike with structure
|
|
|
|
// indices, we may not know its actual value at code-generation
|
|
|
|
// time.
|
|
|
|
assert(idx->getType() == Type::LongTy && "Bad GEP array index!");
|
|
|
|
|
|
|
|
// If idx is a constant, fold it into the offset.
|
Teach the instruction selector how to transform 'array' GEP computations into X86
scaled indexes. This allows us to compile GEP's like this:
int* %test([10 x { int, { int } }]* %X, int %Idx) {
%Idx = cast int %Idx to long
%X = getelementptr [10 x { int, { int } }]* %X, long 0, long %Idx, ubyte 1, ubyte 0
ret int* %X
}
Into a single address computation:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
lea %EAX, DWORD PTR [%EAX + 8*%ECX + 4]
ret
Before it generated:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
shl %ECX, 3
add %EAX, %ECX
lea %EAX, DWORD PTR [%EAX + 4]
ret
This is useful for things like int/float/double arrays, as the indexing can be folded into
the loads&stores, reducing register pressure and decreasing the pressure on the decode unit.
With these changes, I expect our performance on 256.bzip2 and gzip to improve a lot. On
bzip2 for example, we go from this:
10665 asm-printer - Number of machine instrs printed
40 ra-local - Number of loads/stores folded into instructions
1708 ra-local - Number of loads added
1532 ra-local - Number of stores added
1354 twoaddressinstruction - Number of instructions added
1354 twoaddressinstruction - Number of two-address instructions
2794 x86-peephole - Number of peephole optimization performed
to this:
9873 asm-printer - Number of machine instrs printed
41 ra-local - Number of loads/stores folded into instructions
1710 ra-local - Number of loads added
1521 ra-local - Number of stores added
789 twoaddressinstruction - Number of instructions added
789 twoaddressinstruction - Number of two-address instructions
2142 x86-peephole - Number of peephole optimization performed
... and these types of instructions are often in tight loops.
Linear scan is also helped, but not as much. It goes from:
8787 asm-printer - Number of machine instrs printed
2389 liveintervals - Number of identity moves eliminated after coalescing
2288 liveintervals - Number of interval joins performed
3522 liveintervals - Number of intervals after coalescing
5810 liveintervals - Number of original intervals
700 spiller - Number of loads added
487 spiller - Number of stores added
303 spiller - Number of register spills
1354 twoaddressinstruction - Number of instructions added
1354 twoaddressinstruction - Number of two-address instructions
363 x86-peephole - Number of peephole optimization performed
to:
7982 asm-printer - Number of machine instrs printed
1759 liveintervals - Number of identity moves eliminated after coalescing
1658 liveintervals - Number of interval joins performed
3282 liveintervals - Number of intervals after coalescing
4940 liveintervals - Number of original intervals
635 spiller - Number of loads added
452 spiller - Number of stores added
288 spiller - Number of register spills
789 twoaddressinstruction - Number of instructions added
789 twoaddressinstruction - Number of two-address instructions
258 x86-peephole - Number of peephole optimization performed
Though I'm not complaining about the drop in the number of intervals. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11820 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 07:00:55 +00:00
|
|
|
unsigned TypeSize = TD.getTypeSize(SqTy->getElementType());
|
2004-02-25 03:45:50 +00:00
|
|
|
if (ConstantSInt *CSI = dyn_cast<ConstantSInt>(idx)) {
|
Teach the instruction selector how to transform 'array' GEP computations into X86
scaled indexes. This allows us to compile GEP's like this:
int* %test([10 x { int, { int } }]* %X, int %Idx) {
%Idx = cast int %Idx to long
%X = getelementptr [10 x { int, { int } }]* %X, long 0, long %Idx, ubyte 1, ubyte 0
ret int* %X
}
Into a single address computation:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
lea %EAX, DWORD PTR [%EAX + 8*%ECX + 4]
ret
Before it generated:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
shl %ECX, 3
add %EAX, %ECX
lea %EAX, DWORD PTR [%EAX + 4]
ret
This is useful for things like int/float/double arrays, as the indexing can be folded into
the loads&stores, reducing register pressure and decreasing the pressure on the decode unit.
With these changes, I expect our performance on 256.bzip2 and gzip to improve a lot. On
bzip2 for example, we go from this:
10665 asm-printer - Number of machine instrs printed
40 ra-local - Number of loads/stores folded into instructions
1708 ra-local - Number of loads added
1532 ra-local - Number of stores added
1354 twoaddressinstruction - Number of instructions added
1354 twoaddressinstruction - Number of two-address instructions
2794 x86-peephole - Number of peephole optimization performed
to this:
9873 asm-printer - Number of machine instrs printed
41 ra-local - Number of loads/stores folded into instructions
1710 ra-local - Number of loads added
1521 ra-local - Number of stores added
789 twoaddressinstruction - Number of instructions added
789 twoaddressinstruction - Number of two-address instructions
2142 x86-peephole - Number of peephole optimization performed
... and these types of instructions are often in tight loops.
Linear scan is also helped, but not as much. It goes from:
8787 asm-printer - Number of machine instrs printed
2389 liveintervals - Number of identity moves eliminated after coalescing
2288 liveintervals - Number of interval joins performed
3522 liveintervals - Number of intervals after coalescing
5810 liveintervals - Number of original intervals
700 spiller - Number of loads added
487 spiller - Number of stores added
303 spiller - Number of register spills
1354 twoaddressinstruction - Number of instructions added
1354 twoaddressinstruction - Number of two-address instructions
363 x86-peephole - Number of peephole optimization performed
to:
7982 asm-printer - Number of machine instrs printed
1759 liveintervals - Number of identity moves eliminated after coalescing
1658 liveintervals - Number of interval joins performed
3282 liveintervals - Number of intervals after coalescing
4940 liveintervals - Number of original intervals
635 spiller - Number of loads added
452 spiller - Number of stores added
288 spiller - Number of register spills
789 twoaddressinstruction - Number of instructions added
789 twoaddressinstruction - Number of two-address instructions
258 x86-peephole - Number of peephole optimization performed
Though I'm not complaining about the drop in the number of intervals. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11820 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 07:00:55 +00:00
|
|
|
Disp += TypeSize*CSI->getValue();
|
2004-02-25 03:45:50 +00:00
|
|
|
} else {
|
Teach the instruction selector how to transform 'array' GEP computations into X86
scaled indexes. This allows us to compile GEP's like this:
int* %test([10 x { int, { int } }]* %X, int %Idx) {
%Idx = cast int %Idx to long
%X = getelementptr [10 x { int, { int } }]* %X, long 0, long %Idx, ubyte 1, ubyte 0
ret int* %X
}
Into a single address computation:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
lea %EAX, DWORD PTR [%EAX + 8*%ECX + 4]
ret
Before it generated:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
shl %ECX, 3
add %EAX, %ECX
lea %EAX, DWORD PTR [%EAX + 4]
ret
This is useful for things like int/float/double arrays, as the indexing can be folded into
the loads&stores, reducing register pressure and decreasing the pressure on the decode unit.
With these changes, I expect our performance on 256.bzip2 and gzip to improve a lot. On
bzip2 for example, we go from this:
10665 asm-printer - Number of machine instrs printed
40 ra-local - Number of loads/stores folded into instructions
1708 ra-local - Number of loads added
1532 ra-local - Number of stores added
1354 twoaddressinstruction - Number of instructions added
1354 twoaddressinstruction - Number of two-address instructions
2794 x86-peephole - Number of peephole optimization performed
to this:
9873 asm-printer - Number of machine instrs printed
41 ra-local - Number of loads/stores folded into instructions
1710 ra-local - Number of loads added
1521 ra-local - Number of stores added
789 twoaddressinstruction - Number of instructions added
789 twoaddressinstruction - Number of two-address instructions
2142 x86-peephole - Number of peephole optimization performed
... and these types of instructions are often in tight loops.
Linear scan is also helped, but not as much. It goes from:
8787 asm-printer - Number of machine instrs printed
2389 liveintervals - Number of identity moves eliminated after coalescing
2288 liveintervals - Number of interval joins performed
3522 liveintervals - Number of intervals after coalescing
5810 liveintervals - Number of original intervals
700 spiller - Number of loads added
487 spiller - Number of stores added
303 spiller - Number of register spills
1354 twoaddressinstruction - Number of instructions added
1354 twoaddressinstruction - Number of two-address instructions
363 x86-peephole - Number of peephole optimization performed
to:
7982 asm-printer - Number of machine instrs printed
1759 liveintervals - Number of identity moves eliminated after coalescing
1658 liveintervals - Number of interval joins performed
3282 liveintervals - Number of intervals after coalescing
4940 liveintervals - Number of original intervals
635 spiller - Number of loads added
452 spiller - Number of stores added
288 spiller - Number of register spills
789 twoaddressinstruction - Number of instructions added
789 twoaddressinstruction - Number of two-address instructions
258 x86-peephole - Number of peephole optimization performed
Though I'm not complaining about the drop in the number of intervals. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11820 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 07:00:55 +00:00
|
|
|
// If the index reg is already taken, we can't handle this index.
|
|
|
|
if (IndexReg) return;
|
|
|
|
|
|
|
|
// If this is a size that we can handle, then add the index as
|
|
|
|
switch (TypeSize) {
|
|
|
|
case 1: case 2: case 4: case 8:
|
|
|
|
// These are all acceptable scales on X86.
|
|
|
|
Scale = TypeSize;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Otherwise, we can't handle this scale
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (CastInst *CI = dyn_cast<CastInst>(idx))
|
|
|
|
if (CI->getOperand(0)->getType() == Type::IntTy ||
|
|
|
|
CI->getOperand(0)->getType() == Type::UIntTy)
|
|
|
|
idx = CI->getOperand(0);
|
|
|
|
|
|
|
|
IndexReg = MBB ? getReg(idx, MBB, IP) : 1;
|
2004-02-25 03:45:50 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
GEPOps.pop_back(); // Consume a GEP operand
|
|
|
|
GEPTypes.pop_back();
|
|
|
|
}
|
|
|
|
}
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
|
|
|
|
// GEPTypes is empty, which means we have a single operand left. See if we
|
|
|
|
// can set it as the base register.
|
|
|
|
//
|
|
|
|
// FIXME: When addressing modes are more powerful/correct, we could load
|
|
|
|
// global addresses directly as 32-bit immediates.
|
|
|
|
assert(BaseReg == 0);
|
Teach the instruction selector how to transform 'array' GEP computations into X86
scaled indexes. This allows us to compile GEP's like this:
int* %test([10 x { int, { int } }]* %X, int %Idx) {
%Idx = cast int %Idx to long
%X = getelementptr [10 x { int, { int } }]* %X, long 0, long %Idx, ubyte 1, ubyte 0
ret int* %X
}
Into a single address computation:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
lea %EAX, DWORD PTR [%EAX + 8*%ECX + 4]
ret
Before it generated:
test:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
shl %ECX, 3
add %EAX, %ECX
lea %EAX, DWORD PTR [%EAX + 4]
ret
This is useful for things like int/float/double arrays, as the indexing can be folded into
the loads&stores, reducing register pressure and decreasing the pressure on the decode unit.
With these changes, I expect our performance on 256.bzip2 and gzip to improve a lot. On
bzip2 for example, we go from this:
10665 asm-printer - Number of machine instrs printed
40 ra-local - Number of loads/stores folded into instructions
1708 ra-local - Number of loads added
1532 ra-local - Number of stores added
1354 twoaddressinstruction - Number of instructions added
1354 twoaddressinstruction - Number of two-address instructions
2794 x86-peephole - Number of peephole optimization performed
to this:
9873 asm-printer - Number of machine instrs printed
41 ra-local - Number of loads/stores folded into instructions
1710 ra-local - Number of loads added
1521 ra-local - Number of stores added
789 twoaddressinstruction - Number of instructions added
789 twoaddressinstruction - Number of two-address instructions
2142 x86-peephole - Number of peephole optimization performed
... and these types of instructions are often in tight loops.
Linear scan is also helped, but not as much. It goes from:
8787 asm-printer - Number of machine instrs printed
2389 liveintervals - Number of identity moves eliminated after coalescing
2288 liveintervals - Number of interval joins performed
3522 liveintervals - Number of intervals after coalescing
5810 liveintervals - Number of original intervals
700 spiller - Number of loads added
487 spiller - Number of stores added
303 spiller - Number of register spills
1354 twoaddressinstruction - Number of instructions added
1354 twoaddressinstruction - Number of two-address instructions
363 x86-peephole - Number of peephole optimization performed
to:
7982 asm-printer - Number of machine instrs printed
1759 liveintervals - Number of identity moves eliminated after coalescing
1658 liveintervals - Number of interval joins performed
3282 liveintervals - Number of intervals after coalescing
4940 liveintervals - Number of original intervals
635 spiller - Number of loads added
452 spiller - Number of stores added
288 spiller - Number of register spills
789 twoaddressinstruction - Number of instructions added
789 twoaddressinstruction - Number of two-address instructions
258 x86-peephole - Number of peephole optimization performed
Though I'm not complaining about the drop in the number of intervals. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11820 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 07:00:55 +00:00
|
|
|
BaseReg = MBB ? getReg(GEPOps[0], MBB, IP) : 1;
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
GEPOps.pop_back(); // Consume the last GEP operand
|
2004-02-25 03:45:50 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
/// isGEPFoldable - Return true if the specified GEP can be completely
|
|
|
|
/// folded into the addressing mode of a load/store or lea instruction.
|
|
|
|
bool ISel::isGEPFoldable(MachineBasicBlock *MBB,
|
|
|
|
Value *Src, User::op_iterator IdxBegin,
|
|
|
|
User::op_iterator IdxEnd, unsigned &BaseReg,
|
|
|
|
unsigned &Scale, unsigned &IndexReg, unsigned &Disp) {
|
|
|
|
if (ConstantPointerRef *CPR = dyn_cast<ConstantPointerRef>(Src))
|
|
|
|
Src = CPR->getValue();
|
|
|
|
|
|
|
|
std::vector<Value*> GEPOps;
|
|
|
|
GEPOps.resize(IdxEnd-IdxBegin+1);
|
|
|
|
GEPOps[0] = Src;
|
|
|
|
std::copy(IdxBegin, IdxEnd, GEPOps.begin()+1);
|
|
|
|
|
|
|
|
std::vector<const Type*> GEPTypes;
|
|
|
|
GEPTypes.assign(gep_type_begin(Src->getType(), IdxBegin, IdxEnd),
|
|
|
|
gep_type_end(Src->getType(), IdxBegin, IdxEnd));
|
|
|
|
|
|
|
|
MachineBasicBlock::iterator IP;
|
|
|
|
if (MBB) IP = MBB->end();
|
|
|
|
getGEPIndex(MBB, IP, GEPOps, GEPTypes, BaseReg, Scale, IndexReg, Disp);
|
|
|
|
|
|
|
|
// We can fold it away iff the getGEPIndex call eliminated all operands.
|
|
|
|
return GEPOps.empty();
|
|
|
|
}
|
|
|
|
|
2002-12-13 11:22:48 +00:00
|
|
|
void ISel::emitGEPOperation(MachineBasicBlock *MBB,
|
2004-02-22 17:05:38 +00:00
|
|
|
MachineBasicBlock::iterator IP,
|
2002-12-13 10:09:43 +00:00
|
|
|
Value *Src, User::op_iterator IdxBegin,
|
2002-12-13 06:56:29 +00:00
|
|
|
User::op_iterator IdxEnd, unsigned TargetReg) {
|
|
|
|
const TargetData &TD = TM.getTargetData();
|
2004-02-22 17:35:42 +00:00
|
|
|
if (ConstantPointerRef *CPR = dyn_cast<ConstantPointerRef>(Src))
|
|
|
|
Src = CPR->getValue();
|
|
|
|
|
2004-02-22 07:04:00 +00:00
|
|
|
std::vector<Value*> GEPOps;
|
|
|
|
GEPOps.resize(IdxEnd-IdxBegin+1);
|
|
|
|
GEPOps[0] = Src;
|
|
|
|
std::copy(IdxBegin, IdxEnd, GEPOps.begin()+1);
|
|
|
|
|
|
|
|
std::vector<const Type*> GEPTypes;
|
|
|
|
GEPTypes.assign(gep_type_begin(Src->getType(), IdxBegin, IdxEnd),
|
|
|
|
gep_type_end(Src->getType(), IdxBegin, IdxEnd));
|
|
|
|
|
|
|
|
// Keep emitting instructions until we consume the entire GEP instruction.
|
|
|
|
while (!GEPOps.empty()) {
|
|
|
|
unsigned OldSize = GEPOps.size();
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
unsigned BaseReg, Scale, IndexReg, Disp;
|
|
|
|
getGEPIndex(MBB, IP, GEPOps, GEPTypes, BaseReg, Scale, IndexReg, Disp);
|
2004-02-22 07:04:00 +00:00
|
|
|
|
2004-02-25 03:45:50 +00:00
|
|
|
if (GEPOps.size() != OldSize) {
|
|
|
|
// getGEPIndex consumed some of the input. Build an LEA instruction here.
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
unsigned NextTarget = 0;
|
|
|
|
if (!GEPOps.empty()) {
|
|
|
|
assert(BaseReg == 0 &&
|
|
|
|
"getGEPIndex should have left the base register open for chaining!");
|
|
|
|
NextTarget = BaseReg = makeAnotherReg(Type::UIntTy);
|
2004-02-25 03:45:50 +00:00
|
|
|
}
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
|
|
|
|
if (IndexReg == 0 && Disp == 0)
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32rr, 1, TargetReg).addReg(BaseReg);
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
else
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFullAddress(BuildMI(*MBB, IP, X86::LEA32r, 5, TargetReg),
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
BaseReg, Scale, IndexReg, Disp);
|
|
|
|
--IP;
|
|
|
|
TargetReg = NextTarget;
|
2004-02-25 03:45:50 +00:00
|
|
|
} else if (GEPTypes.empty()) {
|
2004-02-22 07:04:00 +00:00
|
|
|
// The getGEPIndex operation didn't want to build an LEA. Check to see if
|
|
|
|
// all operands are consumed but the base pointer. If so, just load it
|
|
|
|
// into the register.
|
2004-02-22 17:35:42 +00:00
|
|
|
if (GlobalValue *GV = dyn_cast<GlobalValue>(GEPOps[0])) {
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32ri, 1, TargetReg).addGlobalAddress(GV);
|
2004-02-22 17:35:42 +00:00
|
|
|
} else {
|
|
|
|
unsigned BaseReg = getReg(GEPOps[0], MBB, IP);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::MOV32rr, 1, TargetReg).addReg(BaseReg);
|
2004-02-22 17:35:42 +00:00
|
|
|
}
|
|
|
|
break; // we are now done
|
* Make the previous patch more efficient by not allocating a temporary MachineInstr
to do analysis.
*** FOLD getelementptr instructions into loads and stores when possible,
making use of some of the crazy X86 addressing modes.
For example, the following C++ program fragment:
struct complex {
double re, im;
complex(double r, double i) : re(r), im(i) {}
};
inline complex operator+(const complex& a, const complex& b) {
return complex(a.re+b.re, a.im+b.im);
}
complex addone(const complex& arg) {
return arg + complex(1,0);
}
Used to be compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
*** mov %EDX, %ECX
fld QWORD PTR [%EDX]
fld1
faddp %ST(1)
*** add %ECX, 8
fld QWORD PTR [%ECX]
fldz
faddp %ST(1)
*** mov %ECX, %EAX
fxch %ST(1)
fstp QWORD PTR [%ECX]
*** add %EAX, 8
fstp QWORD PTR [%EAX]
ret
Now it is compiled to:
_Z6addoneRK7complex:
mov %EAX, DWORD PTR [%ESP + 4]
mov %ECX, DWORD PTR [%ESP + 8]
fld QWORD PTR [%ECX]
fld1
faddp %ST(1)
fld QWORD PTR [%ECX + 8]
fldz
faddp %ST(1)
fxch %ST(1)
fstp QWORD PTR [%EAX]
fstp QWORD PTR [%EAX + 8]
ret
Other programs should see similar improvements, across the board. Note that
in addition to reducing instruction count, this also reduces register pressure
a lot, always a good thing on X86. :)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11819 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-25 06:13:04 +00:00
|
|
|
|
2004-02-22 07:04:00 +00:00
|
|
|
} else {
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
// It's an array or pointer access: [ArraySize x ElementType].
|
2004-02-22 07:04:00 +00:00
|
|
|
const SequentialType *SqTy = cast<SequentialType>(GEPTypes.back());
|
|
|
|
Value *idx = GEPOps.back();
|
|
|
|
GEPOps.pop_back(); // Consume a GEP operand
|
|
|
|
GEPTypes.pop_back();
|
2002-12-16 19:32:50 +00:00
|
|
|
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
// idx is the index into the array. Unlike with structure
|
|
|
|
// indices, we may not know its actual value at code-generation
|
|
|
|
// time.
|
2002-12-16 19:32:50 +00:00
|
|
|
assert(idx->getType() == Type::LongTy && "Bad GEP array index!");
|
|
|
|
|
2003-06-21 16:01:24 +00:00
|
|
|
// Most GEP instructions use a [cast (int/uint) to LongTy] as their
|
|
|
|
// operand on X86. Handle this case directly now...
|
|
|
|
if (CastInst *CI = dyn_cast<CastInst>(idx))
|
|
|
|
if (CI->getOperand(0)->getType() == Type::IntTy ||
|
|
|
|
CI->getOperand(0)->getType() == Type::UIntTy)
|
|
|
|
idx = CI->getOperand(0);
|
|
|
|
|
2003-01-13 00:32:26 +00:00
|
|
|
// We want to add BaseReg to(idxReg * sizeof ElementType). First, we
|
2002-12-16 19:32:50 +00:00
|
|
|
// must find the size of the pointed-to type (Not coincidentally, the next
|
|
|
|
// type is the type of the elements in the array).
|
2004-02-22 07:04:00 +00:00
|
|
|
const Type *ElTy = SqTy->getElementType();
|
|
|
|
unsigned elementSize = TD.getTypeSize(ElTy);
|
2002-12-16 19:32:50 +00:00
|
|
|
|
|
|
|
// If idxReg is a constant, we don't need to perform the multiply!
|
|
|
|
if (ConstantSInt *CSI = dyn_cast<ConstantSInt>(idx)) {
|
2003-01-13 00:32:26 +00:00
|
|
|
if (!CSI->isNullValue()) {
|
2002-12-16 19:32:50 +00:00
|
|
|
unsigned Offset = elementSize*CSI->getValue();
|
2004-02-22 07:04:00 +00:00
|
|
|
unsigned Reg = makeAnotherReg(Type::UIntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::ADD32ri, 2, TargetReg)
|
2004-02-29 07:22:16 +00:00
|
|
|
.addReg(Reg).addImm(Offset);
|
2004-02-22 07:04:00 +00:00
|
|
|
--IP; // Insert the next instruction before this one.
|
|
|
|
TargetReg = Reg; // Codegen the rest of the GEP into this
|
2002-12-16 19:32:50 +00:00
|
|
|
}
|
|
|
|
} else if (elementSize == 1) {
|
|
|
|
// If the element size is 1, we don't have to multiply, just add
|
|
|
|
unsigned idxReg = getReg(idx, MBB, IP);
|
2004-02-22 07:04:00 +00:00
|
|
|
unsigned Reg = makeAnotherReg(Type::UIntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::ADD32rr, 2,TargetReg).addReg(Reg).addReg(idxReg);
|
2004-02-22 07:04:00 +00:00
|
|
|
--IP; // Insert the next instruction before this one.
|
|
|
|
TargetReg = Reg; // Codegen the rest of the GEP into this
|
2002-12-16 19:32:50 +00:00
|
|
|
} else {
|
|
|
|
unsigned idxReg = getReg(idx, MBB, IP);
|
|
|
|
unsigned OffsetReg = makeAnotherReg(Type::UIntTy);
|
2003-10-19 21:09:10 +00:00
|
|
|
|
2004-02-22 07:04:00 +00:00
|
|
|
// Make sure we can back the iterator up to point to the first
|
|
|
|
// instruction emitted.
|
|
|
|
MachineBasicBlock::iterator BeforeIt = IP;
|
|
|
|
if (IP == MBB->begin())
|
|
|
|
BeforeIt = MBB->end();
|
|
|
|
else
|
|
|
|
--BeforeIt;
|
2003-10-19 21:09:10 +00:00
|
|
|
doMultiplyConst(MBB, IP, OffsetReg, Type::IntTy, idxReg, elementSize);
|
|
|
|
|
2002-12-16 19:32:50 +00:00
|
|
|
// Emit an ADD to add OffsetReg to the basePtr.
|
2004-02-22 07:04:00 +00:00
|
|
|
unsigned Reg = makeAnotherReg(Type::UIntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(*MBB, IP, X86::ADD32rr, 2, TargetReg)
|
2004-02-29 07:22:16 +00:00
|
|
|
.addReg(Reg).addReg(OffsetReg);
|
2004-02-22 07:04:00 +00:00
|
|
|
|
|
|
|
// Step to the first instruction of the multiply.
|
|
|
|
if (BeforeIt == MBB->end())
|
|
|
|
IP = MBB->begin();
|
|
|
|
else
|
|
|
|
IP = ++BeforeIt;
|
|
|
|
|
|
|
|
TargetReg = Reg; // Codegen the rest of the GEP into this
|
2002-12-16 19:32:50 +00:00
|
|
|
}
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
/// visitAllocaInst - If this is a fixed size alloca, allocate space from the
|
|
|
|
/// frame manager, otherwise do it the hard way.
|
|
|
|
///
|
|
|
|
void ISel::visitAllocaInst(AllocaInst &I) {
|
|
|
|
// Find the data size of the alloca inst's getAllocatedType.
|
|
|
|
const Type *Ty = I.getAllocatedType();
|
|
|
|
unsigned TySize = TM.getTargetData().getTypeSize(Ty);
|
2002-12-13 06:46:31 +00:00
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
// If this is a fixed size alloca in the entry block for the function,
|
|
|
|
// statically stack allocate the space.
|
|
|
|
//
|
|
|
|
if (ConstantUInt *CUI = dyn_cast<ConstantUInt>(I.getArraySize())) {
|
|
|
|
if (I.getParent() == I.getParent()->getParent()->begin()) {
|
|
|
|
TySize *= CUI->getValue(); // Get total allocated size...
|
|
|
|
unsigned Alignment = TM.getTargetData().getTypeAlignment(Ty);
|
|
|
|
|
|
|
|
// Create a new stack object using the frame manager...
|
|
|
|
int FrameIdx = F->getFrameInfo()->CreateStackObject(TySize, Alignment);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
addFrameReference(BuildMI(BB, X86::LEA32r, 5, getReg(I)), FrameIdx);
|
2002-12-28 20:24:02 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Create a register to hold the temporary result of multiplying the type size
|
|
|
|
// constant by the variable amount.
|
|
|
|
unsigned TotalSizeReg = makeAnotherReg(Type::UIntTy);
|
|
|
|
unsigned SrcReg1 = getReg(I.getArraySize());
|
|
|
|
|
|
|
|
// TotalSizeReg = mul <numelements>, <TypeSize>
|
|
|
|
MachineBasicBlock::iterator MBBI = BB->end();
|
2003-10-19 21:09:10 +00:00
|
|
|
doMultiplyConst(BB, MBBI, TotalSizeReg, Type::UIntTy, SrcReg1, TySize);
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
// AddedSize = add <TotalSizeReg>, 15
|
|
|
|
unsigned AddedSizeReg = makeAnotherReg(Type::UIntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::ADD32ri, 2, AddedSizeReg).addReg(TotalSizeReg).addImm(15);
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
|
2002-12-28 20:24:02 +00:00
|
|
|
// AlignedSize = and <AddedSize>, ~15
|
|
|
|
unsigned AlignedSize = makeAnotherReg(Type::UIntTy);
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::AND32ri, 2, AlignedSize).addReg(AddedSizeReg).addImm(~15);
|
2002-12-28 20:24:02 +00:00
|
|
|
|
2002-12-13 06:46:31 +00:00
|
|
|
// Subtract size from stack pointer, thereby allocating some space.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::SUB32rr, 2, X86::ESP).addReg(X86::ESP).addReg(AlignedSize);
|
2002-12-28 20:24:02 +00:00
|
|
|
|
2002-12-13 06:46:31 +00:00
|
|
|
// Put a pointer to the space into the result register, by copying
|
|
|
|
// the stack pointer.
|
A big X86 instruction rename. The instructions are renamed to make
their names more decriptive. A name consists of the base name, a
default operand size followed by a character per operand with an
optional special size. For example:
ADD8rr -> add, 8-bit register, 8-bit register
IMUL16rmi -> imul, 16-bit register, 16-bit memory, 16-bit immediate
IMUL16rmi8 -> imul, 16-bit register, 16-bit memory, 8-bit immediate
MOVSX32rm16 -> movsx, 32-bit register, 16-bit memory
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@11995 91177308-0d34-0410-b5e6-96231b3b80d8
2004-02-29 08:50:03 +00:00
|
|
|
BuildMI(BB, X86::MOV32rr, 1, getReg(I)).addReg(X86::ESP);
|
2002-12-28 20:24:02 +00:00
|
|
|
|
2003-05-03 02:18:17 +00:00
|
|
|
// Inform the Frame Information that we have just allocated a variable-sized
|
2002-12-28 20:24:02 +00:00
|
|
|
// object.
|
|
|
|
F->getFrameInfo()->CreateVariableSizedObject();
|
This checkin is brought to you by the brian gaeke allnighter fund.
(lib/Target/X86) InstSelectSimple.cpp:
Include llvm/DerivedTypes.h and iostream.
Refactor visitMul out into a wrapper around doMultiply(), so that we
can do multiplications on temporary values when we are doing
getelementptrs.
Refactor part of getReg out into makeAnotherReg, so that we can create
registers willy-nilly to hold temporary values, when we are doing
getelementptrs.
Add stub implementations of visitMallocInst and visitAllocaInst.
Add initial implementation of visitGetElementPtrInst.
In copyConstantToRegister:
We throw a *lot* of our asserts here. So, when we want to throw an
assert, print out to stderr whatever expr or whatever constant made
us barf.
Support copying ConstantPointerNull to register, using a move immediate
of zero.
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
Teach visitCallInst to extract byte- and short-class return values
from subregs of EAX. Add a FIXME note about how we would do it for
float-class return values.
Add a FIXME note about how we would cast float to int and back.
X86InstrInfo.def:
Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings
of the numbers in the other instruction names. All uses modified.
(tools/jello) GlobalVars.cpp:
Include iostream.
If we have to emit a floating-point constant to memory, gamble and use
the same method as for ints.
If we have to emit a ConstantPointerNull to memory, try using a "void *"
and "NULL".
Otherwise, if we are going to throw an assert, print out whatever constant
made us barf, first.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8
2002-12-12 15:33:40 +00:00
|
|
|
}
|
2003-01-13 00:32:26 +00:00
|
|
|
|
|
|
|
/// visitMallocInst - Malloc instructions are code generated into direct calls
|
|
|
|
/// to the library malloc.
|
|
|
|
///
|
|
|
|
void ISel::visitMallocInst(MallocInst &I) {
|
|
|
|
unsigned AllocSize = TM.getTargetData().getTypeSize(I.getAllocatedType());
|
|
|
|
unsigned Arg;
|
|
|
|
|
|
|
|
if (ConstantUInt *C = dyn_cast<ConstantUInt>(I.getOperand(0))) {
|
|
|
|
Arg = getReg(ConstantUInt::get(Type::UIntTy, C->getValue() * AllocSize));
|
|
|
|
} else {
|
|
|
|
Arg = makeAnotherReg(Type::UIntTy);
|
2003-10-19 21:09:10 +00:00
|
|
|
unsigned Op0Reg = getReg(I.getOperand(0));
|
2003-01-13 00:32:26 +00:00
|
|
|
MachineBasicBlock::iterator MBBI = BB->end();
|
2003-10-19 21:09:10 +00:00
|
|
|
doMultiplyConst(BB, MBBI, Arg, Type::UIntTy, Op0Reg, AllocSize);
|
2003-01-13 00:32:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
std::vector<ValueRecord> Args;
|
|
|
|
Args.push_back(ValueRecord(Arg, Type::UIntTy));
|
|
|
|
MachineInstr *TheCall = BuildMI(X86::CALLpcrel32,
|
2003-10-23 16:22:08 +00:00
|
|
|
1).addExternalSymbol("malloc", true);
|
2003-01-13 00:32:26 +00:00
|
|
|
doCall(ValueRecord(getReg(I), I.getType()), TheCall, Args);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// visitFreeInst - Free instructions are code gen'd to call the free libc
|
|
|
|
/// function.
|
|
|
|
///
|
|
|
|
void ISel::visitFreeInst(FreeInst &I) {
|
|
|
|
std::vector<ValueRecord> Args;
|
2003-08-04 02:12:48 +00:00
|
|
|
Args.push_back(ValueRecord(I.getOperand(0)));
|
2003-01-13 00:32:26 +00:00
|
|
|
MachineInstr *TheCall = BuildMI(X86::CALLpcrel32,
|
2003-10-23 16:22:08 +00:00
|
|
|
1).addExternalSymbol("free", true);
|
2003-01-13 00:32:26 +00:00
|
|
|
doCall(ValueRecord(0, Type::VoidTy), TheCall, Args);
|
|
|
|
}
|
|
|
|
|
2003-07-26 23:49:58 +00:00
|
|
|
/// createX86SimpleInstructionSelector - This pass converts an LLVM function
|
2002-10-29 22:37:54 +00:00
|
|
|
/// into a machine code representation is a very simple peep-hole fashion. The
|
2002-10-25 22:55:53 +00:00
|
|
|
/// generated code sucks but the implementation is nice and simple.
|
|
|
|
///
|
2003-12-28 21:23:38 +00:00
|
|
|
FunctionPass *llvm::createX86SimpleInstructionSelector(TargetMachine &TM) {
|
|
|
|
return new ISel(TM);
|
2002-10-25 22:55:53 +00:00
|
|
|
}
|