From 20244b7e2ca8ae116fad1bcfb82ea372220363b0 Mon Sep 17 00:00:00 2001 From: Brian Gaeke Date: Thu, 12 Dec 2002 15:33:40 +0000 Subject: [PATCH] This checkin is brought to you by the brian gaeke allnighter fund. (lib/Target/X86) InstSelectSimple.cpp: Include llvm/DerivedTypes.h and iostream. Refactor visitMul out into a wrapper around doMultiply(), so that we can do multiplications on temporary values when we are doing getelementptrs. Refactor part of getReg out into makeAnotherReg, so that we can create registers willy-nilly to hold temporary values, when we are doing getelementptrs. Add stub implementations of visitMallocInst and visitAllocaInst. Add initial implementation of visitGetElementPtrInst. In copyConstantToRegister: We throw a *lot* of our asserts here. So, when we want to throw an assert, print out to stderr whatever expr or whatever constant made us barf. Support copying ConstantPointerNull to register, using a move immediate of zero. Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings of the numbers in the other instruction names. All uses modified. Teach visitCallInst to extract byte- and short-class return values from subregs of EAX. Add a FIXME note about how we would do it for float-class return values. Add a FIXME note about how we would cast float to int and back. X86InstrInfo.def: Rename FLDr4 and FLDr8 to FLDr32 and FLDr64, so that they match the meanings of the numbers in the other instruction names. All uses modified. (tools/jello) GlobalVars.cpp: Include iostream. If we have to emit a floating-point constant to memory, gamble and use the same method as for ints. If we have to emit a ConstantPointerNull to memory, try using a "void *" and "NULL". Otherwise, if we are going to throw an assert, print out whatever constant made us barf, first. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@4973 91177308-0d34-0410-b5e6-96231b3b80d8 --- lib/Target/X86/InstSelectSimple.cpp | 228 ++++++++++++++++++++++++---- lib/Target/X86/X86ISelSimple.cpp | 228 ++++++++++++++++++++++++---- lib/Target/X86/X86InstrInfo.def | 4 +- tools/jello/GlobalVars.cpp | 16 ++ 4 files changed, 410 insertions(+), 66 deletions(-) diff --git a/lib/Target/X86/InstSelectSimple.cpp b/lib/Target/X86/InstSelectSimple.cpp index 217b219ba2a..e88354a6ad1 100644 --- a/lib/Target/X86/InstSelectSimple.cpp +++ b/lib/Target/X86/InstSelectSimple.cpp @@ -14,6 +14,7 @@ #include "llvm/iPHINode.h" #include "llvm/iMemory.h" #include "llvm/Type.h" +#include "llvm/DerivedTypes.h" #include "llvm/Constants.h" #include "llvm/Pass.h" #include "llvm/CodeGen/MachineFunction.h" @@ -22,6 +23,7 @@ #include "llvm/Support/InstVisitor.h" #include "llvm/Target/MRegisterInfo.h" #include +#include using namespace MOTy; // Get Use, Def, UseAndDef @@ -73,6 +75,8 @@ namespace { void visitSimpleBinary(BinaryOperator &B, unsigned OpcodeClass); void visitAdd(BinaryOperator &B) { visitSimpleBinary(B, 0); } void visitSub(BinaryOperator &B) { visitSimpleBinary(B, 1); } + void doMultiply(unsigned destReg, const Type *resultType, + unsigned op0Reg, unsigned op1Reg); void visitMul(BinaryOperator &B); void visitDiv(BinaryOperator &B) { visitDivRem(B); } @@ -96,7 +100,10 @@ namespace { // Memory Instructions void visitLoadInst(LoadInst &I); void visitStoreInst(StoreInst &I); - + void visitGetElementPtrInst(GetElementPtrInst &I); + void visitMallocInst(MallocInst &I); + void visitAllocaInst(AllocaInst &I); + // Other operators void visitShiftInst(ShiftInst &I); void visitPHINode(PHINode &I); @@ -114,6 +121,13 @@ namespace { /// void copyConstantToRegister(Constant *C, unsigned Reg); + /// makeAnotherReg - This method returns the next register number + /// we haven't yet used. + unsigned makeAnotherReg (void) { + unsigned Reg = CurReg++; + return Reg; + } + /// getReg - This method turns an LLVM value into a register number. This /// is guaranteed to produce the same register number for a particular value /// every time it is queried. @@ -122,7 +136,7 @@ namespace { unsigned getReg(Value *V) { unsigned &Reg = RegMap[V]; if (Reg == 0) { - Reg = CurReg++; + Reg = makeAnotherReg (); RegMap[V] = Reg; // Add the mapping of regnumber => reg class to MachineFunction @@ -182,6 +196,11 @@ static inline TypeClass getClass(const Type *Ty) { /// specified constant into the specified register. /// void ISel::copyConstantToRegister(Constant *C, unsigned R) { + if (isa (C)) { + // FIXME: We really need to handle getelementptr exprs, among + // other things. + std::cerr << "Offending expr: " << C << "\n"; + } assert (!isa(C) && "Constant expressions not yet handled!\n"); if (C->getType()->isIntegral()) { @@ -199,7 +218,11 @@ void ISel::copyConstantToRegister(Constant *C, unsigned R) { ConstantUInt *CUI = cast(C); BuildMI(BB, IntegralOpcodeTab[Class], 1, R).addZImm(CUI->getValue()); } + } else if (isa (C)) { + // Copy zero (null pointer) to the register. + BuildMI (BB, X86::MOVir32, 1, R).addZImm(0); } else { + std::cerr << "Offending constant: " << C << "\n"; assert(0 && "Type not handled yet!"); } } @@ -236,12 +259,12 @@ void ISel::visitSetCCInst(SetCondInst &I, unsigned OpNum) { // FIXME: assuming var1, var2 are in memory, if not, spill to // stack first case cFloat: // Floats - BuildMI (BB, X86::FLDr4, 1).addReg (reg1); - BuildMI (BB, X86::FLDr4, 1).addReg (reg2); + BuildMI (BB, X86::FLDr32, 1).addReg (reg1); + BuildMI (BB, X86::FLDr32, 1).addReg (reg2); break; case cDouble: // Doubles - BuildMI (BB, X86::FLDr8, 1).addReg (reg1); - BuildMI (BB, X86::FLDr8, 1).addReg (reg2); + BuildMI (BB, X86::FLDr64, 1).addReg (reg1); + BuildMI (BB, X86::FLDr64, 1).addReg (reg2); break; case cLong: default: @@ -345,10 +368,10 @@ ISel::visitReturnInst (ReturnInst &I) // ret float/double: top of FP stack // FLD case cFloat: // Floats - BuildMI (BB, X86::FLDr4, 1).addReg (getReg (rv)); + BuildMI (BB, X86::FLDr32, 1).addReg (getReg (rv)); break; case cDouble: // Doubles - BuildMI (BB, X86::FLDr8, 1).addReg (getReg (rv)); + BuildMI (BB, X86::FLDr64, 1).addReg (getReg (rv)); break; case cLong: // ret long: use EAX(least significant 32 bits)/EDX (most @@ -435,11 +458,31 @@ ISel::visitCallInst (CallInst & CI) // leaves it in... // if (CI.getType() != Type::VoidTy) { - switch (getClass(CI.getType())) { - case cInt: - BuildMI(BB, X86::MOVrr32, 1, getReg(CI)).addReg(X86::EAX); + unsigned resultTypeClass = getClass (CI.getType ()); + switch (resultTypeClass) { + case cByte: + case cShort: + case cInt: { + // Integral results are in %eax, or the appropriate portion + // thereof. + static const unsigned regRegMove[] = { + X86::MOVrr8, X86::MOVrr16, X86::MOVrr32 + }; + static const unsigned AReg[] = { X86::AL, X86::AX, X86::EAX }; + BuildMI (BB, regRegMove[resultTypeClass], 1, + getReg (CI)).addReg (AReg[resultTypeClass]); + break; + } + case cFloat: + // Floating-point return values live in %st(0) (i.e., the top of + // the FP stack.) The general way to approach this is to do a + // FSTP to save the top of the FP stack on the real stack, then + // do a MOV to load the top of the real stack into the target + // register. + visitInstruction (CI); // FIXME: add the right args for the calls below + // BuildMI (BB, X86::FSTPm32, 0); + // BuildMI (BB, X86::MOVmr32, 0); break; - default: std::cerr << "Cannot get return value for call of type '" << *CI.getType() << "'\n"; @@ -477,30 +520,41 @@ void ISel::visitSimpleBinary(BinaryOperator &B, unsigned OperatorClass) { BuildMI(BB, Opcode, 2, getReg(B)).addReg(Op0r).addReg(Op1r); } +/// doMultiply - Emit appropriate instructions to multiply together +/// the registers op0Reg and op1Reg, and put the result in destReg. +/// The type of the result should be given as resultType. +void +ISel::doMultiply(unsigned destReg, const Type *resultType, + unsigned op0Reg, unsigned op1Reg) +{ + unsigned Class = getClass (resultType); + + // FIXME: + assert (Class <= 2 && "Someday, we will learn how to multiply" + "longs and floating-point numbers. This is not that day."); + + static const unsigned Regs[] ={ X86::AL , X86::AX , X86::EAX }; + static const unsigned MulOpcode[]={ X86::MULrr8, X86::MULrr16, X86::MULrr32 }; + static const unsigned MovOpcode[]={ X86::MOVrr8, X86::MOVrr16, X86::MOVrr32 }; + unsigned Reg = Regs[Class]; + + // Emit a MOV to put the first operand into the appropriately-sized + // subreg of EAX. + BuildMI (BB, MovOpcode[Class], 1, Reg).addReg (op0Reg); + + // Emit the appropriate multiply instruction. + BuildMI (BB, MulOpcode[Class], 1).addReg (op1Reg); + + // Emit another MOV to put the result into the destination register. + BuildMI (BB, MovOpcode[Class], 1, destReg).addReg (Reg); +} + /// visitMul - Multiplies are not simple binary operators because they must deal /// with the EAX register explicitly. /// void ISel::visitMul(BinaryOperator &I) { - unsigned Class = getClass(I.getType()); - if (Class > 2) // FIXME: Handle longs - visitInstruction(I); - - static const unsigned Regs[] ={ X86::AL , X86::AX , X86::EAX }; - static const unsigned MulOpcode[]={ X86::MULrr8, X86::MULrr16, X86::MULrr32 }; - static const unsigned MovOpcode[]={ X86::MOVrr8, X86::MOVrr16, X86::MOVrr32 }; - - unsigned Reg = Regs[Class]; - unsigned Op0Reg = getReg(I.getOperand(0)); - unsigned Op1Reg = getReg(I.getOperand(1)); - - // Put the first operand into one of the A registers... - BuildMI(BB, MovOpcode[Class], 1, Reg).addReg(Op0Reg); - - // Emit the appropriate multiply instruction... - BuildMI(BB, MulOpcode[Class], 1).addReg(Op1Reg); - - // Put the result into the destination register... - BuildMI(BB, MovOpcode[Class], 1, getReg(I)).addReg(Reg); + doMultiply (getReg (I), I.getType (), + getReg (I.getOperand (0)), getReg (I.getOperand (1))); } @@ -732,9 +786,119 @@ ISel::visitCastInst (CastInst &CI) return; } // Anything we haven't handled already, we can't (yet) handle at all. + // + // FP to integral casts can be handled with FISTP to store onto the + // stack while converting to integer, followed by a MOV to load from + // the stack into the result register. Integral to FP casts can be + // handled with MOV to store onto the stack, followed by a FILD to + // load from the stack while converting to FP. For the moment, I + // can't quite get straight in my head how to borrow myself some + // stack space and write on it. Otherwise, this would be trivial. visitInstruction (CI); } +/// visitGetElementPtrInst - I don't know, most programs don't have +/// getelementptr instructions, right? That means we can put off +/// implementing this, right? Right. This method emits machine +/// instructions to perform type-safe pointer arithmetic. I am +/// guessing this could be cleaned up somewhat to use fewer temporary +/// registers. +void +ISel::visitGetElementPtrInst (GetElementPtrInst &I) +{ + Value *basePtr = I.getPointerOperand (); + const TargetData &TD = TM.DataLayout; + unsigned basePtrReg = getReg (basePtr); + unsigned resultReg = getReg (I); + const Type *Ty = basePtr->getType(); + // GEPs have zero or more indices; we must perform a struct access + // or array access for each one. + for (GetElementPtrInst::op_iterator oi = I.idx_begin (), + oe = I.idx_end (); oi != oe; ++oi) { + Value *idx = *oi; + unsigned nextBasePtrReg = makeAnotherReg (); + if (const StructType *StTy = dyn_cast (Ty)) { + // It's a struct access. idx is the index into the structure, + // which names the field. This index must have ubyte type. + const ConstantUInt *CUI = cast (idx); + assert (CUI->getType () == Type::UByteTy + && "Funny-looking structure index in GEP"); + // Use the TargetData structure to pick out what the layout of + // the structure is in memory. Since the structure index must + // be constant, we can get its value and use it to find the + // right byte offset from the StructLayout class's list of + // structure member offsets. + unsigned idxValue = CUI->getValue (); + unsigned memberOffset = + TD.getStructLayout (StTy)->MemberOffsets[idxValue]; + // Emit an ADD to add memberOffset to the basePtr. + BuildMI (BB, X86::ADDri32, 2, + nextBasePtrReg).addReg (basePtrReg).addZImm (memberOffset); + // The next type is the member of the structure selected by the + // index. + Ty = StTy->getElementTypes ()[idxValue]; + } else if (const SequentialType *SqTy = cast (Ty)) { + // It's an array or pointer access: [ArraySize x ElementType]. + // The documentation does not seem to match the code on the type + // of array indices. The code seems to use long, and the docs + // (and the comments) say uint. If it is long, I don't know what + // we are going to do, because the X86 loves 64-bit types. + const Type *typeOfSequentialTypeIndex = SqTy->getIndexType (); + // idx is the index into the array. Unlike with structure + // indices, we may not know its actual value at code-generation + // time. + assert (idx->getType () == typeOfSequentialTypeIndex + && "Funny-looking array index in GEP"); + // We want to add basePtrReg to (idxReg * sizeof + // ElementType). First, we must find the size of the pointed-to + // type. (Not coincidentally, the next type is the type of the + // elements in the array.) + Ty = SqTy->getElementType (); + unsigned elementSize = TD.getTypeSize (Ty); + unsigned elementSizeReg = makeAnotherReg (); + copyConstantToRegister (ConstantInt::get (typeOfSequentialTypeIndex, + elementSize), + elementSizeReg); + unsigned idxReg = getReg (idx); + // Emit a MUL to multiply the register holding the index by + // elementSize, putting the result in memberOffsetReg. + unsigned memberOffsetReg = makeAnotherReg (); + doMultiply (memberOffsetReg, typeOfSequentialTypeIndex, + elementSizeReg, idxReg); + // Emit an ADD to add memberOffsetReg to the basePtr. + BuildMI (BB, X86::ADDrr32, 2, + nextBasePtrReg).addReg (basePtrReg).addReg (memberOffsetReg); + } + // Now that we are here, further indices refer to subtypes of this + // one, so we don't need to worry about basePtrReg itself, anymore. + basePtrReg = nextBasePtrReg; + } + // After we have processed all the indices, the result is left in + // basePtrReg. Move it to the register where we were expected to + // put the answer. A 32-bit move should do it, because we are in + // ILP32 land. + BuildMI (BB, X86::MOVrr32, 1, getReg (I)).addReg (basePtrReg); +} + + +/// visitMallocInst - I know that personally, whenever I want to remember +/// something, I have to clear off some space in my brain. +void +ISel::visitMallocInst (MallocInst &I) +{ + visitInstruction (I); +} + + +/// visitAllocaInst - I want some stack space. Come on, man, I said I +/// want some freakin' stack space. +void +ISel::visitAllocaInst (AllocaInst &I) +{ + visitInstruction (I); +} + + /// createSimpleX86InstructionSelector - This pass converts an LLVM function /// into a machine code representation is a very simple peep-hole fashion. The /// generated code sucks but the implementation is nice and simple. diff --git a/lib/Target/X86/X86ISelSimple.cpp b/lib/Target/X86/X86ISelSimple.cpp index 217b219ba2a..e88354a6ad1 100644 --- a/lib/Target/X86/X86ISelSimple.cpp +++ b/lib/Target/X86/X86ISelSimple.cpp @@ -14,6 +14,7 @@ #include "llvm/iPHINode.h" #include "llvm/iMemory.h" #include "llvm/Type.h" +#include "llvm/DerivedTypes.h" #include "llvm/Constants.h" #include "llvm/Pass.h" #include "llvm/CodeGen/MachineFunction.h" @@ -22,6 +23,7 @@ #include "llvm/Support/InstVisitor.h" #include "llvm/Target/MRegisterInfo.h" #include +#include using namespace MOTy; // Get Use, Def, UseAndDef @@ -73,6 +75,8 @@ namespace { void visitSimpleBinary(BinaryOperator &B, unsigned OpcodeClass); void visitAdd(BinaryOperator &B) { visitSimpleBinary(B, 0); } void visitSub(BinaryOperator &B) { visitSimpleBinary(B, 1); } + void doMultiply(unsigned destReg, const Type *resultType, + unsigned op0Reg, unsigned op1Reg); void visitMul(BinaryOperator &B); void visitDiv(BinaryOperator &B) { visitDivRem(B); } @@ -96,7 +100,10 @@ namespace { // Memory Instructions void visitLoadInst(LoadInst &I); void visitStoreInst(StoreInst &I); - + void visitGetElementPtrInst(GetElementPtrInst &I); + void visitMallocInst(MallocInst &I); + void visitAllocaInst(AllocaInst &I); + // Other operators void visitShiftInst(ShiftInst &I); void visitPHINode(PHINode &I); @@ -114,6 +121,13 @@ namespace { /// void copyConstantToRegister(Constant *C, unsigned Reg); + /// makeAnotherReg - This method returns the next register number + /// we haven't yet used. + unsigned makeAnotherReg (void) { + unsigned Reg = CurReg++; + return Reg; + } + /// getReg - This method turns an LLVM value into a register number. This /// is guaranteed to produce the same register number for a particular value /// every time it is queried. @@ -122,7 +136,7 @@ namespace { unsigned getReg(Value *V) { unsigned &Reg = RegMap[V]; if (Reg == 0) { - Reg = CurReg++; + Reg = makeAnotherReg (); RegMap[V] = Reg; // Add the mapping of regnumber => reg class to MachineFunction @@ -182,6 +196,11 @@ static inline TypeClass getClass(const Type *Ty) { /// specified constant into the specified register. /// void ISel::copyConstantToRegister(Constant *C, unsigned R) { + if (isa (C)) { + // FIXME: We really need to handle getelementptr exprs, among + // other things. + std::cerr << "Offending expr: " << C << "\n"; + } assert (!isa(C) && "Constant expressions not yet handled!\n"); if (C->getType()->isIntegral()) { @@ -199,7 +218,11 @@ void ISel::copyConstantToRegister(Constant *C, unsigned R) { ConstantUInt *CUI = cast(C); BuildMI(BB, IntegralOpcodeTab[Class], 1, R).addZImm(CUI->getValue()); } + } else if (isa (C)) { + // Copy zero (null pointer) to the register. + BuildMI (BB, X86::MOVir32, 1, R).addZImm(0); } else { + std::cerr << "Offending constant: " << C << "\n"; assert(0 && "Type not handled yet!"); } } @@ -236,12 +259,12 @@ void ISel::visitSetCCInst(SetCondInst &I, unsigned OpNum) { // FIXME: assuming var1, var2 are in memory, if not, spill to // stack first case cFloat: // Floats - BuildMI (BB, X86::FLDr4, 1).addReg (reg1); - BuildMI (BB, X86::FLDr4, 1).addReg (reg2); + BuildMI (BB, X86::FLDr32, 1).addReg (reg1); + BuildMI (BB, X86::FLDr32, 1).addReg (reg2); break; case cDouble: // Doubles - BuildMI (BB, X86::FLDr8, 1).addReg (reg1); - BuildMI (BB, X86::FLDr8, 1).addReg (reg2); + BuildMI (BB, X86::FLDr64, 1).addReg (reg1); + BuildMI (BB, X86::FLDr64, 1).addReg (reg2); break; case cLong: default: @@ -345,10 +368,10 @@ ISel::visitReturnInst (ReturnInst &I) // ret float/double: top of FP stack // FLD case cFloat: // Floats - BuildMI (BB, X86::FLDr4, 1).addReg (getReg (rv)); + BuildMI (BB, X86::FLDr32, 1).addReg (getReg (rv)); break; case cDouble: // Doubles - BuildMI (BB, X86::FLDr8, 1).addReg (getReg (rv)); + BuildMI (BB, X86::FLDr64, 1).addReg (getReg (rv)); break; case cLong: // ret long: use EAX(least significant 32 bits)/EDX (most @@ -435,11 +458,31 @@ ISel::visitCallInst (CallInst & CI) // leaves it in... // if (CI.getType() != Type::VoidTy) { - switch (getClass(CI.getType())) { - case cInt: - BuildMI(BB, X86::MOVrr32, 1, getReg(CI)).addReg(X86::EAX); + unsigned resultTypeClass = getClass (CI.getType ()); + switch (resultTypeClass) { + case cByte: + case cShort: + case cInt: { + // Integral results are in %eax, or the appropriate portion + // thereof. + static const unsigned regRegMove[] = { + X86::MOVrr8, X86::MOVrr16, X86::MOVrr32 + }; + static const unsigned AReg[] = { X86::AL, X86::AX, X86::EAX }; + BuildMI (BB, regRegMove[resultTypeClass], 1, + getReg (CI)).addReg (AReg[resultTypeClass]); + break; + } + case cFloat: + // Floating-point return values live in %st(0) (i.e., the top of + // the FP stack.) The general way to approach this is to do a + // FSTP to save the top of the FP stack on the real stack, then + // do a MOV to load the top of the real stack into the target + // register. + visitInstruction (CI); // FIXME: add the right args for the calls below + // BuildMI (BB, X86::FSTPm32, 0); + // BuildMI (BB, X86::MOVmr32, 0); break; - default: std::cerr << "Cannot get return value for call of type '" << *CI.getType() << "'\n"; @@ -477,30 +520,41 @@ void ISel::visitSimpleBinary(BinaryOperator &B, unsigned OperatorClass) { BuildMI(BB, Opcode, 2, getReg(B)).addReg(Op0r).addReg(Op1r); } +/// doMultiply - Emit appropriate instructions to multiply together +/// the registers op0Reg and op1Reg, and put the result in destReg. +/// The type of the result should be given as resultType. +void +ISel::doMultiply(unsigned destReg, const Type *resultType, + unsigned op0Reg, unsigned op1Reg) +{ + unsigned Class = getClass (resultType); + + // FIXME: + assert (Class <= 2 && "Someday, we will learn how to multiply" + "longs and floating-point numbers. This is not that day."); + + static const unsigned Regs[] ={ X86::AL , X86::AX , X86::EAX }; + static const unsigned MulOpcode[]={ X86::MULrr8, X86::MULrr16, X86::MULrr32 }; + static const unsigned MovOpcode[]={ X86::MOVrr8, X86::MOVrr16, X86::MOVrr32 }; + unsigned Reg = Regs[Class]; + + // Emit a MOV to put the first operand into the appropriately-sized + // subreg of EAX. + BuildMI (BB, MovOpcode[Class], 1, Reg).addReg (op0Reg); + + // Emit the appropriate multiply instruction. + BuildMI (BB, MulOpcode[Class], 1).addReg (op1Reg); + + // Emit another MOV to put the result into the destination register. + BuildMI (BB, MovOpcode[Class], 1, destReg).addReg (Reg); +} + /// visitMul - Multiplies are not simple binary operators because they must deal /// with the EAX register explicitly. /// void ISel::visitMul(BinaryOperator &I) { - unsigned Class = getClass(I.getType()); - if (Class > 2) // FIXME: Handle longs - visitInstruction(I); - - static const unsigned Regs[] ={ X86::AL , X86::AX , X86::EAX }; - static const unsigned MulOpcode[]={ X86::MULrr8, X86::MULrr16, X86::MULrr32 }; - static const unsigned MovOpcode[]={ X86::MOVrr8, X86::MOVrr16, X86::MOVrr32 }; - - unsigned Reg = Regs[Class]; - unsigned Op0Reg = getReg(I.getOperand(0)); - unsigned Op1Reg = getReg(I.getOperand(1)); - - // Put the first operand into one of the A registers... - BuildMI(BB, MovOpcode[Class], 1, Reg).addReg(Op0Reg); - - // Emit the appropriate multiply instruction... - BuildMI(BB, MulOpcode[Class], 1).addReg(Op1Reg); - - // Put the result into the destination register... - BuildMI(BB, MovOpcode[Class], 1, getReg(I)).addReg(Reg); + doMultiply (getReg (I), I.getType (), + getReg (I.getOperand (0)), getReg (I.getOperand (1))); } @@ -732,9 +786,119 @@ ISel::visitCastInst (CastInst &CI) return; } // Anything we haven't handled already, we can't (yet) handle at all. + // + // FP to integral casts can be handled with FISTP to store onto the + // stack while converting to integer, followed by a MOV to load from + // the stack into the result register. Integral to FP casts can be + // handled with MOV to store onto the stack, followed by a FILD to + // load from the stack while converting to FP. For the moment, I + // can't quite get straight in my head how to borrow myself some + // stack space and write on it. Otherwise, this would be trivial. visitInstruction (CI); } +/// visitGetElementPtrInst - I don't know, most programs don't have +/// getelementptr instructions, right? That means we can put off +/// implementing this, right? Right. This method emits machine +/// instructions to perform type-safe pointer arithmetic. I am +/// guessing this could be cleaned up somewhat to use fewer temporary +/// registers. +void +ISel::visitGetElementPtrInst (GetElementPtrInst &I) +{ + Value *basePtr = I.getPointerOperand (); + const TargetData &TD = TM.DataLayout; + unsigned basePtrReg = getReg (basePtr); + unsigned resultReg = getReg (I); + const Type *Ty = basePtr->getType(); + // GEPs have zero or more indices; we must perform a struct access + // or array access for each one. + for (GetElementPtrInst::op_iterator oi = I.idx_begin (), + oe = I.idx_end (); oi != oe; ++oi) { + Value *idx = *oi; + unsigned nextBasePtrReg = makeAnotherReg (); + if (const StructType *StTy = dyn_cast (Ty)) { + // It's a struct access. idx is the index into the structure, + // which names the field. This index must have ubyte type. + const ConstantUInt *CUI = cast (idx); + assert (CUI->getType () == Type::UByteTy + && "Funny-looking structure index in GEP"); + // Use the TargetData structure to pick out what the layout of + // the structure is in memory. Since the structure index must + // be constant, we can get its value and use it to find the + // right byte offset from the StructLayout class's list of + // structure member offsets. + unsigned idxValue = CUI->getValue (); + unsigned memberOffset = + TD.getStructLayout (StTy)->MemberOffsets[idxValue]; + // Emit an ADD to add memberOffset to the basePtr. + BuildMI (BB, X86::ADDri32, 2, + nextBasePtrReg).addReg (basePtrReg).addZImm (memberOffset); + // The next type is the member of the structure selected by the + // index. + Ty = StTy->getElementTypes ()[idxValue]; + } else if (const SequentialType *SqTy = cast (Ty)) { + // It's an array or pointer access: [ArraySize x ElementType]. + // The documentation does not seem to match the code on the type + // of array indices. The code seems to use long, and the docs + // (and the comments) say uint. If it is long, I don't know what + // we are going to do, because the X86 loves 64-bit types. + const Type *typeOfSequentialTypeIndex = SqTy->getIndexType (); + // idx is the index into the array. Unlike with structure + // indices, we may not know its actual value at code-generation + // time. + assert (idx->getType () == typeOfSequentialTypeIndex + && "Funny-looking array index in GEP"); + // We want to add basePtrReg to (idxReg * sizeof + // ElementType). First, we must find the size of the pointed-to + // type. (Not coincidentally, the next type is the type of the + // elements in the array.) + Ty = SqTy->getElementType (); + unsigned elementSize = TD.getTypeSize (Ty); + unsigned elementSizeReg = makeAnotherReg (); + copyConstantToRegister (ConstantInt::get (typeOfSequentialTypeIndex, + elementSize), + elementSizeReg); + unsigned idxReg = getReg (idx); + // Emit a MUL to multiply the register holding the index by + // elementSize, putting the result in memberOffsetReg. + unsigned memberOffsetReg = makeAnotherReg (); + doMultiply (memberOffsetReg, typeOfSequentialTypeIndex, + elementSizeReg, idxReg); + // Emit an ADD to add memberOffsetReg to the basePtr. + BuildMI (BB, X86::ADDrr32, 2, + nextBasePtrReg).addReg (basePtrReg).addReg (memberOffsetReg); + } + // Now that we are here, further indices refer to subtypes of this + // one, so we don't need to worry about basePtrReg itself, anymore. + basePtrReg = nextBasePtrReg; + } + // After we have processed all the indices, the result is left in + // basePtrReg. Move it to the register where we were expected to + // put the answer. A 32-bit move should do it, because we are in + // ILP32 land. + BuildMI (BB, X86::MOVrr32, 1, getReg (I)).addReg (basePtrReg); +} + + +/// visitMallocInst - I know that personally, whenever I want to remember +/// something, I have to clear off some space in my brain. +void +ISel::visitMallocInst (MallocInst &I) +{ + visitInstruction (I); +} + + +/// visitAllocaInst - I want some stack space. Come on, man, I said I +/// want some freakin' stack space. +void +ISel::visitAllocaInst (AllocaInst &I) +{ + visitInstruction (I); +} + + /// createSimpleX86InstructionSelector - This pass converts an LLVM function /// into a machine code representation is a very simple peep-hole fashion. The /// generated code sucks but the implementation is nice and simple. diff --git a/lib/Target/X86/X86InstrInfo.def b/lib/Target/X86/X86InstrInfo.def index bf9dba83453..d7796655f9b 100644 --- a/lib/Target/X86/X86InstrInfo.def +++ b/lib/Target/X86/X86InstrInfo.def @@ -152,8 +152,8 @@ I(SARir16 , "sarw", 0xC1, 0, X86II::MRMS7r | X86II::OpSize, NoI I(SARir32 , "sarl", 0xC1, 0, X86II::MRMS7r, NoIR, NoIR) // R32 >>= imm8 // Floating point loads -I(FLDr4 , "flds", 0xD9, 0, X86II::MRMS0m, NoIR, NoIR) // push float -I(FLDr8 , "fldl ", 0xDD, 0, X86II::MRMS0m, NoIR, NoIR) // push double +I(FLDr32 , "flds", 0xD9, 0, X86II::MRMS0m, NoIR, NoIR) // push float +I(FLDr64 , "fldl", 0xDD, 0, X86II::MRMS0m, NoIR, NoIR) // push double // Floating point compares I(FUCOMPP , "fucompp", 0xDA, 0, X86II::Void, NoIR, NoIR) // compare+pop2x diff --git a/tools/jello/GlobalVars.cpp b/tools/jello/GlobalVars.cpp index a9bda6279dc..b13511c0460 100644 --- a/tools/jello/GlobalVars.cpp +++ b/tools/jello/GlobalVars.cpp @@ -9,6 +9,7 @@ #include "llvm/Constants.h" #include "llvm/Target/TargetMachine.h" #include "VM.h" +#include /// EmitGlobals - Emit all of the global variables to memory, storing their /// addresses into GlobalAddress. This must make sure to copy the contents of @@ -77,6 +78,20 @@ void VM::emitConstantToMemory(Constant *Init, void *Addr) { return; default: break; } + } else if (ConstantFP *CF = dyn_cast (Init)) { + switch (CF->getType ()->getPrimitiveID ()) { + case Type::FloatTyID: + *(float*)Addr = CF->getValue (); + return; + case Type::DoubleTyID: + *(double*)Addr = CF->getValue (); + return; + default: break; + } + } else if (ConstantPointerNull *CP = dyn_cast (Init)) { + // Fill the space with a NULL pointer. + *(void **)Addr = NULL; + return; } else if (ConstantArray *CA = dyn_cast(Init)) { unsigned ElementSize = TD.getTypeSize(CA->getType()->getElementType()); for (unsigned i = 0, e = CA->getType()->getNumElements(); i != e; ++i) { @@ -86,5 +101,6 @@ void VM::emitConstantToMemory(Constant *Init, void *Addr) { return; } + std::cerr << "Offending constant: " << Init << "\n"; assert(0 && "Don't know how to emit this constant to memory!"); }