Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 1 | //===-- ReaderInternals.h - Definitions internal to the reader ---*- C++ -*--=// |
| 2 | // |
| 3 | // This header file defines various stuff that is used by the bytecode reader. |
| 4 | // |
| 5 | //===----------------------------------------------------------------------===// |
| 6 | |
| 7 | #ifndef READER_INTERNALS_H |
| 8 | #define READER_INTERNALS_H |
| 9 | |
#include "llvm/Bytecode/Primitives.h"
#include "llvm/Function.h"
#include "llvm/BasicBlock.h"
#include "llvm/Instruction.h"
#include "llvm/DerivedTypes.h"
#include <cstddef>
#include <iostream>
#include <list>
#include <map>
#include <string>
#include <utility>
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 18 | |
// Enable to trace to figure out what the heck is going on when parsing fails.
// A message given level n is printed only when n < TRACE_LEVEL, so 0 disables
// all tracing.
#define TRACE_LEVEL 0

// BCR_TRACE (ByteCodeReading_TRACEer) - Print the stream expression X to
// std::cerr, indented by two spaces per level n.  X is deliberately left
// unparenthesized so that callers can pass a chain such as "foo" << Bar.
//
#if TRACE_LEVEL
// Wrapped in do { } while (0) so the expansion is a single statement: a bare
// `if` here would capture the `else` of an enclosing if/else at the call site.
#define BCR_TRACE(n, X) \
  do { \
    if ((n) < TRACE_LEVEL) std::cerr << std::string((n)*2, ' ') << X; \
  } while (0)
#else
#define BCR_TRACE(n, X)
#endif
| 27 | |
// uchar - Shorthand for the byte type; the parsing routines in this header
// take their buffer positions as `const uchar *`.
typedef unsigned char uchar;
| 29 | |
| 30 | struct RawInst { // The raw fields out of the bytecode stream... |
| 31 | unsigned NumOperands; |
| 32 | unsigned Opcode; |
| 33 | const Type *Ty; |
| 34 | unsigned Arg1, Arg2; |
| 35 | union { |
| 36 | unsigned Arg3; |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 37 | std::vector<unsigned> *VarArgs; // Contains arg #3,4,5... if NumOperands > 3 |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 38 | }; |
| 39 | }; |
| 40 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 41 | class BytecodeParser : public AbstractTypeUser { |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 42 | std::string Error; // Error message string goes here... |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 43 | public: |
| 44 | BytecodeParser() { |
| 45 | // Define this in case we don't see a ModuleGlobalInfo block. |
| 46 | FirstDerivedTyID = Type::FirstDerivedTyID; |
| 47 | } |
| 48 | |
| 49 | Module *ParseBytecode(const uchar *Buf, const uchar *EndBuf); |
Chris Lattner | d6b6525 | 2001-10-24 01:15:12 +0000 | [diff] [blame] | 50 | |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 51 | std::string getError() const { return Error; } |
Chris Lattner | d6b6525 | 2001-10-24 01:15:12 +0000 | [diff] [blame] | 52 | |
Chris Lattner | b3afb1f | 2002-04-04 19:24:11 +0000 | [diff] [blame] | 53 | void dump() const { |
| 54 | cerr << "BytecodeParser instance!\n"; |
| 55 | } |
| 56 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 57 | private: // All of this data is transient across calls to ParseBytecode |
Chris Lattner | 05950c3 | 2001-10-13 06:47:01 +0000 | [diff] [blame] | 58 | Module *TheModule; // Current Module being read into... |
| 59 | |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 60 | typedef std::vector<Value *> ValueList; |
| 61 | typedef std::vector<ValueList> ValueTable; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 62 | ValueTable Values, LateResolveValues; |
| 63 | ValueTable ModuleValues, LateResolveModuleValues; |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 64 | |
Chris Lattner | 05950c3 | 2001-10-13 06:47:01 +0000 | [diff] [blame] | 65 | // GlobalRefs - This maintains a mapping between <Type, Slot #>'s and forward |
| 66 | // references to global values. Global values may be referenced before they |
| 67 | // are defined, and if so, the temporary object that they represent is held |
| 68 | // here. |
| 69 | // |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 70 | typedef std::map<std::pair<const PointerType *, unsigned>, |
| 71 | GlobalVariable*> GlobalRefsType; |
Chris Lattner | 05950c3 | 2001-10-13 06:47:01 +0000 | [diff] [blame] | 72 | GlobalRefsType GlobalRefs; |
| 73 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 74 | // TypesLoaded - This vector mirrors the Values[TypeTyID] plane. It is used |
| 75 | // to deal with forward references to types. |
| 76 | // |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 77 | typedef std::vector<PATypeHandle<Type> > TypeValuesListTy; |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 78 | TypeValuesListTy ModuleTypeValues; |
| 79 | TypeValuesListTy MethodTypeValues; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 80 | |
| 81 | // Information read from the ModuleGlobalInfo section of the file... |
| 82 | unsigned FirstDerivedTyID; |
| 83 | |
| 84 | // When the ModuleGlobalInfo section is read, we load the type of each method |
| 85 | // and the 'ModuleValues' slot that it lands in. We then load a placeholder |
| 86 | // into its slot to reserve it. When the method is loaded, this placeholder |
| 87 | // is replaced. |
| 88 | // |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 89 | std::list<std::pair<const PointerType *, unsigned> > MethodSignatureList; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 90 | |
| 91 | private: |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 92 | bool ParseModule (const uchar * Buf, const uchar *End, Module *&); |
| 93 | bool ParseModuleGlobalInfo(const uchar *&Buf, const uchar *End, Module *); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 94 | bool ParseSymbolTable (const uchar *&Buf, const uchar *End, SymbolTable *); |
| 95 | bool ParseMethod (const uchar *&Buf, const uchar *End, Module *); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 96 | bool ParseBasicBlock (const uchar *&Buf, const uchar *End, BasicBlock *&); |
| 97 | bool ParseInstruction (const uchar *&Buf, const uchar *End, Instruction *&); |
| 98 | bool ParseRawInst (const uchar *&Buf, const uchar *End, RawInst &); |
| 99 | |
| 100 | bool ParseConstantPool(const uchar *&Buf, const uchar *EndBuf, |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 101 | ValueTable &Tab, TypeValuesListTy &TypeTab); |
Chris Lattner | e9bb2df | 2001-12-03 22:26:30 +0000 | [diff] [blame] | 102 | bool parseConstantValue(const uchar *&Buf, const uchar *End, |
| 103 | const Type *Ty, Constant *&V); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 104 | bool parseTypeConstants(const uchar *&Buf, const uchar *EndBuf, |
| 105 | TypeValuesListTy &Tab, unsigned NumEntries); |
| 106 | const Type *parseTypeConstant(const uchar *&Buf, const uchar *EndBuf); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 107 | |
| 108 | Value *getValue(const Type *Ty, unsigned num, bool Create = true); |
| 109 | const Type *getType(unsigned ID); |
| 110 | |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 111 | int insertValue(Value *D, std::vector<ValueList> &D); // -1 = Failure |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 112 | bool postResolveValues(ValueTable &ValTab); |
| 113 | |
| 114 | bool getTypeSlot(const Type *Ty, unsigned &Slot); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 115 | |
Chris Lattner | 05950c3 | 2001-10-13 06:47:01 +0000 | [diff] [blame] | 116 | // DeclareNewGlobalValue - Patch up forward references to global values in the |
Chris Lattner | e9bb2df | 2001-12-03 22:26:30 +0000 | [diff] [blame] | 117 | // form of ConstantPointerRefs. |
Chris Lattner | 05950c3 | 2001-10-13 06:47:01 +0000 | [diff] [blame] | 118 | // |
| 119 | void DeclareNewGlobalValue(GlobalValue *GV, unsigned Slot); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 120 | |
| 121 | // refineAbstractType - The callback method is invoked when one of the |
| 122 | // elements of TypeValues becomes more concrete... |
| 123 | // |
| 124 | virtual void refineAbstractType(const DerivedType *OldTy, const Type *NewTy); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 125 | }; |
| 126 | |
| 127 | template<class SuperType> |
| 128 | class PlaceholderDef : public SuperType { |
| 129 | unsigned ID; |
| 130 | public: |
| 131 | PlaceholderDef(const Type *Ty, unsigned id) : SuperType(Ty), ID(id) {} |
| 132 | unsigned getID() { return ID; } |
| 133 | }; |
| 134 | |
| 135 | struct InstPlaceHolderHelper : public Instruction { |
| 136 | InstPlaceHolderHelper(const Type *Ty) : Instruction(Ty, UserOp1, "") {} |
Chris Lattner | a41f50d | 2001-07-07 19:24:15 +0000 | [diff] [blame] | 137 | virtual const char *getOpcodeName() const { return "placeholder"; } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 138 | |
| 139 | virtual Instruction *clone() const { abort(); return 0; } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 140 | }; |
| 141 | |
| 142 | struct BBPlaceHolderHelper : public BasicBlock { |
| 143 | BBPlaceHolderHelper(const Type *Ty) : BasicBlock() { |
Chris Lattner | 35e309a | 2002-04-08 21:59:36 +0000 | [diff] [blame] | 144 | assert(Ty == Type::LabelTy); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 145 | } |
| 146 | }; |
| 147 | |
Chris Lattner | c9aa7df | 2002-03-29 03:51:11 +0000 | [diff] [blame] | 148 | struct MethPlaceHolderHelper : public Function { |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 149 | MethPlaceHolderHelper(const Type *Ty) |
Chris Lattner | c9aa7df | 2002-03-29 03:51:11 +0000 | [diff] [blame] | 150 | : Function(cast<const FunctionType>(Ty), true) { |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 151 | } |
| 152 | }; |
| 153 | |
// Concrete placeholder types: each combines one of the *PlaceHolderHelper
// classes with the ID storage provided by PlaceholderDef.
typedef PlaceholderDef<InstPlaceHolderHelper>  DefPHolder;
typedef PlaceholderDef<BBPlaceHolderHelper>    BBPHolder;
typedef PlaceholderDef<MethPlaceHolderHelper>  MethPHolder;
| 157 | |
| 158 | static inline unsigned getValueIDNumberFromPlaceHolder(Value *Def) { |
| 159 | switch (Def->getType()->getPrimitiveID()) { |
Chris Lattner | c9aa7df | 2002-03-29 03:51:11 +0000 | [diff] [blame] | 160 | case Type::LabelTyID: return ((BBPHolder*)Def)->getID(); |
| 161 | case Type::FunctionTyID: return ((MethPHolder*)Def)->getID(); |
| 162 | default: return ((DefPHolder*)Def)->getID(); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 163 | } |
| 164 | } |
| 165 | |
| 166 | static inline bool readBlock(const uchar *&Buf, const uchar *EndBuf, |
| 167 | unsigned &Type, unsigned &Size) { |
| 168 | #if DEBUG_OUTPUT |
| 169 | bool Result = read(Buf, EndBuf, Type) || read(Buf, EndBuf, Size); |
| 170 | cerr << "StartLoc = " << ((unsigned)Buf & 4095) |
| 171 | << " Type = " << Type << " Size = " << Size << endl; |
| 172 | return Result; |
| 173 | #else |
| 174 | return read(Buf, EndBuf, Type) || read(Buf, EndBuf, Size); |
| 175 | #endif |
| 176 | } |
| 177 | |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 178 | |
// failure Template - Identity function: hands back its argument unchanged.
// It exists as a single place to put a breakpoint when debugging failures of
// the bytecode parser.
//
template <typename ResultTy>
static ResultTy failure(ResultTy Result) {
  return Result;
}
| 186 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 187 | #endif |