Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 1 | //===-- ReaderInternals.h - Definitions internal to the reader ---*- C++ -*--=// |
| 2 | // |
| 3 | // This header file defines various stuff that is used by the bytecode reader. |
| 4 | // |
| 5 | //===----------------------------------------------------------------------===// |
| 6 | |
| 7 | #ifndef READER_INTERNALS_H |
| 8 | #define READER_INTERNALS_H |
| 9 | |
#include "llvm/Bytecode/Primitives.h"
#include "llvm/DerivedTypes.h"
#include "llvm/Function.h"
#include "llvm/Constant.h"
#include <cassert>
#include <cstddef>
#include <cstdlib>
#include <iostream>
#include <map>
#include <string>
#include <utility>
#include <vector>
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 16 | |
// Enable to trace to figure out what the heck is going on when parsing fails.
// Messages whose level 'n' is below TRACE_LEVEL are printed to std::cerr,
// indented by two spaces per level; with TRACE_LEVEL == 0 the macro expands
// to nothing.
#define TRACE_LEVEL 0

#if TRACE_LEVEL    // ByteCodeReading_TRACEer
// The do/while(0) wrapper makes the expansion a single statement, so that
//   if (C) BCR_TRACE(1, "x"); else ...
// cannot have its 'else' captured by the 'if' inside the macro.  'n' is
// parenthesized so that expression arguments keep their meaning.  'X' is
// deliberately NOT parenthesized: callers pass a chain of '<<' operands.
#define BCR_TRACE(n, X) \
  do { \
    if ((n) < TRACE_LEVEL) \
      std::cerr << std::string((n)*2, ' ') << X; \
  } while (0)
#else
#define BCR_TRACE(n, X)
#endif
| 26 | |
// uchar - Shorthand for the byte type used for the bytecode buffer pointers
// throughout this header.
typedef unsigned char uchar;
| 28 | |
| 29 | struct RawInst { // The raw fields out of the bytecode stream... |
| 30 | unsigned NumOperands; |
| 31 | unsigned Opcode; |
| 32 | const Type *Ty; |
| 33 | unsigned Arg1, Arg2; |
| 34 | union { |
| 35 | unsigned Arg3; |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 36 | std::vector<unsigned> *VarArgs; // Contains arg #3,4,5... if NumOperands > 3 |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 37 | }; |
| 38 | }; |
| 39 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 40 | class BytecodeParser : public AbstractTypeUser { |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 41 | std::string Error; // Error message string goes here... |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 42 | BytecodeParser(const BytecodeParser &); // DO NOT IMPLEMENT |
| 43 | void operator=(const BytecodeParser &); // DO NOT IMPLEMENT |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 44 | public: |
| 45 | BytecodeParser() { |
| 46 | // Define this in case we don't see a ModuleGlobalInfo block. |
| 47 | FirstDerivedTyID = Type::FirstDerivedTyID; |
| 48 | } |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 49 | ~BytecodeParser() { |
| 50 | freeTable(Values); |
| 51 | freeTable(LateResolveValues); |
| 52 | freeTable(ModuleValues); |
| 53 | } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 54 | |
| 55 | Module *ParseBytecode(const uchar *Buf, const uchar *EndBuf); |
Chris Lattner | d6b6525 | 2001-10-24 01:15:12 +0000 | [diff] [blame] | 56 | |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 57 | std::string getError() const { return Error; } |
Chris Lattner | d6b6525 | 2001-10-24 01:15:12 +0000 | [diff] [blame] | 58 | |
Chris Lattner | b3afb1f | 2002-04-04 19:24:11 +0000 | [diff] [blame] | 59 | void dump() const { |
Anand Shukla | eea60fc | 2002-06-25 20:44:04 +0000 | [diff] [blame] | 60 | std::cerr << "BytecodeParser instance!\n"; |
Chris Lattner | b3afb1f | 2002-04-04 19:24:11 +0000 | [diff] [blame] | 61 | } |
| 62 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 63 | private: // All of this data is transient across calls to ParseBytecode |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 64 | struct ValueList : public User { |
| 65 | ValueList() : User(Type::TypeTy, Value::TypeVal) { |
| 66 | } |
| 67 | ~ValueList() {} |
| 68 | |
| 69 | // vector compatibility methods |
| 70 | unsigned size() const { return getNumOperands(); } |
| 71 | void push_back(Value *V) { Operands.push_back(Use(V, this)); } |
| 72 | Value *back() const { return Operands.back(); } |
| 73 | void pop_back() { Operands.pop_back(); } |
| 74 | bool empty() const { return Operands.empty(); } |
| 75 | |
| 76 | virtual void print(std::ostream& OS) const { |
| 77 | OS << "Bytecode Reader UseHandle!"; |
| 78 | } |
| 79 | }; |
| 80 | |
Chris Lattner | 05950c3 | 2001-10-13 06:47:01 +0000 | [diff] [blame] | 81 | Module *TheModule; // Current Module being read into... |
| 82 | |
Chris Lattner | 036b8aa | 2003-03-06 17:55:45 +0000 | [diff] [blame] | 83 | // Information about the module, extracted from the bytecode revision number. |
| 84 | unsigned char RevisionNum; // The rev # itself |
| 85 | unsigned char FirstDerivedTyID; // First variable index to use for type |
| 86 | bool HasImplicitZeroInitializer; // Is entry 0 of every slot implicity zeros? |
| 87 | bool isBigEndian, hasLongPointers;// Information about the target compiled for |
| 88 | |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 89 | typedef std::vector<ValueList*> ValueTable; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 90 | ValueTable Values, LateResolveValues; |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 91 | ValueTable ModuleValues; |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 92 | |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 93 | // GlobalRefs - This maintains a mapping between <Type, Slot #>'s and forward |
| 94 | // references to global values or constants. Such values may be referenced |
| 95 | // before they are defined, and if so, the temporary object that they |
| 96 | // represent is held here. |
| 97 | // |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 98 | typedef std::map<std::pair<const Type *, unsigned>, Value*> GlobalRefsType; |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 99 | GlobalRefsType GlobalRefs; |
Chris Lattner | 05950c3 | 2001-10-13 06:47:01 +0000 | [diff] [blame] | 100 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 101 | // TypesLoaded - This vector mirrors the Values[TypeTyID] plane. It is used |
| 102 | // to deal with forward references to types. |
| 103 | // |
Chris Lattner | 697954c | 2002-01-20 22:54:45 +0000 | [diff] [blame] | 104 | typedef std::vector<PATypeHandle<Type> > TypeValuesListTy; |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 105 | TypeValuesListTy ModuleTypeValues; |
Chris Lattner | 6e5a0e4 | 2003-03-06 17:18:14 +0000 | [diff] [blame] | 106 | TypeValuesListTy FunctionTypeValues; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 107 | |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 108 | // When the ModuleGlobalInfo section is read, we create a function object for |
| 109 | // each function in the module. When the function is loaded, this function is |
| 110 | // filled in. |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 111 | // |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 112 | std::vector<std::pair<Function*, unsigned> > FunctionSignatureList; |
| 113 | |
| 114 | // Constant values are read in after global variables. Because of this, we |
| 115 | // must defer setting the initializers on global variables until after module |
| 116 | // level constants have been read. In the mean time, this list keeps track of |
| 117 | // what we must do. |
| 118 | // |
| 119 | std::vector<std::pair<GlobalVariable*, unsigned> > GlobalInits; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 120 | |
| 121 | private: |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 122 | void freeTable(ValueTable &Tab) { |
| 123 | while (!Tab.empty()) { |
| 124 | delete Tab.back(); |
| 125 | Tab.pop_back(); |
| 126 | } |
| 127 | } |
| 128 | |
Chris Lattner | 2a7b6ba | 2003-03-06 17:15:19 +0000 | [diff] [blame] | 129 | bool ParseModule (const uchar * Buf, const uchar *End); |
Chris Lattner | 036b8aa | 2003-03-06 17:55:45 +0000 | [diff] [blame] | 130 | bool ParseVersionInfo (const uchar *&Buf, const uchar *End); |
Chris Lattner | 2a7b6ba | 2003-03-06 17:15:19 +0000 | [diff] [blame] | 131 | bool ParseModuleGlobalInfo(const uchar *&Buf, const uchar *End); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 132 | bool ParseSymbolTable (const uchar *&Buf, const uchar *End, SymbolTable *); |
Chris Lattner | 6e5a0e4 | 2003-03-06 17:18:14 +0000 | [diff] [blame] | 133 | bool ParseFunction (const uchar *&Buf, const uchar *End); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 134 | bool ParseBasicBlock (const uchar *&Buf, const uchar *End, BasicBlock *&); |
Chris Lattner | 352eef7 | 2002-08-21 22:55:27 +0000 | [diff] [blame] | 135 | bool ParseInstruction (const uchar *&Buf, const uchar *End, Instruction *&, |
| 136 | BasicBlock *BB /*HACK*/); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 137 | bool ParseRawInst (const uchar *&Buf, const uchar *End, RawInst &); |
| 138 | |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 139 | bool ParseGlobalTypes(const uchar *&Buf, const uchar *EndBuf); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 140 | bool ParseConstantPool(const uchar *&Buf, const uchar *EndBuf, |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 141 | ValueTable &Tab, TypeValuesListTy &TypeTab); |
Chris Lattner | e9bb2df | 2001-12-03 22:26:30 +0000 | [diff] [blame] | 142 | bool parseConstantValue(const uchar *&Buf, const uchar *End, |
| 143 | const Type *Ty, Constant *&V); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 144 | bool parseTypeConstants(const uchar *&Buf, const uchar *EndBuf, |
| 145 | TypeValuesListTy &Tab, unsigned NumEntries); |
| 146 | const Type *parseTypeConstant(const uchar *&Buf, const uchar *EndBuf); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 147 | |
| 148 | Value *getValue(const Type *Ty, unsigned num, bool Create = true); |
| 149 | const Type *getType(unsigned ID); |
Chris Lattner | bbd4b30 | 2002-10-14 03:33:02 +0000 | [diff] [blame] | 150 | Constant *getConstantValue(const Type *Ty, unsigned num); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 151 | |
Chris Lattner | 52e20b0 | 2003-03-19 20:54:26 +0000 | [diff] [blame^] | 152 | int insertValue(Value *V, ValueTable &Table); // -1 = Failure |
| 153 | void setValueTo(ValueTable &D, unsigned Slot, Value *V); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 154 | bool postResolveValues(ValueTable &ValTab); |
| 155 | |
| 156 | bool getTypeSlot(const Type *Ty, unsigned &Slot); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 157 | |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 158 | // resolve all references to the placeholder (if any) for the given value |
| 159 | void ResolveReferencesToValue(Value *Val, unsigned Slot); |
| 160 | |
Vikram S. Adve | c668b7c | 2002-07-14 23:05:09 +0000 | [diff] [blame] | 161 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 162 | // refineAbstractType - The callback method is invoked when one of the |
| 163 | // elements of TypeValues becomes more concrete... |
| 164 | // |
| 165 | virtual void refineAbstractType(const DerivedType *OldTy, const Type *NewTy); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 166 | }; |
| 167 | |
| 168 | template<class SuperType> |
| 169 | class PlaceholderDef : public SuperType { |
| 170 | unsigned ID; |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 171 | PlaceholderDef(); // DO NOT IMPLEMENT |
| 172 | void operator=(const PlaceholderDef &); // DO NOT IMPLEMENT |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 173 | public: |
| 174 | PlaceholderDef(const Type *Ty, unsigned id) : SuperType(Ty), ID(id) {} |
| 175 | unsigned getID() { return ID; } |
| 176 | }; |
| 177 | |
| 178 | struct InstPlaceHolderHelper : public Instruction { |
| 179 | InstPlaceHolderHelper(const Type *Ty) : Instruction(Ty, UserOp1, "") {} |
Chris Lattner | a41f50d | 2001-07-07 19:24:15 +0000 | [diff] [blame] | 180 | virtual const char *getOpcodeName() const { return "placeholder"; } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 181 | |
| 182 | virtual Instruction *clone() const { abort(); return 0; } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 183 | }; |
| 184 | |
| 185 | struct BBPlaceHolderHelper : public BasicBlock { |
| 186 | BBPlaceHolderHelper(const Type *Ty) : BasicBlock() { |
Chris Lattner | 35e309a | 2002-04-08 21:59:36 +0000 | [diff] [blame] | 187 | assert(Ty == Type::LabelTy); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 188 | } |
| 189 | }; |
| 190 | |
Vikram S. Adve | c668b7c | 2002-07-14 23:05:09 +0000 | [diff] [blame] | 191 | struct ConstantPlaceHolderHelper : public Constant { |
| 192 | ConstantPlaceHolderHelper(const Type *Ty) |
| 193 | : Constant(Ty) {} |
| 194 | virtual bool isNullValue() const { return false; } |
| 195 | }; |
| 196 | |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 197 | typedef PlaceholderDef<InstPlaceHolderHelper> ValPHolder; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 198 | typedef PlaceholderDef<BBPlaceHolderHelper> BBPHolder; |
Vikram S. Adve | c668b7c | 2002-07-14 23:05:09 +0000 | [diff] [blame] | 199 | typedef PlaceholderDef<ConstantPlaceHolderHelper> ConstPHolder; |
| 200 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 201 | |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 202 | static inline unsigned getValueIDNumberFromPlaceHolder(Value *Val) { |
| 203 | if (isa<Constant>(Val)) |
| 204 | return ((ConstPHolder*)Val)->getID(); |
Vikram S. Adve | c668b7c | 2002-07-14 23:05:09 +0000 | [diff] [blame] | 205 | |
| 206 | // else discriminate by type |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 207 | switch (Val->getType()->getPrimitiveID()) { |
| 208 | case Type::LabelTyID: return ((BBPHolder*)Val)->getID(); |
Chris Lattner | 7473413 | 2002-08-17 22:01:27 +0000 | [diff] [blame] | 209 | default: return ((ValPHolder*)Val)->getID(); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 210 | } |
| 211 | } |
| 212 | |
| 213 | static inline bool readBlock(const uchar *&Buf, const uchar *EndBuf, |
| 214 | unsigned &Type, unsigned &Size) { |
| 215 | #if DEBUG_OUTPUT |
| 216 | bool Result = read(Buf, EndBuf, Type) || read(Buf, EndBuf, Size); |
Anand Shukla | eea60fc | 2002-06-25 20:44:04 +0000 | [diff] [blame] | 217 | std::cerr << "StartLoc = " << ((unsigned)Buf & 4095) |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 218 | << " Type = " << Type << " Size = " << Size << endl; |
| 219 | return Result; |
| 220 | #else |
| 221 | return read(Buf, EndBuf, Type) || read(Buf, EndBuf, Size); |
| 222 | #endif |
| 223 | } |
| 224 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 225 | #endif |