blob: a8528e4113adca397582eae9e9d3b62617515d52 [file] [log] [blame]
//===-- ReaderInternals.h - Definitions internal to the reader ---*- C++ -*--=//
//
// This header file defines various stuff that is used by the bytecode reader.
//
//===----------------------------------------------------------------------===//
6
7#ifndef READER_INTERNALS_H
8#define READER_INTERNALS_H
9
#include "llvm/Bytecode/Primitives.h"
#include "llvm/DerivedTypes.h"
#include "llvm/Function.h"
#include "llvm/Constant.h"
#include <cstddef>
#include <map>
#include <utility>
Chris Lattner00950542001-06-06 20:29:01 +000016
// Enable to trace to figure out what the heck is going on when parsing fails.
//
// BCR_TRACE(n, X) streams X to std::cerr, indented by 2*n spaces, whenever the
// level n is below TRACE_LEVEL.  With TRACE_LEVEL set to 0 the macro expands
// to nothing, so X is never evaluated.
#define TRACE_LEVEL 0

#if TRACE_LEVEL    // ByteCodeReading_TRACEer
// The expansion is wrapped in do/while(0) so that it forms exactly one
// statement: a caller writing "if (c) BCR_TRACE(...); else ..." keeps its
// 'else' attached to its own 'if'.  'n' is parenthesized so that compound
// expressions passed as the level are evaluated as a unit.
#define BCR_TRACE(n, X) \
    do { \
      if ((n) < TRACE_LEVEL) std::cerr << std::string((n)*2, ' ') << X; \
    } while (0)
#else
#define BCR_TRACE(n, X)
#endif
26
// uchar - Shorthand for the byte type used for the raw bytecode buffer
// pointers throughout the reader.
typedef unsigned char uchar;
28
29struct RawInst { // The raw fields out of the bytecode stream...
30 unsigned NumOperands;
31 unsigned Opcode;
32 const Type *Ty;
33 unsigned Arg1, Arg2;
34 union {
35 unsigned Arg3;
Chris Lattner697954c2002-01-20 22:54:45 +000036 std::vector<unsigned> *VarArgs; // Contains arg #3,4,5... if NumOperands > 3
Chris Lattner00950542001-06-06 20:29:01 +000037 };
38};
39
Chris Lattner1d670cc2001-09-07 16:37:43 +000040class BytecodeParser : public AbstractTypeUser {
Chris Lattner697954c2002-01-20 22:54:45 +000041 std::string Error; // Error message string goes here...
Chris Lattner74734132002-08-17 22:01:27 +000042 BytecodeParser(const BytecodeParser &); // DO NOT IMPLEMENT
43 void operator=(const BytecodeParser &); // DO NOT IMPLEMENT
Chris Lattner00950542001-06-06 20:29:01 +000044public:
45 BytecodeParser() {
46 // Define this in case we don't see a ModuleGlobalInfo block.
47 FirstDerivedTyID = Type::FirstDerivedTyID;
48 }
Chris Lattner52e20b02003-03-19 20:54:26 +000049 ~BytecodeParser() {
50 freeTable(Values);
51 freeTable(LateResolveValues);
52 freeTable(ModuleValues);
53 }
Chris Lattner00950542001-06-06 20:29:01 +000054
Chris Lattner75f20532003-04-22 18:02:52 +000055 Module *ParseBytecode(const uchar *Buf, const uchar *EndBuf,
56 const std::string &ModuleID);
Chris Lattnerd6b65252001-10-24 01:15:12 +000057
Chris Lattner697954c2002-01-20 22:54:45 +000058 std::string getError() const { return Error; }
Chris Lattnerd6b65252001-10-24 01:15:12 +000059
Chris Lattnerb3afb1f2002-04-04 19:24:11 +000060 void dump() const {
Anand Shuklaeea60fc2002-06-25 20:44:04 +000061 std::cerr << "BytecodeParser instance!\n";
Chris Lattnerb3afb1f2002-04-04 19:24:11 +000062 }
63
Chris Lattner00950542001-06-06 20:29:01 +000064private: // All of this data is transient across calls to ParseBytecode
Chris Lattner52e20b02003-03-19 20:54:26 +000065 struct ValueList : public User {
66 ValueList() : User(Type::TypeTy, Value::TypeVal) {
67 }
68 ~ValueList() {}
69
70 // vector compatibility methods
71 unsigned size() const { return getNumOperands(); }
72 void push_back(Value *V) { Operands.push_back(Use(V, this)); }
73 Value *back() const { return Operands.back(); }
74 void pop_back() { Operands.pop_back(); }
75 bool empty() const { return Operands.empty(); }
76
77 virtual void print(std::ostream& OS) const {
78 OS << "Bytecode Reader UseHandle!";
79 }
80 };
81
Chris Lattner05950c32001-10-13 06:47:01 +000082 Module *TheModule; // Current Module being read into...
83
Chris Lattner036b8aa2003-03-06 17:55:45 +000084 // Information about the module, extracted from the bytecode revision number.
85 unsigned char RevisionNum; // The rev # itself
86 unsigned char FirstDerivedTyID; // First variable index to use for type
87 bool HasImplicitZeroInitializer; // Is entry 0 of every slot implicity zeros?
88 bool isBigEndian, hasLongPointers;// Information about the target compiled for
Chris Lattnere3869c82003-04-16 21:16:05 +000089 bool hasInternalMarkerOnly; // Only types of linkage are intern/external
Chris Lattner036b8aa2003-03-06 17:55:45 +000090
Chris Lattner52e20b02003-03-19 20:54:26 +000091 typedef std::vector<ValueList*> ValueTable;
Chris Lattner00950542001-06-06 20:29:01 +000092 ValueTable Values, LateResolveValues;
Chris Lattner52e20b02003-03-19 20:54:26 +000093 ValueTable ModuleValues;
Chris Lattner1d670cc2001-09-07 16:37:43 +000094
Chris Lattner74734132002-08-17 22:01:27 +000095 // GlobalRefs - This maintains a mapping between <Type, Slot #>'s and forward
96 // references to global values or constants. Such values may be referenced
97 // before they are defined, and if so, the temporary object that they
98 // represent is held here.
99 //
Chris Lattner52e20b02003-03-19 20:54:26 +0000100 typedef std::map<std::pair<const Type *, unsigned>, Value*> GlobalRefsType;
Chris Lattner74734132002-08-17 22:01:27 +0000101 GlobalRefsType GlobalRefs;
Chris Lattner05950c32001-10-13 06:47:01 +0000102
Chris Lattner1d670cc2001-09-07 16:37:43 +0000103 // TypesLoaded - This vector mirrors the Values[TypeTyID] plane. It is used
104 // to deal with forward references to types.
105 //
Chris Lattner697954c2002-01-20 22:54:45 +0000106 typedef std::vector<PATypeHandle<Type> > TypeValuesListTy;
Chris Lattner1d670cc2001-09-07 16:37:43 +0000107 TypeValuesListTy ModuleTypeValues;
Chris Lattner6e5a0e42003-03-06 17:18:14 +0000108 TypeValuesListTy FunctionTypeValues;
Chris Lattner00950542001-06-06 20:29:01 +0000109
Chris Lattner52e20b02003-03-19 20:54:26 +0000110 // When the ModuleGlobalInfo section is read, we create a function object for
111 // each function in the module. When the function is loaded, this function is
112 // filled in.
Chris Lattner00950542001-06-06 20:29:01 +0000113 //
Chris Lattner52e20b02003-03-19 20:54:26 +0000114 std::vector<std::pair<Function*, unsigned> > FunctionSignatureList;
115
116 // Constant values are read in after global variables. Because of this, we
117 // must defer setting the initializers on global variables until after module
118 // level constants have been read. In the mean time, this list keeps track of
119 // what we must do.
120 //
121 std::vector<std::pair<GlobalVariable*, unsigned> > GlobalInits;
Chris Lattner00950542001-06-06 20:29:01 +0000122
123private:
Chris Lattner52e20b02003-03-19 20:54:26 +0000124 void freeTable(ValueTable &Tab) {
125 while (!Tab.empty()) {
126 delete Tab.back();
127 Tab.pop_back();
128 }
129 }
130
Chris Lattner2a7b6ba2003-03-06 17:15:19 +0000131 bool ParseModule (const uchar * Buf, const uchar *End);
Chris Lattner036b8aa2003-03-06 17:55:45 +0000132 bool ParseVersionInfo (const uchar *&Buf, const uchar *End);
Chris Lattner2a7b6ba2003-03-06 17:15:19 +0000133 bool ParseModuleGlobalInfo(const uchar *&Buf, const uchar *End);
Chris Lattner1d670cc2001-09-07 16:37:43 +0000134 bool ParseSymbolTable (const uchar *&Buf, const uchar *End, SymbolTable *);
Chris Lattner6e5a0e42003-03-06 17:18:14 +0000135 bool ParseFunction (const uchar *&Buf, const uchar *End);
Chris Lattner00950542001-06-06 20:29:01 +0000136 bool ParseBasicBlock (const uchar *&Buf, const uchar *End, BasicBlock *&);
Chris Lattner352eef72002-08-21 22:55:27 +0000137 bool ParseInstruction (const uchar *&Buf, const uchar *End, Instruction *&,
138 BasicBlock *BB /*HACK*/);
Chris Lattner00950542001-06-06 20:29:01 +0000139 bool ParseRawInst (const uchar *&Buf, const uchar *End, RawInst &);
140
Chris Lattner52e20b02003-03-19 20:54:26 +0000141 bool ParseGlobalTypes(const uchar *&Buf, const uchar *EndBuf);
Chris Lattner00950542001-06-06 20:29:01 +0000142 bool ParseConstantPool(const uchar *&Buf, const uchar *EndBuf,
Chris Lattner1d670cc2001-09-07 16:37:43 +0000143 ValueTable &Tab, TypeValuesListTy &TypeTab);
Chris Lattnere9bb2df2001-12-03 22:26:30 +0000144 bool parseConstantValue(const uchar *&Buf, const uchar *End,
145 const Type *Ty, Constant *&V);
Chris Lattner1d670cc2001-09-07 16:37:43 +0000146 bool parseTypeConstants(const uchar *&Buf, const uchar *EndBuf,
147 TypeValuesListTy &Tab, unsigned NumEntries);
148 const Type *parseTypeConstant(const uchar *&Buf, const uchar *EndBuf);
Chris Lattner00950542001-06-06 20:29:01 +0000149
150 Value *getValue(const Type *Ty, unsigned num, bool Create = true);
151 const Type *getType(unsigned ID);
Chris Lattnerbbd4b302002-10-14 03:33:02 +0000152 Constant *getConstantValue(const Type *Ty, unsigned num);
Chris Lattner00950542001-06-06 20:29:01 +0000153
Chris Lattner52e20b02003-03-19 20:54:26 +0000154 int insertValue(Value *V, ValueTable &Table); // -1 = Failure
155 void setValueTo(ValueTable &D, unsigned Slot, Value *V);
Chris Lattner00950542001-06-06 20:29:01 +0000156 bool postResolveValues(ValueTable &ValTab);
157
158 bool getTypeSlot(const Type *Ty, unsigned &Slot);
Chris Lattner1d670cc2001-09-07 16:37:43 +0000159
Chris Lattner74734132002-08-17 22:01:27 +0000160 // resolve all references to the placeholder (if any) for the given value
161 void ResolveReferencesToValue(Value *Val, unsigned Slot);
162
Vikram S. Advec668b7c2002-07-14 23:05:09 +0000163
Chris Lattner1d670cc2001-09-07 16:37:43 +0000164 // refineAbstractType - The callback method is invoked when one of the
165 // elements of TypeValues becomes more concrete...
166 //
167 virtual void refineAbstractType(const DerivedType *OldTy, const Type *NewTy);
Chris Lattner00950542001-06-06 20:29:01 +0000168};
169
170template<class SuperType>
171class PlaceholderDef : public SuperType {
172 unsigned ID;
Chris Lattner74734132002-08-17 22:01:27 +0000173 PlaceholderDef(); // DO NOT IMPLEMENT
174 void operator=(const PlaceholderDef &); // DO NOT IMPLEMENT
Chris Lattner00950542001-06-06 20:29:01 +0000175public:
176 PlaceholderDef(const Type *Ty, unsigned id) : SuperType(Ty), ID(id) {}
177 unsigned getID() { return ID; }
178};
179
180struct InstPlaceHolderHelper : public Instruction {
181 InstPlaceHolderHelper(const Type *Ty) : Instruction(Ty, UserOp1, "") {}
Chris Lattnera41f50d2001-07-07 19:24:15 +0000182 virtual const char *getOpcodeName() const { return "placeholder"; }
Chris Lattner00950542001-06-06 20:29:01 +0000183
184 virtual Instruction *clone() const { abort(); return 0; }
Chris Lattner00950542001-06-06 20:29:01 +0000185};
186
187struct BBPlaceHolderHelper : public BasicBlock {
188 BBPlaceHolderHelper(const Type *Ty) : BasicBlock() {
Chris Lattner35e309a2002-04-08 21:59:36 +0000189 assert(Ty == Type::LabelTy);
Chris Lattner00950542001-06-06 20:29:01 +0000190 }
191};
192
Vikram S. Advec668b7c2002-07-14 23:05:09 +0000193struct ConstantPlaceHolderHelper : public Constant {
194 ConstantPlaceHolderHelper(const Type *Ty)
195 : Constant(Ty) {}
196 virtual bool isNullValue() const { return false; }
197};
198
Chris Lattner74734132002-08-17 22:01:27 +0000199typedef PlaceholderDef<InstPlaceHolderHelper> ValPHolder;
Chris Lattner00950542001-06-06 20:29:01 +0000200typedef PlaceholderDef<BBPlaceHolderHelper> BBPHolder;
Vikram S. Advec668b7c2002-07-14 23:05:09 +0000201typedef PlaceholderDef<ConstantPlaceHolderHelper> ConstPHolder;
202
Chris Lattner00950542001-06-06 20:29:01 +0000203
Chris Lattner74734132002-08-17 22:01:27 +0000204static inline unsigned getValueIDNumberFromPlaceHolder(Value *Val) {
205 if (isa<Constant>(Val))
206 return ((ConstPHolder*)Val)->getID();
Vikram S. Advec668b7c2002-07-14 23:05:09 +0000207
208 // else discriminate by type
Chris Lattner74734132002-08-17 22:01:27 +0000209 switch (Val->getType()->getPrimitiveID()) {
210 case Type::LabelTyID: return ((BBPHolder*)Val)->getID();
Chris Lattner74734132002-08-17 22:01:27 +0000211 default: return ((ValPHolder*)Val)->getID();
Chris Lattner00950542001-06-06 20:29:01 +0000212 }
213}
214
215static inline bool readBlock(const uchar *&Buf, const uchar *EndBuf,
216 unsigned &Type, unsigned &Size) {
217#if DEBUG_OUTPUT
218 bool Result = read(Buf, EndBuf, Type) || read(Buf, EndBuf, Size);
Anand Shuklaeea60fc2002-06-25 20:44:04 +0000219 std::cerr << "StartLoc = " << ((unsigned)Buf & 4095)
Chris Lattner00950542001-06-06 20:29:01 +0000220 << " Type = " << Type << " Size = " << Size << endl;
221 return Result;
222#else
223 return read(Buf, EndBuf, Type) || read(Buf, EndBuf, Size);
224#endif
225}
226
Chris Lattner00950542001-06-06 20:29:01 +0000227#endif