blob: f5ef3d90b612ad5b2ec4c38971d5609d2f7f3aea [file] [log] [blame]
//===-- ReaderInternals.h - Definitions internal to the reader --*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file was developed by the LLVM research group and is distributed under
// the University of Illinois Open Source License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
//  This header file defines various stuff that is used by the bytecode reader.
//
//===----------------------------------------------------------------------===//
13
14#ifndef READER_INTERNALS_H
15#define READER_INTERNALS_H
16
Chris Lattner3446ae82004-01-10 19:00:15 +000017#include "ReaderPrimitives.h"
Chris Lattner8dc6ba92003-11-14 06:38:46 +000018#include "llvm/Constants.h"
Chris Lattner7061dc52001-12-03 18:02:31 +000019#include "llvm/DerivedTypes.h"
Chris Lattner74734132002-08-17 22:01:27 +000020#include "llvm/Function.h"
Misha Brukman12c29d12003-09-22 23:38:23 +000021#include "llvm/ModuleProvider.h"
Chris Lattner00950542001-06-06 20:29:01 +000022#include <utility>
Chris Lattner74734132002-08-17 22:01:27 +000023#include <map>
Chris Lattner00950542001-06-06 20:29:01 +000024
Brian Gaeked0fde302003-11-11 22:41:34 +000025namespace llvm {
26
Chris Lattner1d670cc2001-09-07 16:37:43 +000027// Enable to trace to figure out what the heck is going on when parsing fails
Chris Lattnerd256ed82003-09-04 23:47:07 +000028//#define TRACE_LEVEL 10
Alkis Evlogimenos60048b82003-10-30 18:33:58 +000029//#define DEBUG_OUTPUT
Chris Lattner1d670cc2001-09-07 16:37:43 +000030
// BCR_TRACE(n, X) - Bytecode reader tracing.
//
// When TRACE_LEVEL is defined to a non-zero value, streams X to std::cerr,
// indented by two spaces per nesting level n, provided n < TRACE_LEVEL.
// Otherwise the macro expands to nothing.
//
// The enabled form is written as "if (!cond) {} else ..." on purpose: the
// macro's own 'if' already owns an 'else', so an invocation used as the body
// of a caller's if/else cannot capture the caller's 'else' branch.
#if TRACE_LEVEL    // ByteCodeReading_TRACEr
#define BCR_TRACE(n, X) \
    if ((n) >= TRACE_LEVEL) {} else std::cerr << std::string((n)*2, ' ') << X
#else
#define BCR_TRACE(n, X)
#endif
37
/// LazyFunctionInfo - A pair of byte pointers delimiting a region of a buffer.
/// Both pointers default to null, so the struct is default-constructible
/// (it is used as the mapped type of a std::map in BytecodeParser).
struct LazyFunctionInfo {
  const unsigned char *Buf;     // First pointer of the pair.
  const unsigned char *EndBuf;  // Second pointer of the pair.

  LazyFunctionInfo(const unsigned char *Begin = 0,
                   const unsigned char *End = 0)
    : Buf(Begin), EndBuf(End) {
  }
};
43
Chris Lattner00413e32003-10-04 20:14:59 +000044class BytecodeParser : public ModuleProvider {
Chris Lattner74734132002-08-17 22:01:27 +000045 BytecodeParser(const BytecodeParser &); // DO NOT IMPLEMENT
46 void operator=(const BytecodeParser &); // DO NOT IMPLEMENT
Chris Lattner00950542001-06-06 20:29:01 +000047public:
Chris Lattner89e02532004-01-18 21:08:15 +000048 BytecodeParser() {}
Misha Brukman12c29d12003-09-22 23:38:23 +000049
Chris Lattner52e20b02003-03-19 20:54:26 +000050 ~BytecodeParser() {
Chris Lattnera2602f32003-05-22 18:26:48 +000051 freeState();
52 }
53 void freeState() {
Chris Lattner52e20b02003-03-19 20:54:26 +000054 freeTable(Values);
Chris Lattner52e20b02003-03-19 20:54:26 +000055 freeTable(ModuleValues);
56 }
Chris Lattner00950542001-06-06 20:29:01 +000057
Misha Brukman12c29d12003-09-22 23:38:23 +000058 Module* releaseModule() {
59 // Since we're losing control of this Module, we must hand it back complete
Chris Lattner927b1852003-10-09 20:22:47 +000060 Module *M = ModuleProvider::releaseModule();
Misha Brukman12c29d12003-09-22 23:38:23 +000061 freeState();
Chris Lattner927b1852003-10-09 20:22:47 +000062 return M;
Misha Brukman12c29d12003-09-22 23:38:23 +000063 }
Chris Lattnerd6b65252001-10-24 01:15:12 +000064
Misha Brukman12c29d12003-09-22 23:38:23 +000065 void ParseBytecode(const unsigned char *Buf, unsigned Length,
66 const std::string &ModuleID);
Chris Lattnerd6b65252001-10-24 01:15:12 +000067
Chris Lattnerb3afb1f2002-04-04 19:24:11 +000068 void dump() const {
Anand Shuklaeea60fc2002-06-25 20:44:04 +000069 std::cerr << "BytecodeParser instance!\n";
Chris Lattnerb3afb1f2002-04-04 19:24:11 +000070 }
71
Chris Lattner6e448022003-10-08 21:51:46 +000072private:
Chris Lattner52e20b02003-03-19 20:54:26 +000073 struct ValueList : public User {
Chris Lattner6e448022003-10-08 21:51:46 +000074 ValueList() : User(Type::TypeTy, Value::TypeVal) {}
Chris Lattner52e20b02003-03-19 20:54:26 +000075
76 // vector compatibility methods
77 unsigned size() const { return getNumOperands(); }
78 void push_back(Value *V) { Operands.push_back(Use(V, this)); }
79 Value *back() const { return Operands.back(); }
80 void pop_back() { Operands.pop_back(); }
81 bool empty() const { return Operands.empty(); }
82
83 virtual void print(std::ostream& OS) const {
84 OS << "Bytecode Reader UseHandle!";
85 }
86 };
87
Chris Lattner036b8aa2003-03-06 17:55:45 +000088 // Information about the module, extracted from the bytecode revision number.
89 unsigned char RevisionNum; // The rev # itself
Chris Lattnercb7e2e22003-10-18 05:54:18 +000090 bool hasExtendedLinkageSpecs; // Supports more than 4 linkage types
91 bool hasOldStyleVarargs; // Has old version of varargs intrinsics?
92 bool hasVarArgCallPadding; // Bytecode has extra padding in vararg call
93
94 bool usesOldStyleVarargs; // Does this module USE old style varargs?
Chris Lattner036b8aa2003-03-06 17:55:45 +000095
Chris Lattner80b97342004-01-17 23:25:43 +000096 // Flags to distinguish LLVM 1.0 & 1.1 bytecode formats (revision #0)
97
98 // Revision #0 had an explicit alignment of data only for the ModuleGlobalInfo
99 // block. This was fixed to be like all other blocks in 1.2
Chris Lattner44d0eeb2004-01-15 17:55:01 +0000100 bool hasInconsistentModuleGlobalInfo;
101
Chris Lattner80b97342004-01-17 23:25:43 +0000102 // Revision #0 also explicitly encoded zero values for primitive types like
103 // int/sbyte/etc.
104 bool hasExplicitPrimitiveZeros;
105
Chris Lattner52e20b02003-03-19 20:54:26 +0000106 typedef std::vector<ValueList*> ValueTable;
Chris Lattner8eb10ce2003-10-09 06:05:40 +0000107 ValueTable Values;
Chris Lattner52e20b02003-03-19 20:54:26 +0000108 ValueTable ModuleValues;
Chris Lattner8eb10ce2003-10-09 06:05:40 +0000109 std::map<std::pair<unsigned,unsigned>, Value*> ForwardReferences;
Chris Lattner1d670cc2001-09-07 16:37:43 +0000110
Chris Lattner89e02532004-01-18 21:08:15 +0000111 /// CompactionTable - If a compaction table is active in the current function,
112 /// this is the mapping that it contains.
113 std::vector<std::vector<Value*> > CompactionTable;
114
Chris Lattner4ee8ef22003-10-08 22:52:54 +0000115 std::vector<BasicBlock*> ParsedBasicBlocks;
116
Chris Lattner29b789b2003-11-19 17:27:18 +0000117 // ConstantFwdRefs - This maintains a mapping between <Type, Slot #>'s and
118 // forward references to constants. Such values may be referenced before they
119 // are defined, and if so, the temporary object that they represent is held
120 // here.
Chris Lattner74734132002-08-17 22:01:27 +0000121 //
Chris Lattner29b789b2003-11-19 17:27:18 +0000122 typedef std::map<std::pair<const Type*,unsigned>, Constant*> ConstantRefsType;
123 ConstantRefsType ConstantFwdRefs;
Chris Lattner05950c32001-10-13 06:47:01 +0000124
Chris Lattner1d670cc2001-09-07 16:37:43 +0000125 // TypesLoaded - This vector mirrors the Values[TypeTyID] plane. It is used
126 // to deal with forward references to types.
127 //
Chris Lattnerc7b6f032003-10-02 20:26:18 +0000128 typedef std::vector<PATypeHolder> TypeValuesListTy;
Chris Lattner1d670cc2001-09-07 16:37:43 +0000129 TypeValuesListTy ModuleTypeValues;
Chris Lattner6e5a0e42003-03-06 17:18:14 +0000130 TypeValuesListTy FunctionTypeValues;
Chris Lattner00950542001-06-06 20:29:01 +0000131
Chris Lattner52e20b02003-03-19 20:54:26 +0000132 // When the ModuleGlobalInfo section is read, we create a function object for
133 // each function in the module. When the function is loaded, this function is
134 // filled in.
Chris Lattner00950542001-06-06 20:29:01 +0000135 //
Chris Lattner29b789b2003-11-19 17:27:18 +0000136 std::vector<Function*> FunctionSignatureList;
Chris Lattner52e20b02003-03-19 20:54:26 +0000137
138 // Constant values are read in after global variables. Because of this, we
139 // must defer setting the initializers on global variables until after module
140 // level constants have been read. In the mean time, this list keeps track of
141 // what we must do.
142 //
143 std::vector<std::pair<GlobalVariable*, unsigned> > GlobalInits;
Chris Lattner00950542001-06-06 20:29:01 +0000144
Misha Brukman12c29d12003-09-22 23:38:23 +0000145 // For lazy reading-in of functions, we need to save away several pieces of
146 // information about each function: its begin and end pointer in the buffer
147 // and its FunctionSlot.
148 //
Chris Lattner29b789b2003-11-19 17:27:18 +0000149 std::map<Function*, LazyFunctionInfo> LazyFunctionLoadMap;
Misha Brukman12c29d12003-09-22 23:38:23 +0000150
Chris Lattner00950542001-06-06 20:29:01 +0000151private:
Chris Lattner52e20b02003-03-19 20:54:26 +0000152 void freeTable(ValueTable &Tab) {
153 while (!Tab.empty()) {
154 delete Tab.back();
155 Tab.pop_back();
156 }
157 }
158
Chris Lattner89e02532004-01-18 21:08:15 +0000159 /// getGlobalTableType - This is just like getType, but when a compaction
160 /// table is in use, it is ignored. Also, no forward references or other
161 /// fancy features are supported.
162 const Type *getGlobalTableType(unsigned Slot) {
163 if (Slot < Type::FirstDerivedTyID) {
164 const Type *Ty = Type::getPrimitiveType((Type::PrimitiveID)Slot);
165 assert(Ty && "Not a primitive type ID?");
166 return Ty;
167 }
168 Slot -= Type::FirstDerivedTyID;
169 if (Slot >= ModuleTypeValues.size())
170 throw std::string("Illegal compaction table type reference!");
171 return ModuleTypeValues[Slot];
172 }
173
174 unsigned getGlobalTableTypeSlot(const Type *Ty) {
175 if (Ty->isPrimitiveType())
176 return Ty->getPrimitiveID();
177 TypeValuesListTy::iterator I = find(ModuleTypeValues.begin(),
178 ModuleTypeValues.end(), Ty);
179 if (I == ModuleTypeValues.end())
180 throw std::string("Didn't find type in ModuleTypeValues.");
181 return Type::FirstDerivedTyID + (&*I - &ModuleTypeValues[0]);
182 }
183
184 /// getGlobalTableValue - This is just like getValue, but when a compaction
185 /// table is in use, it is ignored. Also, no forward references or other
186 /// fancy features are supported.
187 Value *getGlobalTableValue(const Type *Ty, unsigned SlotNo) {
188 // FIXME: getTypeSlot is inefficient!
189 unsigned TyID = getGlobalTableTypeSlot(Ty);
190
191 if (TyID != Type::LabelTyID) {
192 if (SlotNo == 0)
193 return Constant::getNullValue(Ty);
194 --SlotNo;
195 }
196
197 if (TyID >= ModuleValues.size() || ModuleValues[TyID] == 0 ||
198 SlotNo >= ModuleValues[TyID]->getNumOperands()) {
199 std::cerr << TyID << ", " << SlotNo << ": " << ModuleValues.size() << ", "
200 << (void*)ModuleValues[TyID] << ", "
201 << ModuleValues[TyID]->getNumOperands() << "\n";
202 throw std::string("Corrupt compaction table entry!");
203 }
204 return ModuleValues[TyID]->getOperand(SlotNo);
205 }
206
Misha Brukman12c29d12003-09-22 23:38:23 +0000207public:
208 void ParseModule(const unsigned char * Buf, const unsigned char *End);
209 void materializeFunction(Function *F);
210
211private:
212 void ParseVersionInfo (const unsigned char *&Buf, const unsigned char *End);
213 void ParseModuleGlobalInfo(const unsigned char *&Buf, const unsigned char *E);
214 void ParseSymbolTable(const unsigned char *&Buf, const unsigned char *End,
Chris Lattner4ee8ef22003-10-08 22:52:54 +0000215 SymbolTable *, Function *CurrentFunction);
Misha Brukman12c29d12003-09-22 23:38:23 +0000216 void ParseFunction(const unsigned char *&Buf, const unsigned char *End);
Chris Lattner89e02532004-01-18 21:08:15 +0000217 void ParseCompactionTable(const unsigned char *&Buf,const unsigned char *End);
Misha Brukman12c29d12003-09-22 23:38:23 +0000218 void ParseGlobalTypes(const unsigned char *&Buf, const unsigned char *EndBuf);
219
Chris Lattner4ee8ef22003-10-08 22:52:54 +0000220 BasicBlock *ParseBasicBlock(const unsigned char *&Buf,
221 const unsigned char *End,
222 unsigned BlockNo);
Chris Lattner8d1dbd22003-12-01 07:05:31 +0000223 unsigned ParseInstructionList(Function *F, const unsigned char *&Buf,
224 const unsigned char *EndBuf);
225
Chris Lattnercb7e2e22003-10-18 05:54:18 +0000226 void ParseInstruction(const unsigned char *&Buf, const unsigned char *End,
227 std::vector<unsigned> &Args, BasicBlock *BB);
Chris Lattner00950542001-06-06 20:29:01 +0000228
Misha Brukman12c29d12003-09-22 23:38:23 +0000229 void ParseConstantPool(const unsigned char *&Buf, const unsigned char *EndBuf,
230 ValueTable &Tab, TypeValuesListTy &TypeTab);
Chris Lattner9e460f22003-10-04 20:00:03 +0000231 Constant *parseConstantValue(const unsigned char *&Buf,
232 const unsigned char *End,
Chris Lattner29b789b2003-11-19 17:27:18 +0000233 unsigned TypeID);
Misha Brukman12c29d12003-09-22 23:38:23 +0000234 void parseTypeConstants(const unsigned char *&Buf,
Chris Lattner12e64652003-05-22 18:08:30 +0000235 const unsigned char *EndBuf,
Misha Brukman12c29d12003-09-22 23:38:23 +0000236 TypeValuesListTy &Tab, unsigned NumEntries);
Chris Lattner12e64652003-05-22 18:08:30 +0000237 const Type *parseTypeConstant(const unsigned char *&Buf,
238 const unsigned char *EndBuf);
Chris Lattner9e893e82004-01-14 23:35:21 +0000239 void parseStringConstants(const unsigned char *&Buf,
240 const unsigned char *EndBuf,
241 unsigned NumEntries, ValueTable &Tab);
Chris Lattner00950542001-06-06 20:29:01 +0000242
Chris Lattner36392bc2003-10-08 21:18:57 +0000243 Value *getValue(unsigned TypeID, unsigned num, bool Create = true);
Chris Lattner00950542001-06-06 20:29:01 +0000244 const Type *getType(unsigned ID);
Chris Lattner4ee8ef22003-10-08 22:52:54 +0000245 BasicBlock *getBasicBlock(unsigned ID);
Chris Lattner1c3673b2003-11-19 06:01:12 +0000246 Constant *getConstantValue(unsigned TypeID, unsigned num);
247 Constant *getConstantValue(const Type *Ty, unsigned num) {
248 return getConstantValue(getTypeSlot(Ty), num);
249 }
Chris Lattner00950542001-06-06 20:29:01 +0000250
Chris Lattnerf0d92732003-10-13 14:34:59 +0000251 unsigned insertValue(Value *V, unsigned Type, ValueTable &Table);
Chris Lattner00950542001-06-06 20:29:01 +0000252
Chris Lattner9e460f22003-10-04 20:00:03 +0000253 unsigned getTypeSlot(const Type *Ty);
Chris Lattner1d670cc2001-09-07 16:37:43 +0000254
Chris Lattner29b789b2003-11-19 17:27:18 +0000255 // resolve all references to the placeholder (if any) for the given constant
256 void ResolveReferencesToConstant(Constant *C, unsigned Slot);
Chris Lattner00950542001-06-06 20:29:01 +0000257};
258
259template<class SuperType>
260class PlaceholderDef : public SuperType {
261 unsigned ID;
Chris Lattner74734132002-08-17 22:01:27 +0000262 PlaceholderDef(); // DO NOT IMPLEMENT
263 void operator=(const PlaceholderDef &); // DO NOT IMPLEMENT
Chris Lattner00950542001-06-06 20:29:01 +0000264public:
265 PlaceholderDef(const Type *Ty, unsigned id) : SuperType(Ty), ID(id) {}
266 unsigned getID() { return ID; }
267};
268
Chris Lattner8dc6ba92003-11-14 06:38:46 +0000269struct ConstantPlaceHolderHelper : public ConstantExpr {
Chris Lattnerdb9546e2003-11-14 16:34:25 +0000270 ConstantPlaceHolderHelper(const Type *Ty)
271 : ConstantExpr(Instruction::UserOp1, Constant::getNullValue(Ty), Ty) {}
Vikram S. Advec668b7c2002-07-14 23:05:09 +0000272};
273
Vikram S. Advec668b7c2002-07-14 23:05:09 +0000274typedef PlaceholderDef<ConstantPlaceHolderHelper> ConstPHolder;
275
Misha Brukman12c29d12003-09-22 23:38:23 +0000276static inline void readBlock(const unsigned char *&Buf,
Chris Lattner12e64652003-05-22 18:08:30 +0000277 const unsigned char *EndBuf,
Misha Brukman12c29d12003-09-22 23:38:23 +0000278 unsigned &Type, unsigned &Size) {
Chris Lattner7969dc22004-01-15 06:13:09 +0000279 Type = read(Buf, EndBuf);
280 Size = read(Buf, EndBuf);
Chris Lattner00950542001-06-06 20:29:01 +0000281}
282
Brian Gaeked0fde302003-11-11 22:41:34 +0000283} // End llvm namespace
284
Chris Lattner00950542001-06-06 20:29:01 +0000285#endif