Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 1 | //===- Reader.cpp - Code to read bytecode files -----------------------------=== |
| 2 | // |
| 3 | // This library implements the functionality defined in llvm/Bytecode/Reader.h |
| 4 | // |
| 5 | // Note that this library should be as fast as possible, reentrant, and |
| 6 | // threadsafe!! |
| 7 | // |
| 8 | // TODO: Make error message outputs be configurable depending on an option? |
| 9 | // TODO: Allow passing in an option to ignore the symbol table |
| 10 | // |
| 11 | //===------------------------------------------------------------------------=== |
| 12 | |
| 13 | #include "llvm/Bytecode/Reader.h" |
| 14 | #include "llvm/Bytecode/Format.h" |
Chris Lattner | 70cc339 | 2001-09-10 07:58:01 +0000 | [diff] [blame] | 15 | #include "llvm/GlobalVariable.h" |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 16 | #include "llvm/Module.h" |
| 17 | #include "llvm/BasicBlock.h" |
| 18 | #include "llvm/DerivedTypes.h" |
| 19 | #include "llvm/ConstPoolVals.h" |
| 20 | #include "llvm/iOther.h" |
| 21 | #include "ReaderInternals.h" |
| 22 | #include <sys/types.h> |
| 23 | #include <sys/mman.h> |
| 24 | #include <sys/stat.h> |
| 25 | #include <fcntl.h> |
| 26 | #include <unistd.h> |
| 27 | #include <algorithm> |
| 28 | |
| 29 | bool BytecodeParser::getTypeSlot(const Type *Ty, unsigned &Slot) { |
| 30 | if (Ty->isPrimitiveType()) { |
| 31 | Slot = Ty->getPrimitiveID(); |
| 32 | } else { |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 33 | // Check the method level types first... |
| 34 | TypeValuesListTy::iterator I = find(MethodTypeValues.begin(), |
| 35 | MethodTypeValues.end(), Ty); |
| 36 | if (I != MethodTypeValues.end()) { |
| 37 | Slot = FirstDerivedTyID+ModuleTypeValues.size()+ |
| 38 | (&*I - &MethodTypeValues[0]); |
| 39 | } else { |
| 40 | I = find(ModuleTypeValues.begin(), ModuleTypeValues.end(), Ty); |
| 41 | if (I == ModuleTypeValues.end()) return true; // Didn't find type! |
| 42 | Slot = FirstDerivedTyID + (&*I - &ModuleTypeValues[0]); |
| 43 | } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 44 | } |
| 45 | //cerr << "getTypeSlot '" << Ty->getName() << "' = " << Slot << endl; |
| 46 | return false; |
| 47 | } |
| 48 | |
| 49 | const Type *BytecodeParser::getType(unsigned ID) { |
| 50 | const Type *T = Type::getPrimitiveType((Type::PrimitiveID)ID); |
| 51 | if (T) return T; |
| 52 | |
| 53 | //cerr << "Looking up Type ID: " << ID << endl; |
| 54 | |
| 55 | const Value *D = getValue(Type::TypeTy, ID, false); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 56 | if (D == 0) return failure<const Type*>(0); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 57 | |
Chris Lattner | cfe26c9 | 2001-10-01 18:26:53 +0000 | [diff] [blame] | 58 | return cast<Type>(D); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 59 | } |
| 60 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 61 | bool BytecodeParser::insertValue(Value *Val, vector<ValueList> &ValueTab) { |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 62 | unsigned type; |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 63 | if (getTypeSlot(Val->getType(), type)) return failure(true); |
| 64 | assert(type != Type::TypeTyID && "Types should never be insertValue'd!"); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 65 | |
| 66 | if (ValueTab.size() <= type) |
| 67 | ValueTab.resize(type+1, ValueList()); |
| 68 | |
| 69 | //cerr << "insertValue Values[" << type << "][" << ValueTab[type].size() |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 70 | // << "] = " << Val << endl; |
| 71 | ValueTab[type].push_back(Val); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 72 | |
| 73 | return false; |
| 74 | } |
| 75 | |
| 76 | Value *BytecodeParser::getValue(const Type *Ty, unsigned oNum, bool Create) { |
| 77 | unsigned Num = oNum; |
| 78 | unsigned type; // The type plane it lives in... |
| 79 | |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 80 | if (getTypeSlot(Ty, type)) return failure<Value*>(0); // TODO: true |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 81 | |
| 82 | if (type == Type::TypeTyID) { // The 'type' plane has implicit values |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 83 | assert(Create == false); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 84 | const Type *T = Type::getPrimitiveType((Type::PrimitiveID)Num); |
| 85 | if (T) return (Value*)T; // Asked for a primitive type... |
| 86 | |
| 87 | // Otherwise, derived types need offset... |
| 88 | Num -= FirstDerivedTyID; |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 89 | |
| 90 | // Is it a module level type? |
| 91 | if (Num < ModuleTypeValues.size()) |
| 92 | return (Value*)(const Type*)ModuleTypeValues[Num]; |
| 93 | |
| 94 | // Nope, is it a method level type? |
| 95 | Num -= ModuleTypeValues.size(); |
| 96 | if (Num < MethodTypeValues.size()) |
| 97 | return (Value*)(const Type*)MethodTypeValues[Num]; |
| 98 | |
| 99 | return 0; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 100 | } |
| 101 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 102 | if (type < ModuleValues.size()) { |
| 103 | if (Num < ModuleValues[type].size()) |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 104 | return ModuleValues[type][Num]; |
| 105 | Num -= ModuleValues[type].size(); |
| 106 | } |
| 107 | |
| 108 | if (Values.size() > type && Values[type].size() > Num) |
| 109 | return Values[type][Num]; |
| 110 | |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 111 | if (!Create) return failure<Value*>(0); // Do not create a placeholder? |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 112 | |
| 113 | Value *d = 0; |
| 114 | switch (Ty->getPrimitiveID()) { |
| 115 | case Type::LabelTyID: d = new BBPHolder(Ty, oNum); break; |
| 116 | case Type::MethodTyID: |
| 117 | cerr << "Creating method pholder! : " << type << ":" << oNum << " " |
| 118 | << Ty->getName() << endl; |
| 119 | d = new MethPHolder(Ty, oNum); |
| 120 | insertValue(d, LateResolveModuleValues); |
| 121 | return d; |
| 122 | default: d = new DefPHolder(Ty, oNum); break; |
| 123 | } |
| 124 | |
| 125 | assert(d != 0 && "How did we not make something?"); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 126 | if (insertValue(d, LateResolveValues)) return failure<Value*>(0); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 127 | return d; |
| 128 | } |
| 129 | |
| 130 | bool BytecodeParser::postResolveValues(ValueTable &ValTab) { |
| 131 | bool Error = false; |
Chris Lattner | 7fc9fe3 | 2001-06-27 23:41:11 +0000 | [diff] [blame] | 132 | for (unsigned ty = 0; ty < ValTab.size(); ++ty) { |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 133 | ValueList &DL = ValTab[ty]; |
| 134 | unsigned Size; |
| 135 | while ((Size = DL.size())) { |
| 136 | unsigned IDNumber = getValueIDNumberFromPlaceHolder(DL[Size-1]); |
| 137 | |
| 138 | Value *D = DL[Size-1]; |
| 139 | DL.pop_back(); |
| 140 | |
| 141 | Value *NewDef = getValue(D->getType(), IDNumber, false); |
| 142 | if (NewDef == 0) { |
| 143 | Error = true; // Unresolved thinger |
| 144 | cerr << "Unresolvable reference found: <" << D->getType()->getName() |
| 145 | << ">:" << IDNumber << "!\n"; |
| 146 | } else { |
| 147 | // Fixup all of the uses of this placeholder def... |
| 148 | D->replaceAllUsesWith(NewDef); |
| 149 | |
| 150 | // Now that all the uses are gone, delete the placeholder... |
| 151 | // If we couldn't find a def (error case), then leak a little |
| 152 | delete D; // memory, 'cause otherwise we can't remove all uses! |
| 153 | } |
| 154 | } |
| 155 | } |
| 156 | |
| 157 | return Error; |
| 158 | } |
| 159 | |
| 160 | bool BytecodeParser::ParseBasicBlock(const uchar *&Buf, const uchar *EndBuf, |
| 161 | BasicBlock *&BB) { |
| 162 | BB = new BasicBlock(); |
| 163 | |
| 164 | while (Buf < EndBuf) { |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 165 | Instruction *Inst; |
| 166 | if (ParseInstruction(Buf, EndBuf, Inst)) { |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 167 | delete BB; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 168 | return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 169 | } |
| 170 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 171 | if (Inst == 0) { delete BB; return failure(true); } |
| 172 | if (insertValue(Inst, Values)) { delete BB; return failure(true); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 173 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 174 | BB->getInstList().push_back(Inst); |
| 175 | |
| 176 | BCR_TRACE(4, Inst); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 177 | } |
| 178 | |
| 179 | return false; |
| 180 | } |
| 181 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 182 | bool BytecodeParser::ParseSymbolTable(const uchar *&Buf, const uchar *EndBuf, |
| 183 | SymbolTable *ST) { |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 184 | while (Buf < EndBuf) { |
| 185 | // Symtab block header: [num entries][type id number] |
| 186 | unsigned NumEntries, Typ; |
| 187 | if (read_vbr(Buf, EndBuf, NumEntries) || |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 188 | read_vbr(Buf, EndBuf, Typ)) return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 189 | const Type *Ty = getType(Typ); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 190 | if (Ty == 0) return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 191 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 192 | BCR_TRACE(3, "Plane Type: '" << Ty << "' with " << NumEntries << |
| 193 | " entries\n"); |
| 194 | |
Chris Lattner | 7fc9fe3 | 2001-06-27 23:41:11 +0000 | [diff] [blame] | 195 | for (unsigned i = 0; i < NumEntries; ++i) { |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 196 | // Symtab entry: [def slot #][name] |
| 197 | unsigned slot; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 198 | if (read_vbr(Buf, EndBuf, slot)) return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 199 | string Name; |
| 200 | if (read(Buf, EndBuf, Name, false)) // Not aligned... |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 201 | return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 202 | |
| 203 | Value *D = getValue(Ty, slot, false); // Find mapping... |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 204 | if (D == 0) { |
| 205 | BCR_TRACE(3, "FAILED LOOKUP: Slot #" << slot << endl); |
| 206 | return failure(true); |
| 207 | } |
| 208 | BCR_TRACE(4, "Map: '" << Name << "' to #" << slot << ":" << D; |
Chris Lattner | 1d87bcf | 2001-10-01 20:11:19 +0000 | [diff] [blame] | 209 | if (!isa<Instruction>(D)) cerr << endl); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 210 | |
| 211 | D->setName(Name, ST); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 212 | } |
| 213 | } |
| 214 | |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 215 | if (Buf > EndBuf) return failure(true); |
| 216 | return false; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 217 | } |
| 218 | |
| 219 | |
| 220 | bool BytecodeParser::ParseMethod(const uchar *&Buf, const uchar *EndBuf, |
| 221 | Module *C) { |
| 222 | // Clear out the local values table... |
| 223 | Values.clear(); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 224 | if (MethodSignatureList.empty()) return failure(true); // Unexpected method! |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 225 | |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 226 | const PointerType *PMTy = MethodSignatureList.front().first; // PtrMeth |
| 227 | const MethodType *MTy = dyn_cast<const MethodType>(PMTy->getValueType()); |
| 228 | if (MTy == 0) return failure(true); // Not ptr to method! |
| 229 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 230 | unsigned MethSlot = MethodSignatureList.front().second; |
| 231 | MethodSignatureList.pop_front(); |
| 232 | Method *M = new Method(MTy); |
| 233 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 234 | BCR_TRACE(2, "METHOD TYPE: " << MTy << endl); |
| 235 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 236 | const MethodType::ParamTypes &Params = MTy->getParamTypes(); |
| 237 | for (MethodType::ParamTypes::const_iterator It = Params.begin(); |
Chris Lattner | 7fc9fe3 | 2001-06-27 23:41:11 +0000 | [diff] [blame] | 238 | It != Params.end(); ++It) { |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 239 | MethodArgument *MA = new MethodArgument(*It); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 240 | if (insertValue(MA, Values)) { delete M; return failure(true); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 241 | M->getArgumentList().push_back(MA); |
| 242 | } |
| 243 | |
| 244 | while (Buf < EndBuf) { |
| 245 | unsigned Type, Size; |
| 246 | const uchar *OldBuf = Buf; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 247 | if (readBlock(Buf, EndBuf, Type, Size)) { delete M; return failure(true); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 248 | |
| 249 | switch (Type) { |
| 250 | case BytecodeFormat::ConstantPool: |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 251 | BCR_TRACE(2, "BLOCK BytecodeFormat::ConstantPool: {\n"); |
| 252 | if (ParseConstantPool(Buf, Buf+Size, Values, MethodTypeValues)) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 253 | delete M; return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 254 | } |
| 255 | break; |
| 256 | |
| 257 | case BytecodeFormat::BasicBlock: { |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 258 | BCR_TRACE(2, "BLOCK BytecodeFormat::BasicBlock: {\n"); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 259 | BasicBlock *BB; |
| 260 | if (ParseBasicBlock(Buf, Buf+Size, BB) || |
| 261 | insertValue(BB, Values)) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 262 | delete M; return failure(true); // Parse error... :( |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 263 | } |
| 264 | |
| 265 | M->getBasicBlocks().push_back(BB); |
| 266 | break; |
| 267 | } |
| 268 | |
| 269 | case BytecodeFormat::SymbolTable: |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 270 | BCR_TRACE(2, "BLOCK BytecodeFormat::SymbolTable: {\n"); |
| 271 | if (ParseSymbolTable(Buf, Buf+Size, M->getSymbolTableSure())) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 272 | delete M; return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 273 | } |
| 274 | break; |
| 275 | |
| 276 | default: |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 277 | BCR_TRACE(2, "BLOCK <unknown>:ignored! {\n"); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 278 | Buf += Size; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 279 | if (OldBuf > Buf) return failure(true); // Wrap around! |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 280 | break; |
| 281 | } |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 282 | BCR_TRACE(2, "} end block\n"); |
| 283 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 284 | if (align32(Buf, EndBuf)) { |
| 285 | delete M; // Malformed bc file, read past end of block. |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 286 | return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 287 | } |
| 288 | } |
| 289 | |
| 290 | if (postResolveValues(LateResolveValues) || |
| 291 | postResolveValues(LateResolveModuleValues)) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 292 | delete M; return failure(true); // Unresolvable references! |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 293 | } |
| 294 | |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 295 | Value *MethPHolder = getValue(PMTy, MethSlot, false); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 296 | assert(MethPHolder && "Something is broken no placeholder found!"); |
Chris Lattner | 1d87bcf | 2001-10-01 20:11:19 +0000 | [diff] [blame] | 297 | assert(isa<Method>(MethPHolder) && "Not a method?"); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 298 | |
| 299 | unsigned type; // Type slot |
| 300 | assert(!getTypeSlot(MTy, type) && "How can meth type not exist?"); |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 301 | getTypeSlot(PMTy, type); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 302 | |
| 303 | C->getMethodList().push_back(M); |
| 304 | |
| 305 | // Replace placeholder with the real method pointer... |
| 306 | ModuleValues[type][MethSlot] = M; |
| 307 | |
Chris Lattner | e4d71a1 | 2001-09-14 22:03:42 +0000 | [diff] [blame] | 308 | // Clear out method level types... |
| 309 | MethodTypeValues.clear(); |
| 310 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 311 | // If anyone is using the placeholder make them use the real method instead |
| 312 | MethPHolder->replaceAllUsesWith(M); |
| 313 | |
| 314 | // We don't need the placeholder anymore! |
| 315 | delete MethPHolder; |
| 316 | |
| 317 | return false; |
| 318 | } |
| 319 | |
| 320 | bool BytecodeParser::ParseModuleGlobalInfo(const uchar *&Buf, const uchar *End, |
| 321 | Module *C) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 322 | if (!MethodSignatureList.empty()) |
| 323 | return failure(true); // Two ModuleGlobal blocks? |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 324 | |
Chris Lattner | 70cc339 | 2001-09-10 07:58:01 +0000 | [diff] [blame] | 325 | // Read global variables... |
| 326 | unsigned VarType; |
| 327 | if (read_vbr(Buf, End, VarType)) return failure(true); |
| 328 | while (VarType != Type::VoidTyID) { // List is terminated by Void |
Chris Lattner | d70684f | 2001-09-18 04:01:05 +0000 | [diff] [blame] | 329 | // VarType Fields: bit0 = isConstant, bit1 = hasInitializer, bit2+ = slot# |
| 330 | const Type *Ty = getType(VarType >> 2); |
Chris Lattner | 70cc339 | 2001-09-10 07:58:01 +0000 | [diff] [blame] | 331 | if (!Ty || !Ty->isPointerType()) { |
| 332 | cerr << "Global not pointer type! Ty = " << Ty << endl; |
| 333 | return failure(true); |
| 334 | } |
| 335 | |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 336 | const PointerType *PTy = cast<const PointerType>(Ty); |
| 337 | Ty = PTy->getValueType(); |
| 338 | |
Chris Lattner | d70684f | 2001-09-18 04:01:05 +0000 | [diff] [blame] | 339 | ConstPoolVal *Initializer = 0; |
| 340 | if (VarType & 2) { // Does it have an initalizer? |
| 341 | // Do not improvise... values must have been stored in the constant pool, |
| 342 | // which should have been read before now. |
| 343 | // |
| 344 | unsigned InitSlot; |
| 345 | if (read_vbr(Buf, End, InitSlot)) return failure(true); |
| 346 | |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 347 | Value *V = getValue(Ty, InitSlot, false); |
Chris Lattner | d70684f | 2001-09-18 04:01:05 +0000 | [diff] [blame] | 348 | if (V == 0) return failure(true); |
Chris Lattner | cfe26c9 | 2001-10-01 18:26:53 +0000 | [diff] [blame] | 349 | Initializer = cast<ConstPoolVal>(V); |
Chris Lattner | d70684f | 2001-09-18 04:01:05 +0000 | [diff] [blame] | 350 | } |
| 351 | |
Chris Lattner | 70cc339 | 2001-09-10 07:58:01 +0000 | [diff] [blame] | 352 | // Create the global variable... |
Chris Lattner | d70684f | 2001-09-18 04:01:05 +0000 | [diff] [blame] | 353 | GlobalVariable *GV = new GlobalVariable(Ty, VarType & 1, Initializer); |
Chris Lattner | 70cc339 | 2001-09-10 07:58:01 +0000 | [diff] [blame] | 354 | insertValue(GV, ModuleValues); |
| 355 | C->getGlobalList().push_back(GV); |
| 356 | |
| 357 | if (read_vbr(Buf, End, VarType)) return failure(true); |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 358 | BCR_TRACE(2, "Global Variable of type: " << PTy->getDescription() << endl); |
Chris Lattner | 70cc339 | 2001-09-10 07:58:01 +0000 | [diff] [blame] | 359 | } |
| 360 | |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 361 | // Read the method signatures for all of the methods that are coming, and |
| 362 | // create fillers in the Value tables. |
| 363 | unsigned MethSignature; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 364 | if (read_vbr(Buf, End, MethSignature)) return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 365 | while (MethSignature != Type::VoidTyID) { // List is terminated by Void |
| 366 | const Type *Ty = getType(MethSignature); |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 367 | if (!Ty || !isa<PointerType>(Ty) || |
| 368 | !isa<MethodType>(cast<PointerType>(Ty)->getValueType())) { |
| 369 | cerr << "Method not ptr to meth type! Ty = " << Ty << endl; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 370 | return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 371 | } |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 372 | |
| 373 | // We create methods by passing the underlying MethodType to create... |
| 374 | Ty = cast<PointerType>(Ty)->getValueType(); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 375 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 376 | // When the ModuleGlobalInfo section is read, we load the type of each |
| 377 | // method and the 'ModuleValues' slot that it lands in. We then load a |
| 378 | // placeholder into its slot to reserve it. When the method is loaded, this |
| 379 | // placeholder is replaced. |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 380 | |
| 381 | // Insert the placeholder... |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 382 | Value *Val = new MethPHolder(Ty, 0); |
| 383 | insertValue(Val, ModuleValues); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 384 | |
| 385 | // Figure out which entry of its typeslot it went into... |
| 386 | unsigned TypeSlot; |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 387 | if (getTypeSlot(Val->getType(), TypeSlot)) return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 388 | |
| 389 | unsigned SlotNo = ModuleValues[TypeSlot].size()-1; |
| 390 | |
| 391 | // Keep track of this information in a linked list that is emptied as |
| 392 | // methods are loaded... |
| 393 | // |
Chris Lattner | ef9c23f | 2001-10-03 14:53:21 +0000 | [diff] [blame^] | 394 | MethodSignatureList.push_back( |
| 395 | make_pair(cast<const PointerType>(Val->getType()), SlotNo)); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 396 | if (read_vbr(Buf, End, MethSignature)) return failure(true); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 397 | BCR_TRACE(2, "Method of type: " << Ty << endl); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 398 | } |
| 399 | |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 400 | if (align32(Buf, End)) return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 401 | |
| 402 | // This is for future proofing... in the future extra fields may be added that |
| 403 | // we don't understand, so we transparently ignore them. |
| 404 | // |
| 405 | Buf = End; |
| 406 | return false; |
| 407 | } |
| 408 | |
| 409 | bool BytecodeParser::ParseModule(const uchar *Buf, const uchar *EndBuf, |
| 410 | Module *&C) { |
| 411 | |
| 412 | unsigned Type, Size; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 413 | if (readBlock(Buf, EndBuf, Type, Size)) return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 414 | if (Type != BytecodeFormat::Module || Buf+Size != EndBuf) |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 415 | return failure(true); // Hrm, not a class? |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 416 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 417 | BCR_TRACE(0, "BLOCK BytecodeFormat::Module: {\n"); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 418 | MethodSignatureList.clear(); // Just in case... |
| 419 | |
| 420 | // Read into instance variables... |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 421 | if (read_vbr(Buf, EndBuf, FirstDerivedTyID)) return failure(true); |
| 422 | if (align32(Buf, EndBuf)) return failure(true); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 423 | BCR_TRACE(1, "FirstDerivedTyID = " << FirstDerivedTyID << "\n"); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 424 | |
| 425 | C = new Module(); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 426 | while (Buf < EndBuf) { |
| 427 | const uchar *OldBuf = Buf; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 428 | if (readBlock(Buf, EndBuf, Type, Size)) { delete C; return failure(true); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 429 | switch (Type) { |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 430 | case BytecodeFormat::ConstantPool: |
| 431 | BCR_TRACE(1, "BLOCK BytecodeFormat::ConstantPool: {\n"); |
| 432 | if (ParseConstantPool(Buf, Buf+Size, ModuleValues, ModuleTypeValues)) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 433 | delete C; return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 434 | } |
| 435 | break; |
| 436 | |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 437 | case BytecodeFormat::ModuleGlobalInfo: |
| 438 | BCR_TRACE(1, "BLOCK BytecodeFormat::ModuleGlobalInfo: {\n"); |
| 439 | |
| 440 | if (ParseModuleGlobalInfo(Buf, Buf+Size, C)) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 441 | delete C; return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 442 | } |
| 443 | break; |
| 444 | |
| 445 | case BytecodeFormat::Method: { |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 446 | BCR_TRACE(1, "BLOCK BytecodeFormat::Method: {\n"); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 447 | if (ParseMethod(Buf, Buf+Size, C)) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 448 | delete C; return failure(true); // Error parsing method |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 449 | } |
| 450 | break; |
| 451 | } |
| 452 | |
| 453 | case BytecodeFormat::SymbolTable: |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 454 | BCR_TRACE(1, "BLOCK BytecodeFormat::SymbolTable: {\n"); |
| 455 | if (ParseSymbolTable(Buf, Buf+Size, C->getSymbolTableSure())) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 456 | delete C; return failure(true); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 457 | } |
| 458 | break; |
| 459 | |
| 460 | default: |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 461 | cerr << " Unknown class block: " << Type << endl; |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 462 | Buf += Size; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 463 | if (OldBuf > Buf) return failure(true); // Wrap around! |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 464 | break; |
| 465 | } |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 466 | BCR_TRACE(1, "} end block\n"); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 467 | if (align32(Buf, EndBuf)) { delete C; return failure(true); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 468 | } |
| 469 | |
| 470 | if (!MethodSignatureList.empty()) // Expected more methods! |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 471 | return failure(true); |
Chris Lattner | 1d670cc | 2001-09-07 16:37:43 +0000 | [diff] [blame] | 472 | |
| 473 | BCR_TRACE(0, "} end block\n\n"); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 474 | return false; |
| 475 | } |
| 476 | |
| 477 | Module *BytecodeParser::ParseBytecode(const uchar *Buf, const uchar *EndBuf) { |
| 478 | LateResolveValues.clear(); |
| 479 | unsigned Sig; |
| 480 | // Read and check signature... |
| 481 | if (read(Buf, EndBuf, Sig) || |
| 482 | Sig != ('l' | ('l' << 8) | ('v' << 16) | 'm' << 24)) |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 483 | return failure<Module*>(0); // Invalid signature! |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 484 | |
| 485 | Module *Result; |
| 486 | if (ParseModule(Buf, EndBuf, Result)) return 0; |
| 487 | return Result; |
| 488 | } |
| 489 | |
| 490 | |
| 491 | Module *ParseBytecodeBuffer(const uchar *Buffer, unsigned Length) { |
| 492 | BytecodeParser Parser; |
| 493 | return Parser.ParseBytecode(Buffer, Buffer+Length); |
| 494 | } |
| 495 | |
| 496 | // Parse and return a class file... |
| 497 | // |
| 498 | Module *ParseBytecodeFile(const string &Filename) { |
| 499 | struct stat StatBuf; |
| 500 | Module *Result = 0; |
| 501 | |
| 502 | if (Filename != string("-")) { // Read from a file... |
Chris Lattner | b49ff5c | 2001-07-23 18:51:23 +0000 | [diff] [blame] | 503 | int FD = open(Filename.c_str(), O_RDONLY); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 504 | if (FD == -1) return failure<Module*>(0); |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 505 | |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 506 | if (fstat(FD, &StatBuf) == -1) { close(FD); return failure<Module*>(0); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 507 | |
| 508 | int Length = StatBuf.st_size; |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 509 | if (Length == 0) { close(FD); return failure<Module*>(0); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 510 | uchar *Buffer = (uchar*)mmap(0, Length, PROT_READ, |
| 511 | MAP_PRIVATE, FD, 0); |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 512 | if (Buffer == (uchar*)-1) { close(FD); return failure<Module*>(0); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 513 | |
| 514 | BytecodeParser Parser; |
| 515 | Result = Parser.ParseBytecode(Buffer, Buffer+Length); |
| 516 | |
| 517 | munmap((char*)Buffer, Length); |
| 518 | close(FD); |
| 519 | } else { // Read from stdin |
| 520 | size_t FileSize = 0; |
| 521 | int BlockSize; |
| 522 | uchar Buffer[4096], *FileData = 0; |
| 523 | while ((BlockSize = read(0, Buffer, 4))) { |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 524 | if (BlockSize == -1) { free(FileData); return failure<Module*>(0); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 525 | |
| 526 | FileData = (uchar*)realloc(FileData, FileSize+BlockSize); |
| 527 | memcpy(FileData+FileSize, Buffer, BlockSize); |
| 528 | FileSize += BlockSize; |
| 529 | } |
| 530 | |
Chris Lattner | 3d3f289 | 2001-07-28 17:50:18 +0000 | [diff] [blame] | 531 | if (FileSize == 0) { free(FileData); return failure<Module*>(0); } |
Chris Lattner | 0095054 | 2001-06-06 20:29:01 +0000 | [diff] [blame] | 532 | |
| 533 | #define ALIGN_PTRS 1 |
| 534 | #if ALIGN_PTRS |
| 535 | uchar *Buf = (uchar*)mmap(0, FileSize, PROT_READ|PROT_WRITE, |
| 536 | MAP_PRIVATE|MAP_ANONYMOUS, -1, 0); |
| 537 | assert((Buf != (uchar*)-1) && "mmap returned error!"); |
| 538 | free(FileData); |
| 539 | memcpy(Buf, FileData, FileSize); |
| 540 | #else |
| 541 | uchar *Buf = FileData; |
| 542 | #endif |
| 543 | |
| 544 | BytecodeParser Parser; |
| 545 | Result = Parser.ParseBytecode(Buf, Buf+FileSize); |
| 546 | |
| 547 | #if ALIGN_PTRS |
| 548 | munmap((char*)Buf, FileSize); // Free mmap'd data area |
| 549 | #else |
| 550 | free(FileData); // Free realloc'd block of memory |
| 551 | #endif |
| 552 | } |
| 553 | |
| 554 | return Result; |
| 555 | } |