Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 1 | //===-- ProgramInfo.cpp - Compute and cache info about a program ----------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file was developed by the LLVM research group and is distributed under |
| 6 | // the University of Illinois Open Source License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements the ProgramInfo and related classes, by sorting through |
| 11 | // the loaded Module. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #include "llvm/Debugger/ProgramInfo.h" |
| 16 | #include "llvm/Constants.h" |
| 17 | #include "llvm/DerivedTypes.h" |
| 18 | #include "llvm/Intrinsics.h" |
Chris Lattner | 4ab78e0 | 2004-07-29 17:15:38 +0000 | [diff] [blame] | 19 | #include "llvm/Instructions.h" |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 20 | #include "llvm/Module.h" |
| 21 | #include "llvm/Debugger/SourceFile.h" |
| 22 | #include "llvm/Debugger/SourceLanguage.h" |
Reid Spencer | 551ccae | 2004-09-01 22:55:40 +0000 | [diff] [blame] | 23 | #include "llvm/Support/FileUtilities.h" |
| 24 | #include "llvm/Support/SlowOperationInformer.h" |
| 25 | #include "llvm/ADT/STLExtras.h" |
Reid Spencer | 954da37 | 2004-07-04 12:19:56 +0000 | [diff] [blame] | 26 | #include <iostream> |
| 27 | |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 28 | using namespace llvm; |
| 29 | |
| 30 | /// getGlobalVariablesUsing - Return all of the global variables which have the |
| 31 | /// specified value in their initializer somewhere. |
| 32 | static void getGlobalVariablesUsing(Value *V, |
| 33 | std::vector<GlobalVariable*> &Found) { |
| 34 | for (Value::use_iterator I = V->use_begin(), E = V->use_end(); I != E; ++I) { |
| 35 | if (GlobalVariable *GV = dyn_cast<GlobalVariable>(*I)) |
| 36 | Found.push_back(GV); |
| 37 | else if (Constant *C = dyn_cast<Constant>(*I)) |
| 38 | getGlobalVariablesUsing(C, Found); |
| 39 | } |
| 40 | } |
| 41 | |
| 42 | /// getStringValue - Turn an LLVM constant pointer that eventually points to a |
| 43 | /// global into a string value. Return an empty string if we can't do it. |
| 44 | /// |
| 45 | static std::string getStringValue(Value *V, unsigned Offset = 0) { |
| 46 | if (GlobalVariable *GV = dyn_cast<GlobalVariable>(V)) { |
| 47 | if (GV->hasInitializer() && isa<ConstantArray>(GV->getInitializer())) { |
| 48 | ConstantArray *Init = cast<ConstantArray>(GV->getInitializer()); |
Chris Lattner | e3f84f5 | 2004-01-14 17:07:46 +0000 | [diff] [blame] | 49 | if (Init->isString()) { |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 50 | std::string Result = Init->getAsString(); |
| 51 | if (Offset < Result.size()) { |
| 52 | // If we are pointing INTO The string, erase the beginning... |
| 53 | Result.erase(Result.begin(), Result.begin()+Offset); |
| 54 | |
| 55 | // Take off the null terminator, and any string fragments after it. |
| 56 | std::string::size_type NullPos = Result.find_first_of((char)0); |
| 57 | if (NullPos != std::string::npos) |
| 58 | Result.erase(Result.begin()+NullPos, Result.end()); |
| 59 | return Result; |
| 60 | } |
| 61 | } |
| 62 | } |
| 63 | } else if (Constant *C = dyn_cast<Constant>(V)) { |
Reid Spencer | 518310c | 2004-07-18 00:44:37 +0000 | [diff] [blame] | 64 | if (GlobalValue *GV = dyn_cast<GlobalValue>(C)) |
| 65 | return getStringValue(GV, Offset); |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 66 | else if (ConstantExpr *CE = dyn_cast<ConstantExpr>(C)) { |
| 67 | if (CE->getOpcode() == Instruction::GetElementPtr) { |
| 68 | // Turn a gep into the specified offset. |
| 69 | if (CE->getNumOperands() == 3 && |
| 70 | cast<Constant>(CE->getOperand(1))->isNullValue() && |
| 71 | isa<ConstantInt>(CE->getOperand(2))) { |
| 72 | return getStringValue(CE->getOperand(0), |
| 73 | Offset+cast<ConstantInt>(CE->getOperand(2))->getRawValue()); |
| 74 | } |
| 75 | } |
| 76 | } |
| 77 | } |
| 78 | return ""; |
| 79 | } |
| 80 | |
| 81 | /// getNextStopPoint - Follow the def-use chains of the specified LLVM value, |
| 82 | /// traversing the use chains until we get to a stoppoint. When we do, return |
| 83 | /// the source location of the stoppoint. If we don't find a stoppoint, return |
| 84 | /// null. |
| 85 | static const GlobalVariable *getNextStopPoint(const Value *V, unsigned &LineNo, |
| 86 | unsigned &ColNo) { |
| 87 | // The use-def chains can fork. As such, we pick the lowest numbered one we |
| 88 | // find. |
| 89 | const GlobalVariable *LastDesc = 0; |
| 90 | unsigned LastLineNo = ~0; |
| 91 | unsigned LastColNo = ~0; |
| 92 | |
| 93 | for (Value::use_const_iterator UI = V->use_begin(), E = V->use_end(); |
| 94 | UI != E; ++UI) { |
| 95 | bool ShouldRecurse = true; |
| 96 | if (cast<Instruction>(*UI)->getOpcode() == Instruction::PHI) { |
| 97 | // Infinite loops == bad, ignore PHI nodes. |
| 98 | ShouldRecurse = false; |
| 99 | } else if (const CallInst *CI = dyn_cast<CallInst>(*UI)) { |
| 100 | // If we found a stop point, check to see if it is earlier than what we |
| 101 | // already have. If so, remember it. |
| 102 | if (const Function *F = CI->getCalledFunction()) |
| 103 | if (F->getIntrinsicID() == Intrinsic::dbg_stoppoint) { |
| 104 | unsigned CurLineNo = ~0, CurColNo = ~0; |
| 105 | const GlobalVariable *CurDesc = 0; |
| 106 | if (const ConstantInt *C = dyn_cast<ConstantInt>(CI->getOperand(2))) |
| 107 | CurLineNo = C->getRawValue(); |
| 108 | if (const ConstantInt *C = dyn_cast<ConstantInt>(CI->getOperand(3))) |
| 109 | CurColNo = C->getRawValue(); |
| 110 | const Value *Op = CI->getOperand(4); |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 111 | |
| 112 | if ((CurDesc = dyn_cast<GlobalVariable>(Op)) && |
| 113 | (LineNo < LastLineNo || |
| 114 | (LineNo == LastLineNo && ColNo < LastColNo))) { |
| 115 | LastDesc = CurDesc; |
| 116 | LastLineNo = CurLineNo; |
| 117 | LastColNo = CurColNo; |
| 118 | } |
| 119 | ShouldRecurse = false; |
| 120 | } |
| 121 | |
| 122 | } |
| 123 | |
| 124 | // If this is not a phi node or a stopping point, recursively scan the users |
| 125 | // of this instruction to skip over region.begin's and the like. |
| 126 | if (ShouldRecurse) { |
| 127 | unsigned CurLineNo, CurColNo; |
| 128 | if (const GlobalVariable *GV = getNextStopPoint(*UI, CurLineNo,CurColNo)){ |
| 129 | if (LineNo < LastLineNo || (LineNo == LastLineNo && ColNo < LastColNo)){ |
| 130 | LastDesc = GV; |
| 131 | LastLineNo = CurLineNo; |
| 132 | LastColNo = CurColNo; |
| 133 | } |
| 134 | } |
| 135 | } |
| 136 | } |
| 137 | |
| 138 | if (LastDesc) { |
| 139 | LineNo = LastLineNo != ~0U ? LastLineNo : 0; |
| 140 | ColNo = LastColNo != ~0U ? LastColNo : 0; |
| 141 | } |
| 142 | return LastDesc; |
| 143 | } |
| 144 | |
| 145 | |
| 146 | //===----------------------------------------------------------------------===// |
| 147 | // SourceFileInfo implementation |
| 148 | // |
| 149 | |
| 150 | SourceFileInfo::SourceFileInfo(const GlobalVariable *Desc, |
| 151 | const SourceLanguage &Lang) |
| 152 | : Language(&Lang), Descriptor(Desc) { |
| 153 | Version = 0; |
| 154 | SourceText = 0; |
| 155 | |
| 156 | if (Desc && Desc->hasInitializer()) |
| 157 | if (ConstantStruct *CS = dyn_cast<ConstantStruct>(Desc->getInitializer())) |
| 158 | if (CS->getNumOperands() > 4) { |
| 159 | if (ConstantUInt *CUI = dyn_cast<ConstantUInt>(CS->getOperand(1))) |
| 160 | Version = CUI->getValue(); |
| 161 | |
| 162 | BaseName = getStringValue(CS->getOperand(3)); |
| 163 | Directory = getStringValue(CS->getOperand(4)); |
| 164 | } |
| 165 | } |
| 166 | |
| 167 | SourceFileInfo::~SourceFileInfo() { |
| 168 | delete SourceText; |
| 169 | } |
| 170 | |
| 171 | SourceFile &SourceFileInfo::getSourceText() const { |
| 172 | // FIXME: this should take into account the source search directories! |
Reid Spencer | 663601c | 2004-12-13 02:59:15 +0000 | [diff] [blame^] | 173 | if (SourceText == 0) { // Read the file in if we haven't already. |
| 174 | sys::Path tmpPath; |
| 175 | if (!Directory.empty()) |
| 176 | tmpPath.setDirectory(Directory); |
| 177 | tmpPath.appendFile(BaseName); |
| 178 | if (tmpPath.readable()) |
| 179 | SourceText = new SourceFile(tmpPath.toString(), Descriptor); |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 180 | else |
| 181 | SourceText = new SourceFile(BaseName, Descriptor); |
Reid Spencer | 663601c | 2004-12-13 02:59:15 +0000 | [diff] [blame^] | 182 | } |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 183 | return *SourceText; |
| 184 | } |
| 185 | |
| 186 | |
| 187 | //===----------------------------------------------------------------------===// |
| 188 | // SourceFunctionInfo implementation |
| 189 | // |
| 190 | SourceFunctionInfo::SourceFunctionInfo(ProgramInfo &PI, |
| 191 | const GlobalVariable *Desc) |
| 192 | : Descriptor(Desc) { |
| 193 | LineNo = ColNo = 0; |
| 194 | if (Desc && Desc->hasInitializer()) |
| 195 | if (ConstantStruct *CS = dyn_cast<ConstantStruct>(Desc->getInitializer())) |
| 196 | if (CS->getNumOperands() > 2) { |
| 197 | // Entry #1 is the file descriptor. |
Reid Spencer | 518310c | 2004-07-18 00:44:37 +0000 | [diff] [blame] | 198 | if (const GlobalVariable *GV = |
| 199 | dyn_cast<GlobalVariable>(CS->getOperand(1))) |
| 200 | SourceFile = &PI.getSourceFile(GV); |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 201 | |
| 202 | // Entry #2 is the function name. |
| 203 | Name = getStringValue(CS->getOperand(2)); |
| 204 | } |
| 205 | } |
| 206 | |
| 207 | /// getSourceLocation - This method returns the location of the first stopping |
| 208 | /// point in the function. |
| 209 | void SourceFunctionInfo::getSourceLocation(unsigned &RetLineNo, |
| 210 | unsigned &RetColNo) const { |
| 211 | // If we haven't computed this yet... |
| 212 | if (!LineNo) { |
| 213 | // Look at all of the users of the function descriptor, looking for calls to |
| 214 | // %llvm.dbg.func.start. |
| 215 | for (Value::use_const_iterator UI = Descriptor->use_begin(), |
| 216 | E = Descriptor->use_end(); UI != E; ++UI) |
| 217 | if (const CallInst *CI = dyn_cast<CallInst>(*UI)) |
| 218 | if (const Function *F = CI->getCalledFunction()) |
| 219 | if (F->getIntrinsicID() == Intrinsic::dbg_func_start) { |
| 220 | // We found the start of the function. Check to see if there are |
| 221 | // any stop points on the use-list of the function start. |
| 222 | const GlobalVariable *SD = getNextStopPoint(CI, LineNo, ColNo); |
| 223 | if (SD) { // We found the first stop point! |
| 224 | // This is just a sanity check. |
| 225 | if (getSourceFile().getDescriptor() != SD) |
| 226 | std::cout << "WARNING: first line of function is not in the" |
| 227 | " file that the function descriptor claims it is in.\n"; |
| 228 | break; |
| 229 | } |
| 230 | } |
| 231 | } |
| 232 | RetLineNo = LineNo; RetColNo = ColNo; |
| 233 | } |
| 234 | |
| 235 | //===----------------------------------------------------------------------===// |
| 236 | // ProgramInfo implementation |
| 237 | // |
| 238 | |
| 239 | ProgramInfo::ProgramInfo(Module *m) : M(m) { |
| 240 | assert(M && "Cannot create program information with a null module!"); |
| 241 | ProgramTimeStamp = getFileTimestamp(M->getModuleIdentifier()); |
| 242 | |
| 243 | SourceFilesIsComplete = false; |
| 244 | SourceFunctionsIsComplete = false; |
| 245 | } |
| 246 | |
| 247 | ProgramInfo::~ProgramInfo() { |
| 248 | // Delete cached information about source program objects... |
| 249 | for (std::map<const GlobalVariable*, SourceFileInfo*>::iterator |
| 250 | I = SourceFiles.begin(), E = SourceFiles.end(); I != E; ++I) |
| 251 | delete I->second; |
| 252 | for (std::map<const GlobalVariable*, SourceFunctionInfo*>::iterator |
| 253 | I = SourceFunctions.begin(), E = SourceFunctions.end(); I != E; ++I) |
| 254 | delete I->second; |
| 255 | |
| 256 | // Delete the source language caches. |
| 257 | for (unsigned i = 0, e = LanguageCaches.size(); i != e; ++i) |
| 258 | delete LanguageCaches[i].second; |
| 259 | } |
| 260 | |
| 261 | |
| 262 | //===----------------------------------------------------------------------===// |
| 263 | // SourceFileInfo tracking... |
| 264 | // |
| 265 | |
| 266 | /// getSourceFile - Return source file information for the specified source file |
| 267 | /// descriptor object, adding it to the collection as needed. This method |
| 268 | /// always succeeds (is unambiguous), and is always efficient. |
| 269 | /// |
| 270 | const SourceFileInfo & |
| 271 | ProgramInfo::getSourceFile(const GlobalVariable *Desc) { |
| 272 | SourceFileInfo *&Result = SourceFiles[Desc]; |
| 273 | if (Result) return *Result; |
| 274 | |
| 275 | // Figure out what language this source file comes from... |
| 276 | unsigned LangID = 0; // Zero is unknown language |
| 277 | if (Desc && Desc->hasInitializer()) |
| 278 | if (ConstantStruct *CS = dyn_cast<ConstantStruct>(Desc->getInitializer())) |
| 279 | if (CS->getNumOperands() > 2) |
| 280 | if (ConstantUInt *CUI = dyn_cast<ConstantUInt>(CS->getOperand(2))) |
| 281 | LangID = CUI->getValue(); |
| 282 | |
| 283 | const SourceLanguage &Lang = SourceLanguage::get(LangID); |
| 284 | SourceFileInfo *New = Lang.createSourceFileInfo(Desc, *this); |
| 285 | |
| 286 | // FIXME: this should check to see if there is already a Filename/WorkingDir |
| 287 | // pair that matches this one. If so, we shouldn't create the duplicate! |
| 288 | // |
| 289 | SourceFileIndex.insert(std::make_pair(New->getBaseName(), New)); |
| 290 | return *(Result = New); |
| 291 | } |
| 292 | |
| 293 | |
| 294 | /// getSourceFiles - Index all of the source files in the program and return |
| 295 | /// a mapping of it. This information is lazily computed the first time |
| 296 | /// that it is requested. Since this information can take a long time to |
| 297 | /// compute, the user is given a chance to cancel it. If this occurs, an |
| 298 | /// exception is thrown. |
| 299 | const std::map<const GlobalVariable*, SourceFileInfo*> & |
| 300 | ProgramInfo::getSourceFiles(bool RequiresCompleteMap) { |
| 301 | // If we have a fully populated map, or if the client doesn't need one, just |
| 302 | // return what we have. |
| 303 | if (SourceFilesIsComplete || !RequiresCompleteMap) |
| 304 | return SourceFiles; |
| 305 | |
| 306 | // Ok, all of the source file descriptors (compile_unit in dwarf terms), |
| 307 | // should be on the use list of the llvm.dbg.translation_units global. |
| 308 | // |
| 309 | GlobalVariable *Units = |
| 310 | M->getGlobalVariable("llvm.dbg.translation_units", |
| 311 | StructType::get(std::vector<const Type*>())); |
| 312 | if (Units == 0) |
| 313 | throw "Program contains no debugging information!"; |
| 314 | |
| 315 | std::vector<GlobalVariable*> TranslationUnits; |
| 316 | getGlobalVariablesUsing(Units, TranslationUnits); |
| 317 | |
| 318 | SlowOperationInformer SOI("building source files index"); |
| 319 | |
| 320 | // Loop over all of the translation units found, building the SourceFiles |
| 321 | // mapping. |
| 322 | for (unsigned i = 0, e = TranslationUnits.size(); i != e; ++i) { |
| 323 | getSourceFile(TranslationUnits[i]); |
| 324 | SOI.progress(i+1, e); |
| 325 | } |
| 326 | |
| 327 | // Ok, if we got this far, then we indexed the whole program. |
| 328 | SourceFilesIsComplete = true; |
| 329 | return SourceFiles; |
| 330 | } |
| 331 | |
| 332 | /// getSourceFile - Look up the file with the specified name. If there is |
| 333 | /// more than one match for the specified filename, prompt the user to pick |
| 334 | /// one. If there is no source file that matches the specified name, throw |
| 335 | /// an exception indicating that we can't find the file. Otherwise, return |
| 336 | /// the file information for that file. |
| 337 | const SourceFileInfo &ProgramInfo::getSourceFile(const std::string &Filename) { |
| 338 | std::multimap<std::string, SourceFileInfo*>::const_iterator Start, End; |
| 339 | getSourceFiles(); |
| 340 | tie(Start, End) = SourceFileIndex.equal_range(Filename); |
| 341 | |
| 342 | if (Start == End) throw "Could not find source file '" + Filename + "'!"; |
| 343 | const SourceFileInfo &SFI = *Start->second; |
| 344 | ++Start; |
| 345 | if (Start == End) return SFI; |
| 346 | |
| 347 | throw "FIXME: Multiple source files with the same name not implemented!"; |
| 348 | } |
| 349 | |
| 350 | |
| 351 | //===----------------------------------------------------------------------===// |
| 352 | // SourceFunctionInfo tracking... |
| 353 | // |
| 354 | |
| 355 | |
| 356 | /// getFunction - Return function information for the specified function |
| 357 | /// descriptor object, adding it to the collection as needed. This method |
| 358 | /// always succeeds (is unambiguous), and is always efficient. |
| 359 | /// |
| 360 | const SourceFunctionInfo & |
| 361 | ProgramInfo::getFunction(const GlobalVariable *Desc) { |
| 362 | SourceFunctionInfo *&Result = SourceFunctions[Desc]; |
| 363 | if (Result) return *Result; |
| 364 | |
| 365 | // Figure out what language this function comes from... |
| 366 | const GlobalVariable *SourceFileDesc = 0; |
| 367 | if (Desc && Desc->hasInitializer()) |
| 368 | if (ConstantStruct *CS = dyn_cast<ConstantStruct>(Desc->getInitializer())) |
| 369 | if (CS->getNumOperands() > 0) |
Reid Spencer | 518310c | 2004-07-18 00:44:37 +0000 | [diff] [blame] | 370 | if (const GlobalVariable *GV = |
| 371 | dyn_cast<GlobalVariable>(CS->getOperand(1))) |
| 372 | SourceFileDesc = GV; |
Chris Lattner | 2eacf26 | 2004-01-05 05:25:10 +0000 | [diff] [blame] | 373 | |
| 374 | const SourceLanguage &Lang = getSourceFile(SourceFileDesc).getLanguage(); |
| 375 | return *(Result = Lang.createSourceFunctionInfo(Desc, *this)); |
| 376 | } |
| 377 | |
| 378 | |
| 379 | // getSourceFunctions - Index all of the functions in the program and return |
| 380 | // them. This information is lazily computed the first time that it is |
| 381 | // requested. Since this information can take a long time to compute, the user |
| 382 | // is given a chance to cancel it. If this occurs, an exception is thrown. |
| 383 | const std::map<const GlobalVariable*, SourceFunctionInfo*> & |
| 384 | ProgramInfo::getSourceFunctions(bool RequiresCompleteMap) { |
| 385 | if (SourceFunctionsIsComplete || !RequiresCompleteMap) |
| 386 | return SourceFunctions; |
| 387 | |
| 388 | // Ok, all of the source function descriptors (subprogram in dwarf terms), |
| 389 | // should be on the use list of the llvm.dbg.translation_units global. |
| 390 | // |
| 391 | GlobalVariable *Units = |
| 392 | M->getGlobalVariable("llvm.dbg.globals", |
| 393 | StructType::get(std::vector<const Type*>())); |
| 394 | if (Units == 0) |
| 395 | throw "Program contains no debugging information!"; |
| 396 | |
| 397 | std::vector<GlobalVariable*> Functions; |
| 398 | getGlobalVariablesUsing(Units, Functions); |
| 399 | |
| 400 | SlowOperationInformer SOI("building functions index"); |
| 401 | |
| 402 | // Loop over all of the functions found, building the SourceFunctions mapping. |
| 403 | for (unsigned i = 0, e = Functions.size(); i != e; ++i) { |
| 404 | getFunction(Functions[i]); |
| 405 | SOI.progress(i+1, e); |
| 406 | } |
| 407 | |
| 408 | // Ok, if we got this far, then we indexed the whole program. |
| 409 | SourceFunctionsIsComplete = true; |
| 410 | return SourceFunctions; |
| 411 | } |