Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 1 | //===- IRSymtab.cpp - implementation of IR symbol tables ------------------===// |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
Chandler Carruth | 6bda14b | 2017-06-06 11:49:48 +0000 | [diff] [blame] | 10 | #include "llvm/Object/IRSymtab.h" |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 11 | #include "llvm/ADT/ArrayRef.h" |
| 12 | #include "llvm/ADT/DenseMap.h" |
| 13 | #include "llvm/ADT/SmallPtrSet.h" |
| 14 | #include "llvm/ADT/SmallString.h" |
| 15 | #include "llvm/ADT/SmallVector.h" |
| 16 | #include "llvm/ADT/StringRef.h" |
| 17 | #include "llvm/ADT/Triple.h" |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 18 | #include "llvm/Analysis/ObjectUtils.h" |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 19 | #include "llvm/IR/Comdat.h" |
| 20 | #include "llvm/IR/DataLayout.h" |
| 21 | #include "llvm/IR/GlobalAlias.h" |
| 22 | #include "llvm/IR/GlobalObject.h" |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 23 | #include "llvm/IR/Mangler.h" |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 24 | #include "llvm/IR/Metadata.h" |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 25 | #include "llvm/IR/Module.h" |
Peter Collingbourne | c00c2b2 | 2017-06-08 01:26:14 +0000 | [diff] [blame] | 26 | #include "llvm/Bitcode/BitcodeReader.h" |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 27 | #include "llvm/MC/StringTableBuilder.h" |
Peter Collingbourne | c00c2b2 | 2017-06-08 01:26:14 +0000 | [diff] [blame] | 28 | #include "llvm/Object/IRObjectFile.h" |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 29 | #include "llvm/Object/ModuleSymbolTable.h" |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 30 | #include "llvm/Object/SymbolicFile.h" |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 31 | #include "llvm/Support/Allocator.h" |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 32 | #include "llvm/Support/Casting.h" |
| 33 | #include "llvm/Support/Error.h" |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 34 | #include "llvm/Support/StringSaver.h" |
Chandler Carruth | 6bda14b | 2017-06-06 11:49:48 +0000 | [diff] [blame] | 35 | #include "llvm/Support/raw_ostream.h" |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 36 | #include <cassert> |
| 37 | #include <string> |
| 38 | #include <utility> |
| 39 | #include <vector> |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 40 | |
| 41 | using namespace llvm; |
| 42 | using namespace irsymtab; |
| 43 | |
| 44 | namespace { |
| 45 | |
| 46 | /// Stores the temporary state that is required to build an IR symbol table. |
| 47 | struct Builder { |
| 48 | SmallVector<char, 0> &Symtab; |
| 49 | SmallVector<char, 0> &Strtab; |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 50 | |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 51 | Builder(SmallVector<char, 0> &Symtab, SmallVector<char, 0> &Strtab) |
| 52 | : Symtab(Symtab), Strtab(Strtab) {} |
| 53 | |
Peter Collingbourne | c74cf06 | 2017-04-17 17:55:24 +0000 | [diff] [blame] | 54 | StringTableBuilder StrtabBuilder{StringTableBuilder::RAW}; |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 55 | |
| 56 | BumpPtrAllocator Alloc; |
| 57 | StringSaver Saver{Alloc}; |
| 58 | |
| 59 | DenseMap<const Comdat *, unsigned> ComdatMap; |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 60 | Mangler Mang; |
| 61 | Triple TT; |
| 62 | |
| 63 | std::vector<storage::Comdat> Comdats; |
| 64 | std::vector<storage::Module> Mods; |
| 65 | std::vector<storage::Symbol> Syms; |
| 66 | std::vector<storage::Uncommon> Uncommons; |
| 67 | |
| 68 | std::string COFFLinkerOpts; |
| 69 | raw_string_ostream COFFLinkerOptsOS{COFFLinkerOpts}; |
| 70 | |
| 71 | void setStr(storage::Str &S, StringRef Value) { |
| 72 | S.Offset = StrtabBuilder.add(Value); |
Peter Collingbourne | c74cf06 | 2017-04-17 17:55:24 +0000 | [diff] [blame] | 73 | S.Size = Value.size(); |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 74 | } |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 75 | |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 76 | template <typename T> |
| 77 | void writeRange(storage::Range<T> &R, const std::vector<T> &Objs) { |
| 78 | R.Offset = Symtab.size(); |
| 79 | R.Size = Objs.size(); |
| 80 | Symtab.insert(Symtab.end(), reinterpret_cast<const char *>(Objs.data()), |
| 81 | reinterpret_cast<const char *>(Objs.data() + Objs.size())); |
| 82 | } |
| 83 | |
| 84 | Error addModule(Module *M); |
Peter Collingbourne | 76423dc | 2017-04-17 23:43:49 +0000 | [diff] [blame] | 85 | Error addSymbol(const ModuleSymbolTable &Msymtab, |
| 86 | const SmallPtrSet<GlobalValue *, 8> &Used, |
| 87 | ModuleSymbolTable::Symbol Sym); |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 88 | |
| 89 | Error build(ArrayRef<Module *> Mods); |
| 90 | }; |
| 91 | |
| 92 | Error Builder::addModule(Module *M) { |
Peter Collingbourne | dc8c018 | 2017-06-08 22:04:24 +0000 | [diff] [blame] | 93 | if (M->getDataLayoutStr().empty()) |
| 94 | return make_error<StringError>("input module has no datalayout", |
| 95 | inconvertibleErrorCode()); |
| 96 | |
Peter Collingbourne | 76423dc | 2017-04-17 23:43:49 +0000 | [diff] [blame] | 97 | SmallPtrSet<GlobalValue *, 8> Used; |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 98 | collectUsedGlobalVariables(*M, Used, /*CompilerUsed*/ false); |
| 99 | |
Peter Collingbourne | 76423dc | 2017-04-17 23:43:49 +0000 | [diff] [blame] | 100 | ModuleSymbolTable Msymtab; |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 101 | Msymtab.addModule(M); |
Peter Collingbourne | 76423dc | 2017-04-17 23:43:49 +0000 | [diff] [blame] | 102 | |
| 103 | storage::Module Mod; |
| 104 | Mod.Begin = Syms.size(); |
| 105 | Mod.End = Syms.size() + Msymtab.symbols().size(); |
| 106 | Mod.UncBegin = Uncommons.size(); |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 107 | Mods.push_back(Mod); |
| 108 | |
| 109 | if (TT.isOSBinFormatCOFF()) { |
| 110 | if (auto E = M->materializeMetadata()) |
| 111 | return E; |
Peter Collingbourne | 89061b2 | 2017-06-12 20:10:48 +0000 | [diff] [blame^] | 112 | if (NamedMDNode *LinkerOptions = |
| 113 | M->getNamedMetadata("llvm.linker.options")) { |
| 114 | for (MDNode *MDOptions : LinkerOptions->operands()) |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 115 | for (const MDOperand &MDOption : cast<MDNode>(MDOptions)->operands()) |
| 116 | COFFLinkerOptsOS << " " << cast<MDString>(MDOption)->getString(); |
| 117 | } |
| 118 | } |
| 119 | |
Peter Collingbourne | 76423dc | 2017-04-17 23:43:49 +0000 | [diff] [blame] | 120 | for (ModuleSymbolTable::Symbol Msym : Msymtab.symbols()) |
| 121 | if (Error Err = addSymbol(Msymtab, Used, Msym)) |
| 122 | return Err; |
| 123 | |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 124 | return Error::success(); |
| 125 | } |
| 126 | |
Peter Collingbourne | 76423dc | 2017-04-17 23:43:49 +0000 | [diff] [blame] | 127 | Error Builder::addSymbol(const ModuleSymbolTable &Msymtab, |
| 128 | const SmallPtrSet<GlobalValue *, 8> &Used, |
| 129 | ModuleSymbolTable::Symbol Msym) { |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 130 | Syms.emplace_back(); |
| 131 | storage::Symbol &Sym = Syms.back(); |
| 132 | Sym = {}; |
| 133 | |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 134 | storage::Uncommon *Unc = nullptr; |
| 135 | auto Uncommon = [&]() -> storage::Uncommon & { |
| 136 | if (Unc) |
| 137 | return *Unc; |
Peter Collingbourne | 76423dc | 2017-04-17 23:43:49 +0000 | [diff] [blame] | 138 | Sym.Flags |= 1 << storage::Symbol::FB_has_uncommon; |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 139 | Uncommons.emplace_back(); |
| 140 | Unc = &Uncommons.back(); |
| 141 | *Unc = {}; |
| 142 | setStr(Unc->COFFWeakExternFallbackName, ""); |
| 143 | return *Unc; |
| 144 | }; |
| 145 | |
| 146 | SmallString<64> Name; |
| 147 | { |
| 148 | raw_svector_ostream OS(Name); |
| 149 | Msymtab.printSymbolName(OS, Msym); |
| 150 | } |
| 151 | setStr(Sym.Name, Saver.save(StringRef(Name))); |
| 152 | |
| 153 | auto Flags = Msymtab.getSymbolFlags(Msym); |
| 154 | if (Flags & object::BasicSymbolRef::SF_Undefined) |
| 155 | Sym.Flags |= 1 << storage::Symbol::FB_undefined; |
| 156 | if (Flags & object::BasicSymbolRef::SF_Weak) |
| 157 | Sym.Flags |= 1 << storage::Symbol::FB_weak; |
| 158 | if (Flags & object::BasicSymbolRef::SF_Common) |
| 159 | Sym.Flags |= 1 << storage::Symbol::FB_common; |
| 160 | if (Flags & object::BasicSymbolRef::SF_Indirect) |
| 161 | Sym.Flags |= 1 << storage::Symbol::FB_indirect; |
| 162 | if (Flags & object::BasicSymbolRef::SF_Global) |
| 163 | Sym.Flags |= 1 << storage::Symbol::FB_global; |
| 164 | if (Flags & object::BasicSymbolRef::SF_FormatSpecific) |
| 165 | Sym.Flags |= 1 << storage::Symbol::FB_format_specific; |
Tobias Edler von Koch | 90df1f48 | 2017-04-13 16:24:14 +0000 | [diff] [blame] | 166 | if (Flags & object::BasicSymbolRef::SF_Executable) |
| 167 | Sym.Flags |= 1 << storage::Symbol::FB_executable; |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 168 | |
| 169 | Sym.ComdatIndex = -1; |
| 170 | auto *GV = Msym.dyn_cast<GlobalValue *>(); |
| 171 | if (!GV) { |
Peter Collingbourne | fa58f75 | 2017-04-26 17:53:39 +0000 | [diff] [blame] | 172 | // Undefined module asm symbols act as GC roots and are implicitly used. |
| 173 | if (Flags & object::BasicSymbolRef::SF_Undefined) |
| 174 | Sym.Flags |= 1 << storage::Symbol::FB_used; |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 175 | setStr(Sym.IRName, ""); |
| 176 | return Error::success(); |
| 177 | } |
| 178 | |
| 179 | setStr(Sym.IRName, GV->getName()); |
| 180 | |
| 181 | if (Used.count(GV)) |
| 182 | Sym.Flags |= 1 << storage::Symbol::FB_used; |
| 183 | if (GV->isThreadLocal()) |
| 184 | Sym.Flags |= 1 << storage::Symbol::FB_tls; |
| 185 | if (GV->hasGlobalUnnamedAddr()) |
| 186 | Sym.Flags |= 1 << storage::Symbol::FB_unnamed_addr; |
| 187 | if (canBeOmittedFromSymbolTable(GV)) |
| 188 | Sym.Flags |= 1 << storage::Symbol::FB_may_omit; |
| 189 | Sym.Flags |= unsigned(GV->getVisibility()) << storage::Symbol::FB_visibility; |
| 190 | |
| 191 | if (Flags & object::BasicSymbolRef::SF_Common) { |
| 192 | Uncommon().CommonSize = GV->getParent()->getDataLayout().getTypeAllocSize( |
| 193 | GV->getType()->getElementType()); |
| 194 | Uncommon().CommonAlign = GV->getAlignment(); |
| 195 | } |
| 196 | |
| 197 | const GlobalObject *Base = GV->getBaseObject(); |
| 198 | if (!Base) |
| 199 | return make_error<StringError>("Unable to determine comdat of alias!", |
| 200 | inconvertibleErrorCode()); |
| 201 | if (const Comdat *C = Base->getComdat()) { |
| 202 | auto P = ComdatMap.insert(std::make_pair(C, Comdats.size())); |
| 203 | Sym.ComdatIndex = P.first->second; |
| 204 | |
| 205 | if (P.second) { |
| 206 | storage::Comdat Comdat; |
| 207 | setStr(Comdat.Name, C->getName()); |
| 208 | Comdats.push_back(Comdat); |
| 209 | } |
| 210 | } |
| 211 | |
| 212 | if (TT.isOSBinFormatCOFF()) { |
| 213 | emitLinkerFlagsForGlobalCOFF(COFFLinkerOptsOS, GV, TT, Mang); |
| 214 | |
| 215 | if ((Flags & object::BasicSymbolRef::SF_Weak) && |
| 216 | (Flags & object::BasicSymbolRef::SF_Indirect)) { |
| 217 | std::string FallbackName; |
| 218 | raw_string_ostream OS(FallbackName); |
| 219 | Msymtab.printSymbolName( |
| 220 | OS, cast<GlobalValue>( |
| 221 | cast<GlobalAlias>(GV)->getAliasee()->stripPointerCasts())); |
| 222 | OS.flush(); |
| 223 | setStr(Uncommon().COFFWeakExternFallbackName, Saver.save(FallbackName)); |
| 224 | } |
| 225 | } |
| 226 | |
| 227 | return Error::success(); |
| 228 | } |
| 229 | |
| 230 | Error Builder::build(ArrayRef<Module *> IRMods) { |
| 231 | storage::Header Hdr; |
| 232 | |
| 233 | assert(!IRMods.empty()); |
Peter Collingbourne | 8446f1f | 2017-04-14 02:55:06 +0000 | [diff] [blame] | 234 | setStr(Hdr.TargetTriple, IRMods[0]->getTargetTriple()); |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 235 | setStr(Hdr.SourceFileName, IRMods[0]->getSourceFileName()); |
| 236 | TT = Triple(IRMods[0]->getTargetTriple()); |
| 237 | |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 238 | for (auto *M : IRMods) |
| 239 | if (Error Err = addModule(M)) |
| 240 | return Err; |
| 241 | |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 242 | COFFLinkerOptsOS.flush(); |
| 243 | setStr(Hdr.COFFLinkerOpts, COFFLinkerOpts); |
| 244 | |
| 245 | // We are about to fill in the header's range fields, so reserve space for it |
| 246 | // and copy it in afterwards. |
| 247 | Symtab.resize(sizeof(storage::Header)); |
| 248 | writeRange(Hdr.Modules, Mods); |
| 249 | writeRange(Hdr.Comdats, Comdats); |
| 250 | writeRange(Hdr.Symbols, Syms); |
| 251 | writeRange(Hdr.Uncommons, Uncommons); |
| 252 | |
| 253 | *reinterpret_cast<storage::Header *>(Symtab.data()) = Hdr; |
| 254 | |
| 255 | raw_svector_ostream OS(Strtab); |
| 256 | StrtabBuilder.finalizeInOrder(); |
| 257 | StrtabBuilder.write(OS); |
| 258 | |
| 259 | return Error::success(); |
| 260 | } |
| 261 | |
Eugene Zelenko | 1df42fa | 2017-04-24 23:21:38 +0000 | [diff] [blame] | 262 | } // end anonymous namespace |
Peter Collingbourne | 7b30f16 | 2017-03-31 04:47:07 +0000 | [diff] [blame] | 263 | |
| 264 | Error irsymtab::build(ArrayRef<Module *> Mods, SmallVector<char, 0> &Symtab, |
| 265 | SmallVector<char, 0> &Strtab) { |
| 266 | return Builder(Symtab, Strtab).build(Mods); |
| 267 | } |
Peter Collingbourne | c00c2b2 | 2017-06-08 01:26:14 +0000 | [diff] [blame] | 268 | |
Peter Collingbourne | 8dde4cb | 2017-06-08 22:00:24 +0000 | [diff] [blame] | 269 | // Upgrade a vector of bitcode modules created by an old version of LLVM by |
| 270 | // creating an irsymtab for them in the current format. |
| 271 | static Expected<FileContents> upgrade(ArrayRef<BitcodeModule> BMs) { |
Peter Collingbourne | c00c2b2 | 2017-06-08 01:26:14 +0000 | [diff] [blame] | 272 | FileContents FC; |
Peter Collingbourne | c00c2b2 | 2017-06-08 01:26:14 +0000 | [diff] [blame] | 273 | |
| 274 | LLVMContext Ctx; |
| 275 | std::vector<Module *> Mods; |
| 276 | std::vector<std::unique_ptr<Module>> OwnedMods; |
| 277 | for (auto BM : BMs) { |
| 278 | Expected<std::unique_ptr<Module>> MOrErr = |
| 279 | BM.getLazyModule(Ctx, /*ShouldLazyLoadMetadata*/ true, |
| 280 | /*IsImporting*/ false); |
| 281 | if (!MOrErr) |
| 282 | return MOrErr.takeError(); |
| 283 | |
Peter Collingbourne | c00c2b2 | 2017-06-08 01:26:14 +0000 | [diff] [blame] | 284 | Mods.push_back(MOrErr->get()); |
| 285 | OwnedMods.push_back(std::move(*MOrErr)); |
| 286 | } |
| 287 | |
| 288 | if (Error E = build(Mods, FC.Symtab, FC.Strtab)) |
| 289 | return std::move(E); |
| 290 | |
| 291 | FC.TheReader = {{FC.Symtab.data(), FC.Symtab.size()}, |
| 292 | {FC.Strtab.data(), FC.Strtab.size()}}; |
| 293 | return std::move(FC); |
| 294 | } |
Peter Collingbourne | 8dde4cb | 2017-06-08 22:00:24 +0000 | [diff] [blame] | 295 | |
| 296 | Expected<FileContents> irsymtab::readBitcode(const BitcodeFileContents &BFC) { |
| 297 | if (BFC.Mods.empty()) |
| 298 | return make_error<StringError>("Bitcode file does not contain any modules", |
| 299 | inconvertibleErrorCode()); |
| 300 | |
| 301 | // Right now we have no on-disk representation of symbol tables, so we always |
| 302 | // upgrade. |
| 303 | return upgrade(BFC.Mods); |
| 304 | } |