blob: 82bd17a068a43d49063aa0ecafdbff1244cc936e [file] [log] [blame]
Rui Ueyama411c63602015-05-28 19:09:30 +00001//===- SymbolTable.cpp ----------------------------------------------------===//
2//
3// The LLVM Linker
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#include "Config.h"
11#include "Driver.h"
Rui Ueyama8fd9fb92015-06-01 02:58:15 +000012#include "Error.h"
Rui Ueyama411c63602015-05-28 19:09:30 +000013#include "SymbolTable.h"
Rui Ueyama411c63602015-05-28 19:09:30 +000014#include "llvm/ADT/STLExtras.h"
Peter Collingbourne60c16162015-06-01 20:10:10 +000015#include "llvm/LTO/LTOCodeGenerator.h"
Rui Ueyama411c63602015-05-28 19:09:30 +000016#include "llvm/Support/Debug.h"
17#include "llvm/Support/raw_ostream.h"
Rui Ueyamaf5313b32015-06-28 22:16:41 +000018#include <utility>
Rui Ueyama411c63602015-05-28 19:09:30 +000019
Rui Ueyamad68ff342015-05-31 03:57:30 +000020using namespace llvm;
21
Rui Ueyama411c63602015-05-28 19:09:30 +000022namespace lld {
23namespace coff {
24
25SymbolTable::SymbolTable() {
Rui Ueyama07e661f2015-06-03 05:39:12 +000026 resolve(new (Alloc) DefinedAbsolute("__ImageBase", Config->ImageBase));
Rui Ueyama5cff6852015-05-31 03:34:08 +000027 if (!Config->EntryName.empty())
Rui Ueyama07e661f2015-06-03 05:39:12 +000028 resolve(new (Alloc) Undefined(Config->EntryName));
Rui Ueyama411c63602015-05-28 19:09:30 +000029}
30
Rui Ueyama0d2e9992015-06-23 23:56:39 +000031void SymbolTable::addFile(std::unique_ptr<InputFile> File) {
32 Files.push_back(std::move(File));
Rui Ueyama411c63602015-05-28 19:09:30 +000033}
34
Rui Ueyama0d2e9992015-06-23 23:56:39 +000035std::error_code SymbolTable::run() {
36 while (FileIdx < Files.size()) {
37 InputFile *F = Files[FileIdx++].get();
38 if (Config->Verbose)
39 llvm::outs() << "Reading " << F->getShortName() << "\n";
40 if (auto EC = F->parse())
41 return EC;
42 if (auto *P = dyn_cast<ObjectFile>(F)) {
43 ObjectFiles.push_back(P);
44 } else if (auto *P = dyn_cast<ArchiveFile>(F)) {
45 ArchiveFiles.push_back(P);
46 } else if (auto *P = dyn_cast<BitcodeFile>(F)) {
47 BitcodeFiles.push_back(P);
48 } else {
49 ImportFiles.push_back(cast<ImportFile>(F));
Rui Ueyamaeeae5dd2015-06-08 06:00:10 +000050 }
Rui Ueyama0d2e9992015-06-23 23:56:39 +000051
52 for (SymbolBody *B : F->getSymbols())
53 if (B->isExternal())
54 if (auto EC = resolve(B))
55 return EC;
56
57 // If a object file contains .drectve section,
58 // read that and add files listed there.
59 StringRef S = F->getDirectives();
60 if (!S.empty())
61 if (auto EC = Driver->parseDirectives(S))
62 return EC;
Rui Ueyamaeeae5dd2015-06-08 06:00:10 +000063 }
Peter Collingbourneace2f092015-06-06 02:00:45 +000064 return std::error_code();
65}
66
Rui Ueyama411c63602015-05-28 19:09:30 +000067bool SymbolTable::reportRemainingUndefines() {
68 bool Ret = false;
69 for (auto &I : Symtab) {
70 Symbol *Sym = I.second;
71 auto *Undef = dyn_cast<Undefined>(Sym->Body);
72 if (!Undef)
73 continue;
Rui Ueyamad7666532015-06-25 02:21:44 +000074 StringRef Name = Undef->getName();
Rui Ueyamaf24e6f82015-06-28 20:34:09 +000075 // The weak alias may have been resovled, so check for that.
Rui Ueyama411c63602015-05-28 19:09:30 +000076 if (SymbolBody *Alias = Undef->getWeakAlias()) {
Rui Ueyamaf24e6f82015-06-28 20:34:09 +000077 if (auto *D = dyn_cast<Defined>(Alias->getReplacement())) {
78 Sym->Body = D;
79 continue;
Rui Ueyama411c63602015-05-28 19:09:30 +000080 }
Rui Ueyama411c63602015-05-28 19:09:30 +000081 }
Rui Ueyamad7666532015-06-25 02:21:44 +000082 // If we can resolve a symbol by removing __imp_ prefix, do that.
83 // This odd rule is for compatibility with MSVC linker.
84 if (Name.startswith("__imp_")) {
85 if (Defined *Imp = find(Name.substr(strlen("__imp_")))) {
Rui Ueyama88e0f922015-06-25 03:31:47 +000086 auto *S = new (Alloc) DefinedLocalImport(Name, Imp);
87 LocalImportChunks.push_back(S->getChunk());
88 Sym->Body = S;
Rui Ueyamad7666532015-06-25 02:21:44 +000089 continue;
90 }
91 }
92 llvm::errs() << "undefined symbol: " << Name << "\n";
Rui Ueyama95925fd2015-06-28 19:35:15 +000093 // Remaining undefined symbols are not fatal if /force is specified.
94 // They are replaced with dummy defined symbols.
95 if (Config->Force) {
96 Sym->Body = new (Alloc) DefinedAbsolute(Name, 0);
97 continue;
98 }
Rui Ueyama411c63602015-05-28 19:09:30 +000099 Ret = true;
100 }
101 return Ret;
102}
103
104// This function resolves conflicts if there's an existing symbol with
105// the same name. Decisions are made based on symbol type.
106std::error_code SymbolTable::resolve(SymbolBody *New) {
107 // Find an existing Symbol or create and insert a new one.
108 StringRef Name = New->getName();
109 Symbol *&Sym = Symtab[Name];
110 if (!Sym) {
111 Sym = new (Alloc) Symbol(New);
112 New->setBackref(Sym);
Rui Ueyama573bf7d2015-06-19 21:12:48 +0000113 ++Version;
Rui Ueyama411c63602015-05-28 19:09:30 +0000114 return std::error_code();
115 }
116 New->setBackref(Sym);
117
118 // compare() returns -1, 0, or 1 if the lhs symbol is less preferable,
119 // equivalent (conflicting), or more preferable, respectively.
120 SymbolBody *Existing = Sym->Body;
121 int comp = Existing->compare(New);
Rui Ueyama573bf7d2015-06-19 21:12:48 +0000122 if (comp < 0) {
Rui Ueyama411c63602015-05-28 19:09:30 +0000123 Sym->Body = New;
Rui Ueyama573bf7d2015-06-19 21:12:48 +0000124 ++Version;
125 }
Rui Ueyama8fd9fb92015-06-01 02:58:15 +0000126 if (comp == 0) {
Rui Ueyama68633f12015-06-25 23:22:00 +0000127 llvm::errs() << "duplicate symbol: " << Existing->getDebugName()
128 << " and " << New->getDebugName() << "\n";
Rui Ueyama8fd9fb92015-06-01 02:58:15 +0000129 return make_error_code(LLDError::DuplicateSymbols);
130 }
Rui Ueyama411c63602015-05-28 19:09:30 +0000131
132 // If we have an Undefined symbol for a Lazy symbol, we need
133 // to read an archive member to replace the Lazy symbol with
134 // a Defined symbol.
135 if (isa<Undefined>(Existing) || isa<Undefined>(New))
136 if (auto *B = dyn_cast<Lazy>(Sym->Body))
137 return addMemberFile(B);
138 return std::error_code();
139}
140
141// Reads an archive member file pointed by a given symbol.
142std::error_code SymbolTable::addMemberFile(Lazy *Body) {
143 auto FileOrErr = Body->getMember();
144 if (auto EC = FileOrErr.getError())
145 return EC;
146 std::unique_ptr<InputFile> File = std::move(FileOrErr.get());
147
148 // getMember returns an empty buffer if the member was already
149 // read from the library.
150 if (!File)
151 return std::error_code();
152 if (Config->Verbose)
Rui Ueyama5b2588a2015-06-08 05:43:50 +0000153 llvm::outs() << "Loaded " << File->getShortName() << " for "
Rui Ueyama411c63602015-05-28 19:09:30 +0000154 << Body->getName() << "\n";
Rui Ueyama0d2e9992015-06-23 23:56:39 +0000155 addFile(std::move(File));
156 return std::error_code();
Rui Ueyama411c63602015-05-28 19:09:30 +0000157}
158
159std::vector<Chunk *> SymbolTable::getChunks() {
160 std::vector<Chunk *> Res;
Rui Ueyama0d2e9992015-06-23 23:56:39 +0000161 for (ObjectFile *File : ObjectFiles) {
Rui Ueyama411c63602015-05-28 19:09:30 +0000162 std::vector<Chunk *> &V = File->getChunks();
163 Res.insert(Res.end(), V.begin(), V.end());
164 }
165 return Res;
166}
167
Rui Ueyama5cff6852015-05-31 03:34:08 +0000168Defined *SymbolTable::find(StringRef Name) {
Rui Ueyama411c63602015-05-28 19:09:30 +0000169 auto It = Symtab.find(Name);
170 if (It == Symtab.end())
171 return nullptr;
Rui Ueyama5cff6852015-05-31 03:34:08 +0000172 if (auto *Def = dyn_cast<Defined>(It->second->Body))
173 return Def;
174 return nullptr;
175}
176
Rui Ueyama45044f42015-06-29 01:03:53 +0000177// Find a given symbol. If a lazy symbol is found,
178// resolve that before returning.
179Defined *SymbolTable::findLazy(StringRef Name) {
180 auto It = Symtab.find(Name);
181 if (It == Symtab.end())
182 return nullptr;
183 Symbol *Sym = It->second;
184 if (auto *B = dyn_cast<Defined>(Sym->Body))
185 return B;
186 if (auto *B = dyn_cast<Lazy>(Sym->Body)) {
187 if (addMemberFile(B))
188 return nullptr;
189 if (run())
190 return nullptr;
191 return cast<Defined>(Sym->Body);
192 }
193 return nullptr;
194}
195
Rui Ueyamaf5313b32015-06-28 22:16:41 +0000196// Find a given symbol or its mangled symbol.
197std::pair<StringRef, Symbol *> SymbolTable::findMangled(StringRef S) {
198 auto It = Symtab.find(S);
199 if (It != Symtab.end()) {
200 Symbol *Sym = It->second;
201 if (isa<Defined>(Sym->Body))
202 return std::make_pair(S, Sym);
203 }
204
205 // In Microsoft ABI, a non-member function name is mangled this way.
206 std::string Prefix = ("?" + S + "@@Y").str();
207 for (auto I : Symtab) {
208 StringRef Name = I.first;
209 Symbol *Sym = I.second;
210 if (!Name.startswith(Prefix))
211 continue;
Rui Ueyama6b79ed12015-06-29 14:27:10 +0000212 if (auto *B = dyn_cast<Lazy>(Sym->Body)) {
213 addMemberFile(B);
214 run();
215 }
Rui Ueyamaf5313b32015-06-28 22:16:41 +0000216 if (isa<Defined>(Sym->Body))
217 return std::make_pair(Name, Sym);
218 }
219 return std::make_pair(S, nullptr);
220}
221
Rui Ueyamae042fa9a2015-05-31 19:55:40 +0000222std::error_code SymbolTable::addUndefined(StringRef Name) {
Rui Ueyama07e661f2015-06-03 05:39:12 +0000223 return resolve(new (Alloc) Undefined(Name));
Rui Ueyamae042fa9a2015-05-31 19:55:40 +0000224}
225
Rui Ueyama360bace2015-05-31 22:31:31 +0000226// Resolve To, and make From an alias to To.
227std::error_code SymbolTable::rename(StringRef From, StringRef To) {
Rui Ueyama4d2834b2015-06-19 19:23:43 +0000228 // If From is not undefined, do nothing.
229 // Otherwise, rename it to see if To can be resolved instead.
230 auto It = Symtab.find(From);
231 if (It == Symtab.end())
232 return std::error_code();
233 Symbol *Sym = It->second;
234 if (!isa<Undefined>(Sym->Body))
235 return std::error_code();
Rui Ueyama360bace2015-05-31 22:31:31 +0000236 SymbolBody *Body = new (Alloc) Undefined(To);
237 if (auto EC = resolve(Body))
238 return EC;
Rui Ueyama45044f42015-06-29 01:03:53 +0000239 SymbolBody *Repl = Body->getReplacement();
240 if (isa<Undefined>(Repl))
241 return std::error_code();
242 Sym->Body = Repl;
Rui Ueyama4d2834b2015-06-19 19:23:43 +0000243 Body->setBackref(Sym);
Rui Ueyama573bf7d2015-06-19 21:12:48 +0000244 ++Version;
Rui Ueyama360bace2015-05-31 22:31:31 +0000245 return std::error_code();
246}
247
Peter Collingbournebe549552015-06-26 18:58:24 +0000248void SymbolTable::printMap(llvm::raw_ostream &OS) {
249 for (ObjectFile *File : ObjectFiles) {
250 OS << File->getShortName() << ":\n";
251 for (SymbolBody *Body : File->getSymbols())
252 if (auto *R = dyn_cast<DefinedRegular>(Body))
253 if (R->isLive())
254 OS << Twine::utohexstr(Config->ImageBase + R->getRVA())
255 << " " << R->getName() << "\n";
256 }
257}
258
Peter Collingbourne60c16162015-06-01 20:10:10 +0000259std::error_code SymbolTable::addCombinedLTOObject() {
260 if (BitcodeFiles.empty())
261 return std::error_code();
262
Peter Collingbourne60c16162015-06-01 20:10:10 +0000263 // Create an object file and add it to the symbol table by replacing any
264 // DefinedBitcode symbols with the definitions in the object file.
Rui Ueyamaefba7812015-06-09 17:52:17 +0000265 LTOCodeGenerator CG;
266 auto FileOrErr = createLTOObject(&CG);
267 if (auto EC = FileOrErr.getError())
Peter Collingbourne60c16162015-06-01 20:10:10 +0000268 return EC;
Rui Ueyamaefba7812015-06-09 17:52:17 +0000269 ObjectFile *Obj = FileOrErr.get();
270
Rui Ueyama0d2e9992015-06-23 23:56:39 +0000271 // Skip the combined object file as the file is processed below
272 // rather than by run().
273 ++FileIdx;
274
Peter Collingbourne60c16162015-06-01 20:10:10 +0000275 for (SymbolBody *Body : Obj->getSymbols()) {
276 if (!Body->isExternal())
277 continue;
Peter Collingbourned9e4e982015-06-09 02:53:09 +0000278 // Find an existing Symbol. We should not see any new undefined symbols at
279 // this point.
Peter Collingbourne60c16162015-06-01 20:10:10 +0000280 StringRef Name = Body->getName();
Peter Collingbourned9e4e982015-06-09 02:53:09 +0000281 Symbol *&Sym = Symtab[Name];
Peter Collingbourne60c16162015-06-01 20:10:10 +0000282 if (!Sym) {
Peter Collingbourned9e4e982015-06-09 02:53:09 +0000283 if (!isa<Defined>(Body)) {
284 llvm::errs() << "LTO: undefined symbol: " << Name << '\n';
285 return make_error_code(LLDError::BrokenFile);
286 }
287 Sym = new (Alloc) Symbol(Body);
288 Body->setBackref(Sym);
289 continue;
Peter Collingbourne60c16162015-06-01 20:10:10 +0000290 }
291 Body->setBackref(Sym);
292
293 if (isa<DefinedBitcode>(Sym->Body)) {
294 // The symbol should now be defined.
295 if (!isa<Defined>(Body)) {
296 llvm::errs() << "LTO: undefined symbol: " << Name << '\n';
297 return make_error_code(LLDError::BrokenFile);
298 }
299 Sym->Body = Body;
Peter Collingbourne1b6fd1f2015-06-11 21:49:54 +0000300 } else {
301 int comp = Sym->Body->compare(Body);
302 if (comp < 0)
303 Sym->Body = Body;
304 if (comp == 0) {
305 llvm::errs() << "LTO: unexpected duplicate symbol: " << Name << "\n";
306 return make_error_code(LLDError::BrokenFile);
307 }
Peter Collingbourne60c16162015-06-01 20:10:10 +0000308 }
Peter Collingbourne73b75e32015-06-09 04:29:54 +0000309
310 // We may see new references to runtime library symbols such as __chkstk
311 // here. These symbols must be wholly defined in non-bitcode files.
Rui Ueyama0d2e9992015-06-23 23:56:39 +0000312 if (auto *B = dyn_cast<Lazy>(Sym->Body))
Peter Collingbourne2ed4c8f2015-06-24 00:12:34 +0000313 if (auto EC = addMemberFile(B))
314 return EC;
Rui Ueyama0d2e9992015-06-23 23:56:39 +0000315 }
316
317 size_t NumBitcodeFiles = BitcodeFiles.size();
318 if (auto EC = run())
319 return EC;
320 if (BitcodeFiles.size() != NumBitcodeFiles) {
321 llvm::errs() << "LTO: late loaded symbol created new bitcode reference\n";
322 return make_error_code(LLDError::BrokenFile);
Peter Collingbourne60c16162015-06-01 20:10:10 +0000323 }
324
Peter Collingbourne73b75e32015-06-09 04:29:54 +0000325 // New runtime library symbol references may have created undefined references.
326 if (reportRemainingUndefines())
327 return make_error_code(LLDError::BrokenFile);
Peter Collingbourne60c16162015-06-01 20:10:10 +0000328 return std::error_code();
329}
330
Rui Ueyamaefba7812015-06-09 17:52:17 +0000331// Combine and compile bitcode files and then return the result
332// as a regular COFF object file.
333ErrorOr<ObjectFile *> SymbolTable::createLTOObject(LTOCodeGenerator *CG) {
334 // All symbols referenced by non-bitcode objects must be preserved.
Rui Ueyama0d2e9992015-06-23 23:56:39 +0000335 for (ObjectFile *File : ObjectFiles)
Rui Ueyamaefba7812015-06-09 17:52:17 +0000336 for (SymbolBody *Body : File->getSymbols())
337 if (auto *S = dyn_cast<DefinedBitcode>(Body->getReplacement()))
338 CG->addMustPreserveSymbol(S->getName());
339
Peter Collingbourne1b6fd1f2015-06-11 21:49:54 +0000340 // Likewise for bitcode symbols which we initially resolved to non-bitcode.
Rui Ueyama0d2e9992015-06-23 23:56:39 +0000341 for (BitcodeFile *File : BitcodeFiles)
Peter Collingbourne1b6fd1f2015-06-11 21:49:54 +0000342 for (SymbolBody *Body : File->getSymbols())
343 if (isa<DefinedBitcode>(Body) &&
344 !isa<DefinedBitcode>(Body->getReplacement()))
345 CG->addMustPreserveSymbol(Body->getName());
346
Rui Ueyamaefba7812015-06-09 17:52:17 +0000347 // Likewise for other symbols that must be preserved.
348 for (StringRef Name : Config->GCRoots)
349 if (isa<DefinedBitcode>(Symtab[Name]->Body))
350 CG->addMustPreserveSymbol(Name);
351
352 CG->setModule(BitcodeFiles[0]->releaseModule());
353 for (unsigned I = 1, E = BitcodeFiles.size(); I != E; ++I)
354 CG->addModule(BitcodeFiles[I]->getModule());
355
356 std::string ErrMsg;
357 LTOMB = CG->compile(false, false, false, ErrMsg); // take MB ownership
358 if (!LTOMB) {
359 llvm::errs() << ErrMsg << '\n';
360 return make_error_code(LLDError::BrokenFile);
361 }
Rui Ueyama0d2e9992015-06-23 23:56:39 +0000362 auto *Obj = new ObjectFile(LTOMB->getMemBufferRef());
363 Files.emplace_back(Obj);
364 ObjectFiles.push_back(Obj);
Rui Ueyamaefba7812015-06-09 17:52:17 +0000365 if (auto EC = Obj->parse())
366 return EC;
367 return Obj;
368}
369
Rui Ueyama411c63602015-05-28 19:09:30 +0000370} // namespace coff
371} // namespace lld