blob: 095ad86764c62719432222a388af6b331c8e0969 [file] [log] [blame]
Michael J. Spencer84487f12015-07-24 21:03:07 +00001//===- SymbolTable.cpp ----------------------------------------------------===//
2//
3// The LLVM Linker
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
Rui Ueyama34f29242015-10-13 19:51:57 +00009//
// The symbol table is a bag of all known symbols. We put all symbols of
// all input files into the symbol table. The symbol table is basically
// a hash table with the logic to resolve symbol name conflicts using
// the symbol types.
14//
15//===----------------------------------------------------------------------===//
Michael J. Spencer84487f12015-07-24 21:03:07 +000016
17#include "SymbolTable.h"
Rafael Espindola4340aad2015-09-11 22:42:45 +000018#include "Config.h"
Rafael Espindola192e1fa2015-08-06 15:08:23 +000019#include "Error.h"
Michael J. Spencer84487f12015-07-24 21:03:07 +000020#include "Symbols.h"
Rafael Espindola9f77ef02016-02-12 20:54:57 +000021#include "llvm/Bitcode/ReaderWriter.h"
22#include "llvm/IR/LegacyPassManager.h"
23#include "llvm/Linker/Linker.h"
Rui Ueyamadeb15402016-01-07 17:20:07 +000024#include "llvm/Support/StringSaver.h"
Rafael Espindola9f77ef02016-02-12 20:54:57 +000025#include "llvm/Support/TargetRegistry.h"
26#include "llvm/Target/TargetMachine.h"
Michael J. Spencer84487f12015-07-24 21:03:07 +000027
28using namespace llvm;
Rafael Espindoladaa92a62015-08-31 01:16:19 +000029using namespace llvm::object;
Rafael Espindola01205f72015-09-22 18:19:46 +000030using namespace llvm::ELF;
Michael J. Spencer84487f12015-07-24 21:03:07 +000031
32using namespace lld;
Rafael Espindolae0df00b2016-02-28 00:25:54 +000033using namespace lld::elf;
Michael J. Spencer84487f12015-07-24 21:03:07 +000034
Rui Ueyamac9559d92016-01-05 20:47:37 +000035// All input object files must be for the same architecture
36// (e.g. it does not make sense to link x86 object files with
37// MIPS object files.) This function checks for that error.
Rui Ueyama16ba6692016-01-29 19:41:13 +000038template <class ELFT> static bool isCompatible(InputFile *FileP) {
Rui Ueyama25b44c92015-12-16 23:31:22 +000039 auto *F = dyn_cast<ELFFileBase<ELFT>>(FileP);
40 if (!F)
Rui Ueyama16ba6692016-01-29 19:41:13 +000041 return true;
Rui Ueyama25b44c92015-12-16 23:31:22 +000042 if (F->getELFKind() == Config->EKind && F->getEMachine() == Config->EMachine)
Rui Ueyama16ba6692016-01-29 19:41:13 +000043 return true;
Rui Ueyama25b44c92015-12-16 23:31:22 +000044 StringRef A = F->getName();
45 StringRef B = Config->Emulation;
46 if (B.empty())
47 B = Config->FirstElf->getName();
Rui Ueyama16ba6692016-01-29 19:41:13 +000048 error(A + " is incompatible with " + B);
49 return false;
Rui Ueyama25b44c92015-12-16 23:31:22 +000050}
51
Rui Ueyamac9559d92016-01-05 20:47:37 +000052// Add symbols in File to the symbol table.
Rui Ueyama25b44c92015-12-16 23:31:22 +000053template <class ELFT>
Rui Ueyama3ce825e2015-10-09 21:07:25 +000054void SymbolTable<ELFT>::addFile(std::unique_ptr<InputFile> File) {
Rafael Espindola21f7bd42015-12-23 14:35:51 +000055 InputFile *FileP = File.get();
Rui Ueyama16ba6692016-01-29 19:41:13 +000056 if (!isCompatible<ELFT>(FileP))
57 return;
Rafael Espindola525914d2015-10-11 03:36:49 +000058
Rui Ueyama89575742015-12-16 22:59:13 +000059 // .a file
60 if (auto *F = dyn_cast<ArchiveFile>(FileP)) {
Rafael Espindola21f7bd42015-12-23 14:35:51 +000061 ArchiveFiles.emplace_back(cast<ArchiveFile>(File.release()));
Rui Ueyama89575742015-12-16 22:59:13 +000062 F->parse();
63 for (Lazy &Sym : F->getLazySymbols())
Michael J. Spencer1b348a62015-09-04 22:28:10 +000064 addLazy(&Sym);
65 return;
66 }
Rui Ueyama3d451792015-10-12 18:03:21 +000067
Rui Ueyama89575742015-12-16 22:59:13 +000068 // .so file
69 if (auto *F = dyn_cast<SharedFile<ELFT>>(FileP)) {
70 // DSOs are uniquified not by filename but by soname.
71 F->parseSoName();
Rui Ueyama131e0ff2016-01-08 22:17:42 +000072 if (!SoNames.insert(F->getSoName()).second)
Rafael Espindola6a3b5de2015-10-01 19:52:48 +000073 return;
Rui Ueyama89575742015-12-16 22:59:13 +000074
Rafael Espindola21f7bd42015-12-23 14:35:51 +000075 SharedFiles.emplace_back(cast<SharedFile<ELFT>>(File.release()));
Rui Ueyama7c713312016-01-06 01:56:36 +000076 F->parseRest();
Rui Ueyama89575742015-12-16 22:59:13 +000077 for (SharedSymbol<ELFT> &B : F->getSharedSymbols())
78 resolve(&B);
79 return;
Rafael Espindola6a3b5de2015-10-01 19:52:48 +000080 }
Rui Ueyama89575742015-12-16 22:59:13 +000081
Rafael Espindola9f77ef02016-02-12 20:54:57 +000082 // LLVM bitcode file.
83 if (auto *F = dyn_cast<BitcodeFile>(FileP)) {
84 BitcodeFiles.emplace_back(cast<BitcodeFile>(File.release()));
85 F->parse();
Rafael Espindola297ce4e2016-02-26 21:31:34 +000086 for (SymbolBody *B : F->getSymbols())
Rafael Espindola9f77ef02016-02-12 20:54:57 +000087 resolve(B);
88 return;
89 }
90
Rui Ueyama89575742015-12-16 22:59:13 +000091 // .o file
92 auto *F = cast<ObjectFile<ELFT>>(FileP);
Rafael Espindola21f7bd42015-12-23 14:35:51 +000093 ObjectFiles.emplace_back(cast<ObjectFile<ELFT>>(File.release()));
Rui Ueyama52d3b672016-01-06 02:06:33 +000094 F->parse(ComdatGroups);
Rui Ueyama89575742015-12-16 22:59:13 +000095 for (SymbolBody *B : F->getSymbols())
96 resolve(B);
Michael J. Spencer84487f12015-07-24 21:03:07 +000097}
98
Rafael Espindola9f77ef02016-02-12 20:54:57 +000099// Codegen the module M and returns the resulting InputFile.
100template <class ELFT>
101std::unique_ptr<InputFile> SymbolTable<ELFT>::codegen(Module &M) {
102 StringRef TripleStr = M.getTargetTriple();
103 Triple TheTriple(TripleStr);
104
105 // FIXME: Should we have a default triple? The gold plugin uses
106 // sys::getDefaultTargetTriple(), but that is probably wrong given that this
107 // might be a cross linker.
108
109 std::string ErrMsg;
110 const Target *TheTarget = TargetRegistry::lookupTarget(TripleStr, ErrMsg);
111 if (!TheTarget)
112 fatal("Target not found: " + ErrMsg);
113
114 TargetOptions Options;
115 std::unique_ptr<TargetMachine> TM(
116 TheTarget->createTargetMachine(TripleStr, "", "", Options));
117
118 raw_svector_ostream OS(OwningLTOData);
119 legacy::PassManager CodeGenPasses;
120 if (TM->addPassesToEmitFile(CodeGenPasses, OS,
121 TargetMachine::CGFT_ObjectFile))
122 fatal("Failed to setup codegen");
123 CodeGenPasses.run(M);
124 LtoBuffer = MemoryBuffer::getMemBuffer(OwningLTOData, "", false);
125 return createObjectFile(*LtoBuffer);
126}
127
128// Merge all the bitcode files we have seen, codegen the result and return
129// the resulting ObjectFile.
130template <class ELFT>
131ObjectFile<ELFT> *SymbolTable<ELFT>::createCombinedLtoObject() {
132 LLVMContext Context;
133 Module Combined("ld-temp.o", Context);
134 Linker L(Combined);
135 for (const std::unique_ptr<BitcodeFile> &F : BitcodeFiles) {
136 std::unique_ptr<MemoryBuffer> Buffer =
137 MemoryBuffer::getMemBuffer(F->MB, false);
138 ErrorOr<std::unique_ptr<Module>> MOrErr =
139 getLazyBitcodeModule(std::move(Buffer), Context,
140 /*ShouldLazyLoadMetadata*/ true);
141 fatal(MOrErr);
142 std::unique_ptr<Module> &M = *MOrErr;
143 L.linkInModule(std::move(M));
144 }
145 std::unique_ptr<InputFile> F = codegen(Combined);
146 ObjectFiles.emplace_back(cast<ObjectFile<ELFT>>(F.release()));
147 return &*ObjectFiles.back();
148}
149
150template <class ELFT> void SymbolTable<ELFT>::addCombinedLtoObject() {
151 if (BitcodeFiles.empty())
152 return;
153 ObjectFile<ELFT> *Obj = createCombinedLtoObject();
154 // FIXME: We probably have to ignore comdats here.
155 Obj->parse(ComdatGroups);
156 for (SymbolBody *Body : Obj->getSymbols()) {
157 Symbol *Sym = insert(Body);
Rafael Espindola9f77ef02016-02-12 20:54:57 +0000158 Sym->Body = Body;
159 }
160}
161
Rui Ueyama01a65b12015-12-24 10:37:32 +0000162// Add an undefined symbol.
Rui Ueyamaff777682015-10-09 21:12:40 +0000163template <class ELFT>
164SymbolBody *SymbolTable<ELFT>::addUndefined(StringRef Name) {
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000165 auto *Sym = new (Alloc) Undefined(Name, false, STV_DEFAULT, false);
Rui Ueyamaff777682015-10-09 21:12:40 +0000166 resolve(Sym);
167 return Sym;
Rafael Espindola1d6063e2015-09-22 21:24:52 +0000168}
169
Rui Ueyama01a65b12015-12-24 10:37:32 +0000170// Add an undefined symbol. Unlike addUndefined, that symbol
171// doesn't have to be resolved, thus "opt" (optional).
Rui Ueyamaff777682015-10-09 21:12:40 +0000172template <class ELFT>
173SymbolBody *SymbolTable<ELFT>::addUndefinedOpt(StringRef Name) {
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000174 auto *Sym = new (Alloc) Undefined(Name, false, STV_HIDDEN, true);
Rui Ueyamaff777682015-10-09 21:12:40 +0000175 resolve(Sym);
176 return Sym;
Denis Protivensky22220d52015-10-05 09:43:57 +0000177}
178
Rafael Espindola0e604f92015-09-25 18:56:53 +0000179template <class ELFT>
Rui Ueyama79c73732016-01-08 21:53:28 +0000180SymbolBody *SymbolTable<ELFT>::addAbsolute(StringRef Name, Elf_Sym &ESym) {
181 // Pass nullptr because absolute symbols have no corresponding input sections.
182 auto *Sym = new (Alloc) DefinedRegular<ELFT>(Name, ESym, nullptr);
183 resolve(Sym);
184 return Sym;
Igor Kudrin15cd9ff2015-11-06 07:43:03 +0000185}
186
187template <class ELFT>
Rui Ueyama79c73732016-01-08 21:53:28 +0000188SymbolBody *SymbolTable<ELFT>::addSynthetic(StringRef Name,
George Rimaraa4dc202016-03-01 16:23:13 +0000189 OutputSectionBase<ELFT> &Sec,
190 uintX_t Val, uint8_t Visibility) {
191 auto *Sym = new (Alloc) DefinedSynthetic<ELFT>(Name, Val, Sec, Visibility);
Rui Ueyama3ce825e2015-10-09 21:07:25 +0000192 resolve(Sym);
Rui Ueyama79c73732016-01-08 21:53:28 +0000193 return Sym;
Rafael Espindola0e604f92015-09-25 18:56:53 +0000194}
195
Rui Ueyamac9559d92016-01-05 20:47:37 +0000196// Add Name as an "ignored" symbol. An ignored symbol is a regular
197// linker-synthesized defined symbol, but it is not recorded to the output
198// file's symbol table. Such symbols are useful for some linker-defined symbols.
Simon Atanasyan09dae7c2015-12-16 14:45:09 +0000199template <class ELFT>
Rui Ueyamadd7d9982015-12-16 22:31:14 +0000200SymbolBody *SymbolTable<ELFT>::addIgnored(StringRef Name) {
Rafael Espindola65e80b92016-01-19 21:19:52 +0000201 return addAbsolute(Name, ElfSym<ELFT>::Ignored);
Rafael Espindola5d413262015-10-01 21:22:26 +0000202}
203
Rui Ueyamadeb15402016-01-07 17:20:07 +0000204// Rename SYM as __wrap_SYM. The original symbol is preserved as __real_SYM.
205// Used to implement --wrap.
206template <class ELFT> void SymbolTable<ELFT>::wrap(StringRef Name) {
207 if (Symtab.count(Name) == 0)
208 return;
209 StringSaver Saver(Alloc);
210 Symbol *Sym = addUndefined(Name)->getSymbol();
211 Symbol *Real = addUndefined(Saver.save("__real_" + Name))->getSymbol();
212 Symbol *Wrap = addUndefined(Saver.save("__wrap_" + Name))->getSymbol();
213 Real->Body = Sym->Body;
214 Sym->Body = Wrap->Body;
215}
216
Rui Ueyama533336a2015-12-16 22:26:48 +0000217// Returns a file from which symbol B was created.
Rui Ueyama2a65a492016-01-05 20:01:29 +0000218// If B does not belong to any file, returns a nullptr.
Rafael Espindola18f09502016-02-26 21:49:38 +0000219template <class ELFT> InputFile *SymbolTable<ELFT>::findFile(SymbolBody *B) {
Rui Ueyama533336a2015-12-16 22:26:48 +0000220 for (const std::unique_ptr<ObjectFile<ELFT>> &F : ObjectFiles) {
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000221 ArrayRef<SymbolBody *> Syms = F->getSymbols();
222 if (std::find(Syms.begin(), Syms.end(), B) != Syms.end())
Rui Ueyama533336a2015-12-16 22:26:48 +0000223 return F.get();
Rafael Espindola1a49e582015-09-23 14:10:24 +0000224 }
Rafael Espindola18f09502016-02-26 21:49:38 +0000225 for (const std::unique_ptr<BitcodeFile> &F : BitcodeFiles) {
226 ArrayRef<SymbolBody *> Syms = F->getSymbols();
227 if (std::find(Syms.begin(), Syms.end(), B) != Syms.end())
228 return F.get();
229 }
Rui Ueyama533336a2015-12-16 22:26:48 +0000230 return nullptr;
231}
232
Rui Ueyama71c066d2016-02-02 08:22:41 +0000233// Returns "(internal)", "foo.a(bar.o)" or "baz.o".
Rafael Espindola18f09502016-02-26 21:49:38 +0000234static std::string getFilename(InputFile *F) {
Rui Ueyama71c066d2016-02-02 08:22:41 +0000235 if (!F)
236 return "(internal)";
237 if (!F->ArchiveName.empty())
238 return (F->ArchiveName + "(" + F->getName() + ")").str();
239 return F->getName();
240}
241
Rui Ueyamab4de5952016-01-08 22:01:33 +0000242// Construct a string in the form of "Sym in File1 and File2".
243// Used to construct an error message.
Rui Ueyama533336a2015-12-16 22:26:48 +0000244template <class ELFT>
245std::string SymbolTable<ELFT>::conflictMsg(SymbolBody *Old, SymbolBody *New) {
Rafael Espindola18f09502016-02-26 21:49:38 +0000246 InputFile *F1 = findFile(Old);
247 InputFile *F2 = findFile(New);
Rui Ueyamaf0904012015-12-16 22:26:45 +0000248 StringRef Sym = Old->getName();
Rui Ueyama71c066d2016-02-02 08:22:41 +0000249 return demangle(Sym) + " in " + getFilename(F1) + " and " + getFilename(F2);
Rafael Espindola1a49e582015-09-23 14:10:24 +0000250}
251
Michael J. Spencer84487f12015-07-24 21:03:07 +0000252// This function resolves conflicts if there's an existing symbol with
253// the same name. Decisions are made based on symbol type.
Rui Ueyama3ce825e2015-10-09 21:07:25 +0000254template <class ELFT> void SymbolTable<ELFT>::resolve(SymbolBody *New) {
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000255 Symbol *Sym = insert(New);
256 if (Sym->Body == New)
257 return;
258
259 SymbolBody *Existing = Sym->Body;
260
261 if (Lazy *L = dyn_cast<Lazy>(Existing)) {
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000262 if (auto *Undef = dyn_cast<Undefined>(New)) {
Rui Ueyamac5b95122015-12-16 23:23:14 +0000263 addMemberFile(Undef, L);
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000264 return;
265 }
Rui Ueyamac5b95122015-12-16 23:23:14 +0000266 // Found a definition for something also in an archive.
267 // Ignore the archive definition.
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000268 Sym->Body = New;
269 return;
270 }
271
Rafael Espindola5e8b54a2016-02-22 23:16:05 +0000272 if (New->IsTls != Existing->IsTls) {
Rui Ueyama16ba6692016-01-29 19:41:13 +0000273 error("TLS attribute mismatch for symbol: " + conflictMsg(Existing, New));
274 return;
275 }
Igor Kudrin65bddea2015-10-09 09:58:39 +0000276
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000277 // compare() returns -1, 0, or 1 if the lhs symbol is less preferable,
278 // equivalent (conflicting), or more preferable, respectively.
Rui Ueyama2e0a9ff2016-01-06 00:09:39 +0000279 int Comp = Existing->compare<ELFT>(New);
280 if (Comp == 0) {
Rui Ueyamaf0904012015-12-16 22:26:45 +0000281 std::string S = "duplicate symbol: " + conflictMsg(Existing, New);
Rui Ueyama16ba6692016-01-29 19:41:13 +0000282 if (Config->AllowMultipleDefinition)
283 warning(S);
284 else
285 error(S);
Rui Ueyamaf0904012015-12-16 22:26:45 +0000286 return;
287 }
Rui Ueyama2e0a9ff2016-01-06 00:09:39 +0000288 if (Comp < 0)
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000289 Sym->Body = New;
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000290}
291
Rui Ueyamab4de5952016-01-08 22:01:33 +0000292// Find an existing symbol or create and insert a new one.
Rui Ueyama3ce825e2015-10-09 21:07:25 +0000293template <class ELFT> Symbol *SymbolTable<ELFT>::insert(SymbolBody *New) {
Michael J. Spencer84487f12015-07-24 21:03:07 +0000294 StringRef Name = New->getName();
295 Symbol *&Sym = Symtab[Name];
Rui Ueyama38dcc9e2015-12-16 23:25:31 +0000296 if (!Sym)
Rui Ueyama3554f592015-12-17 00:01:25 +0000297 Sym = new (Alloc) Symbol{New};
Michael J. Spencer84487f12015-07-24 21:03:07 +0000298 New->setBackref(Sym);
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000299 return Sym;
300}
Michael J. Spencer84487f12015-07-24 21:03:07 +0000301
Rui Ueyamaf8432d92015-10-13 16:34:14 +0000302template <class ELFT> SymbolBody *SymbolTable<ELFT>::find(StringRef Name) {
303 auto It = Symtab.find(Name);
304 if (It == Symtab.end())
305 return nullptr;
306 return It->second->Body;
307}
308
Rui Ueyamac5b95122015-12-16 23:23:14 +0000309template <class ELFT> void SymbolTable<ELFT>::addLazy(Lazy *L) {
310 Symbol *Sym = insert(L);
311 if (Sym->Body == L)
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000312 return;
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000313 if (auto *Undef = dyn_cast<Undefined>(Sym->Body)) {
Rui Ueyamac5b95122015-12-16 23:23:14 +0000314 Sym->Body = L;
315 addMemberFile(Undef, L);
Rafael Espindola8614c562015-10-06 14:33:58 +0000316 }
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000317}
318
Rui Ueyama3d451792015-10-12 18:03:21 +0000319template <class ELFT>
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000320void SymbolTable<ELFT>::addMemberFile(Undefined *Undef, Lazy *L) {
Rui Ueyamac5b95122015-12-16 23:23:14 +0000321 // Weak undefined symbols should not fetch members from archives.
322 // If we were to keep old symbol we would not know that an archive member was
323 // available if a strong undefined symbol shows up afterwards in the link.
324 // If a strong undefined symbol never shows up, this lazy symbol will
325 // get to the end of the link and must be treated as the weak undefined one.
326 // We set UsedInRegularObj in a similar way to what is done with shared
Rafael Espindola8176d572016-02-22 23:19:29 +0000327 // symbols and copy information to reduce how many special cases are needed.
Rui Ueyamac5b95122015-12-16 23:23:14 +0000328 if (Undef->isWeak()) {
329 L->setUsedInRegularObj();
330 L->setWeak();
Rafael Espindola8176d572016-02-22 23:19:29 +0000331
332 // FIXME: Do we need to copy more?
333 L->IsTls = Undef->IsTls;
Rui Ueyamac5b95122015-12-16 23:23:14 +0000334 return;
335 }
336
337 // Fetch a member file that has the definition for L.
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000338 // getMember returns nullptr if the member was already read from the library.
Rui Ueyamac5b95122015-12-16 23:23:14 +0000339 if (std::unique_ptr<InputFile> File = L->getMember())
Rui Ueyama690db672015-10-14 22:32:10 +0000340 addFile(std::move(File));
Michael J. Spencer84487f12015-07-24 21:03:07 +0000341}
Rafael Espindola0e604f92015-09-25 18:56:53 +0000342
Rui Ueyama93bfee52015-10-13 18:10:33 +0000343// This function takes care of the case in which shared libraries depend on
344// the user program (not the other way, which is usual). Shared libraries
345// may have undefined symbols, expecting that the user program provides
346// the definitions for them. An example is BSD's __progname symbol.
347// We need to put such symbols to the main program's .dynsym so that
348// shared libraries can find them.
349// Except this, we ignore undefined symbols in DSOs.
350template <class ELFT> void SymbolTable<ELFT>::scanShlibUndefined() {
Rui Ueyamaf8432d92015-10-13 16:34:14 +0000351 for (std::unique_ptr<SharedFile<ELFT>> &File : SharedFiles)
352 for (StringRef U : File->getUndefinedSymbols())
353 if (SymbolBody *Sym = find(U))
354 if (Sym->isDefined())
Rafael Espindolaabebed92016-02-05 15:27:15 +0000355 Sym->MustBeInDynSym = true;
Rui Ueyamaf8432d92015-10-13 16:34:14 +0000356}
357
Rafael Espindolae0df00b2016-02-28 00:25:54 +0000358template class elf::SymbolTable<ELF32LE>;
359template class elf::SymbolTable<ELF32BE>;
360template class elf::SymbolTable<ELF64LE>;
361template class elf::SymbolTable<ELF64BE>;