blob: 8857d654aa9f566e07cb371e64524796405eb7c3 [file] [log] [blame]
Michael J. Spencer84487f12015-07-24 21:03:07 +00001//===- SymbolTable.cpp ----------------------------------------------------===//
2//
3// The LLVM Linker
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
Rui Ueyama34f29242015-10-13 19:51:57 +00009//
// The symbol table is a bag of all known symbols. All symbols from all
// input files are put into the symbol table. The symbol table is basically
// a hash table with the logic to resolve symbol name conflicts using
// the symbol types.
14//
15//===----------------------------------------------------------------------===//
Michael J. Spencer84487f12015-07-24 21:03:07 +000016
17#include "SymbolTable.h"
Rafael Espindola4340aad2015-09-11 22:42:45 +000018#include "Config.h"
Rafael Espindola192e1fa2015-08-06 15:08:23 +000019#include "Error.h"
Michael J. Spencer84487f12015-07-24 21:03:07 +000020#include "Symbols.h"
Rafael Espindola9f77ef02016-02-12 20:54:57 +000021#include "llvm/Bitcode/ReaderWriter.h"
22#include "llvm/IR/LegacyPassManager.h"
23#include "llvm/Linker/Linker.h"
Rui Ueyamadeb15402016-01-07 17:20:07 +000024#include "llvm/Support/StringSaver.h"
Rafael Espindola9f77ef02016-02-12 20:54:57 +000025#include "llvm/Support/TargetRegistry.h"
26#include "llvm/Target/TargetMachine.h"
Michael J. Spencer84487f12015-07-24 21:03:07 +000027
28using namespace llvm;
Rafael Espindoladaa92a62015-08-31 01:16:19 +000029using namespace llvm::object;
Rafael Espindola01205f72015-09-22 18:19:46 +000030using namespace llvm::ELF;
Michael J. Spencer84487f12015-07-24 21:03:07 +000031
32using namespace lld;
Rafael Espindolae0df00b2016-02-28 00:25:54 +000033using namespace lld::elf;
Michael J. Spencer84487f12015-07-24 21:03:07 +000034
Rui Ueyamac9559d92016-01-05 20:47:37 +000035// All input object files must be for the same architecture
36// (e.g. it does not make sense to link x86 object files with
37// MIPS object files.) This function checks for that error.
Rui Ueyama16ba6692016-01-29 19:41:13 +000038template <class ELFT> static bool isCompatible(InputFile *FileP) {
Rui Ueyama25b44c92015-12-16 23:31:22 +000039 auto *F = dyn_cast<ELFFileBase<ELFT>>(FileP);
40 if (!F)
Rui Ueyama16ba6692016-01-29 19:41:13 +000041 return true;
Rui Ueyama25b44c92015-12-16 23:31:22 +000042 if (F->getELFKind() == Config->EKind && F->getEMachine() == Config->EMachine)
Rui Ueyama16ba6692016-01-29 19:41:13 +000043 return true;
Rui Ueyama25b44c92015-12-16 23:31:22 +000044 StringRef A = F->getName();
45 StringRef B = Config->Emulation;
46 if (B.empty())
47 B = Config->FirstElf->getName();
Rui Ueyama16ba6692016-01-29 19:41:13 +000048 error(A + " is incompatible with " + B);
49 return false;
Rui Ueyama25b44c92015-12-16 23:31:22 +000050}
51
Rui Ueyamac9559d92016-01-05 20:47:37 +000052// Add symbols in File to the symbol table.
Rui Ueyama25b44c92015-12-16 23:31:22 +000053template <class ELFT>
Rui Ueyama3ce825e2015-10-09 21:07:25 +000054void SymbolTable<ELFT>::addFile(std::unique_ptr<InputFile> File) {
Rafael Espindola21f7bd42015-12-23 14:35:51 +000055 InputFile *FileP = File.get();
Rui Ueyama16ba6692016-01-29 19:41:13 +000056 if (!isCompatible<ELFT>(FileP))
57 return;
Rafael Espindola525914d2015-10-11 03:36:49 +000058
Rui Ueyama89575742015-12-16 22:59:13 +000059 // .a file
60 if (auto *F = dyn_cast<ArchiveFile>(FileP)) {
Rafael Espindola21f7bd42015-12-23 14:35:51 +000061 ArchiveFiles.emplace_back(cast<ArchiveFile>(File.release()));
Rui Ueyama89575742015-12-16 22:59:13 +000062 F->parse();
63 for (Lazy &Sym : F->getLazySymbols())
Michael J. Spencer1b348a62015-09-04 22:28:10 +000064 addLazy(&Sym);
65 return;
66 }
Rui Ueyama3d451792015-10-12 18:03:21 +000067
Rui Ueyama89575742015-12-16 22:59:13 +000068 // .so file
69 if (auto *F = dyn_cast<SharedFile<ELFT>>(FileP)) {
70 // DSOs are uniquified not by filename but by soname.
71 F->parseSoName();
Rui Ueyama131e0ff2016-01-08 22:17:42 +000072 if (!SoNames.insert(F->getSoName()).second)
Rafael Espindola6a3b5de2015-10-01 19:52:48 +000073 return;
Rui Ueyama89575742015-12-16 22:59:13 +000074
Rafael Espindola21f7bd42015-12-23 14:35:51 +000075 SharedFiles.emplace_back(cast<SharedFile<ELFT>>(File.release()));
Rui Ueyama7c713312016-01-06 01:56:36 +000076 F->parseRest();
Rui Ueyama89575742015-12-16 22:59:13 +000077 for (SharedSymbol<ELFT> &B : F->getSharedSymbols())
78 resolve(&B);
79 return;
Rafael Espindola6a3b5de2015-10-01 19:52:48 +000080 }
Rui Ueyama89575742015-12-16 22:59:13 +000081
Rafael Espindola9f77ef02016-02-12 20:54:57 +000082 // LLVM bitcode file.
83 if (auto *F = dyn_cast<BitcodeFile>(FileP)) {
84 BitcodeFiles.emplace_back(cast<BitcodeFile>(File.release()));
85 F->parse();
Rafael Espindola297ce4e2016-02-26 21:31:34 +000086 for (SymbolBody *B : F->getSymbols())
Rafael Espindola9f77ef02016-02-12 20:54:57 +000087 resolve(B);
88 return;
89 }
90
Rui Ueyama89575742015-12-16 22:59:13 +000091 // .o file
92 auto *F = cast<ObjectFile<ELFT>>(FileP);
Rafael Espindola21f7bd42015-12-23 14:35:51 +000093 ObjectFiles.emplace_back(cast<ObjectFile<ELFT>>(File.release()));
Rui Ueyama52d3b672016-01-06 02:06:33 +000094 F->parse(ComdatGroups);
Rui Ueyama89575742015-12-16 22:59:13 +000095 for (SymbolBody *B : F->getSymbols())
96 resolve(B);
Michael J. Spencer84487f12015-07-24 21:03:07 +000097}
98
Rafael Espindola9f77ef02016-02-12 20:54:57 +000099// Codegen the module M and returns the resulting InputFile.
100template <class ELFT>
101std::unique_ptr<InputFile> SymbolTable<ELFT>::codegen(Module &M) {
102 StringRef TripleStr = M.getTargetTriple();
103 Triple TheTriple(TripleStr);
104
105 // FIXME: Should we have a default triple? The gold plugin uses
106 // sys::getDefaultTargetTriple(), but that is probably wrong given that this
107 // might be a cross linker.
108
109 std::string ErrMsg;
110 const Target *TheTarget = TargetRegistry::lookupTarget(TripleStr, ErrMsg);
111 if (!TheTarget)
112 fatal("Target not found: " + ErrMsg);
113
114 TargetOptions Options;
115 std::unique_ptr<TargetMachine> TM(
116 TheTarget->createTargetMachine(TripleStr, "", "", Options));
117
118 raw_svector_ostream OS(OwningLTOData);
119 legacy::PassManager CodeGenPasses;
120 if (TM->addPassesToEmitFile(CodeGenPasses, OS,
121 TargetMachine::CGFT_ObjectFile))
122 fatal("Failed to setup codegen");
123 CodeGenPasses.run(M);
124 LtoBuffer = MemoryBuffer::getMemBuffer(OwningLTOData, "", false);
125 return createObjectFile(*LtoBuffer);
126}
127
128// Merge all the bitcode files we have seen, codegen the result and return
129// the resulting ObjectFile.
130template <class ELFT>
131ObjectFile<ELFT> *SymbolTable<ELFT>::createCombinedLtoObject() {
132 LLVMContext Context;
133 Module Combined("ld-temp.o", Context);
134 Linker L(Combined);
135 for (const std::unique_ptr<BitcodeFile> &F : BitcodeFiles) {
136 std::unique_ptr<MemoryBuffer> Buffer =
137 MemoryBuffer::getMemBuffer(F->MB, false);
138 ErrorOr<std::unique_ptr<Module>> MOrErr =
139 getLazyBitcodeModule(std::move(Buffer), Context,
140 /*ShouldLazyLoadMetadata*/ true);
141 fatal(MOrErr);
142 std::unique_ptr<Module> &M = *MOrErr;
143 L.linkInModule(std::move(M));
144 }
145 std::unique_ptr<InputFile> F = codegen(Combined);
146 ObjectFiles.emplace_back(cast<ObjectFile<ELFT>>(F.release()));
147 return &*ObjectFiles.back();
148}
149
150template <class ELFT> void SymbolTable<ELFT>::addCombinedLtoObject() {
151 if (BitcodeFiles.empty())
152 return;
153 ObjectFile<ELFT> *Obj = createCombinedLtoObject();
154 // FIXME: We probably have to ignore comdats here.
155 Obj->parse(ComdatGroups);
156 for (SymbolBody *Body : Obj->getSymbols()) {
157 Symbol *Sym = insert(Body);
158 assert(isa<DefinedBitcode>(Sym->Body));
159 Sym->Body = Body;
160 }
161}
162
Rui Ueyama01a65b12015-12-24 10:37:32 +0000163// Add an undefined symbol.
Rui Ueyamaff777682015-10-09 21:12:40 +0000164template <class ELFT>
165SymbolBody *SymbolTable<ELFT>::addUndefined(StringRef Name) {
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000166 auto *Sym = new (Alloc) Undefined(Name, false, STV_DEFAULT, false);
Rui Ueyamaff777682015-10-09 21:12:40 +0000167 resolve(Sym);
168 return Sym;
Rafael Espindola1d6063e2015-09-22 21:24:52 +0000169}
170
Rui Ueyama01a65b12015-12-24 10:37:32 +0000171// Add an undefined symbol. Unlike addUndefined, that symbol
172// doesn't have to be resolved, thus "opt" (optional).
Rui Ueyamaff777682015-10-09 21:12:40 +0000173template <class ELFT>
174SymbolBody *SymbolTable<ELFT>::addUndefinedOpt(StringRef Name) {
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000175 auto *Sym = new (Alloc) Undefined(Name, false, STV_HIDDEN, true);
Rui Ueyamaff777682015-10-09 21:12:40 +0000176 resolve(Sym);
177 return Sym;
Denis Protivensky22220d52015-10-05 09:43:57 +0000178}
179
Rafael Espindola0e604f92015-09-25 18:56:53 +0000180template <class ELFT>
Rui Ueyama79c73732016-01-08 21:53:28 +0000181SymbolBody *SymbolTable<ELFT>::addAbsolute(StringRef Name, Elf_Sym &ESym) {
182 // Pass nullptr because absolute symbols have no corresponding input sections.
183 auto *Sym = new (Alloc) DefinedRegular<ELFT>(Name, ESym, nullptr);
184 resolve(Sym);
185 return Sym;
Igor Kudrin15cd9ff2015-11-06 07:43:03 +0000186}
187
188template <class ELFT>
Rui Ueyama79c73732016-01-08 21:53:28 +0000189SymbolBody *SymbolTable<ELFT>::addSynthetic(StringRef Name,
190 OutputSectionBase<ELFT> &Section,
191 uintX_t Value) {
Rafael Espindola4d4b06a2015-12-24 00:47:42 +0000192 auto *Sym = new (Alloc) DefinedSynthetic<ELFT>(Name, Value, Section);
Rui Ueyama3ce825e2015-10-09 21:07:25 +0000193 resolve(Sym);
Rui Ueyama79c73732016-01-08 21:53:28 +0000194 return Sym;
Rafael Espindola0e604f92015-09-25 18:56:53 +0000195}
196
Rui Ueyamac9559d92016-01-05 20:47:37 +0000197// Add Name as an "ignored" symbol. An ignored symbol is a regular
198// linker-synthesized defined symbol, but it is not recorded to the output
199// file's symbol table. Such symbols are useful for some linker-defined symbols.
Simon Atanasyan09dae7c2015-12-16 14:45:09 +0000200template <class ELFT>
Rui Ueyamadd7d9982015-12-16 22:31:14 +0000201SymbolBody *SymbolTable<ELFT>::addIgnored(StringRef Name) {
Rafael Espindola65e80b92016-01-19 21:19:52 +0000202 return addAbsolute(Name, ElfSym<ELFT>::Ignored);
Rafael Espindola5d413262015-10-01 21:22:26 +0000203}
204
Rui Ueyamadeb15402016-01-07 17:20:07 +0000205// Rename SYM as __wrap_SYM. The original symbol is preserved as __real_SYM.
206// Used to implement --wrap.
207template <class ELFT> void SymbolTable<ELFT>::wrap(StringRef Name) {
208 if (Symtab.count(Name) == 0)
209 return;
210 StringSaver Saver(Alloc);
211 Symbol *Sym = addUndefined(Name)->getSymbol();
212 Symbol *Real = addUndefined(Saver.save("__real_" + Name))->getSymbol();
213 Symbol *Wrap = addUndefined(Saver.save("__wrap_" + Name))->getSymbol();
214 Real->Body = Sym->Body;
215 Sym->Body = Wrap->Body;
216}
217
Rui Ueyama533336a2015-12-16 22:26:48 +0000218// Returns a file from which symbol B was created.
Rui Ueyama2a65a492016-01-05 20:01:29 +0000219// If B does not belong to any file, returns a nullptr.
Rafael Espindola18f09502016-02-26 21:49:38 +0000220template <class ELFT> InputFile *SymbolTable<ELFT>::findFile(SymbolBody *B) {
Rui Ueyama533336a2015-12-16 22:26:48 +0000221 for (const std::unique_ptr<ObjectFile<ELFT>> &F : ObjectFiles) {
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000222 ArrayRef<SymbolBody *> Syms = F->getSymbols();
223 if (std::find(Syms.begin(), Syms.end(), B) != Syms.end())
Rui Ueyama533336a2015-12-16 22:26:48 +0000224 return F.get();
Rafael Espindola1a49e582015-09-23 14:10:24 +0000225 }
Rafael Espindola18f09502016-02-26 21:49:38 +0000226 for (const std::unique_ptr<BitcodeFile> &F : BitcodeFiles) {
227 ArrayRef<SymbolBody *> Syms = F->getSymbols();
228 if (std::find(Syms.begin(), Syms.end(), B) != Syms.end())
229 return F.get();
230 }
Rui Ueyama533336a2015-12-16 22:26:48 +0000231 return nullptr;
232}
233
Rui Ueyama71c066d2016-02-02 08:22:41 +0000234// Returns "(internal)", "foo.a(bar.o)" or "baz.o".
Rafael Espindola18f09502016-02-26 21:49:38 +0000235static std::string getFilename(InputFile *F) {
Rui Ueyama71c066d2016-02-02 08:22:41 +0000236 if (!F)
237 return "(internal)";
238 if (!F->ArchiveName.empty())
239 return (F->ArchiveName + "(" + F->getName() + ")").str();
240 return F->getName();
241}
242
Rui Ueyamab4de5952016-01-08 22:01:33 +0000243// Construct a string in the form of "Sym in File1 and File2".
244// Used to construct an error message.
Rui Ueyama533336a2015-12-16 22:26:48 +0000245template <class ELFT>
246std::string SymbolTable<ELFT>::conflictMsg(SymbolBody *Old, SymbolBody *New) {
Rafael Espindola18f09502016-02-26 21:49:38 +0000247 InputFile *F1 = findFile(Old);
248 InputFile *F2 = findFile(New);
Rui Ueyamaf0904012015-12-16 22:26:45 +0000249 StringRef Sym = Old->getName();
Rui Ueyama71c066d2016-02-02 08:22:41 +0000250 return demangle(Sym) + " in " + getFilename(F1) + " and " + getFilename(F2);
Rafael Espindola1a49e582015-09-23 14:10:24 +0000251}
252
Michael J. Spencer84487f12015-07-24 21:03:07 +0000253// This function resolves conflicts if there's an existing symbol with
254// the same name. Decisions are made based on symbol type.
Rui Ueyama3ce825e2015-10-09 21:07:25 +0000255template <class ELFT> void SymbolTable<ELFT>::resolve(SymbolBody *New) {
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000256 Symbol *Sym = insert(New);
257 if (Sym->Body == New)
258 return;
259
260 SymbolBody *Existing = Sym->Body;
261
262 if (Lazy *L = dyn_cast<Lazy>(Existing)) {
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000263 if (auto *Undef = dyn_cast<Undefined>(New)) {
Rui Ueyamac5b95122015-12-16 23:23:14 +0000264 addMemberFile(Undef, L);
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000265 return;
266 }
Rui Ueyamac5b95122015-12-16 23:23:14 +0000267 // Found a definition for something also in an archive.
268 // Ignore the archive definition.
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000269 Sym->Body = New;
270 return;
271 }
272
Rafael Espindola5e8b54a2016-02-22 23:16:05 +0000273 if (New->IsTls != Existing->IsTls) {
Rui Ueyama16ba6692016-01-29 19:41:13 +0000274 error("TLS attribute mismatch for symbol: " + conflictMsg(Existing, New));
275 return;
276 }
Igor Kudrin65bddea2015-10-09 09:58:39 +0000277
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000278 // compare() returns -1, 0, or 1 if the lhs symbol is less preferable,
279 // equivalent (conflicting), or more preferable, respectively.
Rui Ueyama2e0a9ff2016-01-06 00:09:39 +0000280 int Comp = Existing->compare<ELFT>(New);
281 if (Comp == 0) {
Rui Ueyamaf0904012015-12-16 22:26:45 +0000282 std::string S = "duplicate symbol: " + conflictMsg(Existing, New);
Rui Ueyama16ba6692016-01-29 19:41:13 +0000283 if (Config->AllowMultipleDefinition)
284 warning(S);
285 else
286 error(S);
Rui Ueyamaf0904012015-12-16 22:26:45 +0000287 return;
288 }
Rui Ueyama2e0a9ff2016-01-06 00:09:39 +0000289 if (Comp < 0)
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000290 Sym->Body = New;
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000291}
292
Rui Ueyamab4de5952016-01-08 22:01:33 +0000293// Find an existing symbol or create and insert a new one.
Rui Ueyama3ce825e2015-10-09 21:07:25 +0000294template <class ELFT> Symbol *SymbolTable<ELFT>::insert(SymbolBody *New) {
Michael J. Spencer84487f12015-07-24 21:03:07 +0000295 StringRef Name = New->getName();
296 Symbol *&Sym = Symtab[Name];
Rui Ueyama38dcc9e2015-12-16 23:25:31 +0000297 if (!Sym)
Rui Ueyama3554f592015-12-17 00:01:25 +0000298 Sym = new (Alloc) Symbol{New};
Michael J. Spencer84487f12015-07-24 21:03:07 +0000299 New->setBackref(Sym);
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000300 return Sym;
301}
Michael J. Spencer84487f12015-07-24 21:03:07 +0000302
Rui Ueyamaf8432d92015-10-13 16:34:14 +0000303template <class ELFT> SymbolBody *SymbolTable<ELFT>::find(StringRef Name) {
304 auto It = Symtab.find(Name);
305 if (It == Symtab.end())
306 return nullptr;
307 return It->second->Body;
308}
309
Rui Ueyamac5b95122015-12-16 23:23:14 +0000310template <class ELFT> void SymbolTable<ELFT>::addLazy(Lazy *L) {
311 Symbol *Sym = insert(L);
312 if (Sym->Body == L)
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000313 return;
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000314 if (auto *Undef = dyn_cast<Undefined>(Sym->Body)) {
Rui Ueyamac5b95122015-12-16 23:23:14 +0000315 Sym->Body = L;
316 addMemberFile(Undef, L);
Rafael Espindola8614c562015-10-06 14:33:58 +0000317 }
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000318}
319
Rui Ueyama3d451792015-10-12 18:03:21 +0000320template <class ELFT>
Rafael Espindola5d7593b2015-12-22 23:00:50 +0000321void SymbolTable<ELFT>::addMemberFile(Undefined *Undef, Lazy *L) {
Rui Ueyamac5b95122015-12-16 23:23:14 +0000322 // Weak undefined symbols should not fetch members from archives.
323 // If we were to keep old symbol we would not know that an archive member was
324 // available if a strong undefined symbol shows up afterwards in the link.
325 // If a strong undefined symbol never shows up, this lazy symbol will
326 // get to the end of the link and must be treated as the weak undefined one.
327 // We set UsedInRegularObj in a similar way to what is done with shared
Rafael Espindola8176d572016-02-22 23:19:29 +0000328 // symbols and copy information to reduce how many special cases are needed.
Rui Ueyamac5b95122015-12-16 23:23:14 +0000329 if (Undef->isWeak()) {
330 L->setUsedInRegularObj();
331 L->setWeak();
Rafael Espindola8176d572016-02-22 23:19:29 +0000332
333 // FIXME: Do we need to copy more?
334 L->IsTls = Undef->IsTls;
Rui Ueyamac5b95122015-12-16 23:23:14 +0000335 return;
336 }
337
338 // Fetch a member file that has the definition for L.
Michael J. Spencer1b348a62015-09-04 22:28:10 +0000339 // getMember returns nullptr if the member was already read from the library.
Rui Ueyamac5b95122015-12-16 23:23:14 +0000340 if (std::unique_ptr<InputFile> File = L->getMember())
Rui Ueyama690db672015-10-14 22:32:10 +0000341 addFile(std::move(File));
Michael J. Spencer84487f12015-07-24 21:03:07 +0000342}
Rafael Espindola0e604f92015-09-25 18:56:53 +0000343
Rui Ueyama93bfee52015-10-13 18:10:33 +0000344// This function takes care of the case in which shared libraries depend on
345// the user program (not the other way, which is usual). Shared libraries
346// may have undefined symbols, expecting that the user program provides
347// the definitions for them. An example is BSD's __progname symbol.
348// We need to put such symbols to the main program's .dynsym so that
349// shared libraries can find them.
350// Except this, we ignore undefined symbols in DSOs.
351template <class ELFT> void SymbolTable<ELFT>::scanShlibUndefined() {
Rui Ueyamaf8432d92015-10-13 16:34:14 +0000352 for (std::unique_ptr<SharedFile<ELFT>> &File : SharedFiles)
353 for (StringRef U : File->getUndefinedSymbols())
354 if (SymbolBody *Sym = find(U))
355 if (Sym->isDefined())
Rafael Espindolaabebed92016-02-05 15:27:15 +0000356 Sym->MustBeInDynSym = true;
Rui Ueyamaf8432d92015-10-13 16:34:14 +0000357}
358
Rafael Espindolae0df00b2016-02-28 00:25:54 +0000359template class elf::SymbolTable<ELF32LE>;
360template class elf::SymbolTable<ELF32BE>;
361template class elf::SymbolTable<ELF64LE>;
362template class elf::SymbolTable<ELF64BE>;