blob: 9c967ffa81d217484f3af5f07f021bf1e685e1b2 [file] [log] [blame]
Sam Cleggc94d3932017-11-17 18:14:09 +00001//===- SymbolTable.cpp ----------------------------------------------------===//
2//
3// The LLVM Linker
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#include "SymbolTable.h"
Sam Cleggc94d3932017-11-17 18:14:09 +000011#include "Config.h"
Sam Clegg5fa274b2018-01-10 01:13:34 +000012#include "InputChunks.h"
Sam Clegg93102972018-02-23 05:08:53 +000013#include "InputGlobal.h"
Sam Cleggb8621592017-11-30 01:40:08 +000014#include "WriterUtils.h"
Sam Cleggc94d3932017-11-17 18:14:09 +000015#include "lld/Common/ErrorHandler.h"
Rui Ueyama2017d522017-11-28 20:39:17 +000016#include "lld/Common/Memory.h"
Rui Ueyama7d67dd12018-02-13 22:30:52 +000017#include "llvm/ADT/SetVector.h"
Sam Cleggc94d3932017-11-17 18:14:09 +000018
19#define DEBUG_TYPE "lld"
20
21using namespace llvm;
Sam Clegg20db3812018-01-10 00:52:20 +000022using namespace llvm::wasm;
Sam Clegg45218f42018-11-27 01:08:16 +000023using namespace llvm::object;
Sam Cleggc94d3932017-11-17 18:14:09 +000024using namespace lld;
25using namespace lld::wasm;
26
27SymbolTable *lld::wasm::Symtab;
28
29void SymbolTable::addFile(InputFile *File) {
30 log("Processing: " + toString(File));
31 File->parse();
32
Sam Cleggc729c1b2018-05-30 18:07:52 +000033 // LLVM bitcode file
34 if (auto *F = dyn_cast<BitcodeFile>(File))
35 BitcodeFiles.push_back(F);
36 else if (auto *F = dyn_cast<ObjFile>(File))
Sam Cleggc94d3932017-11-17 18:14:09 +000037 ObjectFiles.push_back(F);
38}
39
Sam Cleggc729c1b2018-05-30 18:07:52 +000040// This function is where all the optimizations of link-time
41// optimization happens. When LTO is in use, some input files are
42// not in native object file format but in the LLVM bitcode format.
43// This function compiles bitcode files into a few big native files
44// using LLVM functions and replaces bitcode symbols with the results.
45// Because all bitcode files that the program consists of are passed
46// to the compiler at once, it can do whole-program optimization.
47void SymbolTable::addCombinedLTOObject() {
48 if (BitcodeFiles.empty())
49 return;
50
51 // Compile bitcode files and replace bitcode symbols.
52 LTO.reset(new BitcodeCompiler);
53 for (BitcodeFile *F : BitcodeFiles)
54 LTO->add(*F);
55
56 for (StringRef Filename : LTO->compile()) {
57 auto *Obj = make<ObjFile>(MemoryBufferRef(Filename, "lto.tmp"));
58 Obj->parse();
59 ObjectFiles.push_back(Obj);
60 }
61}
62
Sam Cleggc94d3932017-11-17 18:14:09 +000063void SymbolTable::reportRemainingUndefines() {
Sam Clegg74fe0ba2017-12-07 01:51:24 +000064 for (Symbol *Sym : SymVector) {
Sam Cleggc729c1b2018-05-30 18:07:52 +000065 if (!Sym->isUndefined() || Sym->isWeak())
66 continue;
67 if (Config->AllowUndefinedSymbols.count(Sym->getName()) != 0)
68 continue;
69 if (!Sym->IsUsedInRegularObj)
70 continue;
Sam Clegg47e2b6b2018-08-04 00:04:06 +000071 error(toString(Sym->getFile()) + ": undefined symbol: " + toString(*Sym));
Sam Cleggc94d3932017-11-17 18:14:09 +000072 }
Sam Cleggc94d3932017-11-17 18:14:09 +000073}
74
75Symbol *SymbolTable::find(StringRef Name) {
Rui Ueyama67d69082018-02-28 23:03:06 +000076 return SymMap.lookup(CachedHashStringRef(Name));
Sam Cleggc94d3932017-11-17 18:14:09 +000077}
78
Sam Clegg4c2cbfe2018-08-02 20:39:19 +000079std::pair<Symbol *, bool> SymbolTable::insert(StringRef Name, InputFile *File) {
80 bool Inserted = false;
Sam Clegga80d94d2017-11-27 23:16:06 +000081 Symbol *&Sym = SymMap[CachedHashStringRef(Name)];
Sam Clegg4c2cbfe2018-08-02 20:39:19 +000082 if (!Sym) {
83 Sym = reinterpret_cast<Symbol *>(make<SymbolUnion>());
84 Sym->IsUsedInRegularObj = false;
85 SymVector.emplace_back(Sym);
86 Inserted = true;
87 }
88 if (!File || File->kind() == InputFile::ObjectKind)
89 Sym->IsUsedInRegularObj = true;
90 return {Sym, Inserted};
Sam Cleggc94d3932017-11-17 18:14:09 +000091}
92
Rui Ueyamae3498ec2018-02-28 00:09:22 +000093static void reportTypeError(const Symbol *Existing, const InputFile *File,
Sam Clegg3876d89a2018-05-14 22:42:33 +000094 llvm::wasm::WasmSymbolType Type) {
Rui Ueyamae3498ec2018-02-28 00:09:22 +000095 error("symbol type mismatch: " + toString(*Existing) + "\n>>> defined as " +
96 toString(Existing->getWasmType()) + " in " +
Sam Clegg3876d89a2018-05-14 22:42:33 +000097 toString(Existing->getFile()) + "\n>>> defined as " + toString(Type) +
98 " in " + toString(File));
Rui Ueyamae3498ec2018-02-28 00:09:22 +000099}
100
Heejin Ahn6f4286f2018-11-19 23:31:28 +0000101// Check the type of new symbol matches that of the symbol is replacing.
102// For functions this can also involve verifying that the signatures match.
Sam Cleggcefbf9a2018-06-28 16:53:53 +0000103static void checkFunctionType(Symbol *Existing, const InputFile *File,
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000104 const WasmSignature *NewSig) {
Sam Clegg65d63802018-05-14 23:01:16 +0000105 auto ExistingFunction = dyn_cast<FunctionSymbol>(Existing);
106 if (!ExistingFunction) {
Sam Clegg3876d89a2018-05-14 22:42:33 +0000107 reportTypeError(Existing, File, WASM_SYMBOL_TYPE_FUNCTION);
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000108 return;
109 }
110
Sam Cleggcefbf9a2018-06-28 16:53:53 +0000111 if (!NewSig)
112 return;
113
114 const WasmSignature *OldSig = ExistingFunction->FunctionType;
115 if (!OldSig) {
116 ExistingFunction->FunctionType = NewSig;
117 return;
118 }
119
120 if (*NewSig != *OldSig)
Sam Cleggffd0aaf2018-06-22 15:13:10 +0000121 warn("function signature mismatch: " + Existing->getName() +
122 "\n>>> defined as " + toString(*OldSig) + " in " +
123 toString(Existing->getFile()) + "\n>>> defined as " +
124 toString(*NewSig) + " in " + toString(File));
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000125}
126
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000127static void checkGlobalType(const Symbol *Existing, const InputFile *File,
128 const WasmGlobalType *NewType) {
129 if (!isa<GlobalSymbol>(Existing)) {
Sam Clegg3876d89a2018-05-14 22:42:33 +0000130 reportTypeError(Existing, File, WASM_SYMBOL_TYPE_GLOBAL);
Sam Cleggb8621592017-11-30 01:40:08 +0000131 return;
132 }
133
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000134 const WasmGlobalType *OldType = cast<GlobalSymbol>(Existing)->getGlobalType();
135 if (*NewType != *OldType) {
136 error("Global type mismatch: " + Existing->getName() + "\n>>> defined as " +
137 toString(*OldType) + " in " + toString(Existing->getFile()) +
138 "\n>>> defined as " + toString(*NewType) + " in " + toString(File));
Sam Clegg93102972018-02-23 05:08:53 +0000139 }
Sam Clegg24b3dcd2018-01-28 19:57:01 +0000140}
141
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000142static void checkDataType(const Symbol *Existing, const InputFile *File) {
143 if (!isa<DataSymbol>(Existing))
Sam Clegg3876d89a2018-05-14 22:42:33 +0000144 reportTypeError(Existing, File, WASM_SYMBOL_TYPE_DATA);
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000145}
146
Sam Cleggdfb0b2c2018-02-14 18:27:59 +0000147DefinedFunction *SymbolTable::addSyntheticFunction(StringRef Name,
Nicholas Wilsonebda41f2018-03-09 16:43:05 +0000148 uint32_t Flags,
149 InputFunction *Function) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000150 LLVM_DEBUG(dbgs() << "addSyntheticFunction: " << Name << "\n");
Rui Ueyamab961abc2018-02-28 22:51:51 +0000151 assert(!find(Name));
Nicholas Wilsonebda41f2018-03-09 16:43:05 +0000152 SyntheticFunctions.emplace_back(Function);
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000153 return replaceSymbol<DefinedFunction>(insert(Name, nullptr).first, Name,
154 Flags, nullptr, Function);
Sam Clegg50686852018-01-12 18:35:13 +0000155}
156
Sam Clegg00245532018-02-20 23:38:27 +0000157DefinedData *SymbolTable::addSyntheticDataSymbol(StringRef Name,
158 uint32_t Flags) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000159 LLVM_DEBUG(dbgs() << "addSyntheticDataSymbol: " << Name << "\n");
Rui Ueyamab961abc2018-02-28 22:51:51 +0000160 assert(!find(Name));
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000161 return replaceSymbol<DefinedData>(insert(Name, nullptr).first, Name, Flags);
Sam Cleggc94d3932017-11-17 18:14:09 +0000162}
163
Sam Clegg93102972018-02-23 05:08:53 +0000164DefinedGlobal *SymbolTable::addSyntheticGlobal(StringRef Name, uint32_t Flags,
165 InputGlobal *Global) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000166 LLVM_DEBUG(dbgs() << "addSyntheticGlobal: " << Name << " -> " << Global
167 << "\n");
Rui Ueyamab961abc2018-02-28 22:51:51 +0000168 assert(!find(Name));
Nicholas Wilsonebda41f2018-03-09 16:43:05 +0000169 SyntheticGlobals.emplace_back(Global);
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000170 return replaceSymbol<DefinedGlobal>(insert(Name, nullptr).first, Name, Flags,
171 nullptr, Global);
Sam Clegg93102972018-02-23 05:08:53 +0000172}
173
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000174static bool shouldReplace(const Symbol *Existing, InputFile *NewFile,
175 uint32_t NewFlags) {
Rui Ueyamac03c9042018-02-20 21:08:47 +0000176 // If existing symbol is undefined, replace it.
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000177 if (!Existing->isDefined()) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000178 LLVM_DEBUG(dbgs() << "resolving existing undefined symbol: "
179 << Existing->getName() << "\n");
Rui Ueyamac03c9042018-02-20 21:08:47 +0000180 return true;
181 }
182
183 // Now we have two defined symbols. If the new one is weak, we can ignore it.
184 if ((NewFlags & WASM_SYMBOL_BINDING_MASK) == WASM_SYMBOL_BINDING_WEAK) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000185 LLVM_DEBUG(dbgs() << "existing symbol takes precedence\n");
Rui Ueyamac03c9042018-02-20 21:08:47 +0000186 return false;
187 }
188
189 // If the existing symbol is weak, we should replace it.
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000190 if (Existing->isWeak()) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000191 LLVM_DEBUG(dbgs() << "replacing existing weak symbol\n");
Rui Ueyamac03c9042018-02-20 21:08:47 +0000192 return true;
193 }
194
195 // Neither symbol is week. They conflict.
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000196 error("duplicate symbol: " + toString(*Existing) + "\n>>> defined in " +
197 toString(Existing->getFile()) + "\n>>> defined in " +
198 toString(NewFile));
Rui Ueyamac03c9042018-02-20 21:08:47 +0000199 return true;
Sam Clegg93e559b2018-02-20 18:55:06 +0000200}
201
202Symbol *SymbolTable::addDefinedFunction(StringRef Name, uint32_t Flags,
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000203 InputFile *File,
204 InputFunction *Function) {
Sam Clegg8b0b48f2018-09-28 16:50:14 +0000205 LLVM_DEBUG(dbgs() << "addDefinedFunction: " << Name << " ["
206 << (Function ? toString(Function->Signature) : "none")
207 << "]\n");
Sam Clegg93e559b2018-02-20 18:55:06 +0000208 Symbol *S;
209 bool WasInserted;
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000210 std::tie(S, WasInserted) = insert(Name, File);
Sam Cleggc729c1b2018-05-30 18:07:52 +0000211
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000212 if (WasInserted || S->isLazy()) {
213 replaceSymbol<DefinedFunction>(S, Name, Flags, File, Function);
214 return S;
215 }
216
Sam Cleggc729c1b2018-05-30 18:07:52 +0000217 if (Function)
218 checkFunctionType(S, File, &Function->Signature);
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000219
Sam Clegg8b0b48f2018-09-28 16:50:14 +0000220 if (shouldReplace(S, File, Flags)) {
221 // If the new defined function doesn't have signture (i.e. bitcode
222 // functions) but the old symbols does then preserve the old signature
223 const WasmSignature *OldSig = nullptr;
224 if (auto* F = dyn_cast<FunctionSymbol>(S))
225 OldSig = F->FunctionType;
226 auto NewSym = replaceSymbol<DefinedFunction>(S, Name, Flags, File, Function);
227 if (!NewSym->FunctionType)
228 NewSym->FunctionType = OldSig;
229 }
Sam Clegg93e559b2018-02-20 18:55:06 +0000230 return S;
231}
232
Sam Clegg00245532018-02-20 23:38:27 +0000233Symbol *SymbolTable::addDefinedData(StringRef Name, uint32_t Flags,
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000234 InputFile *File, InputSegment *Segment,
Sam Clegg93102972018-02-23 05:08:53 +0000235 uint32_t Address, uint32_t Size) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000236 LLVM_DEBUG(dbgs() << "addDefinedData:" << Name << " addr:" << Address
237 << "\n");
Sam Clegg93e559b2018-02-20 18:55:06 +0000238 Symbol *S;
239 bool WasInserted;
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000240 std::tie(S, WasInserted) = insert(Name, File);
Sam Cleggc729c1b2018-05-30 18:07:52 +0000241
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000242 if (WasInserted || S->isLazy()) {
243 replaceSymbol<DefinedData>(S, Name, Flags, File, Segment, Address, Size);
244 return S;
245 }
246
247 checkDataType(S, File);
248
249 if (shouldReplace(S, File, Flags))
250 replaceSymbol<DefinedData>(S, Name, Flags, File, Segment, Address, Size);
Sam Cleggc94d3932017-11-17 18:14:09 +0000251 return S;
252}
253
Sam Clegg93102972018-02-23 05:08:53 +0000254Symbol *SymbolTable::addDefinedGlobal(StringRef Name, uint32_t Flags,
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000255 InputFile *File, InputGlobal *Global) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000256 LLVM_DEBUG(dbgs() << "addDefinedGlobal:" << Name << "\n");
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000257
Sam Clegg93102972018-02-23 05:08:53 +0000258 Symbol *S;
259 bool WasInserted;
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000260 std::tie(S, WasInserted) = insert(Name, File);
Sam Cleggc729c1b2018-05-30 18:07:52 +0000261
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000262 if (WasInserted || S->isLazy()) {
263 replaceSymbol<DefinedGlobal>(S, Name, Flags, File, Global);
264 return S;
265 }
266
267 checkGlobalType(S, File, &Global->getType());
268
269 if (shouldReplace(S, File, Flags))
270 replaceSymbol<DefinedGlobal>(S, Name, Flags, File, Global);
Sam Clegg93102972018-02-23 05:08:53 +0000271 return S;
272}
273
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000274Symbol *SymbolTable::addUndefinedFunction(StringRef Name, uint32_t Flags,
275 InputFile *File,
276 const WasmSignature *Sig) {
Sam Clegg8b0b48f2018-09-28 16:50:14 +0000277 LLVM_DEBUG(dbgs() << "addUndefinedFunction: " << Name <<
278 " [" << (Sig ? toString(*Sig) : "none") << "]\n");
Rui Ueyamac03c9042018-02-20 21:08:47 +0000279
Sam Cleggc94d3932017-11-17 18:14:09 +0000280 Symbol *S;
281 bool WasInserted;
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000282 std::tie(S, WasInserted) = insert(Name, File);
Sam Cleggc729c1b2018-05-30 18:07:52 +0000283
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000284 if (WasInserted)
285 replaceSymbol<UndefinedFunction>(S, Name, Flags, File, Sig);
286 else if (auto *Lazy = dyn_cast<LazySymbol>(S))
Rui Ueyamab961abc2018-02-28 22:51:51 +0000287 Lazy->fetch();
Sam Cleggcefbf9a2018-06-28 16:53:53 +0000288 else
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000289 checkFunctionType(S, File, Sig);
Sam Cleggcefbf9a2018-06-28 16:53:53 +0000290
Sam Cleggc94d3932017-11-17 18:14:09 +0000291 return S;
292}
293
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000294Symbol *SymbolTable::addUndefinedData(StringRef Name, uint32_t Flags,
295 InputFile *File) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000296 LLVM_DEBUG(dbgs() << "addUndefinedData: " << Name << "\n");
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000297
298 Symbol *S;
299 bool WasInserted;
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000300 std::tie(S, WasInserted) = insert(Name, File);
Sam Cleggf989a922018-07-17 19:15:02 +0000301
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000302 if (WasInserted)
303 replaceSymbol<UndefinedData>(S, Name, Flags, File);
304 else if (auto *Lazy = dyn_cast<LazySymbol>(S))
Rui Ueyamab961abc2018-02-28 22:51:51 +0000305 Lazy->fetch();
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000306 else if (S->isDefined())
307 checkDataType(S, File);
308 return S;
309}
310
311Symbol *SymbolTable::addUndefinedGlobal(StringRef Name, uint32_t Flags,
312 InputFile *File,
313 const WasmGlobalType *Type) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000314 LLVM_DEBUG(dbgs() << "addUndefinedGlobal: " << Name << "\n");
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000315
316 Symbol *S;
317 bool WasInserted;
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000318 std::tie(S, WasInserted) = insert(Name, File);
Sam Cleggc729c1b2018-05-30 18:07:52 +0000319
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000320 if (WasInserted)
321 replaceSymbol<UndefinedGlobal>(S, Name, Flags, File, Type);
322 else if (auto *Lazy = dyn_cast<LazySymbol>(S))
Rui Ueyamab961abc2018-02-28 22:51:51 +0000323 Lazy->fetch();
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000324 else if (S->isDefined())
325 checkGlobalType(S, File, Type);
326 return S;
327}
328
329void SymbolTable::addLazy(ArchiveFile *File, const Archive::Symbol *Sym) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000330 LLVM_DEBUG(dbgs() << "addLazy: " << Sym->getName() << "\n");
Sam Cleggc94d3932017-11-17 18:14:09 +0000331 StringRef Name = Sym->getName();
Rui Ueyamac03c9042018-02-20 21:08:47 +0000332
Sam Cleggc94d3932017-11-17 18:14:09 +0000333 Symbol *S;
334 bool WasInserted;
Sam Clegg4c2cbfe2018-08-02 20:39:19 +0000335 std::tie(S, WasInserted) = insert(Name, nullptr);
Rui Ueyamac03c9042018-02-20 21:08:47 +0000336
Sam Cleggc94d3932017-11-17 18:14:09 +0000337 if (WasInserted) {
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000338 replaceSymbol<LazySymbol>(S, Name, File, *Sym);
Rui Ueyamac03c9042018-02-20 21:08:47 +0000339 return;
340 }
341
342 // If there is an existing undefined symbol, load a new one from the archive.
343 if (S->isUndefined()) {
Nicola Zaghene7245b42018-05-15 13:36:20 +0000344 LLVM_DEBUG(dbgs() << "replacing existing undefined\n");
Rui Ueyamae3498ec2018-02-28 00:09:22 +0000345 File->addMember(Sym);
Sam Cleggc94d3932017-11-17 18:14:09 +0000346 }
347}
Sam Clegge0f6fcd2018-01-12 22:25:17 +0000348
Nicholas Wilsonc4d9aa12018-03-14 15:45:11 +0000349bool SymbolTable::addComdat(StringRef Name) {
350 return Comdats.insert(CachedHashStringRef(Name)).second;
Sam Clegge0f6fcd2018-01-12 22:25:17 +0000351}