blob: 98267d1cd8de72500e53facf0fb354ba26088671 [file] [log] [blame]
Sam Clegg03626332018-01-31 01:45:47 +00001//===- MarkLive.cpp -------------------------------------------------------===//
2//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Sam Clegg03626332018-01-31 01:45:47 +00006//
7//===----------------------------------------------------------------------===//
8//
9// This file implements --gc-sections, which is a feature to remove unused
10// chunks from the output. Unused chunks are those that are not reachable from
11// known root symbols or chunks. This feature is implemented as a mark-sweep
12// garbage collector.
13//
14// Here's how it works. Each InputChunk has a "Live" bit. The bit is off by
15// default. Starting with the GC-roots, visit all reachable chunks and set their
16// Live bits. The Writer will then ignore chunks whose Live bits are off, so
// that such chunks do not appear in the output.
18//
19//===----------------------------------------------------------------------===//
20
21#include "MarkLive.h"
22#include "Config.h"
23#include "InputChunks.h"
Heejin Ahne915a712018-12-08 06:17:43 +000024#include "InputEvent.h"
Nicholas Wilson358af382018-04-20 17:28:12 +000025#include "InputGlobal.h"
Sam Clegg03626332018-01-31 01:45:47 +000026#include "SymbolTable.h"
27#include "Symbols.h"
28
29#define DEBUG_TYPE "lld"
30
31using namespace llvm;
32using namespace llvm::wasm;
Sam Clegg03626332018-01-31 01:45:47 +000033
34void lld::wasm::markLive() {
Rui Ueyama136d27a2019-07-11 05:40:30 +000035 if (!config->gcSections)
Sam Cleggffd0aaf2018-06-22 15:13:10 +000036 return;
37
Nicola Zaghene7245b42018-05-15 13:36:20 +000038 LLVM_DEBUG(dbgs() << "markLive\n");
Rui Ueyama136d27a2019-07-11 05:40:30 +000039 SmallVector<InputChunk *, 256> q;
Sam Clegg03626332018-01-31 01:45:47 +000040
Rui Ueyama136d27a2019-07-11 05:40:30 +000041 std::function<void(Symbol*)> enqueue = [&](Symbol *sym) {
42 if (!sym || sym->isLive())
Sam Clegg03626332018-01-31 01:45:47 +000043 return;
Rui Ueyama136d27a2019-07-11 05:40:30 +000044 LLVM_DEBUG(dbgs() << "markLive: " << sym->getName() << "\n");
45 sym->markLive();
46 if (InputChunk *chunk = sym->getChunk())
47 q.push_back(chunk);
Sam Clegg0e6b42f2019-03-01 22:35:47 +000048
Fangrui Song33fdf822019-07-16 08:08:17 +000049 // The ctor functions are all referenced by the synthetic callCtors
Sam Clegg0e6b42f2019-03-01 22:35:47 +000050 // function. However, this function does not contain relocations so we
Fangrui Song33fdf822019-07-16 08:08:17 +000051 // have to manually mark the ctors as live if callCtors itself is live.
Rui Ueyama136d27a2019-07-11 05:40:30 +000052 if (sym == WasmSym::callCtors) {
Rui Ueyama136d27a2019-07-11 05:40:30 +000053 if (config->isPic)
54 enqueue(WasmSym::applyRelocs);
55 for (const ObjFile *obj : symtab->objectFiles) {
56 const WasmLinkingData &l = obj->getWasmObj()->linkingData();
57 for (const WasmInitFunc &f : l.InitFunctions) {
58 auto* initSym = obj->getFunctionSymbol(f.Symbol);
59 if (!initSym->isDiscarded())
60 enqueue(initSym);
Sam Cleggfd54fa52019-06-07 06:00:46 +000061 }
Sam Clegg0e6b42f2019-03-01 22:35:47 +000062 }
63 }
Sam Clegg03626332018-01-31 01:45:47 +000064 };
65
66 // Add GC root symbols.
Rui Ueyama136d27a2019-07-11 05:40:30 +000067 if (!config->entry.empty())
68 enqueue(symtab->find(config->entry));
Sam Clegg03626332018-01-31 01:45:47 +000069
Dan Gohman7cb9c8a2019-08-29 22:41:05 +000070 // We need to preserve any no-strip or exported symbol
Rui Ueyama136d27a2019-07-11 05:40:30 +000071 for (Symbol *sym : symtab->getSymbols())
Dan Gohman7cb9c8a2019-08-29 22:41:05 +000072 if (sym->isNoStrip() || sym->isExported())
Rui Ueyama136d27a2019-07-11 05:40:30 +000073 enqueue(sym);
Sam Clegg03626332018-01-31 01:45:47 +000074
Sam Clegg0e6b42f2019-03-01 22:35:47 +000075 // For relocatable output, we need to preserve all the ctor functions
Rui Ueyama136d27a2019-07-11 05:40:30 +000076 if (config->relocatable) {
77 for (const ObjFile *obj : symtab->objectFiles) {
78 const WasmLinkingData &l = obj->getWasmObj()->linkingData();
79 for (const WasmInitFunc &f : l.InitFunctions)
80 enqueue(obj->getFunctionSymbol(f.Symbol));
Sam Clegg0e6b42f2019-03-01 22:35:47 +000081 }
Sam Clegg03626332018-01-31 01:45:47 +000082 }
83
Rui Ueyama136d27a2019-07-11 05:40:30 +000084 if (config->isPic)
85 enqueue(WasmSym::callCtors);
Sam Clegg09137be2019-04-04 18:40:51 +000086
Thomas Lively09768c52019-09-04 19:50:39 +000087 if (config->sharedMemory && !config->shared)
88 enqueue(WasmSym::initMemory);
89
Rui Ueyama34133b232018-02-19 22:34:47 +000090 // Follow relocations to mark all reachable chunks.
Rui Ueyama136d27a2019-07-11 05:40:30 +000091 while (!q.empty()) {
92 InputChunk *c = q.pop_back_val();
Rui Ueyama34133b232018-02-19 22:34:47 +000093
Rui Ueyama136d27a2019-07-11 05:40:30 +000094 for (const WasmRelocation reloc : c->getRelocations()) {
95 if (reloc.Type == R_WASM_TYPE_INDEX_LEB)
Nicholas Wilson2e55ee72018-03-09 17:06:38 +000096 continue;
Rui Ueyama136d27a2019-07-11 05:40:30 +000097 Symbol *sym = c->file->getSymbol(reloc.Index);
Nicholas Wilson2e55ee72018-03-09 17:06:38 +000098
99 // If the function has been assigned the special index zero in the table,
100 // the relocation doesn't pull in the function body, since the function
101 // won't actually go in the table (the runtime will trap attempts to call
102 // that index, since we don't use it). A function with a table index of
103 // zero is only reachable via "call", not via "call_indirect". The stub
104 // functions used for weak-undefined symbols have this behaviour (compare
105 // equal to null pointer, only reachable via direct call).
Rui Ueyama136d27a2019-07-11 05:40:30 +0000106 if (reloc.Type == R_WASM_TABLE_INDEX_SLEB ||
107 reloc.Type == R_WASM_TABLE_INDEX_I32) {
108 auto *funcSym = cast<FunctionSymbol>(sym);
109 if (funcSym->hasTableIndex() && funcSym->getTableIndex() == 0)
Nicholas Wilson2e55ee72018-03-09 17:06:38 +0000110 continue;
111 }
112
Rui Ueyama136d27a2019-07-11 05:40:30 +0000113 enqueue(sym);
Sam Clegg03626332018-01-31 01:45:47 +0000114 }
Rui Ueyama34133b232018-02-19 22:34:47 +0000115 }
Sam Clegg03626332018-01-31 01:45:47 +0000116
117 // Report garbage-collected sections.
Rui Ueyama136d27a2019-07-11 05:40:30 +0000118 if (config->printGcSections) {
119 for (const ObjFile *obj : symtab->objectFiles) {
120 for (InputChunk *c : obj->functions)
121 if (!c->live)
122 message("removing unused section " + toString(c));
123 for (InputChunk *c : obj->segments)
124 if (!c->live)
125 message("removing unused section " + toString(c));
126 for (InputGlobal *g : obj->globals)
127 if (!g->live)
128 message("removing unused section " + toString(g));
129 for (InputEvent *e : obj->events)
130 if (!e->live)
131 message("removing unused section " + toString(e));
Sam Clegg03626332018-01-31 01:45:47 +0000132 }
Rui Ueyama136d27a2019-07-11 05:40:30 +0000133 for (InputChunk *c : symtab->syntheticFunctions)
134 if (!c->live)
135 message("removing unused section " + toString(c));
136 for (InputGlobal *g : symtab->syntheticGlobals)
137 if (!g->live)
138 message("removing unused section " + toString(g));
Sam Clegg03626332018-01-31 01:45:47 +0000139 }
140}