blob: cdc2c0e539523c4d90d04beeeafc69f17a78778d [file] [log] [blame]
Michael J. Spencer84487f12015-07-24 21:03:07 +00001//===- Writer.cpp ---------------------------------------------------------===//
2//
3// The LLVM Linker
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Michael J. Spencerf8325412015-09-04 22:48:30 +000010#include "Writer.h"
Rui Ueyamacb8474ed2015-08-05 23:51:50 +000011#include "Config.h"
Rui Ueyama9b55e922017-03-24 00:15:16 +000012#include "Filesystem.h"
Rui Ueyama717677a2016-02-11 21:17:59 +000013#include "LinkerScript.h"
Rafael Espindola1ebfc592017-01-13 21:05:46 +000014#include "MapFile.h"
Rui Ueyama9381eb12016-12-18 14:06:06 +000015#include "Memory.h"
Rafael Espindola5805c4f2015-09-21 21:38:08 +000016#include "OutputSections.h"
Rui Ueyama0fcdc732016-05-24 20:24:43 +000017#include "Relocations.h"
Rui Ueyamafbbde542016-06-29 09:08:02 +000018#include "Strings.h"
Rui Ueyamaafff74e22015-08-05 23:24:46 +000019#include "SymbolTable.h"
Rui Ueyama6dc7fcb2016-11-01 20:28:21 +000020#include "SyntheticSections.h"
Rafael Espindola01205f72015-09-22 18:19:46 +000021#include "Target.h"
George Rimardbf93392017-04-17 08:58:12 +000022#include "Threads.h"
Denis Protivensky8e3b38a2015-11-12 09:52:08 +000023#include "llvm/ADT/StringMap.h"
Hal Finkel3bae2d82015-10-12 20:51:48 +000024#include "llvm/ADT/StringSwitch.h"
Rui Ueyamaafff74e22015-08-05 23:24:46 +000025#include "llvm/Support/FileOutputBuffer.h"
Rui Ueyamae8b2df42016-09-29 01:45:22 +000026#include <climits>
Michael J. Spencer84487f12015-07-24 21:03:07 +000027
28using namespace llvm;
29using namespace llvm::ELF;
30using namespace llvm::object;
Peter Smith0a259f32016-10-10 09:39:26 +000031using namespace llvm::support;
32using namespace llvm::support::endian;
Michael J. Spencer84487f12015-07-24 21:03:07 +000033
34using namespace lld;
Rafael Espindolae0df00b2016-02-28 00:25:54 +000035using namespace lld::elf;
Michael J. Spencer84487f12015-07-24 21:03:07 +000036
Rui Ueyamaafff74e22015-08-05 23:24:46 +000037namespace {
38// The writer writes a SymbolTable result to a file.
39template <class ELFT> class Writer {
40public:
Rui Ueyama9328b2c2016-03-14 23:16:09 +000041 typedef typename ELFT::Shdr Elf_Shdr;
42 typedef typename ELFT::Ehdr Elf_Ehdr;
43 typedef typename ELFT::Phdr Elf_Phdr;
Rui Ueyama0ce388b2017-04-05 21:46:06 +000044
Rui Ueyamaafff74e22015-08-05 23:24:46 +000045 void run();
46
47private:
Rui Ueyamaf83aca42016-11-01 23:17:45 +000048 void createSyntheticSections();
Rui Ueyama5a9640b2015-10-08 23:49:30 +000049 void copyLocalSymbols();
Rafael Espindola08d6a3f2017-02-11 01:40:49 +000050 void addSectionSymbols();
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +000051 void addReservedSymbols();
George Rimar9e694502016-07-29 16:18:47 +000052 void createSections();
Rafael Espindolab4c9b812017-02-23 02:28:28 +000053 void forEachRelSec(std::function<void(InputSectionBase &)> Fn);
Rafael Espindola24c073d2016-09-21 22:36:19 +000054 void sortSections();
Eugene Leviante63d81b2016-07-20 14:43:20 +000055 void finalizeSections();
Rui Ueyama84417f82015-12-26 07:50:41 +000056 void addPredefinedSections();
Rafael Espindola4d560162017-09-12 16:38:01 +000057 void setReservedSymbolSections();
Rui Ueyama2df0fd82015-12-25 07:38:58 +000058
George Rimaraa354182017-07-27 07:46:50 +000059 std::vector<PhdrEntry *> createPhdrs();
Rafael Espindola074ba932016-12-06 13:43:34 +000060 void removeEmptyPTLoad();
George Rimaraa354182017-07-27 07:46:50 +000061 void addPtArmExid(std::vector<PhdrEntry *> &Phdrs);
Rui Ueyamae044e9c2016-04-01 17:07:17 +000062 void assignFileOffsets();
George Rimar86ce2672016-08-25 09:05:47 +000063 void assignFileOffsetsBinary();
Rui Ueyamae044e9c2016-04-01 17:07:17 +000064 void setPhdrs();
Rui Ueyama47091902016-03-30 19:41:51 +000065 void fixSectionAlignments();
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +000066 void openFile();
Petr Hosekedd6c352017-08-02 16:35:00 +000067 void writeTrapInstr();
Rui Ueyamaafff74e22015-08-05 23:24:46 +000068 void writeHeader();
69 void writeSections();
George Rimar86ce2672016-08-25 09:05:47 +000070 void writeSectionsBinary();
Rui Ueyama634ddf02016-03-11 20:51:53 +000071 void writeBuildId();
Rui Ueyamaafff74e22015-08-05 23:24:46 +000072
Rui Ueyama818bb2f2016-07-16 18:55:47 +000073 std::unique_ptr<FileOutputBuffer> Buffer;
Michael J. Spencer2f008242015-09-17 19:58:07 +000074
Rafael Espindola05531242017-07-06 16:40:44 +000075 OutputSectionFactory Factory;
Rafael Espindola4fc60442016-02-10 22:43:13 +000076
Rui Ueyama01687222015-12-26 09:47:57 +000077 void addRelIpltSymbols();
Rui Ueyamaa5d79d12015-12-26 09:48:00 +000078 void addStartEndSymbols();
Rafael Espindola24e6f362017-02-24 15:07:30 +000079 void addStartStopSymbols(OutputSection *Sec);
Rui Ueyama6bd38222017-04-05 21:37:09 +000080 uint64_t getEntryAddr();
Rafael Espindola8c022ca2017-07-27 19:22:43 +000081 OutputSection *findSection(StringRef Name);
Rui Ueyama2f1b79f2015-10-10 22:34:30 +000082
George Rimaraa354182017-07-27 07:46:50 +000083 std::vector<PhdrEntry *> Phdrs;
Michael J. Spencer2f008242015-09-17 19:58:07 +000084
Rui Ueyama6bd38222017-04-05 21:37:09 +000085 uint64_t FileSize;
86 uint64_t SectionHeaderOff;
Peter Smith113a59e2017-06-26 10:22:17 +000087
88 bool HasGotBaseSym = false;
Rui Ueyamaafff74e22015-08-05 23:24:46 +000089};
90} // anonymous namespace
91
Rui Ueyama55518e72016-10-28 20:57:25 +000092StringRef elf::getOutputSectionName(StringRef Name) {
George Rimar60a0ea12017-06-05 12:49:21 +000093 // ".zdebug_" is a prefix for ZLIB-compressed sections.
94 // Because we decompressed input sections, we want to remove 'z'.
95 if (Name.startswith(".zdebug_"))
96 return Saver.save("." + Name.substr(2));
97
Eugene Levianta8d12ef2016-10-05 10:10:45 +000098 if (Config->Relocatable)
99 return Name;
100
Rafael Espindola7d382732016-09-19 19:59:21 +0000101 for (StringRef V :
George Rimar1ab9cf42017-03-17 10:14:53 +0000102 {".text.", ".rodata.", ".data.rel.ro.", ".data.", ".bss.rel.ro.",
103 ".bss.", ".init_array.", ".fini_array.", ".ctors.", ".dtors.", ".tbss.",
Peter Smith691ff762017-06-28 09:12:38 +0000104 ".gcc_except_table.", ".tdata.", ".ARM.exidx.", ".ARM.extab."}) {
Rafael Espindola7d382732016-09-19 19:59:21 +0000105 StringRef Prefix = V.drop_back();
106 if (Name.startswith(V) || Name == Prefix)
107 return Prefix;
108 }
Rui Ueyama05384082016-10-12 22:36:31 +0000109
Rui Ueyamae8a61022016-11-05 23:05:47 +0000110 // CommonSection is identified as "COMMON" in linker scripts.
111 // By default, it should go to .bss section.
112 if (Name == "COMMON")
113 return ".bss";
114
George Rimar5d53d1f2016-07-12 08:50:42 +0000115 return Name;
116}
117
George Rimar696a7f92017-09-19 09:20:54 +0000118static bool needsInterpSection() {
119 return !SharedFiles.empty() && !Config->DynamicLinker.empty() &&
Rui Ueyamae03ba022017-10-08 03:52:15 +0000120 Script->needsInterpSection();
Rui Ueyamafd03cfd2016-07-21 11:01:23 +0000121}
122
George Rimard8b27762016-11-14 10:14:18 +0000123template <class ELFT> void elf::writeResult() { Writer<ELFT>().run(); }
Rafael Espindola4fc60442016-02-10 22:43:13 +0000124
Rafael Espindola074ba932016-12-06 13:43:34 +0000125template <class ELFT> void Writer<ELFT>::removeEmptyPTLoad() {
George Rimar60608a82017-08-28 09:28:15 +0000126 llvm::erase_if(Phdrs, [&](const PhdrEntry *P) {
George Rimaraa354182017-07-27 07:46:50 +0000127 if (P->p_type != PT_LOAD)
Rafael Espindola074ba932016-12-06 13:43:34 +0000128 return false;
George Rimar6823c5f2017-09-07 11:01:10 +0000129 if (!P->FirstSec)
Rafael Espindola41217612016-12-08 03:17:05 +0000130 return true;
George Rimar6823c5f2017-09-07 11:01:10 +0000131 uint64_t Size = P->LastSec->Addr + P->LastSec->Size - P->FirstSec->Addr;
Rafael Espindola074ba932016-12-06 13:43:34 +0000132 return Size == 0;
133 });
Rafael Espindola074ba932016-12-06 13:43:34 +0000134}
135
Petr Hosek7b793212017-03-10 20:00:42 +0000136template <class ELFT> static void combineEhFrameSections() {
137 for (InputSectionBase *&S : InputSections) {
138 EhInputSection *ES = dyn_cast<EhInputSection>(S);
Rafael Espindolaa1565552017-03-15 12:31:54 +0000139 if (!ES || !ES->Live)
Petr Hosek7b793212017-03-10 20:00:42 +0000140 continue;
141
142 In<ELFT>::EhFrame->addSection(ES);
143 S = nullptr;
144 }
145
146 std::vector<InputSectionBase *> &V = InputSections;
147 V.erase(std::remove(V.begin(), V.end(), nullptr), V.end());
148}
149
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000150// The main function of the writer.
151template <class ELFT> void Writer<ELFT>::run() {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000152 // Create linker-synthesized sections such as .got or .plt.
153 // Such sections are of type input section.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000154 createSyntheticSections();
George Rimar7beff422016-11-15 08:19:02 +0000155
Petr Hosek7b793212017-03-10 20:00:42 +0000156 if (!Config->Relocatable)
157 combineEhFrameSections<ELFT>();
158
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000159 // We need to create some reserved symbols such as _end. Create them.
George Rimar7beff422016-11-15 08:19:02 +0000160 if (!Config->Relocatable)
161 addReservedSymbols();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000162
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000163 // Create output sections.
Rui Ueyamaac27de92017-10-11 01:19:33 +0000164 if (Script->HasSections) {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000165 // If linker script contains SECTIONS commands, let it create sections.
George Rimara8dba482017-03-20 10:09:58 +0000166 Script->processCommands(Factory);
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000167
168 // Linker scripts may have left some input sections unassigned.
169 // Assign such sections using the default rule.
George Rimara8dba482017-03-20 10:09:58 +0000170 Script->addOrphanSections(Factory);
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000171 } else {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000172 // If linker script does not contain SECTIONS commands, create
173 // output sections by default rules. We still need to give the
174 // linker script a chance to run, because it might contain
175 // non-SECTIONS commands such as ASSERT.
George Rimara8dba482017-03-20 10:09:58 +0000176 Script->processCommands(Factory);
Rafael Espindola21263342017-07-05 23:36:24 +0000177 createSections();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000178 }
179
180 if (Config->Discard != DiscardPolicy::All)
181 copyLocalSymbols();
182
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000183 if (Config->CopyRelocs)
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000184 addSectionSymbols();
185
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000186 // Now that we have a complete set of output sections. This function
187 // completes section contents. For example, we need to add strings
188 // to the string table, and add entries to .got and .plt.
189 // finalizeSections does that.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000190 finalizeSections();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000191 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000192 return;
193
Rafael Espindola55b169b2017-05-24 18:08:04 +0000194 // If -compressed-debug-sections is specified, we need to compress
195 // .debug_* sections. Do it right now because it changes the size of
196 // output sections.
George Rimara9b07142017-08-04 08:30:16 +0000197 parallelForEach(OutputSections,
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000198 [](OutputSection *Sec) { Sec->maybeCompress<ELFT>(); });
Rafael Espindola805f5152017-06-01 16:30:12 +0000199
Peter Smith5aedebf2017-07-05 09:12:54 +0000200 Script->assignAddresses();
201 Script->allocateHeaders(Phdrs);
Rafael Espindola189860c2017-06-07 02:24:08 +0000202
203 // Remove empty PT_LOAD to avoid causing the dynamic linker to try to mmap a
204 // 0 sized region. This has to be done late since only after assignAddresses
205 // we know the size of the sections.
206 removeEmptyPTLoad();
207
208 if (!Config->OFormatBinary)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000209 assignFileOffsets();
Rafael Espindola189860c2017-06-07 02:24:08 +0000210 else
211 assignFileOffsetsBinary();
212
213 setPhdrs();
214
215 if (Config->Relocatable) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000216 for (OutputSection *Sec : OutputSections)
217 Sec->Addr = 0;
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000218 }
219
George Rimar2ddab6d2017-01-17 13:50:34 +0000220 // It does not make sense try to open the file if we have error already.
221 if (ErrorCount)
222 return;
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000223 // Write the result down to a file.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000224 openFile();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000225 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000226 return;
Rafael Espindola3f235c72017-06-01 16:32:58 +0000227
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000228 if (!Config->OFormatBinary) {
Petr Hosekedd6c352017-08-02 16:35:00 +0000229 writeTrapInstr();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000230 writeHeader();
231 writeSections();
232 } else {
233 writeSectionsBinary();
234 }
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000235
236 // Backfill .note.gnu.build-id section content. This is done at last
237 // because the content is usually a hash value of the entire output file.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000238 writeBuildId();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000239 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000240 return;
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000241
Rui Ueyama40eaa992017-01-18 03:34:38 +0000242 // Handle -Map option.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000243 writeMapFile<ELFT>();
Rui Ueyama40eaa992017-01-18 03:34:38 +0000244 if (ErrorCount)
245 return;
246
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000247 if (auto EC = Buffer->commit())
Rui Ueyamac8d3a832017-01-12 22:18:04 +0000248 error("failed to write to the output file: " + EC.message());
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000249}
250
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000251// Initialize Out members.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000252template <class ELFT> void Writer<ELFT>::createSyntheticSections() {
253 // Initialize all pointers with NULL. This is needed because
254 // you can call lld::elf::main more than once as a library.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000255 memset(&Out::First, 0, sizeof(Out));
Rui Ueyamacfadbd92016-11-01 23:12:51 +0000256
Rui Ueyama536a2672017-02-27 02:32:08 +0000257 auto Add = [](InputSectionBase *Sec) { InputSections.push_back(Sec); };
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000258
Rafael Espindola895aea62017-05-11 22:02:41 +0000259 InX::DynStrTab = make<StringTableSection>(".dynstr", true);
Rafael Espindola5ab19892017-05-11 23:16:43 +0000260 InX::Dynamic = make<DynamicSection<ELFT>>();
Eugene Levianta96d9022016-11-16 10:02:27 +0000261 In<ELFT>::RelaDyn = make<RelocationSection<ELFT>>(
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000262 Config->IsRela ? ".rela.dyn" : ".rel.dyn", Config->ZCombreloc);
Rafael Espindola895aea62017-05-11 22:02:41 +0000263 InX::ShStrTab = make<StringTableSection>(".shstrtab", false);
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000264
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000265 Out::ElfHeader = make<OutputSection>("", 0, SHF_ALLOC);
266 Out::ElfHeader->Size = sizeof(Elf_Ehdr);
267 Out::ProgramHeaders = make<OutputSection>("", 0, SHF_ALLOC);
Rui Ueyama8befefb2017-10-07 00:58:34 +0000268 Out::ProgramHeaders->Alignment = Config->Wordsize;
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000269
George Rimar696a7f92017-09-19 09:20:54 +0000270 if (needsInterpSection()) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000271 InX::Interp = createInterpSection();
272 Add(InX::Interp);
Rui Ueyamae8a61022016-11-05 23:05:47 +0000273 } else {
Rafael Espindola895aea62017-05-11 22:02:41 +0000274 InX::Interp = nullptr;
Rui Ueyamae8a61022016-11-05 23:05:47 +0000275 }
Rui Ueyama3a41be22016-04-07 22:49:21 +0000276
George Rimarf21aade2016-08-31 08:38:11 +0000277 if (Config->Strip != StripPolicy::All) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000278 InX::StrTab = make<StringTableSection>(".strtab", false);
George Rimarf45f6812017-05-16 08:53:30 +0000279 InX::SymTab = make<SymbolTableSection<ELFT>>(*InX::StrTab);
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000280 }
Rui Ueyamacfadbd92016-11-01 23:12:51 +0000281
Rui Ueyamac4030a12016-11-22 00:54:15 +0000282 if (Config->BuildId != BuildIdKind::None) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000283 InX::BuildId = make<BuildIdSection>();
284 Add(InX::BuildId);
Rui Ueyamac4030a12016-11-22 00:54:15 +0000285 }
Rui Ueyamae8a61022016-11-05 23:05:47 +0000286
Rui Ueyama732f4e22017-10-04 00:21:17 +0000287 InX::Bss = make<BssSection>(".bss", 0, 1);
Rafael Espindola895aea62017-05-11 22:02:41 +0000288 Add(InX::Bss);
Rui Ueyama732f4e22017-10-04 00:21:17 +0000289 InX::BssRelRo = make<BssSection>(".bss.rel.ro", 0, 1);
Rafael Espindola895aea62017-05-11 22:02:41 +0000290 Add(InX::BssRelRo);
George Rimar1ab9cf42017-03-17 10:14:53 +0000291
Rui Ueyama1d75de02016-11-22 04:28:39 +0000292 // Add MIPS-specific sections.
Simon Atanasyance02cf02016-11-09 21:36:56 +0000293 if (Config->EMachine == EM_MIPS) {
Rafael Espindolae05e2f82017-09-15 18:05:02 +0000294 if (!Config->Shared && Config->HasDynSymTab) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000295 InX::MipsRldMap = make<MipsRldMapSection>();
296 Add(InX::MipsRldMap);
Eugene Leviant17b7a572016-11-22 17:49:14 +0000297 }
Rui Ueyama1d75de02016-11-22 04:28:39 +0000298 if (auto *Sec = MipsAbiFlagsSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000299 Add(Sec);
Rui Ueyama1d75de02016-11-22 04:28:39 +0000300 if (auto *Sec = MipsOptionsSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000301 Add(Sec);
Rui Ueyama1d75de02016-11-22 04:28:39 +0000302 if (auto *Sec = MipsReginfoSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000303 Add(Sec);
Simon Atanasyance02cf02016-11-09 21:36:56 +0000304 }
Eugene Leviant41ca3272016-11-10 09:48:29 +0000305
Rafael Espindolae05e2f82017-09-15 18:05:02 +0000306 if (Config->HasDynSymTab) {
George Rimar69b17c32017-05-16 10:04:42 +0000307 InX::DynSymTab = make<SymbolTableSection<ELFT>>(*InX::DynStrTab);
308 Add(InX::DynSymTab);
George Rimar11992c862016-11-25 08:05:41 +0000309
310 In<ELFT>::VerSym = make<VersionTableSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000311 Add(In<ELFT>::VerSym);
George Rimar11992c862016-11-25 08:05:41 +0000312
313 if (!Config->VersionDefinitions.empty()) {
314 In<ELFT>::VerDef = make<VersionDefinitionSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000315 Add(In<ELFT>::VerDef);
George Rimar11992c862016-11-25 08:05:41 +0000316 }
317
318 In<ELFT>::VerNeed = make<VersionNeedSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000319 Add(In<ELFT>::VerNeed);
George Rimar11992c862016-11-25 08:05:41 +0000320
321 if (Config->GnuHash) {
George Rimar69b17c32017-05-16 10:04:42 +0000322 InX::GnuHashTab = make<GnuHashTableSection>();
323 Add(InX::GnuHashTab);
George Rimar11992c862016-11-25 08:05:41 +0000324 }
325
326 if (Config->SysvHash) {
George Rimaraaf54712017-09-27 09:14:59 +0000327 InX::HashTab = make<HashTableSection>();
328 Add(InX::HashTab);
George Rimar11992c862016-11-25 08:05:41 +0000329 }
330
Rafael Espindola5ab19892017-05-11 23:16:43 +0000331 Add(InX::Dynamic);
Rafael Espindola895aea62017-05-11 22:02:41 +0000332 Add(InX::DynStrTab);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000333 Add(In<ELFT>::RelaDyn);
George Rimar11992c862016-11-25 08:05:41 +0000334 }
335
Rui Ueyama1d75de02016-11-22 04:28:39 +0000336 // Add .got. MIPS' .got is so different from the other archs,
337 // it has its own class.
George Rimar11992c862016-11-25 08:05:41 +0000338 if (Config->EMachine == EM_MIPS) {
Rafael Espindolab3aa2c92017-05-11 21:33:30 +0000339 InX::MipsGot = make<MipsGotSection>();
340 Add(InX::MipsGot);
George Rimar11992c862016-11-25 08:05:41 +0000341 } else {
Rafael Espindolaa6465bb2017-05-18 16:45:36 +0000342 InX::Got = make<GotSection>();
Rafael Espindola88ab9fb2017-05-11 23:26:03 +0000343 Add(InX::Got);
George Rimar11992c862016-11-25 08:05:41 +0000344 }
Simon Atanasyan725dc142016-11-16 21:01:02 +0000345
Rafael Espindola4b1c3692017-05-11 21:23:38 +0000346 InX::GotPlt = make<GotPltSection>();
347 Add(InX::GotPlt);
Rafael Espindola895aea62017-05-11 22:02:41 +0000348 InX::IgotPlt = make<IgotPltSection>();
349 Add(InX::IgotPlt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000350
351 if (Config->GdbIndex) {
Rafael Espindola300b3862017-07-12 23:56:53 +0000352 InX::GdbIndex = createGdbIndex<ELFT>();
Rafael Espindola895aea62017-05-11 22:02:41 +0000353 Add(InX::GdbIndex);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000354 }
355
356 // We always need to add rel[a].plt to output if it has entries.
357 // Even for static linking it can contain R_[*]_IRELATIVE relocations.
358 In<ELFT>::RelaPlt = make<RelocationSection<ELFT>>(
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000359 Config->IsRela ? ".rela.plt" : ".rel.plt", false /*Sort*/);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000360 Add(In<ELFT>::RelaPlt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000361
Peter Smithbaffdb82016-12-08 12:58:55 +0000362 // The RelaIplt immediately follows .rel.plt (.rel.dyn for ARM) to ensure
363 // that the IRelative relocations are processed last by the dynamic loader
364 In<ELFT>::RelaIplt = make<RelocationSection<ELFT>>(
365 (Config->EMachine == EM_ARM) ? ".rel.dyn" : In<ELFT>::RelaPlt->Name,
366 false /*Sort*/);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000367 Add(In<ELFT>::RelaIplt);
Peter Smithbaffdb82016-12-08 12:58:55 +0000368
Rafael Espindola895aea62017-05-11 22:02:41 +0000369 InX::Plt = make<PltSection>(Target->PltHeaderSize);
370 Add(InX::Plt);
371 InX::Iplt = make<PltSection>(0);
372 Add(InX::Iplt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000373
Rafael Espindola66b4e212017-02-23 22:06:28 +0000374 if (!Config->Relocatable) {
George Rimar1c74c2f2017-03-09 08:45:25 +0000375 if (Config->EhFrameHdr) {
376 In<ELFT>::EhFrameHdr = make<EhFrameHeader<ELFT>>();
377 Add(In<ELFT>::EhFrameHdr);
378 }
Rafael Espindola66b4e212017-02-23 22:06:28 +0000379 In<ELFT>::EhFrame = make<EhFrameSection<ELFT>>();
380 Add(In<ELFT>::EhFrame);
381 }
382
George Rimar69b17c32017-05-16 10:04:42 +0000383 if (InX::SymTab)
384 Add(InX::SymTab);
Rafael Espindola895aea62017-05-11 22:02:41 +0000385 Add(InX::ShStrTab);
386 if (InX::StrTab)
387 Add(InX::StrTab);
Michael J. Spencer84487f12015-07-24 21:03:07 +0000388}
389
Rafael Espindola5616adf2017-03-08 22:36:28 +0000390static bool shouldKeepInSymtab(SectionBase *Sec, StringRef SymName,
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000391 const SymbolBody &B) {
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000392 if (B.isFile() || B.isSection())
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000393 return false;
394
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000395 // If sym references a section in a discarded group, don't keep it.
Rafael Espindola774ea7d2017-02-23 16:49:07 +0000396 if (Sec == &InputSection::Discarded)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000397 return false;
398
George Rimar9503f6d2016-08-31 08:46:30 +0000399 if (Config->Discard == DiscardPolicy::None)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000400 return true;
401
402 // In ELF assembly .L symbols are normally discarded by the assembler.
403 // If the assembler fails to do so, the linker discards them if
404 // * --discard-locals is used.
405 // * The symbol is in a SHF_MERGE section, which is normally the reason for
406 // the assembler keeping the .L symbol.
407 if (!SymName.startswith(".L") && !SymName.empty())
408 return true;
409
George Rimar9503f6d2016-08-31 08:46:30 +0000410 if (Config->Discard == DiscardPolicy::Locals)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000411 return false;
412
Rafael Espindola1854a8e2016-10-26 12:36:56 +0000413 return !Sec || !(Sec->Flags & SHF_MERGE);
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000414}
415
George Rimar7702bc22017-03-16 11:20:02 +0000416static bool includeInSymtab(const SymbolBody &B) {
Rafael Espindola474eb012016-05-05 16:40:28 +0000417 if (!B.isLocal() && !B.symbol()->IsUsedInRegularObj)
418 return false;
419
Rui Ueyama80474a22017-02-28 19:29:55 +0000420 if (auto *D = dyn_cast<DefinedRegular>(&B)) {
Rafael Espindola474eb012016-05-05 16:40:28 +0000421 // Always include absolute symbols.
Rafael Espindola5616adf2017-03-08 22:36:28 +0000422 SectionBase *Sec = D->Section;
423 if (!Sec)
Rafael Espindola474eb012016-05-05 16:40:28 +0000424 return true;
Rafael Espindola5616adf2017-03-08 22:36:28 +0000425 if (auto *IS = dyn_cast<InputSectionBase>(Sec)) {
426 Sec = IS->Repl;
427 IS = cast<InputSectionBase>(Sec);
428 // Exclude symbols pointing to garbage-collected sections.
429 if (!IS->Live)
430 return false;
431 }
432 if (auto *S = dyn_cast<MergeInputSection>(Sec))
Rui Ueyama90fa3722016-05-22 00:41:38 +0000433 if (!S->getSectionPiece(D->Value)->Live)
Rafael Espindola474eb012016-05-05 16:40:28 +0000434 return false;
435 }
436 return true;
437}
Rafael Espindola462220d2016-05-05 16:38:46 +0000438
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000439// Local symbols are not in the linker's symbol table. This function scans
440// each object file's symbol table to copy local symbols to the output.
441template <class ELFT> void Writer<ELFT>::copyLocalSymbols() {
George Rimar69b17c32017-05-16 10:04:42 +0000442 if (!InX::SymTab)
Rui Ueyama90f76fb2016-01-21 03:07:38 +0000443 return;
George Rimar696a7f92017-09-19 09:20:54 +0000444 for (InputFile *File : ObjectFiles) {
445 ObjFile<ELFT> *F = cast<ObjFile<ELFT>>(File);
Rafael Espindola67d72c02016-03-11 12:06:30 +0000446 for (SymbolBody *B : F->getLocalSymbols()) {
George Rimar78fe56e2016-10-11 09:07:14 +0000447 if (!B->IsLocal)
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000448 fatal(toString(F) +
George Rimar78fe56e2016-10-11 09:07:14 +0000449 ": broken object: getLocalSymbols returns a non-local symbol");
Rui Ueyama80474a22017-02-28 19:29:55 +0000450 auto *DR = dyn_cast<DefinedRegular>(B);
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000451
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000452 // No reason to keep local undefined symbol in symtab.
453 if (!DR)
Rafael Espindola444576d2015-10-09 19:25:07 +0000454 continue;
George Rimar7702bc22017-03-16 11:20:02 +0000455 if (!includeInSymtab(*B))
Rafael Espindola462220d2016-05-05 16:38:46 +0000456 continue;
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000457
Rafael Espindola5616adf2017-03-08 22:36:28 +0000458 SectionBase *Sec = DR->Section;
George Rimar7702bc22017-03-16 11:20:02 +0000459 if (!shouldKeepInSymtab(Sec, B->getName(), *B))
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000460 continue;
George Rimar69b17c32017-05-16 10:04:42 +0000461 InX::SymTab->addSymbol(B);
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000462 }
463 }
464}
465
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000466template <class ELFT> void Writer<ELFT>::addSectionSymbols() {
467 // Create one STT_SECTION symbol for each output section we might
468 // have a relocation with.
Rui Ueyamaac27de92017-10-11 01:19:33 +0000469 for (BaseCommand *Base : Script->Commands) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000470 auto *Sec = dyn_cast<OutputSection>(Base);
471 if (!Sec)
Rui Ueyama73d29ab2017-02-28 19:43:54 +0000472 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000473 auto I = llvm::find_if(Sec->Commands, [](BaseCommand *Base) {
Rafael Espindolad48b2082017-07-04 19:08:40 +0000474 if (auto *ISD = dyn_cast<InputSectionDescription>(Base))
475 return !ISD->Sections.empty();
476 return false;
477 });
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000478 if (I == Sec->Commands.end())
Rafael Espindolad48b2082017-07-04 19:08:40 +0000479 continue;
480 InputSection *IS = cast<InputSectionDescription>(*I)->Sections[0];
Rui Ueyama73d29ab2017-02-28 19:43:54 +0000481 if (isa<SyntheticSection>(IS) || IS->Type == SHT_REL ||
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000482 IS->Type == SHT_RELA)
483 continue;
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000484
Rui Ueyama175e81c2017-02-28 19:36:30 +0000485 auto *Sym =
486 make<DefinedRegular>("", /*IsLocal=*/true, /*StOther=*/0, STT_SECTION,
Rafael Espindola6e93d052017-08-04 22:31:42 +0000487 /*Value=*/0, /*Size=*/0, IS);
George Rimar69b17c32017-05-16 10:04:42 +0000488 InX::SymTab->addSymbol(Sym);
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000489 }
490}
491
Rui Ueyama26ad0572017-02-16 04:51:46 +0000492// Today's loaders have a feature to make segments read-only after
493// processing dynamic relocations to enhance security. PT_GNU_RELRO
494// is defined for that.
495//
496// This function returns true if a section needs to be put into a
497// PT_GNU_RELRO segment.
Rafael Espindoladc49af92017-07-24 23:55:33 +0000498static bool isRelroSection(const OutputSection *Sec) {
Rafael Espindola4fc60442016-02-10 22:43:13 +0000499 if (!Config->ZRelro)
500 return false;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000501
Rafael Espindolae08e78d2016-11-09 23:23:45 +0000502 uint64_t Flags = Sec->Flags;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000503
504 // Non-allocatable or non-writable sections don't need RELRO because
505 // they are not writable or not even mapped to memory in the first place.
506 // RELRO is for sections that are essentially read-only but need to
507 // be writable only at process startup to allow dynamic linker to
508 // apply relocations.
George Rimare3336c02015-11-24 10:15:50 +0000509 if (!(Flags & SHF_ALLOC) || !(Flags & SHF_WRITE))
510 return false;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000511
512 // Once initialized, TLS data segments are used as data templates
513 // for a thread-local storage. For each new thread, runtime
514 // allocates memory for a TLS and copy templates there. No thread
515 // are supposed to use templates directly. Thus, it can be in RELRO.
Rui Ueyamaccfc3262015-12-10 19:13:08 +0000516 if (Flags & SHF_TLS)
517 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000518
Rui Ueyama9d773f32017-04-13 05:40:07 +0000519 // .init_array, .preinit_array and .fini_array contain pointers to
520 // functions that are executed on process startup or exit. These
521 // pointers are set by the static linker, and they are not expected
522 // to change at runtime. But if you are an attacker, you could do
523 // interesting things by manipulating pointers in .fini_array, for
524 // example. So they are put into RELRO.
Rafael Espindola04a2e342016-11-09 01:42:41 +0000525 uint32_t Type = Sec->Type;
Rui Ueyamaccfc3262015-12-10 19:13:08 +0000526 if (Type == SHT_INIT_ARRAY || Type == SHT_FINI_ARRAY ||
527 Type == SHT_PREINIT_ARRAY)
George Rimare3336c02015-11-24 10:15:50 +0000528 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000529
Rui Ueyama9d773f32017-04-13 05:40:07 +0000530 // .got contains pointers to external symbols. They are resolved by
531 // the dynamic linker when a module is loaded into memory, and after
532 // that they are not expected to change. So, it can be in RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000533 if (InX::Got && Sec == InX::Got->getParent())
Simon Atanasyan725dc142016-11-16 21:01:02 +0000534 return true;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000535
536 // .got.plt contains pointers to external function symbols. They are
537 // by default resolved lazily, so we usually cannot put it into RELRO.
538 // However, if "-z now" is given, the lazy symbol resolution is
539 // disabled, which enables us to put it into RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000540 if (Sec == InX::GotPlt->getParent())
Rui Ueyama9d773f32017-04-13 05:40:07 +0000541 return Config->ZNow;
542
543 // .dynamic section contains data for the dynamic linker, and
544 // there's no need to write to it at runtime, so it's better to put
545 // it into RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000546 if (Sec == InX::Dynamic->getParent())
Rui Ueyama9d773f32017-04-13 05:40:07 +0000547 return true;
548
549 // .bss.rel.ro is used for copy relocations for read-only symbols.
550 // Since the dynamic linker needs to process copy relocations, the
551 // section cannot be read-only, but once initialized, they shouldn't
552 // change.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000553 if (Sec == InX::BssRelRo->getParent())
Peter Collingbournefeb66292017-01-10 01:21:50 +0000554 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000555
Rui Ueyama9d773f32017-04-13 05:40:07 +0000556 // Sections with some special names are put into RELRO. This is a
557 // bit unfortunate because section names shouldn't be significant in
558 // ELF in spirit. But in reality many linker features depend on
559 // magic section names.
Rafael Espindola40849412017-02-24 14:28:00 +0000560 StringRef S = Sec->Name;
Rui Ueyama01faef02015-12-10 19:19:04 +0000561 return S == ".data.rel.ro" || S == ".ctors" || S == ".dtors" || S == ".jcr" ||
George Rimard003c7f2016-12-20 11:28:54 +0000562 S == ".eh_frame" || S == ".openbsd.randomdata";
George Rimare3336c02015-11-24 10:15:50 +0000563}
564
// We compute a rank for each section. The rank indicates where the
// section should be placed in the file. Instead of using simple
// numbers (0,1,2...), we use a series of flags. One for each decision
// point when placing the section.
// Using flags has two key properties:
// * It is easy to check if a given branch was taken.
// * It is easy to see how similar two ranks are (see getRankProximity).
//
// Flags are listed from the most significant bit down, i.e. in the order
// in which getSectionRank makes its decisions. A lower rank sorts earlier
// (see compareSections).
enum RankFlags {
  // Set unless the section name has an entry in Config->SectionStartMap.
  RF_NOT_ADDR_SET = 1 << 16,
  // Set unless the section is named ".interp".
  RF_NOT_INTERP = 1 << 15,
  // Set for sections without SHF_ALLOC.
  RF_NOT_ALLOC = 1 << 14,
  // Set for writable, non-executable sections.
  RF_WRITE = 1 << 13,
  // Set for sections that are both executable and writable.
  RF_EXEC_WRITE = 1 << 12,
  // Set for executable, non-writable sections unless Config->SingleRoRx.
  RF_EXEC = 1 << 11,
  // Set for SHT_NOBITS sections that are not SHF_TLS.
  RF_NON_TLS_BSS = 1 << 10,
  // Set when exactly one of "non-TLS nobits" and "RELRO" holds.
  RF_NON_TLS_BSS_RO = 1 << 9,
  // Set for sections without SHF_TLS.
  RF_NOT_TLS = 1 << 8,
  // Set for SHT_NOBITS sections (TLS or not).
  RF_BSS = 1 << 7,
  // PPC64 only: set unless the section is named ".tocbss".
  RF_PPC_NOT_TOCBSS = 1 << 6,
  // PPC64 only: set for ".opd".
  RF_PPC_OPD = 1 << 5,
  // PPC64 only: set for ".toc1".
  RF_PPC_TOCL = 1 << 4,
  // PPC64 only: set for ".toc".
  RF_PPC_TOC = 1 << 3,
  // PPC64 only: set for ".branch_lt".
  RF_PPC_BRANCH_LT = 1 << 2,
  // MIPS only: set for sections with SHF_MIPS_GPREL.
  RF_MIPS_GPREL = 1 << 1,
  // MIPS only: set unless the section is named ".got".
  RF_MIPS_NOT_GOT = 1 << 0
};
Rui Ueyamae288eef2016-11-02 18:58:44 +0000591
Rafael Espindola52101412017-05-12 14:52:22 +0000592static unsigned getSectionRank(const OutputSection *Sec) {
593 unsigned Rank = 0;
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000594
Rafael Espindola5967c972016-12-19 21:21:07 +0000595 // We want to put section specified by -T option first, so we
596 // can start assigning VA starting from them later.
Rafael Espindola52101412017-05-12 14:52:22 +0000597 if (Config->SectionStartMap.count(Sec->Name))
598 return Rank;
599 Rank |= RF_NOT_ADDR_SET;
600
601 // Put .interp first because some loaders want to see that section
602 // on the first page of the executable file when loaded into memory.
603 if (Sec->Name == ".interp")
604 return Rank;
605 Rank |= RF_NOT_INTERP;
606
607 // Allocatable sections go first to reduce the total PT_LOAD size and
608 // so debug info doesn't change addresses in actual code.
609 if (!(Sec->Flags & SHF_ALLOC))
610 return Rank | RF_NOT_ALLOC;
Rafael Espindola5967c972016-12-19 21:21:07 +0000611
Rafael Espindolad23e9262017-05-26 17:23:25 +0000612 // Sort sections based on their access permission in the following
613 // order: R, RX, RWX, RW. This order is based on the following
614 // considerations:
615 // * Read-only sections come first such that they go in the
616 // PT_LOAD covering the program headers at the start of the file.
617 // * Read-only, executable sections come next, unless the
618 // -no-rosegment option is used.
619 // * Writable, executable sections follow such that .plt on
620 // architectures where it needs to be writable will be placed
621 // between .text and .data.
622 // * Writable sections come last, such that .bss lands at the very
623 // end of the last PT_LOAD.
624 bool IsExec = Sec->Flags & SHF_EXECINSTR;
625 bool IsWrite = Sec->Flags & SHF_WRITE;
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000626
Rafael Espindolad23e9262017-05-26 17:23:25 +0000627 if (IsExec) {
628 if (IsWrite)
629 Rank |= RF_EXEC_WRITE;
630 else if (!Config->SingleRoRx)
Rafael Espindola52101412017-05-12 14:52:22 +0000631 Rank |= RF_EXEC;
Rafael Espindolad23e9262017-05-26 17:23:25 +0000632 } else {
633 if (IsWrite)
634 Rank |= RF_WRITE;
Rafael Espindolae979fd12016-09-29 22:48:55 +0000635 }
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000636
Hal Finkel0d7e83b2015-10-13 17:57:46 +0000637 // If we got here we know that both A and B are in the same PT_LOAD.
Michael J. Spencer1bf73002015-10-16 23:11:07 +0000638
Rafael Espindola52101412017-05-12 14:52:22 +0000639 bool IsTls = Sec->Flags & SHF_TLS;
640 bool IsNoBits = Sec->Type == SHT_NOBITS;
Hal Finkel3bae2d82015-10-12 20:51:48 +0000641
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000642 // The first requirement we have is to put (non-TLS) nobits sections last. The
643 // reason is that the only thing the dynamic linker will see about them is a
644 // p_memsz that is larger than p_filesz. Seeing that it zeros the end of the
645 // PT_LOAD, so that has to correspond to the nobits sections.
Rafael Espindola52101412017-05-12 14:52:22 +0000646 bool IsNonTlsNoBits = IsNoBits && !IsTls;
647 if (IsNonTlsNoBits)
648 Rank |= RF_NON_TLS_BSS;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000649
650 // We place nobits RelRo sections before plain r/w ones, and non-nobits RelRo
651 // sections after r/w ones, so that the RelRo sections are contiguous.
Rafael Espindola52101412017-05-12 14:52:22 +0000652 bool IsRelRo = isRelroSection(Sec);
653 if (IsNonTlsNoBits && !IsRelRo)
654 Rank |= RF_NON_TLS_BSS_RO;
655 if (!IsNonTlsNoBits && IsRelRo)
656 Rank |= RF_NON_TLS_BSS_RO;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000657
658 // The TLS initialization block needs to be a single contiguous block in a R/W
659 // PT_LOAD, so stick TLS sections directly before the other RelRo R/W
660 // sections. The TLS NOBITS sections are placed here as they don't take up
661 // virtual address space in the PT_LOAD.
Rafael Espindola52101412017-05-12 14:52:22 +0000662 if (!IsTls)
663 Rank |= RF_NOT_TLS;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000664
665 // Within the TLS initialization block, the non-nobits sections need to appear
666 // first.
Rafael Espindola52101412017-05-12 14:52:22 +0000667 if (IsNoBits)
668 Rank |= RF_BSS;
George Rimare3336c02015-11-24 10:15:50 +0000669
Ben Dunbobbin95637552017-08-18 16:15:36 +0000670 // Some architectures have additional ordering restrictions for sections
671 // within the same PT_LOAD.
Rafael Espindola52101412017-05-12 14:52:22 +0000672 if (Config->EMachine == EM_PPC64) {
673 // PPC64 has a number of special SHT_PROGBITS+SHF_ALLOC+SHF_WRITE sections
674 // that we would like to make sure appear is a specific order to maximize
675 // their coverage by a single signed 16-bit offset from the TOC base
676 // pointer. Conversely, the special .tocbss section should be first among
677 // all SHT_NOBITS sections. This will put it next to the loaded special
678 // PPC64 sections (and, thus, within reach of the TOC base pointer).
679 StringRef Name = Sec->Name;
680 if (Name != ".tocbss")
681 Rank |= RF_PPC_NOT_TOCBSS;
Hal Finkel9abc2a52015-10-13 19:07:29 +0000682
Rafael Espindola52101412017-05-12 14:52:22 +0000683 if (Name == ".opd")
684 Rank |= RF_PPC_OPD;
685
686 if (Name == ".toc1")
687 Rank |= RF_PPC_TOCL;
688
689 if (Name == ".toc")
690 Rank |= RF_PPC_TOC;
691
692 if (Name == ".branch_lt")
693 Rank |= RF_PPC_BRANCH_LT;
694 }
695 if (Config->EMachine == EM_MIPS) {
696 // All sections with SHF_MIPS_GPREL flag should be grouped together
697 // because data in these sections is addressable with a gp relative address.
698 if (Sec->Flags & SHF_MIPS_GPREL)
699 Rank |= RF_MIPS_GPREL;
700
701 if (Sec->Name != ".got")
702 Rank |= RF_MIPS_NOT_GOT;
703 }
704
705 return Rank;
706}
707
Rafael Espindola383971d2017-06-15 21:51:01 +0000708static bool compareSections(const BaseCommand *ACmd, const BaseCommand *BCmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000709 const OutputSection *A = cast<OutputSection>(ACmd);
710 const OutputSection *B = cast<OutputSection>(BCmd);
Rafael Espindola52101412017-05-12 14:52:22 +0000711 if (A->SortRank != B->SortRank)
712 return A->SortRank < B->SortRank;
713 if (!(A->SortRank & RF_NOT_ADDR_SET))
714 return Config->SectionStartMap.lookup(A->Name) <
715 Config->SectionStartMap.lookup(B->Name);
Rafael Espindola24c073d2016-09-21 22:36:19 +0000716 return false;
717}
718
Rafael Espindola24e6f362017-02-24 15:07:30 +0000719void PhdrEntry::add(OutputSection *Sec) {
George Rimar6823c5f2017-09-07 11:01:10 +0000720 LastSec = Sec;
721 if (!FirstSec)
722 FirstSec = Sec;
Rafael Espindola37707632017-03-07 14:55:52 +0000723 p_align = std::max(p_align, Sec->Alignment);
Rafael Espindola17cb7c02016-12-19 17:01:01 +0000724 if (p_type == PT_LOAD)
George Rimar582ede82017-09-07 10:53:07 +0000725 Sec->PtLoad = this;
Eugene Leviantbbe38602016-07-19 09:25:43 +0000726}
727
Denis Protivensky8e3b38a2015-11-12 09:52:08 +0000728template <class ELFT>
Rafael Espindola5616adf2017-03-08 22:36:28 +0000729static Symbol *addRegular(StringRef Name, SectionBase *Sec, uint64_t Value,
730 uint8_t StOther = STV_HIDDEN,
731 uint8_t Binding = STB_WEAK) {
Rafael Espindoladab02d42016-11-17 21:20:16 +0000732 // The linker generated symbols are added as STB_WEAK to allow user defined
733 // ones to override them.
Rafael Espindola244ef982017-07-26 18:42:48 +0000734 return Symtab->addRegular<ELFT>(Name, StOther, STT_NOTYPE, Value,
735 /*Size=*/0, Binding, Sec,
736 /*File=*/nullptr);
Eugene Leviantad4439e2016-11-11 11:33:32 +0000737}
738
739template <class ELFT>
Rafael Espindola5616adf2017-03-08 22:36:28 +0000740static DefinedRegular *
741addOptionalRegular(StringRef Name, SectionBase *Sec, uint64_t Val,
742 uint8_t StOther = STV_HIDDEN, uint8_t Binding = STB_GLOBAL) {
Rafael Espindola244ef982017-07-26 18:42:48 +0000743 SymbolBody *S = Symtab->find(Name);
Eugene Leviantad4439e2016-11-11 11:33:32 +0000744 if (!S)
745 return nullptr;
Rafael Espindola1d6d1b42017-01-17 16:08:06 +0000746 if (S->isInCurrentDSO())
Rafael Espindola5616adf2017-03-08 22:36:28 +0000747 return nullptr;
748 return cast<DefinedRegular>(
749 addRegular<ELFT>(Name, Sec, Val, StOther, Binding)->body());
Eugene Leviantad4439e2016-11-11 11:33:32 +0000750}
751
Rui Ueyama01687222015-12-26 09:47:57 +0000752// The beginning and the ending of .rel[a].plt section are marked
753// with __rel[a]_iplt_{start,end} symbols if it is a statically linked
754// executable. The runtime needs these symbols in order to resolve
755// all IRELATIVE relocs on startup. For dynamic executables, we don't
756// need these symbols, since IRELATIVE relocs are resolved through GOT
757// and PLT. For details, see http://www.airs.com/blog/archives/403.
George Rimaree741cf2016-04-14 13:23:02 +0000758template <class ELFT> void Writer<ELFT>::addRelIpltSymbols() {
Shoaib Meenai335fad12017-08-05 05:01:07 +0000759 if (!Config->Static)
George Rimara07ff662015-12-21 10:12:06 +0000760 return;
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000761 StringRef S = Config->IsRela ? "__rela_iplt_start" : "__rel_iplt_start";
Rafael Espindola5616adf2017-03-08 22:36:28 +0000762 addOptionalRegular<ELFT>(S, In<ELFT>::RelaIplt, 0, STV_HIDDEN, STB_WEAK);
Rui Ueyama01687222015-12-26 09:47:57 +0000763
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000764 S = Config->IsRela ? "__rela_iplt_end" : "__rel_iplt_end";
Rafael Espindola5616adf2017-03-08 22:36:28 +0000765 addOptionalRegular<ELFT>(S, In<ELFT>::RelaIplt, -1, STV_HIDDEN, STB_WEAK);
George Rimara07ff662015-12-21 10:12:06 +0000766}
767
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000768// The linker is expected to define some symbols depending on
769// the linking result. This function defines such symbols.
770template <class ELFT> void Writer<ELFT>::addReservedSymbols() {
George Rimar7beff422016-11-15 08:19:02 +0000771 if (Config->EMachine == EM_MIPS) {
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000772 // Define _gp for MIPS. st_value of _gp symbol will be updated by Writer
Simon Atanasyan6a4eb752016-12-08 06:19:47 +0000773 // so that it points to an absolute address which by default is relative
774 // to GOT. Default offset is 0x7ff0.
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000775 // See "Global Data Symbols" in Chapter 6 in the following document:
776 // ftp://www.linux-mips.org/pub/linux/mips/doc/ABI/mipsabi.pdf
Rafael Espindola244ef982017-07-26 18:42:48 +0000777 ElfSym::MipsGp = Symtab->addAbsolute<ELFT>("_gp", STV_HIDDEN, STB_LOCAL);
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000778
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000779 // On MIPS O32 ABI, _gp_disp is a magic symbol designates offset between
Simon Atanasyand34a3632017-03-20 21:03:43 +0000780 // start of function and 'gp' pointer into GOT.
Rafael Espindola244ef982017-07-26 18:42:48 +0000781 if (Symtab->find("_gp_disp"))
Rui Ueyama80474a22017-02-28 19:29:55 +0000782 ElfSym::MipsGpDisp =
Rafael Espindola244ef982017-07-26 18:42:48 +0000783 Symtab->addAbsolute<ELFT>("_gp_disp", STV_HIDDEN, STB_LOCAL);
Peter Collingbourne6f535b72016-05-03 18:03:45 +0000784
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000785 // The __gnu_local_gp is a magic symbol equal to the current value of 'gp'
786 // pointer. This symbol is used in the code generated by .cpload pseudo-op
787 // in case of using -mno-shared option.
788 // https://sourceware.org/ml/binutils/2004-12/msg00094.html
Rafael Espindola244ef982017-07-26 18:42:48 +0000789 if (Symtab->find("__gnu_local_gp"))
Rui Ueyama80474a22017-02-28 19:29:55 +0000790 ElfSym::MipsLocalGp =
Rafael Espindola244ef982017-07-26 18:42:48 +0000791 Symtab->addAbsolute<ELFT>("__gnu_local_gp", STV_HIDDEN, STB_LOCAL);
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000792 }
793
Peter Smith113a59e2017-06-26 10:22:17 +0000794 // The _GLOBAL_OFFSET_TABLE_ symbol is defined by target convention to
795 // be at some offset from the base of the .got section, usually 0 or the end
796 // of the .got
Rui Ueyama92c37812017-06-26 15:11:24 +0000797 InputSection *GotSection = InX::MipsGot ? cast<InputSection>(InX::MipsGot)
798 : cast<InputSection>(InX::Got);
799 ElfSym::GlobalOffsetTable = addOptionalRegular<ELFT>(
800 "_GLOBAL_OFFSET_TABLE_", GotSection, Target->GotBaseSymOff);
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000801
Petr Hosek6b936bf2017-05-10 16:20:33 +0000802 // __ehdr_start is the location of ELF file headers. Note that we define
803 // this symbol unconditionally even when using a linker script, which
804 // differs from the behavior implemented by GNU linker which only define
805 // this symbol if ELF headers are in the memory mapped segment.
Rafael Espindola0e454a92017-06-06 16:18:48 +0000806 // __executable_start is not documented, but the expectation of at
807 // least the android libc is that it points to the elf header too.
808 // __dso_handle symbol is passed to cxa_finalize as a marker to identify
809 // each DSO. The address of the symbol doesn't matter as long as they are
810 // different in different DSOs, so we chose the start address of the DSO.
811 for (const char *Name :
812 {"__ehdr_start", "__executable_start", "__dso_handle"})
813 addOptionalRegular<ELFT>(Name, Out::ElfHeader, 0, STV_HIDDEN);
Petr Hosek6b936bf2017-05-10 16:20:33 +0000814
George Rimar28ac19c2016-08-08 08:42:48 +0000815 // If linker script do layout we do not need to create any standart symbols.
Rui Ueyamaac27de92017-10-11 01:19:33 +0000816 if (Script->HasSections)
George Rimar28ac19c2016-08-08 08:42:48 +0000817 return;
818
Davide Italiano763febc2017-09-18 18:31:49 +0000819 auto Add = [](StringRef S, int64_t Pos) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000820 return addOptionalRegular<ELFT>(S, Out::ElfHeader, Pos, STV_DEFAULT);
George Rimar9e859392016-02-26 14:36:36 +0000821 };
822
Rafael Espindola4d560162017-09-12 16:38:01 +0000823 ElfSym::Bss = Add("__bss_start", 0);
Davide Italiano763febc2017-09-18 18:31:49 +0000824 ElfSym::End1 = Add("end", -1);
825 ElfSym::End2 = Add("_end", -1);
826 ElfSym::Etext1 = Add("etext", -1);
827 ElfSym::Etext2 = Add("_etext", -1);
828 ElfSym::Edata1 = Add("edata", -1);
829 ElfSym::Edata2 = Add("_edata", -1);
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000830}
831
Rui Ueyamac4185702016-02-10 23:20:42 +0000832// Sort input sections by section name suffixes for
833// __attribute__((init_priority(N))).
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000834static void sortInitFini(OutputSection *Cmd) {
Rafael Espindola21263342017-07-05 23:36:24 +0000835 if (Cmd)
836 Cmd->sortInitFini();
Rui Ueyama5af83682016-02-11 23:41:38 +0000837}
838
839// Sort input sections by the special rule for .ctors and .dtors.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000840static void sortCtorsDtors(OutputSection *Cmd) {
Rafael Espindola21263342017-07-05 23:36:24 +0000841 if (Cmd)
842 Cmd->sortCtorsDtors();
Rui Ueyamac4185702016-02-10 23:20:42 +0000843}
844
George Rimar1a33c0f2016-11-10 09:05:20 +0000845// Sort input sections using the list provided by --symbol-ordering-file.
George Rimar696a7f92017-09-19 09:20:54 +0000846static void sortBySymbolsOrder() {
George Rimar1a33c0f2016-11-10 09:05:20 +0000847 if (Config->SymbolOrderingFile.empty())
848 return;
849
Rui Ueyama31270312016-12-20 01:51:08 +0000850 // Sort sections by priority.
George Rimar696a7f92017-09-19 09:20:54 +0000851 DenseMap<SectionBase *, int> SectionOrder = buildSectionOrder();
Rui Ueyamaac27de92017-10-11 01:19:33 +0000852 for (BaseCommand *Base : Script->Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000853 if (auto *Sec = dyn_cast<OutputSection>(Base))
854 Sec->sort([&](InputSectionBase *S) { return SectionOrder.lookup(S); });
George Rimar1a33c0f2016-11-10 09:05:20 +0000855}
856
Eugene Leviante63d81b2016-07-20 14:43:20 +0000857template <class ELFT>
Rafael Espindolab4c9b812017-02-23 02:28:28 +0000858void Writer<ELFT>::forEachRelSec(std::function<void(InputSectionBase &)> Fn) {
George Rimarcb888a62017-09-13 07:54:47 +0000859 // Scan all relocations. Each relocation goes through a series
860 // of tests to determine if it needs special treatment, such as
861 // creating GOT, PLT, copy relocations, etc.
862 // Note that relocations for non-alloc sections are directly
863 // processed by InputSection::relocateNonAlloc.
864 for (InputSectionBase *IS : InputSections)
865 if (IS->Live && isa<InputSection>(IS) && (IS->Flags & SHF_ALLOC))
Rafael Espindola9f0c4bb2016-11-10 14:53:24 +0000866 Fn(*IS);
George Rimarcb888a62017-09-13 07:54:47 +0000867 for (EhInputSection *ES : In<ELFT>::EhFrame->Sections)
868 Fn(*ES);
Rafael Espindola0f7ceda2016-07-20 17:58:07 +0000869}
870
Eugene Leviant282251a2016-11-01 09:49:24 +0000871template <class ELFT> void Writer<ELFT>::createSections() {
Rui Ueyamac54d5b12017-10-06 23:34:43 +0000872 std::vector<OutputSection *> Vec;
Rui Ueyama536a2672017-02-27 02:32:08 +0000873 for (InputSectionBase *IS : InputSections)
Rafael Espindola82902742017-02-16 17:32:26 +0000874 if (IS)
Rui Ueyamac54d5b12017-10-06 23:34:43 +0000875 if (OutputSection *Sec =
876 Factory.addInputSec(IS, getOutputSectionName(IS->Name)))
877 Vec.push_back(Sec);
878
Rui Ueyamaac27de92017-10-11 01:19:33 +0000879 Script->Commands.insert(Script->Commands.begin(), Vec.begin(), Vec.end());
Eugene Leviantceabe802016-08-11 07:56:43 +0000880
Rafael Espindola21263342017-07-05 23:36:24 +0000881 Script->fabricateDefaultCommands();
George Rimar696a7f92017-09-19 09:20:54 +0000882 sortBySymbolsOrder();
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000883 sortInitFini(findSection(".init_array"));
884 sortInitFini(findSection(".fini_array"));
885 sortCtorsDtors(findSection(".ctors"));
886 sortCtorsDtors(findSection(".dtors"));
Eugene Leviante63d81b2016-07-20 14:43:20 +0000887}
888
Petr Hosek18821b62017-09-01 02:23:31 +0000889// This function generates assignments for predefined symbols (e.g. _end or
890// _etext) and inserts them into the commands sequence to be processed at the
891// appropriate time. This ensures that the value is going to be correct by the
892// time any references to these symbols are processed and is equivalent to
893// defining these symbols explicitly in the linker script.
Rafael Espindola4d560162017-09-12 16:38:01 +0000894template <class ELFT> void Writer<ELFT>::setReservedSymbolSections() {
Petr Hosek18821b62017-09-01 02:23:31 +0000895 PhdrEntry *Last = nullptr;
896 PhdrEntry *LastRO = nullptr;
897 PhdrEntry *LastRW = nullptr;
Rui Ueyama888da8c2017-09-05 20:17:37 +0000898
Petr Hosek18821b62017-09-01 02:23:31 +0000899 for (PhdrEntry *P : Phdrs) {
900 if (P->p_type != PT_LOAD)
901 continue;
902 Last = P;
903 if (P->p_flags & PF_W)
904 LastRW = P;
905 else
906 LastRO = P;
907 }
908
Rui Ueyama888da8c2017-09-05 20:17:37 +0000909 // _end is the first location after the uninitialized data region.
Petr Hosek18821b62017-09-01 02:23:31 +0000910 if (Last) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000911 if (ElfSym::End1)
912 ElfSym::End1->Section = Last->LastSec;
913 if (ElfSym::End2)
914 ElfSym::End2->Section = Last->LastSec;
Petr Hosek18821b62017-09-01 02:23:31 +0000915 }
Rui Ueyama888da8c2017-09-05 20:17:37 +0000916
917 // _etext is the first location after the last read-only loadable segment.
Petr Hosek18821b62017-09-01 02:23:31 +0000918 if (LastRO) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000919 if (ElfSym::Etext1)
920 ElfSym::Etext1->Section = LastRO->LastSec;
921 if (ElfSym::Etext2)
922 ElfSym::Etext2->Section = LastRO->LastSec;
Petr Hosek18821b62017-09-01 02:23:31 +0000923 }
Rui Ueyama888da8c2017-09-05 20:17:37 +0000924
925 // _edata points to the end of the last non SHT_NOBITS section.
Petr Hosek18821b62017-09-01 02:23:31 +0000926 if (LastRW) {
Rui Ueyama888da8c2017-09-05 20:17:37 +0000927 size_t I = 0;
Rafael Espindola4d560162017-09-12 16:38:01 +0000928 for (; I < OutputSections.size(); ++I)
929 if (OutputSections[I] == LastRW->FirstSec)
Rui Ueyama888da8c2017-09-05 20:17:37 +0000930 break;
931
Rafael Espindola4d560162017-09-12 16:38:01 +0000932 for (; I < OutputSections.size(); ++I) {
933 if (OutputSections[I]->Type != SHT_NOBITS)
Rui Ueyama888da8c2017-09-05 20:17:37 +0000934 continue;
Rui Ueyama888da8c2017-09-05 20:17:37 +0000935 break;
Petr Hosek18821b62017-09-01 02:23:31 +0000936 }
Rafael Espindola4d560162017-09-12 16:38:01 +0000937 if (ElfSym::Edata1)
938 ElfSym::Edata1->Section = OutputSections[I - 1];
939 if (ElfSym::Edata2)
940 ElfSym::Edata2->Section = OutputSections[I - 1];
941 }
942
943 if (ElfSym::Bss)
944 ElfSym::Bss->Section = findSection(".bss");
945
946 // Setup MIPS _gp_disp/__gnu_local_gp symbols which should
947 // be equal to the _gp symbol's value.
Rafael Espindola9be24cf2017-09-20 18:30:57 +0000948 if (ElfSym::MipsGp) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000949 // Find GP-relative section with the lowest address
950 // and use this address to calculate default _gp value.
951 for (OutputSection *OS : OutputSections) {
952 if (OS->Flags & SHF_MIPS_GPREL) {
953 ElfSym::MipsGp->Section = OS;
954 ElfSym::MipsGp->Value = 0x7ff0;
955 break;
956 }
957 }
Petr Hosek18821b62017-09-01 02:23:31 +0000958 }
959}
960
Rafael Espindola52101412017-05-12 14:52:22 +0000961// We want to find how similar two ranks are.
962// The more branches in getSectionRank that match, the more similar they are.
963// Since each branch corresponds to a bit flag, we can just use
964// countLeadingZeros.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000965static int getRankProximityAux(OutputSection *A, OutputSection *B) {
Rafael Espindola52101412017-05-12 14:52:22 +0000966 return countLeadingZeros(A->SortRank ^ B->SortRank);
Eugene Leviantbae1c652016-11-08 10:44:48 +0000967}
968
Rafael Espindola383971d2017-06-15 21:51:01 +0000969static int getRankProximity(OutputSection *A, BaseCommand *B) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000970 if (auto *Sec = dyn_cast<OutputSection>(B))
971 if (Sec->Live)
972 return getRankProximityAux(A, Sec);
Rafael Espindola383971d2017-06-15 21:51:01 +0000973 return -1;
974}
975
976// When placing orphan sections, we want to place them after symbol assignments
977// so that an orphan after
978// begin_foo = .;
979// foo : { *(foo) }
980// end_foo = .;
981// doesn't break the intended meaning of the begin/end symbols.
982// We don't want to go over sections since findOrphanPos is the
983// one in charge of deciding the order of the sections.
984// We don't want to go over changes to '.', since doing so in
985// rx_sec : { *(rx_sec) }
986// . = ALIGN(0x1000);
987// /* The RW PT_LOAD starts here*/
988// rw_sec : { *(rw_sec) }
989// would mean that the RW PT_LOAD would become unaligned.
990static bool shouldSkip(BaseCommand *Cmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000991 if (isa<OutputSection>(Cmd))
Rafael Espindola383971d2017-06-15 21:51:01 +0000992 return false;
993 if (auto *Assign = dyn_cast<SymbolAssignment>(Cmd))
994 return Assign->Name != ".";
995 return true;
996}
997
Rafael Espindola52101412017-05-12 14:52:22 +0000998// We want to place orphan sections so that they share as much
999// characteristics with their neighbors as possible. For example, if
1000// both are rw, or both are tls.
Rafael Espindola0ca37122017-05-09 13:58:46 +00001001template <typename ELFT>
Rafael Espindola383971d2017-06-15 21:51:01 +00001002static std::vector<BaseCommand *>::iterator
1003findOrphanPos(std::vector<BaseCommand *>::iterator B,
1004 std::vector<BaseCommand *>::iterator E) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001005 OutputSection *Sec = cast<OutputSection>(*E);
Rafael Espindola0ca37122017-05-09 13:58:46 +00001006
Rafael Espindola52101412017-05-12 14:52:22 +00001007 // Find the first element that has as close a rank as possible.
Rafael Espindola383971d2017-06-15 21:51:01 +00001008 auto I = std::max_element(B, E, [=](BaseCommand *A, BaseCommand *B) {
Rafael Espindola52101412017-05-12 14:52:22 +00001009 return getRankProximity(Sec, A) < getRankProximity(Sec, B);
1010 });
1011 if (I == E)
Rafael Espindola0ca37122017-05-09 13:58:46 +00001012 return E;
1013
Rafael Espindola52101412017-05-12 14:52:22 +00001014 // Consider all existing sections with the same proximity.
Rafael Espindola383971d2017-06-15 21:51:01 +00001015 int Proximity = getRankProximity(Sec, *I);
1016 for (; I != E; ++I) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001017 auto *CurSec = dyn_cast<OutputSection>(*I);
1018 if (!CurSec || !CurSec->Live)
Rafael Espindola383971d2017-06-15 21:51:01 +00001019 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001020 if (getRankProximity(Sec, CurSec) != Proximity ||
1021 Sec->SortRank < CurSec->SortRank)
Rafael Espindola383971d2017-06-15 21:51:01 +00001022 break;
1023 }
Andrew Ng4d54a4b2017-10-10 10:05:52 +00001024 auto J = std::find_if(llvm::make_reverse_iterator(I),
1025 llvm::make_reverse_iterator(B), [](BaseCommand *Cmd) {
1026 auto *OS = dyn_cast<OutputSection>(Cmd);
1027 return OS && OS->Live;
1028 });
Rafael Espindola383971d2017-06-15 21:51:01 +00001029 I = J.base();
Rafael Espindolaaad64e02017-09-19 17:29:58 +00001030
1031 // As a special case, if the orphan section is the last section, put
1032 // it at the very end, past any other commands.
1033 // This matches bfd's behavior and is convenient when the linker script fully
1034 // specifies the start of the file, but doesn't care about the end (the non
1035 // alloc sections for example).
1036 auto NextSec = std::find_if(
1037 I, E, [](BaseCommand *Cmd) { return isa<OutputSection>(Cmd); });
1038 if (NextSec == E)
1039 return E;
1040
Rafael Espindola383971d2017-06-15 21:51:01 +00001041 while (I != E && shouldSkip(*I))
Rafael Espindola52101412017-05-12 14:52:22 +00001042 ++I;
1043 return I;
Rafael Espindola0ca37122017-05-09 13:58:46 +00001044}
1045
Rafael Espindola24c073d2016-09-21 22:36:19 +00001046template <class ELFT> void Writer<ELFT>::sortSections() {
George Rimarba455842017-10-02 09:11:13 +00001047 Script->adjustSectionsBeforeSorting();
George Rimare0b43df2017-06-28 09:59:34 +00001048
Rafael Espindola1960bcd2016-11-11 22:43:27 +00001049 // Don't sort if using -r. It is not necessary and we want to preserve the
1050 // relative order for SHF_LINK_ORDER sections.
1051 if (Config->Relocatable)
Rafael Espindola85de6782017-06-28 22:44:11 +00001052 return;
Rafael Espindola52101412017-05-12 14:52:22 +00001053
Rui Ueyamaac27de92017-10-11 01:19:33 +00001054 for (BaseCommand *Base : Script->Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001055 if (auto *Sec = dyn_cast<OutputSection>(Base))
1056 Sec->SortRank = getSectionRank(Sec);
Rafael Espindola52101412017-05-12 14:52:22 +00001057
Rui Ueyamaac27de92017-10-11 01:19:33 +00001058 if (!Script->HasSections) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001059 // We know that all the OutputSections are contiguous in
Rafael Espindola383971d2017-06-15 21:51:01 +00001060 // this case.
Rui Ueyamaac27de92017-10-11 01:19:33 +00001061 auto E = Script->Commands.end();
1062 auto I = Script->Commands.begin();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001063 auto IsSection = [](BaseCommand *Base) { return isa<OutputSection>(Base); };
Rafael Espindola383971d2017-06-15 21:51:01 +00001064 I = std::find_if(I, E, IsSection);
Rafael Espindolac54b1c82017-06-15 22:03:06 +00001065 E = std::find_if(llvm::make_reverse_iterator(E),
1066 llvm::make_reverse_iterator(I), IsSection)
Rafael Espindola383971d2017-06-15 21:51:01 +00001067 .base();
1068 std::stable_sort(I, E, compareSections);
Rafael Espindola24c073d2016-09-21 22:36:19 +00001069 return;
1070 }
1071
Rafael Espindola383971d2017-06-15 21:51:01 +00001072 // Orphan sections are sections present in the input files which are
1073 // not explicitly placed into the output file by the linker script.
1074 //
1075 // The sections in the linker script are already in the correct
1076 // order. We have to figure out where to insert the orphan
1077 // sections.
1078 //
Rafael Espindola24c073d2016-09-21 22:36:19 +00001079 // The order of the sections in the script is arbitrary and may not agree with
Rafael Espindola383971d2017-06-15 21:51:01 +00001080 // compareSections. This means that we cannot easily define a strict weak
1081 // ordering. To see why, consider a comparison of a section in the script and
1082 // one not in the script. We have two simple options:
Rafael Espindola24c073d2016-09-21 22:36:19 +00001083 // * Make them equivalent (a is not less than b, and b is not less than a).
1084 // The problem is then that equivalence has to be transitive and we can
1085 // have sections a, b and c with only b in a script and a less than c
1086 // which breaks this property.
1087 // * Use compareSectionsNonScript. Given that the script order doesn't have
1088 // to match, we can end up with sections a, b, c, d where b and c are in the
1089 // script and c is compareSectionsNonScript less than b. In which case d
1090 // can be equivalent to c, a to b and d < a. As a concrete example:
1091 // .a (rx) # not in script
1092 // .b (rx) # in script
1093 // .c (ro) # in script
1094 // .d (ro) # not in script
1095 //
1096 // The way we define an order then is:
Rafael Espindola383971d2017-06-15 21:51:01 +00001097 // * Sort only the orphan sections. They are in the end right now.
1098 // * Move each orphan section to its preferred position. We try
Eugene Leviantbae1c652016-11-08 10:44:48 +00001099 // to put each section in the last position where it can share
1100 // a PT_LOAD.
Rafael Espindola383971d2017-06-15 21:51:01 +00001101 //
1102 // There is some ambiguity as to where exactly a new entry should be
Rui Ueyamaac27de92017-10-11 01:19:33 +00001103 // inserted, because Commands contains not only output section
Rafael Espindola383971d2017-06-15 21:51:01 +00001104 // commands but also other types of commands such as symbol assignment
1105 // expressions. There's no correct answer here due to the lack of the
1106 // formal specification of the linker script. We use heuristics to
1107 // determine whether a new output command should be added before or
1108 // after another commands. For the details, look at shouldSkip
1109 // function.
Rafael Espindola24c073d2016-09-21 22:36:19 +00001110
Rui Ueyamaac27de92017-10-11 01:19:33 +00001111 auto I = Script->Commands.begin();
1112 auto E = Script->Commands.end();
Rafael Espindola383971d2017-06-15 21:51:01 +00001113 auto NonScriptI = std::find_if(I, E, [](BaseCommand *Base) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001114 if (auto *Sec = dyn_cast<OutputSection>(Base))
1115 return Sec->Live && Sec->SectionIndex == INT_MAX;
Rafael Espindola383971d2017-06-15 21:51:01 +00001116 return false;
1117 });
Rafael Espindola24c073d2016-09-21 22:36:19 +00001118
Rafael Espindola383971d2017-06-15 21:51:01 +00001119 // Sort the orphan sections.
1120 std::stable_sort(NonScriptI, E, compareSections);
1121
1122 // As a horrible special case, skip the first . assignment if it is before any
1123 // section. We do this because it is common to set a load address by starting
1124 // the script with ". = 0xabcd" and the expectation is that every section is
1125 // after that.
1126 auto FirstSectionOrDotAssignment =
1127 std::find_if(I, E, [](BaseCommand *Cmd) { return !shouldSkip(Cmd); });
1128 if (FirstSectionOrDotAssignment != E &&
1129 isa<SymbolAssignment>(**FirstSectionOrDotAssignment))
1130 ++FirstSectionOrDotAssignment;
1131 I = FirstSectionOrDotAssignment;
1132
Rafael Espindola52101412017-05-12 14:52:22 +00001133 while (NonScriptI != E) {
1134 auto Pos = findOrphanPos<ELFT>(I, NonScriptI);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001135 OutputSection *Orphan = cast<OutputSection>(*NonScriptI);
Rafael Espindola52101412017-05-12 14:52:22 +00001136
1137 // As an optimization, find all sections with the same sort rank
1138 // and insert them with one rotate.
Rafael Espindola383971d2017-06-15 21:51:01 +00001139 unsigned Rank = Orphan->SortRank;
1140 auto End = std::find_if(NonScriptI + 1, E, [=](BaseCommand *Cmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001141 return cast<OutputSection>(Cmd)->SortRank != Rank;
Rafael Espindola52101412017-05-12 14:52:22 +00001142 });
1143 std::rotate(Pos, NonScriptI, End);
1144 NonScriptI = End;
1145 }
Rafael Espindolaf7a17442016-11-14 15:39:38 +00001146
George Rimara8dba482017-03-20 10:09:58 +00001147 Script->adjustSectionsAfterSorting();
Rafael Espindola24c073d2016-09-21 22:36:19 +00001148}
1149
Peter Smith1ec42d92017-03-08 14:06:24 +00001150static void applySynthetic(const std::vector<SyntheticSection *> &Sections,
1151 std::function<void(SyntheticSection *)> Fn) {
Rui Ueyama9320cb02017-02-27 02:56:02 +00001152 for (SyntheticSection *SS : Sections)
Rafael Espindolad57c58d2017-06-07 02:31:19 +00001153 if (SS && SS->getParent() && !SS->empty())
Peter Smith1ec42d92017-03-08 14:06:24 +00001154 Fn(SS);
Eugene Leviant6380ce22016-11-15 12:26:55 +00001155}
1156
Rui Ueyama6aeea182017-10-02 18:54:59 +00001157// In order to allow users to manipulate linker-synthesized sections,
1158// we had to add synthetic sections to the input section list early,
1159// even before we make decisions whether they are needed. This allows
1160// users to write scripts like this: ".mygot : { .got }".
1161//
1162// Doing it has an unintended side effects. If it turns out that we
1163// don't need a .got (for example) at all because there's no
1164// relocation that needs a .got, we don't want to emit .got.
1165//
1166// To deal with the above problem, this function is called after
1167// scanRelocations is called to remove synthetic sections that turn
1168// out to be empty.
Rafael Espindolac080ff62017-07-03 16:54:39 +00001169static void removeUnusedSyntheticSections() {
Rafael Espindola9e9754b2017-02-03 13:06:18 +00001170 // All input synthetic sections that can be empty are placed after
1171 // all regular ones. We iterate over them all and exit at first
1172 // non-synthetic.
Rui Ueyama536a2672017-02-27 02:32:08 +00001173 for (InputSectionBase *S : llvm::reverse(InputSections)) {
Rui Ueyama9320cb02017-02-27 02:56:02 +00001174 SyntheticSection *SS = dyn_cast<SyntheticSection>(S);
Rui Ueyamac38860b2016-12-05 21:39:35 +00001175 if (!SS)
George Rimar11992c862016-11-25 08:05:41 +00001176 return;
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001177 OutputSection *OS = SS->getParent();
1178 if (!SS->empty() || !OS)
George Rimar11992c862016-11-25 08:05:41 +00001179 continue;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001180
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001181 std::vector<BaseCommand *>::iterator Empty = OS->Commands.end();
1182 for (auto I = OS->Commands.begin(), E = OS->Commands.end(); I != E; ++I) {
Rafael Espindola43ee3602017-07-03 17:32:09 +00001183 BaseCommand *B = *I;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001184 if (auto *ISD = dyn_cast<InputSectionDescription>(B)) {
George Rimar7ac38252017-09-08 13:26:45 +00001185 llvm::erase_if(ISD->Sections,
1186 [=](InputSection *IS) { return IS == SS; });
Rafael Espindolac080ff62017-07-03 16:54:39 +00001187 if (ISD->Sections.empty())
Rafael Espindola43ee3602017-07-03 17:32:09 +00001188 Empty = I;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001189 }
1190 }
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001191 if (Empty != OS->Commands.end())
1192 OS->Commands.erase(Empty);
Rafael Espindolac080ff62017-07-03 16:54:39 +00001193
James Henderson7ee22752017-04-06 09:40:03 +00001194 // If there are no other sections in the output section, remove it from the
1195 // output.
George Rimar9a2da392017-09-08 13:40:07 +00001196 if (OS->Commands.empty())
George Rimarba455842017-10-02 09:11:13 +00001197 OS->Live = false;
George Rimar11992c862016-11-25 08:05:41 +00001198 }
1199}
1200
Rafael Espindola35c908f2017-08-10 15:05:37 +00001201// Returns true if a symbol can be replaced at load-time by a symbol
1202// with the same name defined in other ELF executable or DSO.
1203static bool computeIsPreemptible(const SymbolBody &B) {
1204 assert(!B.isLocal());
Rafael Espindola35c908f2017-08-10 15:05:37 +00001205 // Only symbols that appear in dynsym can be preempted.
1206 if (!B.symbol()->includeInDynsym())
1207 return false;
1208
1209 // Only default visibility symbols can be preempted.
1210 if (B.symbol()->Visibility != STV_DEFAULT)
1211 return false;
1212
Rafael Espindola30ea5cf2017-09-12 17:18:03 +00001213 // At this point copy relocations have not been created yet, so any
1214 // symbol that is not defined locally is preemptible.
Rafael Espindolaee6a3522017-09-08 18:41:49 +00001215 if (!B.isInCurrentDSO())
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001216 return true;
1217
1218 // If we have a dynamic list it specifies which local symbols are preemptible.
Rafael Espindola8016bdf2017-09-08 18:53:43 +00001219 if (Config->HasDynamicList)
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001220 return false;
1221
Rafael Espindola35c908f2017-08-10 15:05:37 +00001222 if (!Config->Shared)
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001223 return false;
Rafael Espindola35c908f2017-08-10 15:05:37 +00001224
1225 // -Bsymbolic means that definitions are not preempted.
1226 if (Config->Bsymbolic || (Config->BsymbolicFunctions && B.isFunc()))
Rafael Espindola716c57b2017-09-08 18:23:25 +00001227 return false;
Rafael Espindola35c908f2017-08-10 15:05:37 +00001228 return true;
1229}
1230
Eugene Leviante63d81b2016-07-20 14:43:20 +00001231// Create output section objects and add them to OutputSections.
1232template <class ELFT> void Writer<ELFT>::finalizeSections() {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001233 Out::DebugInfo = findSection(".debug_info");
1234 Out::PreinitArray = findSection(".preinit_array");
1235 Out::InitArray = findSection(".init_array");
1236 Out::FiniArray = findSection(".fini_array");
Rafael Espindola77572242015-10-02 19:37:55 +00001237
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001238 // The linker needs to define SECNAME_start, SECNAME_end and SECNAME_stop
1239 // symbols for sections, so that the runtime can get the start and end
1240 // addresses of each section by section name. Add such symbols.
George Rimarc1034a82016-03-01 19:12:35 +00001241 if (!Config->Relocatable) {
1242 addStartEndSymbols();
Rui Ueyamaac27de92017-10-11 01:19:33 +00001243 for (BaseCommand *Base : Script->Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001244 if (auto *Sec = dyn_cast<OutputSection>(Base))
1245 addStartStopSymbols(Sec);
George Rimarc1034a82016-03-01 19:12:35 +00001246 }
Rui Ueyamad4530c62016-03-04 18:34:14 +00001247
1248 // Add _DYNAMIC symbol. Unlike GNU gold, our _DYNAMIC symbol has no type.
1249 // It should be okay as no one seems to care about the type.
1250 // Even the author of gold doesn't remember why gold behaves that way.
1251 // https://sourceware.org/ml/binutils/2002-03/msg00360.html
George Rimar69b17c32017-05-16 10:04:42 +00001252 if (InX::DynSymTab)
Rafael Espindola5ab19892017-05-11 23:16:43 +00001253 addRegular<ELFT>("_DYNAMIC", InX::Dynamic, 0);
Rafael Espindola334c3e12015-10-19 15:21:42 +00001254
Rafael Espindolade9857e2016-02-04 21:33:05 +00001255 // Define __rel[a]_iplt_{start,end} symbols if needed.
1256 addRelIpltSymbols();
1257
Rafael Espindola66b4e212017-02-23 22:06:28 +00001258 // This responsible for splitting up .eh_frame section into
Peter Smith1ec42d92017-03-08 14:06:24 +00001259 // pieces. The relocation scan uses those pieces, so this has to be
Rafael Espindola66b4e212017-02-23 22:06:28 +00001260 // earlier.
George Rimar49a47f22017-03-16 10:29:44 +00001261 applySynthetic({In<ELFT>::EhFrame},
1262 [](SyntheticSection *SS) { SS->finalizeContents(); });
Rafael Espindola56004c52016-04-07 14:22:09 +00001263
Rafael Espindola0ff545c2017-09-08 01:09:52 +00001264 for (Symbol *S : Symtab->getSymbols())
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001265 S->body()->IsPreemptible |= computeIsPreemptible(*S->body());
Rafael Espindola35c908f2017-08-10 15:05:37 +00001266
Rafael Espindola0f7ceda2016-07-20 17:58:07 +00001267 // Scan relocations. This must be done after every symbol is declared so that
1268 // we can correctly decide if a dynamic relocation is needed.
George Rimarcb888a62017-09-13 07:54:47 +00001269 if (!Config->Relocatable)
1270 forEachRelSec(scanRelocations<ELFT>);
Rafael Espindola0f7ceda2016-07-20 17:58:07 +00001271
Rafael Espindola895aea62017-05-11 22:02:41 +00001272 if (InX::Plt && !InX::Plt->empty())
1273 InX::Plt->addSymbols();
1274 if (InX::Iplt && !InX::Iplt->empty())
1275 InX::Iplt->addSymbols();
Peter Smith96943762017-01-25 10:31:16 +00001276
Peter Smith55865432017-02-20 11:12:33 +00001277 // Now that we have defined all possible global symbols including linker-
Rui Ueyama1b2a8bf2015-12-26 10:22:16 +00001278 // synthesized ones. Visit all symbols to give the finishing touches.
Rafael Espindola244ef982017-07-26 18:42:48 +00001279 for (Symbol *S : Symtab->getSymbols()) {
Peter Collingbourne4f952702016-05-01 04:55:03 +00001280 SymbolBody *Body = S->body();
Rafael Espindola0baa73f2016-04-26 13:56:26 +00001281
George Rimar7702bc22017-03-16 11:20:02 +00001282 if (!includeInSymtab(*Body))
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001283 continue;
George Rimar69b17c32017-05-16 10:04:42 +00001284 if (InX::SymTab)
1285 InX::SymTab->addSymbol(Body);
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001286
George Rimar69b17c32017-05-16 10:04:42 +00001287 if (InX::DynSymTab && S->includeInDynsym()) {
1288 InX::DynSymTab->addSymbol(Body);
Rui Ueyama4076fa12017-02-26 23:35:34 +00001289 if (auto *SS = dyn_cast<SharedSymbol>(Body))
Rafael Espindola6e93d052017-08-04 22:31:42 +00001290 if (cast<SharedFile<ELFT>>(S->File)->isNeeded())
Eugene Leviante9bab5d2016-11-21 16:59:33 +00001291 In<ELFT>::VerNeed->addSymbol(SS);
Peter Collingbourne21a12fc2016-04-27 20:22:31 +00001292 }
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001293 }
Rui Ueyamac2a0d7e2016-01-28 22:56:29 +00001294
1295 // Do not proceed if there was an undefined symbol.
Rui Ueyamaf373dd72016-11-24 01:43:21 +00001296 if (ErrorCount)
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001297 return;
Rui Ueyamac2a0d7e2016-01-28 22:56:29 +00001298
Rafael Espindola1eb3a0f2017-07-04 18:26:21 +00001299 addPredefinedSections();
Rafael Espindolac080ff62017-07-03 16:54:39 +00001300 removeUnusedSyntheticSections();
1301
Rafael Espindola24c073d2016-09-21 22:36:19 +00001302 sortSections();
George Rimarba455842017-10-02 09:11:13 +00001303 Script->removeEmptyCommands();
Rafael Espindola383971d2017-06-15 21:51:01 +00001304
1305 // Now that we have the final list, create a list of all the
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001306 // OutputSections for convenience.
Rui Ueyamaac27de92017-10-11 01:19:33 +00001307 for (BaseCommand *Base : Script->Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001308 if (auto *Sec = dyn_cast<OutputSection>(Base))
1309 OutputSections.push_back(Sec);
Rui Ueyama84417f82015-12-26 07:50:41 +00001310
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001311 // Prefer command line supplied address over other constraints.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001312 for (OutputSection *Sec : OutputSections) {
1313 auto I = Config->SectionStartMap.find(Sec->Name);
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001314 if (I != Config->SectionStartMap.end())
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001315 Sec->AddrExpr = [=] { return I->second; };
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001316 }
1317
Rafael Espindola78493a22017-01-28 17:48:21 +00001318 // This is a bit of a hack. A value of 0 means undef, so we set it
1319 // to 1 t make __ehdr_start defined. The section number is not
1320 // particularly relevant.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001321 Out::ElfHeader->SectionIndex = 1;
Rafael Espindola78493a22017-01-28 17:48:21 +00001322
George Rimar7ca06272016-04-06 07:20:45 +00001323 unsigned I = 1;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001324 for (OutputSection *Sec : OutputSections) {
George Rimar7ca06272016-04-06 07:20:45 +00001325 Sec->SectionIndex = I++;
Rafael Espindola895aea62017-05-11 22:02:41 +00001326 Sec->ShName = InX::ShStrTab->addString(Sec->Name);
George Rimar7ca06272016-04-06 07:20:45 +00001327 }
Rui Ueyama84417f82015-12-26 07:50:41 +00001328
Rafael Espindola5967c972016-12-19 21:21:07 +00001329 // Binary and relocatable output does not have PHDRS.
1330 // The headers have to be created before finalize as that can influence the
1331 // image base and the dynamic section on mips includes the image base.
1332 if (!Config->Relocatable && !Config->OFormatBinary) {
Rafael Espindolaf51c8052017-06-13 23:26:31 +00001333 Phdrs = Script->hasPhdrsCommands() ? Script->createPhdrs() : createPhdrs();
Rafael Espindola5967c972016-12-19 21:21:07 +00001334 addPtArmExid(Phdrs);
Rafael Espindola02ed7572017-05-04 19:34:17 +00001335 Out::ProgramHeaders->Size = sizeof(Elf_Phdr) * Phdrs.size();
Rafael Espindola5967c972016-12-19 21:21:07 +00001336 }
1337
Rafael Espindola4d560162017-09-12 16:38:01 +00001338 // Some symbols are defined in term of program headers. Now that we
1339 // have the headers, we can find out which sections they point to.
1340 setReservedSymbolSections();
1341
Eugene Leviantbe809a72016-11-18 06:44:18 +00001342 // Dynamic section must be the last one in this list and dynamic
1343 // symbol table section (DynSymTab) must be the first one.
Rui Ueyama2b6631b2017-08-15 17:01:39 +00001344 applySynthetic({InX::DynSymTab, InX::Bss,
1345 InX::BssRelRo, InX::GnuHashTab,
George Rimaraaf54712017-09-27 09:14:59 +00001346 InX::HashTab, InX::SymTab,
Rui Ueyama2b6631b2017-08-15 17:01:39 +00001347 InX::ShStrTab, InX::StrTab,
1348 In<ELFT>::VerDef, InX::DynStrTab,
1349 InX::Got, InX::MipsGot,
1350 InX::IgotPlt, InX::GotPlt,
1351 In<ELFT>::RelaDyn, In<ELFT>::RelaIplt,
1352 In<ELFT>::RelaPlt, InX::Plt,
1353 InX::Iplt, In<ELFT>::EhFrameHdr,
1354 In<ELFT>::VerSym, In<ELFT>::VerNeed,
1355 InX::Dynamic},
George Rimar49a47f22017-03-16 10:29:44 +00001356 [](SyntheticSection *SS) { SS->finalizeContents(); });
Peter Smith1ec42d92017-03-08 14:06:24 +00001357
Rui Ueyamaac27de92017-10-11 01:19:33 +00001358 if (!Script->HasSections && !Config->Relocatable)
Peter Smith3ef89b02017-09-06 14:02:14 +00001359 fixSectionAlignments();
1360
Peter Smith1ec42d92017-03-08 14:06:24 +00001361 // Some architectures use small displacements for jump instructions.
1362 // It is linker's responsibility to create thunks containing long
1363 // jump instructions if jump targets are too far. Create thunks.
1364 if (Target->NeedsThunks) {
1365 // FIXME: only ARM Interworking and Mips LA25 Thunks are implemented,
1366 // these
1367 // do not require address information. To support range extension Thunks
1368 // we need to assign addresses so that we can tell if jump instructions
1369 // are out of range. This will need to turn into a loop that converges
1370 // when no more Thunks are added
George Rimarec84ffc2017-05-17 07:10:59 +00001371 ThunkCreator TC;
Peter Smith96f813d2017-07-07 10:03:37 +00001372 Script->assignAddresses();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001373 if (TC.createThunks(OutputSections)) {
Rafael Espindolab3aa2c92017-05-11 21:33:30 +00001374 applySynthetic({InX::MipsGot},
George Rimar49a47f22017-03-16 10:29:44 +00001375 [](SyntheticSection *SS) { SS->updateAllocSize(); });
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001376 if (TC.createThunks(OutputSections))
Peter Smith32980272017-06-16 13:10:08 +00001377 fatal("All non-range thunks should be created in first call");
1378 }
Peter Smith1ec42d92017-03-08 14:06:24 +00001379 }
Peter Smith43e852f2017-06-05 08:51:15 +00001380
Peter Smith1ec42d92017-03-08 14:06:24 +00001381 // Fill other section headers. The dynamic table is finalized
1382 // at the end because some tags like RELSZ depend on result
1383 // of finalizing other sections.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001384 for (OutputSection *Sec : OutputSections)
1385 Sec->finalize<ELFT>();
Peter Smith1ec42d92017-03-08 14:06:24 +00001386
1387 // createThunks may have added local symbols to the static symbol table
George Rimar69b17c32017-05-16 10:04:42 +00001388 applySynthetic({InX::SymTab, InX::ShStrTab, InX::StrTab},
George Rimar49a47f22017-03-16 10:29:44 +00001389 [](SyntheticSection *SS) { SS->postThunkContents(); });
Rui Ueyama84417f82015-12-26 07:50:41 +00001390}
1391
Rui Ueyama84417f82015-12-26 07:50:41 +00001392template <class ELFT> void Writer<ELFT>::addPredefinedSections() {
Rui Ueyamadec4ab02017-02-16 04:19:03 +00001393 // ARM ABI requires .ARM.exidx to be terminated by some piece of data.
1394 // We have the terminater synthetic section class. Add that at the end.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001395 OutputSection *Cmd = findSection(".ARM.exidx");
1396 if (!Cmd || !Cmd->Live || Config->Relocatable)
Peter Smith626c9972017-05-30 11:51:02 +00001397 return;
1398
1399 auto *Sentinel = make<ARMExidxSentinelSection>();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001400 Cmd->addSection(Sentinel);
Rafael Espindolaabad6182015-08-13 15:23:46 +00001401}
1402
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001403// The linker is expected to define SECNAME_start and SECNAME_end
1404// symbols for a few sections. This function defines them.
1405template <class ELFT> void Writer<ELFT>::addStartEndSymbols() {
Rafael Espindola24e6f362017-02-24 15:07:30 +00001406 auto Define = [&](StringRef Start, StringRef End, OutputSection *OS) {
Peter Collingbourne0fab40b2016-10-24 20:46:21 +00001407 // These symbols resolve to the image base if the section does not exist.
Rui Ueyama4f2f50d2016-12-21 08:40:09 +00001408 // A special value -1 indicates end of the section.
Peter Collingbournef8435a92017-03-13 16:40:20 +00001409 if (OS) {
1410 addOptionalRegular<ELFT>(Start, OS, 0);
1411 addOptionalRegular<ELFT>(End, OS, -1);
1412 } else {
Rui Ueyamad57e74b72017-03-17 23:29:01 +00001413 if (Config->Pic)
Peter Collingbournef8435a92017-03-13 16:40:20 +00001414 OS = Out::ElfHeader;
1415 addOptionalRegular<ELFT>(Start, OS, 0);
1416 addOptionalRegular<ELFT>(End, OS, 0);
1417 }
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001418 };
1419
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001420 Define("__preinit_array_start", "__preinit_array_end", Out::PreinitArray);
1421 Define("__init_array_start", "__init_array_end", Out::InitArray);
1422 Define("__fini_array_start", "__fini_array_end", Out::FiniArray);
Peter Smith17cd3752016-10-27 10:28:53 +00001423
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001424 if (OutputSection *Sec = findSection(".ARM.exidx"))
Peter Smith17cd3752016-10-27 10:28:53 +00001425 Define("__exidx_start", "__exidx_end", Sec);
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001426}
1427
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001428// If a section name is valid as a C identifier (which is rare because of
1429// the leading '.'), linkers are expected to define __start_<secname> and
1430// __stop_<secname> symbols. They are at beginning and end of the section,
1431// respectively. This is not requested by the ELF standard, but GNU ld and
1432// gold provide the feature, and used by many programs.
1433template <class ELFT>
Rafael Espindola24e6f362017-02-24 15:07:30 +00001434void Writer<ELFT>::addStartStopSymbols(OutputSection *Sec) {
Rafael Espindola40849412017-02-24 14:28:00 +00001435 StringRef S = Sec->Name;
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001436 if (!isValidCIdentifier(S))
1437 return;
Rafael Espindola5616adf2017-03-08 22:36:28 +00001438 addOptionalRegular<ELFT>(Saver.save("__start_" + S), Sec, 0, STV_DEFAULT);
1439 addOptionalRegular<ELFT>(Saver.save("__stop_" + S), Sec, -1, STV_DEFAULT);
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001440}
1441
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001442template <class ELFT> OutputSection *Writer<ELFT>::findSection(StringRef Name) {
Rui Ueyamaac27de92017-10-11 01:19:33 +00001443 for (BaseCommand *Base : Script->Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001444 if (auto *Sec = dyn_cast<OutputSection>(Base))
1445 if (Sec->Name == Name)
1446 return Sec;
Rafael Espindola43e76cd2017-05-26 17:48:27 +00001447 return nullptr;
1448}
1449
George Rimar7702bc22017-03-16 11:20:02 +00001450static bool needsPtLoad(OutputSection *Sec) {
Rafael Espindola04a2e342016-11-09 01:42:41 +00001451 if (!(Sec->Flags & SHF_ALLOC))
Rafael Espindolaef762f22016-02-10 23:29:38 +00001452 return false;
1453
1454 // Don't allocate VA space for TLS NOBITS sections. The PT_TLS PHDR is
1455 // responsible for allocating space for them, not the PT_LOAD that
1456 // contains the TLS initialization image.
Rafael Espindola04a2e342016-11-09 01:42:41 +00001457 if (Sec->Flags & SHF_TLS && Sec->Type == SHT_NOBITS)
Rafael Espindolaef762f22016-02-10 23:29:38 +00001458 return false;
1459 return true;
Michael J. Spencer1d299a82015-09-09 20:48:09 +00001460}
1461
Rafael Espindolab45fd702016-09-20 15:22:27 +00001462// Linker scripts are responsible for aligning addresses. Unfortunately, most
1463// linker scripts are designed for creating two PT_LOADs only, one RX and one
1464// RW. This means that there is no alignment in the RO to RX transition and we
1465// cannot create a PT_LOAD there.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001466static uint64_t computeFlags(uint64_t Flags) {
Rui Ueyamaa37ace8d2017-02-25 01:52:03 +00001467 if (Config->Omagic)
George Rimar595a7632016-11-29 09:43:51 +00001468 return PF_R | PF_W | PF_X;
Rui Ueyama6bd38222017-04-05 21:37:09 +00001469 if (Config->SingleRoRx && !(Flags & PF_W))
1470 return Flags | PF_X;
1471 return Flags;
Rafael Espindolab45fd702016-09-20 15:22:27 +00001472}
1473
Rafael Espindola4fc60442016-02-10 22:43:13 +00001474// Decide which program headers to create and which sections to include in each
1475// one.
George Rimaraa354182017-07-27 07:46:50 +00001476template <class ELFT> std::vector<PhdrEntry *> Writer<ELFT>::createPhdrs() {
1477 std::vector<PhdrEntry *> Ret;
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001478 auto AddHdr = [&](unsigned Type, unsigned Flags) -> PhdrEntry * {
George Rimaraa354182017-07-27 07:46:50 +00001479 Ret.push_back(make<PhdrEntry>(Type, Flags));
1480 return Ret.back();
Rafael Espindola4fc60442016-02-10 22:43:13 +00001481 };
George Rimare3336c02015-11-24 10:15:50 +00001482
Rui Ueyama803195e2015-10-23 21:45:59 +00001483 // The first phdr entry is PT_PHDR which describes the program header itself.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001484 AddHdr(PT_PHDR, PF_R)->add(Out::ProgramHeaders);
Rui Ueyama953c2c42015-10-10 23:59:57 +00001485
Rui Ueyama803195e2015-10-23 21:45:59 +00001486 // PT_INTERP must be the second entry if exists.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001487 if (OutputSection *Cmd = findSection(".interp"))
1488 AddHdr(PT_INTERP, Cmd->getPhdrFlags())->add(Cmd);
Rafael Espindola70107762015-09-11 18:49:42 +00001489
Rui Ueyama803195e2015-10-23 21:45:59 +00001490 // Add the first PT_LOAD segment for regular output sections.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001491 uint64_t Flags = computeFlags(PF_R);
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001492 PhdrEntry *Load = AddHdr(PT_LOAD, Flags);
Rafael Espindola02ed7572017-05-04 19:34:17 +00001493
1494 // Add the headers. We will remove them if they don't fit.
1495 Load->add(Out::ElfHeader);
1496 Load->add(Out::ProgramHeaders);
1497
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001498 for (OutputSection *Sec : OutputSections) {
Rafael Espindola04a2e342016-11-09 01:42:41 +00001499 if (!(Sec->Flags & SHF_ALLOC))
Rafael Espindolaaab6d5c2016-09-16 21:29:07 +00001500 break;
George Rimar7702bc22017-03-16 11:20:02 +00001501 if (!needsPtLoad(Sec))
Rafael Espindolaef762f22016-02-10 23:29:38 +00001502 continue;
1503
George Rimar8ceadb32016-08-17 07:44:19 +00001504 // Segments are contiguous memory regions that has the same attributes
1505 // (e.g. executable or writable). There is one phdr for each segment.
1506 // Therefore, we need to create a new phdr when the next section has
1507 // different flags or is loaded at a discontiguous address using AT linker
1508 // script command.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001509 uint64_t NewFlags = computeFlags(Sec->getPhdrFlags());
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001510 if (Sec->LMAExpr || Flags != NewFlags) {
Rafael Espindolae090fb22016-03-09 21:37:22 +00001511 Load = AddHdr(PT_LOAD, NewFlags);
Rafael Espindola4fc60442016-02-10 22:43:13 +00001512 Flags = NewFlags;
1513 }
Michael J. Spencer78aa1de2015-11-03 00:34:39 +00001514
Rui Ueyama18f084f2016-07-20 19:36:41 +00001515 Load->add(Sec);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001516 }
Rafael Espindola6b83b902015-08-12 00:00:24 +00001517
Rui Ueyamadb00b612017-02-01 22:42:17 +00001518 // Add a TLS segment if any.
George Rimaraa354182017-07-27 07:46:50 +00001519 PhdrEntry *TlsHdr = make<PhdrEntry>(PT_TLS, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001520 for (OutputSection *Sec : OutputSections)
Rui Ueyamadb00b612017-02-01 22:42:17 +00001521 if (Sec->Flags & SHF_TLS)
George Rimaraa354182017-07-27 07:46:50 +00001522 TlsHdr->add(Sec);
George Rimar6823c5f2017-09-07 11:01:10 +00001523 if (TlsHdr->FirstSec)
George Rimaraa354182017-07-27 07:46:50 +00001524 Ret.push_back(TlsHdr);
Michael J. Spencer78aa1de2015-11-03 00:34:39 +00001525
Rui Ueyama803195e2015-10-23 21:45:59 +00001526 // Add an entry for .dynamic.
George Rimar69b17c32017-05-16 10:04:42 +00001527 if (InX::DynSymTab)
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001528 AddHdr(PT_DYNAMIC, InX::Dynamic->getParent()->getPhdrFlags())
1529 ->add(InX::Dynamic->getParent());
Rafael Espindola91009b32015-08-12 01:45:28 +00001530
Rafael Espindola4fc60442016-02-10 22:43:13 +00001531 // PT_GNU_RELRO includes all sections that should be marked as
1532 // read-only by dynamic linker after proccessing relocations.
George Rimaraa354182017-07-27 07:46:50 +00001533 PhdrEntry *RelRo = make<PhdrEntry>(PT_GNU_RELRO, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001534 for (OutputSection *Sec : OutputSections)
Rafael Espindola9e889eb2017-05-11 23:31:06 +00001535 if (needsPtLoad(Sec) && isRelroSection(Sec))
George Rimaraa354182017-07-27 07:46:50 +00001536 RelRo->add(Sec);
George Rimar6823c5f2017-09-07 11:01:10 +00001537 if (RelRo->FirstSec)
George Rimaraa354182017-07-27 07:46:50 +00001538 Ret.push_back(RelRo);
George Rimare3336c02015-11-24 10:15:50 +00001539
Rafael Espindola4fc60442016-02-10 22:43:13 +00001540 // PT_GNU_EH_FRAME is a special section pointing on .eh_frame_hdr.
Eugene Leviant30c1b432017-03-14 08:49:09 +00001541 if (!In<ELFT>::EhFrame->empty() && In<ELFT>::EhFrameHdr &&
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001542 In<ELFT>::EhFrame->getParent() && In<ELFT>::EhFrameHdr->getParent())
1543 AddHdr(PT_GNU_EH_FRAME, In<ELFT>::EhFrameHdr->getParent()->getPhdrFlags())
1544 ->add(In<ELFT>::EhFrameHdr->getParent());
George Rimarf6bc65a2016-01-15 13:34:52 +00001545
Rui Ueyama81cb7102017-03-24 00:15:57 +00001546 // PT_OPENBSD_RANDOMIZE is an OpenBSD-specific feature. That makes
1547 // the dynamic linker fill the segment with random data.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001548 if (OutputSection *Cmd = findSection(".openbsd.randomdata"))
1549 AddHdr(PT_OPENBSD_RANDOMIZE, Cmd->getPhdrFlags())->add(Cmd);
George Rimar270173f2016-10-14 13:02:22 +00001550
Rui Ueyamae79b09a2015-11-21 22:19:32 +00001551 // PT_GNU_STACK is a special section to tell the loader to make the
Rui Ueyamaa7e87252017-02-23 08:09:51 +00001552 // pages for the stack non-executable. If you really want an executable
1553 // stack, you can pass -z execstack, but that's not recommended for
1554 // security reasons.
1555 unsigned Perm;
1556 if (Config->ZExecstack)
1557 Perm = PF_R | PF_W | PF_X;
1558 else
1559 Perm = PF_R | PF_W;
1560 AddHdr(PT_GNU_STACK, Perm)->p_memsz = Config->ZStackSize;
Rafael Espindola9907eb02016-03-01 13:23:29 +00001561
George Rimarcc6e5672016-10-14 10:34:36 +00001562 // PT_OPENBSD_WXNEEDED is a OpenBSD-specific header to mark the executable
1563 // is expected to perform W^X violations, such as calling mprotect(2) or
1564 // mmap(2) with PROT_WRITE | PROT_EXEC, which is prohibited by default on
1565 // OpenBSD.
1566 if (Config->ZWxneeded)
1567 AddHdr(PT_OPENBSD_WXNEEDED, PF_X);
1568
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001569 // Create one PT_NOTE per a group of contiguous .note sections.
1570 PhdrEntry *Note = nullptr;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001571 for (OutputSection *Sec : OutputSections) {
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001572 if (Sec->Type == SHT_NOTE) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001573 if (!Note || Sec->LMAExpr)
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001574 Note = AddHdr(PT_NOTE, PF_R);
1575 Note->add(Sec);
1576 } else {
1577 Note = nullptr;
1578 }
1579 }
Rui Ueyama703296a2016-07-20 19:36:39 +00001580 return Ret;
Rafael Espindola4fc60442016-02-10 22:43:13 +00001581}
1582
Rafael Espindola8e670002016-11-28 00:40:21 +00001583template <class ELFT>
George Rimaraa354182017-07-27 07:46:50 +00001584void Writer<ELFT>::addPtArmExid(std::vector<PhdrEntry *> &Phdrs) {
Rafael Espindola8e670002016-11-28 00:40:21 +00001585 if (Config->EMachine != EM_ARM)
1586 return;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001587 auto I = llvm::find_if(OutputSections, [](OutputSection *Cmd) {
1588 return Cmd->Type == SHT_ARM_EXIDX;
George Rimara951d5c2017-07-04 13:10:37 +00001589 });
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001590 if (I == OutputSections.end())
Rafael Espindola8e670002016-11-28 00:40:21 +00001591 return;
1592
1593 // PT_ARM_EXIDX is the ARM EHABI equivalent of PT_GNU_EH_FRAME
George Rimaraa354182017-07-27 07:46:50 +00001594 PhdrEntry *ARMExidx = make<PhdrEntry>(PT_ARM_EXIDX, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001595 ARMExidx->add(*I);
Rafael Espindola8e670002016-11-28 00:40:21 +00001596 Phdrs.push_back(ARMExidx);
1597}
1598
Peter Collingbourne628ec9f2017-01-10 01:21:30 +00001599// The first section of each PT_LOAD, the first section in PT_GNU_RELRO and the
1600// first section after PT_GNU_RELRO have to be page aligned so that the dynamic
1601// linker can set the permissions.
Rui Ueyama47091902016-03-30 19:41:51 +00001602template <class ELFT> void Writer<ELFT>::fixSectionAlignments() {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001603 auto PageAlign = [](OutputSection *Cmd) {
Rafael Espindola0f7dc0e2017-06-02 01:37:58 +00001604 if (Cmd && !Cmd->AddrExpr)
1605 Cmd->AddrExpr = [=] {
1606 return alignTo(Script->getDot(), Config->MaxPageSize);
1607 };
1608 };
1609
George Rimaraa354182017-07-27 07:46:50 +00001610 for (const PhdrEntry *P : Phdrs)
George Rimar6823c5f2017-09-07 11:01:10 +00001611 if (P->p_type == PT_LOAD && P->FirstSec)
1612 PageAlign(P->FirstSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001613
George Rimaraa354182017-07-27 07:46:50 +00001614 for (const PhdrEntry *P : Phdrs) {
1615 if (P->p_type != PT_GNU_RELRO)
Rui Ueyama47091902016-03-30 19:41:51 +00001616 continue;
George Rimar6823c5f2017-09-07 11:01:10 +00001617 if (P->FirstSec)
1618 PageAlign(P->FirstSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001619 // Find the first section after PT_GNU_RELRO. If it is in a PT_LOAD we
1620 // have to align it to a page.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001621 auto End = OutputSections.end();
George Rimar6823c5f2017-09-07 11:01:10 +00001622 auto I = std::find(OutputSections.begin(), End, P->LastSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001623 if (I == End || (I + 1) == End)
1624 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001625 OutputSection *Cmd = (*(I + 1));
1626 if (needsPtLoad(Cmd))
1627 PageAlign(Cmd);
Rui Ueyama47091902016-03-30 19:41:51 +00001628 }
1629}
1630
George Rimar5f857322016-04-27 09:16:28 +00001631// Adjusts the file alignment for a given output section and returns
1632// its new file offset. The file offset must be the same with its
1633// virtual address (modulo the page size) so that the loader can load
1634// executables without any address adjustment.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001635static uint64_t getFileAlignment(uint64_t Off, OutputSection *Cmd) {
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001636 // If the section is not in a PT_LOAD, we just have to align it.
George Rimar582ede82017-09-07 10:53:07 +00001637 if (!Cmd->PtLoad)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001638 return alignTo(Off, Cmd->Alignment);
Eugene Leviant3d9abec2016-09-29 09:20:33 +00001639
George Rimar6823c5f2017-09-07 11:01:10 +00001640 OutputSection *First = Cmd->PtLoad->FirstSec;
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001641 // The first section in a PT_LOAD has to have congruent offset and address
1642 // module the page size.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001643 if (Cmd == First)
1644 return alignTo(Off, std::max<uint64_t>(Cmd->Alignment, Config->MaxPageSize),
1645 Cmd->Addr);
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001646
1647 // If two sections share the same PT_LOAD the file offset is calculated
1648 // using this formula: Off2 = Off1 + (VA2 - VA1).
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001649 return First->Offset + Cmd->Addr - First->Addr;
George Rimar5f857322016-04-27 09:16:28 +00001650}
1651
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001652static uint64_t setOffset(OutputSection *Cmd, uint64_t Off) {
1653 if (Cmd->Type == SHT_NOBITS) {
1654 Cmd->Offset = Off;
Rui Ueyama35723f02017-02-14 23:35:42 +00001655 return Off;
George Rimar86ce2672016-08-25 09:05:47 +00001656 }
1657
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001658 Off = getFileAlignment(Off, Cmd);
1659 Cmd->Offset = Off;
1660 return Off + Cmd->Size;
George Rimar86ce2672016-08-25 09:05:47 +00001661}
1662
1663template <class ELFT> void Writer<ELFT>::assignFileOffsetsBinary() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001664 uint64_t Off = 0;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001665 for (OutputSection *Sec : OutputSections)
Rafael Espindola04a2e342016-11-09 01:42:41 +00001666 if (Sec->Flags & SHF_ALLOC)
Rui Ueyama6bd38222017-04-05 21:37:09 +00001667 Off = setOffset(Sec, Off);
1668 FileSize = alignTo(Off, Config->Wordsize);
George Rimar86ce2672016-08-25 09:05:47 +00001669}
1670
Rui Ueyamae044e9c2016-04-01 17:07:17 +00001671// Assign file offsets to output sections.
1672template <class ELFT> void Writer<ELFT>::assignFileOffsets() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001673 uint64_t Off = 0;
1674 Off = setOffset(Out::ElfHeader, Off);
1675 Off = setOffset(Out::ProgramHeaders, Off);
George Rimar7ca06272016-04-06 07:20:45 +00001676
Petr Hosekedd6c352017-08-02 16:35:00 +00001677 PhdrEntry *LastRX = nullptr;
1678 for (PhdrEntry *P : Phdrs)
1679 if (P->p_type == PT_LOAD && (P->p_flags & PF_X))
1680 LastRX = P;
1681
1682 for (OutputSection *Sec : OutputSections) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001683 Off = setOffset(Sec, Off);
Rui Ueyamaac27de92017-10-11 01:19:33 +00001684 if (Script->HasSections)
Petr Hosekedd6c352017-08-02 16:35:00 +00001685 continue;
1686 // If this is a last section of the last executable segment and that
1687 // segment is the last loadable segment, align the offset of the
1688 // following section to avoid loading non-segments parts of the file.
George Rimar6823c5f2017-09-07 11:01:10 +00001689 if (LastRX && LastRX->LastSec == Sec)
Petr Hosekedd6c352017-08-02 16:35:00 +00001690 Off = alignTo(Off, Target->PageSize);
1691 }
Eugene Leviant467c4d52016-07-01 10:27:36 +00001692
Rui Ueyama6bd38222017-04-05 21:37:09 +00001693 SectionHeaderOff = alignTo(Off, Config->Wordsize);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001694 FileSize = SectionHeaderOff + (OutputSections.size() + 1) * sizeof(Elf_Shdr);
Rui Ueyamae044e9c2016-04-01 17:07:17 +00001695}
1696
1697// Finalize the program headers. We call this function after we assign
1698// file offsets and VAs to all sections.
1699template <class ELFT> void Writer<ELFT>::setPhdrs() {
George Rimaraa354182017-07-27 07:46:50 +00001700 for (PhdrEntry *P : Phdrs) {
George Rimar6823c5f2017-09-07 11:01:10 +00001701 OutputSection *First = P->FirstSec;
1702 OutputSection *Last = P->LastSec;
Rui Ueyamae8a45e42016-04-01 22:42:04 +00001703 if (First) {
George Rimaraa354182017-07-27 07:46:50 +00001704 P->p_filesz = Last->Offset - First->Offset;
Rafael Espindola04a2e342016-11-09 01:42:41 +00001705 if (Last->Type != SHT_NOBITS)
George Rimaraa354182017-07-27 07:46:50 +00001706 P->p_filesz += Last->Size;
1707 P->p_memsz = Last->Addr + Last->Size - First->Addr;
1708 P->p_offset = First->Offset;
1709 P->p_vaddr = First->Addr;
1710 if (!P->HasLMA)
1711 P->p_paddr = First->getLMA();
Rafael Espindola4fc60442016-02-10 22:43:13 +00001712 }
George Rimaraa354182017-07-27 07:46:50 +00001713 if (P->p_type == PT_LOAD)
1714 P->p_align = std::max<uint64_t>(P->p_align, Config->MaxPageSize);
1715 else if (P->p_type == PT_GNU_RELRO) {
1716 P->p_align = 1;
Peter Collingbourne7b5088b2017-01-04 18:56:15 +00001717 // The glibc dynamic loader rounds the size down, so we need to round up
1718 // to protect the last page. This is a no-op on FreeBSD which always
1719 // rounds up.
George Rimaraa354182017-07-27 07:46:50 +00001720 P->p_memsz = alignTo(P->p_memsz, Target->PageSize);
Peter Collingbourne7b5088b2017-01-04 18:56:15 +00001721 }
George Rimar8ceadb32016-08-17 07:44:19 +00001722
Rafael Espindola4fc60442016-02-10 22:43:13 +00001723 // The TLS pointer goes after PT_TLS. At least glibc will align it,
1724 // so round up the size to make sure the offsets are correct.
George Rimaraa354182017-07-27 07:46:50 +00001725 if (P->p_type == PT_TLS) {
1726 Out::TlsPhdr = P;
1727 if (P->p_memsz)
1728 P->p_memsz = alignTo(P->p_memsz, P->p_align);
Rui Ueyama803195e2015-10-23 21:45:59 +00001729 }
1730 }
Michael J. Spencer84487f12015-07-24 21:03:07 +00001731}
1732
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001733// The entry point address is chosen in the following ways.
1734//
1735// 1. the '-e' entry command-line option;
1736// 2. the ENTRY(symbol) command in a linker control script;
1737// 3. the value of the symbol start, if present;
1738// 4. the address of the first byte of the .text section, if present;
1739// 5. the address 0.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001740template <class ELFT> uint64_t Writer<ELFT>::getEntryAddr() {
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001741 // Case 1, 2 or 3. As a special case, if the symbol is actually
1742 // a number, we'll use that number as an address.
Rafael Espindola244ef982017-07-26 18:42:48 +00001743 if (SymbolBody *B = Symtab->find(Config->Entry))
George Rimarf64618a2017-03-17 11:56:54 +00001744 return B->getVA();
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001745 uint64_t Addr;
George Rimarab947682017-05-16 08:19:25 +00001746 if (to_integer(Config->Entry, Addr))
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001747 return Addr;
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001748
1749 // Case 4
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001750 if (OutputSection *Sec = findSection(".text")) {
Rui Ueyama9e5f5ef2016-12-07 04:06:21 +00001751 if (Config->WarnMissingEntry)
Petr Hosek2f50fef2016-12-07 02:26:16 +00001752 warn("cannot find entry symbol " + Config->Entry + "; defaulting to 0x" +
1753 utohexstr(Sec->Addr));
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001754 return Sec->Addr;
1755 }
1756
1757 // Case 5
Rui Ueyama9e5f5ef2016-12-07 04:06:21 +00001758 if (Config->WarnMissingEntry)
Petr Hosek2f50fef2016-12-07 02:26:16 +00001759 warn("cannot find entry symbol " + Config->Entry +
1760 "; not setting start address");
Rui Ueyama8da7aa02016-10-20 00:07:36 +00001761 return 0;
Rui Ueyama3bfaba92015-12-24 08:37:34 +00001762}
1763
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001764static uint16_t getELFType() {
Rui Ueyamad57e74b72017-03-17 23:29:01 +00001765 if (Config->Pic)
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001766 return ET_DYN;
1767 if (Config->Relocatable)
1768 return ET_REL;
1769 return ET_EXEC;
1770}
1771
Michael J. Spencer84487f12015-07-24 21:03:07 +00001772template <class ELFT> void Writer<ELFT>::writeHeader() {
1773 uint8_t *Buf = Buffer->getBufferStart();
Rui Ueyamae08cd672015-10-23 22:44:39 +00001774 memcpy(Buf, "\177ELF", 4);
1775
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001776 // Write the ELF header.
Rafael Espindola18608a02015-09-08 21:57:31 +00001777 auto *EHdr = reinterpret_cast<Elf_Ehdr *>(Buf);
Rui Ueyamaf2dc4362017-04-05 21:08:47 +00001778 EHdr->e_ident[EI_CLASS] = Config->Is64 ? ELFCLASS64 : ELFCLASS32;
1779 EHdr->e_ident[EI_DATA] = Config->IsLE ? ELFDATA2LSB : ELFDATA2MSB;
Michael J. Spencer84487f12015-07-24 21:03:07 +00001780 EHdr->e_ident[EI_VERSION] = EV_CURRENT;
Rafael Espindola7cc713a2016-10-27 14:00:51 +00001781 EHdr->e_ident[EI_OSABI] = Config->OSABI;
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001782 EHdr->e_type = getELFType();
Rafael Espindola7cc713a2016-10-27 14:00:51 +00001783 EHdr->e_machine = Config->EMachine;
Michael J. Spencer84487f12015-07-24 21:03:07 +00001784 EHdr->e_version = EV_CURRENT;
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001785 EHdr->e_entry = getEntryAddr();
Michael J. Spencer8039dae22015-07-29 00:30:10 +00001786 EHdr->e_shoff = SectionHeaderOff;
Rafael Espindola18608a02015-09-08 21:57:31 +00001787 EHdr->e_ehsize = sizeof(Elf_Ehdr);
Rui Ueyama2f1b79f2015-10-10 22:34:30 +00001788 EHdr->e_phnum = Phdrs.size();
Rafael Espindola18608a02015-09-08 21:57:31 +00001789 EHdr->e_shentsize = sizeof(Elf_Shdr);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001790 EHdr->e_shnum = OutputSections.size() + 1;
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001791 EHdr->e_shstrndx = InX::ShStrTab->getParent()->SectionIndex;
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001792
Rui Ueyama1e2e8ea2016-09-13 20:51:32 +00001793 if (Config->EMachine == EM_ARM)
1794 // We don't currently use any features incompatible with EF_ARM_EABI_VER5,
1795 // but we don't have any firm guarantees of conformance. Linux AArch64
1796 // kernels (as of 2016) require an EABI version to be set.
1797 EHdr->e_flags = EF_ARM_EABI_VER5;
1798 else if (Config->EMachine == EM_MIPS)
Simon Atanasyan649e4d32017-10-02 14:56:41 +00001799 EHdr->e_flags = Config->MipsEFlags;
Rui Ueyama22b5d1f2016-03-13 19:29:17 +00001800
George Rimar58941ee2016-02-25 08:23:37 +00001801 if (!Config->Relocatable) {
1802 EHdr->e_phoff = sizeof(Elf_Ehdr);
1803 EHdr->e_phentsize = sizeof(Elf_Phdr);
1804 }
1805
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001806 // Write the program header table.
Rafael Espindola4fc60442016-02-10 22:43:13 +00001807 auto *HBuf = reinterpret_cast<Elf_Phdr *>(Buf + EHdr->e_phoff);
George Rimaraa354182017-07-27 07:46:50 +00001808 for (PhdrEntry *P : Phdrs) {
1809 HBuf->p_type = P->p_type;
1810 HBuf->p_flags = P->p_flags;
1811 HBuf->p_offset = P->p_offset;
1812 HBuf->p_vaddr = P->p_vaddr;
1813 HBuf->p_paddr = P->p_paddr;
1814 HBuf->p_filesz = P->p_filesz;
1815 HBuf->p_memsz = P->p_memsz;
1816 HBuf->p_align = P->p_align;
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001817 ++HBuf;
1818 }
Rafael Espindolae438e072015-09-08 22:55:28 +00001819
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001820 // Write the section header table. Note that the first table entry is null.
Rui Ueyamaad59b652016-02-25 23:58:21 +00001821 auto *SHdrs = reinterpret_cast<Elf_Shdr *>(Buf + EHdr->e_shoff);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001822 for (OutputSection *Sec : OutputSections)
1823 Sec->writeHeaderTo<ELFT>(++SHdrs);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001824}
1825
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001826// Open a result file.
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001827template <class ELFT> void Writer<ELFT>::openFile() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001828 if (!Config->Is64 && FileSize > UINT32_MAX) {
1829 error("output file too large: " + Twine(FileSize) + " bytes");
1830 return;
1831 }
1832
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001833 unlinkAsync(Config->OutputFile);
Rafael Espindolabdc8f2f2015-08-13 00:31:46 +00001834 ErrorOr<std::unique_ptr<FileOutputBuffer>> BufferOrErr =
Rui Ueyamacbe39262016-02-02 22:48:04 +00001835 FileOutputBuffer::create(Config->OutputFile, FileSize,
1836 FileOutputBuffer::F_executable);
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001837
Rui Ueyamaaa2db882016-07-15 01:38:54 +00001838 if (auto EC = BufferOrErr.getError())
Rui Ueyamac8d3a832017-01-12 22:18:04 +00001839 error("failed to open " + Config->OutputFile + ": " + EC.message());
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001840 else
Rui Ueyamaaa2db882016-07-15 01:38:54 +00001841 Buffer = std::move(*BufferOrErr);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001842}
1843
George Rimar86ce2672016-08-25 09:05:47 +00001844template <class ELFT> void Writer<ELFT>::writeSectionsBinary() {
1845 uint8_t *Buf = Buffer->getBufferStart();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001846 for (OutputSection *Sec : OutputSections)
Rafael Espindola04a2e342016-11-09 01:42:41 +00001847 if (Sec->Flags & SHF_ALLOC)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001848 Sec->writeTo<ELFT>(Buf + Sec->Offset);
George Rimar86ce2672016-08-25 09:05:47 +00001849}
1850
Rui Ueyama6238ed22017-08-14 21:18:12 +00001851static void fillTrap(uint8_t *I, uint8_t *End) {
George Rimarf7ef2a12017-08-21 08:31:14 +00001852 for (; I + 4 <= End; I += 4)
Petr Hosekedd6c352017-08-02 16:35:00 +00001853 memcpy(I, &Target->TrapInstr, 4);
1854}
1855
Rui Ueyama6238ed22017-08-14 21:18:12 +00001856// Fill the last page of executable segments with trap instructions
1857// instead of leaving them as zero. Even though it is not required by any
1858// standard, it is in general a good thing to do for security reasons.
1859//
1860// We'll leave other pages in segments as-is because the rest will be
1861// overwritten by output sections.
Petr Hosekedd6c352017-08-02 16:35:00 +00001862template <class ELFT> void Writer<ELFT>::writeTrapInstr() {
Rui Ueyamaac27de92017-10-11 01:19:33 +00001863 if (Script->HasSections)
Petr Hosekedd6c352017-08-02 16:35:00 +00001864 return;
1865
Rui Ueyama6238ed22017-08-14 21:18:12 +00001866 // Fill the last page.
Petr Hosekedd6c352017-08-02 16:35:00 +00001867 uint8_t *Buf = Buffer->getBufferStart();
Rui Ueyama6238ed22017-08-14 21:18:12 +00001868 for (PhdrEntry *P : Phdrs)
1869 if (P->p_type == PT_LOAD && (P->p_flags & PF_X))
1870 fillTrap(Buf + alignDown(P->p_offset + P->p_filesz, Target->PageSize),
1871 Buf + alignTo(P->p_offset + P->p_filesz, Target->PageSize));
Petr Hosekedd6c352017-08-02 16:35:00 +00001872
Rui Ueyama6238ed22017-08-14 21:18:12 +00001873 // Round up the file size of the last segment to the page boundary iff it is
1874 // an executable segment to ensure that other other tools don't accidentally
1875 // trim the instruction padding (e.g. when stripping the file).
Petr Hosekedd6c352017-08-02 16:35:00 +00001876 PhdrEntry *LastRX = nullptr;
1877 for (PhdrEntry *P : Phdrs) {
1878 if (P->p_type != PT_LOAD)
1879 continue;
1880 if (P->p_flags & PF_X)
1881 LastRX = P;
1882 else
1883 LastRX = nullptr;
1884 }
Petr Hosekedd6c352017-08-02 16:35:00 +00001885 if (LastRX)
Petr Hosek7ab9f7b2017-09-01 21:48:20 +00001886 LastRX->p_memsz = LastRX->p_filesz =
1887 alignTo(LastRX->p_filesz, Target->PageSize);
Petr Hosekedd6c352017-08-02 16:35:00 +00001888}
1889
Michael J. Spencer84487f12015-07-24 21:03:07 +00001890// Write section contents to a mmap'ed file.
1891template <class ELFT> void Writer<ELFT>::writeSections() {
1892 uint8_t *Buf = Buffer->getBufferStart();
Hal Finkeldaedc122015-10-12 23:16:53 +00001893
Rui Ueyama75118252016-08-09 01:35:37 +00001894 // PPC64 needs to process relocations in the .opd section
1895 // before processing relocations in code-containing sections.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001896 if (auto *OpdCmd = findSection(".opd")) {
1897 Out::Opd = OpdCmd;
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001898 Out::OpdBuf = Buf + Out::Opd->Offset;
Rafael Espindola55b169b2017-05-24 18:08:04 +00001899 OpdCmd->template writeTo<ELFT>(Buf + Out::Opd->Offset);
Rafael Espindola7a513052015-10-13 14:45:51 +00001900 }
Hal Finkeldaedc122015-10-12 23:16:53 +00001901
Rafael Espindola24e6f362017-02-24 15:07:30 +00001902 OutputSection *EhFrameHdr =
Rafael Espindola881cc162017-05-26 17:28:17 +00001903 (In<ELFT>::EhFrameHdr && !In<ELFT>::EhFrameHdr->empty())
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001904 ? In<ELFT>::EhFrameHdr->getParent()
Rafael Espindola881cc162017-05-26 17:28:17 +00001905 : nullptr;
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001906
1907 // In -r or -emit-relocs mode, write the relocation sections first as in
1908 // ELf_Rel targets we might find out that we need to modify the relocated
1909 // section while doing it.
Rui Ueyama8ad23dc2017-10-06 20:12:43 +00001910 for (OutputSection *Sec : OutputSections)
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001911 if (Sec->Type == SHT_REL || Sec->Type == SHT_RELA)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001912 Sec->writeTo<ELFT>(Buf + Sec->Offset);
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001913
Rui Ueyama8ad23dc2017-10-06 20:12:43 +00001914 for (OutputSection *Sec : OutputSections)
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001915 if (Sec != Out::Opd && Sec != EhFrameHdr && Sec->Type != SHT_REL &&
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001916 Sec->Type != SHT_RELA)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001917 Sec->writeTo<ELFT>(Buf + Sec->Offset);
Eugene Leviante4f590f2016-08-31 07:43:50 +00001918
1919 // The .eh_frame_hdr depends on .eh_frame section contents, therefore
1920 // it should be written after .eh_frame is written.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001921 if (EhFrameHdr)
1922 EhFrameHdr->writeTo<ELFT>(Buf + EhFrameHdr->Offset);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001923}
Rui Ueyama3ce825e2015-10-09 21:07:25 +00001924
Rui Ueyama634ddf02016-03-11 20:51:53 +00001925template <class ELFT> void Writer<ELFT>::writeBuildId() {
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001926 if (!InX::BuildId || !InX::BuildId->getParent())
Rui Ueyama634ddf02016-03-11 20:51:53 +00001927 return;
1928
Petr Hosekfdfcb792016-09-01 22:43:03 +00001929 // Compute a hash of all sections of the output file.
Rui Ueyama634ddf02016-03-11 20:51:53 +00001930 uint8_t *Start = Buffer->getBufferStart();
Petr Hosekfdfcb792016-09-01 22:43:03 +00001931 uint8_t *End = Start + FileSize;
Rafael Espindola895aea62017-05-11 22:02:41 +00001932 InX::BuildId->writeBuildId({Start, End});
Rui Ueyama634ddf02016-03-11 20:51:53 +00001933}
1934
// Explicit instantiations of elf::writeResult, one for each of the four ELFT
// types named below.
Rui Ueyama84907c52016-08-09 03:38:23 +00001935 template void elf::writeResult<ELF32LE>();
1936 template void elf::writeResult<ELF32BE>();
1937 template void elf::writeResult<ELF64LE>();
1938 template void elf::writeResult<ELF64BE>();