blob: 62748082fa443ec1c855d761662de1615297db58 [file] [log] [blame]
Michael J. Spencer84487f12015-07-24 21:03:07 +00001//===- Writer.cpp ---------------------------------------------------------===//
2//
3// The LLVM Linker
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Michael J. Spencerf8325412015-09-04 22:48:30 +000010#include "Writer.h"
Rui Ueyamacb8474ed2015-08-05 23:51:50 +000011#include "Config.h"
Rui Ueyama9b55e922017-03-24 00:15:16 +000012#include "Filesystem.h"
Rui Ueyama717677a2016-02-11 21:17:59 +000013#include "LinkerScript.h"
Rafael Espindola1ebfc592017-01-13 21:05:46 +000014#include "MapFile.h"
Rui Ueyama9381eb12016-12-18 14:06:06 +000015#include "Memory.h"
Rafael Espindola5805c4f2015-09-21 21:38:08 +000016#include "OutputSections.h"
Rui Ueyama0fcdc732016-05-24 20:24:43 +000017#include "Relocations.h"
Rui Ueyamafbbde542016-06-29 09:08:02 +000018#include "Strings.h"
Rui Ueyamaafff74e22015-08-05 23:24:46 +000019#include "SymbolTable.h"
Rui Ueyama6dc7fcb2016-11-01 20:28:21 +000020#include "SyntheticSections.h"
Rafael Espindola01205f72015-09-22 18:19:46 +000021#include "Target.h"
George Rimardbf93392017-04-17 08:58:12 +000022#include "Threads.h"
Denis Protivensky8e3b38a2015-11-12 09:52:08 +000023#include "llvm/ADT/StringMap.h"
Hal Finkel3bae2d82015-10-12 20:51:48 +000024#include "llvm/ADT/StringSwitch.h"
Rui Ueyamaafff74e22015-08-05 23:24:46 +000025#include "llvm/Support/FileOutputBuffer.h"
Rui Ueyamae8b2df42016-09-29 01:45:22 +000026#include <climits>
Michael J. Spencer84487f12015-07-24 21:03:07 +000027
28using namespace llvm;
29using namespace llvm::ELF;
30using namespace llvm::object;
Peter Smith0a259f32016-10-10 09:39:26 +000031using namespace llvm::support;
32using namespace llvm::support::endian;
Michael J. Spencer84487f12015-07-24 21:03:07 +000033
34using namespace lld;
Rafael Espindolae0df00b2016-02-28 00:25:54 +000035using namespace lld::elf;
Michael J. Spencer84487f12015-07-24 21:03:07 +000036
Rui Ueyamaafff74e22015-08-05 23:24:46 +000037namespace {
38// The writer writes a SymbolTable result to a file.
39template <class ELFT> class Writer {
40public:
Rui Ueyama9328b2c2016-03-14 23:16:09 +000041 typedef typename ELFT::Shdr Elf_Shdr;
42 typedef typename ELFT::Ehdr Elf_Ehdr;
43 typedef typename ELFT::Phdr Elf_Phdr;
Rui Ueyama0ce388b2017-04-05 21:46:06 +000044
Rui Ueyamaafff74e22015-08-05 23:24:46 +000045 void run();
46
47private:
Rui Ueyamaf83aca42016-11-01 23:17:45 +000048 void createSyntheticSections();
Rui Ueyama5a9640b2015-10-08 23:49:30 +000049 void copyLocalSymbols();
Rafael Espindola08d6a3f2017-02-11 01:40:49 +000050 void addSectionSymbols();
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +000051 void addReservedSymbols();
George Rimar9e694502016-07-29 16:18:47 +000052 void createSections();
Rafael Espindolab4c9b812017-02-23 02:28:28 +000053 void forEachRelSec(std::function<void(InputSectionBase &)> Fn);
Rafael Espindola24c073d2016-09-21 22:36:19 +000054 void sortSections();
Eugene Leviante63d81b2016-07-20 14:43:20 +000055 void finalizeSections();
Rui Ueyama84417f82015-12-26 07:50:41 +000056 void addPredefinedSections();
Rafael Espindola4d560162017-09-12 16:38:01 +000057 void setReservedSymbolSections();
Rui Ueyama2df0fd82015-12-25 07:38:58 +000058
George Rimaraa354182017-07-27 07:46:50 +000059 std::vector<PhdrEntry *> createPhdrs();
Rafael Espindola074ba932016-12-06 13:43:34 +000060 void removeEmptyPTLoad();
George Rimaraa354182017-07-27 07:46:50 +000061 void addPtArmExid(std::vector<PhdrEntry *> &Phdrs);
Rui Ueyamae044e9c2016-04-01 17:07:17 +000062 void assignFileOffsets();
George Rimar86ce2672016-08-25 09:05:47 +000063 void assignFileOffsetsBinary();
Rui Ueyamae044e9c2016-04-01 17:07:17 +000064 void setPhdrs();
Rui Ueyama47091902016-03-30 19:41:51 +000065 void fixSectionAlignments();
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +000066 void openFile();
Petr Hosekedd6c352017-08-02 16:35:00 +000067 void writeTrapInstr();
Rui Ueyamaafff74e22015-08-05 23:24:46 +000068 void writeHeader();
69 void writeSections();
George Rimar86ce2672016-08-25 09:05:47 +000070 void writeSectionsBinary();
Rui Ueyama634ddf02016-03-11 20:51:53 +000071 void writeBuildId();
Rui Ueyamaafff74e22015-08-05 23:24:46 +000072
Rui Ueyama818bb2f2016-07-16 18:55:47 +000073 std::unique_ptr<FileOutputBuffer> Buffer;
Michael J. Spencer2f008242015-09-17 19:58:07 +000074
Rafael Espindola05531242017-07-06 16:40:44 +000075 OutputSectionFactory Factory;
Rafael Espindola4fc60442016-02-10 22:43:13 +000076
Rui Ueyama01687222015-12-26 09:47:57 +000077 void addRelIpltSymbols();
Rui Ueyamaa5d79d12015-12-26 09:48:00 +000078 void addStartEndSymbols();
Rafael Espindola24e6f362017-02-24 15:07:30 +000079 void addStartStopSymbols(OutputSection *Sec);
Rui Ueyama6bd38222017-04-05 21:37:09 +000080 uint64_t getEntryAddr();
Rafael Espindola8c022ca2017-07-27 19:22:43 +000081 OutputSection *findSection(StringRef Name);
Rui Ueyama2f1b79f2015-10-10 22:34:30 +000082
George Rimaraa354182017-07-27 07:46:50 +000083 std::vector<PhdrEntry *> Phdrs;
Michael J. Spencer2f008242015-09-17 19:58:07 +000084
Rui Ueyama6bd38222017-04-05 21:37:09 +000085 uint64_t FileSize;
86 uint64_t SectionHeaderOff;
Peter Smith113a59e2017-06-26 10:22:17 +000087
88 bool HasGotBaseSym = false;
Rui Ueyamaafff74e22015-08-05 23:24:46 +000089};
90} // anonymous namespace
91
Rui Ueyama55518e72016-10-28 20:57:25 +000092StringRef elf::getOutputSectionName(StringRef Name) {
George Rimar60a0ea12017-06-05 12:49:21 +000093 // ".zdebug_" is a prefix for ZLIB-compressed sections.
94 // Because we decompressed input sections, we want to remove 'z'.
95 if (Name.startswith(".zdebug_"))
96 return Saver.save("." + Name.substr(2));
97
Eugene Levianta8d12ef2016-10-05 10:10:45 +000098 if (Config->Relocatable)
99 return Name;
100
Rafael Espindola7d382732016-09-19 19:59:21 +0000101 for (StringRef V :
George Rimar1ab9cf42017-03-17 10:14:53 +0000102 {".text.", ".rodata.", ".data.rel.ro.", ".data.", ".bss.rel.ro.",
103 ".bss.", ".init_array.", ".fini_array.", ".ctors.", ".dtors.", ".tbss.",
Peter Smith691ff762017-06-28 09:12:38 +0000104 ".gcc_except_table.", ".tdata.", ".ARM.exidx.", ".ARM.extab."}) {
Rafael Espindola7d382732016-09-19 19:59:21 +0000105 StringRef Prefix = V.drop_back();
106 if (Name.startswith(V) || Name == Prefix)
107 return Prefix;
108 }
Rui Ueyama05384082016-10-12 22:36:31 +0000109
Rui Ueyamae8a61022016-11-05 23:05:47 +0000110 // CommonSection is identified as "COMMON" in linker scripts.
111 // By default, it should go to .bss section.
112 if (Name == "COMMON")
113 return ".bss";
114
George Rimar5d53d1f2016-07-12 08:50:42 +0000115 return Name;
116}
117
George Rimar696a7f92017-09-19 09:20:54 +0000118static bool needsInterpSection() {
119 return !SharedFiles.empty() && !Config->DynamicLinker.empty() &&
120 !Script->ignoreInterpSection();
Rui Ueyamafd03cfd2016-07-21 11:01:23 +0000121}
122
George Rimard8b27762016-11-14 10:14:18 +0000123template <class ELFT> void elf::writeResult() { Writer<ELFT>().run(); }
Rafael Espindola4fc60442016-02-10 22:43:13 +0000124
Rafael Espindola074ba932016-12-06 13:43:34 +0000125template <class ELFT> void Writer<ELFT>::removeEmptyPTLoad() {
George Rimar60608a82017-08-28 09:28:15 +0000126 llvm::erase_if(Phdrs, [&](const PhdrEntry *P) {
George Rimaraa354182017-07-27 07:46:50 +0000127 if (P->p_type != PT_LOAD)
Rafael Espindola074ba932016-12-06 13:43:34 +0000128 return false;
George Rimar6823c5f2017-09-07 11:01:10 +0000129 if (!P->FirstSec)
Rafael Espindola41217612016-12-08 03:17:05 +0000130 return true;
George Rimar6823c5f2017-09-07 11:01:10 +0000131 uint64_t Size = P->LastSec->Addr + P->LastSec->Size - P->FirstSec->Addr;
Rafael Espindola074ba932016-12-06 13:43:34 +0000132 return Size == 0;
133 });
Rafael Espindola074ba932016-12-06 13:43:34 +0000134}
135
Petr Hosek7b793212017-03-10 20:00:42 +0000136template <class ELFT> static void combineEhFrameSections() {
137 for (InputSectionBase *&S : InputSections) {
138 EhInputSection *ES = dyn_cast<EhInputSection>(S);
Rafael Espindolaa1565552017-03-15 12:31:54 +0000139 if (!ES || !ES->Live)
Petr Hosek7b793212017-03-10 20:00:42 +0000140 continue;
141
142 In<ELFT>::EhFrame->addSection(ES);
143 S = nullptr;
144 }
145
146 std::vector<InputSectionBase *> &V = InputSections;
147 V.erase(std::remove(V.begin(), V.end(), nullptr), V.end());
148}
149
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000150// The main function of the writer.
151template <class ELFT> void Writer<ELFT>::run() {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000152 // Create linker-synthesized sections such as .got or .plt.
153 // Such sections are of type input section.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000154 createSyntheticSections();
George Rimar7beff422016-11-15 08:19:02 +0000155
Petr Hosek7b793212017-03-10 20:00:42 +0000156 if (!Config->Relocatable)
157 combineEhFrameSections<ELFT>();
158
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000159 // We need to create some reserved symbols such as _end. Create them.
George Rimar7beff422016-11-15 08:19:02 +0000160 if (!Config->Relocatable)
161 addReservedSymbols();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000162
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000163 // Create output sections.
Rui Ueyamaa34da932017-03-21 23:03:09 +0000164 if (Script->Opt.HasSections) {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000165 // If linker script contains SECTIONS commands, let it create sections.
George Rimara8dba482017-03-20 10:09:58 +0000166 Script->processCommands(Factory);
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000167
168 // Linker scripts may have left some input sections unassigned.
169 // Assign such sections using the default rule.
George Rimara8dba482017-03-20 10:09:58 +0000170 Script->addOrphanSections(Factory);
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000171 } else {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000172 // If linker script does not contain SECTIONS commands, create
173 // output sections by default rules. We still need to give the
174 // linker script a chance to run, because it might contain
175 // non-SECTIONS commands such as ASSERT.
George Rimara8dba482017-03-20 10:09:58 +0000176 Script->processCommands(Factory);
Rafael Espindola21263342017-07-05 23:36:24 +0000177 createSections();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000178 }
179
180 if (Config->Discard != DiscardPolicy::All)
181 copyLocalSymbols();
182
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000183 if (Config->CopyRelocs)
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000184 addSectionSymbols();
185
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000186 // Now that we have a complete set of output sections. This function
187 // completes section contents. For example, we need to add strings
188 // to the string table, and add entries to .got and .plt.
189 // finalizeSections does that.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000190 finalizeSections();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000191 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000192 return;
193
Rafael Espindola55b169b2017-05-24 18:08:04 +0000194 // If -compressed-debug-sections is specified, we need to compress
195 // .debug_* sections. Do it right now because it changes the size of
196 // output sections.
George Rimara9b07142017-08-04 08:30:16 +0000197 parallelForEach(OutputSections,
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000198 [](OutputSection *Sec) { Sec->maybeCompress<ELFT>(); });
Rafael Espindola805f5152017-06-01 16:30:12 +0000199
Peter Smith5aedebf2017-07-05 09:12:54 +0000200 Script->assignAddresses();
201 Script->allocateHeaders(Phdrs);
Rafael Espindola189860c2017-06-07 02:24:08 +0000202
203 // Remove empty PT_LOAD to avoid causing the dynamic linker to try to mmap a
204 // 0 sized region. This has to be done late since only after assignAddresses
205 // we know the size of the sections.
206 removeEmptyPTLoad();
207
208 if (!Config->OFormatBinary)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000209 assignFileOffsets();
Rafael Espindola189860c2017-06-07 02:24:08 +0000210 else
211 assignFileOffsetsBinary();
212
213 setPhdrs();
214
215 if (Config->Relocatable) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000216 for (OutputSection *Sec : OutputSections)
217 Sec->Addr = 0;
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000218 }
219
George Rimar2ddab6d2017-01-17 13:50:34 +0000220 // It does not make sense try to open the file if we have error already.
221 if (ErrorCount)
222 return;
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000223 // Write the result down to a file.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000224 openFile();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000225 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000226 return;
Rafael Espindola3f235c72017-06-01 16:32:58 +0000227
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000228 if (!Config->OFormatBinary) {
Petr Hosekedd6c352017-08-02 16:35:00 +0000229 writeTrapInstr();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000230 writeHeader();
231 writeSections();
232 } else {
233 writeSectionsBinary();
234 }
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000235
236 // Backfill .note.gnu.build-id section content. This is done at last
237 // because the content is usually a hash value of the entire output file.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000238 writeBuildId();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000239 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000240 return;
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000241
Rui Ueyama40eaa992017-01-18 03:34:38 +0000242 // Handle -Map option.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000243 writeMapFile<ELFT>();
Rui Ueyama40eaa992017-01-18 03:34:38 +0000244 if (ErrorCount)
245 return;
246
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000247 if (auto EC = Buffer->commit())
Rui Ueyamac8d3a832017-01-12 22:18:04 +0000248 error("failed to write to the output file: " + EC.message());
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000249
250 // Flush the output streams and exit immediately. A full shutdown
251 // is a good test that we are keeping track of all allocated memory,
252 // but actually freeing it is a waste of time in a regular linker run.
253 if (Config->ExitEarly)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000254 exitLld(0);
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000255}
256
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000257// Initialize Out members.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000258template <class ELFT> void Writer<ELFT>::createSyntheticSections() {
259 // Initialize all pointers with NULL. This is needed because
260 // you can call lld::elf::main more than once as a library.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000261 memset(&Out::First, 0, sizeof(Out));
Rui Ueyamacfadbd92016-11-01 23:12:51 +0000262
Rui Ueyama536a2672017-02-27 02:32:08 +0000263 auto Add = [](InputSectionBase *Sec) { InputSections.push_back(Sec); };
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000264
Rafael Espindola895aea62017-05-11 22:02:41 +0000265 InX::DynStrTab = make<StringTableSection>(".dynstr", true);
Rafael Espindola5ab19892017-05-11 23:16:43 +0000266 InX::Dynamic = make<DynamicSection<ELFT>>();
Eugene Levianta96d9022016-11-16 10:02:27 +0000267 In<ELFT>::RelaDyn = make<RelocationSection<ELFT>>(
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000268 Config->IsRela ? ".rela.dyn" : ".rel.dyn", Config->ZCombreloc);
Rafael Espindola895aea62017-05-11 22:02:41 +0000269 InX::ShStrTab = make<StringTableSection>(".shstrtab", false);
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000270
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000271 Out::ElfHeader = make<OutputSection>("", 0, SHF_ALLOC);
272 Out::ElfHeader->Size = sizeof(Elf_Ehdr);
273 Out::ProgramHeaders = make<OutputSection>("", 0, SHF_ALLOC);
Rui Ueyama6bd38222017-04-05 21:37:09 +0000274 Out::ProgramHeaders->updateAlignment(Config->Wordsize);
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000275
George Rimar696a7f92017-09-19 09:20:54 +0000276 if (needsInterpSection()) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000277 InX::Interp = createInterpSection();
278 Add(InX::Interp);
Rui Ueyamae8a61022016-11-05 23:05:47 +0000279 } else {
Rafael Espindola895aea62017-05-11 22:02:41 +0000280 InX::Interp = nullptr;
Rui Ueyamae8a61022016-11-05 23:05:47 +0000281 }
Rui Ueyama3a41be22016-04-07 22:49:21 +0000282
George Rimarf21aade2016-08-31 08:38:11 +0000283 if (Config->Strip != StripPolicy::All) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000284 InX::StrTab = make<StringTableSection>(".strtab", false);
George Rimarf45f6812017-05-16 08:53:30 +0000285 InX::SymTab = make<SymbolTableSection<ELFT>>(*InX::StrTab);
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000286 }
Rui Ueyamacfadbd92016-11-01 23:12:51 +0000287
Rui Ueyamac4030a12016-11-22 00:54:15 +0000288 if (Config->BuildId != BuildIdKind::None) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000289 InX::BuildId = make<BuildIdSection>();
290 Add(InX::BuildId);
Rui Ueyamac4030a12016-11-22 00:54:15 +0000291 }
Rui Ueyamae8a61022016-11-05 23:05:47 +0000292
Rafael Espindola895aea62017-05-11 22:02:41 +0000293 InX::Bss = make<BssSection>(".bss");
294 Add(InX::Bss);
295 InX::BssRelRo = make<BssSection>(".bss.rel.ro");
296 Add(InX::BssRelRo);
George Rimar1ab9cf42017-03-17 10:14:53 +0000297
Rui Ueyama1d75de02016-11-22 04:28:39 +0000298 // Add MIPS-specific sections.
Simon Atanasyance02cf02016-11-09 21:36:56 +0000299 if (Config->EMachine == EM_MIPS) {
Rafael Espindolae05e2f82017-09-15 18:05:02 +0000300 if (!Config->Shared && Config->HasDynSymTab) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000301 InX::MipsRldMap = make<MipsRldMapSection>();
302 Add(InX::MipsRldMap);
Eugene Leviant17b7a572016-11-22 17:49:14 +0000303 }
Rui Ueyama1d75de02016-11-22 04:28:39 +0000304 if (auto *Sec = MipsAbiFlagsSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000305 Add(Sec);
Rui Ueyama1d75de02016-11-22 04:28:39 +0000306 if (auto *Sec = MipsOptionsSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000307 Add(Sec);
Rui Ueyama1d75de02016-11-22 04:28:39 +0000308 if (auto *Sec = MipsReginfoSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000309 Add(Sec);
Simon Atanasyance02cf02016-11-09 21:36:56 +0000310 }
Eugene Leviant41ca3272016-11-10 09:48:29 +0000311
Rafael Espindolae05e2f82017-09-15 18:05:02 +0000312 if (Config->HasDynSymTab) {
George Rimar69b17c32017-05-16 10:04:42 +0000313 InX::DynSymTab = make<SymbolTableSection<ELFT>>(*InX::DynStrTab);
314 Add(InX::DynSymTab);
George Rimar11992c862016-11-25 08:05:41 +0000315
316 In<ELFT>::VerSym = make<VersionTableSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000317 Add(In<ELFT>::VerSym);
George Rimar11992c862016-11-25 08:05:41 +0000318
319 if (!Config->VersionDefinitions.empty()) {
320 In<ELFT>::VerDef = make<VersionDefinitionSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000321 Add(In<ELFT>::VerDef);
George Rimar11992c862016-11-25 08:05:41 +0000322 }
323
324 In<ELFT>::VerNeed = make<VersionNeedSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000325 Add(In<ELFT>::VerNeed);
George Rimar11992c862016-11-25 08:05:41 +0000326
327 if (Config->GnuHash) {
George Rimar69b17c32017-05-16 10:04:42 +0000328 InX::GnuHashTab = make<GnuHashTableSection>();
329 Add(InX::GnuHashTab);
George Rimar11992c862016-11-25 08:05:41 +0000330 }
331
332 if (Config->SysvHash) {
George Rimaraaf54712017-09-27 09:14:59 +0000333 InX::HashTab = make<HashTableSection>();
334 Add(InX::HashTab);
George Rimar11992c862016-11-25 08:05:41 +0000335 }
336
Rafael Espindola5ab19892017-05-11 23:16:43 +0000337 Add(InX::Dynamic);
Rafael Espindola895aea62017-05-11 22:02:41 +0000338 Add(InX::DynStrTab);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000339 Add(In<ELFT>::RelaDyn);
George Rimar11992c862016-11-25 08:05:41 +0000340 }
341
Rui Ueyama1d75de02016-11-22 04:28:39 +0000342 // Add .got. MIPS' .got is so different from the other archs,
343 // it has its own class.
George Rimar11992c862016-11-25 08:05:41 +0000344 if (Config->EMachine == EM_MIPS) {
Rafael Espindolab3aa2c92017-05-11 21:33:30 +0000345 InX::MipsGot = make<MipsGotSection>();
346 Add(InX::MipsGot);
George Rimar11992c862016-11-25 08:05:41 +0000347 } else {
Rafael Espindolaa6465bb2017-05-18 16:45:36 +0000348 InX::Got = make<GotSection>();
Rafael Espindola88ab9fb2017-05-11 23:26:03 +0000349 Add(InX::Got);
George Rimar11992c862016-11-25 08:05:41 +0000350 }
Simon Atanasyan725dc142016-11-16 21:01:02 +0000351
Rafael Espindola4b1c3692017-05-11 21:23:38 +0000352 InX::GotPlt = make<GotPltSection>();
353 Add(InX::GotPlt);
Rafael Espindola895aea62017-05-11 22:02:41 +0000354 InX::IgotPlt = make<IgotPltSection>();
355 Add(InX::IgotPlt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000356
357 if (Config->GdbIndex) {
Rafael Espindola300b3862017-07-12 23:56:53 +0000358 InX::GdbIndex = createGdbIndex<ELFT>();
Rafael Espindola895aea62017-05-11 22:02:41 +0000359 Add(InX::GdbIndex);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000360 }
361
362 // We always need to add rel[a].plt to output if it has entries.
363 // Even for static linking it can contain R_[*]_IRELATIVE relocations.
364 In<ELFT>::RelaPlt = make<RelocationSection<ELFT>>(
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000365 Config->IsRela ? ".rela.plt" : ".rel.plt", false /*Sort*/);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000366 Add(In<ELFT>::RelaPlt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000367
Peter Smithbaffdb82016-12-08 12:58:55 +0000368 // The RelaIplt immediately follows .rel.plt (.rel.dyn for ARM) to ensure
369 // that the IRelative relocations are processed last by the dynamic loader
370 In<ELFT>::RelaIplt = make<RelocationSection<ELFT>>(
371 (Config->EMachine == EM_ARM) ? ".rel.dyn" : In<ELFT>::RelaPlt->Name,
372 false /*Sort*/);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000373 Add(In<ELFT>::RelaIplt);
Peter Smithbaffdb82016-12-08 12:58:55 +0000374
Rafael Espindola895aea62017-05-11 22:02:41 +0000375 InX::Plt = make<PltSection>(Target->PltHeaderSize);
376 Add(InX::Plt);
377 InX::Iplt = make<PltSection>(0);
378 Add(InX::Iplt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000379
Rafael Espindola66b4e212017-02-23 22:06:28 +0000380 if (!Config->Relocatable) {
George Rimar1c74c2f2017-03-09 08:45:25 +0000381 if (Config->EhFrameHdr) {
382 In<ELFT>::EhFrameHdr = make<EhFrameHeader<ELFT>>();
383 Add(In<ELFT>::EhFrameHdr);
384 }
Rafael Espindola66b4e212017-02-23 22:06:28 +0000385 In<ELFT>::EhFrame = make<EhFrameSection<ELFT>>();
386 Add(In<ELFT>::EhFrame);
387 }
388
George Rimar69b17c32017-05-16 10:04:42 +0000389 if (InX::SymTab)
390 Add(InX::SymTab);
Rafael Espindola895aea62017-05-11 22:02:41 +0000391 Add(InX::ShStrTab);
392 if (InX::StrTab)
393 Add(InX::StrTab);
Michael J. Spencer84487f12015-07-24 21:03:07 +0000394}
395
Rafael Espindola5616adf2017-03-08 22:36:28 +0000396static bool shouldKeepInSymtab(SectionBase *Sec, StringRef SymName,
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000397 const SymbolBody &B) {
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000398 if (B.isFile() || B.isSection())
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000399 return false;
400
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000401 // If sym references a section in a discarded group, don't keep it.
Rafael Espindola774ea7d2017-02-23 16:49:07 +0000402 if (Sec == &InputSection::Discarded)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000403 return false;
404
George Rimar9503f6d2016-08-31 08:46:30 +0000405 if (Config->Discard == DiscardPolicy::None)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000406 return true;
407
408 // In ELF assembly .L symbols are normally discarded by the assembler.
409 // If the assembler fails to do so, the linker discards them if
410 // * --discard-locals is used.
411 // * The symbol is in a SHF_MERGE section, which is normally the reason for
412 // the assembler keeping the .L symbol.
413 if (!SymName.startswith(".L") && !SymName.empty())
414 return true;
415
George Rimar9503f6d2016-08-31 08:46:30 +0000416 if (Config->Discard == DiscardPolicy::Locals)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000417 return false;
418
Rafael Espindola1854a8e2016-10-26 12:36:56 +0000419 return !Sec || !(Sec->Flags & SHF_MERGE);
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000420}
421
George Rimar7702bc22017-03-16 11:20:02 +0000422static bool includeInSymtab(const SymbolBody &B) {
Rafael Espindola474eb012016-05-05 16:40:28 +0000423 if (!B.isLocal() && !B.symbol()->IsUsedInRegularObj)
424 return false;
425
Rui Ueyama80474a22017-02-28 19:29:55 +0000426 if (auto *D = dyn_cast<DefinedRegular>(&B)) {
Rafael Espindola474eb012016-05-05 16:40:28 +0000427 // Always include absolute symbols.
Rafael Espindola5616adf2017-03-08 22:36:28 +0000428 SectionBase *Sec = D->Section;
429 if (!Sec)
Rafael Espindola474eb012016-05-05 16:40:28 +0000430 return true;
Rafael Espindola5616adf2017-03-08 22:36:28 +0000431 if (auto *IS = dyn_cast<InputSectionBase>(Sec)) {
432 Sec = IS->Repl;
433 IS = cast<InputSectionBase>(Sec);
434 // Exclude symbols pointing to garbage-collected sections.
435 if (!IS->Live)
436 return false;
437 }
438 if (auto *S = dyn_cast<MergeInputSection>(Sec))
Rui Ueyama90fa3722016-05-22 00:41:38 +0000439 if (!S->getSectionPiece(D->Value)->Live)
Rafael Espindola474eb012016-05-05 16:40:28 +0000440 return false;
441 }
442 return true;
443}
Rafael Espindola462220d2016-05-05 16:38:46 +0000444
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000445// Local symbols are not in the linker's symbol table. This function scans
446// each object file's symbol table to copy local symbols to the output.
447template <class ELFT> void Writer<ELFT>::copyLocalSymbols() {
George Rimar69b17c32017-05-16 10:04:42 +0000448 if (!InX::SymTab)
Rui Ueyama90f76fb2016-01-21 03:07:38 +0000449 return;
George Rimar696a7f92017-09-19 09:20:54 +0000450 for (InputFile *File : ObjectFiles) {
451 ObjFile<ELFT> *F = cast<ObjFile<ELFT>>(File);
Rafael Espindola67d72c02016-03-11 12:06:30 +0000452 for (SymbolBody *B : F->getLocalSymbols()) {
George Rimar78fe56e2016-10-11 09:07:14 +0000453 if (!B->IsLocal)
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000454 fatal(toString(F) +
George Rimar78fe56e2016-10-11 09:07:14 +0000455 ": broken object: getLocalSymbols returns a non-local symbol");
Rui Ueyama80474a22017-02-28 19:29:55 +0000456 auto *DR = dyn_cast<DefinedRegular>(B);
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000457
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000458 // No reason to keep local undefined symbol in symtab.
459 if (!DR)
Rafael Espindola444576d2015-10-09 19:25:07 +0000460 continue;
George Rimar7702bc22017-03-16 11:20:02 +0000461 if (!includeInSymtab(*B))
Rafael Espindola462220d2016-05-05 16:38:46 +0000462 continue;
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000463
Rafael Espindola5616adf2017-03-08 22:36:28 +0000464 SectionBase *Sec = DR->Section;
George Rimar7702bc22017-03-16 11:20:02 +0000465 if (!shouldKeepInSymtab(Sec, B->getName(), *B))
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000466 continue;
George Rimar69b17c32017-05-16 10:04:42 +0000467 InX::SymTab->addSymbol(B);
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000468 }
469 }
470}
471
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000472template <class ELFT> void Writer<ELFT>::addSectionSymbols() {
473 // Create one STT_SECTION symbol for each output section we might
474 // have a relocation with.
Rafael Espindolad48b2082017-07-04 19:08:40 +0000475 for (BaseCommand *Base : Script->Opt.Commands) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000476 auto *Sec = dyn_cast<OutputSection>(Base);
477 if (!Sec)
Rui Ueyama73d29ab2017-02-28 19:43:54 +0000478 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000479 auto I = llvm::find_if(Sec->Commands, [](BaseCommand *Base) {
Rafael Espindolad48b2082017-07-04 19:08:40 +0000480 if (auto *ISD = dyn_cast<InputSectionDescription>(Base))
481 return !ISD->Sections.empty();
482 return false;
483 });
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000484 if (I == Sec->Commands.end())
Rafael Espindolad48b2082017-07-04 19:08:40 +0000485 continue;
486 InputSection *IS = cast<InputSectionDescription>(*I)->Sections[0];
Rui Ueyama73d29ab2017-02-28 19:43:54 +0000487 if (isa<SyntheticSection>(IS) || IS->Type == SHT_REL ||
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000488 IS->Type == SHT_RELA)
489 continue;
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000490
Rui Ueyama175e81c2017-02-28 19:36:30 +0000491 auto *Sym =
492 make<DefinedRegular>("", /*IsLocal=*/true, /*StOther=*/0, STT_SECTION,
Rafael Espindola6e93d052017-08-04 22:31:42 +0000493 /*Value=*/0, /*Size=*/0, IS);
George Rimar69b17c32017-05-16 10:04:42 +0000494 InX::SymTab->addSymbol(Sym);
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000495 }
496}
497
Rui Ueyama26ad0572017-02-16 04:51:46 +0000498// Today's loaders have a feature to make segments read-only after
499// processing dynamic relocations to enhance security. PT_GNU_RELRO
500// is defined for that.
501//
502// This function returns true if a section needs to be put into a
503// PT_GNU_RELRO segment.
Rafael Espindoladc49af92017-07-24 23:55:33 +0000504static bool isRelroSection(const OutputSection *Sec) {
Rafael Espindola4fc60442016-02-10 22:43:13 +0000505 if (!Config->ZRelro)
506 return false;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000507
Rafael Espindolae08e78d2016-11-09 23:23:45 +0000508 uint64_t Flags = Sec->Flags;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000509
510 // Non-allocatable or non-writable sections don't need RELRO because
511 // they are not writable or not even mapped to memory in the first place.
512 // RELRO is for sections that are essentially read-only but need to
513 // be writable only at process startup to allow dynamic linker to
514 // apply relocations.
George Rimare3336c02015-11-24 10:15:50 +0000515 if (!(Flags & SHF_ALLOC) || !(Flags & SHF_WRITE))
516 return false;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000517
518 // Once initialized, TLS data segments are used as data templates
519 // for a thread-local storage. For each new thread, runtime
520 // allocates memory for a TLS and copy templates there. No thread
521 // are supposed to use templates directly. Thus, it can be in RELRO.
Rui Ueyamaccfc3262015-12-10 19:13:08 +0000522 if (Flags & SHF_TLS)
523 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000524
Rui Ueyama9d773f32017-04-13 05:40:07 +0000525 // .init_array, .preinit_array and .fini_array contain pointers to
526 // functions that are executed on process startup or exit. These
527 // pointers are set by the static linker, and they are not expected
528 // to change at runtime. But if you are an attacker, you could do
529 // interesting things by manipulating pointers in .fini_array, for
530 // example. So they are put into RELRO.
Rafael Espindola04a2e342016-11-09 01:42:41 +0000531 uint32_t Type = Sec->Type;
Rui Ueyamaccfc3262015-12-10 19:13:08 +0000532 if (Type == SHT_INIT_ARRAY || Type == SHT_FINI_ARRAY ||
533 Type == SHT_PREINIT_ARRAY)
George Rimare3336c02015-11-24 10:15:50 +0000534 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000535
Rui Ueyama9d773f32017-04-13 05:40:07 +0000536 // .got contains pointers to external symbols. They are resolved by
537 // the dynamic linker when a module is loaded into memory, and after
538 // that they are not expected to change. So, it can be in RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000539 if (InX::Got && Sec == InX::Got->getParent())
Simon Atanasyan725dc142016-11-16 21:01:02 +0000540 return true;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000541
542 // .got.plt contains pointers to external function symbols. They are
543 // by default resolved lazily, so we usually cannot put it into RELRO.
544 // However, if "-z now" is given, the lazy symbol resolution is
545 // disabled, which enables us to put it into RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000546 if (Sec == InX::GotPlt->getParent())
Rui Ueyama9d773f32017-04-13 05:40:07 +0000547 return Config->ZNow;
548
549 // .dynamic section contains data for the dynamic linker, and
550 // there's no need to write to it at runtime, so it's better to put
551 // it into RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000552 if (Sec == InX::Dynamic->getParent())
Rui Ueyama9d773f32017-04-13 05:40:07 +0000553 return true;
554
555 // .bss.rel.ro is used for copy relocations for read-only symbols.
556 // Since the dynamic linker needs to process copy relocations, the
557 // section cannot be read-only, but once initialized, they shouldn't
558 // change.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000559 if (Sec == InX::BssRelRo->getParent())
Peter Collingbournefeb66292017-01-10 01:21:50 +0000560 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000561
Rui Ueyama9d773f32017-04-13 05:40:07 +0000562 // Sections with some special names are put into RELRO. This is a
563 // bit unfortunate because section names shouldn't be significant in
564 // ELF in spirit. But in reality many linker features depend on
565 // magic section names.
Rafael Espindola40849412017-02-24 14:28:00 +0000566 StringRef S = Sec->Name;
Rui Ueyama01faef02015-12-10 19:19:04 +0000567 return S == ".data.rel.ro" || S == ".ctors" || S == ".dtors" || S == ".jcr" ||
George Rimard003c7f2016-12-20 11:28:54 +0000568 S == ".eh_frame" || S == ".openbsd.randomdata";
George Rimare3336c02015-11-24 10:15:50 +0000569}
570
// Every output section is given a rank that determines where it is placed in
// the file. Rather than plain ordinals (0,1,2...), a rank is a set of flags,
// one for each decision point that getSectionRank goes through while placing
// the section. The flag for an earlier decision occupies a more significant
// bit.
// Encoding the rank as flags has two key properties:
// * It is easy to check if a given branch was taken.
// * It is easy to see how similar two ranks are (see getRankProximity).
enum RankFlags {
  RF_NOT_ADDR_SET = 1 << 16,  // Name is not in Config->SectionStartMap.
  RF_NOT_INTERP = 1 << 15,    // Not the .interp section.
  RF_NOT_ALLOC = 1 << 14,     // SHF_ALLOC is not set.
  RF_WRITE = 1 << 13,         // Writable, not executable.
  RF_EXEC_WRITE = 1 << 12,    // Writable and executable.
  RF_EXEC = 1 << 11,          // Executable, not writable.
  RF_NON_TLS_BSS = 1 << 10,   // SHT_NOBITS without SHF_TLS.
  RF_NON_TLS_BSS_RO = 1 << 9, // Keeps the RELRO sections contiguous.
  RF_NOT_TLS = 1 << 8,        // SHF_TLS is not set.
  RF_BSS = 1 << 7,            // SHT_NOBITS.
  RF_PPC_NOT_TOCBSS = 1 << 6, // PPC64: not .tocbss.
  RF_PPC_OPD = 1 << 5,        // PPC64: .opd.
  RF_PPC_TOCL = 1 << 4,       // PPC64: .toc1.
  RF_PPC_TOC = 1 << 3,        // PPC64: .toc.
  RF_PPC_BRANCH_LT = 1 << 2,  // PPC64: .branch_lt.
  RF_MIPS_GPREL = 1 << 1,     // MIPS: SHF_MIPS_GPREL is set.
  RF_MIPS_NOT_GOT = 1 << 0    // MIPS: not .got.
};
Rui Ueyamae288eef2016-11-02 18:58:44 +0000597
Rafael Espindola52101412017-05-12 14:52:22 +0000598static unsigned getSectionRank(const OutputSection *Sec) {
599 unsigned Rank = 0;
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000600
Rafael Espindola5967c972016-12-19 21:21:07 +0000601 // We want to put section specified by -T option first, so we
602 // can start assigning VA starting from them later.
Rafael Espindola52101412017-05-12 14:52:22 +0000603 if (Config->SectionStartMap.count(Sec->Name))
604 return Rank;
605 Rank |= RF_NOT_ADDR_SET;
606
607 // Put .interp first because some loaders want to see that section
608 // on the first page of the executable file when loaded into memory.
609 if (Sec->Name == ".interp")
610 return Rank;
611 Rank |= RF_NOT_INTERP;
612
613 // Allocatable sections go first to reduce the total PT_LOAD size and
614 // so debug info doesn't change addresses in actual code.
615 if (!(Sec->Flags & SHF_ALLOC))
616 return Rank | RF_NOT_ALLOC;
Rafael Espindola5967c972016-12-19 21:21:07 +0000617
Rafael Espindolad23e9262017-05-26 17:23:25 +0000618 // Sort sections based on their access permission in the following
619 // order: R, RX, RWX, RW. This order is based on the following
620 // considerations:
621 // * Read-only sections come first such that they go in the
622 // PT_LOAD covering the program headers at the start of the file.
623 // * Read-only, executable sections come next, unless the
624 // -no-rosegment option is used.
625 // * Writable, executable sections follow such that .plt on
626 // architectures where it needs to be writable will be placed
627 // between .text and .data.
628 // * Writable sections come last, such that .bss lands at the very
629 // end of the last PT_LOAD.
630 bool IsExec = Sec->Flags & SHF_EXECINSTR;
631 bool IsWrite = Sec->Flags & SHF_WRITE;
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000632
Rafael Espindolad23e9262017-05-26 17:23:25 +0000633 if (IsExec) {
634 if (IsWrite)
635 Rank |= RF_EXEC_WRITE;
636 else if (!Config->SingleRoRx)
Rafael Espindola52101412017-05-12 14:52:22 +0000637 Rank |= RF_EXEC;
Rafael Espindolad23e9262017-05-26 17:23:25 +0000638 } else {
639 if (IsWrite)
640 Rank |= RF_WRITE;
Rafael Espindolae979fd12016-09-29 22:48:55 +0000641 }
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000642
Hal Finkel0d7e83b2015-10-13 17:57:46 +0000643 // If we got here we know that both A and B are in the same PT_LOAD.
Michael J. Spencer1bf73002015-10-16 23:11:07 +0000644
Rafael Espindola52101412017-05-12 14:52:22 +0000645 bool IsTls = Sec->Flags & SHF_TLS;
646 bool IsNoBits = Sec->Type == SHT_NOBITS;
Hal Finkel3bae2d82015-10-12 20:51:48 +0000647
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000648 // The first requirement we have is to put (non-TLS) nobits sections last. The
649 // reason is that the only thing the dynamic linker will see about them is a
650 // p_memsz that is larger than p_filesz. Seeing that it zeros the end of the
651 // PT_LOAD, so that has to correspond to the nobits sections.
Rafael Espindola52101412017-05-12 14:52:22 +0000652 bool IsNonTlsNoBits = IsNoBits && !IsTls;
653 if (IsNonTlsNoBits)
654 Rank |= RF_NON_TLS_BSS;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000655
656 // We place nobits RelRo sections before plain r/w ones, and non-nobits RelRo
657 // sections after r/w ones, so that the RelRo sections are contiguous.
Rafael Espindola52101412017-05-12 14:52:22 +0000658 bool IsRelRo = isRelroSection(Sec);
659 if (IsNonTlsNoBits && !IsRelRo)
660 Rank |= RF_NON_TLS_BSS_RO;
661 if (!IsNonTlsNoBits && IsRelRo)
662 Rank |= RF_NON_TLS_BSS_RO;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000663
664 // The TLS initialization block needs to be a single contiguous block in a R/W
665 // PT_LOAD, so stick TLS sections directly before the other RelRo R/W
666 // sections. The TLS NOBITS sections are placed here as they don't take up
667 // virtual address space in the PT_LOAD.
Rafael Espindola52101412017-05-12 14:52:22 +0000668 if (!IsTls)
669 Rank |= RF_NOT_TLS;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000670
671 // Within the TLS initialization block, the non-nobits sections need to appear
672 // first.
Rafael Espindola52101412017-05-12 14:52:22 +0000673 if (IsNoBits)
674 Rank |= RF_BSS;
George Rimare3336c02015-11-24 10:15:50 +0000675
Ben Dunbobbin95637552017-08-18 16:15:36 +0000676 // Some architectures have additional ordering restrictions for sections
677 // within the same PT_LOAD.
Rafael Espindola52101412017-05-12 14:52:22 +0000678 if (Config->EMachine == EM_PPC64) {
679 // PPC64 has a number of special SHT_PROGBITS+SHF_ALLOC+SHF_WRITE sections
680 // that we would like to make sure appear is a specific order to maximize
681 // their coverage by a single signed 16-bit offset from the TOC base
682 // pointer. Conversely, the special .tocbss section should be first among
683 // all SHT_NOBITS sections. This will put it next to the loaded special
684 // PPC64 sections (and, thus, within reach of the TOC base pointer).
685 StringRef Name = Sec->Name;
686 if (Name != ".tocbss")
687 Rank |= RF_PPC_NOT_TOCBSS;
Hal Finkel9abc2a52015-10-13 19:07:29 +0000688
Rafael Espindola52101412017-05-12 14:52:22 +0000689 if (Name == ".opd")
690 Rank |= RF_PPC_OPD;
691
692 if (Name == ".toc1")
693 Rank |= RF_PPC_TOCL;
694
695 if (Name == ".toc")
696 Rank |= RF_PPC_TOC;
697
698 if (Name == ".branch_lt")
699 Rank |= RF_PPC_BRANCH_LT;
700 }
701 if (Config->EMachine == EM_MIPS) {
702 // All sections with SHF_MIPS_GPREL flag should be grouped together
703 // because data in these sections is addressable with a gp relative address.
704 if (Sec->Flags & SHF_MIPS_GPREL)
705 Rank |= RF_MIPS_GPREL;
706
707 if (Sec->Name != ".got")
708 Rank |= RF_MIPS_NOT_GOT;
709 }
710
711 return Rank;
712}
713
Rafael Espindola383971d2017-06-15 21:51:01 +0000714static bool compareSections(const BaseCommand *ACmd, const BaseCommand *BCmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000715 const OutputSection *A = cast<OutputSection>(ACmd);
716 const OutputSection *B = cast<OutputSection>(BCmd);
Rafael Espindola52101412017-05-12 14:52:22 +0000717 if (A->SortRank != B->SortRank)
718 return A->SortRank < B->SortRank;
719 if (!(A->SortRank & RF_NOT_ADDR_SET))
720 return Config->SectionStartMap.lookup(A->Name) <
721 Config->SectionStartMap.lookup(B->Name);
Rafael Espindola24c073d2016-09-21 22:36:19 +0000722 return false;
723}
724
Rafael Espindola24e6f362017-02-24 15:07:30 +0000725void PhdrEntry::add(OutputSection *Sec) {
George Rimar6823c5f2017-09-07 11:01:10 +0000726 LastSec = Sec;
727 if (!FirstSec)
728 FirstSec = Sec;
Rafael Espindola37707632017-03-07 14:55:52 +0000729 p_align = std::max(p_align, Sec->Alignment);
Rafael Espindola17cb7c02016-12-19 17:01:01 +0000730 if (p_type == PT_LOAD)
George Rimar582ede82017-09-07 10:53:07 +0000731 Sec->PtLoad = this;
Eugene Leviantbbe38602016-07-19 09:25:43 +0000732}
733
Denis Protivensky8e3b38a2015-11-12 09:52:08 +0000734template <class ELFT>
Rafael Espindola5616adf2017-03-08 22:36:28 +0000735static Symbol *addRegular(StringRef Name, SectionBase *Sec, uint64_t Value,
736 uint8_t StOther = STV_HIDDEN,
737 uint8_t Binding = STB_WEAK) {
Rafael Espindoladab02d42016-11-17 21:20:16 +0000738 // The linker generated symbols are added as STB_WEAK to allow user defined
739 // ones to override them.
Rafael Espindola244ef982017-07-26 18:42:48 +0000740 return Symtab->addRegular<ELFT>(Name, StOther, STT_NOTYPE, Value,
741 /*Size=*/0, Binding, Sec,
742 /*File=*/nullptr);
Eugene Leviantad4439e2016-11-11 11:33:32 +0000743}
744
745template <class ELFT>
Rafael Espindola5616adf2017-03-08 22:36:28 +0000746static DefinedRegular *
747addOptionalRegular(StringRef Name, SectionBase *Sec, uint64_t Val,
748 uint8_t StOther = STV_HIDDEN, uint8_t Binding = STB_GLOBAL) {
Rafael Espindola244ef982017-07-26 18:42:48 +0000749 SymbolBody *S = Symtab->find(Name);
Eugene Leviantad4439e2016-11-11 11:33:32 +0000750 if (!S)
751 return nullptr;
Rafael Espindola1d6d1b42017-01-17 16:08:06 +0000752 if (S->isInCurrentDSO())
Rafael Espindola5616adf2017-03-08 22:36:28 +0000753 return nullptr;
754 return cast<DefinedRegular>(
755 addRegular<ELFT>(Name, Sec, Val, StOther, Binding)->body());
Eugene Leviantad4439e2016-11-11 11:33:32 +0000756}
757
Rui Ueyama01687222015-12-26 09:47:57 +0000758// The beginning and the ending of .rel[a].plt section are marked
759// with __rel[a]_iplt_{start,end} symbols if it is a statically linked
760// executable. The runtime needs these symbols in order to resolve
761// all IRELATIVE relocs on startup. For dynamic executables, we don't
762// need these symbols, since IRELATIVE relocs are resolved through GOT
763// and PLT. For details, see http://www.airs.com/blog/archives/403.
George Rimaree741cf2016-04-14 13:23:02 +0000764template <class ELFT> void Writer<ELFT>::addRelIpltSymbols() {
Shoaib Meenai335fad12017-08-05 05:01:07 +0000765 if (!Config->Static)
George Rimara07ff662015-12-21 10:12:06 +0000766 return;
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000767 StringRef S = Config->IsRela ? "__rela_iplt_start" : "__rel_iplt_start";
Rafael Espindola5616adf2017-03-08 22:36:28 +0000768 addOptionalRegular<ELFT>(S, In<ELFT>::RelaIplt, 0, STV_HIDDEN, STB_WEAK);
Rui Ueyama01687222015-12-26 09:47:57 +0000769
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000770 S = Config->IsRela ? "__rela_iplt_end" : "__rel_iplt_end";
Rafael Espindola5616adf2017-03-08 22:36:28 +0000771 addOptionalRegular<ELFT>(S, In<ELFT>::RelaIplt, -1, STV_HIDDEN, STB_WEAK);
George Rimara07ff662015-12-21 10:12:06 +0000772}
773
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000774// The linker is expected to define some symbols depending on
775// the linking result. This function defines such symbols.
776template <class ELFT> void Writer<ELFT>::addReservedSymbols() {
George Rimar7beff422016-11-15 08:19:02 +0000777 if (Config->EMachine == EM_MIPS) {
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000778 // Define _gp for MIPS. st_value of _gp symbol will be updated by Writer
Simon Atanasyan6a4eb752016-12-08 06:19:47 +0000779 // so that it points to an absolute address which by default is relative
780 // to GOT. Default offset is 0x7ff0.
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000781 // See "Global Data Symbols" in Chapter 6 in the following document:
782 // ftp://www.linux-mips.org/pub/linux/mips/doc/ABI/mipsabi.pdf
Rafael Espindola244ef982017-07-26 18:42:48 +0000783 ElfSym::MipsGp = Symtab->addAbsolute<ELFT>("_gp", STV_HIDDEN, STB_LOCAL);
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000784
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000785 // On MIPS O32 ABI, _gp_disp is a magic symbol designates offset between
Simon Atanasyand34a3632017-03-20 21:03:43 +0000786 // start of function and 'gp' pointer into GOT.
Rafael Espindola244ef982017-07-26 18:42:48 +0000787 if (Symtab->find("_gp_disp"))
Rui Ueyama80474a22017-02-28 19:29:55 +0000788 ElfSym::MipsGpDisp =
Rafael Espindola244ef982017-07-26 18:42:48 +0000789 Symtab->addAbsolute<ELFT>("_gp_disp", STV_HIDDEN, STB_LOCAL);
Peter Collingbourne6f535b72016-05-03 18:03:45 +0000790
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000791 // The __gnu_local_gp is a magic symbol equal to the current value of 'gp'
792 // pointer. This symbol is used in the code generated by .cpload pseudo-op
793 // in case of using -mno-shared option.
794 // https://sourceware.org/ml/binutils/2004-12/msg00094.html
Rafael Espindola244ef982017-07-26 18:42:48 +0000795 if (Symtab->find("__gnu_local_gp"))
Rui Ueyama80474a22017-02-28 19:29:55 +0000796 ElfSym::MipsLocalGp =
Rafael Espindola244ef982017-07-26 18:42:48 +0000797 Symtab->addAbsolute<ELFT>("__gnu_local_gp", STV_HIDDEN, STB_LOCAL);
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000798 }
799
Peter Smith113a59e2017-06-26 10:22:17 +0000800 // The _GLOBAL_OFFSET_TABLE_ symbol is defined by target convention to
801 // be at some offset from the base of the .got section, usually 0 or the end
802 // of the .got
Rui Ueyama92c37812017-06-26 15:11:24 +0000803 InputSection *GotSection = InX::MipsGot ? cast<InputSection>(InX::MipsGot)
804 : cast<InputSection>(InX::Got);
805 ElfSym::GlobalOffsetTable = addOptionalRegular<ELFT>(
806 "_GLOBAL_OFFSET_TABLE_", GotSection, Target->GotBaseSymOff);
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000807
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000808 // __tls_get_addr is defined by the dynamic linker for dynamic ELFs. For
809 // static linking the linker is required to optimize away any references to
810 // __tls_get_addr, so it's not defined anywhere. Create a hidden definition
Rui Ueyamaa2a46a92017-04-25 04:44:54 +0000811 // to avoid the undefined symbol error.
George Rimar69b17c32017-05-16 10:04:42 +0000812 if (!InX::DynSymTab)
Rafael Espindola244ef982017-07-26 18:42:48 +0000813 Symtab->addIgnored<ELFT>("__tls_get_addr");
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000814
Petr Hosek6b936bf2017-05-10 16:20:33 +0000815 // __ehdr_start is the location of ELF file headers. Note that we define
816 // this symbol unconditionally even when using a linker script, which
817 // differs from the behavior implemented by GNU linker which only define
818 // this symbol if ELF headers are in the memory mapped segment.
Rafael Espindola0e454a92017-06-06 16:18:48 +0000819 // __executable_start is not documented, but the expectation of at
820 // least the android libc is that it points to the elf header too.
821 // __dso_handle symbol is passed to cxa_finalize as a marker to identify
822 // each DSO. The address of the symbol doesn't matter as long as they are
823 // different in different DSOs, so we chose the start address of the DSO.
824 for (const char *Name :
825 {"__ehdr_start", "__executable_start", "__dso_handle"})
826 addOptionalRegular<ELFT>(Name, Out::ElfHeader, 0, STV_HIDDEN);
Petr Hosek6b936bf2017-05-10 16:20:33 +0000827
George Rimar28ac19c2016-08-08 08:42:48 +0000828 // If linker script do layout we do not need to create any standart symbols.
Rui Ueyamaa34da932017-03-21 23:03:09 +0000829 if (Script->Opt.HasSections)
George Rimar28ac19c2016-08-08 08:42:48 +0000830 return;
831
Davide Italiano763febc2017-09-18 18:31:49 +0000832 auto Add = [](StringRef S, int64_t Pos) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000833 return addOptionalRegular<ELFT>(S, Out::ElfHeader, Pos, STV_DEFAULT);
George Rimar9e859392016-02-26 14:36:36 +0000834 };
835
Rafael Espindola4d560162017-09-12 16:38:01 +0000836 ElfSym::Bss = Add("__bss_start", 0);
Davide Italiano763febc2017-09-18 18:31:49 +0000837 ElfSym::End1 = Add("end", -1);
838 ElfSym::End2 = Add("_end", -1);
839 ElfSym::Etext1 = Add("etext", -1);
840 ElfSym::Etext2 = Add("_etext", -1);
841 ElfSym::Edata1 = Add("edata", -1);
842 ElfSym::Edata2 = Add("_edata", -1);
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000843}
844
Rui Ueyamac4185702016-02-10 23:20:42 +0000845// Sort input sections by section name suffixes for
846// __attribute__((init_priority(N))).
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000847static void sortInitFini(OutputSection *Cmd) {
Rafael Espindola21263342017-07-05 23:36:24 +0000848 if (Cmd)
849 Cmd->sortInitFini();
Rui Ueyama5af83682016-02-11 23:41:38 +0000850}
851
852// Sort input sections by the special rule for .ctors and .dtors.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000853static void sortCtorsDtors(OutputSection *Cmd) {
Rafael Espindola21263342017-07-05 23:36:24 +0000854 if (Cmd)
855 Cmd->sortCtorsDtors();
Rui Ueyamac4185702016-02-10 23:20:42 +0000856}
857
George Rimar1a33c0f2016-11-10 09:05:20 +0000858// Sort input sections using the list provided by --symbol-ordering-file.
George Rimar696a7f92017-09-19 09:20:54 +0000859static void sortBySymbolsOrder() {
George Rimar1a33c0f2016-11-10 09:05:20 +0000860 if (Config->SymbolOrderingFile.empty())
861 return;
862
Rui Ueyama31270312016-12-20 01:51:08 +0000863 // Sort sections by priority.
George Rimar696a7f92017-09-19 09:20:54 +0000864 DenseMap<SectionBase *, int> SectionOrder = buildSectionOrder();
Rafael Espindola21263342017-07-05 23:36:24 +0000865 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000866 if (auto *Sec = dyn_cast<OutputSection>(Base))
867 Sec->sort([&](InputSectionBase *S) { return SectionOrder.lookup(S); });
George Rimar1a33c0f2016-11-10 09:05:20 +0000868}
869
Eugene Leviante63d81b2016-07-20 14:43:20 +0000870template <class ELFT>
Rafael Espindolab4c9b812017-02-23 02:28:28 +0000871void Writer<ELFT>::forEachRelSec(std::function<void(InputSectionBase &)> Fn) {
George Rimarcb888a62017-09-13 07:54:47 +0000872 // Scan all relocations. Each relocation goes through a series
873 // of tests to determine if it needs special treatment, such as
874 // creating GOT, PLT, copy relocations, etc.
875 // Note that relocations for non-alloc sections are directly
876 // processed by InputSection::relocateNonAlloc.
877 for (InputSectionBase *IS : InputSections)
878 if (IS->Live && isa<InputSection>(IS) && (IS->Flags & SHF_ALLOC))
Rafael Espindola9f0c4bb2016-11-10 14:53:24 +0000879 Fn(*IS);
George Rimarcb888a62017-09-13 07:54:47 +0000880 for (EhInputSection *ES : In<ELFT>::EhFrame->Sections)
881 Fn(*ES);
Rafael Espindola0f7ceda2016-07-20 17:58:07 +0000882}
883
Eugene Leviant282251a2016-11-01 09:49:24 +0000884template <class ELFT> void Writer<ELFT>::createSections() {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000885 std::vector<BaseCommand *> Old = Script->Opt.Commands;
886 Script->Opt.Commands.clear();
Rui Ueyama536a2672017-02-27 02:32:08 +0000887 for (InputSectionBase *IS : InputSections)
Rafael Espindola82902742017-02-16 17:32:26 +0000888 if (IS)
George Rimare21c3af2017-03-14 09:30:25 +0000889 Factory.addInputSec(IS, getOutputSectionName(IS->Name));
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000890 Script->Opt.Commands.insert(Script->Opt.Commands.end(), Old.begin(),
891 Old.end());
Eugene Leviantceabe802016-08-11 07:56:43 +0000892
Rafael Espindola21263342017-07-05 23:36:24 +0000893 Script->fabricateDefaultCommands();
George Rimar696a7f92017-09-19 09:20:54 +0000894 sortBySymbolsOrder();
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000895 sortInitFini(findSection(".init_array"));
896 sortInitFini(findSection(".fini_array"));
897 sortCtorsDtors(findSection(".ctors"));
898 sortCtorsDtors(findSection(".dtors"));
Eugene Leviante63d81b2016-07-20 14:43:20 +0000899}
900
Petr Hosek18821b62017-09-01 02:23:31 +0000901// This function generates assignments for predefined symbols (e.g. _end or
902// _etext) and inserts them into the commands sequence to be processed at the
903// appropriate time. This ensures that the value is going to be correct by the
904// time any references to these symbols are processed and is equivalent to
905// defining these symbols explicitly in the linker script.
Rafael Espindola4d560162017-09-12 16:38:01 +0000906template <class ELFT> void Writer<ELFT>::setReservedSymbolSections() {
Petr Hosek18821b62017-09-01 02:23:31 +0000907 PhdrEntry *Last = nullptr;
908 PhdrEntry *LastRO = nullptr;
909 PhdrEntry *LastRW = nullptr;
Rui Ueyama888da8c2017-09-05 20:17:37 +0000910
Petr Hosek18821b62017-09-01 02:23:31 +0000911 for (PhdrEntry *P : Phdrs) {
912 if (P->p_type != PT_LOAD)
913 continue;
914 Last = P;
915 if (P->p_flags & PF_W)
916 LastRW = P;
917 else
918 LastRO = P;
919 }
920
Rui Ueyama888da8c2017-09-05 20:17:37 +0000921 // _end is the first location after the uninitialized data region.
Petr Hosek18821b62017-09-01 02:23:31 +0000922 if (Last) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000923 if (ElfSym::End1)
924 ElfSym::End1->Section = Last->LastSec;
925 if (ElfSym::End2)
926 ElfSym::End2->Section = Last->LastSec;
Petr Hosek18821b62017-09-01 02:23:31 +0000927 }
Rui Ueyama888da8c2017-09-05 20:17:37 +0000928
929 // _etext is the first location after the last read-only loadable segment.
Petr Hosek18821b62017-09-01 02:23:31 +0000930 if (LastRO) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000931 if (ElfSym::Etext1)
932 ElfSym::Etext1->Section = LastRO->LastSec;
933 if (ElfSym::Etext2)
934 ElfSym::Etext2->Section = LastRO->LastSec;
Petr Hosek18821b62017-09-01 02:23:31 +0000935 }
Rui Ueyama888da8c2017-09-05 20:17:37 +0000936
937 // _edata points to the end of the last non SHT_NOBITS section.
Petr Hosek18821b62017-09-01 02:23:31 +0000938 if (LastRW) {
Rui Ueyama888da8c2017-09-05 20:17:37 +0000939 size_t I = 0;
Rafael Espindola4d560162017-09-12 16:38:01 +0000940 for (; I < OutputSections.size(); ++I)
941 if (OutputSections[I] == LastRW->FirstSec)
Rui Ueyama888da8c2017-09-05 20:17:37 +0000942 break;
943
Rafael Espindola4d560162017-09-12 16:38:01 +0000944 for (; I < OutputSections.size(); ++I) {
945 if (OutputSections[I]->Type != SHT_NOBITS)
Rui Ueyama888da8c2017-09-05 20:17:37 +0000946 continue;
Rui Ueyama888da8c2017-09-05 20:17:37 +0000947 break;
Petr Hosek18821b62017-09-01 02:23:31 +0000948 }
Rafael Espindola4d560162017-09-12 16:38:01 +0000949 if (ElfSym::Edata1)
950 ElfSym::Edata1->Section = OutputSections[I - 1];
951 if (ElfSym::Edata2)
952 ElfSym::Edata2->Section = OutputSections[I - 1];
953 }
954
955 if (ElfSym::Bss)
956 ElfSym::Bss->Section = findSection(".bss");
957
958 // Setup MIPS _gp_disp/__gnu_local_gp symbols which should
959 // be equal to the _gp symbol's value.
Rafael Espindola9be24cf2017-09-20 18:30:57 +0000960 if (ElfSym::MipsGp) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000961 // Find GP-relative section with the lowest address
962 // and use this address to calculate default _gp value.
963 for (OutputSection *OS : OutputSections) {
964 if (OS->Flags & SHF_MIPS_GPREL) {
965 ElfSym::MipsGp->Section = OS;
966 ElfSym::MipsGp->Value = 0x7ff0;
967 break;
968 }
969 }
Petr Hosek18821b62017-09-01 02:23:31 +0000970 }
971}
972
Rafael Espindola52101412017-05-12 14:52:22 +0000973// We want to find how similar two ranks are.
974// The more branches in getSectionRank that match, the more similar they are.
975// Since each branch corresponds to a bit flag, we can just use
976// countLeadingZeros.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000977static int getRankProximityAux(OutputSection *A, OutputSection *B) {
Rafael Espindola52101412017-05-12 14:52:22 +0000978 return countLeadingZeros(A->SortRank ^ B->SortRank);
Eugene Leviantbae1c652016-11-08 10:44:48 +0000979}
980
Rafael Espindola383971d2017-06-15 21:51:01 +0000981static int getRankProximity(OutputSection *A, BaseCommand *B) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000982 if (auto *Sec = dyn_cast<OutputSection>(B))
983 if (Sec->Live)
984 return getRankProximityAux(A, Sec);
Rafael Espindola383971d2017-06-15 21:51:01 +0000985 return -1;
986}
987
988// When placing orphan sections, we want to place them after symbol assignments
989// so that an orphan after
990// begin_foo = .;
991// foo : { *(foo) }
992// end_foo = .;
993// doesn't break the intended meaning of the begin/end symbols.
994// We don't want to go over sections since findOrphanPos is the
995// one in charge of deciding the order of the sections.
996// We don't want to go over changes to '.', since doing so in
997// rx_sec : { *(rx_sec) }
998// . = ALIGN(0x1000);
999// /* The RW PT_LOAD starts here*/
1000// rw_sec : { *(rw_sec) }
1001// would mean that the RW PT_LOAD would become unaligned.
1002static bool shouldSkip(BaseCommand *Cmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001003 if (isa<OutputSection>(Cmd))
Rafael Espindola383971d2017-06-15 21:51:01 +00001004 return false;
1005 if (auto *Assign = dyn_cast<SymbolAssignment>(Cmd))
1006 return Assign->Name != ".";
1007 return true;
1008}
1009
Rafael Espindola52101412017-05-12 14:52:22 +00001010// We want to place orphan sections so that they share as much
1011// characteristics with their neighbors as possible. For example, if
1012// both are rw, or both are tls.
Rafael Espindola0ca37122017-05-09 13:58:46 +00001013template <typename ELFT>
Rafael Espindola383971d2017-06-15 21:51:01 +00001014static std::vector<BaseCommand *>::iterator
1015findOrphanPos(std::vector<BaseCommand *>::iterator B,
1016 std::vector<BaseCommand *>::iterator E) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001017 OutputSection *Sec = cast<OutputSection>(*E);
Rafael Espindola0ca37122017-05-09 13:58:46 +00001018
Rafael Espindola52101412017-05-12 14:52:22 +00001019 // Find the first element that has as close a rank as possible.
Rafael Espindola383971d2017-06-15 21:51:01 +00001020 auto I = std::max_element(B, E, [=](BaseCommand *A, BaseCommand *B) {
Rafael Espindola52101412017-05-12 14:52:22 +00001021 return getRankProximity(Sec, A) < getRankProximity(Sec, B);
1022 });
1023 if (I == E)
Rafael Espindola0ca37122017-05-09 13:58:46 +00001024 return E;
1025
Rafael Espindola52101412017-05-12 14:52:22 +00001026 // Consider all existing sections with the same proximity.
Rafael Espindola383971d2017-06-15 21:51:01 +00001027 int Proximity = getRankProximity(Sec, *I);
1028 for (; I != E; ++I) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001029 auto *CurSec = dyn_cast<OutputSection>(*I);
1030 if (!CurSec || !CurSec->Live)
Rafael Espindola383971d2017-06-15 21:51:01 +00001031 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001032 if (getRankProximity(Sec, CurSec) != Proximity ||
1033 Sec->SortRank < CurSec->SortRank)
Rafael Espindola383971d2017-06-15 21:51:01 +00001034 break;
1035 }
1036 auto J = std::find_if(
Rafael Espindolac54b1c82017-06-15 22:03:06 +00001037 llvm::make_reverse_iterator(I), llvm::make_reverse_iterator(B),
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001038 [](BaseCommand *Cmd) { return isa<OutputSection>(Cmd); });
Rafael Espindola383971d2017-06-15 21:51:01 +00001039 I = J.base();
Rafael Espindolaaad64e02017-09-19 17:29:58 +00001040
1041 // As a special case, if the orphan section is the last section, put
1042 // it at the very end, past any other commands.
1043 // This matches bfd's behavior and is convenient when the linker script fully
1044 // specifies the start of the file, but doesn't care about the end (the non
1045 // alloc sections for example).
1046 auto NextSec = std::find_if(
1047 I, E, [](BaseCommand *Cmd) { return isa<OutputSection>(Cmd); });
1048 if (NextSec == E)
1049 return E;
1050
Rafael Espindola383971d2017-06-15 21:51:01 +00001051 while (I != E && shouldSkip(*I))
Rafael Espindola52101412017-05-12 14:52:22 +00001052 ++I;
1053 return I;
Rafael Espindola0ca37122017-05-09 13:58:46 +00001054}
1055
Rafael Espindola24c073d2016-09-21 22:36:19 +00001056template <class ELFT> void Writer<ELFT>::sortSections() {
George Rimarba455842017-10-02 09:11:13 +00001057 Script->adjustSectionsBeforeSorting();
George Rimare0b43df2017-06-28 09:59:34 +00001058
Rafael Espindola1960bcd2016-11-11 22:43:27 +00001059 // Don't sort if using -r. It is not necessary and we want to preserve the
1060 // relative order for SHF_LINK_ORDER sections.
1061 if (Config->Relocatable)
Rafael Espindola85de6782017-06-28 22:44:11 +00001062 return;
Rafael Espindola52101412017-05-12 14:52:22 +00001063
Rafael Espindola383971d2017-06-15 21:51:01 +00001064 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001065 if (auto *Sec = dyn_cast<OutputSection>(Base))
1066 Sec->SortRank = getSectionRank(Sec);
Rafael Espindola52101412017-05-12 14:52:22 +00001067
Rui Ueyamaa34da932017-03-21 23:03:09 +00001068 if (!Script->Opt.HasSections) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001069 // We know that all the OutputSections are contiguous in
Rafael Espindola383971d2017-06-15 21:51:01 +00001070 // this case.
1071 auto E = Script->Opt.Commands.end();
1072 auto I = Script->Opt.Commands.begin();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001073 auto IsSection = [](BaseCommand *Base) { return isa<OutputSection>(Base); };
Rafael Espindola383971d2017-06-15 21:51:01 +00001074 I = std::find_if(I, E, IsSection);
Rafael Espindolac54b1c82017-06-15 22:03:06 +00001075 E = std::find_if(llvm::make_reverse_iterator(E),
1076 llvm::make_reverse_iterator(I), IsSection)
Rafael Espindola383971d2017-06-15 21:51:01 +00001077 .base();
1078 std::stable_sort(I, E, compareSections);
Rafael Espindola24c073d2016-09-21 22:36:19 +00001079 return;
1080 }
1081
Rafael Espindola383971d2017-06-15 21:51:01 +00001082 // Orphan sections are sections present in the input files which are
1083 // not explicitly placed into the output file by the linker script.
1084 //
1085 // The sections in the linker script are already in the correct
  // order. We have to figure out where to insert the orphan
1087 // sections.
1088 //
Rafael Espindola24c073d2016-09-21 22:36:19 +00001089 // The order of the sections in the script is arbitrary and may not agree with
Rafael Espindola383971d2017-06-15 21:51:01 +00001090 // compareSections. This means that we cannot easily define a strict weak
1091 // ordering. To see why, consider a comparison of a section in the script and
  // one not in the script. We have two simple options:
Rafael Espindola24c073d2016-09-21 22:36:19 +00001093 // * Make them equivalent (a is not less than b, and b is not less than a).
1094 // The problem is then that equivalence has to be transitive and we can
1095 // have sections a, b and c with only b in a script and a less than c
1096 // which breaks this property.
1097 // * Use compareSectionsNonScript. Given that the script order doesn't have
1098 // to match, we can end up with sections a, b, c, d where b and c are in the
1099 // script and c is compareSectionsNonScript less than b. In which case d
1100 // can be equivalent to c, a to b and d < a. As a concrete example:
1101 // .a (rx) # not in script
1102 // .b (rx) # in script
1103 // .c (ro) # in script
1104 // .d (ro) # not in script
1105 //
1106 // The way we define an order then is:
Rafael Espindola383971d2017-06-15 21:51:01 +00001107 // * Sort only the orphan sections. They are in the end right now.
1108 // * Move each orphan section to its preferred position. We try
  // to put each section in the last position where it can share
1110 // a PT_LOAD.
Rafael Espindola383971d2017-06-15 21:51:01 +00001111 //
1112 // There is some ambiguity as to where exactly a new entry should be
1113 // inserted, because Opt.Commands contains not only output section
1114 // commands but also other types of commands such as symbol assignment
1115 // expressions. There's no correct answer here due to the lack of the
1116 // formal specification of the linker script. We use heuristics to
1117 // determine whether a new output command should be added before or
  // after other commands. For the details, look at shouldSkip
1119 // function.
Rafael Espindola24c073d2016-09-21 22:36:19 +00001120
Rafael Espindola383971d2017-06-15 21:51:01 +00001121 auto I = Script->Opt.Commands.begin();
1122 auto E = Script->Opt.Commands.end();
1123 auto NonScriptI = std::find_if(I, E, [](BaseCommand *Base) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001124 if (auto *Sec = dyn_cast<OutputSection>(Base))
1125 return Sec->Live && Sec->SectionIndex == INT_MAX;
Rafael Espindola383971d2017-06-15 21:51:01 +00001126 return false;
1127 });
Rafael Espindola24c073d2016-09-21 22:36:19 +00001128
Rafael Espindola383971d2017-06-15 21:51:01 +00001129 // Sort the orphan sections.
1130 std::stable_sort(NonScriptI, E, compareSections);
1131
1132 // As a horrible special case, skip the first . assignment if it is before any
1133 // section. We do this because it is common to set a load address by starting
1134 // the script with ". = 0xabcd" and the expectation is that every section is
1135 // after that.
1136 auto FirstSectionOrDotAssignment =
1137 std::find_if(I, E, [](BaseCommand *Cmd) { return !shouldSkip(Cmd); });
1138 if (FirstSectionOrDotAssignment != E &&
1139 isa<SymbolAssignment>(**FirstSectionOrDotAssignment))
1140 ++FirstSectionOrDotAssignment;
1141 I = FirstSectionOrDotAssignment;
1142
Rafael Espindola52101412017-05-12 14:52:22 +00001143 while (NonScriptI != E) {
1144 auto Pos = findOrphanPos<ELFT>(I, NonScriptI);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001145 OutputSection *Orphan = cast<OutputSection>(*NonScriptI);
Rafael Espindola52101412017-05-12 14:52:22 +00001146
1147 // As an optimization, find all sections with the same sort rank
1148 // and insert them with one rotate.
Rafael Espindola383971d2017-06-15 21:51:01 +00001149 unsigned Rank = Orphan->SortRank;
1150 auto End = std::find_if(NonScriptI + 1, E, [=](BaseCommand *Cmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001151 return cast<OutputSection>(Cmd)->SortRank != Rank;
Rafael Espindola52101412017-05-12 14:52:22 +00001152 });
1153 std::rotate(Pos, NonScriptI, End);
1154 NonScriptI = End;
1155 }
Rafael Espindolaf7a17442016-11-14 15:39:38 +00001156
George Rimara8dba482017-03-20 10:09:58 +00001157 Script->adjustSectionsAfterSorting();
Rafael Espindola24c073d2016-09-21 22:36:19 +00001158}
1159
Peter Smith1ec42d92017-03-08 14:06:24 +00001160static void applySynthetic(const std::vector<SyntheticSection *> &Sections,
1161 std::function<void(SyntheticSection *)> Fn) {
Rui Ueyama9320cb02017-02-27 02:56:02 +00001162 for (SyntheticSection *SS : Sections)
Rafael Espindolad57c58d2017-06-07 02:31:19 +00001163 if (SS && SS->getParent() && !SS->empty())
Peter Smith1ec42d92017-03-08 14:06:24 +00001164 Fn(SS);
Eugene Leviant6380ce22016-11-15 12:26:55 +00001165}
1166
George Rimar11992c862016-11-25 08:05:41 +00001167// We need to add input synthetic sections early in createSyntheticSections()
Rui Ueyamac38860b2016-12-05 21:39:35 +00001168// to make them visible from linkescript side. But not all sections are always
1169// required to be in output. For example we don't need dynamic section content
James Henderson7ee22752017-04-06 09:40:03 +00001170// sometimes. This function filters out such unused sections from the output.
Rafael Espindolac080ff62017-07-03 16:54:39 +00001171static void removeUnusedSyntheticSections() {
Rafael Espindola9e9754b2017-02-03 13:06:18 +00001172 // All input synthetic sections that can be empty are placed after
1173 // all regular ones. We iterate over them all and exit at first
1174 // non-synthetic.
Rui Ueyama536a2672017-02-27 02:32:08 +00001175 for (InputSectionBase *S : llvm::reverse(InputSections)) {
Rui Ueyama9320cb02017-02-27 02:56:02 +00001176 SyntheticSection *SS = dyn_cast<SyntheticSection>(S);
Rui Ueyamac38860b2016-12-05 21:39:35 +00001177 if (!SS)
George Rimar11992c862016-11-25 08:05:41 +00001178 return;
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001179 OutputSection *OS = SS->getParent();
1180 if (!SS->empty() || !OS)
George Rimar11992c862016-11-25 08:05:41 +00001181 continue;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001182
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001183 std::vector<BaseCommand *>::iterator Empty = OS->Commands.end();
1184 for (auto I = OS->Commands.begin(), E = OS->Commands.end(); I != E; ++I) {
Rafael Espindola43ee3602017-07-03 17:32:09 +00001185 BaseCommand *B = *I;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001186 if (auto *ISD = dyn_cast<InputSectionDescription>(B)) {
George Rimar7ac38252017-09-08 13:26:45 +00001187 llvm::erase_if(ISD->Sections,
1188 [=](InputSection *IS) { return IS == SS; });
Rafael Espindolac080ff62017-07-03 16:54:39 +00001189 if (ISD->Sections.empty())
Rafael Espindola43ee3602017-07-03 17:32:09 +00001190 Empty = I;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001191 }
1192 }
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001193 if (Empty != OS->Commands.end())
1194 OS->Commands.erase(Empty);
Rafael Espindolac080ff62017-07-03 16:54:39 +00001195
James Henderson7ee22752017-04-06 09:40:03 +00001196 // If there are no other sections in the output section, remove it from the
1197 // output.
George Rimar9a2da392017-09-08 13:40:07 +00001198 if (OS->Commands.empty())
George Rimarba455842017-10-02 09:11:13 +00001199 OS->Live = false;
George Rimar11992c862016-11-25 08:05:41 +00001200 }
1201}
1202
Rafael Espindola35c908f2017-08-10 15:05:37 +00001203// Returns true if a symbol can be replaced at load-time by a symbol
1204// with the same name defined in other ELF executable or DSO.
1205static bool computeIsPreemptible(const SymbolBody &B) {
1206 assert(!B.isLocal());
Rafael Espindola35c908f2017-08-10 15:05:37 +00001207 // Only symbols that appear in dynsym can be preempted.
1208 if (!B.symbol()->includeInDynsym())
1209 return false;
1210
1211 // Only default visibility symbols can be preempted.
1212 if (B.symbol()->Visibility != STV_DEFAULT)
1213 return false;
1214
Rafael Espindola30ea5cf2017-09-12 17:18:03 +00001215 // At this point copy relocations have not been created yet, so any
1216 // symbol that is not defined locally is preemptible.
Rafael Espindolaee6a3522017-09-08 18:41:49 +00001217 if (!B.isInCurrentDSO())
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001218 return true;
1219
1220 // If we have a dynamic list it specifies which local symbols are preemptible.
Rafael Espindola8016bdf2017-09-08 18:53:43 +00001221 if (Config->HasDynamicList)
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001222 return false;
1223
Rafael Espindola35c908f2017-08-10 15:05:37 +00001224 if (!Config->Shared)
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001225 return false;
Rafael Espindola35c908f2017-08-10 15:05:37 +00001226
1227 // -Bsymbolic means that definitions are not preempted.
1228 if (Config->Bsymbolic || (Config->BsymbolicFunctions && B.isFunc()))
Rafael Espindola716c57b2017-09-08 18:23:25 +00001229 return false;
Rafael Espindola35c908f2017-08-10 15:05:37 +00001230 return true;
1231}
1232
Eugene Leviante63d81b2016-07-20 14:43:20 +00001233// Create output section objects and add them to OutputSections.
1234template <class ELFT> void Writer<ELFT>::finalizeSections() {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001235 Out::DebugInfo = findSection(".debug_info");
1236 Out::PreinitArray = findSection(".preinit_array");
1237 Out::InitArray = findSection(".init_array");
1238 Out::FiniArray = findSection(".fini_array");
Rafael Espindola77572242015-10-02 19:37:55 +00001239
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001240 // The linker needs to define SECNAME_start, SECNAME_end and SECNAME_stop
1241 // symbols for sections, so that the runtime can get the start and end
1242 // addresses of each section by section name. Add such symbols.
George Rimarc1034a82016-03-01 19:12:35 +00001243 if (!Config->Relocatable) {
1244 addStartEndSymbols();
Rafael Espindolab6915452017-07-04 19:05:03 +00001245 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001246 if (auto *Sec = dyn_cast<OutputSection>(Base))
1247 addStartStopSymbols(Sec);
George Rimarc1034a82016-03-01 19:12:35 +00001248 }
Rui Ueyamad4530c62016-03-04 18:34:14 +00001249
1250 // Add _DYNAMIC symbol. Unlike GNU gold, our _DYNAMIC symbol has no type.
1251 // It should be okay as no one seems to care about the type.
1252 // Even the author of gold doesn't remember why gold behaves that way.
1253 // https://sourceware.org/ml/binutils/2002-03/msg00360.html
George Rimar69b17c32017-05-16 10:04:42 +00001254 if (InX::DynSymTab)
Rafael Espindola5ab19892017-05-11 23:16:43 +00001255 addRegular<ELFT>("_DYNAMIC", InX::Dynamic, 0);
Rafael Espindola334c3e12015-10-19 15:21:42 +00001256
Rafael Espindolade9857e2016-02-04 21:33:05 +00001257 // Define __rel[a]_iplt_{start,end} symbols if needed.
1258 addRelIpltSymbols();
1259
Rafael Espindola66b4e212017-02-23 22:06:28 +00001260 // This responsible for splitting up .eh_frame section into
Peter Smith1ec42d92017-03-08 14:06:24 +00001261 // pieces. The relocation scan uses those pieces, so this has to be
Rafael Espindola66b4e212017-02-23 22:06:28 +00001262 // earlier.
George Rimar49a47f22017-03-16 10:29:44 +00001263 applySynthetic({In<ELFT>::EhFrame},
1264 [](SyntheticSection *SS) { SS->finalizeContents(); });
Rafael Espindola56004c52016-04-07 14:22:09 +00001265
Rafael Espindola0ff545c2017-09-08 01:09:52 +00001266 for (Symbol *S : Symtab->getSymbols())
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001267 S->body()->IsPreemptible |= computeIsPreemptible(*S->body());
Rafael Espindola35c908f2017-08-10 15:05:37 +00001268
Rafael Espindola0f7ceda2016-07-20 17:58:07 +00001269 // Scan relocations. This must be done after every symbol is declared so that
1270 // we can correctly decide if a dynamic relocation is needed.
George Rimarcb888a62017-09-13 07:54:47 +00001271 if (!Config->Relocatable)
1272 forEachRelSec(scanRelocations<ELFT>);
Rafael Espindola0f7ceda2016-07-20 17:58:07 +00001273
Rafael Espindola895aea62017-05-11 22:02:41 +00001274 if (InX::Plt && !InX::Plt->empty())
1275 InX::Plt->addSymbols();
1276 if (InX::Iplt && !InX::Iplt->empty())
1277 InX::Iplt->addSymbols();
Peter Smith96943762017-01-25 10:31:16 +00001278
Peter Smith55865432017-02-20 11:12:33 +00001279 // Now that we have defined all possible global symbols including linker-
Rui Ueyama1b2a8bf2015-12-26 10:22:16 +00001280 // synthesized ones. Visit all symbols to give the finishing touches.
Rafael Espindola244ef982017-07-26 18:42:48 +00001281 for (Symbol *S : Symtab->getSymbols()) {
Peter Collingbourne4f952702016-05-01 04:55:03 +00001282 SymbolBody *Body = S->body();
Rafael Espindola0baa73f2016-04-26 13:56:26 +00001283
George Rimar7702bc22017-03-16 11:20:02 +00001284 if (!includeInSymtab(*Body))
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001285 continue;
George Rimar69b17c32017-05-16 10:04:42 +00001286 if (InX::SymTab)
1287 InX::SymTab->addSymbol(Body);
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001288
George Rimar69b17c32017-05-16 10:04:42 +00001289 if (InX::DynSymTab && S->includeInDynsym()) {
1290 InX::DynSymTab->addSymbol(Body);
Rui Ueyama4076fa12017-02-26 23:35:34 +00001291 if (auto *SS = dyn_cast<SharedSymbol>(Body))
Rafael Espindola6e93d052017-08-04 22:31:42 +00001292 if (cast<SharedFile<ELFT>>(S->File)->isNeeded())
Eugene Leviante9bab5d2016-11-21 16:59:33 +00001293 In<ELFT>::VerNeed->addSymbol(SS);
Peter Collingbourne21a12fc2016-04-27 20:22:31 +00001294 }
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001295 }
Rui Ueyamac2a0d7e2016-01-28 22:56:29 +00001296
1297 // Do not proceed if there was an undefined symbol.
Rui Ueyamaf373dd72016-11-24 01:43:21 +00001298 if (ErrorCount)
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001299 return;
Rui Ueyamac2a0d7e2016-01-28 22:56:29 +00001300
Rafael Espindola1eb3a0f2017-07-04 18:26:21 +00001301 addPredefinedSections();
Rafael Espindolac080ff62017-07-03 16:54:39 +00001302 removeUnusedSyntheticSections();
1303
Rafael Espindola24c073d2016-09-21 22:36:19 +00001304 sortSections();
George Rimarba455842017-10-02 09:11:13 +00001305 Script->removeEmptyCommands();
Rafael Espindola383971d2017-06-15 21:51:01 +00001306
1307 // Now that we have the final list, create a list of all the
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001308 // OutputSections for convenience.
Rafael Espindolacdf813b2017-06-13 22:36:20 +00001309 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001310 if (auto *Sec = dyn_cast<OutputSection>(Base))
1311 OutputSections.push_back(Sec);
Rui Ueyama84417f82015-12-26 07:50:41 +00001312
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001313 // Prefer command line supplied address over other constraints.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001314 for (OutputSection *Sec : OutputSections) {
1315 auto I = Config->SectionStartMap.find(Sec->Name);
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001316 if (I != Config->SectionStartMap.end())
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001317 Sec->AddrExpr = [=] { return I->second; };
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001318 }
1319
Rafael Espindola78493a22017-01-28 17:48:21 +00001320 // This is a bit of a hack. A value of 0 means undef, so we set it
1321 // to 1 t make __ehdr_start defined. The section number is not
1322 // particularly relevant.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001323 Out::ElfHeader->SectionIndex = 1;
Rafael Espindola78493a22017-01-28 17:48:21 +00001324
George Rimar7ca06272016-04-06 07:20:45 +00001325 unsigned I = 1;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001326 for (OutputSection *Sec : OutputSections) {
George Rimar7ca06272016-04-06 07:20:45 +00001327 Sec->SectionIndex = I++;
Rafael Espindola895aea62017-05-11 22:02:41 +00001328 Sec->ShName = InX::ShStrTab->addString(Sec->Name);
George Rimar7ca06272016-04-06 07:20:45 +00001329 }
Rui Ueyama84417f82015-12-26 07:50:41 +00001330
Rafael Espindola5967c972016-12-19 21:21:07 +00001331 // Binary and relocatable output does not have PHDRS.
1332 // The headers have to be created before finalize as that can influence the
1333 // image base and the dynamic section on mips includes the image base.
1334 if (!Config->Relocatable && !Config->OFormatBinary) {
Rafael Espindolaf51c8052017-06-13 23:26:31 +00001335 Phdrs = Script->hasPhdrsCommands() ? Script->createPhdrs() : createPhdrs();
Rafael Espindola5967c972016-12-19 21:21:07 +00001336 addPtArmExid(Phdrs);
Rafael Espindola02ed7572017-05-04 19:34:17 +00001337 Out::ProgramHeaders->Size = sizeof(Elf_Phdr) * Phdrs.size();
Rafael Espindola5967c972016-12-19 21:21:07 +00001338 }
1339
Rafael Espindola4d560162017-09-12 16:38:01 +00001340 // Some symbols are defined in term of program headers. Now that we
1341 // have the headers, we can find out which sections they point to.
1342 setReservedSymbolSections();
1343
Eugene Leviantbe809a72016-11-18 06:44:18 +00001344 // Dynamic section must be the last one in this list and dynamic
1345 // symbol table section (DynSymTab) must be the first one.
Rui Ueyama2b6631b2017-08-15 17:01:39 +00001346 applySynthetic({InX::DynSymTab, InX::Bss,
1347 InX::BssRelRo, InX::GnuHashTab,
George Rimaraaf54712017-09-27 09:14:59 +00001348 InX::HashTab, InX::SymTab,
Rui Ueyama2b6631b2017-08-15 17:01:39 +00001349 InX::ShStrTab, InX::StrTab,
1350 In<ELFT>::VerDef, InX::DynStrTab,
1351 InX::Got, InX::MipsGot,
1352 InX::IgotPlt, InX::GotPlt,
1353 In<ELFT>::RelaDyn, In<ELFT>::RelaIplt,
1354 In<ELFT>::RelaPlt, InX::Plt,
1355 InX::Iplt, In<ELFT>::EhFrameHdr,
1356 In<ELFT>::VerSym, In<ELFT>::VerNeed,
1357 InX::Dynamic},
George Rimar49a47f22017-03-16 10:29:44 +00001358 [](SyntheticSection *SS) { SS->finalizeContents(); });
Peter Smith1ec42d92017-03-08 14:06:24 +00001359
Peter Smith3ef89b02017-09-06 14:02:14 +00001360 if (!Script->Opt.HasSections && !Config->Relocatable)
1361 fixSectionAlignments();
1362
Peter Smith1ec42d92017-03-08 14:06:24 +00001363 // Some architectures use small displacements for jump instructions.
1364 // It is linker's responsibility to create thunks containing long
1365 // jump instructions if jump targets are too far. Create thunks.
1366 if (Target->NeedsThunks) {
1367 // FIXME: only ARM Interworking and Mips LA25 Thunks are implemented,
1368 // these
1369 // do not require address information. To support range extension Thunks
1370 // we need to assign addresses so that we can tell if jump instructions
1371 // are out of range. This will need to turn into a loop that converges
1372 // when no more Thunks are added
George Rimarec84ffc2017-05-17 07:10:59 +00001373 ThunkCreator TC;
Peter Smith96f813d2017-07-07 10:03:37 +00001374 Script->assignAddresses();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001375 if (TC.createThunks(OutputSections)) {
Rafael Espindolab3aa2c92017-05-11 21:33:30 +00001376 applySynthetic({InX::MipsGot},
George Rimar49a47f22017-03-16 10:29:44 +00001377 [](SyntheticSection *SS) { SS->updateAllocSize(); });
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001378 if (TC.createThunks(OutputSections))
Peter Smith32980272017-06-16 13:10:08 +00001379 fatal("All non-range thunks should be created in first call");
1380 }
Peter Smith1ec42d92017-03-08 14:06:24 +00001381 }
Peter Smith43e852f2017-06-05 08:51:15 +00001382
Peter Smith1ec42d92017-03-08 14:06:24 +00001383 // Fill other section headers. The dynamic table is finalized
1384 // at the end because some tags like RELSZ depend on result
1385 // of finalizing other sections.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001386 for (OutputSection *Sec : OutputSections)
1387 Sec->finalize<ELFT>();
Peter Smith1ec42d92017-03-08 14:06:24 +00001388
1389 // createThunks may have added local symbols to the static symbol table
George Rimar69b17c32017-05-16 10:04:42 +00001390 applySynthetic({InX::SymTab, InX::ShStrTab, InX::StrTab},
George Rimar49a47f22017-03-16 10:29:44 +00001391 [](SyntheticSection *SS) { SS->postThunkContents(); });
Rui Ueyama84417f82015-12-26 07:50:41 +00001392}
1393
Rui Ueyama84417f82015-12-26 07:50:41 +00001394template <class ELFT> void Writer<ELFT>::addPredefinedSections() {
Rui Ueyamadec4ab02017-02-16 04:19:03 +00001395 // ARM ABI requires .ARM.exidx to be terminated by some piece of data.
1396 // We have the terminater synthetic section class. Add that at the end.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001397 OutputSection *Cmd = findSection(".ARM.exidx");
1398 if (!Cmd || !Cmd->Live || Config->Relocatable)
Peter Smith626c9972017-05-30 11:51:02 +00001399 return;
1400
1401 auto *Sentinel = make<ARMExidxSentinelSection>();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001402 Cmd->addSection(Sentinel);
Rafael Espindolaabad6182015-08-13 15:23:46 +00001403}
1404
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001405// The linker is expected to define SECNAME_start and SECNAME_end
1406// symbols for a few sections. This function defines them.
1407template <class ELFT> void Writer<ELFT>::addStartEndSymbols() {
Rafael Espindola24e6f362017-02-24 15:07:30 +00001408 auto Define = [&](StringRef Start, StringRef End, OutputSection *OS) {
Peter Collingbourne0fab40b2016-10-24 20:46:21 +00001409 // These symbols resolve to the image base if the section does not exist.
Rui Ueyama4f2f50d2016-12-21 08:40:09 +00001410 // A special value -1 indicates end of the section.
Peter Collingbournef8435a92017-03-13 16:40:20 +00001411 if (OS) {
1412 addOptionalRegular<ELFT>(Start, OS, 0);
1413 addOptionalRegular<ELFT>(End, OS, -1);
1414 } else {
Rui Ueyamad57e74b72017-03-17 23:29:01 +00001415 if (Config->Pic)
Peter Collingbournef8435a92017-03-13 16:40:20 +00001416 OS = Out::ElfHeader;
1417 addOptionalRegular<ELFT>(Start, OS, 0);
1418 addOptionalRegular<ELFT>(End, OS, 0);
1419 }
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001420 };
1421
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001422 Define("__preinit_array_start", "__preinit_array_end", Out::PreinitArray);
1423 Define("__init_array_start", "__init_array_end", Out::InitArray);
1424 Define("__fini_array_start", "__fini_array_end", Out::FiniArray);
Peter Smith17cd3752016-10-27 10:28:53 +00001425
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001426 if (OutputSection *Sec = findSection(".ARM.exidx"))
Peter Smith17cd3752016-10-27 10:28:53 +00001427 Define("__exidx_start", "__exidx_end", Sec);
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001428}
1429
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001430// If a section name is valid as a C identifier (which is rare because of
1431// the leading '.'), linkers are expected to define __start_<secname> and
1432// __stop_<secname> symbols. They are at beginning and end of the section,
1433// respectively. This is not requested by the ELF standard, but GNU ld and
1434// gold provide the feature, and used by many programs.
1435template <class ELFT>
Rafael Espindola24e6f362017-02-24 15:07:30 +00001436void Writer<ELFT>::addStartStopSymbols(OutputSection *Sec) {
Rafael Espindola40849412017-02-24 14:28:00 +00001437 StringRef S = Sec->Name;
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001438 if (!isValidCIdentifier(S))
1439 return;
Rafael Espindola5616adf2017-03-08 22:36:28 +00001440 addOptionalRegular<ELFT>(Saver.save("__start_" + S), Sec, 0, STV_DEFAULT);
1441 addOptionalRegular<ELFT>(Saver.save("__stop_" + S), Sec, -1, STV_DEFAULT);
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001442}
1443
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001444template <class ELFT> OutputSection *Writer<ELFT>::findSection(StringRef Name) {
Rafael Espindola1eb3a0f2017-07-04 18:26:21 +00001445 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001446 if (auto *Sec = dyn_cast<OutputSection>(Base))
1447 if (Sec->Name == Name)
1448 return Sec;
Rafael Espindola43e76cd2017-05-26 17:48:27 +00001449 return nullptr;
1450}
1451
George Rimar7702bc22017-03-16 11:20:02 +00001452static bool needsPtLoad(OutputSection *Sec) {
Rafael Espindola04a2e342016-11-09 01:42:41 +00001453 if (!(Sec->Flags & SHF_ALLOC))
Rafael Espindolaef762f22016-02-10 23:29:38 +00001454 return false;
1455
1456 // Don't allocate VA space for TLS NOBITS sections. The PT_TLS PHDR is
1457 // responsible for allocating space for them, not the PT_LOAD that
1458 // contains the TLS initialization image.
Rafael Espindola04a2e342016-11-09 01:42:41 +00001459 if (Sec->Flags & SHF_TLS && Sec->Type == SHT_NOBITS)
Rafael Espindolaef762f22016-02-10 23:29:38 +00001460 return false;
1461 return true;
Michael J. Spencer1d299a82015-09-09 20:48:09 +00001462}
1463
Rafael Espindolab45fd702016-09-20 15:22:27 +00001464// Linker scripts are responsible for aligning addresses. Unfortunately, most
1465// linker scripts are designed for creating two PT_LOADs only, one RX and one
1466// RW. This means that there is no alignment in the RO to RX transition and we
1467// cannot create a PT_LOAD there.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001468static uint64_t computeFlags(uint64_t Flags) {
Rui Ueyamaa37ace8d2017-02-25 01:52:03 +00001469 if (Config->Omagic)
George Rimar595a7632016-11-29 09:43:51 +00001470 return PF_R | PF_W | PF_X;
Rui Ueyama6bd38222017-04-05 21:37:09 +00001471 if (Config->SingleRoRx && !(Flags & PF_W))
1472 return Flags | PF_X;
1473 return Flags;
Rafael Espindolab45fd702016-09-20 15:22:27 +00001474}
1475
Rafael Espindola4fc60442016-02-10 22:43:13 +00001476// Decide which program headers to create and which sections to include in each
1477// one.
George Rimaraa354182017-07-27 07:46:50 +00001478template <class ELFT> std::vector<PhdrEntry *> Writer<ELFT>::createPhdrs() {
1479 std::vector<PhdrEntry *> Ret;
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001480 auto AddHdr = [&](unsigned Type, unsigned Flags) -> PhdrEntry * {
George Rimaraa354182017-07-27 07:46:50 +00001481 Ret.push_back(make<PhdrEntry>(Type, Flags));
1482 return Ret.back();
Rafael Espindola4fc60442016-02-10 22:43:13 +00001483 };
George Rimare3336c02015-11-24 10:15:50 +00001484
Rui Ueyama803195e2015-10-23 21:45:59 +00001485 // The first phdr entry is PT_PHDR which describes the program header itself.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001486 AddHdr(PT_PHDR, PF_R)->add(Out::ProgramHeaders);
Rui Ueyama953c2c42015-10-10 23:59:57 +00001487
Rui Ueyama803195e2015-10-23 21:45:59 +00001488 // PT_INTERP must be the second entry if exists.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001489 if (OutputSection *Cmd = findSection(".interp"))
1490 AddHdr(PT_INTERP, Cmd->getPhdrFlags())->add(Cmd);
Rafael Espindola70107762015-09-11 18:49:42 +00001491
Rui Ueyama803195e2015-10-23 21:45:59 +00001492 // Add the first PT_LOAD segment for regular output sections.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001493 uint64_t Flags = computeFlags(PF_R);
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001494 PhdrEntry *Load = AddHdr(PT_LOAD, Flags);
Rafael Espindola02ed7572017-05-04 19:34:17 +00001495
1496 // Add the headers. We will remove them if they don't fit.
1497 Load->add(Out::ElfHeader);
1498 Load->add(Out::ProgramHeaders);
1499
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001500 for (OutputSection *Sec : OutputSections) {
Rafael Espindola04a2e342016-11-09 01:42:41 +00001501 if (!(Sec->Flags & SHF_ALLOC))
Rafael Espindolaaab6d5c2016-09-16 21:29:07 +00001502 break;
George Rimar7702bc22017-03-16 11:20:02 +00001503 if (!needsPtLoad(Sec))
Rafael Espindolaef762f22016-02-10 23:29:38 +00001504 continue;
1505
George Rimar8ceadb32016-08-17 07:44:19 +00001506 // Segments are contiguous memory regions that has the same attributes
1507 // (e.g. executable or writable). There is one phdr for each segment.
1508 // Therefore, we need to create a new phdr when the next section has
1509 // different flags or is loaded at a discontiguous address using AT linker
1510 // script command.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001511 uint64_t NewFlags = computeFlags(Sec->getPhdrFlags());
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001512 if (Sec->LMAExpr || Flags != NewFlags) {
Rafael Espindolae090fb22016-03-09 21:37:22 +00001513 Load = AddHdr(PT_LOAD, NewFlags);
Rafael Espindola4fc60442016-02-10 22:43:13 +00001514 Flags = NewFlags;
1515 }
Michael J. Spencer78aa1de2015-11-03 00:34:39 +00001516
Rui Ueyama18f084f2016-07-20 19:36:41 +00001517 Load->add(Sec);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001518 }
Rafael Espindola6b83b902015-08-12 00:00:24 +00001519
Rui Ueyamadb00b612017-02-01 22:42:17 +00001520 // Add a TLS segment if any.
George Rimaraa354182017-07-27 07:46:50 +00001521 PhdrEntry *TlsHdr = make<PhdrEntry>(PT_TLS, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001522 for (OutputSection *Sec : OutputSections)
Rui Ueyamadb00b612017-02-01 22:42:17 +00001523 if (Sec->Flags & SHF_TLS)
George Rimaraa354182017-07-27 07:46:50 +00001524 TlsHdr->add(Sec);
George Rimar6823c5f2017-09-07 11:01:10 +00001525 if (TlsHdr->FirstSec)
George Rimaraa354182017-07-27 07:46:50 +00001526 Ret.push_back(TlsHdr);
Michael J. Spencer78aa1de2015-11-03 00:34:39 +00001527
Rui Ueyama803195e2015-10-23 21:45:59 +00001528 // Add an entry for .dynamic.
George Rimar69b17c32017-05-16 10:04:42 +00001529 if (InX::DynSymTab)
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001530 AddHdr(PT_DYNAMIC, InX::Dynamic->getParent()->getPhdrFlags())
1531 ->add(InX::Dynamic->getParent());
Rafael Espindola91009b32015-08-12 01:45:28 +00001532
Rafael Espindola4fc60442016-02-10 22:43:13 +00001533 // PT_GNU_RELRO includes all sections that should be marked as
1534 // read-only by dynamic linker after proccessing relocations.
George Rimaraa354182017-07-27 07:46:50 +00001535 PhdrEntry *RelRo = make<PhdrEntry>(PT_GNU_RELRO, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001536 for (OutputSection *Sec : OutputSections)
Rafael Espindola9e889eb2017-05-11 23:31:06 +00001537 if (needsPtLoad(Sec) && isRelroSection(Sec))
George Rimaraa354182017-07-27 07:46:50 +00001538 RelRo->add(Sec);
George Rimar6823c5f2017-09-07 11:01:10 +00001539 if (RelRo->FirstSec)
George Rimaraa354182017-07-27 07:46:50 +00001540 Ret.push_back(RelRo);
George Rimare3336c02015-11-24 10:15:50 +00001541
Rafael Espindola4fc60442016-02-10 22:43:13 +00001542 // PT_GNU_EH_FRAME is a special section pointing on .eh_frame_hdr.
Eugene Leviant30c1b432017-03-14 08:49:09 +00001543 if (!In<ELFT>::EhFrame->empty() && In<ELFT>::EhFrameHdr &&
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001544 In<ELFT>::EhFrame->getParent() && In<ELFT>::EhFrameHdr->getParent())
1545 AddHdr(PT_GNU_EH_FRAME, In<ELFT>::EhFrameHdr->getParent()->getPhdrFlags())
1546 ->add(In<ELFT>::EhFrameHdr->getParent());
George Rimarf6bc65a2016-01-15 13:34:52 +00001547
Rui Ueyama81cb7102017-03-24 00:15:57 +00001548 // PT_OPENBSD_RANDOMIZE is an OpenBSD-specific feature. That makes
1549 // the dynamic linker fill the segment with random data.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001550 if (OutputSection *Cmd = findSection(".openbsd.randomdata"))
1551 AddHdr(PT_OPENBSD_RANDOMIZE, Cmd->getPhdrFlags())->add(Cmd);
George Rimar270173f2016-10-14 13:02:22 +00001552
Rui Ueyamae79b09a2015-11-21 22:19:32 +00001553 // PT_GNU_STACK is a special section to tell the loader to make the
Rui Ueyamaa7e87252017-02-23 08:09:51 +00001554 // pages for the stack non-executable. If you really want an executable
1555 // stack, you can pass -z execstack, but that's not recommended for
1556 // security reasons.
1557 unsigned Perm;
1558 if (Config->ZExecstack)
1559 Perm = PF_R | PF_W | PF_X;
1560 else
1561 Perm = PF_R | PF_W;
1562 AddHdr(PT_GNU_STACK, Perm)->p_memsz = Config->ZStackSize;
Rafael Espindola9907eb02016-03-01 13:23:29 +00001563
George Rimarcc6e5672016-10-14 10:34:36 +00001564 // PT_OPENBSD_WXNEEDED is a OpenBSD-specific header to mark the executable
1565 // is expected to perform W^X violations, such as calling mprotect(2) or
1566 // mmap(2) with PROT_WRITE | PROT_EXEC, which is prohibited by default on
1567 // OpenBSD.
1568 if (Config->ZWxneeded)
1569 AddHdr(PT_OPENBSD_WXNEEDED, PF_X);
1570
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001571 // Create one PT_NOTE per a group of contiguous .note sections.
1572 PhdrEntry *Note = nullptr;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001573 for (OutputSection *Sec : OutputSections) {
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001574 if (Sec->Type == SHT_NOTE) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001575 if (!Note || Sec->LMAExpr)
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001576 Note = AddHdr(PT_NOTE, PF_R);
1577 Note->add(Sec);
1578 } else {
1579 Note = nullptr;
1580 }
1581 }
Rui Ueyama703296a2016-07-20 19:36:39 +00001582 return Ret;
Rafael Espindola4fc60442016-02-10 22:43:13 +00001583}
1584
Rafael Espindola8e670002016-11-28 00:40:21 +00001585template <class ELFT>
George Rimaraa354182017-07-27 07:46:50 +00001586void Writer<ELFT>::addPtArmExid(std::vector<PhdrEntry *> &Phdrs) {
Rafael Espindola8e670002016-11-28 00:40:21 +00001587 if (Config->EMachine != EM_ARM)
1588 return;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001589 auto I = llvm::find_if(OutputSections, [](OutputSection *Cmd) {
1590 return Cmd->Type == SHT_ARM_EXIDX;
George Rimara951d5c2017-07-04 13:10:37 +00001591 });
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001592 if (I == OutputSections.end())
Rafael Espindola8e670002016-11-28 00:40:21 +00001593 return;
1594
1595 // PT_ARM_EXIDX is the ARM EHABI equivalent of PT_GNU_EH_FRAME
George Rimaraa354182017-07-27 07:46:50 +00001596 PhdrEntry *ARMExidx = make<PhdrEntry>(PT_ARM_EXIDX, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001597 ARMExidx->add(*I);
Rafael Espindola8e670002016-11-28 00:40:21 +00001598 Phdrs.push_back(ARMExidx);
1599}
1600
Peter Collingbourne628ec9f2017-01-10 01:21:30 +00001601// The first section of each PT_LOAD, the first section in PT_GNU_RELRO and the
1602// first section after PT_GNU_RELRO have to be page aligned so that the dynamic
1603// linker can set the permissions.
Rui Ueyama47091902016-03-30 19:41:51 +00001604template <class ELFT> void Writer<ELFT>::fixSectionAlignments() {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001605 auto PageAlign = [](OutputSection *Cmd) {
Rafael Espindola0f7dc0e2017-06-02 01:37:58 +00001606 if (Cmd && !Cmd->AddrExpr)
1607 Cmd->AddrExpr = [=] {
1608 return alignTo(Script->getDot(), Config->MaxPageSize);
1609 };
1610 };
1611
George Rimaraa354182017-07-27 07:46:50 +00001612 for (const PhdrEntry *P : Phdrs)
George Rimar6823c5f2017-09-07 11:01:10 +00001613 if (P->p_type == PT_LOAD && P->FirstSec)
1614 PageAlign(P->FirstSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001615
George Rimaraa354182017-07-27 07:46:50 +00001616 for (const PhdrEntry *P : Phdrs) {
1617 if (P->p_type != PT_GNU_RELRO)
Rui Ueyama47091902016-03-30 19:41:51 +00001618 continue;
George Rimar6823c5f2017-09-07 11:01:10 +00001619 if (P->FirstSec)
1620 PageAlign(P->FirstSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001621 // Find the first section after PT_GNU_RELRO. If it is in a PT_LOAD we
1622 // have to align it to a page.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001623 auto End = OutputSections.end();
George Rimar6823c5f2017-09-07 11:01:10 +00001624 auto I = std::find(OutputSections.begin(), End, P->LastSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001625 if (I == End || (I + 1) == End)
1626 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001627 OutputSection *Cmd = (*(I + 1));
1628 if (needsPtLoad(Cmd))
1629 PageAlign(Cmd);
Rui Ueyama47091902016-03-30 19:41:51 +00001630 }
1631}
1632
George Rimar5f857322016-04-27 09:16:28 +00001633// Adjusts the file alignment for a given output section and returns
1634// its new file offset. The file offset must be the same with its
1635// virtual address (modulo the page size) so that the loader can load
1636// executables without any address adjustment.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001637static uint64_t getFileAlignment(uint64_t Off, OutputSection *Cmd) {
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001638 // If the section is not in a PT_LOAD, we just have to align it.
George Rimar582ede82017-09-07 10:53:07 +00001639 if (!Cmd->PtLoad)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001640 return alignTo(Off, Cmd->Alignment);
Eugene Leviant3d9abec2016-09-29 09:20:33 +00001641
George Rimar6823c5f2017-09-07 11:01:10 +00001642 OutputSection *First = Cmd->PtLoad->FirstSec;
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001643 // The first section in a PT_LOAD has to have congruent offset and address
1644 // module the page size.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001645 if (Cmd == First)
1646 return alignTo(Off, std::max<uint64_t>(Cmd->Alignment, Config->MaxPageSize),
1647 Cmd->Addr);
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001648
1649 // If two sections share the same PT_LOAD the file offset is calculated
1650 // using this formula: Off2 = Off1 + (VA2 - VA1).
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001651 return First->Offset + Cmd->Addr - First->Addr;
George Rimar5f857322016-04-27 09:16:28 +00001652}
1653
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001654static uint64_t setOffset(OutputSection *Cmd, uint64_t Off) {
1655 if (Cmd->Type == SHT_NOBITS) {
1656 Cmd->Offset = Off;
Rui Ueyama35723f02017-02-14 23:35:42 +00001657 return Off;
George Rimar86ce2672016-08-25 09:05:47 +00001658 }
1659
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001660 Off = getFileAlignment(Off, Cmd);
1661 Cmd->Offset = Off;
1662 return Off + Cmd->Size;
George Rimar86ce2672016-08-25 09:05:47 +00001663}
1664
1665template <class ELFT> void Writer<ELFT>::assignFileOffsetsBinary() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001666 uint64_t Off = 0;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001667 for (OutputSection *Sec : OutputSections)
Rafael Espindola04a2e342016-11-09 01:42:41 +00001668 if (Sec->Flags & SHF_ALLOC)
Rui Ueyama6bd38222017-04-05 21:37:09 +00001669 Off = setOffset(Sec, Off);
1670 FileSize = alignTo(Off, Config->Wordsize);
George Rimar86ce2672016-08-25 09:05:47 +00001671}
1672
Rui Ueyamae044e9c2016-04-01 17:07:17 +00001673// Assign file offsets to output sections.
1674template <class ELFT> void Writer<ELFT>::assignFileOffsets() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001675 uint64_t Off = 0;
1676 Off = setOffset(Out::ElfHeader, Off);
1677 Off = setOffset(Out::ProgramHeaders, Off);
George Rimar7ca06272016-04-06 07:20:45 +00001678
Petr Hosekedd6c352017-08-02 16:35:00 +00001679 PhdrEntry *LastRX = nullptr;
1680 for (PhdrEntry *P : Phdrs)
1681 if (P->p_type == PT_LOAD && (P->p_flags & PF_X))
1682 LastRX = P;
1683
1684 for (OutputSection *Sec : OutputSections) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001685 Off = setOffset(Sec, Off);
Petr Hosekedd6c352017-08-02 16:35:00 +00001686 if (Script->Opt.HasSections)
1687 continue;
1688 // If this is a last section of the last executable segment and that
1689 // segment is the last loadable segment, align the offset of the
1690 // following section to avoid loading non-segments parts of the file.
George Rimar6823c5f2017-09-07 11:01:10 +00001691 if (LastRX && LastRX->LastSec == Sec)
Petr Hosekedd6c352017-08-02 16:35:00 +00001692 Off = alignTo(Off, Target->PageSize);
1693 }
Eugene Leviant467c4d52016-07-01 10:27:36 +00001694
Rui Ueyama6bd38222017-04-05 21:37:09 +00001695 SectionHeaderOff = alignTo(Off, Config->Wordsize);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001696 FileSize = SectionHeaderOff + (OutputSections.size() + 1) * sizeof(Elf_Shdr);
Rui Ueyamae044e9c2016-04-01 17:07:17 +00001697}
1698
1699// Finalize the program headers. We call this function after we assign
1700// file offsets and VAs to all sections.
1701template <class ELFT> void Writer<ELFT>::setPhdrs() {
George Rimaraa354182017-07-27 07:46:50 +00001702 for (PhdrEntry *P : Phdrs) {
George Rimar6823c5f2017-09-07 11:01:10 +00001703 OutputSection *First = P->FirstSec;
1704 OutputSection *Last = P->LastSec;
Rui Ueyamae8a45e42016-04-01 22:42:04 +00001705 if (First) {
George Rimaraa354182017-07-27 07:46:50 +00001706 P->p_filesz = Last->Offset - First->Offset;
Rafael Espindola04a2e342016-11-09 01:42:41 +00001707 if (Last->Type != SHT_NOBITS)
George Rimaraa354182017-07-27 07:46:50 +00001708 P->p_filesz += Last->Size;
1709 P->p_memsz = Last->Addr + Last->Size - First->Addr;
1710 P->p_offset = First->Offset;
1711 P->p_vaddr = First->Addr;
1712 if (!P->HasLMA)
1713 P->p_paddr = First->getLMA();
Rafael Espindola4fc60442016-02-10 22:43:13 +00001714 }
George Rimaraa354182017-07-27 07:46:50 +00001715 if (P->p_type == PT_LOAD)
1716 P->p_align = std::max<uint64_t>(P->p_align, Config->MaxPageSize);
1717 else if (P->p_type == PT_GNU_RELRO) {
1718 P->p_align = 1;
Peter Collingbourne7b5088b2017-01-04 18:56:15 +00001719 // The glibc dynamic loader rounds the size down, so we need to round up
1720 // to protect the last page. This is a no-op on FreeBSD which always
1721 // rounds up.
George Rimaraa354182017-07-27 07:46:50 +00001722 P->p_memsz = alignTo(P->p_memsz, Target->PageSize);
Peter Collingbourne7b5088b2017-01-04 18:56:15 +00001723 }
George Rimar8ceadb32016-08-17 07:44:19 +00001724
Rafael Espindola4fc60442016-02-10 22:43:13 +00001725 // The TLS pointer goes after PT_TLS. At least glibc will align it,
1726 // so round up the size to make sure the offsets are correct.
George Rimaraa354182017-07-27 07:46:50 +00001727 if (P->p_type == PT_TLS) {
1728 Out::TlsPhdr = P;
1729 if (P->p_memsz)
1730 P->p_memsz = alignTo(P->p_memsz, P->p_align);
Rui Ueyama803195e2015-10-23 21:45:59 +00001731 }
1732 }
Michael J. Spencer84487f12015-07-24 21:03:07 +00001733}
1734
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001735// The entry point address is chosen in the following ways.
1736//
1737// 1. the '-e' entry command-line option;
1738// 2. the ENTRY(symbol) command in a linker control script;
1739// 3. the value of the symbol start, if present;
1740// 4. the address of the first byte of the .text section, if present;
1741// 5. the address 0.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001742template <class ELFT> uint64_t Writer<ELFT>::getEntryAddr() {
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001743 // Case 1, 2 or 3. As a special case, if the symbol is actually
1744 // a number, we'll use that number as an address.
Rafael Espindola244ef982017-07-26 18:42:48 +00001745 if (SymbolBody *B = Symtab->find(Config->Entry))
George Rimarf64618a2017-03-17 11:56:54 +00001746 return B->getVA();
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001747 uint64_t Addr;
George Rimarab947682017-05-16 08:19:25 +00001748 if (to_integer(Config->Entry, Addr))
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001749 return Addr;
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001750
1751 // Case 4
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001752 if (OutputSection *Sec = findSection(".text")) {
Rui Ueyama9e5f5ef2016-12-07 04:06:21 +00001753 if (Config->WarnMissingEntry)
Petr Hosek2f50fef2016-12-07 02:26:16 +00001754 warn("cannot find entry symbol " + Config->Entry + "; defaulting to 0x" +
1755 utohexstr(Sec->Addr));
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001756 return Sec->Addr;
1757 }
1758
1759 // Case 5
Rui Ueyama9e5f5ef2016-12-07 04:06:21 +00001760 if (Config->WarnMissingEntry)
Petr Hosek2f50fef2016-12-07 02:26:16 +00001761 warn("cannot find entry symbol " + Config->Entry +
1762 "; not setting start address");
Rui Ueyama8da7aa02016-10-20 00:07:36 +00001763 return 0;
Rui Ueyama3bfaba92015-12-24 08:37:34 +00001764}
1765
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001766static uint16_t getELFType() {
Rui Ueyamad57e74b72017-03-17 23:29:01 +00001767 if (Config->Pic)
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001768 return ET_DYN;
1769 if (Config->Relocatable)
1770 return ET_REL;
1771 return ET_EXEC;
1772}
1773
Michael J. Spencer84487f12015-07-24 21:03:07 +00001774template <class ELFT> void Writer<ELFT>::writeHeader() {
1775 uint8_t *Buf = Buffer->getBufferStart();
Rui Ueyamae08cd672015-10-23 22:44:39 +00001776 memcpy(Buf, "\177ELF", 4);
1777
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001778 // Write the ELF header.
Rafael Espindola18608a02015-09-08 21:57:31 +00001779 auto *EHdr = reinterpret_cast<Elf_Ehdr *>(Buf);
Rui Ueyamaf2dc4362017-04-05 21:08:47 +00001780 EHdr->e_ident[EI_CLASS] = Config->Is64 ? ELFCLASS64 : ELFCLASS32;
1781 EHdr->e_ident[EI_DATA] = Config->IsLE ? ELFDATA2LSB : ELFDATA2MSB;
Michael J. Spencer84487f12015-07-24 21:03:07 +00001782 EHdr->e_ident[EI_VERSION] = EV_CURRENT;
Rafael Espindola7cc713a2016-10-27 14:00:51 +00001783 EHdr->e_ident[EI_OSABI] = Config->OSABI;
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001784 EHdr->e_type = getELFType();
Rafael Espindola7cc713a2016-10-27 14:00:51 +00001785 EHdr->e_machine = Config->EMachine;
Michael J. Spencer84487f12015-07-24 21:03:07 +00001786 EHdr->e_version = EV_CURRENT;
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001787 EHdr->e_entry = getEntryAddr();
Michael J. Spencer8039dae22015-07-29 00:30:10 +00001788 EHdr->e_shoff = SectionHeaderOff;
Rafael Espindola18608a02015-09-08 21:57:31 +00001789 EHdr->e_ehsize = sizeof(Elf_Ehdr);
Rui Ueyama2f1b79f2015-10-10 22:34:30 +00001790 EHdr->e_phnum = Phdrs.size();
Rafael Espindola18608a02015-09-08 21:57:31 +00001791 EHdr->e_shentsize = sizeof(Elf_Shdr);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001792 EHdr->e_shnum = OutputSections.size() + 1;
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001793 EHdr->e_shstrndx = InX::ShStrTab->getParent()->SectionIndex;
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001794
Rui Ueyama1e2e8ea2016-09-13 20:51:32 +00001795 if (Config->EMachine == EM_ARM)
1796 // We don't currently use any features incompatible with EF_ARM_EABI_VER5,
1797 // but we don't have any firm guarantees of conformance. Linux AArch64
1798 // kernels (as of 2016) require an EABI version to be set.
1799 EHdr->e_flags = EF_ARM_EABI_VER5;
1800 else if (Config->EMachine == EM_MIPS)
Simon Atanasyan4f90c2f2016-07-20 20:30:41 +00001801 EHdr->e_flags = getMipsEFlags<ELFT>();
Rui Ueyama22b5d1f2016-03-13 19:29:17 +00001802
George Rimar58941ee2016-02-25 08:23:37 +00001803 if (!Config->Relocatable) {
1804 EHdr->e_phoff = sizeof(Elf_Ehdr);
1805 EHdr->e_phentsize = sizeof(Elf_Phdr);
1806 }
1807
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001808 // Write the program header table.
Rafael Espindola4fc60442016-02-10 22:43:13 +00001809 auto *HBuf = reinterpret_cast<Elf_Phdr *>(Buf + EHdr->e_phoff);
George Rimaraa354182017-07-27 07:46:50 +00001810 for (PhdrEntry *P : Phdrs) {
1811 HBuf->p_type = P->p_type;
1812 HBuf->p_flags = P->p_flags;
1813 HBuf->p_offset = P->p_offset;
1814 HBuf->p_vaddr = P->p_vaddr;
1815 HBuf->p_paddr = P->p_paddr;
1816 HBuf->p_filesz = P->p_filesz;
1817 HBuf->p_memsz = P->p_memsz;
1818 HBuf->p_align = P->p_align;
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001819 ++HBuf;
1820 }
Rafael Espindolae438e072015-09-08 22:55:28 +00001821
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001822 // Write the section header table. Note that the first table entry is null.
Rui Ueyamaad59b652016-02-25 23:58:21 +00001823 auto *SHdrs = reinterpret_cast<Elf_Shdr *>(Buf + EHdr->e_shoff);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001824 for (OutputSection *Sec : OutputSections)
1825 Sec->writeHeaderTo<ELFT>(++SHdrs);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001826}
1827
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001828// Open a result file.
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001829template <class ELFT> void Writer<ELFT>::openFile() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001830 if (!Config->Is64 && FileSize > UINT32_MAX) {
1831 error("output file too large: " + Twine(FileSize) + " bytes");
1832 return;
1833 }
1834
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001835 unlinkAsync(Config->OutputFile);
Rafael Espindolabdc8f2f2015-08-13 00:31:46 +00001836 ErrorOr<std::unique_ptr<FileOutputBuffer>> BufferOrErr =
Rui Ueyamacbe39262016-02-02 22:48:04 +00001837 FileOutputBuffer::create(Config->OutputFile, FileSize,
1838 FileOutputBuffer::F_executable);
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001839
Rui Ueyamaaa2db882016-07-15 01:38:54 +00001840 if (auto EC = BufferOrErr.getError())
Rui Ueyamac8d3a832017-01-12 22:18:04 +00001841 error("failed to open " + Config->OutputFile + ": " + EC.message());
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001842 else
Rui Ueyamaaa2db882016-07-15 01:38:54 +00001843 Buffer = std::move(*BufferOrErr);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001844}
1845
George Rimar86ce2672016-08-25 09:05:47 +00001846template <class ELFT> void Writer<ELFT>::writeSectionsBinary() {
1847 uint8_t *Buf = Buffer->getBufferStart();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001848 for (OutputSection *Sec : OutputSections)
Rafael Espindola04a2e342016-11-09 01:42:41 +00001849 if (Sec->Flags & SHF_ALLOC)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001850 Sec->writeTo<ELFT>(Buf + Sec->Offset);
George Rimar86ce2672016-08-25 09:05:47 +00001851}
1852
Rui Ueyama6238ed22017-08-14 21:18:12 +00001853static void fillTrap(uint8_t *I, uint8_t *End) {
George Rimarf7ef2a12017-08-21 08:31:14 +00001854 for (; I + 4 <= End; I += 4)
Petr Hosekedd6c352017-08-02 16:35:00 +00001855 memcpy(I, &Target->TrapInstr, 4);
1856}
1857
Rui Ueyama6238ed22017-08-14 21:18:12 +00001858// Fill the last page of executable segments with trap instructions
1859// instead of leaving them as zero. Even though it is not required by any
1860// standard, it is in general a good thing to do for security reasons.
1861//
1862// We'll leave other pages in segments as-is because the rest will be
1863// overwritten by output sections.
Petr Hosekedd6c352017-08-02 16:35:00 +00001864template <class ELFT> void Writer<ELFT>::writeTrapInstr() {
1865 if (Script->Opt.HasSections)
1866 return;
1867
Rui Ueyama6238ed22017-08-14 21:18:12 +00001868 // Fill the last page.
Petr Hosekedd6c352017-08-02 16:35:00 +00001869 uint8_t *Buf = Buffer->getBufferStart();
Rui Ueyama6238ed22017-08-14 21:18:12 +00001870 for (PhdrEntry *P : Phdrs)
1871 if (P->p_type == PT_LOAD && (P->p_flags & PF_X))
1872 fillTrap(Buf + alignDown(P->p_offset + P->p_filesz, Target->PageSize),
1873 Buf + alignTo(P->p_offset + P->p_filesz, Target->PageSize));
Petr Hosekedd6c352017-08-02 16:35:00 +00001874
Rui Ueyama6238ed22017-08-14 21:18:12 +00001875 // Round up the file size of the last segment to the page boundary iff it is
1876 // an executable segment to ensure that other other tools don't accidentally
1877 // trim the instruction padding (e.g. when stripping the file).
Petr Hosekedd6c352017-08-02 16:35:00 +00001878 PhdrEntry *LastRX = nullptr;
1879 for (PhdrEntry *P : Phdrs) {
1880 if (P->p_type != PT_LOAD)
1881 continue;
1882 if (P->p_flags & PF_X)
1883 LastRX = P;
1884 else
1885 LastRX = nullptr;
1886 }
Petr Hosekedd6c352017-08-02 16:35:00 +00001887 if (LastRX)
Petr Hosek7ab9f7b2017-09-01 21:48:20 +00001888 LastRX->p_memsz = LastRX->p_filesz =
1889 alignTo(LastRX->p_filesz, Target->PageSize);
Petr Hosekedd6c352017-08-02 16:35:00 +00001890}
1891
Michael J. Spencer84487f12015-07-24 21:03:07 +00001892// Write section contents to a mmap'ed file.
1893template <class ELFT> void Writer<ELFT>::writeSections() {
1894 uint8_t *Buf = Buffer->getBufferStart();
Hal Finkeldaedc122015-10-12 23:16:53 +00001895
Rui Ueyama75118252016-08-09 01:35:37 +00001896 // PPC64 needs to process relocations in the .opd section
1897 // before processing relocations in code-containing sections.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001898 if (auto *OpdCmd = findSection(".opd")) {
1899 Out::Opd = OpdCmd;
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001900 Out::OpdBuf = Buf + Out::Opd->Offset;
Rafael Espindola55b169b2017-05-24 18:08:04 +00001901 OpdCmd->template writeTo<ELFT>(Buf + Out::Opd->Offset);
Rafael Espindola7a513052015-10-13 14:45:51 +00001902 }
Hal Finkeldaedc122015-10-12 23:16:53 +00001903
Rafael Espindola24e6f362017-02-24 15:07:30 +00001904 OutputSection *EhFrameHdr =
Rafael Espindola881cc162017-05-26 17:28:17 +00001905 (In<ELFT>::EhFrameHdr && !In<ELFT>::EhFrameHdr->empty())
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001906 ? In<ELFT>::EhFrameHdr->getParent()
Rafael Espindola881cc162017-05-26 17:28:17 +00001907 : nullptr;
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001908
1909 // In -r or -emit-relocs mode, write the relocation sections first as in
1910 // ELf_Rel targets we might find out that we need to modify the relocated
1911 // section while doing it.
Rui Ueyamacb222032017-10-01 02:25:34 +00001912 parallelForEach(OutputSections, [&](OutputSection *Sec) {
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001913 if (Sec->Type == SHT_REL || Sec->Type == SHT_RELA)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001914 Sec->writeTo<ELFT>(Buf + Sec->Offset);
Rui Ueyamacb222032017-10-01 02:25:34 +00001915 });
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001916
Rui Ueyamacb222032017-10-01 02:25:34 +00001917 parallelForEach(OutputSections, [&](OutputSection *Sec) {
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001918 if (Sec != Out::Opd && Sec != EhFrameHdr && Sec->Type != SHT_REL &&
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001919 Sec->Type != SHT_RELA)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001920 Sec->writeTo<ELFT>(Buf + Sec->Offset);
Rui Ueyamacb222032017-10-01 02:25:34 +00001921 });
Eugene Leviante4f590f2016-08-31 07:43:50 +00001922
1923 // The .eh_frame_hdr depends on .eh_frame section contents, therefore
1924 // it should be written after .eh_frame is written.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001925 if (EhFrameHdr)
1926 EhFrameHdr->writeTo<ELFT>(Buf + EhFrameHdr->Offset);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001927}
Rui Ueyama3ce825e2015-10-09 21:07:25 +00001928
Rui Ueyama634ddf02016-03-11 20:51:53 +00001929template <class ELFT> void Writer<ELFT>::writeBuildId() {
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001930 if (!InX::BuildId || !InX::BuildId->getParent())
Rui Ueyama634ddf02016-03-11 20:51:53 +00001931 return;
1932
Petr Hosekfdfcb792016-09-01 22:43:03 +00001933 // Compute a hash of all sections of the output file.
Rui Ueyama634ddf02016-03-11 20:51:53 +00001934 uint8_t *Start = Buffer->getBufferStart();
Petr Hosekfdfcb792016-09-01 22:43:03 +00001935 uint8_t *End = Start + FileSize;
Rafael Espindola895aea62017-05-11 22:02:41 +00001936 InX::BuildId->writeBuildId({Start, End});
Rui Ueyama634ddf02016-03-11 20:51:53 +00001937}
1938
Rui Ueyama84907c52016-08-09 03:38:23 +00001939template void elf::writeResult<ELF32LE>();
1940template void elf::writeResult<ELF32BE>();
1941template void elf::writeResult<ELF64LE>();
1942template void elf::writeResult<ELF64BE>();