blob: 4442f44b0e2cc7c3b4343f018dcd2a6a67c10a3b [file] [log] [blame]
Michael J. Spencer84487f12015-07-24 21:03:07 +00001//===- Writer.cpp ---------------------------------------------------------===//
2//
3// The LLVM Linker
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Michael J. Spencerf8325412015-09-04 22:48:30 +000010#include "Writer.h"
Rui Ueyamacb8474ed2015-08-05 23:51:50 +000011#include "Config.h"
Rui Ueyama9b55e922017-03-24 00:15:16 +000012#include "Filesystem.h"
Rui Ueyama717677a2016-02-11 21:17:59 +000013#include "LinkerScript.h"
Rafael Espindola1ebfc592017-01-13 21:05:46 +000014#include "MapFile.h"
Rui Ueyama9381eb12016-12-18 14:06:06 +000015#include "Memory.h"
Rafael Espindola5805c4f2015-09-21 21:38:08 +000016#include "OutputSections.h"
Rui Ueyama0fcdc732016-05-24 20:24:43 +000017#include "Relocations.h"
Rui Ueyamafbbde542016-06-29 09:08:02 +000018#include "Strings.h"
Rui Ueyamaafff74e22015-08-05 23:24:46 +000019#include "SymbolTable.h"
Rui Ueyama6dc7fcb2016-11-01 20:28:21 +000020#include "SyntheticSections.h"
Rafael Espindola01205f72015-09-22 18:19:46 +000021#include "Target.h"
George Rimardbf93392017-04-17 08:58:12 +000022#include "Threads.h"
Denis Protivensky8e3b38a2015-11-12 09:52:08 +000023#include "llvm/ADT/StringMap.h"
Hal Finkel3bae2d82015-10-12 20:51:48 +000024#include "llvm/ADT/StringSwitch.h"
Rui Ueyamaafff74e22015-08-05 23:24:46 +000025#include "llvm/Support/FileOutputBuffer.h"
Rui Ueyamae8b2df42016-09-29 01:45:22 +000026#include <climits>
Michael J. Spencer84487f12015-07-24 21:03:07 +000027
28using namespace llvm;
29using namespace llvm::ELF;
30using namespace llvm::object;
Peter Smith0a259f32016-10-10 09:39:26 +000031using namespace llvm::support;
32using namespace llvm::support::endian;
Michael J. Spencer84487f12015-07-24 21:03:07 +000033
34using namespace lld;
Rafael Espindolae0df00b2016-02-28 00:25:54 +000035using namespace lld::elf;
Michael J. Spencer84487f12015-07-24 21:03:07 +000036
Rui Ueyamaafff74e22015-08-05 23:24:46 +000037namespace {
38// The writer writes a SymbolTable result to a file.
39template <class ELFT> class Writer {
40public:
Rui Ueyama9328b2c2016-03-14 23:16:09 +000041 typedef typename ELFT::Shdr Elf_Shdr;
42 typedef typename ELFT::Ehdr Elf_Ehdr;
43 typedef typename ELFT::Phdr Elf_Phdr;
Rui Ueyama0ce388b2017-04-05 21:46:06 +000044
Rui Ueyamaafff74e22015-08-05 23:24:46 +000045 void run();
46
47private:
Rui Ueyamaf83aca42016-11-01 23:17:45 +000048 void createSyntheticSections();
Rui Ueyama5a9640b2015-10-08 23:49:30 +000049 void copyLocalSymbols();
Rafael Espindola08d6a3f2017-02-11 01:40:49 +000050 void addSectionSymbols();
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +000051 void addReservedSymbols();
George Rimar9e694502016-07-29 16:18:47 +000052 void createSections();
Rafael Espindolab4c9b812017-02-23 02:28:28 +000053 void forEachRelSec(std::function<void(InputSectionBase &)> Fn);
Rafael Espindola24c073d2016-09-21 22:36:19 +000054 void sortSections();
Eugene Leviante63d81b2016-07-20 14:43:20 +000055 void finalizeSections();
Rui Ueyama84417f82015-12-26 07:50:41 +000056 void addPredefinedSections();
Rafael Espindola4d560162017-09-12 16:38:01 +000057 void setReservedSymbolSections();
Rui Ueyama2df0fd82015-12-25 07:38:58 +000058
George Rimaraa354182017-07-27 07:46:50 +000059 std::vector<PhdrEntry *> createPhdrs();
Rafael Espindola074ba932016-12-06 13:43:34 +000060 void removeEmptyPTLoad();
George Rimaraa354182017-07-27 07:46:50 +000061 void addPtArmExid(std::vector<PhdrEntry *> &Phdrs);
Rui Ueyamae044e9c2016-04-01 17:07:17 +000062 void assignFileOffsets();
George Rimar86ce2672016-08-25 09:05:47 +000063 void assignFileOffsetsBinary();
Rui Ueyamae044e9c2016-04-01 17:07:17 +000064 void setPhdrs();
Rui Ueyama47091902016-03-30 19:41:51 +000065 void fixSectionAlignments();
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +000066 void openFile();
Petr Hosekedd6c352017-08-02 16:35:00 +000067 void writeTrapInstr();
Rui Ueyamaafff74e22015-08-05 23:24:46 +000068 void writeHeader();
69 void writeSections();
George Rimar86ce2672016-08-25 09:05:47 +000070 void writeSectionsBinary();
Rui Ueyama634ddf02016-03-11 20:51:53 +000071 void writeBuildId();
Rui Ueyamaafff74e22015-08-05 23:24:46 +000072
Rui Ueyama818bb2f2016-07-16 18:55:47 +000073 std::unique_ptr<FileOutputBuffer> Buffer;
Michael J. Spencer2f008242015-09-17 19:58:07 +000074
Rafael Espindola05531242017-07-06 16:40:44 +000075 OutputSectionFactory Factory;
Rafael Espindola4fc60442016-02-10 22:43:13 +000076
Rui Ueyama01687222015-12-26 09:47:57 +000077 void addRelIpltSymbols();
Rui Ueyamaa5d79d12015-12-26 09:48:00 +000078 void addStartEndSymbols();
Rafael Espindola24e6f362017-02-24 15:07:30 +000079 void addStartStopSymbols(OutputSection *Sec);
Rui Ueyama6bd38222017-04-05 21:37:09 +000080 uint64_t getEntryAddr();
Rafael Espindola8c022ca2017-07-27 19:22:43 +000081 OutputSection *findSection(StringRef Name);
Rui Ueyama2f1b79f2015-10-10 22:34:30 +000082
George Rimaraa354182017-07-27 07:46:50 +000083 std::vector<PhdrEntry *> Phdrs;
Michael J. Spencer2f008242015-09-17 19:58:07 +000084
Rui Ueyama6bd38222017-04-05 21:37:09 +000085 uint64_t FileSize;
86 uint64_t SectionHeaderOff;
Peter Smith113a59e2017-06-26 10:22:17 +000087
88 bool HasGotBaseSym = false;
Rui Ueyamaafff74e22015-08-05 23:24:46 +000089};
90} // anonymous namespace
91
Rui Ueyama55518e72016-10-28 20:57:25 +000092StringRef elf::getOutputSectionName(StringRef Name) {
George Rimar60a0ea12017-06-05 12:49:21 +000093 // ".zdebug_" is a prefix for ZLIB-compressed sections.
94 // Because we decompressed input sections, we want to remove 'z'.
95 if (Name.startswith(".zdebug_"))
96 return Saver.save("." + Name.substr(2));
97
Eugene Levianta8d12ef2016-10-05 10:10:45 +000098 if (Config->Relocatable)
99 return Name;
100
Rafael Espindola7d382732016-09-19 19:59:21 +0000101 for (StringRef V :
George Rimar1ab9cf42017-03-17 10:14:53 +0000102 {".text.", ".rodata.", ".data.rel.ro.", ".data.", ".bss.rel.ro.",
103 ".bss.", ".init_array.", ".fini_array.", ".ctors.", ".dtors.", ".tbss.",
Peter Smith691ff762017-06-28 09:12:38 +0000104 ".gcc_except_table.", ".tdata.", ".ARM.exidx.", ".ARM.extab."}) {
Rafael Espindola7d382732016-09-19 19:59:21 +0000105 StringRef Prefix = V.drop_back();
106 if (Name.startswith(V) || Name == Prefix)
107 return Prefix;
108 }
Rui Ueyama05384082016-10-12 22:36:31 +0000109
Rui Ueyamae8a61022016-11-05 23:05:47 +0000110 // CommonSection is identified as "COMMON" in linker scripts.
111 // By default, it should go to .bss section.
112 if (Name == "COMMON")
113 return ".bss";
114
George Rimar5d53d1f2016-07-12 08:50:42 +0000115 return Name;
116}
117
George Rimar696a7f92017-09-19 09:20:54 +0000118static bool needsInterpSection() {
119 return !SharedFiles.empty() && !Config->DynamicLinker.empty() &&
120 !Script->ignoreInterpSection();
Rui Ueyamafd03cfd2016-07-21 11:01:23 +0000121}
122
George Rimard8b27762016-11-14 10:14:18 +0000123template <class ELFT> void elf::writeResult() { Writer<ELFT>().run(); }
Rafael Espindola4fc60442016-02-10 22:43:13 +0000124
Rafael Espindola074ba932016-12-06 13:43:34 +0000125template <class ELFT> void Writer<ELFT>::removeEmptyPTLoad() {
George Rimar60608a82017-08-28 09:28:15 +0000126 llvm::erase_if(Phdrs, [&](const PhdrEntry *P) {
George Rimaraa354182017-07-27 07:46:50 +0000127 if (P->p_type != PT_LOAD)
Rafael Espindola074ba932016-12-06 13:43:34 +0000128 return false;
George Rimar6823c5f2017-09-07 11:01:10 +0000129 if (!P->FirstSec)
Rafael Espindola41217612016-12-08 03:17:05 +0000130 return true;
George Rimar6823c5f2017-09-07 11:01:10 +0000131 uint64_t Size = P->LastSec->Addr + P->LastSec->Size - P->FirstSec->Addr;
Rafael Espindola074ba932016-12-06 13:43:34 +0000132 return Size == 0;
133 });
Rafael Espindola074ba932016-12-06 13:43:34 +0000134}
135
Petr Hosek7b793212017-03-10 20:00:42 +0000136template <class ELFT> static void combineEhFrameSections() {
137 for (InputSectionBase *&S : InputSections) {
138 EhInputSection *ES = dyn_cast<EhInputSection>(S);
Rafael Espindolaa1565552017-03-15 12:31:54 +0000139 if (!ES || !ES->Live)
Petr Hosek7b793212017-03-10 20:00:42 +0000140 continue;
141
142 In<ELFT>::EhFrame->addSection(ES);
143 S = nullptr;
144 }
145
146 std::vector<InputSectionBase *> &V = InputSections;
147 V.erase(std::remove(V.begin(), V.end(), nullptr), V.end());
148}
149
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000150// The main function of the writer.
151template <class ELFT> void Writer<ELFT>::run() {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000152 // Create linker-synthesized sections such as .got or .plt.
153 // Such sections are of type input section.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000154 createSyntheticSections();
George Rimar7beff422016-11-15 08:19:02 +0000155
Petr Hosek7b793212017-03-10 20:00:42 +0000156 if (!Config->Relocatable)
157 combineEhFrameSections<ELFT>();
158
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000159 // We need to create some reserved symbols such as _end. Create them.
George Rimar7beff422016-11-15 08:19:02 +0000160 if (!Config->Relocatable)
161 addReservedSymbols();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000162
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000163 // Create output sections.
Rui Ueyamaa34da932017-03-21 23:03:09 +0000164 if (Script->Opt.HasSections) {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000165 // If linker script contains SECTIONS commands, let it create sections.
George Rimara8dba482017-03-20 10:09:58 +0000166 Script->processCommands(Factory);
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000167
168 // Linker scripts may have left some input sections unassigned.
169 // Assign such sections using the default rule.
George Rimara8dba482017-03-20 10:09:58 +0000170 Script->addOrphanSections(Factory);
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000171 } else {
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000172 // If linker script does not contain SECTIONS commands, create
173 // output sections by default rules. We still need to give the
174 // linker script a chance to run, because it might contain
175 // non-SECTIONS commands such as ASSERT.
George Rimara8dba482017-03-20 10:09:58 +0000176 Script->processCommands(Factory);
Rafael Espindola21263342017-07-05 23:36:24 +0000177 createSections();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000178 }
179
180 if (Config->Discard != DiscardPolicy::All)
181 copyLocalSymbols();
182
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000183 if (Config->CopyRelocs)
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000184 addSectionSymbols();
185
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000186 // Now that we have a complete set of output sections. This function
187 // completes section contents. For example, we need to add strings
188 // to the string table, and add entries to .got and .plt.
189 // finalizeSections does that.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000190 finalizeSections();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000191 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000192 return;
193
Rafael Espindola55b169b2017-05-24 18:08:04 +0000194 // If -compressed-debug-sections is specified, we need to compress
195 // .debug_* sections. Do it right now because it changes the size of
196 // output sections.
George Rimara9b07142017-08-04 08:30:16 +0000197 parallelForEach(OutputSections,
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000198 [](OutputSection *Sec) { Sec->maybeCompress<ELFT>(); });
Rafael Espindola805f5152017-06-01 16:30:12 +0000199
Peter Smith5aedebf2017-07-05 09:12:54 +0000200 Script->assignAddresses();
201 Script->allocateHeaders(Phdrs);
Rafael Espindola189860c2017-06-07 02:24:08 +0000202
203 // Remove empty PT_LOAD to avoid causing the dynamic linker to try to mmap a
204 // 0 sized region. This has to be done late since only after assignAddresses
205 // we know the size of the sections.
206 removeEmptyPTLoad();
207
208 if (!Config->OFormatBinary)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000209 assignFileOffsets();
Rafael Espindola189860c2017-06-07 02:24:08 +0000210 else
211 assignFileOffsetsBinary();
212
213 setPhdrs();
214
215 if (Config->Relocatable) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000216 for (OutputSection *Sec : OutputSections)
217 Sec->Addr = 0;
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000218 }
219
George Rimar2ddab6d2017-01-17 13:50:34 +0000220 // It does not make sense try to open the file if we have error already.
221 if (ErrorCount)
222 return;
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000223 // Write the result down to a file.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000224 openFile();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000225 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000226 return;
Rafael Espindola3f235c72017-06-01 16:32:58 +0000227
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000228 if (!Config->OFormatBinary) {
Petr Hosekedd6c352017-08-02 16:35:00 +0000229 writeTrapInstr();
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000230 writeHeader();
231 writeSections();
232 } else {
233 writeSectionsBinary();
234 }
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000235
236 // Backfill .note.gnu.build-id section content. This is done at last
237 // because the content is usually a hash value of the entire output file.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000238 writeBuildId();
Rui Ueyamaf373dd72016-11-24 01:43:21 +0000239 if (ErrorCount)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000240 return;
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000241
Rui Ueyama40eaa992017-01-18 03:34:38 +0000242 // Handle -Map option.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000243 writeMapFile<ELFT>();
Rui Ueyama40eaa992017-01-18 03:34:38 +0000244 if (ErrorCount)
245 return;
246
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000247 if (auto EC = Buffer->commit())
Rui Ueyamac8d3a832017-01-12 22:18:04 +0000248 error("failed to write to the output file: " + EC.message());
Rui Ueyama0b1b6952016-11-21 02:11:05 +0000249
250 // Flush the output streams and exit immediately. A full shutdown
251 // is a good test that we are keeping track of all allocated memory,
252 // but actually freeing it is a waste of time in a regular linker run.
253 if (Config->ExitEarly)
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000254 exitLld(0);
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000255}
256
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000257// Initialize Out members.
Rui Ueyamaf83aca42016-11-01 23:17:45 +0000258template <class ELFT> void Writer<ELFT>::createSyntheticSections() {
259 // Initialize all pointers with NULL. This is needed because
260 // you can call lld::elf::main more than once as a library.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000261 memset(&Out::First, 0, sizeof(Out));
Rui Ueyamacfadbd92016-11-01 23:12:51 +0000262
Rui Ueyama536a2672017-02-27 02:32:08 +0000263 auto Add = [](InputSectionBase *Sec) { InputSections.push_back(Sec); };
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000264
Rafael Espindola895aea62017-05-11 22:02:41 +0000265 InX::DynStrTab = make<StringTableSection>(".dynstr", true);
Rafael Espindola5ab19892017-05-11 23:16:43 +0000266 InX::Dynamic = make<DynamicSection<ELFT>>();
Eugene Levianta96d9022016-11-16 10:02:27 +0000267 In<ELFT>::RelaDyn = make<RelocationSection<ELFT>>(
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000268 Config->IsRela ? ".rela.dyn" : ".rel.dyn", Config->ZCombreloc);
Rafael Espindola895aea62017-05-11 22:02:41 +0000269 InX::ShStrTab = make<StringTableSection>(".shstrtab", false);
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000270
Rui Ueyama9d1bacb12017-02-27 02:31:26 +0000271 Out::ElfHeader = make<OutputSection>("", 0, SHF_ALLOC);
272 Out::ElfHeader->Size = sizeof(Elf_Ehdr);
273 Out::ProgramHeaders = make<OutputSection>("", 0, SHF_ALLOC);
Rui Ueyama6bd38222017-04-05 21:37:09 +0000274 Out::ProgramHeaders->updateAlignment(Config->Wordsize);
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000275
George Rimar696a7f92017-09-19 09:20:54 +0000276 if (needsInterpSection()) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000277 InX::Interp = createInterpSection();
278 Add(InX::Interp);
Rui Ueyamae8a61022016-11-05 23:05:47 +0000279 } else {
Rafael Espindola895aea62017-05-11 22:02:41 +0000280 InX::Interp = nullptr;
Rui Ueyamae8a61022016-11-05 23:05:47 +0000281 }
Rui Ueyama3a41be22016-04-07 22:49:21 +0000282
George Rimarf21aade2016-08-31 08:38:11 +0000283 if (Config->Strip != StripPolicy::All) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000284 InX::StrTab = make<StringTableSection>(".strtab", false);
George Rimarf45f6812017-05-16 08:53:30 +0000285 InX::SymTab = make<SymbolTableSection<ELFT>>(*InX::StrTab);
Rui Ueyama4197a6a2016-02-05 18:41:40 +0000286 }
Rui Ueyamacfadbd92016-11-01 23:12:51 +0000287
Rui Ueyamac4030a12016-11-22 00:54:15 +0000288 if (Config->BuildId != BuildIdKind::None) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000289 InX::BuildId = make<BuildIdSection>();
290 Add(InX::BuildId);
Rui Ueyamac4030a12016-11-22 00:54:15 +0000291 }
Rui Ueyamae8a61022016-11-05 23:05:47 +0000292
Rui Ueyama90113202017-09-08 19:41:35 +0000293 for (InputSection *S : createCommonSections())
Dmitry Mikulin1e30f072017-09-08 16:22:43 +0000294 Add(S);
Simon Atanasyance02cf02016-11-09 21:36:56 +0000295
Rafael Espindola895aea62017-05-11 22:02:41 +0000296 InX::Bss = make<BssSection>(".bss");
297 Add(InX::Bss);
298 InX::BssRelRo = make<BssSection>(".bss.rel.ro");
299 Add(InX::BssRelRo);
George Rimar1ab9cf42017-03-17 10:14:53 +0000300
Rui Ueyama1d75de02016-11-22 04:28:39 +0000301 // Add MIPS-specific sections.
Simon Atanasyance02cf02016-11-09 21:36:56 +0000302 if (Config->EMachine == EM_MIPS) {
Rafael Espindolae05e2f82017-09-15 18:05:02 +0000303 if (!Config->Shared && Config->HasDynSymTab) {
Rafael Espindola895aea62017-05-11 22:02:41 +0000304 InX::MipsRldMap = make<MipsRldMapSection>();
305 Add(InX::MipsRldMap);
Eugene Leviant17b7a572016-11-22 17:49:14 +0000306 }
Rui Ueyama1d75de02016-11-22 04:28:39 +0000307 if (auto *Sec = MipsAbiFlagsSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000308 Add(Sec);
Rui Ueyama1d75de02016-11-22 04:28:39 +0000309 if (auto *Sec = MipsOptionsSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000310 Add(Sec);
Rui Ueyama1d75de02016-11-22 04:28:39 +0000311 if (auto *Sec = MipsReginfoSection<ELFT>::create())
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000312 Add(Sec);
Simon Atanasyance02cf02016-11-09 21:36:56 +0000313 }
Eugene Leviant41ca3272016-11-10 09:48:29 +0000314
Rafael Espindolae05e2f82017-09-15 18:05:02 +0000315 if (Config->HasDynSymTab) {
George Rimar69b17c32017-05-16 10:04:42 +0000316 InX::DynSymTab = make<SymbolTableSection<ELFT>>(*InX::DynStrTab);
317 Add(InX::DynSymTab);
George Rimar11992c862016-11-25 08:05:41 +0000318
319 In<ELFT>::VerSym = make<VersionTableSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000320 Add(In<ELFT>::VerSym);
George Rimar11992c862016-11-25 08:05:41 +0000321
322 if (!Config->VersionDefinitions.empty()) {
323 In<ELFT>::VerDef = make<VersionDefinitionSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000324 Add(In<ELFT>::VerDef);
George Rimar11992c862016-11-25 08:05:41 +0000325 }
326
327 In<ELFT>::VerNeed = make<VersionNeedSection<ELFT>>();
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000328 Add(In<ELFT>::VerNeed);
George Rimar11992c862016-11-25 08:05:41 +0000329
330 if (Config->GnuHash) {
George Rimar69b17c32017-05-16 10:04:42 +0000331 InX::GnuHashTab = make<GnuHashTableSection>();
332 Add(InX::GnuHashTab);
George Rimar11992c862016-11-25 08:05:41 +0000333 }
334
335 if (Config->SysvHash) {
George Rimaraaf54712017-09-27 09:14:59 +0000336 InX::HashTab = make<HashTableSection>();
337 Add(InX::HashTab);
George Rimar11992c862016-11-25 08:05:41 +0000338 }
339
Rafael Espindola5ab19892017-05-11 23:16:43 +0000340 Add(InX::Dynamic);
Rafael Espindola895aea62017-05-11 22:02:41 +0000341 Add(InX::DynStrTab);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000342 Add(In<ELFT>::RelaDyn);
George Rimar11992c862016-11-25 08:05:41 +0000343 }
344
Rui Ueyama1d75de02016-11-22 04:28:39 +0000345 // Add .got. MIPS' .got is so different from the other archs,
346 // it has its own class.
George Rimar11992c862016-11-25 08:05:41 +0000347 if (Config->EMachine == EM_MIPS) {
Rafael Espindolab3aa2c92017-05-11 21:33:30 +0000348 InX::MipsGot = make<MipsGotSection>();
349 Add(InX::MipsGot);
George Rimar11992c862016-11-25 08:05:41 +0000350 } else {
Rafael Espindolaa6465bb2017-05-18 16:45:36 +0000351 InX::Got = make<GotSection>();
Rafael Espindola88ab9fb2017-05-11 23:26:03 +0000352 Add(InX::Got);
George Rimar11992c862016-11-25 08:05:41 +0000353 }
Simon Atanasyan725dc142016-11-16 21:01:02 +0000354
Rafael Espindola4b1c3692017-05-11 21:23:38 +0000355 InX::GotPlt = make<GotPltSection>();
356 Add(InX::GotPlt);
Rafael Espindola895aea62017-05-11 22:02:41 +0000357 InX::IgotPlt = make<IgotPltSection>();
358 Add(InX::IgotPlt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000359
360 if (Config->GdbIndex) {
Rafael Espindola300b3862017-07-12 23:56:53 +0000361 InX::GdbIndex = createGdbIndex<ELFT>();
Rafael Espindola895aea62017-05-11 22:02:41 +0000362 Add(InX::GdbIndex);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000363 }
364
365 // We always need to add rel[a].plt to output if it has entries.
366 // Even for static linking it can contain R_[*]_IRELATIVE relocations.
367 In<ELFT>::RelaPlt = make<RelocationSection<ELFT>>(
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000368 Config->IsRela ? ".rela.plt" : ".rel.plt", false /*Sort*/);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000369 Add(In<ELFT>::RelaPlt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000370
Peter Smithbaffdb82016-12-08 12:58:55 +0000371 // The RelaIplt immediately follows .rel.plt (.rel.dyn for ARM) to ensure
372 // that the IRelative relocations are processed last by the dynamic loader
373 In<ELFT>::RelaIplt = make<RelocationSection<ELFT>>(
374 (Config->EMachine == EM_ARM) ? ".rel.dyn" : In<ELFT>::RelaPlt->Name,
375 false /*Sort*/);
Rui Ueyama7ddd7a82017-02-05 05:18:58 +0000376 Add(In<ELFT>::RelaIplt);
Peter Smithbaffdb82016-12-08 12:58:55 +0000377
Rafael Espindola895aea62017-05-11 22:02:41 +0000378 InX::Plt = make<PltSection>(Target->PltHeaderSize);
379 Add(InX::Plt);
380 InX::Iplt = make<PltSection>(0);
381 Add(InX::Iplt);
George Rimar3fb5a6d2016-11-29 16:05:27 +0000382
Rafael Espindola66b4e212017-02-23 22:06:28 +0000383 if (!Config->Relocatable) {
George Rimar1c74c2f2017-03-09 08:45:25 +0000384 if (Config->EhFrameHdr) {
385 In<ELFT>::EhFrameHdr = make<EhFrameHeader<ELFT>>();
386 Add(In<ELFT>::EhFrameHdr);
387 }
Rafael Espindola66b4e212017-02-23 22:06:28 +0000388 In<ELFT>::EhFrame = make<EhFrameSection<ELFT>>();
389 Add(In<ELFT>::EhFrame);
390 }
391
George Rimar69b17c32017-05-16 10:04:42 +0000392 if (InX::SymTab)
393 Add(InX::SymTab);
Rafael Espindola895aea62017-05-11 22:02:41 +0000394 Add(InX::ShStrTab);
395 if (InX::StrTab)
396 Add(InX::StrTab);
Michael J. Spencer84487f12015-07-24 21:03:07 +0000397}
398
Rafael Espindola5616adf2017-03-08 22:36:28 +0000399static bool shouldKeepInSymtab(SectionBase *Sec, StringRef SymName,
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000400 const SymbolBody &B) {
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000401 if (B.isFile() || B.isSection())
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000402 return false;
403
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000404 // If sym references a section in a discarded group, don't keep it.
Rafael Espindola774ea7d2017-02-23 16:49:07 +0000405 if (Sec == &InputSection::Discarded)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000406 return false;
407
George Rimar9503f6d2016-08-31 08:46:30 +0000408 if (Config->Discard == DiscardPolicy::None)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000409 return true;
410
411 // In ELF assembly .L symbols are normally discarded by the assembler.
412 // If the assembler fails to do so, the linker discards them if
413 // * --discard-locals is used.
414 // * The symbol is in a SHF_MERGE section, which is normally the reason for
415 // the assembler keeping the .L symbol.
416 if (!SymName.startswith(".L") && !SymName.empty())
417 return true;
418
George Rimar9503f6d2016-08-31 08:46:30 +0000419 if (Config->Discard == DiscardPolicy::Locals)
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000420 return false;
421
Rafael Espindola1854a8e2016-10-26 12:36:56 +0000422 return !Sec || !(Sec->Flags & SHF_MERGE);
Rafael Espindola10d71ff2016-01-27 18:04:26 +0000423}
424
George Rimar7702bc22017-03-16 11:20:02 +0000425static bool includeInSymtab(const SymbolBody &B) {
Rafael Espindola474eb012016-05-05 16:40:28 +0000426 if (!B.isLocal() && !B.symbol()->IsUsedInRegularObj)
427 return false;
428
Rui Ueyama80474a22017-02-28 19:29:55 +0000429 if (auto *D = dyn_cast<DefinedRegular>(&B)) {
Rafael Espindola474eb012016-05-05 16:40:28 +0000430 // Always include absolute symbols.
Rafael Espindola5616adf2017-03-08 22:36:28 +0000431 SectionBase *Sec = D->Section;
432 if (!Sec)
Rafael Espindola474eb012016-05-05 16:40:28 +0000433 return true;
Rafael Espindola5616adf2017-03-08 22:36:28 +0000434 if (auto *IS = dyn_cast<InputSectionBase>(Sec)) {
435 Sec = IS->Repl;
436 IS = cast<InputSectionBase>(Sec);
437 // Exclude symbols pointing to garbage-collected sections.
438 if (!IS->Live)
439 return false;
440 }
441 if (auto *S = dyn_cast<MergeInputSection>(Sec))
Rui Ueyama90fa3722016-05-22 00:41:38 +0000442 if (!S->getSectionPiece(D->Value)->Live)
Rafael Espindola474eb012016-05-05 16:40:28 +0000443 return false;
Rui Ueyama9c77d272017-08-10 15:54:27 +0000444 return true;
Rafael Espindola474eb012016-05-05 16:40:28 +0000445 }
Rui Ueyama9c77d272017-08-10 15:54:27 +0000446
447 if (auto *Sym = dyn_cast<DefinedCommon>(&B))
448 return Sym->Live;
Rafael Espindola474eb012016-05-05 16:40:28 +0000449 return true;
450}
Rafael Espindola462220d2016-05-05 16:38:46 +0000451
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000452// Local symbols are not in the linker's symbol table. This function scans
453// each object file's symbol table to copy local symbols to the output.
454template <class ELFT> void Writer<ELFT>::copyLocalSymbols() {
George Rimar69b17c32017-05-16 10:04:42 +0000455 if (!InX::SymTab)
Rui Ueyama90f76fb2016-01-21 03:07:38 +0000456 return;
George Rimar696a7f92017-09-19 09:20:54 +0000457 for (InputFile *File : ObjectFiles) {
458 ObjFile<ELFT> *F = cast<ObjFile<ELFT>>(File);
Rafael Espindola67d72c02016-03-11 12:06:30 +0000459 for (SymbolBody *B : F->getLocalSymbols()) {
George Rimar78fe56e2016-10-11 09:07:14 +0000460 if (!B->IsLocal)
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000461 fatal(toString(F) +
George Rimar78fe56e2016-10-11 09:07:14 +0000462 ": broken object: getLocalSymbols returns a non-local symbol");
Rui Ueyama80474a22017-02-28 19:29:55 +0000463 auto *DR = dyn_cast<DefinedRegular>(B);
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000464
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000465 // No reason to keep local undefined symbol in symtab.
466 if (!DR)
Rafael Espindola444576d2015-10-09 19:25:07 +0000467 continue;
George Rimar7702bc22017-03-16 11:20:02 +0000468 if (!includeInSymtab(*B))
Rafael Espindola462220d2016-05-05 16:38:46 +0000469 continue;
Rui Ueyama3fc0f7e2016-11-23 18:07:33 +0000470
Rafael Espindola5616adf2017-03-08 22:36:28 +0000471 SectionBase *Sec = DR->Section;
George Rimar7702bc22017-03-16 11:20:02 +0000472 if (!shouldKeepInSymtab(Sec, B->getName(), *B))
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000473 continue;
George Rimar69b17c32017-05-16 10:04:42 +0000474 InX::SymTab->addSymbol(B);
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000475 }
476 }
477}
478
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000479template <class ELFT> void Writer<ELFT>::addSectionSymbols() {
480 // Create one STT_SECTION symbol for each output section we might
481 // have a relocation with.
Rafael Espindolad48b2082017-07-04 19:08:40 +0000482 for (BaseCommand *Base : Script->Opt.Commands) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000483 auto *Sec = dyn_cast<OutputSection>(Base);
484 if (!Sec)
Rui Ueyama73d29ab2017-02-28 19:43:54 +0000485 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000486 auto I = llvm::find_if(Sec->Commands, [](BaseCommand *Base) {
Rafael Espindolad48b2082017-07-04 19:08:40 +0000487 if (auto *ISD = dyn_cast<InputSectionDescription>(Base))
488 return !ISD->Sections.empty();
489 return false;
490 });
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000491 if (I == Sec->Commands.end())
Rafael Espindolad48b2082017-07-04 19:08:40 +0000492 continue;
493 InputSection *IS = cast<InputSectionDescription>(*I)->Sections[0];
Rui Ueyama73d29ab2017-02-28 19:43:54 +0000494 if (isa<SyntheticSection>(IS) || IS->Type == SHT_REL ||
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000495 IS->Type == SHT_RELA)
496 continue;
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000497
Rui Ueyama175e81c2017-02-28 19:36:30 +0000498 auto *Sym =
499 make<DefinedRegular>("", /*IsLocal=*/true, /*StOther=*/0, STT_SECTION,
Rafael Espindola6e93d052017-08-04 22:31:42 +0000500 /*Value=*/0, /*Size=*/0, IS);
George Rimar69b17c32017-05-16 10:04:42 +0000501 InX::SymTab->addSymbol(Sym);
Rafael Espindola08d6a3f2017-02-11 01:40:49 +0000502 }
503}
504
Rui Ueyama26ad0572017-02-16 04:51:46 +0000505// Today's loaders have a feature to make segments read-only after
506// processing dynamic relocations to enhance security. PT_GNU_RELRO
507// is defined for that.
508//
509// This function returns true if a section needs to be put into a
510// PT_GNU_RELRO segment.
Rafael Espindoladc49af92017-07-24 23:55:33 +0000511static bool isRelroSection(const OutputSection *Sec) {
Rafael Espindola4fc60442016-02-10 22:43:13 +0000512 if (!Config->ZRelro)
513 return false;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000514
Rafael Espindolae08e78d2016-11-09 23:23:45 +0000515 uint64_t Flags = Sec->Flags;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000516
517 // Non-allocatable or non-writable sections don't need RELRO because
518 // they are not writable or not even mapped to memory in the first place.
519 // RELRO is for sections that are essentially read-only but need to
520 // be writable only at process startup to allow dynamic linker to
521 // apply relocations.
George Rimare3336c02015-11-24 10:15:50 +0000522 if (!(Flags & SHF_ALLOC) || !(Flags & SHF_WRITE))
523 return false;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000524
525 // Once initialized, TLS data segments are used as data templates
526 // for a thread-local storage. For each new thread, runtime
527 // allocates memory for a TLS and copy templates there. No thread
528 // are supposed to use templates directly. Thus, it can be in RELRO.
Rui Ueyamaccfc3262015-12-10 19:13:08 +0000529 if (Flags & SHF_TLS)
530 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000531
Rui Ueyama9d773f32017-04-13 05:40:07 +0000532 // .init_array, .preinit_array and .fini_array contain pointers to
533 // functions that are executed on process startup or exit. These
534 // pointers are set by the static linker, and they are not expected
535 // to change at runtime. But if you are an attacker, you could do
536 // interesting things by manipulating pointers in .fini_array, for
537 // example. So they are put into RELRO.
Rafael Espindola04a2e342016-11-09 01:42:41 +0000538 uint32_t Type = Sec->Type;
Rui Ueyamaccfc3262015-12-10 19:13:08 +0000539 if (Type == SHT_INIT_ARRAY || Type == SHT_FINI_ARRAY ||
540 Type == SHT_PREINIT_ARRAY)
George Rimare3336c02015-11-24 10:15:50 +0000541 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000542
Rui Ueyama9d773f32017-04-13 05:40:07 +0000543 // .got contains pointers to external symbols. They are resolved by
544 // the dynamic linker when a module is loaded into memory, and after
545 // that they are not expected to change. So, it can be in RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000546 if (InX::Got && Sec == InX::Got->getParent())
Simon Atanasyan725dc142016-11-16 21:01:02 +0000547 return true;
Rui Ueyama9d773f32017-04-13 05:40:07 +0000548
549 // .got.plt contains pointers to external function symbols. They are
550 // by default resolved lazily, so we usually cannot put it into RELRO.
551 // However, if "-z now" is given, the lazy symbol resolution is
552 // disabled, which enables us to put it into RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000553 if (Sec == InX::GotPlt->getParent())
Rui Ueyama9d773f32017-04-13 05:40:07 +0000554 return Config->ZNow;
555
556 // .dynamic section contains data for the dynamic linker, and
557 // there's no need to write to it at runtime, so it's better to put
558 // it into RELRO.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000559 if (Sec == InX::Dynamic->getParent())
Rui Ueyama9d773f32017-04-13 05:40:07 +0000560 return true;
561
562 // .bss.rel.ro is used for copy relocations for read-only symbols.
563 // Since the dynamic linker needs to process copy relocations, the
564 // section cannot be read-only, but once initialized, they shouldn't
565 // change.
Rafael Espindoladb5e56f2017-05-31 20:17:44 +0000566 if (Sec == InX::BssRelRo->getParent())
Peter Collingbournefeb66292017-01-10 01:21:50 +0000567 return true;
Rui Ueyama26ad0572017-02-16 04:51:46 +0000568
Rui Ueyama9d773f32017-04-13 05:40:07 +0000569 // Sections with some special names are put into RELRO. This is a
570 // bit unfortunate because section names shouldn't be significant in
571 // ELF in spirit. But in reality many linker features depend on
572 // magic section names.
Rafael Espindola40849412017-02-24 14:28:00 +0000573 StringRef S = Sec->Name;
Rui Ueyama01faef02015-12-10 19:19:04 +0000574 return S == ".data.rel.ro" || S == ".ctors" || S == ".dtors" || S == ".jcr" ||
George Rimard003c7f2016-12-20 11:28:54 +0000575 S == ".eh_frame" || S == ".openbsd.randomdata";
George Rimare3336c02015-11-24 10:15:50 +0000576}
577
// Every output section is given a rank that decides where it is placed in
// the file. Rather than plain sequence numbers (0, 1, 2, ...), the rank is
// a set of bit flags, one for each decision point in getSectionRank. Flags
// listed first occupy higher bits, so they dominate the flags listed after
// them when two ranks are compared numerically.
// Using flags has two key properties:
// * It is easy to check if a given branch was taken.
// * It is easy to see how similar two ranks are (see getRankProximity).
enum RankFlags {
  RF_NOT_ADDR_SET = 0x10000,  // bit 16: no entry in Config->SectionStartMap
  RF_NOT_INTERP = 0x8000,     // bit 15: section is not ".interp"
  RF_NOT_ALLOC = 0x4000,      // bit 14: SHF_ALLOC is not set
  RF_WRITE = 0x2000,          // bit 13: writable, not executable
  RF_EXEC_WRITE = 0x1000,     // bit 12: writable and executable
  RF_EXEC = 0x800,            // bit 11: executable, not writable
  RF_NON_TLS_BSS = 0x400,     // bit 10: SHT_NOBITS without SHF_TLS
  RF_NON_TLS_BSS_RO = 0x200,  // bit 9: keeps the RELRO sections contiguous
  RF_NOT_TLS = 0x100,         // bit 8: SHF_TLS is not set
  RF_BSS = 0x80,              // bit 7: SHT_NOBITS
  RF_PPC_NOT_TOCBSS = 0x40,   // bit 6: PPC64, section is not ".tocbss"
  RF_PPC_OPD = 0x20,          // bit 5: PPC64 ".opd"
  RF_PPC_TOCL = 0x10,         // bit 4: PPC64 ".toc1"
  RF_PPC_TOC = 0x8,           // bit 3: PPC64 ".toc"
  RF_PPC_BRANCH_LT = 0x4,     // bit 2: PPC64 ".branch_lt"
  RF_MIPS_GPREL = 0x2,        // bit 1: MIPS, SHF_MIPS_GPREL is set
  RF_MIPS_NOT_GOT = 0x1       // bit 0: MIPS, section is not ".got"
};
Rui Ueyamae288eef2016-11-02 18:58:44 +0000604
Rafael Espindola52101412017-05-12 14:52:22 +0000605static unsigned getSectionRank(const OutputSection *Sec) {
606 unsigned Rank = 0;
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000607
Rafael Espindola5967c972016-12-19 21:21:07 +0000608 // We want to put section specified by -T option first, so we
609 // can start assigning VA starting from them later.
Rafael Espindola52101412017-05-12 14:52:22 +0000610 if (Config->SectionStartMap.count(Sec->Name))
611 return Rank;
612 Rank |= RF_NOT_ADDR_SET;
613
614 // Put .interp first because some loaders want to see that section
615 // on the first page of the executable file when loaded into memory.
616 if (Sec->Name == ".interp")
617 return Rank;
618 Rank |= RF_NOT_INTERP;
619
620 // Allocatable sections go first to reduce the total PT_LOAD size and
621 // so debug info doesn't change addresses in actual code.
622 if (!(Sec->Flags & SHF_ALLOC))
623 return Rank | RF_NOT_ALLOC;
Rafael Espindola5967c972016-12-19 21:21:07 +0000624
Rafael Espindolad23e9262017-05-26 17:23:25 +0000625 // Sort sections based on their access permission in the following
626 // order: R, RX, RWX, RW. This order is based on the following
627 // considerations:
628 // * Read-only sections come first such that they go in the
629 // PT_LOAD covering the program headers at the start of the file.
630 // * Read-only, executable sections come next, unless the
631 // -no-rosegment option is used.
632 // * Writable, executable sections follow such that .plt on
633 // architectures where it needs to be writable will be placed
634 // between .text and .data.
635 // * Writable sections come last, such that .bss lands at the very
636 // end of the last PT_LOAD.
637 bool IsExec = Sec->Flags & SHF_EXECINSTR;
638 bool IsWrite = Sec->Flags & SHF_WRITE;
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000639
Rafael Espindolad23e9262017-05-26 17:23:25 +0000640 if (IsExec) {
641 if (IsWrite)
642 Rank |= RF_EXEC_WRITE;
643 else if (!Config->SingleRoRx)
Rafael Espindola52101412017-05-12 14:52:22 +0000644 Rank |= RF_EXEC;
Rafael Espindolad23e9262017-05-26 17:23:25 +0000645 } else {
646 if (IsWrite)
647 Rank |= RF_WRITE;
Rafael Espindolae979fd12016-09-29 22:48:55 +0000648 }
Rui Ueyama5a9640b2015-10-08 23:49:30 +0000649
Hal Finkel0d7e83b2015-10-13 17:57:46 +0000650 // If we got here we know that both A and B are in the same PT_LOAD.
Michael J. Spencer1bf73002015-10-16 23:11:07 +0000651
Rafael Espindola52101412017-05-12 14:52:22 +0000652 bool IsTls = Sec->Flags & SHF_TLS;
653 bool IsNoBits = Sec->Type == SHT_NOBITS;
Hal Finkel3bae2d82015-10-12 20:51:48 +0000654
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000655 // The first requirement we have is to put (non-TLS) nobits sections last. The
656 // reason is that the only thing the dynamic linker will see about them is a
657 // p_memsz that is larger than p_filesz. Seeing that it zeros the end of the
658 // PT_LOAD, so that has to correspond to the nobits sections.
Rafael Espindola52101412017-05-12 14:52:22 +0000659 bool IsNonTlsNoBits = IsNoBits && !IsTls;
660 if (IsNonTlsNoBits)
661 Rank |= RF_NON_TLS_BSS;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000662
663 // We place nobits RelRo sections before plain r/w ones, and non-nobits RelRo
664 // sections after r/w ones, so that the RelRo sections are contiguous.
Rafael Espindola52101412017-05-12 14:52:22 +0000665 bool IsRelRo = isRelroSection(Sec);
666 if (IsNonTlsNoBits && !IsRelRo)
667 Rank |= RF_NON_TLS_BSS_RO;
668 if (!IsNonTlsNoBits && IsRelRo)
669 Rank |= RF_NON_TLS_BSS_RO;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000670
671 // The TLS initialization block needs to be a single contiguous block in a R/W
672 // PT_LOAD, so stick TLS sections directly before the other RelRo R/W
673 // sections. The TLS NOBITS sections are placed here as they don't take up
674 // virtual address space in the PT_LOAD.
Rafael Espindola52101412017-05-12 14:52:22 +0000675 if (!IsTls)
676 Rank |= RF_NOT_TLS;
Peter Collingbourne628ec9f2017-01-10 01:21:30 +0000677
678 // Within the TLS initialization block, the non-nobits sections need to appear
679 // first.
Rafael Espindola52101412017-05-12 14:52:22 +0000680 if (IsNoBits)
681 Rank |= RF_BSS;
George Rimare3336c02015-11-24 10:15:50 +0000682
Ben Dunbobbin95637552017-08-18 16:15:36 +0000683 // Some architectures have additional ordering restrictions for sections
684 // within the same PT_LOAD.
Rafael Espindola52101412017-05-12 14:52:22 +0000685 if (Config->EMachine == EM_PPC64) {
686 // PPC64 has a number of special SHT_PROGBITS+SHF_ALLOC+SHF_WRITE sections
687 // that we would like to make sure appear is a specific order to maximize
688 // their coverage by a single signed 16-bit offset from the TOC base
689 // pointer. Conversely, the special .tocbss section should be first among
690 // all SHT_NOBITS sections. This will put it next to the loaded special
691 // PPC64 sections (and, thus, within reach of the TOC base pointer).
692 StringRef Name = Sec->Name;
693 if (Name != ".tocbss")
694 Rank |= RF_PPC_NOT_TOCBSS;
Hal Finkel9abc2a52015-10-13 19:07:29 +0000695
Rafael Espindola52101412017-05-12 14:52:22 +0000696 if (Name == ".opd")
697 Rank |= RF_PPC_OPD;
698
699 if (Name == ".toc1")
700 Rank |= RF_PPC_TOCL;
701
702 if (Name == ".toc")
703 Rank |= RF_PPC_TOC;
704
705 if (Name == ".branch_lt")
706 Rank |= RF_PPC_BRANCH_LT;
707 }
708 if (Config->EMachine == EM_MIPS) {
709 // All sections with SHF_MIPS_GPREL flag should be grouped together
710 // because data in these sections is addressable with a gp relative address.
711 if (Sec->Flags & SHF_MIPS_GPREL)
712 Rank |= RF_MIPS_GPREL;
713
714 if (Sec->Name != ".got")
715 Rank |= RF_MIPS_NOT_GOT;
716 }
717
718 return Rank;
719}
720
Rafael Espindola383971d2017-06-15 21:51:01 +0000721static bool compareSections(const BaseCommand *ACmd, const BaseCommand *BCmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000722 const OutputSection *A = cast<OutputSection>(ACmd);
723 const OutputSection *B = cast<OutputSection>(BCmd);
Rafael Espindola52101412017-05-12 14:52:22 +0000724 if (A->SortRank != B->SortRank)
725 return A->SortRank < B->SortRank;
726 if (!(A->SortRank & RF_NOT_ADDR_SET))
727 return Config->SectionStartMap.lookup(A->Name) <
728 Config->SectionStartMap.lookup(B->Name);
Rafael Espindola24c073d2016-09-21 22:36:19 +0000729 return false;
730}
731
Rafael Espindola24e6f362017-02-24 15:07:30 +0000732void PhdrEntry::add(OutputSection *Sec) {
George Rimar6823c5f2017-09-07 11:01:10 +0000733 LastSec = Sec;
734 if (!FirstSec)
735 FirstSec = Sec;
Rafael Espindola37707632017-03-07 14:55:52 +0000736 p_align = std::max(p_align, Sec->Alignment);
Rafael Espindola17cb7c02016-12-19 17:01:01 +0000737 if (p_type == PT_LOAD)
George Rimar582ede82017-09-07 10:53:07 +0000738 Sec->PtLoad = this;
Eugene Leviantbbe38602016-07-19 09:25:43 +0000739}
740
Denis Protivensky8e3b38a2015-11-12 09:52:08 +0000741template <class ELFT>
Rafael Espindola5616adf2017-03-08 22:36:28 +0000742static Symbol *addRegular(StringRef Name, SectionBase *Sec, uint64_t Value,
743 uint8_t StOther = STV_HIDDEN,
744 uint8_t Binding = STB_WEAK) {
Rafael Espindoladab02d42016-11-17 21:20:16 +0000745 // The linker generated symbols are added as STB_WEAK to allow user defined
746 // ones to override them.
Rafael Espindola244ef982017-07-26 18:42:48 +0000747 return Symtab->addRegular<ELFT>(Name, StOther, STT_NOTYPE, Value,
748 /*Size=*/0, Binding, Sec,
749 /*File=*/nullptr);
Eugene Leviantad4439e2016-11-11 11:33:32 +0000750}
751
752template <class ELFT>
Rafael Espindola5616adf2017-03-08 22:36:28 +0000753static DefinedRegular *
754addOptionalRegular(StringRef Name, SectionBase *Sec, uint64_t Val,
755 uint8_t StOther = STV_HIDDEN, uint8_t Binding = STB_GLOBAL) {
Rafael Espindola244ef982017-07-26 18:42:48 +0000756 SymbolBody *S = Symtab->find(Name);
Eugene Leviantad4439e2016-11-11 11:33:32 +0000757 if (!S)
758 return nullptr;
Rafael Espindola1d6d1b42017-01-17 16:08:06 +0000759 if (S->isInCurrentDSO())
Rafael Espindola5616adf2017-03-08 22:36:28 +0000760 return nullptr;
761 return cast<DefinedRegular>(
762 addRegular<ELFT>(Name, Sec, Val, StOther, Binding)->body());
Eugene Leviantad4439e2016-11-11 11:33:32 +0000763}
764
Rui Ueyama01687222015-12-26 09:47:57 +0000765// The beginning and the ending of .rel[a].plt section are marked
766// with __rel[a]_iplt_{start,end} symbols if it is a statically linked
767// executable. The runtime needs these symbols in order to resolve
768// all IRELATIVE relocs on startup. For dynamic executables, we don't
769// need these symbols, since IRELATIVE relocs are resolved through GOT
770// and PLT. For details, see http://www.airs.com/blog/archives/403.
George Rimaree741cf2016-04-14 13:23:02 +0000771template <class ELFT> void Writer<ELFT>::addRelIpltSymbols() {
Shoaib Meenai335fad12017-08-05 05:01:07 +0000772 if (!Config->Static)
George Rimara07ff662015-12-21 10:12:06 +0000773 return;
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000774 StringRef S = Config->IsRela ? "__rela_iplt_start" : "__rel_iplt_start";
Rafael Espindola5616adf2017-03-08 22:36:28 +0000775 addOptionalRegular<ELFT>(S, In<ELFT>::RelaIplt, 0, STV_HIDDEN, STB_WEAK);
Rui Ueyama01687222015-12-26 09:47:57 +0000776
Rui Ueyamad57e74b72017-03-17 23:29:01 +0000777 S = Config->IsRela ? "__rela_iplt_end" : "__rel_iplt_end";
Rafael Espindola5616adf2017-03-08 22:36:28 +0000778 addOptionalRegular<ELFT>(S, In<ELFT>::RelaIplt, -1, STV_HIDDEN, STB_WEAK);
George Rimara07ff662015-12-21 10:12:06 +0000779}
780
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000781// The linker is expected to define some symbols depending on
782// the linking result. This function defines such symbols.
783template <class ELFT> void Writer<ELFT>::addReservedSymbols() {
George Rimar7beff422016-11-15 08:19:02 +0000784 if (Config->EMachine == EM_MIPS) {
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000785 // Define _gp for MIPS. st_value of _gp symbol will be updated by Writer
Simon Atanasyan6a4eb752016-12-08 06:19:47 +0000786 // so that it points to an absolute address which by default is relative
787 // to GOT. Default offset is 0x7ff0.
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000788 // See "Global Data Symbols" in Chapter 6 in the following document:
789 // ftp://www.linux-mips.org/pub/linux/mips/doc/ABI/mipsabi.pdf
Rafael Espindola244ef982017-07-26 18:42:48 +0000790 ElfSym::MipsGp = Symtab->addAbsolute<ELFT>("_gp", STV_HIDDEN, STB_LOCAL);
Rafael Espindola9b3f99e2016-04-12 02:24:43 +0000791
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000792 // On MIPS O32 ABI, _gp_disp is a magic symbol designates offset between
Simon Atanasyand34a3632017-03-20 21:03:43 +0000793 // start of function and 'gp' pointer into GOT.
Rafael Espindola244ef982017-07-26 18:42:48 +0000794 if (Symtab->find("_gp_disp"))
Rui Ueyama80474a22017-02-28 19:29:55 +0000795 ElfSym::MipsGpDisp =
Rafael Espindola244ef982017-07-26 18:42:48 +0000796 Symtab->addAbsolute<ELFT>("_gp_disp", STV_HIDDEN, STB_LOCAL);
Peter Collingbourne6f535b72016-05-03 18:03:45 +0000797
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000798 // The __gnu_local_gp is a magic symbol equal to the current value of 'gp'
799 // pointer. This symbol is used in the code generated by .cpload pseudo-op
800 // in case of using -mno-shared option.
801 // https://sourceware.org/ml/binutils/2004-12/msg00094.html
Rafael Espindola244ef982017-07-26 18:42:48 +0000802 if (Symtab->find("__gnu_local_gp"))
Rui Ueyama80474a22017-02-28 19:29:55 +0000803 ElfSym::MipsLocalGp =
Rafael Espindola244ef982017-07-26 18:42:48 +0000804 Symtab->addAbsolute<ELFT>("__gnu_local_gp", STV_HIDDEN, STB_LOCAL);
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000805 }
806
Peter Smith113a59e2017-06-26 10:22:17 +0000807 // The _GLOBAL_OFFSET_TABLE_ symbol is defined by target convention to
808 // be at some offset from the base of the .got section, usually 0 or the end
809 // of the .got
Rui Ueyama92c37812017-06-26 15:11:24 +0000810 InputSection *GotSection = InX::MipsGot ? cast<InputSection>(InX::MipsGot)
811 : cast<InputSection>(InX::Got);
812 ElfSym::GlobalOffsetTable = addOptionalRegular<ELFT>(
813 "_GLOBAL_OFFSET_TABLE_", GotSection, Target->GotBaseSymOff);
Rafael Espindolaccfe3cb2016-04-04 14:04:16 +0000814
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000815 // __tls_get_addr is defined by the dynamic linker for dynamic ELFs. For
816 // static linking the linker is required to optimize away any references to
817 // __tls_get_addr, so it's not defined anywhere. Create a hidden definition
Rui Ueyamaa2a46a92017-04-25 04:44:54 +0000818 // to avoid the undefined symbol error.
George Rimar69b17c32017-05-16 10:04:42 +0000819 if (!InX::DynSymTab)
Rafael Espindola244ef982017-07-26 18:42:48 +0000820 Symtab->addIgnored<ELFT>("__tls_get_addr");
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000821
Petr Hosek6b936bf2017-05-10 16:20:33 +0000822 // __ehdr_start is the location of ELF file headers. Note that we define
823 // this symbol unconditionally even when using a linker script, which
824 // differs from the behavior implemented by GNU linker which only define
825 // this symbol if ELF headers are in the memory mapped segment.
Rafael Espindola0e454a92017-06-06 16:18:48 +0000826 // __executable_start is not documented, but the expectation of at
827 // least the android libc is that it points to the elf header too.
828 // __dso_handle symbol is passed to cxa_finalize as a marker to identify
829 // each DSO. The address of the symbol doesn't matter as long as they are
830 // different in different DSOs, so we chose the start address of the DSO.
831 for (const char *Name :
832 {"__ehdr_start", "__executable_start", "__dso_handle"})
833 addOptionalRegular<ELFT>(Name, Out::ElfHeader, 0, STV_HIDDEN);
Petr Hosek6b936bf2017-05-10 16:20:33 +0000834
George Rimar28ac19c2016-08-08 08:42:48 +0000835 // If linker script do layout we do not need to create any standart symbols.
Rui Ueyamaa34da932017-03-21 23:03:09 +0000836 if (Script->Opt.HasSections)
George Rimar28ac19c2016-08-08 08:42:48 +0000837 return;
838
Davide Italiano763febc2017-09-18 18:31:49 +0000839 auto Add = [](StringRef S, int64_t Pos) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000840 return addOptionalRegular<ELFT>(S, Out::ElfHeader, Pos, STV_DEFAULT);
George Rimar9e859392016-02-26 14:36:36 +0000841 };
842
Rafael Espindola4d560162017-09-12 16:38:01 +0000843 ElfSym::Bss = Add("__bss_start", 0);
Davide Italiano763febc2017-09-18 18:31:49 +0000844 ElfSym::End1 = Add("end", -1);
845 ElfSym::End2 = Add("_end", -1);
846 ElfSym::Etext1 = Add("etext", -1);
847 ElfSym::Etext2 = Add("_etext", -1);
848 ElfSym::Edata1 = Add("edata", -1);
849 ElfSym::Edata2 = Add("_edata", -1);
Rui Ueyamaf18fe7b2015-12-26 07:50:39 +0000850}
851
Rui Ueyamac4185702016-02-10 23:20:42 +0000852// Sort input sections by section name suffixes for
853// __attribute__((init_priority(N))).
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000854static void sortInitFini(OutputSection *Cmd) {
Rafael Espindola21263342017-07-05 23:36:24 +0000855 if (Cmd)
856 Cmd->sortInitFini();
Rui Ueyama5af83682016-02-11 23:41:38 +0000857}
858
859// Sort input sections by the special rule for .ctors and .dtors.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000860static void sortCtorsDtors(OutputSection *Cmd) {
Rafael Espindola21263342017-07-05 23:36:24 +0000861 if (Cmd)
862 Cmd->sortCtorsDtors();
Rui Ueyamac4185702016-02-10 23:20:42 +0000863}
864
George Rimar1a33c0f2016-11-10 09:05:20 +0000865// Sort input sections using the list provided by --symbol-ordering-file.
George Rimar696a7f92017-09-19 09:20:54 +0000866static void sortBySymbolsOrder() {
George Rimar1a33c0f2016-11-10 09:05:20 +0000867 if (Config->SymbolOrderingFile.empty())
868 return;
869
Rui Ueyama31270312016-12-20 01:51:08 +0000870 // Sort sections by priority.
George Rimar696a7f92017-09-19 09:20:54 +0000871 DenseMap<SectionBase *, int> SectionOrder = buildSectionOrder();
Rafael Espindola21263342017-07-05 23:36:24 +0000872 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000873 if (auto *Sec = dyn_cast<OutputSection>(Base))
874 Sec->sort([&](InputSectionBase *S) { return SectionOrder.lookup(S); });
George Rimar1a33c0f2016-11-10 09:05:20 +0000875}
876
Eugene Leviante63d81b2016-07-20 14:43:20 +0000877template <class ELFT>
Rafael Espindolab4c9b812017-02-23 02:28:28 +0000878void Writer<ELFT>::forEachRelSec(std::function<void(InputSectionBase &)> Fn) {
George Rimarcb888a62017-09-13 07:54:47 +0000879 // Scan all relocations. Each relocation goes through a series
880 // of tests to determine if it needs special treatment, such as
881 // creating GOT, PLT, copy relocations, etc.
882 // Note that relocations for non-alloc sections are directly
883 // processed by InputSection::relocateNonAlloc.
884 for (InputSectionBase *IS : InputSections)
885 if (IS->Live && isa<InputSection>(IS) && (IS->Flags & SHF_ALLOC))
Rafael Espindola9f0c4bb2016-11-10 14:53:24 +0000886 Fn(*IS);
George Rimarcb888a62017-09-13 07:54:47 +0000887 for (EhInputSection *ES : In<ELFT>::EhFrame->Sections)
888 Fn(*ES);
Rafael Espindola0f7ceda2016-07-20 17:58:07 +0000889}
890
Eugene Leviant282251a2016-11-01 09:49:24 +0000891template <class ELFT> void Writer<ELFT>::createSections() {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000892 std::vector<BaseCommand *> Old = Script->Opt.Commands;
893 Script->Opt.Commands.clear();
Rui Ueyama536a2672017-02-27 02:32:08 +0000894 for (InputSectionBase *IS : InputSections)
Rafael Espindola82902742017-02-16 17:32:26 +0000895 if (IS)
George Rimare21c3af2017-03-14 09:30:25 +0000896 Factory.addInputSec(IS, getOutputSectionName(IS->Name));
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000897 Script->Opt.Commands.insert(Script->Opt.Commands.end(), Old.begin(),
898 Old.end());
Eugene Leviantceabe802016-08-11 07:56:43 +0000899
Rafael Espindola21263342017-07-05 23:36:24 +0000900 Script->fabricateDefaultCommands();
George Rimar696a7f92017-09-19 09:20:54 +0000901 sortBySymbolsOrder();
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000902 sortInitFini(findSection(".init_array"));
903 sortInitFini(findSection(".fini_array"));
904 sortCtorsDtors(findSection(".ctors"));
905 sortCtorsDtors(findSection(".dtors"));
Eugene Leviante63d81b2016-07-20 14:43:20 +0000906}
907
Petr Hosek18821b62017-09-01 02:23:31 +0000908// This function generates assignments for predefined symbols (e.g. _end or
909// _etext) and inserts them into the commands sequence to be processed at the
910// appropriate time. This ensures that the value is going to be correct by the
911// time any references to these symbols are processed and is equivalent to
912// defining these symbols explicitly in the linker script.
Rafael Espindola4d560162017-09-12 16:38:01 +0000913template <class ELFT> void Writer<ELFT>::setReservedSymbolSections() {
Petr Hosek18821b62017-09-01 02:23:31 +0000914 PhdrEntry *Last = nullptr;
915 PhdrEntry *LastRO = nullptr;
916 PhdrEntry *LastRW = nullptr;
Rui Ueyama888da8c2017-09-05 20:17:37 +0000917
Petr Hosek18821b62017-09-01 02:23:31 +0000918 for (PhdrEntry *P : Phdrs) {
919 if (P->p_type != PT_LOAD)
920 continue;
921 Last = P;
922 if (P->p_flags & PF_W)
923 LastRW = P;
924 else
925 LastRO = P;
926 }
927
Rui Ueyama888da8c2017-09-05 20:17:37 +0000928 // _end is the first location after the uninitialized data region.
Petr Hosek18821b62017-09-01 02:23:31 +0000929 if (Last) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000930 if (ElfSym::End1)
931 ElfSym::End1->Section = Last->LastSec;
932 if (ElfSym::End2)
933 ElfSym::End2->Section = Last->LastSec;
Petr Hosek18821b62017-09-01 02:23:31 +0000934 }
Rui Ueyama888da8c2017-09-05 20:17:37 +0000935
936 // _etext is the first location after the last read-only loadable segment.
Petr Hosek18821b62017-09-01 02:23:31 +0000937 if (LastRO) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000938 if (ElfSym::Etext1)
939 ElfSym::Etext1->Section = LastRO->LastSec;
940 if (ElfSym::Etext2)
941 ElfSym::Etext2->Section = LastRO->LastSec;
Petr Hosek18821b62017-09-01 02:23:31 +0000942 }
Rui Ueyama888da8c2017-09-05 20:17:37 +0000943
944 // _edata points to the end of the last non SHT_NOBITS section.
Petr Hosek18821b62017-09-01 02:23:31 +0000945 if (LastRW) {
Rui Ueyama888da8c2017-09-05 20:17:37 +0000946 size_t I = 0;
Rafael Espindola4d560162017-09-12 16:38:01 +0000947 for (; I < OutputSections.size(); ++I)
948 if (OutputSections[I] == LastRW->FirstSec)
Rui Ueyama888da8c2017-09-05 20:17:37 +0000949 break;
950
Rafael Espindola4d560162017-09-12 16:38:01 +0000951 for (; I < OutputSections.size(); ++I) {
952 if (OutputSections[I]->Type != SHT_NOBITS)
Rui Ueyama888da8c2017-09-05 20:17:37 +0000953 continue;
Rui Ueyama888da8c2017-09-05 20:17:37 +0000954 break;
Petr Hosek18821b62017-09-01 02:23:31 +0000955 }
Rafael Espindola4d560162017-09-12 16:38:01 +0000956 if (ElfSym::Edata1)
957 ElfSym::Edata1->Section = OutputSections[I - 1];
958 if (ElfSym::Edata2)
959 ElfSym::Edata2->Section = OutputSections[I - 1];
960 }
961
962 if (ElfSym::Bss)
963 ElfSym::Bss->Section = findSection(".bss");
964
965 // Setup MIPS _gp_disp/__gnu_local_gp symbols which should
966 // be equal to the _gp symbol's value.
Rafael Espindola9be24cf2017-09-20 18:30:57 +0000967 if (ElfSym::MipsGp) {
Rafael Espindola4d560162017-09-12 16:38:01 +0000968 // Find GP-relative section with the lowest address
969 // and use this address to calculate default _gp value.
970 for (OutputSection *OS : OutputSections) {
971 if (OS->Flags & SHF_MIPS_GPREL) {
972 ElfSym::MipsGp->Section = OS;
973 ElfSym::MipsGp->Value = 0x7ff0;
974 break;
975 }
976 }
Petr Hosek18821b62017-09-01 02:23:31 +0000977 }
978}
979
Rafael Espindola52101412017-05-12 14:52:22 +0000980// We want to find how similar two ranks are.
981// The more branches in getSectionRank that match, the more similar they are.
982// Since each branch corresponds to a bit flag, we can just use
983// countLeadingZeros.
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000984static int getRankProximityAux(OutputSection *A, OutputSection *B) {
Rafael Espindola52101412017-05-12 14:52:22 +0000985 return countLeadingZeros(A->SortRank ^ B->SortRank);
Eugene Leviantbae1c652016-11-08 10:44:48 +0000986}
987
Rafael Espindola383971d2017-06-15 21:51:01 +0000988static int getRankProximity(OutputSection *A, BaseCommand *B) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +0000989 if (auto *Sec = dyn_cast<OutputSection>(B))
990 if (Sec->Live)
991 return getRankProximityAux(A, Sec);
Rafael Espindola383971d2017-06-15 21:51:01 +0000992 return -1;
993}
994
995// When placing orphan sections, we want to place them after symbol assignments
996// so that an orphan after
997// begin_foo = .;
998// foo : { *(foo) }
999// end_foo = .;
1000// doesn't break the intended meaning of the begin/end symbols.
1001// We don't want to go over sections since findOrphanPos is the
1002// one in charge of deciding the order of the sections.
1003// We don't want to go over changes to '.', since doing so in
1004// rx_sec : { *(rx_sec) }
1005// . = ALIGN(0x1000);
1006// /* The RW PT_LOAD starts here*/
1007// rw_sec : { *(rw_sec) }
1008// would mean that the RW PT_LOAD would become unaligned.
1009static bool shouldSkip(BaseCommand *Cmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001010 if (isa<OutputSection>(Cmd))
Rafael Espindola383971d2017-06-15 21:51:01 +00001011 return false;
1012 if (auto *Assign = dyn_cast<SymbolAssignment>(Cmd))
1013 return Assign->Name != ".";
1014 return true;
1015}
1016
Rafael Espindola52101412017-05-12 14:52:22 +00001017// We want to place orphan sections so that they share as much
1018// characteristics with their neighbors as possible. For example, if
1019// both are rw, or both are tls.
Rafael Espindola0ca37122017-05-09 13:58:46 +00001020template <typename ELFT>
Rafael Espindola383971d2017-06-15 21:51:01 +00001021static std::vector<BaseCommand *>::iterator
1022findOrphanPos(std::vector<BaseCommand *>::iterator B,
1023 std::vector<BaseCommand *>::iterator E) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001024 OutputSection *Sec = cast<OutputSection>(*E);
Rafael Espindola0ca37122017-05-09 13:58:46 +00001025
Rafael Espindola52101412017-05-12 14:52:22 +00001026 // Find the first element that has as close a rank as possible.
Rafael Espindola383971d2017-06-15 21:51:01 +00001027 auto I = std::max_element(B, E, [=](BaseCommand *A, BaseCommand *B) {
Rafael Espindola52101412017-05-12 14:52:22 +00001028 return getRankProximity(Sec, A) < getRankProximity(Sec, B);
1029 });
1030 if (I == E)
Rafael Espindola0ca37122017-05-09 13:58:46 +00001031 return E;
1032
Rafael Espindola52101412017-05-12 14:52:22 +00001033 // Consider all existing sections with the same proximity.
Rafael Espindola383971d2017-06-15 21:51:01 +00001034 int Proximity = getRankProximity(Sec, *I);
1035 for (; I != E; ++I) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001036 auto *CurSec = dyn_cast<OutputSection>(*I);
1037 if (!CurSec || !CurSec->Live)
Rafael Espindola383971d2017-06-15 21:51:01 +00001038 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001039 if (getRankProximity(Sec, CurSec) != Proximity ||
1040 Sec->SortRank < CurSec->SortRank)
Rafael Espindola383971d2017-06-15 21:51:01 +00001041 break;
1042 }
1043 auto J = std::find_if(
Rafael Espindolac54b1c82017-06-15 22:03:06 +00001044 llvm::make_reverse_iterator(I), llvm::make_reverse_iterator(B),
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001045 [](BaseCommand *Cmd) { return isa<OutputSection>(Cmd); });
Rafael Espindola383971d2017-06-15 21:51:01 +00001046 I = J.base();
Rafael Espindolaaad64e02017-09-19 17:29:58 +00001047
1048 // As a special case, if the orphan section is the last section, put
1049 // it at the very end, past any other commands.
1050 // This matches bfd's behavior and is convenient when the linker script fully
1051 // specifies the start of the file, but doesn't care about the end (the non
1052 // alloc sections for example).
1053 auto NextSec = std::find_if(
1054 I, E, [](BaseCommand *Cmd) { return isa<OutputSection>(Cmd); });
1055 if (NextSec == E)
1056 return E;
1057
Rafael Espindola383971d2017-06-15 21:51:01 +00001058 while (I != E && shouldSkip(*I))
Rafael Espindola52101412017-05-12 14:52:22 +00001059 ++I;
1060 return I;
Rafael Espindola0ca37122017-05-09 13:58:46 +00001061}
1062
Rafael Espindola24c073d2016-09-21 22:36:19 +00001063template <class ELFT> void Writer<ELFT>::sortSections() {
George Rimare0b43df2017-06-28 09:59:34 +00001064 if (Script->Opt.HasSections)
1065 Script->adjustSectionsBeforeSorting();
1066
Rafael Espindola1960bcd2016-11-11 22:43:27 +00001067 // Don't sort if using -r. It is not necessary and we want to preserve the
1068 // relative order for SHF_LINK_ORDER sections.
1069 if (Config->Relocatable)
Rafael Espindola85de6782017-06-28 22:44:11 +00001070 return;
Rafael Espindola52101412017-05-12 14:52:22 +00001071
Rafael Espindola383971d2017-06-15 21:51:01 +00001072 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001073 if (auto *Sec = dyn_cast<OutputSection>(Base))
1074 Sec->SortRank = getSectionRank(Sec);
Rafael Espindola52101412017-05-12 14:52:22 +00001075
Rui Ueyamaa34da932017-03-21 23:03:09 +00001076 if (!Script->Opt.HasSections) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001077 // We know that all the OutputSections are contiguous in
Rafael Espindola383971d2017-06-15 21:51:01 +00001078 // this case.
1079 auto E = Script->Opt.Commands.end();
1080 auto I = Script->Opt.Commands.begin();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001081 auto IsSection = [](BaseCommand *Base) { return isa<OutputSection>(Base); };
Rafael Espindola383971d2017-06-15 21:51:01 +00001082 I = std::find_if(I, E, IsSection);
Rafael Espindolac54b1c82017-06-15 22:03:06 +00001083 E = std::find_if(llvm::make_reverse_iterator(E),
1084 llvm::make_reverse_iterator(I), IsSection)
Rafael Espindola383971d2017-06-15 21:51:01 +00001085 .base();
1086 std::stable_sort(I, E, compareSections);
Rafael Espindola24c073d2016-09-21 22:36:19 +00001087 return;
1088 }
1089
Rafael Espindola383971d2017-06-15 21:51:01 +00001090 // Orphan sections are sections present in the input files which are
1091 // not explicitly placed into the output file by the linker script.
1092 //
1093 // The sections in the linker script are already in the correct
1094 // order. We have to figure out where to insert the orphan
1095 // sections.
1096 //
Rafael Espindola24c073d2016-09-21 22:36:19 +00001097 // The order of the sections in the script is arbitrary and may not agree with
Rafael Espindola383971d2017-06-15 21:51:01 +00001098 // compareSections. This means that we cannot easily define a strict weak
1099 // ordering. To see why, consider a comparison of a section in the script and
1100 // one not in the script. We have two simple options:
Rafael Espindola24c073d2016-09-21 22:36:19 +00001101 // * Make them equivalent (a is not less than b, and b is not less than a).
1102 // The problem is then that equivalence has to be transitive and we can
1103 // have sections a, b and c with only b in a script and a less than c
1104 // which breaks this property.
1105 // * Use compareSectionsNonScript. Given that the script order doesn't have
1106 // to match, we can end up with sections a, b, c, d where b and c are in the
1107 // script and c is compareSectionsNonScript less than b. In which case d
1108 // can be equivalent to c, a to b and d < a. As a concrete example:
1109 // .a (rx) # not in script
1110 // .b (rx) # in script
1111 // .c (ro) # in script
1112 // .d (ro) # not in script
1113 //
1114 // The way we define an order then is:
Rafael Espindola383971d2017-06-15 21:51:01 +00001115 // * Sort only the orphan sections. They are in the end right now.
1116 // * Move each orphan section to its preferred position. We try
  // to put each section in the last position where it can share
1118 // a PT_LOAD.
Rafael Espindola383971d2017-06-15 21:51:01 +00001119 //
1120 // There is some ambiguity as to where exactly a new entry should be
1121 // inserted, because Opt.Commands contains not only output section
1122 // commands but also other types of commands such as symbol assignment
1123 // expressions. There's no correct answer here due to the lack of the
1124 // formal specification of the linker script. We use heuristics to
1125 // determine whether a new output command should be added before or
  // after other commands. For the details, look at shouldSkip
1127 // function.
Rafael Espindola24c073d2016-09-21 22:36:19 +00001128
Rafael Espindola383971d2017-06-15 21:51:01 +00001129 auto I = Script->Opt.Commands.begin();
1130 auto E = Script->Opt.Commands.end();
1131 auto NonScriptI = std::find_if(I, E, [](BaseCommand *Base) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001132 if (auto *Sec = dyn_cast<OutputSection>(Base))
1133 return Sec->Live && Sec->SectionIndex == INT_MAX;
Rafael Espindola383971d2017-06-15 21:51:01 +00001134 return false;
1135 });
Rafael Espindola24c073d2016-09-21 22:36:19 +00001136
Rafael Espindola383971d2017-06-15 21:51:01 +00001137 // Sort the orphan sections.
1138 std::stable_sort(NonScriptI, E, compareSections);
1139
1140 // As a horrible special case, skip the first . assignment if it is before any
1141 // section. We do this because it is common to set a load address by starting
1142 // the script with ". = 0xabcd" and the expectation is that every section is
1143 // after that.
1144 auto FirstSectionOrDotAssignment =
1145 std::find_if(I, E, [](BaseCommand *Cmd) { return !shouldSkip(Cmd); });
1146 if (FirstSectionOrDotAssignment != E &&
1147 isa<SymbolAssignment>(**FirstSectionOrDotAssignment))
1148 ++FirstSectionOrDotAssignment;
1149 I = FirstSectionOrDotAssignment;
1150
Rafael Espindola52101412017-05-12 14:52:22 +00001151 while (NonScriptI != E) {
1152 auto Pos = findOrphanPos<ELFT>(I, NonScriptI);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001153 OutputSection *Orphan = cast<OutputSection>(*NonScriptI);
Rafael Espindola52101412017-05-12 14:52:22 +00001154
1155 // As an optimization, find all sections with the same sort rank
1156 // and insert them with one rotate.
Rafael Espindola383971d2017-06-15 21:51:01 +00001157 unsigned Rank = Orphan->SortRank;
1158 auto End = std::find_if(NonScriptI + 1, E, [=](BaseCommand *Cmd) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001159 return cast<OutputSection>(Cmd)->SortRank != Rank;
Rafael Espindola52101412017-05-12 14:52:22 +00001160 });
1161 std::rotate(Pos, NonScriptI, End);
1162 NonScriptI = End;
1163 }
Rafael Espindolaf7a17442016-11-14 15:39:38 +00001164
George Rimara8dba482017-03-20 10:09:58 +00001165 Script->adjustSectionsAfterSorting();
Rafael Espindola24c073d2016-09-21 22:36:19 +00001166}
1167
Peter Smith1ec42d92017-03-08 14:06:24 +00001168static void applySynthetic(const std::vector<SyntheticSection *> &Sections,
1169 std::function<void(SyntheticSection *)> Fn) {
Rui Ueyama9320cb02017-02-27 02:56:02 +00001170 for (SyntheticSection *SS : Sections)
Rafael Espindolad57c58d2017-06-07 02:31:19 +00001171 if (SS && SS->getParent() && !SS->empty())
Peter Smith1ec42d92017-03-08 14:06:24 +00001172 Fn(SS);
Eugene Leviant6380ce22016-11-15 12:26:55 +00001173}
1174
George Rimar11992c862016-11-25 08:05:41 +00001175// We need to add input synthetic sections early in createSyntheticSections()
Rui Ueyamac38860b2016-12-05 21:39:35 +00001176// to make them visible from linkescript side. But not all sections are always
1177// required to be in output. For example we don't need dynamic section content
James Henderson7ee22752017-04-06 09:40:03 +00001178// sometimes. This function filters out such unused sections from the output.
Rafael Espindolac080ff62017-07-03 16:54:39 +00001179static void removeUnusedSyntheticSections() {
Rafael Espindola9e9754b2017-02-03 13:06:18 +00001180 // All input synthetic sections that can be empty are placed after
1181 // all regular ones. We iterate over them all and exit at first
1182 // non-synthetic.
Rui Ueyama536a2672017-02-27 02:32:08 +00001183 for (InputSectionBase *S : llvm::reverse(InputSections)) {
Rui Ueyama9320cb02017-02-27 02:56:02 +00001184 SyntheticSection *SS = dyn_cast<SyntheticSection>(S);
Rui Ueyamac38860b2016-12-05 21:39:35 +00001185 if (!SS)
George Rimar11992c862016-11-25 08:05:41 +00001186 return;
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001187 OutputSection *OS = SS->getParent();
1188 if (!SS->empty() || !OS)
George Rimar11992c862016-11-25 08:05:41 +00001189 continue;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001190
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001191 std::vector<BaseCommand *>::iterator Empty = OS->Commands.end();
1192 for (auto I = OS->Commands.begin(), E = OS->Commands.end(); I != E; ++I) {
Rafael Espindola43ee3602017-07-03 17:32:09 +00001193 BaseCommand *B = *I;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001194 if (auto *ISD = dyn_cast<InputSectionDescription>(B)) {
George Rimar7ac38252017-09-08 13:26:45 +00001195 llvm::erase_if(ISD->Sections,
1196 [=](InputSection *IS) { return IS == SS; });
Rafael Espindolac080ff62017-07-03 16:54:39 +00001197 if (ISD->Sections.empty())
Rafael Espindola43ee3602017-07-03 17:32:09 +00001198 Empty = I;
Rafael Espindolac080ff62017-07-03 16:54:39 +00001199 }
1200 }
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001201 if (Empty != OS->Commands.end())
1202 OS->Commands.erase(Empty);
Rafael Espindolac080ff62017-07-03 16:54:39 +00001203
James Henderson7ee22752017-04-06 09:40:03 +00001204 // If there are no other sections in the output section, remove it from the
1205 // output.
George Rimar9a2da392017-09-08 13:40:07 +00001206 if (OS->Commands.empty())
1207 llvm::erase_if(Script->Opt.Commands,
1208 [&](BaseCommand *Cmd) { return Cmd == OS; });
George Rimar11992c862016-11-25 08:05:41 +00001209 }
1210}
1211
Rafael Espindola35c908f2017-08-10 15:05:37 +00001212// Returns true if a symbol can be replaced at load-time by a symbol
1213// with the same name defined in other ELF executable or DSO.
1214static bool computeIsPreemptible(const SymbolBody &B) {
1215 assert(!B.isLocal());
Rafael Espindola35c908f2017-08-10 15:05:37 +00001216 // Only symbols that appear in dynsym can be preempted.
1217 if (!B.symbol()->includeInDynsym())
1218 return false;
1219
1220 // Only default visibility symbols can be preempted.
1221 if (B.symbol()->Visibility != STV_DEFAULT)
1222 return false;
1223
Rafael Espindola30ea5cf2017-09-12 17:18:03 +00001224 // At this point copy relocations have not been created yet, so any
1225 // symbol that is not defined locally is preemptible.
Rafael Espindolaee6a3522017-09-08 18:41:49 +00001226 if (!B.isInCurrentDSO())
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001227 return true;
1228
1229 // If we have a dynamic list it specifies which local symbols are preemptible.
Rafael Espindola8016bdf2017-09-08 18:53:43 +00001230 if (Config->HasDynamicList)
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001231 return false;
1232
Rafael Espindola35c908f2017-08-10 15:05:37 +00001233 if (!Config->Shared)
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001234 return false;
Rafael Espindola35c908f2017-08-10 15:05:37 +00001235
1236 // -Bsymbolic means that definitions are not preempted.
1237 if (Config->Bsymbolic || (Config->BsymbolicFunctions && B.isFunc()))
Rafael Espindola716c57b2017-09-08 18:23:25 +00001238 return false;
Rafael Espindola35c908f2017-08-10 15:05:37 +00001239 return true;
1240}
1241
Eugene Leviante63d81b2016-07-20 14:43:20 +00001242// Create output section objects and add them to OutputSections.
1243template <class ELFT> void Writer<ELFT>::finalizeSections() {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001244 Out::DebugInfo = findSection(".debug_info");
1245 Out::PreinitArray = findSection(".preinit_array");
1246 Out::InitArray = findSection(".init_array");
1247 Out::FiniArray = findSection(".fini_array");
Rafael Espindola77572242015-10-02 19:37:55 +00001248
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001249 // The linker needs to define SECNAME_start, SECNAME_end and SECNAME_stop
1250 // symbols for sections, so that the runtime can get the start and end
1251 // addresses of each section by section name. Add such symbols.
George Rimarc1034a82016-03-01 19:12:35 +00001252 if (!Config->Relocatable) {
1253 addStartEndSymbols();
Rafael Espindolab6915452017-07-04 19:05:03 +00001254 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001255 if (auto *Sec = dyn_cast<OutputSection>(Base))
1256 addStartStopSymbols(Sec);
George Rimarc1034a82016-03-01 19:12:35 +00001257 }
Rui Ueyamad4530c62016-03-04 18:34:14 +00001258
1259 // Add _DYNAMIC symbol. Unlike GNU gold, our _DYNAMIC symbol has no type.
1260 // It should be okay as no one seems to care about the type.
1261 // Even the author of gold doesn't remember why gold behaves that way.
1262 // https://sourceware.org/ml/binutils/2002-03/msg00360.html
George Rimar69b17c32017-05-16 10:04:42 +00001263 if (InX::DynSymTab)
Rafael Espindola5ab19892017-05-11 23:16:43 +00001264 addRegular<ELFT>("_DYNAMIC", InX::Dynamic, 0);
Rafael Espindola334c3e12015-10-19 15:21:42 +00001265
Rafael Espindolade9857e2016-02-04 21:33:05 +00001266 // Define __rel[a]_iplt_{start,end} symbols if needed.
1267 addRelIpltSymbols();
1268
Rafael Espindola66b4e212017-02-23 22:06:28 +00001269 // This responsible for splitting up .eh_frame section into
Peter Smith1ec42d92017-03-08 14:06:24 +00001270 // pieces. The relocation scan uses those pieces, so this has to be
Rafael Espindola66b4e212017-02-23 22:06:28 +00001271 // earlier.
George Rimar49a47f22017-03-16 10:29:44 +00001272 applySynthetic({In<ELFT>::EhFrame},
1273 [](SyntheticSection *SS) { SS->finalizeContents(); });
Rafael Espindola56004c52016-04-07 14:22:09 +00001274
Rafael Espindola0ff545c2017-09-08 01:09:52 +00001275 for (Symbol *S : Symtab->getSymbols())
Rafael Espindolad72d97b2017-09-08 18:16:59 +00001276 S->body()->IsPreemptible |= computeIsPreemptible(*S->body());
Rafael Espindola35c908f2017-08-10 15:05:37 +00001277
Rafael Espindola0f7ceda2016-07-20 17:58:07 +00001278 // Scan relocations. This must be done after every symbol is declared so that
1279 // we can correctly decide if a dynamic relocation is needed.
George Rimarcb888a62017-09-13 07:54:47 +00001280 if (!Config->Relocatable)
1281 forEachRelSec(scanRelocations<ELFT>);
Rafael Espindola0f7ceda2016-07-20 17:58:07 +00001282
Rafael Espindola895aea62017-05-11 22:02:41 +00001283 if (InX::Plt && !InX::Plt->empty())
1284 InX::Plt->addSymbols();
1285 if (InX::Iplt && !InX::Iplt->empty())
1286 InX::Iplt->addSymbols();
Peter Smith96943762017-01-25 10:31:16 +00001287
Peter Smith55865432017-02-20 11:12:33 +00001288 // Now that we have defined all possible global symbols including linker-
Rui Ueyama1b2a8bf2015-12-26 10:22:16 +00001289 // synthesized ones. Visit all symbols to give the finishing touches.
Rafael Espindola244ef982017-07-26 18:42:48 +00001290 for (Symbol *S : Symtab->getSymbols()) {
Peter Collingbourne4f952702016-05-01 04:55:03 +00001291 SymbolBody *Body = S->body();
Rafael Espindola0baa73f2016-04-26 13:56:26 +00001292
George Rimar7702bc22017-03-16 11:20:02 +00001293 if (!includeInSymtab(*Body))
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001294 continue;
George Rimar69b17c32017-05-16 10:04:42 +00001295 if (InX::SymTab)
1296 InX::SymTab->addSymbol(Body);
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001297
George Rimar69b17c32017-05-16 10:04:42 +00001298 if (InX::DynSymTab && S->includeInDynsym()) {
1299 InX::DynSymTab->addSymbol(Body);
Rui Ueyama4076fa12017-02-26 23:35:34 +00001300 if (auto *SS = dyn_cast<SharedSymbol>(Body))
Rafael Espindola6e93d052017-08-04 22:31:42 +00001301 if (cast<SharedFile<ELFT>>(S->File)->isNeeded())
Eugene Leviante9bab5d2016-11-21 16:59:33 +00001302 In<ELFT>::VerNeed->addSymbol(SS);
Peter Collingbourne21a12fc2016-04-27 20:22:31 +00001303 }
Rafael Espindola05a3dd22015-09-22 23:38:23 +00001304 }
Rui Ueyamac2a0d7e2016-01-28 22:56:29 +00001305
1306 // Do not proceed if there was an undefined symbol.
Rui Ueyamaf373dd72016-11-24 01:43:21 +00001307 if (ErrorCount)
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001308 return;
Rui Ueyamac2a0d7e2016-01-28 22:56:29 +00001309
Rafael Espindola1eb3a0f2017-07-04 18:26:21 +00001310 addPredefinedSections();
Rafael Espindolac080ff62017-07-03 16:54:39 +00001311 removeUnusedSyntheticSections();
1312
Rafael Espindola24c073d2016-09-21 22:36:19 +00001313 sortSections();
Rafael Espindola383971d2017-06-15 21:51:01 +00001314
1315 // Now that we have the final list, create a list of all the
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001316 // OutputSections for convenience.
Rafael Espindolacdf813b2017-06-13 22:36:20 +00001317 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001318 if (auto *Sec = dyn_cast<OutputSection>(Base))
1319 OutputSections.push_back(Sec);
Rui Ueyama84417f82015-12-26 07:50:41 +00001320
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001321 // Prefer command line supplied address over other constraints.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001322 for (OutputSection *Sec : OutputSections) {
1323 auto I = Config->SectionStartMap.find(Sec->Name);
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001324 if (I != Config->SectionStartMap.end())
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001325 Sec->AddrExpr = [=] { return I->second; };
Rafael Espindola9c0395e2017-06-20 01:51:50 +00001326 }
1327
Rafael Espindola78493a22017-01-28 17:48:21 +00001328 // This is a bit of a hack. A value of 0 means undef, so we set it
1329 // to 1 t make __ehdr_start defined. The section number is not
1330 // particularly relevant.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001331 Out::ElfHeader->SectionIndex = 1;
Rafael Espindola78493a22017-01-28 17:48:21 +00001332
George Rimar7ca06272016-04-06 07:20:45 +00001333 unsigned I = 1;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001334 for (OutputSection *Sec : OutputSections) {
George Rimar7ca06272016-04-06 07:20:45 +00001335 Sec->SectionIndex = I++;
Rafael Espindola895aea62017-05-11 22:02:41 +00001336 Sec->ShName = InX::ShStrTab->addString(Sec->Name);
George Rimar7ca06272016-04-06 07:20:45 +00001337 }
Rui Ueyama84417f82015-12-26 07:50:41 +00001338
Rafael Espindola5967c972016-12-19 21:21:07 +00001339 // Binary and relocatable output does not have PHDRS.
1340 // The headers have to be created before finalize as that can influence the
1341 // image base and the dynamic section on mips includes the image base.
1342 if (!Config->Relocatable && !Config->OFormatBinary) {
Rafael Espindolaf51c8052017-06-13 23:26:31 +00001343 Phdrs = Script->hasPhdrsCommands() ? Script->createPhdrs() : createPhdrs();
Rafael Espindola5967c972016-12-19 21:21:07 +00001344 addPtArmExid(Phdrs);
Rafael Espindola02ed7572017-05-04 19:34:17 +00001345 Out::ProgramHeaders->Size = sizeof(Elf_Phdr) * Phdrs.size();
Rafael Espindola5967c972016-12-19 21:21:07 +00001346 }
1347
Rafael Espindola4d560162017-09-12 16:38:01 +00001348 // Some symbols are defined in term of program headers. Now that we
1349 // have the headers, we can find out which sections they point to.
1350 setReservedSymbolSections();
1351
Eugene Leviantbe809a72016-11-18 06:44:18 +00001352 // Dynamic section must be the last one in this list and dynamic
1353 // symbol table section (DynSymTab) must be the first one.
Rui Ueyama2b6631b2017-08-15 17:01:39 +00001354 applySynthetic({InX::DynSymTab, InX::Bss,
1355 InX::BssRelRo, InX::GnuHashTab,
George Rimaraaf54712017-09-27 09:14:59 +00001356 InX::HashTab, InX::SymTab,
Rui Ueyama2b6631b2017-08-15 17:01:39 +00001357 InX::ShStrTab, InX::StrTab,
1358 In<ELFT>::VerDef, InX::DynStrTab,
1359 InX::Got, InX::MipsGot,
1360 InX::IgotPlt, InX::GotPlt,
1361 In<ELFT>::RelaDyn, In<ELFT>::RelaIplt,
1362 In<ELFT>::RelaPlt, InX::Plt,
1363 InX::Iplt, In<ELFT>::EhFrameHdr,
1364 In<ELFT>::VerSym, In<ELFT>::VerNeed,
1365 InX::Dynamic},
George Rimar49a47f22017-03-16 10:29:44 +00001366 [](SyntheticSection *SS) { SS->finalizeContents(); });
Peter Smith1ec42d92017-03-08 14:06:24 +00001367
Peter Smith3ef89b02017-09-06 14:02:14 +00001368 if (!Script->Opt.HasSections && !Config->Relocatable)
1369 fixSectionAlignments();
1370
Peter Smith1ec42d92017-03-08 14:06:24 +00001371 // Some architectures use small displacements for jump instructions.
1372 // It is linker's responsibility to create thunks containing long
1373 // jump instructions if jump targets are too far. Create thunks.
1374 if (Target->NeedsThunks) {
1375 // FIXME: only ARM Interworking and Mips LA25 Thunks are implemented,
1376 // these
1377 // do not require address information. To support range extension Thunks
1378 // we need to assign addresses so that we can tell if jump instructions
1379 // are out of range. This will need to turn into a loop that converges
1380 // when no more Thunks are added
George Rimarec84ffc2017-05-17 07:10:59 +00001381 ThunkCreator TC;
Peter Smith96f813d2017-07-07 10:03:37 +00001382 Script->assignAddresses();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001383 if (TC.createThunks(OutputSections)) {
Rafael Espindolab3aa2c92017-05-11 21:33:30 +00001384 applySynthetic({InX::MipsGot},
George Rimar49a47f22017-03-16 10:29:44 +00001385 [](SyntheticSection *SS) { SS->updateAllocSize(); });
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001386 if (TC.createThunks(OutputSections))
Peter Smith32980272017-06-16 13:10:08 +00001387 fatal("All non-range thunks should be created in first call");
1388 }
Peter Smith1ec42d92017-03-08 14:06:24 +00001389 }
Peter Smith43e852f2017-06-05 08:51:15 +00001390
Peter Smith1ec42d92017-03-08 14:06:24 +00001391 // Fill other section headers. The dynamic table is finalized
1392 // at the end because some tags like RELSZ depend on result
1393 // of finalizing other sections.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001394 for (OutputSection *Sec : OutputSections)
1395 Sec->finalize<ELFT>();
Peter Smith1ec42d92017-03-08 14:06:24 +00001396
1397 // createThunks may have added local symbols to the static symbol table
George Rimar69b17c32017-05-16 10:04:42 +00001398 applySynthetic({InX::SymTab, InX::ShStrTab, InX::StrTab},
George Rimar49a47f22017-03-16 10:29:44 +00001399 [](SyntheticSection *SS) { SS->postThunkContents(); });
Rui Ueyama84417f82015-12-26 07:50:41 +00001400}
1401
Rui Ueyama84417f82015-12-26 07:50:41 +00001402template <class ELFT> void Writer<ELFT>::addPredefinedSections() {
Rui Ueyamadec4ab02017-02-16 04:19:03 +00001403 // ARM ABI requires .ARM.exidx to be terminated by some piece of data.
1404 // We have the terminater synthetic section class. Add that at the end.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001405 OutputSection *Cmd = findSection(".ARM.exidx");
1406 if (!Cmd || !Cmd->Live || Config->Relocatable)
Peter Smith626c9972017-05-30 11:51:02 +00001407 return;
1408
1409 auto *Sentinel = make<ARMExidxSentinelSection>();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001410 Cmd->addSection(Sentinel);
Rafael Espindolaabad6182015-08-13 15:23:46 +00001411}
1412
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001413// The linker is expected to define SECNAME_start and SECNAME_end
1414// symbols for a few sections. This function defines them.
1415template <class ELFT> void Writer<ELFT>::addStartEndSymbols() {
Rafael Espindola24e6f362017-02-24 15:07:30 +00001416 auto Define = [&](StringRef Start, StringRef End, OutputSection *OS) {
Peter Collingbourne0fab40b2016-10-24 20:46:21 +00001417 // These symbols resolve to the image base if the section does not exist.
Rui Ueyama4f2f50d2016-12-21 08:40:09 +00001418 // A special value -1 indicates end of the section.
Peter Collingbournef8435a92017-03-13 16:40:20 +00001419 if (OS) {
1420 addOptionalRegular<ELFT>(Start, OS, 0);
1421 addOptionalRegular<ELFT>(End, OS, -1);
1422 } else {
Rui Ueyamad57e74b72017-03-17 23:29:01 +00001423 if (Config->Pic)
Peter Collingbournef8435a92017-03-13 16:40:20 +00001424 OS = Out::ElfHeader;
1425 addOptionalRegular<ELFT>(Start, OS, 0);
1426 addOptionalRegular<ELFT>(End, OS, 0);
1427 }
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001428 };
1429
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001430 Define("__preinit_array_start", "__preinit_array_end", Out::PreinitArray);
1431 Define("__init_array_start", "__init_array_end", Out::InitArray);
1432 Define("__fini_array_start", "__fini_array_end", Out::FiniArray);
Peter Smith17cd3752016-10-27 10:28:53 +00001433
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001434 if (OutputSection *Sec = findSection(".ARM.exidx"))
Peter Smith17cd3752016-10-27 10:28:53 +00001435 Define("__exidx_start", "__exidx_end", Sec);
Rui Ueyamaa5d79d12015-12-26 09:48:00 +00001436}
1437
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001438// If a section name is valid as a C identifier (which is rare because of
1439// the leading '.'), linkers are expected to define __start_<secname> and
1440// __stop_<secname> symbols. They are at beginning and end of the section,
1441// respectively. This is not requested by the ELF standard, but GNU ld and
1442// gold provide the feature, and used by many programs.
1443template <class ELFT>
Rafael Espindola24e6f362017-02-24 15:07:30 +00001444void Writer<ELFT>::addStartStopSymbols(OutputSection *Sec) {
Rafael Espindola40849412017-02-24 14:28:00 +00001445 StringRef S = Sec->Name;
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001446 if (!isValidCIdentifier(S))
1447 return;
Rafael Espindola5616adf2017-03-08 22:36:28 +00001448 addOptionalRegular<ELFT>(Saver.save("__start_" + S), Sec, 0, STV_DEFAULT);
1449 addOptionalRegular<ELFT>(Saver.save("__stop_" + S), Sec, -1, STV_DEFAULT);
Rui Ueyamad9189ce2015-10-15 17:11:03 +00001450}
1451
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001452template <class ELFT> OutputSection *Writer<ELFT>::findSection(StringRef Name) {
Rafael Espindola1eb3a0f2017-07-04 18:26:21 +00001453 for (BaseCommand *Base : Script->Opt.Commands)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001454 if (auto *Sec = dyn_cast<OutputSection>(Base))
1455 if (Sec->Name == Name)
1456 return Sec;
Rafael Espindola43e76cd2017-05-26 17:48:27 +00001457 return nullptr;
1458}
1459
George Rimar7702bc22017-03-16 11:20:02 +00001460static bool needsPtLoad(OutputSection *Sec) {
Rafael Espindola04a2e342016-11-09 01:42:41 +00001461 if (!(Sec->Flags & SHF_ALLOC))
Rafael Espindolaef762f22016-02-10 23:29:38 +00001462 return false;
1463
1464 // Don't allocate VA space for TLS NOBITS sections. The PT_TLS PHDR is
1465 // responsible for allocating space for them, not the PT_LOAD that
1466 // contains the TLS initialization image.
Rafael Espindola04a2e342016-11-09 01:42:41 +00001467 if (Sec->Flags & SHF_TLS && Sec->Type == SHT_NOBITS)
Rafael Espindolaef762f22016-02-10 23:29:38 +00001468 return false;
1469 return true;
Michael J. Spencer1d299a82015-09-09 20:48:09 +00001470}
1471
Rafael Espindolab45fd702016-09-20 15:22:27 +00001472// Linker scripts are responsible for aligning addresses. Unfortunately, most
1473// linker scripts are designed for creating two PT_LOADs only, one RX and one
1474// RW. This means that there is no alignment in the RO to RX transition and we
1475// cannot create a PT_LOAD there.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001476static uint64_t computeFlags(uint64_t Flags) {
Rui Ueyamaa37ace8d2017-02-25 01:52:03 +00001477 if (Config->Omagic)
George Rimar595a7632016-11-29 09:43:51 +00001478 return PF_R | PF_W | PF_X;
Rui Ueyama6bd38222017-04-05 21:37:09 +00001479 if (Config->SingleRoRx && !(Flags & PF_W))
1480 return Flags | PF_X;
1481 return Flags;
Rafael Espindolab45fd702016-09-20 15:22:27 +00001482}
1483
Rafael Espindola4fc60442016-02-10 22:43:13 +00001484// Decide which program headers to create and which sections to include in each
1485// one.
George Rimaraa354182017-07-27 07:46:50 +00001486template <class ELFT> std::vector<PhdrEntry *> Writer<ELFT>::createPhdrs() {
1487 std::vector<PhdrEntry *> Ret;
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001488 auto AddHdr = [&](unsigned Type, unsigned Flags) -> PhdrEntry * {
George Rimaraa354182017-07-27 07:46:50 +00001489 Ret.push_back(make<PhdrEntry>(Type, Flags));
1490 return Ret.back();
Rafael Espindola4fc60442016-02-10 22:43:13 +00001491 };
George Rimare3336c02015-11-24 10:15:50 +00001492
Rui Ueyama803195e2015-10-23 21:45:59 +00001493 // The first phdr entry is PT_PHDR which describes the program header itself.
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001494 AddHdr(PT_PHDR, PF_R)->add(Out::ProgramHeaders);
Rui Ueyama953c2c42015-10-10 23:59:57 +00001495
Rui Ueyama803195e2015-10-23 21:45:59 +00001496 // PT_INTERP must be the second entry if exists.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001497 if (OutputSection *Cmd = findSection(".interp"))
1498 AddHdr(PT_INTERP, Cmd->getPhdrFlags())->add(Cmd);
Rafael Espindola70107762015-09-11 18:49:42 +00001499
Rui Ueyama803195e2015-10-23 21:45:59 +00001500 // Add the first PT_LOAD segment for regular output sections.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001501 uint64_t Flags = computeFlags(PF_R);
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001502 PhdrEntry *Load = AddHdr(PT_LOAD, Flags);
Rafael Espindola02ed7572017-05-04 19:34:17 +00001503
1504 // Add the headers. We will remove them if they don't fit.
1505 Load->add(Out::ElfHeader);
1506 Load->add(Out::ProgramHeaders);
1507
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001508 for (OutputSection *Sec : OutputSections) {
Rafael Espindola04a2e342016-11-09 01:42:41 +00001509 if (!(Sec->Flags & SHF_ALLOC))
Rafael Espindolaaab6d5c2016-09-16 21:29:07 +00001510 break;
George Rimar7702bc22017-03-16 11:20:02 +00001511 if (!needsPtLoad(Sec))
Rafael Espindolaef762f22016-02-10 23:29:38 +00001512 continue;
1513
George Rimar8ceadb32016-08-17 07:44:19 +00001514 // Segments are contiguous memory regions that has the same attributes
1515 // (e.g. executable or writable). There is one phdr for each segment.
1516 // Therefore, we need to create a new phdr when the next section has
1517 // different flags or is loaded at a discontiguous address using AT linker
1518 // script command.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001519 uint64_t NewFlags = computeFlags(Sec->getPhdrFlags());
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001520 if (Sec->LMAExpr || Flags != NewFlags) {
Rafael Espindolae090fb22016-03-09 21:37:22 +00001521 Load = AddHdr(PT_LOAD, NewFlags);
Rafael Espindola4fc60442016-02-10 22:43:13 +00001522 Flags = NewFlags;
1523 }
Michael J. Spencer78aa1de2015-11-03 00:34:39 +00001524
Rui Ueyama18f084f2016-07-20 19:36:41 +00001525 Load->add(Sec);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001526 }
Rafael Espindola6b83b902015-08-12 00:00:24 +00001527
Rui Ueyamadb00b612017-02-01 22:42:17 +00001528 // Add a TLS segment if any.
George Rimaraa354182017-07-27 07:46:50 +00001529 PhdrEntry *TlsHdr = make<PhdrEntry>(PT_TLS, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001530 for (OutputSection *Sec : OutputSections)
Rui Ueyamadb00b612017-02-01 22:42:17 +00001531 if (Sec->Flags & SHF_TLS)
George Rimaraa354182017-07-27 07:46:50 +00001532 TlsHdr->add(Sec);
George Rimar6823c5f2017-09-07 11:01:10 +00001533 if (TlsHdr->FirstSec)
George Rimaraa354182017-07-27 07:46:50 +00001534 Ret.push_back(TlsHdr);
Michael J. Spencer78aa1de2015-11-03 00:34:39 +00001535
Rui Ueyama803195e2015-10-23 21:45:59 +00001536 // Add an entry for .dynamic.
George Rimar69b17c32017-05-16 10:04:42 +00001537 if (InX::DynSymTab)
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001538 AddHdr(PT_DYNAMIC, InX::Dynamic->getParent()->getPhdrFlags())
1539 ->add(InX::Dynamic->getParent());
Rafael Espindola91009b32015-08-12 01:45:28 +00001540
Rafael Espindola4fc60442016-02-10 22:43:13 +00001541 // PT_GNU_RELRO includes all sections that should be marked as
1542 // read-only by dynamic linker after proccessing relocations.
George Rimaraa354182017-07-27 07:46:50 +00001543 PhdrEntry *RelRo = make<PhdrEntry>(PT_GNU_RELRO, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001544 for (OutputSection *Sec : OutputSections)
Rafael Espindola9e889eb2017-05-11 23:31:06 +00001545 if (needsPtLoad(Sec) && isRelroSection(Sec))
George Rimaraa354182017-07-27 07:46:50 +00001546 RelRo->add(Sec);
George Rimar6823c5f2017-09-07 11:01:10 +00001547 if (RelRo->FirstSec)
George Rimaraa354182017-07-27 07:46:50 +00001548 Ret.push_back(RelRo);
George Rimare3336c02015-11-24 10:15:50 +00001549
Rafael Espindola4fc60442016-02-10 22:43:13 +00001550 // PT_GNU_EH_FRAME is a special section pointing on .eh_frame_hdr.
Eugene Leviant30c1b432017-03-14 08:49:09 +00001551 if (!In<ELFT>::EhFrame->empty() && In<ELFT>::EhFrameHdr &&
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001552 In<ELFT>::EhFrame->getParent() && In<ELFT>::EhFrameHdr->getParent())
1553 AddHdr(PT_GNU_EH_FRAME, In<ELFT>::EhFrameHdr->getParent()->getPhdrFlags())
1554 ->add(In<ELFT>::EhFrameHdr->getParent());
George Rimarf6bc65a2016-01-15 13:34:52 +00001555
Rui Ueyama81cb7102017-03-24 00:15:57 +00001556 // PT_OPENBSD_RANDOMIZE is an OpenBSD-specific feature. That makes
1557 // the dynamic linker fill the segment with random data.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001558 if (OutputSection *Cmd = findSection(".openbsd.randomdata"))
1559 AddHdr(PT_OPENBSD_RANDOMIZE, Cmd->getPhdrFlags())->add(Cmd);
George Rimar270173f2016-10-14 13:02:22 +00001560
Rui Ueyamae79b09a2015-11-21 22:19:32 +00001561 // PT_GNU_STACK is a special section to tell the loader to make the
Rui Ueyamaa7e87252017-02-23 08:09:51 +00001562 // pages for the stack non-executable. If you really want an executable
1563 // stack, you can pass -z execstack, but that's not recommended for
1564 // security reasons.
1565 unsigned Perm;
1566 if (Config->ZExecstack)
1567 Perm = PF_R | PF_W | PF_X;
1568 else
1569 Perm = PF_R | PF_W;
1570 AddHdr(PT_GNU_STACK, Perm)->p_memsz = Config->ZStackSize;
Rafael Espindola9907eb02016-03-01 13:23:29 +00001571
George Rimarcc6e5672016-10-14 10:34:36 +00001572 // PT_OPENBSD_WXNEEDED is a OpenBSD-specific header to mark the executable
1573 // is expected to perform W^X violations, such as calling mprotect(2) or
1574 // mmap(2) with PROT_WRITE | PROT_EXEC, which is prohibited by default on
1575 // OpenBSD.
1576 if (Config->ZWxneeded)
1577 AddHdr(PT_OPENBSD_WXNEEDED, PF_X);
1578
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001579 // Create one PT_NOTE per a group of contiguous .note sections.
1580 PhdrEntry *Note = nullptr;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001581 for (OutputSection *Sec : OutputSections) {
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001582 if (Sec->Type == SHT_NOTE) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001583 if (!Note || Sec->LMAExpr)
Petr Hosek4d65ef3b2017-02-01 20:58:41 +00001584 Note = AddHdr(PT_NOTE, PF_R);
1585 Note->add(Sec);
1586 } else {
1587 Note = nullptr;
1588 }
1589 }
Rui Ueyama703296a2016-07-20 19:36:39 +00001590 return Ret;
Rafael Espindola4fc60442016-02-10 22:43:13 +00001591}
1592
Rafael Espindola8e670002016-11-28 00:40:21 +00001593template <class ELFT>
George Rimaraa354182017-07-27 07:46:50 +00001594void Writer<ELFT>::addPtArmExid(std::vector<PhdrEntry *> &Phdrs) {
Rafael Espindola8e670002016-11-28 00:40:21 +00001595 if (Config->EMachine != EM_ARM)
1596 return;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001597 auto I = llvm::find_if(OutputSections, [](OutputSection *Cmd) {
1598 return Cmd->Type == SHT_ARM_EXIDX;
George Rimara951d5c2017-07-04 13:10:37 +00001599 });
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001600 if (I == OutputSections.end())
Rafael Espindola8e670002016-11-28 00:40:21 +00001601 return;
1602
1603 // PT_ARM_EXIDX is the ARM EHABI equivalent of PT_GNU_EH_FRAME
George Rimaraa354182017-07-27 07:46:50 +00001604 PhdrEntry *ARMExidx = make<PhdrEntry>(PT_ARM_EXIDX, PF_R);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001605 ARMExidx->add(*I);
Rafael Espindola8e670002016-11-28 00:40:21 +00001606 Phdrs.push_back(ARMExidx);
1607}
1608
Peter Collingbourne628ec9f2017-01-10 01:21:30 +00001609// The first section of each PT_LOAD, the first section in PT_GNU_RELRO and the
1610// first section after PT_GNU_RELRO have to be page aligned so that the dynamic
1611// linker can set the permissions.
Rui Ueyama47091902016-03-30 19:41:51 +00001612template <class ELFT> void Writer<ELFT>::fixSectionAlignments() {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001613 auto PageAlign = [](OutputSection *Cmd) {
Rafael Espindola0f7dc0e2017-06-02 01:37:58 +00001614 if (Cmd && !Cmd->AddrExpr)
1615 Cmd->AddrExpr = [=] {
1616 return alignTo(Script->getDot(), Config->MaxPageSize);
1617 };
1618 };
1619
George Rimaraa354182017-07-27 07:46:50 +00001620 for (const PhdrEntry *P : Phdrs)
George Rimar6823c5f2017-09-07 11:01:10 +00001621 if (P->p_type == PT_LOAD && P->FirstSec)
1622 PageAlign(P->FirstSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001623
George Rimaraa354182017-07-27 07:46:50 +00001624 for (const PhdrEntry *P : Phdrs) {
1625 if (P->p_type != PT_GNU_RELRO)
Rui Ueyama47091902016-03-30 19:41:51 +00001626 continue;
George Rimar6823c5f2017-09-07 11:01:10 +00001627 if (P->FirstSec)
1628 PageAlign(P->FirstSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001629 // Find the first section after PT_GNU_RELRO. If it is in a PT_LOAD we
1630 // have to align it to a page.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001631 auto End = OutputSections.end();
George Rimar6823c5f2017-09-07 11:01:10 +00001632 auto I = std::find(OutputSections.begin(), End, P->LastSec);
Rui Ueyama47091902016-03-30 19:41:51 +00001633 if (I == End || (I + 1) == End)
1634 continue;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001635 OutputSection *Cmd = (*(I + 1));
1636 if (needsPtLoad(Cmd))
1637 PageAlign(Cmd);
Rui Ueyama47091902016-03-30 19:41:51 +00001638 }
1639}
1640
George Rimar5f857322016-04-27 09:16:28 +00001641// Adjusts the file alignment for a given output section and returns
1642// its new file offset. The file offset must be the same with its
1643// virtual address (modulo the page size) so that the loader can load
1644// executables without any address adjustment.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001645static uint64_t getFileAlignment(uint64_t Off, OutputSection *Cmd) {
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001646 // If the section is not in a PT_LOAD, we just have to align it.
George Rimar582ede82017-09-07 10:53:07 +00001647 if (!Cmd->PtLoad)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001648 return alignTo(Off, Cmd->Alignment);
Eugene Leviant3d9abec2016-09-29 09:20:33 +00001649
George Rimar6823c5f2017-09-07 11:01:10 +00001650 OutputSection *First = Cmd->PtLoad->FirstSec;
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001651 // The first section in a PT_LOAD has to have congruent offset and address
1652 // module the page size.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001653 if (Cmd == First)
1654 return alignTo(Off, std::max<uint64_t>(Cmd->Alignment, Config->MaxPageSize),
1655 Cmd->Addr);
Rafael Espindola8b8f74f2016-12-07 20:20:39 +00001656
1657 // If two sections share the same PT_LOAD the file offset is calculated
1658 // using this formula: Off2 = Off1 + (VA2 - VA1).
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001659 return First->Offset + Cmd->Addr - First->Addr;
George Rimar5f857322016-04-27 09:16:28 +00001660}
1661
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001662static uint64_t setOffset(OutputSection *Cmd, uint64_t Off) {
1663 if (Cmd->Type == SHT_NOBITS) {
1664 Cmd->Offset = Off;
Rui Ueyama35723f02017-02-14 23:35:42 +00001665 return Off;
George Rimar86ce2672016-08-25 09:05:47 +00001666 }
1667
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001668 Off = getFileAlignment(Off, Cmd);
1669 Cmd->Offset = Off;
1670 return Off + Cmd->Size;
George Rimar86ce2672016-08-25 09:05:47 +00001671}
1672
1673template <class ELFT> void Writer<ELFT>::assignFileOffsetsBinary() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001674 uint64_t Off = 0;
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001675 for (OutputSection *Sec : OutputSections)
Rafael Espindola04a2e342016-11-09 01:42:41 +00001676 if (Sec->Flags & SHF_ALLOC)
Rui Ueyama6bd38222017-04-05 21:37:09 +00001677 Off = setOffset(Sec, Off);
1678 FileSize = alignTo(Off, Config->Wordsize);
George Rimar86ce2672016-08-25 09:05:47 +00001679}
1680
Rui Ueyamae044e9c2016-04-01 17:07:17 +00001681// Assign file offsets to output sections.
1682template <class ELFT> void Writer<ELFT>::assignFileOffsets() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001683 uint64_t Off = 0;
1684 Off = setOffset(Out::ElfHeader, Off);
1685 Off = setOffset(Out::ProgramHeaders, Off);
George Rimar7ca06272016-04-06 07:20:45 +00001686
Petr Hosekedd6c352017-08-02 16:35:00 +00001687 PhdrEntry *LastRX = nullptr;
1688 for (PhdrEntry *P : Phdrs)
1689 if (P->p_type == PT_LOAD && (P->p_flags & PF_X))
1690 LastRX = P;
1691
1692 for (OutputSection *Sec : OutputSections) {
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001693 Off = setOffset(Sec, Off);
Petr Hosekedd6c352017-08-02 16:35:00 +00001694 if (Script->Opt.HasSections)
1695 continue;
1696 // If this is a last section of the last executable segment and that
1697 // segment is the last loadable segment, align the offset of the
1698 // following section to avoid loading non-segments parts of the file.
George Rimar6823c5f2017-09-07 11:01:10 +00001699 if (LastRX && LastRX->LastSec == Sec)
Petr Hosekedd6c352017-08-02 16:35:00 +00001700 Off = alignTo(Off, Target->PageSize);
1701 }
Eugene Leviant467c4d52016-07-01 10:27:36 +00001702
Rui Ueyama6bd38222017-04-05 21:37:09 +00001703 SectionHeaderOff = alignTo(Off, Config->Wordsize);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001704 FileSize = SectionHeaderOff + (OutputSections.size() + 1) * sizeof(Elf_Shdr);
Rui Ueyamae044e9c2016-04-01 17:07:17 +00001705}
1706
1707// Finalize the program headers. We call this function after we assign
1708// file offsets and VAs to all sections.
1709template <class ELFT> void Writer<ELFT>::setPhdrs() {
George Rimaraa354182017-07-27 07:46:50 +00001710 for (PhdrEntry *P : Phdrs) {
George Rimar6823c5f2017-09-07 11:01:10 +00001711 OutputSection *First = P->FirstSec;
1712 OutputSection *Last = P->LastSec;
Rui Ueyamae8a45e42016-04-01 22:42:04 +00001713 if (First) {
George Rimaraa354182017-07-27 07:46:50 +00001714 P->p_filesz = Last->Offset - First->Offset;
Rafael Espindola04a2e342016-11-09 01:42:41 +00001715 if (Last->Type != SHT_NOBITS)
George Rimaraa354182017-07-27 07:46:50 +00001716 P->p_filesz += Last->Size;
1717 P->p_memsz = Last->Addr + Last->Size - First->Addr;
1718 P->p_offset = First->Offset;
1719 P->p_vaddr = First->Addr;
1720 if (!P->HasLMA)
1721 P->p_paddr = First->getLMA();
Rafael Espindola4fc60442016-02-10 22:43:13 +00001722 }
George Rimaraa354182017-07-27 07:46:50 +00001723 if (P->p_type == PT_LOAD)
1724 P->p_align = std::max<uint64_t>(P->p_align, Config->MaxPageSize);
1725 else if (P->p_type == PT_GNU_RELRO) {
1726 P->p_align = 1;
Peter Collingbourne7b5088b2017-01-04 18:56:15 +00001727 // The glibc dynamic loader rounds the size down, so we need to round up
1728 // to protect the last page. This is a no-op on FreeBSD which always
1729 // rounds up.
George Rimaraa354182017-07-27 07:46:50 +00001730 P->p_memsz = alignTo(P->p_memsz, Target->PageSize);
Peter Collingbourne7b5088b2017-01-04 18:56:15 +00001731 }
George Rimar8ceadb32016-08-17 07:44:19 +00001732
Rafael Espindola4fc60442016-02-10 22:43:13 +00001733 // The TLS pointer goes after PT_TLS. At least glibc will align it,
1734 // so round up the size to make sure the offsets are correct.
George Rimaraa354182017-07-27 07:46:50 +00001735 if (P->p_type == PT_TLS) {
1736 Out::TlsPhdr = P;
1737 if (P->p_memsz)
1738 P->p_memsz = alignTo(P->p_memsz, P->p_align);
Rui Ueyama803195e2015-10-23 21:45:59 +00001739 }
1740 }
Michael J. Spencer84487f12015-07-24 21:03:07 +00001741}
1742
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001743// The entry point address is chosen in the following ways.
1744//
1745// 1. the '-e' entry command-line option;
1746// 2. the ENTRY(symbol) command in a linker control script;
1747// 3. the value of the symbol start, if present;
1748// 4. the address of the first byte of the .text section, if present;
1749// 5. the address 0.
Rui Ueyama6bd38222017-04-05 21:37:09 +00001750template <class ELFT> uint64_t Writer<ELFT>::getEntryAddr() {
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001751 // Case 1, 2 or 3. As a special case, if the symbol is actually
1752 // a number, we'll use that number as an address.
Rafael Espindola244ef982017-07-26 18:42:48 +00001753 if (SymbolBody *B = Symtab->find(Config->Entry))
George Rimarf64618a2017-03-17 11:56:54 +00001754 return B->getVA();
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001755 uint64_t Addr;
George Rimarab947682017-05-16 08:19:25 +00001756 if (to_integer(Config->Entry, Addr))
Rui Ueyamaa1407c42016-12-07 03:23:06 +00001757 return Addr;
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001758
1759 // Case 4
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001760 if (OutputSection *Sec = findSection(".text")) {
Rui Ueyama9e5f5ef2016-12-07 04:06:21 +00001761 if (Config->WarnMissingEntry)
Petr Hosek2f50fef2016-12-07 02:26:16 +00001762 warn("cannot find entry symbol " + Config->Entry + "; defaulting to 0x" +
1763 utohexstr(Sec->Addr));
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001764 return Sec->Addr;
1765 }
1766
1767 // Case 5
Rui Ueyama9e5f5ef2016-12-07 04:06:21 +00001768 if (Config->WarnMissingEntry)
Petr Hosek2f50fef2016-12-07 02:26:16 +00001769 warn("cannot find entry symbol " + Config->Entry +
1770 "; not setting start address");
Rui Ueyama8da7aa02016-10-20 00:07:36 +00001771 return 0;
Rui Ueyama3bfaba92015-12-24 08:37:34 +00001772}
1773
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001774static uint16_t getELFType() {
Rui Ueyamad57e74b72017-03-17 23:29:01 +00001775 if (Config->Pic)
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001776 return ET_DYN;
1777 if (Config->Relocatable)
1778 return ET_REL;
1779 return ET_EXEC;
1780}
1781
Michael J. Spencer84487f12015-07-24 21:03:07 +00001782template <class ELFT> void Writer<ELFT>::writeHeader() {
1783 uint8_t *Buf = Buffer->getBufferStart();
Rui Ueyamae08cd672015-10-23 22:44:39 +00001784 memcpy(Buf, "\177ELF", 4);
1785
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001786 // Write the ELF header.
Rafael Espindola18608a02015-09-08 21:57:31 +00001787 auto *EHdr = reinterpret_cast<Elf_Ehdr *>(Buf);
Rui Ueyamaf2dc4362017-04-05 21:08:47 +00001788 EHdr->e_ident[EI_CLASS] = Config->Is64 ? ELFCLASS64 : ELFCLASS32;
1789 EHdr->e_ident[EI_DATA] = Config->IsLE ? ELFDATA2LSB : ELFDATA2MSB;
Michael J. Spencer84487f12015-07-24 21:03:07 +00001790 EHdr->e_ident[EI_VERSION] = EV_CURRENT;
Rafael Espindola7cc713a2016-10-27 14:00:51 +00001791 EHdr->e_ident[EI_OSABI] = Config->OSABI;
Rui Ueyama4cea4e82016-02-25 19:28:37 +00001792 EHdr->e_type = getELFType();
Rafael Espindola7cc713a2016-10-27 14:00:51 +00001793 EHdr->e_machine = Config->EMachine;
Michael J. Spencer84487f12015-07-24 21:03:07 +00001794 EHdr->e_version = EV_CURRENT;
Rui Ueyama2eda6d12016-11-23 22:41:00 +00001795 EHdr->e_entry = getEntryAddr();
Michael J. Spencer8039dae22015-07-29 00:30:10 +00001796 EHdr->e_shoff = SectionHeaderOff;
Rafael Espindola18608a02015-09-08 21:57:31 +00001797 EHdr->e_ehsize = sizeof(Elf_Ehdr);
Rui Ueyama2f1b79f2015-10-10 22:34:30 +00001798 EHdr->e_phnum = Phdrs.size();
Rafael Espindola18608a02015-09-08 21:57:31 +00001799 EHdr->e_shentsize = sizeof(Elf_Shdr);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001800 EHdr->e_shnum = OutputSections.size() + 1;
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001801 EHdr->e_shstrndx = InX::ShStrTab->getParent()->SectionIndex;
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001802
Rui Ueyama1e2e8ea2016-09-13 20:51:32 +00001803 if (Config->EMachine == EM_ARM)
1804 // We don't currently use any features incompatible with EF_ARM_EABI_VER5,
1805 // but we don't have any firm guarantees of conformance. Linux AArch64
1806 // kernels (as of 2016) require an EABI version to be set.
1807 EHdr->e_flags = EF_ARM_EABI_VER5;
1808 else if (Config->EMachine == EM_MIPS)
Simon Atanasyan4f90c2f2016-07-20 20:30:41 +00001809 EHdr->e_flags = getMipsEFlags<ELFT>();
Rui Ueyama22b5d1f2016-03-13 19:29:17 +00001810
George Rimar58941ee2016-02-25 08:23:37 +00001811 if (!Config->Relocatable) {
1812 EHdr->e_phoff = sizeof(Elf_Ehdr);
1813 EHdr->e_phentsize = sizeof(Elf_Phdr);
1814 }
1815
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001816 // Write the program header table.
Rafael Espindola4fc60442016-02-10 22:43:13 +00001817 auto *HBuf = reinterpret_cast<Elf_Phdr *>(Buf + EHdr->e_phoff);
George Rimaraa354182017-07-27 07:46:50 +00001818 for (PhdrEntry *P : Phdrs) {
1819 HBuf->p_type = P->p_type;
1820 HBuf->p_flags = P->p_flags;
1821 HBuf->p_offset = P->p_offset;
1822 HBuf->p_vaddr = P->p_vaddr;
1823 HBuf->p_paddr = P->p_paddr;
1824 HBuf->p_filesz = P->p_filesz;
1825 HBuf->p_memsz = P->p_memsz;
1826 HBuf->p_align = P->p_align;
Rafael Espindola17cb7c02016-12-19 17:01:01 +00001827 ++HBuf;
1828 }
Rafael Espindolae438e072015-09-08 22:55:28 +00001829
Rui Ueyama6621d8e2015-10-24 17:57:40 +00001830 // Write the section header table. Note that the first table entry is null.
Rui Ueyamaad59b652016-02-25 23:58:21 +00001831 auto *SHdrs = reinterpret_cast<Elf_Shdr *>(Buf + EHdr->e_shoff);
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001832 for (OutputSection *Sec : OutputSections)
1833 Sec->writeHeaderTo<ELFT>(++SHdrs);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001834}
1835
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001836// Open a result file.
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001837template <class ELFT> void Writer<ELFT>::openFile() {
Rui Ueyama6bd38222017-04-05 21:37:09 +00001838 if (!Config->Is64 && FileSize > UINT32_MAX) {
1839 error("output file too large: " + Twine(FileSize) + " bytes");
1840 return;
1841 }
1842
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001843 unlinkAsync(Config->OutputFile);
Rafael Espindolabdc8f2f2015-08-13 00:31:46 +00001844 ErrorOr<std::unique_ptr<FileOutputBuffer>> BufferOrErr =
Rui Ueyamacbe39262016-02-02 22:48:04 +00001845 FileOutputBuffer::create(Config->OutputFile, FileSize,
1846 FileOutputBuffer::F_executable);
Rui Ueyama6d12eae2016-12-05 17:40:37 +00001847
Rui Ueyamaaa2db882016-07-15 01:38:54 +00001848 if (auto EC = BufferOrErr.getError())
Rui Ueyamac8d3a832017-01-12 22:18:04 +00001849 error("failed to open " + Config->OutputFile + ": " + EC.message());
Rui Ueyamaf7f52ef2016-04-01 17:24:19 +00001850 else
Rui Ueyamaaa2db882016-07-15 01:38:54 +00001851 Buffer = std::move(*BufferOrErr);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001852}
1853
George Rimar86ce2672016-08-25 09:05:47 +00001854template <class ELFT> void Writer<ELFT>::writeSectionsBinary() {
1855 uint8_t *Buf = Buffer->getBufferStart();
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001856 for (OutputSection *Sec : OutputSections)
Rafael Espindola04a2e342016-11-09 01:42:41 +00001857 if (Sec->Flags & SHF_ALLOC)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001858 Sec->writeTo<ELFT>(Buf + Sec->Offset);
George Rimar86ce2672016-08-25 09:05:47 +00001859}
1860
Rui Ueyama6238ed22017-08-14 21:18:12 +00001861static void fillTrap(uint8_t *I, uint8_t *End) {
George Rimarf7ef2a12017-08-21 08:31:14 +00001862 for (; I + 4 <= End; I += 4)
Petr Hosekedd6c352017-08-02 16:35:00 +00001863 memcpy(I, &Target->TrapInstr, 4);
1864}
1865
Rui Ueyama6238ed22017-08-14 21:18:12 +00001866// Fill the last page of executable segments with trap instructions
1867// instead of leaving them as zero. Even though it is not required by any
1868// standard, it is in general a good thing to do for security reasons.
1869//
1870// We'll leave other pages in segments as-is because the rest will be
1871// overwritten by output sections.
Petr Hosekedd6c352017-08-02 16:35:00 +00001872template <class ELFT> void Writer<ELFT>::writeTrapInstr() {
1873 if (Script->Opt.HasSections)
1874 return;
1875
Rui Ueyama6238ed22017-08-14 21:18:12 +00001876 // Fill the last page.
Petr Hosekedd6c352017-08-02 16:35:00 +00001877 uint8_t *Buf = Buffer->getBufferStart();
Rui Ueyama6238ed22017-08-14 21:18:12 +00001878 for (PhdrEntry *P : Phdrs)
1879 if (P->p_type == PT_LOAD && (P->p_flags & PF_X))
1880 fillTrap(Buf + alignDown(P->p_offset + P->p_filesz, Target->PageSize),
1881 Buf + alignTo(P->p_offset + P->p_filesz, Target->PageSize));
Petr Hosekedd6c352017-08-02 16:35:00 +00001882
Rui Ueyama6238ed22017-08-14 21:18:12 +00001883 // Round up the file size of the last segment to the page boundary iff it is
1884 // an executable segment to ensure that other other tools don't accidentally
1885 // trim the instruction padding (e.g. when stripping the file).
Petr Hosekedd6c352017-08-02 16:35:00 +00001886 PhdrEntry *LastRX = nullptr;
1887 for (PhdrEntry *P : Phdrs) {
1888 if (P->p_type != PT_LOAD)
1889 continue;
1890 if (P->p_flags & PF_X)
1891 LastRX = P;
1892 else
1893 LastRX = nullptr;
1894 }
Petr Hosekedd6c352017-08-02 16:35:00 +00001895 if (LastRX)
Petr Hosek7ab9f7b2017-09-01 21:48:20 +00001896 LastRX->p_memsz = LastRX->p_filesz =
1897 alignTo(LastRX->p_filesz, Target->PageSize);
Petr Hosekedd6c352017-08-02 16:35:00 +00001898}
1899
Michael J. Spencer84487f12015-07-24 21:03:07 +00001900// Write section contents to a mmap'ed file.
1901template <class ELFT> void Writer<ELFT>::writeSections() {
1902 uint8_t *Buf = Buffer->getBufferStart();
Hal Finkeldaedc122015-10-12 23:16:53 +00001903
Rui Ueyama75118252016-08-09 01:35:37 +00001904 // PPC64 needs to process relocations in the .opd section
1905 // before processing relocations in code-containing sections.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001906 if (auto *OpdCmd = findSection(".opd")) {
1907 Out::Opd = OpdCmd;
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001908 Out::OpdBuf = Buf + Out::Opd->Offset;
Rafael Espindola55b169b2017-05-24 18:08:04 +00001909 OpdCmd->template writeTo<ELFT>(Buf + Out::Opd->Offset);
Rafael Espindola7a513052015-10-13 14:45:51 +00001910 }
Hal Finkeldaedc122015-10-12 23:16:53 +00001911
Rafael Espindola24e6f362017-02-24 15:07:30 +00001912 OutputSection *EhFrameHdr =
Rafael Espindola881cc162017-05-26 17:28:17 +00001913 (In<ELFT>::EhFrameHdr && !In<ELFT>::EhFrameHdr->empty())
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001914 ? In<ELFT>::EhFrameHdr->getParent()
Rafael Espindola881cc162017-05-26 17:28:17 +00001915 : nullptr;
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001916
1917 // In -r or -emit-relocs mode, write the relocation sections first as in
1918 // ELf_Rel targets we might find out that we need to modify the relocated
1919 // section while doing it.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001920 for (OutputSection *Sec : OutputSections)
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001921 if (Sec->Type == SHT_REL || Sec->Type == SHT_RELA)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001922 Sec->writeTo<ELFT>(Buf + Sec->Offset);
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001923
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001924 for (OutputSection *Sec : OutputSections)
Rui Ueyama9d1bacb12017-02-27 02:31:26 +00001925 if (Sec != Out::Opd && Sec != EhFrameHdr && Sec->Type != SHT_REL &&
Rafael Espindola08d6a3f2017-02-11 01:40:49 +00001926 Sec->Type != SHT_RELA)
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001927 Sec->writeTo<ELFT>(Buf + Sec->Offset);
Eugene Leviante4f590f2016-08-31 07:43:50 +00001928
1929 // The .eh_frame_hdr depends on .eh_frame section contents, therefore
1930 // it should be written after .eh_frame is written.
Rafael Espindola8c022ca2017-07-27 19:22:43 +00001931 if (EhFrameHdr)
1932 EhFrameHdr->writeTo<ELFT>(Buf + EhFrameHdr->Offset);
Michael J. Spencer84487f12015-07-24 21:03:07 +00001933}
Rui Ueyama3ce825e2015-10-09 21:07:25 +00001934
Rui Ueyama634ddf02016-03-11 20:51:53 +00001935template <class ELFT> void Writer<ELFT>::writeBuildId() {
Rafael Espindoladb5e56f2017-05-31 20:17:44 +00001936 if (!InX::BuildId || !InX::BuildId->getParent())
Rui Ueyama634ddf02016-03-11 20:51:53 +00001937 return;
1938
Petr Hosekfdfcb792016-09-01 22:43:03 +00001939 // Compute a hash of all sections of the output file.
Rui Ueyama634ddf02016-03-11 20:51:53 +00001940 uint8_t *Start = Buffer->getBufferStart();
Petr Hosekfdfcb792016-09-01 22:43:03 +00001941 uint8_t *End = Start + FileSize;
Rafael Espindola895aea62017-05-11 22:02:41 +00001942 InX::BuildId->writeBuildId({Start, End});
Rui Ueyama634ddf02016-03-11 20:51:53 +00001943}
1944
Rui Ueyama84907c52016-08-09 03:38:23 +00001945template void elf::writeResult<ELF32LE>();
1946template void elf::writeResult<ELF32BE>();
1947template void elf::writeResult<ELF64LE>();
1948template void elf::writeResult<ELF64BE>();