blob: 57536203a71603f99219040f5ccfc39784d213b6 [file] [log] [blame]
Rui Ueyama717677a2016-02-11 21:17:59 +00001//===- LinkerScript.h -------------------------------------------*- C++ -*-===//
2//
3// The LLVM Linker
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#ifndef LLD_ELF_LINKER_SCRIPT_H
11#define LLD_ELF_LINKER_SCRIPT_H
12
George Rimarbe394db2016-09-16 20:21:55 +000013#include "Config.h"
George Rimarc91930a2016-09-02 21:17:20 +000014#include "Strings.h"
Eugene Leviantbbe38602016-07-19 09:25:43 +000015#include "Writer.h"
Rui Ueyama717677a2016-02-11 21:17:59 +000016#include "lld/Core/LLVM.h"
17#include "llvm/ADT/DenseMap.h"
Rafael Espindolad3190792016-09-16 15:10:23 +000018#include "llvm/ADT/DenseSet.h"
Rui Ueyama717677a2016-02-11 21:17:59 +000019#include "llvm/ADT/MapVector.h"
Rui Ueyamaf9de0d62016-02-11 21:38:55 +000020#include "llvm/Support/Allocator.h"
21#include "llvm/Support/MemoryBuffer.h"
George Rimarc91930a2016-09-02 21:17:20 +000022#include "llvm/Support/Regex.h"
Rui Ueyama708019c2016-07-24 18:19:40 +000023#include <functional>
Rui Ueyama717677a2016-02-11 21:17:59 +000024
25namespace lld {
Rafael Espindolae0df00b2016-02-28 00:25:54 +000026namespace elf {
Rafael Espindolae7553e42016-08-31 13:28:33 +000027class DefinedCommon;
George Rimardbb76db2016-08-18 13:00:49 +000028class ScriptParser;
Rui Ueyama8d083e62016-07-29 05:48:39 +000029class SymbolBody;
Eugene Leviante63d81b2016-07-20 14:43:20 +000030template <class ELFT> class InputSectionBase;
Rafael Espindolad3190792016-09-16 15:10:23 +000031template <class ELFT> class InputSection;
Eugene Leviante63d81b2016-07-20 14:43:20 +000032template <class ELFT> class OutputSectionBase;
33template <class ELFT> class OutputSectionFactory;
Eugene Leviant97403d12016-09-01 09:55:57 +000034class InputSectionData;
Rui Ueyama717677a2016-02-11 21:17:59 +000035
Rui Ueyamab04af132016-10-13 23:08:33 +000036// This represents an expression in the linker script.
37// ScriptParser::readExpr reads an expression and returns an Expr.
38// Later, we evaluate the expression by calling the function
39// with the value of special context variable ".".
Rafael Espindolaf6613932016-10-31 17:43:38 +000040struct Expr {
41 std::function<uint64_t(uint64_t)> Val;
Rafael Espindola2f831dc2016-10-31 19:56:37 +000042 std::function<bool()> IsAbsolute;
Rafael Espindolaf6613932016-10-31 17:43:38 +000043 uint64_t operator()(uint64_t Dot) const { return Val(Dot); }
44 operator bool() const { return (bool)Val; }
45
46 template <typename T>
Rafael Espindola2f831dc2016-10-31 19:56:37 +000047 Expr(T Val, std::function<bool()> IsAbsolute)
48 : Val(Val), IsAbsolute(IsAbsolute) {}
49 template <typename T> Expr(T Val, bool IsAbsolute) : Val(Val) {
50 this->IsAbsolute = [=]() { return IsAbsolute; };
51 }
Rafael Espindolaf6613932016-10-31 17:43:38 +000052 template <typename T> Expr(T V) : Expr(V, false) {}
53 Expr() : Expr(nullptr) {}
54};
Rui Ueyama708019c2016-07-24 18:19:40 +000055
Rui Ueyama07320e42016-04-20 20:13:41 +000056// Parses a linker script. Calling this function updates
57// Config and ScriptConfig.
58void readLinkerScript(MemoryBufferRef MB);
59
Rui Ueyamab04af132016-10-13 23:08:33 +000060// Parses a version script.
George Rimar20b65982016-08-31 09:08:26 +000061void readVersionScript(MemoryBufferRef MB);
62
George Rimareea31142016-07-21 14:26:59 +000063// This enum is used to implement linker script SECTIONS command.
64// https://sourceware.org/binutils/docs/ld/SECTIONS.html#SECTIONS
65enum SectionsCommandKind {
George Rimare38cbab2016-09-26 19:22:50 +000066 AssignmentKind, // . = expr or <sym> = expr
George Rimareea31142016-07-21 14:26:59 +000067 OutputSectionKind,
George Rimareefa7582016-08-04 09:29:31 +000068 InputSectionKind,
George Rimare38cbab2016-09-26 19:22:50 +000069 AssertKind, // ASSERT(expr)
70 BytesDataKind // BYTE(expr), SHORT(expr), LONG(expr) or QUAD(expr)
Rui Ueyama1ebc8ed2016-02-12 21:47:28 +000071};
72
George Rimar076fe152016-07-21 06:43:01 +000073struct BaseCommand {
74 BaseCommand(int K) : Kind(K) {}
75 virtual ~BaseCommand() {}
76 int Kind;
77};
78
Rui Ueyamab04af132016-10-13 23:08:33 +000079// This represents ". = <expr>" or "<symbol> = <expr>".
George Rimar076fe152016-07-21 06:43:01 +000080struct SymbolAssignment : BaseCommand {
Rafael Espindolaf6613932016-10-31 17:43:38 +000081 SymbolAssignment(StringRef Name, Expr E)
82 : BaseCommand(AssignmentKind), Name(Name), Expression(E) {}
George Rimar076fe152016-07-21 06:43:01 +000083 static bool classof(const BaseCommand *C);
Rui Ueyama20204242016-07-29 05:52:33 +000084
85 // The LHS of an expression. Name is either a symbol name or ".".
George Rimar076fe152016-07-21 06:43:01 +000086 StringRef Name;
Rui Ueyama20204242016-07-29 05:52:33 +000087 SymbolBody *Sym = nullptr;
88
89 // The RHS of an expression.
Rui Ueyama708019c2016-07-24 18:19:40 +000090 Expr Expression;
Rui Ueyama20204242016-07-29 05:52:33 +000091
92 // Command attributes for PROVIDE, HIDDEN and PROVIDE_HIDDEN.
Eugene Levianta31c91b2016-07-22 07:38:40 +000093 bool Provide = false;
Eugene Levianta31c91b2016-07-22 07:38:40 +000094 bool Hidden = false;
George Rimar076fe152016-07-21 06:43:01 +000095};
96
Davide Italiano246f6812016-07-22 03:36:24 +000097// Linker scripts allow additional constraints to be put on ouput sections.
Rui Ueyamab04af132016-10-13 23:08:33 +000098// If an output section is marked as ONLY_IF_RO, the section is created
99// only if its input sections are read-only. Likewise, an output section
100// with ONLY_IF_RW is created if all input sections are RW.
Rui Ueyamaefc40662016-07-25 22:00:10 +0000101enum class ConstraintKind { NoConstraint, ReadOnly, ReadWrite };
Davide Italiano246f6812016-07-22 03:36:24 +0000102
George Rimar076fe152016-07-21 06:43:01 +0000103struct OutputSectionCommand : BaseCommand {
104 OutputSectionCommand(StringRef Name)
105 : BaseCommand(OutputSectionKind), Name(Name) {}
106 static bool classof(const BaseCommand *C);
Eugene Levianteda81a12016-07-12 06:39:48 +0000107 StringRef Name;
George Rimar58e5c4d2016-07-25 08:29:46 +0000108 Expr AddrExpr;
George Rimar630c6172016-07-26 18:06:29 +0000109 Expr AlignExpr;
Eugene Leviantb71d6f72016-10-06 09:39:28 +0000110 Expr LMAExpr;
George Rimardb24d9c2016-08-19 15:18:23 +0000111 Expr SubalignExpr;
George Rimareea31142016-07-21 14:26:59 +0000112 std::vector<std::unique_ptr<BaseCommand>> Commands;
Eugene Leviantbbe38602016-07-19 09:25:43 +0000113 std::vector<StringRef> Phdrs;
George Rimar076fe152016-07-21 06:43:01 +0000114 std::vector<uint8_t> Filler;
Rui Ueyamaefc40662016-07-25 22:00:10 +0000115 ConstraintKind Constraint = ConstraintKind::NoConstraint;
Eugene Leviantbbe38602016-07-19 09:25:43 +0000116};
117
George Rimar8034d492016-09-17 07:31:49 +0000118// This struct represents one section match pattern in SECTIONS() command.
Rui Ueyama4dc07be2016-09-17 02:23:40 +0000119// It can optionally have negative match pattern for EXCLUDED_FILE command.
George Rimar07171f22016-09-21 15:56:44 +0000120// Also it may be surrounded with SORT() command, so contains sorting rules.
Rui Ueyama4dc07be2016-09-17 02:23:40 +0000121struct SectionPattern {
Rui Ueyamad1d7cfc2016-09-20 00:02:06 +0000122 SectionPattern(llvm::Regex &&Re1, llvm::Regex &&Re2)
123 : ExcludedFileRe(std::forward<llvm::Regex>(Re1)),
124 SectionRe(std::forward<llvm::Regex>(Re2)) {}
125
126 SectionPattern(SectionPattern &&Other) {
127 std::swap(ExcludedFileRe, Other.ExcludedFileRe);
128 std::swap(SectionRe, Other.SectionRe);
George Rimar07171f22016-09-21 15:56:44 +0000129 std::swap(SortOuter, Other.SortOuter);
130 std::swap(SortInner, Other.SortInner);
Rui Ueyamad1d7cfc2016-09-20 00:02:06 +0000131 }
132
Rui Ueyama4dc07be2016-09-17 02:23:40 +0000133 llvm::Regex ExcludedFileRe;
134 llvm::Regex SectionRe;
George Rimar07171f22016-09-21 15:56:44 +0000135 SortSectionPolicy SortOuter;
136 SortSectionPolicy SortInner;
Rui Ueyama4dc07be2016-09-17 02:23:40 +0000137};
138
George Rimareea31142016-07-21 14:26:59 +0000139struct InputSectionDescription : BaseCommand {
George Rimarc91930a2016-09-02 21:17:20 +0000140 InputSectionDescription(StringRef FilePattern)
141 : BaseCommand(InputSectionKind),
142 FileRe(compileGlobPatterns({FilePattern})) {}
George Rimareea31142016-07-21 14:26:59 +0000143 static bool classof(const BaseCommand *C);
George Rimarc91930a2016-09-02 21:17:20 +0000144 llvm::Regex FileRe;
Rui Ueyama4dc07be2016-09-17 02:23:40 +0000145
George Rimar8034d492016-09-17 07:31:49 +0000146 // Input sections that matches at least one of SectionPatterns
Rui Ueyama70efa2f2016-09-17 02:34:50 +0000147 // will be associated with this InputSectionDescription.
Rui Ueyamad1d7cfc2016-09-20 00:02:06 +0000148 std::vector<SectionPattern> SectionPatterns;
Rui Ueyama4dc07be2016-09-17 02:23:40 +0000149
Rafael Espindolad3190792016-09-16 15:10:23 +0000150 std::vector<InputSectionData *> Sections;
George Rimareea31142016-07-21 14:26:59 +0000151};
152
Rui Ueyamab04af132016-10-13 23:08:33 +0000153// Represents an ASSERT().
George Rimareefa7582016-08-04 09:29:31 +0000154struct AssertCommand : BaseCommand {
155 AssertCommand(Expr E) : BaseCommand(AssertKind), Expression(E) {}
156 static bool classof(const BaseCommand *C);
157 Expr Expression;
158};
159
Rui Ueyamab04af132016-10-13 23:08:33 +0000160// Represents BYTE(), SHORT(), LONG(), or QUAD().
George Rimare38cbab2016-09-26 19:22:50 +0000161struct BytesDataCommand : BaseCommand {
162 BytesDataCommand(uint64_t Data, unsigned Size)
163 : BaseCommand(BytesDataKind), Data(Data), Size(Size) {}
164 static bool classof(const BaseCommand *C);
165 uint64_t Data;
166 unsigned Offset;
167 unsigned Size;
168};
169
Eugene Leviantbbe38602016-07-19 09:25:43 +0000170struct PhdrsCommand {
171 StringRef Name;
172 unsigned Type;
173 bool HasFilehdr;
174 bool HasPhdrs;
Eugene Leviant865bf862016-07-21 10:43:25 +0000175 unsigned Flags;
Eugene Leviant56b21c82016-09-09 09:46:16 +0000176 Expr LMAExpr;
George Rimar652852c2016-04-16 10:10:32 +0000177};
178
George Rimar884e7862016-09-08 08:19:13 +0000179class LinkerScriptBase {
Rafael Espindola4d1e4d72016-09-08 14:11:08 +0000180protected:
181 ~LinkerScriptBase() = default;
182
George Rimar884e7862016-09-08 08:19:13 +0000183public:
184 virtual uint64_t getOutputSectionAddress(StringRef Name) = 0;
185 virtual uint64_t getOutputSectionSize(StringRef Name) = 0;
Eugene Leviant36fac7f2016-09-08 09:08:30 +0000186 virtual uint64_t getOutputSectionAlign(StringRef Name) = 0;
Eugene Leviantb71d6f72016-10-06 09:39:28 +0000187 virtual uint64_t getOutputSectionLMA(StringRef Name) = 0;
George Rimar884e7862016-09-08 08:19:13 +0000188 virtual uint64_t getHeaderSize() = 0;
189 virtual uint64_t getSymbolValue(StringRef S) = 0;
George Rimarf34f45f2016-09-23 13:17:23 +0000190 virtual bool isDefined(StringRef S) = 0;
Rafael Espindola2f831dc2016-10-31 19:56:37 +0000191 virtual bool isAbsolute(StringRef S) = 0;
George Rimar884e7862016-09-08 08:19:13 +0000192};
193
Rui Ueyama07320e42016-04-20 20:13:41 +0000194// ScriptConfiguration holds linker script parse results.
195struct ScriptConfiguration {
George Rimar652852c2016-04-16 10:10:32 +0000196 // Used to assign addresses to sections.
George Rimar076fe152016-07-21 06:43:01 +0000197 std::vector<std::unique_ptr<BaseCommand>> Commands;
George Rimar652852c2016-04-16 10:10:32 +0000198
Eugene Leviantbbe38602016-07-19 09:25:43 +0000199 // Used to assign sections to headers.
George Rimar70ce0a92016-07-20 15:09:10 +0000200 std::vector<PhdrsCommand> PhdrsCommands;
201
Eugene Leviante05336ff2016-09-14 08:32:36 +0000202 bool HasSections = false;
Rui Ueyama07320e42016-04-20 20:13:41 +0000203
Rui Ueyama8ec77e62016-04-21 22:00:51 +0000204 // List of section patterns specified with KEEP commands. They will
205 // be kept even if they are unused and --gc-sections is specified.
Eugene Leviantcf43f172016-10-05 09:36:59 +0000206 std::vector<InputSectionDescription *> KeptSections;
Rui Ueyama717677a2016-02-11 21:17:59 +0000207};
208
Rui Ueyama07320e42016-04-20 20:13:41 +0000209extern ScriptConfiguration *ScriptConfig;
210
211// This is a runner of the linker script.
George Rimar884e7862016-09-08 08:19:13 +0000212template <class ELFT> class LinkerScript final : public LinkerScriptBase {
Rui Ueyama0b3868e2016-04-22 20:41:07 +0000213 typedef typename ELFT::uint uintX_t;
214
Rui Ueyama07320e42016-04-20 20:13:41 +0000215public:
Rui Ueyamaf34d0e02016-08-12 01:24:53 +0000216 LinkerScript();
217 ~LinkerScript();
Eugene Leviant20d03192016-09-16 15:30:47 +0000218 void processCommands(OutputSectionFactory<ELFT> &Factory);
Rafael Espindolaa4b41dc2016-08-04 12:13:05 +0000219 void createSections(OutputSectionFactory<ELFT> &Factory);
Rafael Espindola9546fff2016-09-22 14:40:50 +0000220 void adjustSectionsBeforeSorting();
Rui Ueyamaa7f78842016-07-20 17:19:03 +0000221
Rafael Espindolaa4b41dc2016-08-04 12:13:05 +0000222 std::vector<PhdrEntry<ELFT>> createPhdrs();
Eugene Leviantf9bc3bd2016-08-16 06:40:58 +0000223 bool ignoreInterpSection();
Rui Ueyamaadca2452016-07-23 14:18:48 +0000224
Rui Ueyama07320e42016-04-20 20:13:41 +0000225 ArrayRef<uint8_t> getFiller(StringRef Name);
George Rimare38cbab2016-09-26 19:22:50 +0000226 void writeDataBytes(StringRef Name, uint8_t *Buf);
Eugene Leviantb71d6f72016-10-06 09:39:28 +0000227 bool hasLMA(StringRef Name);
Rui Ueyama07320e42016-04-20 20:13:41 +0000228 bool shouldKeep(InputSectionBase<ELFT> *S);
Rafael Espindolad3190792016-09-16 15:10:23 +0000229 void assignOffsets(OutputSectionCommand *Cmd);
Rafael Espindola6d91fce2016-09-29 18:50:34 +0000230 void assignAddresses(std::vector<PhdrEntry<ELFT>> &Phdrs);
Eugene Leviantbbe38602016-07-19 09:25:43 +0000231 bool hasPhdrsCommands();
George Rimar884e7862016-09-08 08:19:13 +0000232 uint64_t getOutputSectionAddress(StringRef Name) override;
233 uint64_t getOutputSectionSize(StringRef Name) override;
Eugene Leviant36fac7f2016-09-08 09:08:30 +0000234 uint64_t getOutputSectionAlign(StringRef Name) override;
Eugene Leviantb71d6f72016-10-06 09:39:28 +0000235 uint64_t getOutputSectionLMA(StringRef Name) override;
George Rimar884e7862016-09-08 08:19:13 +0000236 uint64_t getHeaderSize() override;
237 uint64_t getSymbolValue(StringRef S) override;
George Rimarf34f45f2016-09-23 13:17:23 +0000238 bool isDefined(StringRef S) override;
Rafael Espindola2f831dc2016-10-31 19:56:37 +0000239 bool isAbsolute(StringRef S) override;
Rui Ueyama07320e42016-04-20 20:13:41 +0000240
Rafael Espindolaa4b41dc2016-08-04 12:13:05 +0000241 std::vector<OutputSectionBase<ELFT> *> *OutputSections;
242
Rafael Espindolab6b8f6c2016-09-20 22:43:15 +0000243 int getSectionIndex(StringRef Name);
244
Rui Ueyama07320e42016-04-20 20:13:41 +0000245private:
Rafael Espindolae71a3f8a2016-09-16 20:34:02 +0000246 void computeInputSections(InputSectionDescription *);
Rui Ueyama6b274812016-07-25 22:51:07 +0000247
Eugene Leviant20d03192016-09-16 15:30:47 +0000248 void addSection(OutputSectionFactory<ELFT> &Factory,
249 InputSectionBase<ELFT> *Sec, StringRef Name);
Rafael Espindola7bd37872016-09-12 16:05:16 +0000250 void discard(ArrayRef<InputSectionBase<ELFT> *> V);
Rui Ueyama48c3f1c2016-08-12 00:27:23 +0000251
Rui Ueyama0b9ce6a2016-08-12 03:16:56 +0000252 std::vector<InputSectionBase<ELFT> *>
253 createInputSectionList(OutputSectionCommand &Cmd);
254
Rui Ueyamac998a8c2016-04-22 00:03:13 +0000255 // "ScriptConfig" is a bit too long, so define a short name for it.
256 ScriptConfiguration &Opt = *ScriptConfig;
257
Rui Ueyamaedebbdf2016-07-24 23:47:31 +0000258 std::vector<size_t> getPhdrIndices(StringRef SectionName);
Rui Ueyama29c5a2a2016-07-26 00:27:36 +0000259 size_t getPhdrIndex(StringRef PhdrName);
Rui Ueyama07320e42016-04-20 20:13:41 +0000260
Rui Ueyama0b3868e2016-04-22 20:41:07 +0000261 uintX_t Dot;
Eugene Leviantb71d6f72016-10-06 09:39:28 +0000262 uintX_t LMAOffset = 0;
Rafael Espindolad3190792016-09-16 15:10:23 +0000263 OutputSectionBase<ELFT> *CurOutSec = nullptr;
264 uintX_t ThreadBssOffset = 0;
265 void switchTo(OutputSectionBase<ELFT> *Sec);
266 void flush();
267 void output(InputSection<ELFT> *Sec);
268 void process(BaseCommand &Base);
269 llvm::DenseSet<OutputSectionBase<ELFT> *> AlreadyOutputOS;
270 llvm::DenseSet<InputSectionData *> AlreadyOutputIS;
Rui Ueyama07320e42016-04-20 20:13:41 +0000271};
272
273// Variable template is a C++14 feature, so we can't template
274// a global variable. Use a struct to workaround.
275template <class ELFT> struct Script { static LinkerScript<ELFT> *X; };
276template <class ELFT> LinkerScript<ELFT> *Script<ELFT>::X;
Rui Ueyama717677a2016-02-11 21:17:59 +0000277
George Rimar884e7862016-09-08 08:19:13 +0000278extern LinkerScriptBase *ScriptBase;
279
Rafael Espindolae0df00b2016-02-28 00:25:54 +0000280} // namespace elf
Rui Ueyama717677a2016-02-11 21:17:59 +0000281} // namespace lld
282
283#endif