blob: d9fc1175fcec6faa9fbea38800b1a50511ba7325 [file] [log] [blame]
//===- LinkerScript.h -------------------------------------------*- C++ -*-===//
//
//                             The LLVM Linker
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
9
10#ifndef LLD_ELF_LINKER_SCRIPT_H
11#define LLD_ELF_LINKER_SCRIPT_H
12
#include "Strings.h"
#include "Writer.h"
#include "lld/Core/LLVM.h"
#include "llvm/ADT/DenseMap.h"
#include "llvm/ADT/DenseSet.h"
#include "llvm/ADT/MapVector.h"
#include "llvm/Support/Allocator.h"
#include "llvm/Support/MemoryBuffer.h"
#include "llvm/Support/Regex.h"
#include <functional>
#include <utility>
Rui Ueyama717677a2016-02-11 21:17:59 +000023
24namespace lld {
Rafael Espindolae0df00b2016-02-28 00:25:54 +000025namespace elf {
// Forward declarations. Where this header uses these types, it does so only
// through pointers or references, so the full definitions are not needed.
class DefinedCommon;
class InputSectionData;
class ScriptParser;
class SymbolBody;
template <class ELFT> class InputSection;
template <class ELFT> class InputSectionBase;
template <class ELFT> class OutputSectionBase;
template <class ELFT> class OutputSectionFactory;
Rui Ueyama717677a2016-02-11 21:17:59 +000034
// A linker script expression: a callable that takes one uint64_t and returns
// a uint64_t.
// NOTE(review): the argument is presumably the current value of "." (the
// location counter) — confirm against the parser.
using Expr = std::function<uint64_t(uint64_t)>;
36
Rui Ueyama07320e42016-04-20 20:13:41 +000037// Parses a linker script. Calling this function updates
38// Config and ScriptConfig.
39void readLinkerScript(MemoryBufferRef MB);
40
George Rimar20b65982016-08-31 09:08:26 +000041void readVersionScript(MemoryBufferRef MB);
42
// This enum is used to implement linker script SECTIONS command.
// https://sourceware.org/binutils/docs/ld/SECTIONS.html#SECTIONS
//
// Each enumerator is the tag that one of the command structs in this header
// hands to the BaseCommand constructor.
enum SectionsCommandKind {
  AssignmentKind,
  OutputSectionKind,
  InputSectionKind,
  AssertKind
};
51
// Common base of the command structs declared in this header. Kind stores
// the integer tag supplied by the derived constructor. The destructor is
// virtual so that commands can be destroyed through a BaseCommand pointer.
struct BaseCommand {
  // explicit: a bare int must never silently convert into a command.
  explicit BaseCommand(int K) : Kind(K) {}
  virtual ~BaseCommand() = default;
  int Kind;
};
57
58struct SymbolAssignment : BaseCommand {
Eugene Leviantdb741e72016-09-07 07:08:43 +000059 SymbolAssignment(StringRef Name, Expr E, bool IsAbsolute)
60 : BaseCommand(AssignmentKind), Name(Name), Expression(E),
61 IsAbsolute(IsAbsolute) {}
George Rimar076fe152016-07-21 06:43:01 +000062 static bool classof(const BaseCommand *C);
Rui Ueyama20204242016-07-29 05:52:33 +000063
64 // The LHS of an expression. Name is either a symbol name or ".".
George Rimar076fe152016-07-21 06:43:01 +000065 StringRef Name;
Rui Ueyama20204242016-07-29 05:52:33 +000066 SymbolBody *Sym = nullptr;
67
68 // The RHS of an expression.
Rui Ueyama708019c2016-07-24 18:19:40 +000069 Expr Expression;
Rui Ueyama20204242016-07-29 05:52:33 +000070
71 // Command attributes for PROVIDE, HIDDEN and PROVIDE_HIDDEN.
Eugene Levianta31c91b2016-07-22 07:38:40 +000072 bool Provide = false;
Eugene Levianta31c91b2016-07-22 07:38:40 +000073 bool Hidden = false;
Eugene Leviantdb741e72016-09-07 07:08:43 +000074 bool IsAbsolute;
George Rimar076fe152016-07-21 06:43:01 +000075};
76
// Linker scripts allow additional constraints to be put on output sections.
// By using the keyword ONLY_IF_RO or ONLY_IF_RW, an output section is only
// created if all of its input sections are read-only or all of its input
// sections are read-write, respectively.
enum class ConstraintKind { NoConstraint, ReadOnly, ReadWrite };
Davide Italiano246f6812016-07-22 03:36:24 +000083
George Rimar076fe152016-07-21 06:43:01 +000084struct OutputSectionCommand : BaseCommand {
85 OutputSectionCommand(StringRef Name)
86 : BaseCommand(OutputSectionKind), Name(Name) {}
87 static bool classof(const BaseCommand *C);
Eugene Levianteda81a12016-07-12 06:39:48 +000088 StringRef Name;
George Rimar58e5c4d2016-07-25 08:29:46 +000089 Expr AddrExpr;
George Rimar630c6172016-07-26 18:06:29 +000090 Expr AlignExpr;
George Rimar8ceadb32016-08-17 07:44:19 +000091 Expr LmaExpr;
George Rimardb24d9c2016-08-19 15:18:23 +000092 Expr SubalignExpr;
George Rimareea31142016-07-21 14:26:59 +000093 std::vector<std::unique_ptr<BaseCommand>> Commands;
Eugene Leviantbbe38602016-07-19 09:25:43 +000094 std::vector<StringRef> Phdrs;
George Rimar076fe152016-07-21 06:43:01 +000095 std::vector<uint8_t> Filler;
Rui Ueyamaefc40662016-07-25 22:00:10 +000096 ConstraintKind Constraint = ConstraintKind::NoConstraint;
Eugene Leviantbbe38602016-07-19 09:25:43 +000097};
98
// Sort orders that an InputSectionDescription can select for its outer and
// inner sort; SortNone is the default for both.
enum SortKind { SortNone, SortByPriority, SortByName, SortByAlignment };
George Rimar350ece42016-08-03 08:35:59 +0000100
George Rimareea31142016-07-21 14:26:59 +0000101struct InputSectionDescription : BaseCommand {
George Rimarc91930a2016-09-02 21:17:20 +0000102 InputSectionDescription(StringRef FilePattern)
103 : BaseCommand(InputSectionKind),
104 FileRe(compileGlobPatterns({FilePattern})) {}
George Rimareea31142016-07-21 14:26:59 +0000105 static bool classof(const BaseCommand *C);
George Rimarc91930a2016-09-02 21:17:20 +0000106 llvm::Regex FileRe;
Rui Ueyama742c3832016-08-04 22:27:00 +0000107 SortKind SortOuter = SortNone;
108 SortKind SortInner = SortNone;
George Rimarceae6302016-09-16 13:30:18 +0000109 llvm::Regex ExcludedFileRe;
110 llvm::Regex SectionRe;
Rafael Espindolad3190792016-09-16 15:10:23 +0000111 std::vector<InputSectionData *> Sections;
George Rimareea31142016-07-21 14:26:59 +0000112};
113
George Rimareefa7582016-08-04 09:29:31 +0000114struct AssertCommand : BaseCommand {
115 AssertCommand(Expr E) : BaseCommand(AssertKind), Expression(E) {}
116 static bool classof(const BaseCommand *C);
117 Expr Expression;
118};
119
Eugene Leviantbbe38602016-07-19 09:25:43 +0000120struct PhdrsCommand {
121 StringRef Name;
122 unsigned Type;
123 bool HasFilehdr;
124 bool HasPhdrs;
Eugene Leviant865bf862016-07-21 10:43:25 +0000125 unsigned Flags;
Eugene Leviant56b21c82016-09-09 09:46:16 +0000126 Expr LMAExpr;
George Rimar652852c2016-04-16 10:10:32 +0000127};
128
George Rimar884e7862016-09-08 08:19:13 +0000129class LinkerScriptBase {
Rafael Espindola4d1e4d72016-09-08 14:11:08 +0000130protected:
131 ~LinkerScriptBase() = default;
132
George Rimar884e7862016-09-08 08:19:13 +0000133public:
134 virtual uint64_t getOutputSectionAddress(StringRef Name) = 0;
135 virtual uint64_t getOutputSectionSize(StringRef Name) = 0;
Eugene Leviant36fac7f2016-09-08 09:08:30 +0000136 virtual uint64_t getOutputSectionAlign(StringRef Name) = 0;
George Rimar884e7862016-09-08 08:19:13 +0000137 virtual uint64_t getHeaderSize() = 0;
138 virtual uint64_t getSymbolValue(StringRef S) = 0;
139};
140
Rui Ueyama07320e42016-04-20 20:13:41 +0000141// ScriptConfiguration holds linker script parse results.
142struct ScriptConfiguration {
George Rimar652852c2016-04-16 10:10:32 +0000143 // Used to assign addresses to sections.
George Rimar076fe152016-07-21 06:43:01 +0000144 std::vector<std::unique_ptr<BaseCommand>> Commands;
George Rimar652852c2016-04-16 10:10:32 +0000145
Eugene Leviantbbe38602016-07-19 09:25:43 +0000146 // Used to assign sections to headers.
George Rimar70ce0a92016-07-20 15:09:10 +0000147 std::vector<PhdrsCommand> PhdrsCommands;
148
Eugene Leviante05336ff2016-09-14 08:32:36 +0000149 bool HasSections = false;
Rui Ueyama07320e42016-04-20 20:13:41 +0000150
Rui Ueyamaf9de0d62016-02-11 21:38:55 +0000151 llvm::BumpPtrAllocator Alloc;
Rui Ueyama8ec77e62016-04-21 22:00:51 +0000152
153 // List of section patterns specified with KEEP commands. They will
154 // be kept even if they are unused and --gc-sections is specified.
George Rimarc91930a2016-09-02 21:17:20 +0000155 std::vector<llvm::Regex *> KeptSections;
Rui Ueyama717677a2016-02-11 21:17:59 +0000156};
157
Rui Ueyama07320e42016-04-20 20:13:41 +0000158extern ScriptConfiguration *ScriptConfig;
159
160// This is a runner of the linker script.
George Rimar884e7862016-09-08 08:19:13 +0000161template <class ELFT> class LinkerScript final : public LinkerScriptBase {
Rui Ueyama0b3868e2016-04-22 20:41:07 +0000162 typedef typename ELFT::uint uintX_t;
163
Rui Ueyama07320e42016-04-20 20:13:41 +0000164public:
Rui Ueyamaf34d0e02016-08-12 01:24:53 +0000165 LinkerScript();
166 ~LinkerScript();
Eugene Leviant20d03192016-09-16 15:30:47 +0000167 void processCommands(OutputSectionFactory<ELFT> &Factory);
Rafael Espindolaa4b41dc2016-08-04 12:13:05 +0000168 void createSections(OutputSectionFactory<ELFT> &Factory);
Rui Ueyamaa7f78842016-07-20 17:19:03 +0000169
Rafael Espindolaa4b41dc2016-08-04 12:13:05 +0000170 std::vector<PhdrEntry<ELFT>> createPhdrs();
Eugene Leviantf9bc3bd2016-08-16 06:40:58 +0000171 bool ignoreInterpSection();
Rui Ueyamaadca2452016-07-23 14:18:48 +0000172
Rui Ueyama07320e42016-04-20 20:13:41 +0000173 ArrayRef<uint8_t> getFiller(StringRef Name);
George Rimar8ceadb32016-08-17 07:44:19 +0000174 Expr getLma(StringRef Name);
Rui Ueyama07320e42016-04-20 20:13:41 +0000175 bool shouldKeep(InputSectionBase<ELFT> *S);
Rafael Espindolad3190792016-09-16 15:10:23 +0000176 void assignOffsets(OutputSectionCommand *Cmd);
Rafael Espindolaa4b41dc2016-08-04 12:13:05 +0000177 void assignAddresses();
Rui Ueyama07320e42016-04-20 20:13:41 +0000178 int compareSections(StringRef A, StringRef B);
Eugene Leviantbbe38602016-07-19 09:25:43 +0000179 bool hasPhdrsCommands();
George Rimar884e7862016-09-08 08:19:13 +0000180 uint64_t getOutputSectionAddress(StringRef Name) override;
181 uint64_t getOutputSectionSize(StringRef Name) override;
Eugene Leviant36fac7f2016-09-08 09:08:30 +0000182 uint64_t getOutputSectionAlign(StringRef Name) override;
George Rimar884e7862016-09-08 08:19:13 +0000183 uint64_t getHeaderSize() override;
184 uint64_t getSymbolValue(StringRef S) override;
Rui Ueyama07320e42016-04-20 20:13:41 +0000185
Rafael Espindolaa4b41dc2016-08-04 12:13:05 +0000186 std::vector<OutputSectionBase<ELFT> *> *OutputSections;
187
Rui Ueyama07320e42016-04-20 20:13:41 +0000188private:
Rafael Espindolad3190792016-09-16 15:10:23 +0000189 void computeInputSections(InputSectionDescription *,
190 ConstraintKind Constraint);
Rui Ueyama6b274812016-07-25 22:51:07 +0000191
Eugene Leviant20d03192016-09-16 15:30:47 +0000192 void addSection(OutputSectionFactory<ELFT> &Factory,
193 InputSectionBase<ELFT> *Sec, StringRef Name);
Rafael Espindola7bd37872016-09-12 16:05:16 +0000194 void discard(ArrayRef<InputSectionBase<ELFT> *> V);
Rui Ueyama48c3f1c2016-08-12 00:27:23 +0000195
Rui Ueyama0b9ce6a2016-08-12 03:16:56 +0000196 std::vector<InputSectionBase<ELFT> *>
197 createInputSectionList(OutputSectionCommand &Cmd);
198
Rui Ueyamac998a8c2016-04-22 00:03:13 +0000199 // "ScriptConfig" is a bit too long, so define a short name for it.
200 ScriptConfiguration &Opt = *ScriptConfig;
201
Rui Ueyamac3e2a4b2016-04-21 20:30:00 +0000202 int getSectionIndex(StringRef Name);
Rui Ueyamaedebbdf2016-07-24 23:47:31 +0000203 std::vector<size_t> getPhdrIndices(StringRef SectionName);
Rui Ueyama29c5a2a2016-07-26 00:27:36 +0000204 size_t getPhdrIndex(StringRef PhdrName);
Rui Ueyama07320e42016-04-20 20:13:41 +0000205
Rui Ueyama0b3868e2016-04-22 20:41:07 +0000206 uintX_t Dot;
Rafael Espindolad3190792016-09-16 15:10:23 +0000207 OutputSectionBase<ELFT> *CurOutSec = nullptr;
208 uintX_t ThreadBssOffset = 0;
209 void switchTo(OutputSectionBase<ELFT> *Sec);
210 void flush();
211 void output(InputSection<ELFT> *Sec);
212 void process(BaseCommand &Base);
213 llvm::DenseSet<OutputSectionBase<ELFT> *> AlreadyOutputOS;
214 llvm::DenseSet<InputSectionData *> AlreadyOutputIS;
Rui Ueyama07320e42016-04-20 20:13:41 +0000215};
216
217// Variable template is a C++14 feature, so we can't template
218// a global variable. Use a struct to workaround.
219template <class ELFT> struct Script { static LinkerScript<ELFT> *X; };
220template <class ELFT> LinkerScript<ELFT> *Script<ELFT>::X;
Rui Ueyama717677a2016-02-11 21:17:59 +0000221
George Rimar884e7862016-09-08 08:19:13 +0000222extern LinkerScriptBase *ScriptBase;
223
Rafael Espindolae0df00b2016-02-28 00:25:54 +0000224} // namespace elf
Rui Ueyama717677a2016-02-11 21:17:59 +0000225} // namespace lld
226
227#endif