Rui Ueyama | 717677a | 2016-02-11 21:17:59 +0000 | [diff] [blame] | 1 | //===- LinkerScript.h -------------------------------------------*- C++ -*-===// |
| 2 | // |
| 3 | // The LLVM Linker |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
| 10 | #ifndef LLD_ELF_LINKER_SCRIPT_H |
| 11 | #define LLD_ELF_LINKER_SCRIPT_H |
| 12 | |
George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 13 | #include "Strings.h" |
Eugene Leviant | bbe3860 | 2016-07-19 09:25:43 +0000 | [diff] [blame] | 14 | #include "Writer.h" |
Rui Ueyama | 717677a | 2016-02-11 21:17:59 +0000 | [diff] [blame] | 15 | #include "lld/Core/LLVM.h" |
| 16 | #include "llvm/ADT/DenseMap.h" |
| 17 | #include "llvm/ADT/MapVector.h" |
Rui Ueyama | f9de0d6 | 2016-02-11 21:38:55 +0000 | [diff] [blame] | 18 | #include "llvm/Support/Allocator.h" |
| 19 | #include "llvm/Support/MemoryBuffer.h" |
George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 20 | #include "llvm/Support/Regex.h" |
Rui Ueyama | 708019c | 2016-07-24 18:19:40 +0000 | [diff] [blame] | 21 | #include <functional> |
Rui Ueyama | 717677a | 2016-02-11 21:17:59 +0000 | [diff] [blame] | 22 | |
| 23 | namespace lld { |
Rafael Espindola | e0df00b | 2016-02-28 00:25:54 +0000 | [diff] [blame] | 24 | namespace elf { |
// Forward declarations; none of these types is defined in this header.
class DefinedCommon;
class InputSectionData;
class ScriptParser;
class SymbolBody;

template <class ELFT> class InputSectionBase;
template <class ELFT> class OutputSectionBase;
template <class ELFT> class OutputSectionFactory;
Rui Ueyama | 717677a | 2016-02-11 21:17:59 +0000 | [diff] [blame] | 32 | |
// A linker script expression, represented as a callable that takes one
// uint64_t and yields a uint64_t.
// NOTE(review): the argument is presumably the current value of "." --
// confirm against the code that builds and evaluates these.
using Expr = std::function<uint64_t(uint64_t)>;
| 34 | |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 35 | // Parses a linker script. Calling this function updates |
| 36 | // Config and ScriptConfig. |
| 37 | void readLinkerScript(MemoryBufferRef MB); |
| 38 | |
George Rimar | 20b6598 | 2016-08-31 09:08:26 +0000 | [diff] [blame] | 39 | void readVersionScript(MemoryBufferRef MB); |
| 40 | |
// Discriminator for the commands that implement the linker script
// SECTIONS command.
// https://sourceware.org/binutils/docs/ld/SECTIONS.html#SECTIONS
enum SectionsCommandKind {
  AssignmentKind,    // passed to BaseCommand by SymbolAssignment
  OutputSectionKind, // passed to BaseCommand by OutputSectionCommand
  InputSectionKind,  // passed to BaseCommand by InputSectionDescription
  AssertKind         // passed to BaseCommand by AssertCommand
};
| 49 | |
// Common base of the linker script command structs declared in this file.
// Kind stores the discriminator handed in by the derived struct's
// constructor; the derived structs in this file pass a SectionsCommandKind
// enumerator.
struct BaseCommand {
  // explicit: a bare int must never convert silently into a command object.
  explicit BaseCommand(int K) : Kind(K) {}

  // Virtual so that derived commands can be destroyed through a
  // BaseCommand pointer (e.g. std::unique_ptr<BaseCommand>).
  virtual ~BaseCommand() = default;

  int Kind;
};
| 55 | |
| 56 | struct SymbolAssignment : BaseCommand { |
Eugene Leviant | db741e7 | 2016-09-07 07:08:43 +0000 | [diff] [blame] | 57 | SymbolAssignment(StringRef Name, Expr E, bool IsAbsolute) |
| 58 | : BaseCommand(AssignmentKind), Name(Name), Expression(E), |
| 59 | IsAbsolute(IsAbsolute) {} |
George Rimar | 076fe15 | 2016-07-21 06:43:01 +0000 | [diff] [blame] | 60 | static bool classof(const BaseCommand *C); |
Rui Ueyama | 2020424 | 2016-07-29 05:52:33 +0000 | [diff] [blame] | 61 | |
| 62 | // The LHS of an expression. Name is either a symbol name or ".". |
George Rimar | 076fe15 | 2016-07-21 06:43:01 +0000 | [diff] [blame] | 63 | StringRef Name; |
Rui Ueyama | 2020424 | 2016-07-29 05:52:33 +0000 | [diff] [blame] | 64 | SymbolBody *Sym = nullptr; |
| 65 | |
| 66 | // The RHS of an expression. |
Rui Ueyama | 708019c | 2016-07-24 18:19:40 +0000 | [diff] [blame] | 67 | Expr Expression; |
Rui Ueyama | 2020424 | 2016-07-29 05:52:33 +0000 | [diff] [blame] | 68 | |
| 69 | // Command attributes for PROVIDE, HIDDEN and PROVIDE_HIDDEN. |
Eugene Leviant | a31c91b | 2016-07-22 07:38:40 +0000 | [diff] [blame] | 70 | bool Provide = false; |
Eugene Leviant | a31c91b | 2016-07-22 07:38:40 +0000 | [diff] [blame] | 71 | bool Hidden = false; |
Eugene Leviant | db741e7 | 2016-09-07 07:08:43 +0000 | [diff] [blame] | 72 | bool IsAbsolute; |
Eugene Leviant | 97403d1 | 2016-09-01 09:55:57 +0000 | [diff] [blame] | 73 | InputSectionData *GoesAfter = nullptr; |
George Rimar | 076fe15 | 2016-07-21 06:43:01 +0000 | [diff] [blame] | 74 | }; |
| 75 | |
// Linker scripts allow additional constraints to be put on output sections.
// With the keyword ONLY_IF_RO an output section is only created if all of
// its input sections are read-only; with ONLY_IF_RW it is only created if
// all of its input sections are read-write.
enum class ConstraintKind {
  NoConstraint,
  ReadOnly,
  ReadWrite
};
Davide Italiano | 246f681 | 2016-07-22 03:36:24 +0000 | [diff] [blame] | 82 | |
George Rimar | 076fe15 | 2016-07-21 06:43:01 +0000 | [diff] [blame] | 83 | struct OutputSectionCommand : BaseCommand { |
| 84 | OutputSectionCommand(StringRef Name) |
| 85 | : BaseCommand(OutputSectionKind), Name(Name) {} |
| 86 | static bool classof(const BaseCommand *C); |
Eugene Leviant | eda81a1 | 2016-07-12 06:39:48 +0000 | [diff] [blame] | 87 | StringRef Name; |
George Rimar | 58e5c4d | 2016-07-25 08:29:46 +0000 | [diff] [blame] | 88 | Expr AddrExpr; |
George Rimar | 630c617 | 2016-07-26 18:06:29 +0000 | [diff] [blame] | 89 | Expr AlignExpr; |
George Rimar | 8ceadb3 | 2016-08-17 07:44:19 +0000 | [diff] [blame] | 90 | Expr LmaExpr; |
George Rimar | db24d9c | 2016-08-19 15:18:23 +0000 | [diff] [blame] | 91 | Expr SubalignExpr; |
George Rimar | eea3114 | 2016-07-21 14:26:59 +0000 | [diff] [blame] | 92 | std::vector<std::unique_ptr<BaseCommand>> Commands; |
Eugene Leviant | bbe3860 | 2016-07-19 09:25:43 +0000 | [diff] [blame] | 93 | std::vector<StringRef> Phdrs; |
George Rimar | 076fe15 | 2016-07-21 06:43:01 +0000 | [diff] [blame] | 94 | std::vector<uint8_t> Filler; |
Rui Ueyama | efc4066 | 2016-07-25 22:00:10 +0000 | [diff] [blame] | 95 | ConstraintKind Constraint = ConstraintKind::NoConstraint; |
Eugene Leviant | bbe3860 | 2016-07-19 09:25:43 +0000 | [diff] [blame] | 96 | }; |
| 97 | |
// Sort order selector; used for InputSectionDescription's SortOuter and
// SortInner fields.
enum SortKind {
  SortNone,
  SortByName,
  SortByAlignment
};
George Rimar | 350ece4 | 2016-08-03 08:35:59 +0000 | [diff] [blame] | 99 | |
George Rimar | eea3114 | 2016-07-21 14:26:59 +0000 | [diff] [blame] | 100 | struct InputSectionDescription : BaseCommand { |
George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 101 | InputSectionDescription(StringRef FilePattern) |
| 102 | : BaseCommand(InputSectionKind), |
| 103 | FileRe(compileGlobPatterns({FilePattern})) {} |
George Rimar | eea3114 | 2016-07-21 14:26:59 +0000 | [diff] [blame] | 104 | static bool classof(const BaseCommand *C); |
George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 105 | llvm::Regex FileRe; |
Rui Ueyama | 742c383 | 2016-08-04 22:27:00 +0000 | [diff] [blame] | 106 | SortKind SortOuter = SortNone; |
| 107 | SortKind SortInner = SortNone; |
George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 108 | llvm::Regex ExcludedFileRe; |
| 109 | llvm::Regex SectionRe; |
George Rimar | eea3114 | 2016-07-21 14:26:59 +0000 | [diff] [blame] | 110 | }; |
| 111 | |
George Rimar | eefa758 | 2016-08-04 09:29:31 +0000 | [diff] [blame] | 112 | struct AssertCommand : BaseCommand { |
| 113 | AssertCommand(Expr E) : BaseCommand(AssertKind), Expression(E) {} |
| 114 | static bool classof(const BaseCommand *C); |
| 115 | Expr Expression; |
| 116 | }; |
| 117 | |
Eugene Leviant | bbe3860 | 2016-07-19 09:25:43 +0000 | [diff] [blame] | 118 | struct PhdrsCommand { |
| 119 | StringRef Name; |
| 120 | unsigned Type; |
| 121 | bool HasFilehdr; |
| 122 | bool HasPhdrs; |
Eugene Leviant | 865bf86 | 2016-07-21 10:43:25 +0000 | [diff] [blame] | 123 | unsigned Flags; |
Eugene Leviant | 56b21c8 | 2016-09-09 09:46:16 +0000 | [diff] [blame] | 124 | Expr LMAExpr; |
George Rimar | 652852c | 2016-04-16 10:10:32 +0000 | [diff] [blame] | 125 | }; |
| 126 | |
George Rimar | 884e786 | 2016-09-08 08:19:13 +0000 | [diff] [blame] | 127 | class LinkerScriptBase { |
Rafael Espindola | 4d1e4d7 | 2016-09-08 14:11:08 +0000 | [diff] [blame] | 128 | protected: |
| 129 | ~LinkerScriptBase() = default; |
| 130 | |
George Rimar | 884e786 | 2016-09-08 08:19:13 +0000 | [diff] [blame] | 131 | public: |
| 132 | virtual uint64_t getOutputSectionAddress(StringRef Name) = 0; |
| 133 | virtual uint64_t getOutputSectionSize(StringRef Name) = 0; |
Eugene Leviant | 36fac7f | 2016-09-08 09:08:30 +0000 | [diff] [blame] | 134 | virtual uint64_t getOutputSectionAlign(StringRef Name) = 0; |
George Rimar | 884e786 | 2016-09-08 08:19:13 +0000 | [diff] [blame] | 135 | virtual uint64_t getHeaderSize() = 0; |
| 136 | virtual uint64_t getSymbolValue(StringRef S) = 0; |
| 137 | }; |
| 138 | |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 139 | // ScriptConfiguration holds linker script parse results. |
| 140 | struct ScriptConfiguration { |
Petr Hosek | e5d3ca5 | 2016-08-31 15:31:17 +0000 | [diff] [blame] | 141 | // Used to create symbol assignments outside SECTIONS command. |
| 142 | std::vector<std::unique_ptr<SymbolAssignment>> Assignments; |
George Rimar | 652852c | 2016-04-16 10:10:32 +0000 | [diff] [blame] | 143 | // Used to assign addresses to sections. |
George Rimar | 076fe15 | 2016-07-21 06:43:01 +0000 | [diff] [blame] | 144 | std::vector<std::unique_ptr<BaseCommand>> Commands; |
George Rimar | 652852c | 2016-04-16 10:10:32 +0000 | [diff] [blame] | 145 | |
Eugene Leviant | bbe3860 | 2016-07-19 09:25:43 +0000 | [diff] [blame] | 146 | // Used to assign sections to headers. |
George Rimar | 70ce0a9 | 2016-07-20 15:09:10 +0000 | [diff] [blame] | 147 | std::vector<PhdrsCommand> PhdrsCommands; |
| 148 | |
Eugene Leviant | e05336ff | 2016-09-14 08:32:36 +0000 | [diff] [blame^] | 149 | bool HasSections = false; |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 150 | |
Rui Ueyama | f9de0d6 | 2016-02-11 21:38:55 +0000 | [diff] [blame] | 151 | llvm::BumpPtrAllocator Alloc; |
Rui Ueyama | 8ec77e6 | 2016-04-21 22:00:51 +0000 | [diff] [blame] | 152 | |
| 153 | // List of section patterns specified with KEEP commands. They will |
| 154 | // be kept even if they are unused and --gc-sections is specified. |
George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 155 | std::vector<llvm::Regex *> KeptSections; |
Rui Ueyama | 717677a | 2016-02-11 21:17:59 +0000 | [diff] [blame] | 156 | }; |
| 157 | |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 158 | extern ScriptConfiguration *ScriptConfig; |
| 159 | |
| 160 | // This is a runner of the linker script. |
George Rimar | 884e786 | 2016-09-08 08:19:13 +0000 | [diff] [blame] | 161 | template <class ELFT> class LinkerScript final : public LinkerScriptBase { |
Rui Ueyama | 0b3868e | 2016-04-22 20:41:07 +0000 | [diff] [blame] | 162 | typedef typename ELFT::uint uintX_t; |
| 163 | |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 164 | public: |
Rui Ueyama | f34d0e0 | 2016-08-12 01:24:53 +0000 | [diff] [blame] | 165 | LinkerScript(); |
| 166 | ~LinkerScript(); |
Petr Hosek | e5d3ca5 | 2016-08-31 15:31:17 +0000 | [diff] [blame] | 167 | void createAssignments(); |
Rafael Espindola | a4b41dc | 2016-08-04 12:13:05 +0000 | [diff] [blame] | 168 | void createSections(OutputSectionFactory<ELFT> &Factory); |
Rui Ueyama | a7f7884 | 2016-07-20 17:19:03 +0000 | [diff] [blame] | 169 | |
Rafael Espindola | a4b41dc | 2016-08-04 12:13:05 +0000 | [diff] [blame] | 170 | std::vector<PhdrEntry<ELFT>> createPhdrs(); |
Eugene Leviant | f9bc3bd | 2016-08-16 06:40:58 +0000 | [diff] [blame] | 171 | bool ignoreInterpSection(); |
Rui Ueyama | adca245 | 2016-07-23 14:18:48 +0000 | [diff] [blame] | 172 | |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 173 | ArrayRef<uint8_t> getFiller(StringRef Name); |
George Rimar | 8ceadb3 | 2016-08-17 07:44:19 +0000 | [diff] [blame] | 174 | Expr getLma(StringRef Name); |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 175 | bool shouldKeep(InputSectionBase<ELFT> *S); |
Rafael Espindola | a4b41dc | 2016-08-04 12:13:05 +0000 | [diff] [blame] | 176 | void assignAddresses(); |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 177 | int compareSections(StringRef A, StringRef B); |
Eugene Leviant | bbe3860 | 2016-07-19 09:25:43 +0000 | [diff] [blame] | 178 | bool hasPhdrsCommands(); |
George Rimar | 884e786 | 2016-09-08 08:19:13 +0000 | [diff] [blame] | 179 | uint64_t getOutputSectionAddress(StringRef Name) override; |
| 180 | uint64_t getOutputSectionSize(StringRef Name) override; |
Eugene Leviant | 36fac7f | 2016-09-08 09:08:30 +0000 | [diff] [blame] | 181 | uint64_t getOutputSectionAlign(StringRef Name) override; |
George Rimar | 884e786 | 2016-09-08 08:19:13 +0000 | [diff] [blame] | 182 | uint64_t getHeaderSize() override; |
| 183 | uint64_t getSymbolValue(StringRef S) override; |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 184 | |
Rafael Espindola | a4b41dc | 2016-08-04 12:13:05 +0000 | [diff] [blame] | 185 | std::vector<OutputSectionBase<ELFT> *> *OutputSections; |
| 186 | |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 187 | private: |
Rui Ueyama | 6b27481 | 2016-07-25 22:51:07 +0000 | [diff] [blame] | 188 | std::vector<InputSectionBase<ELFT> *> |
Rui Ueyama | ad10c3d | 2016-07-28 21:05:04 +0000 | [diff] [blame] | 189 | getInputSections(const InputSectionDescription *); |
Rui Ueyama | 6b27481 | 2016-07-25 22:51:07 +0000 | [diff] [blame] | 190 | |
Rafael Espindola | 7bd3787 | 2016-09-12 16:05:16 +0000 | [diff] [blame] | 191 | void discard(ArrayRef<InputSectionBase<ELFT> *> V); |
Rui Ueyama | 48c3f1c | 2016-08-12 00:27:23 +0000 | [diff] [blame] | 192 | |
Rui Ueyama | 0b9ce6a | 2016-08-12 03:16:56 +0000 | [diff] [blame] | 193 | std::vector<InputSectionBase<ELFT> *> |
| 194 | createInputSectionList(OutputSectionCommand &Cmd); |
| 195 | |
Rui Ueyama | c998a8c | 2016-04-22 00:03:13 +0000 | [diff] [blame] | 196 | // "ScriptConfig" is a bit too long, so define a short name for it. |
| 197 | ScriptConfiguration &Opt = *ScriptConfig; |
| 198 | |
Rui Ueyama | c3e2a4b | 2016-04-21 20:30:00 +0000 | [diff] [blame] | 199 | int getSectionIndex(StringRef Name); |
Rui Ueyama | edebbdf | 2016-07-24 23:47:31 +0000 | [diff] [blame] | 200 | std::vector<size_t> getPhdrIndices(StringRef SectionName); |
Rui Ueyama | 29c5a2a | 2016-07-26 00:27:36 +0000 | [diff] [blame] | 201 | size_t getPhdrIndex(StringRef PhdrName); |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 202 | |
Rui Ueyama | 0b3868e | 2016-04-22 20:41:07 +0000 | [diff] [blame] | 203 | uintX_t Dot; |
Rui Ueyama | 07320e4 | 2016-04-20 20:13:41 +0000 | [diff] [blame] | 204 | }; |
| 205 | |
| 206 | // Variable template is a C++14 feature, so we can't template |
| 207 | // a global variable. Use a struct to workaround. |
| 208 | template <class ELFT> struct Script { static LinkerScript<ELFT> *X; }; |
| 209 | template <class ELFT> LinkerScript<ELFT> *Script<ELFT>::X; |
Rui Ueyama | 717677a | 2016-02-11 21:17:59 +0000 | [diff] [blame] | 210 | |
George Rimar | 884e786 | 2016-09-08 08:19:13 +0000 | [diff] [blame] | 211 | extern LinkerScriptBase *ScriptBase; |
| 212 | |
Rafael Espindola | e0df00b | 2016-02-28 00:25:54 +0000 | [diff] [blame] | 213 | } // namespace elf |
Rui Ueyama | 717677a | 2016-02-11 21:17:59 +0000 | [diff] [blame] | 214 | } // namespace lld |
| 215 | |
| 216 | #endif |