blob: ac384c1fdfe6b3a55f14c56d81d373962caa8849 [file] [log] [blame]
//===- Object.h -------------------------------------------------*- C++ -*-===//
//
//                      The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
9
Eugene Zelenko0ad18f82017-11-01 21:16:06 +000010#ifndef LLVM_TOOLS_OBJCOPY_OBJECT_H
11#define LLVM_TOOLS_OBJCOPY_OBJECT_H
Petr Hosek05a04cb2017-08-01 00:33:58 +000012
#include "llvm/ADT/ArrayRef.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/Twine.h"
#include "llvm/BinaryFormat/ELF.h"
#include "llvm/MC/StringTableBuilder.h"
#include "llvm/Object/ELFObjectFile.h"
#include "llvm/Support/FileOutputBuffer.h"
#include "llvm/Support/JamCRC.h"
#include <cstddef>
#include <cstdint>
#include <functional>
#include <limits>
#include <memory>
#include <set>
#include <vector>
Petr Hosek05a04cb2017-08-01 00:33:58 +000027
Eugene Zelenko0ad18f82017-11-01 21:16:06 +000028namespace llvm {
29
// Forward declarations. The visitor, writer and section types below refer to
// one another before their full definitions appear.
class SectionBase;
class Section;
class OwnedDataSection;
class StringTableSection;
class SymbolTableSection;
class RelocationSection;
class DynamicRelocationSection;
class GnuDebugLinkSection;
class GroupSection;
class Segment;
class Object;
struct Symbol;
Jake Ehrlichf5a43772017-09-25 20:37:28 +000042
43class SectionTableRef {
Jake Ehrlich76e91102018-01-25 22:46:17 +000044 MutableArrayRef<std::unique_ptr<SectionBase>> Sections;
Jake Ehrlichf5a43772017-09-25 20:37:28 +000045
46public:
Jake Ehrlich76e91102018-01-25 22:46:17 +000047 using iterator = pointee_iterator<std::unique_ptr<SectionBase> *>;
48
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +000049 explicit SectionTableRef(MutableArrayRef<std::unique_ptr<SectionBase>> Secs)
Jake Ehrlichf5a43772017-09-25 20:37:28 +000050 : Sections(Secs) {}
51 SectionTableRef(const SectionTableRef &) = default;
52
Jake Ehrlich76e91102018-01-25 22:46:17 +000053 iterator begin() { return iterator(Sections.data()); }
54 iterator end() { return iterator(Sections.data() + Sections.size()); }
55
Jake Ehrlich8b831c12018-03-07 20:33:02 +000056 SectionBase *getSection(uint16_t Index, Twine ErrMsg);
Jake Ehrlichf5a43772017-09-25 20:37:28 +000057
58 template <class T>
Jake Ehrlich8b831c12018-03-07 20:33:02 +000059 T *getSectionOfType(uint16_t Index, Twine IndexErrMsg, Twine TypeErrMsg);
Jake Ehrlichf5a43772017-09-25 20:37:28 +000060};
Petr Hosek05a04cb2017-08-01 00:33:58 +000061
// Identifies which ELF variant is being handled. The enumerators combine a
// word size (32/64) with a byte order (LE/BE).
enum ElfType {
  ELFT_ELF32LE,
  ELFT_ELF64LE,
  ELFT_ELF32BE,
  ELFT_ELF64BE
};
63
64class SectionVisitor {
65public:
66 virtual ~SectionVisitor();
67
68 virtual void visit(const Section &Sec) = 0;
69 virtual void visit(const OwnedDataSection &Sec) = 0;
70 virtual void visit(const StringTableSection &Sec) = 0;
71 virtual void visit(const SymbolTableSection &Sec) = 0;
72 virtual void visit(const RelocationSection &Sec) = 0;
73 virtual void visit(const DynamicRelocationSection &Sec) = 0;
74 virtual void visit(const GnuDebugLinkSection &Sec) = 0;
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +000075 virtual void visit(const GroupSection &Sec) = 0;
Jake Ehrlich76e91102018-01-25 22:46:17 +000076};
77
78class SectionWriter : public SectionVisitor {
79protected:
80 FileOutputBuffer &Out;
81
82public:
83 virtual ~SectionWriter(){};
84
85 void visit(const Section &Sec) override;
86 void visit(const OwnedDataSection &Sec) override;
87 void visit(const StringTableSection &Sec) override;
88 void visit(const DynamicRelocationSection &Sec) override;
89 virtual void visit(const SymbolTableSection &Sec) override = 0;
90 virtual void visit(const RelocationSection &Sec) override = 0;
91 virtual void visit(const GnuDebugLinkSection &Sec) override = 0;
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +000092 virtual void visit(const GroupSection &Sec) override = 0;
Jake Ehrlich76e91102018-01-25 22:46:17 +000093
94 SectionWriter(FileOutputBuffer &Buf) : Out(Buf) {}
95};
96
97template <class ELFT> class ELFSectionWriter : public SectionWriter {
98private:
99 using Elf_Word = typename ELFT::Word;
100 using Elf_Rel = typename ELFT::Rel;
101 using Elf_Rela = typename ELFT::Rela;
102
103public:
104 virtual ~ELFSectionWriter() {}
105 void visit(const SymbolTableSection &Sec) override;
106 void visit(const RelocationSection &Sec) override;
107 void visit(const GnuDebugLinkSection &Sec) override;
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000108 void visit(const GroupSection &Sec) override;
Jake Ehrlich76e91102018-01-25 22:46:17 +0000109
110 ELFSectionWriter(FileOutputBuffer &Buf) : SectionWriter(Buf) {}
111};
112
// Expands to friend declarations that give SectionWriter and every
// ELFSectionWriter instantiation access to the private members of the class
// it is used in. The expansion already ends in ';', so uses carry none.
#define MAKE_SEC_WRITER_FRIEND                                                 \
  friend class SectionWriter;                                                  \
  template <class ELFT> friend class ELFSectionWriter;
116
117class BinarySectionWriter : public SectionWriter {
118public:
119 virtual ~BinarySectionWriter() {}
120
121 void visit(const SymbolTableSection &Sec) override;
122 void visit(const RelocationSection &Sec) override;
123 void visit(const GnuDebugLinkSection &Sec) override;
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000124 void visit(const GroupSection &Sec) override;
125
Jake Ehrlich76e91102018-01-25 22:46:17 +0000126 BinarySectionWriter(FileOutputBuffer &Buf) : SectionWriter(Buf) {}
127};
128
129class Writer {
130protected:
131 StringRef File;
132 Object &Obj;
133 std::unique_ptr<FileOutputBuffer> BufPtr;
134
135 void createBuffer(uint64_t Size);
136
137public:
138 virtual ~Writer();
139
140 virtual void finalize() = 0;
141 virtual void write() = 0;
142
143 Writer(StringRef File, Object &Obj) : File(File), Obj(Obj) {}
144};
145
146template <class ELFT> class ELFWriter : public Writer {
147private:
148 using Elf_Shdr = typename ELFT::Shdr;
149 using Elf_Phdr = typename ELFT::Phdr;
150 using Elf_Ehdr = typename ELFT::Ehdr;
151
152 void writeEhdr();
153 void writePhdr(const Segment &Seg);
154 void writeShdr(const SectionBase &Sec);
155
156 void writePhdrs();
157 void writeShdrs();
158 void writeSectionData();
159
160 void assignOffsets();
161
162 std::unique_ptr<ELFSectionWriter<ELFT>> SecWriter;
163
164 size_t totalSize() const;
165
166public:
167 virtual ~ELFWriter() {}
168 bool WriteSectionHeaders = true;
169
170 void finalize() override;
171 void write() override;
172 ELFWriter(StringRef File, Object &Obj, bool WSH)
173 : Writer(File, Obj), WriteSectionHeaders(WSH) {}
174};
175
176class BinaryWriter : public Writer {
177private:
178 std::unique_ptr<BinarySectionWriter> SecWriter;
179
180 uint64_t TotalSize;
181
182public:
183 ~BinaryWriter() {}
184 void finalize() override;
185 void write() override;
186 BinaryWriter(StringRef File, Object &Obj) : Writer(File, Obj) {}
187};
188
Petr Hosek05a04cb2017-08-01 00:33:58 +0000189class SectionBase {
190public:
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000191 StringRef Name;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000192 Segment *ParentSegment = nullptr;
193 uint64_t HeaderOffset;
194 uint64_t OriginalOffset;
195 uint32_t Index;
196
197 uint64_t Addr = 0;
198 uint64_t Align = 1;
199 uint32_t EntrySize = 0;
200 uint64_t Flags = 0;
201 uint64_t Info = 0;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000202 uint64_t Link = ELF::SHN_UNDEF;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000203 uint64_t NameIndex = 0;
204 uint64_t Offset = 0;
205 uint64_t Size = 0;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000206 uint64_t Type = ELF::SHT_NULL;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000207
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000208 virtual ~SectionBase() = default;
209
Jake Ehrlichf5a43772017-09-25 20:37:28 +0000210 virtual void initialize(SectionTableRef SecTable);
Petr Hosek05a04cb2017-08-01 00:33:58 +0000211 virtual void finalize();
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000212 virtual void removeSectionReferences(const SectionBase *Sec);
Paul Semel4246a462018-05-09 21:36:54 +0000213 virtual void removeSymbols(function_ref<bool(const Symbol &)> ToRemove);
Jake Ehrlich76e91102018-01-25 22:46:17 +0000214 virtual void accept(SectionVisitor &Visitor) const = 0;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000215};
216
217class Segment {
218private:
219 struct SectionCompare {
220 bool operator()(const SectionBase *Lhs, const SectionBase *Rhs) const {
221 // Some sections might have the same address if one of them is empty. To
222 // fix this we can use the lexicographic ordering on ->Addr and the
223 // address of the actully stored section.
224 if (Lhs->OriginalOffset == Rhs->OriginalOffset)
225 return Lhs < Rhs;
226 return Lhs->OriginalOffset < Rhs->OriginalOffset;
227 }
228 };
229
230 std::set<const SectionBase *, SectionCompare> Sections;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000231 ArrayRef<uint8_t> Contents;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000232
233public:
234 uint64_t Align;
235 uint64_t FileSize;
236 uint32_t Flags;
237 uint32_t Index;
238 uint64_t MemSize;
239 uint64_t Offset;
240 uint64_t PAddr;
241 uint64_t Type;
242 uint64_t VAddr;
243
Petr Hosek3f383832017-08-26 01:32:20 +0000244 uint64_t OriginalOffset;
Jake Ehrlichd246b0a2017-09-19 21:37:35 +0000245 Segment *ParentSegment = nullptr;
Petr Hosek3f383832017-08-26 01:32:20 +0000246
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000247 explicit Segment(ArrayRef<uint8_t> Data) : Contents(Data) {}
Jake Ehrlich6452b112018-02-14 23:31:33 +0000248 Segment() {}
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000249
Petr Hosek05a04cb2017-08-01 00:33:58 +0000250 const SectionBase *firstSection() const {
251 if (!Sections.empty())
252 return *Sections.begin();
253 return nullptr;
254 }
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000255
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000256 void removeSection(const SectionBase *Sec) { Sections.erase(Sec); }
257 void addSection(const SectionBase *Sec) { Sections.insert(Sec); }
Petr Hosek05a04cb2017-08-01 00:33:58 +0000258};
259
260class Section : public SectionBase {
Jake Ehrlich76e91102018-01-25 22:46:17 +0000261 MAKE_SEC_WRITER_FRIEND
262
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000263 ArrayRef<uint8_t> Contents;
Alexander Shaposhnikov52db4332018-04-20 20:46:04 +0000264 SectionBase *LinkSection = nullptr;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000265
266public:
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000267 explicit Section(ArrayRef<uint8_t> Data) : Contents(Data) {}
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000268
Jake Ehrlich76e91102018-01-25 22:46:17 +0000269 void accept(SectionVisitor &Visitor) const override;
Alexander Shaposhnikov52db4332018-04-20 20:46:04 +0000270 void removeSectionReferences(const SectionBase *Sec) override;
271 void initialize(SectionTableRef SecTable) override;
272 void finalize() override;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000273};
274
Jake Ehrliche8437de2017-12-19 00:47:30 +0000275class OwnedDataSection : public SectionBase {
Jake Ehrlich76e91102018-01-25 22:46:17 +0000276 MAKE_SEC_WRITER_FRIEND
277
Jake Ehrliche8437de2017-12-19 00:47:30 +0000278 std::vector<uint8_t> Data;
279
280public:
281 OwnedDataSection(StringRef SecName, ArrayRef<uint8_t> Data)
282 : Data(std::begin(Data), std::end(Data)) {
283 Name = SecName;
284 Type = ELF::SHT_PROGBITS;
285 Size = Data.size();
Jake Ehrlich76e91102018-01-25 22:46:17 +0000286 OriginalOffset = std::numeric_limits<uint64_t>::max();
Jake Ehrliche8437de2017-12-19 00:47:30 +0000287 }
Jake Ehrlich76e91102018-01-25 22:46:17 +0000288
289 void accept(SectionVisitor &Sec) const override;
Jake Ehrliche8437de2017-12-19 00:47:30 +0000290};
291
Jake Ehrlich70bd75f2017-10-10 21:28:22 +0000292// There are two types of string tables that can exist, dynamic and not dynamic.
293// In the dynamic case the string table is allocated. Changing a dynamic string
294// table would mean altering virtual addresses and thus the memory image. So
295// dynamic string tables should not have an interface to modify them or
296// reconstruct them. This type lets us reconstruct a string table. To avoid
297// this class being used for dynamic string tables (which has happened) the
298// classof method checks that the particular instance is not allocated. This
299// then agrees with the makeSection method used to construct most sections.
Petr Hosek05a04cb2017-08-01 00:33:58 +0000300class StringTableSection : public SectionBase {
Jake Ehrlich76e91102018-01-25 22:46:17 +0000301 MAKE_SEC_WRITER_FRIEND
302
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000303 StringTableBuilder StrTabBuilder;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000304
305public:
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000306 StringTableSection() : StrTabBuilder(StringTableBuilder::ELF) {
307 Type = ELF::SHT_STRTAB;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000308 }
309
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000310 void addString(StringRef Name);
311 uint32_t findIndex(StringRef Name) const;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000312 void finalize() override;
Jake Ehrlich76e91102018-01-25 22:46:17 +0000313 void accept(SectionVisitor &Visitor) const override;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000314
Petr Hosek05a04cb2017-08-01 00:33:58 +0000315 static bool classof(const SectionBase *S) {
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000316 if (S->Flags & ELF::SHF_ALLOC)
Jake Ehrlich70bd75f2017-10-10 21:28:22 +0000317 return false;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000318 return S->Type == ELF::SHT_STRTAB;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000319 }
320};
321
Petr Hosekec2b3fc2017-09-07 23:02:50 +0000322// Symbols have a st_shndx field that normally stores an index but occasionally
323// stores a different special value. This enum keeps track of what the st_shndx
324// field means. Most of the values are just copies of the special SHN_* values.
325// SYMBOL_SIMPLE_INDEX means that the st_shndx is just an index of a section.
326enum SymbolShndxType {
327 SYMBOL_SIMPLE_INDEX = 0,
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000328 SYMBOL_ABS = ELF::SHN_ABS,
329 SYMBOL_COMMON = ELF::SHN_COMMON,
330 SYMBOL_HEXAGON_SCOMMON = ELF::SHN_HEXAGON_SCOMMON,
331 SYMBOL_HEXAGON_SCOMMON_2 = ELF::SHN_HEXAGON_SCOMMON_2,
332 SYMBOL_HEXAGON_SCOMMON_4 = ELF::SHN_HEXAGON_SCOMMON_4,
333 SYMBOL_HEXAGON_SCOMMON_8 = ELF::SHN_HEXAGON_SCOMMON_8,
Petr Hosekec2b3fc2017-09-07 23:02:50 +0000334};
335
Petr Hosek79cee9e2017-08-29 02:12:03 +0000336struct Symbol {
337 uint8_t Binding;
Jake Ehrliched95fce2017-09-27 00:44:00 +0000338 SectionBase *DefinedIn = nullptr;
Petr Hosekec2b3fc2017-09-07 23:02:50 +0000339 SymbolShndxType ShndxType;
Petr Hosek79cee9e2017-08-29 02:12:03 +0000340 uint32_t Index;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000341 StringRef Name;
Petr Hosek79cee9e2017-08-29 02:12:03 +0000342 uint32_t NameIndex;
343 uint64_t Size;
344 uint8_t Type;
345 uint64_t Value;
Jake Ehrlich30d927a2018-01-02 23:01:24 +0000346 uint8_t Visibility;
Petr Hosekec2b3fc2017-09-07 23:02:50 +0000347
348 uint16_t getShndx() const;
Petr Hosek79cee9e2017-08-29 02:12:03 +0000349};
350
351class SymbolTableSection : public SectionBase {
Jake Ehrlich76e91102018-01-25 22:46:17 +0000352 MAKE_SEC_WRITER_FRIEND
353
Alexander Shaposhnikova8f15502018-02-24 00:41:01 +0000354 void setStrTab(StringTableSection *StrTab) { SymbolNames = StrTab; }
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000355 void assignIndices();
Alexander Shaposhnikova8f15502018-02-24 00:41:01 +0000356
Petr Hosek79cee9e2017-08-29 02:12:03 +0000357protected:
358 std::vector<std::unique_ptr<Symbol>> Symbols;
Jake Ehrliched95fce2017-09-27 00:44:00 +0000359 StringTableSection *SymbolNames = nullptr;
Petr Hosek79cee9e2017-08-29 02:12:03 +0000360
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000361 using SymPtr = std::unique_ptr<Symbol>;
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000362
Petr Hosek79cee9e2017-08-29 02:12:03 +0000363public:
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000364 void addSymbol(StringRef Name, uint8_t Bind, uint8_t Type,
Jake Ehrlich30d927a2018-01-02 23:01:24 +0000365 SectionBase *DefinedIn, uint64_t Value, uint8_t Visibility,
366 uint16_t Shndx, uint64_t Sz);
Jake Ehrlich8b831c12018-03-07 20:33:02 +0000367 void addSymbolNames();
Jake Ehrlichef3b80c2017-11-30 20:14:53 +0000368 const SectionBase *getStrTab() const { return SymbolNames; }
Petr Hosek79cee9e2017-08-29 02:12:03 +0000369 const Symbol *getSymbolByIndex(uint32_t Index) const;
Alexander Shaposhnikov40e9bdf2018-04-26 18:28:17 +0000370 void updateSymbols(function_ref<void(Symbol &)> Callable);
371
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000372 void removeSectionReferences(const SectionBase *Sec) override;
Jake Ehrlichf5a43772017-09-25 20:37:28 +0000373 void initialize(SectionTableRef SecTable) override;
Petr Hosek79cee9e2017-08-29 02:12:03 +0000374 void finalize() override;
Jake Ehrlich76e91102018-01-25 22:46:17 +0000375 void accept(SectionVisitor &Visitor) const override;
Paul Semel4246a462018-05-09 21:36:54 +0000376 void removeSymbols(function_ref<bool(const Symbol &)> ToRemove) override;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000377
Petr Hosek79cee9e2017-08-29 02:12:03 +0000378 static bool classof(const SectionBase *S) {
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000379 return S->Type == ELF::SHT_SYMTAB;
Petr Hosek79cee9e2017-08-29 02:12:03 +0000380 }
381};
382
Petr Hosekd7df9b22017-09-06 23:41:02 +0000383struct Relocation {
Paul Semel31a212d2018-05-22 01:04:36 +0000384 const Symbol *RelocSymbol = nullptr;
Petr Hosekd7df9b22017-09-06 23:41:02 +0000385 uint64_t Offset;
386 uint64_t Addend;
387 uint32_t Type;
388};
389
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000390// All relocation sections denote relocations to apply to another section.
391// However, some relocation sections use a dynamic symbol table and others use
392// a regular symbol table. Because the types of the two symbol tables differ in
393// our system (because they should behave differently) we can't uniformly
394// represent all relocations with the same base class if we expose an interface
395// that mentions the symbol table type. So we split the two base types into two
396// different classes, one which handles the section the relocation is applied to
397// and another which handles the symbol table type. The symbol table type is
398// taken as a type parameter to the class (see RelocSectionWithSymtabBase).
399class RelocationSectionBase : public SectionBase {
400protected:
Jake Ehrliched95fce2017-09-27 00:44:00 +0000401 SectionBase *SecToApplyRel = nullptr;
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000402
403public:
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000404 const SectionBase *getSection() const { return SecToApplyRel; }
Jake Ehrlichc5ff7272017-10-10 18:32:22 +0000405 void setSection(SectionBase *Sec) { SecToApplyRel = Sec; }
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000406
407 static bool classof(const SectionBase *S) {
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000408 return S->Type == ELF::SHT_REL || S->Type == ELF::SHT_RELA;
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000409 }
410};
411
412// Takes the symbol table type to use as a parameter so that we can deduplicate
413// that code between the two symbol table types.
414template <class SymTabType>
415class RelocSectionWithSymtabBase : public RelocationSectionBase {
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000416 SymTabType *Symbols = nullptr;
Alexander Shaposhnikova8f15502018-02-24 00:41:01 +0000417 void setSymTab(SymTabType *SymTab) { Symbols = SymTab; }
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000418
419protected:
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000420 RelocSectionWithSymtabBase() = default;
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000421
422public:
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000423 void removeSectionReferences(const SectionBase *Sec) override;
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000424 void initialize(SectionTableRef SecTable) override;
425 void finalize() override;
426};
427
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000428class RelocationSection
429 : public RelocSectionWithSymtabBase<SymbolTableSection> {
Jake Ehrlich76e91102018-01-25 22:46:17 +0000430 MAKE_SEC_WRITER_FRIEND
431
Petr Hosekd7df9b22017-09-06 23:41:02 +0000432 std::vector<Relocation> Relocations;
Petr Hosekd7df9b22017-09-06 23:41:02 +0000433
Petr Hosekd7df9b22017-09-06 23:41:02 +0000434public:
Petr Hosekd7df9b22017-09-06 23:41:02 +0000435 void addRelocation(Relocation Rel) { Relocations.push_back(Rel); }
Jake Ehrlich76e91102018-01-25 22:46:17 +0000436 void accept(SectionVisitor &Visitor) const override;
Paul Semel4246a462018-05-09 21:36:54 +0000437 void removeSymbols(function_ref<bool(const Symbol &)> ToRemove) override;
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000438
Petr Hosekd7df9b22017-09-06 23:41:02 +0000439 static bool classof(const SectionBase *S) {
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000440 if (S->Flags & ELF::SHF_ALLOC)
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000441 return false;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000442 return S->Type == ELF::SHT_REL || S->Type == ELF::SHT_RELA;
Petr Hosekd7df9b22017-09-06 23:41:02 +0000443 }
444};
445
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000446// TODO: The way stripping and groups interact is complicated
447// and still needs to be worked on.
448
449class GroupSection : public SectionBase {
450 MAKE_SEC_WRITER_FRIEND
451 const SymbolTableSection *SymTab = nullptr;
Paul Semel31a212d2018-05-22 01:04:36 +0000452 const Symbol *Sym = nullptr;
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000453 ELF::Elf32_Word FlagWord;
454 SmallVector<SectionBase *, 3> GroupMembers;
Alexander Shaposhnikov43b8acd2018-03-20 18:20:42 +0000455
456public:
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000457 // TODO: Contents is present in several classes of the hierarchy.
458 // This needs to be refactored to avoid duplication.
459 ArrayRef<uint8_t> Contents;
Alexander Shaposhnikov3b24ed72018-03-20 19:46:00 +0000460
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000461 explicit GroupSection(ArrayRef<uint8_t> Data) : Contents(Data) {}
462
463 void setSymTab(const SymbolTableSection *SymTabSec) { SymTab = SymTabSec; }
Paul Semel31a212d2018-05-22 01:04:36 +0000464 void setSymbol(const Symbol *S) { Sym = S; }
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000465 void setFlagWord(ELF::Elf32_Word W) { FlagWord = W; }
466 void addMember(SectionBase *Sec) { GroupMembers.push_back(Sec); }
467
Alexander Shaposhnikov52db4332018-04-20 20:46:04 +0000468 void initialize(SectionTableRef SecTable) override{};
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000469 void accept(SectionVisitor &) const override;
470 void finalize() override;
Paul Semel4246a462018-05-09 21:36:54 +0000471 void removeSymbols(function_ref<bool(const Symbol &)> ToRemove) override;
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000472
473 static bool classof(const SectionBase *S) {
474 return S->Type == ELF::SHT_GROUP;
475 }
476};
477
Alexander Shaposhnikov52db4332018-04-20 20:46:04 +0000478class DynamicSymbolTableSection : public Section {
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000479public:
Alexander Shaposhnikov52db4332018-04-20 20:46:04 +0000480 explicit DynamicSymbolTableSection(ArrayRef<uint8_t> Data) : Section(Data) {}
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000481
Jake Ehrliche5d424b2017-09-20 17:11:58 +0000482 static bool classof(const SectionBase *S) {
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000483 return S->Type == ELF::SHT_DYNSYM;
Jake Ehrliche5d424b2017-09-20 17:11:58 +0000484 }
485};
486
Alexander Shaposhnikov52db4332018-04-20 20:46:04 +0000487class DynamicSection : public Section {
Jake Ehrliche5d424b2017-09-20 17:11:58 +0000488public:
Alexander Shaposhnikov52db4332018-04-20 20:46:04 +0000489 explicit DynamicSection(ArrayRef<uint8_t> Data) : Section(Data) {}
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000490
Jake Ehrliche5d424b2017-09-20 17:11:58 +0000491 static bool classof(const SectionBase *S) {
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000492 return S->Type == ELF::SHT_DYNAMIC;
Jake Ehrliche5d424b2017-09-20 17:11:58 +0000493 }
494};
495
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000496class DynamicRelocationSection
Jake Ehrlich36a2eb32017-10-10 18:47:09 +0000497 : public RelocSectionWithSymtabBase<DynamicSymbolTableSection> {
Jake Ehrlich76e91102018-01-25 22:46:17 +0000498 MAKE_SEC_WRITER_FRIEND
499
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000500private:
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000501 ArrayRef<uint8_t> Contents;
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000502
503public:
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000504 explicit DynamicRelocationSection(ArrayRef<uint8_t> Data) : Contents(Data) {}
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000505
Jake Ehrlich76e91102018-01-25 22:46:17 +0000506 void accept(SectionVisitor &) const override;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000507
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000508 static bool classof(const SectionBase *S) {
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000509 if (!(S->Flags & ELF::SHF_ALLOC))
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000510 return false;
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000511 return S->Type == ELF::SHT_REL || S->Type == ELF::SHT_RELA;
Jake Ehrlich9f1a3902017-09-26 18:02:25 +0000512 }
513};
514
Jake Ehrlich76e91102018-01-25 22:46:17 +0000515class GnuDebugLinkSection : public SectionBase {
516 MAKE_SEC_WRITER_FRIEND
517
Jake Ehrlichea07d3c2018-01-25 22:15:14 +0000518private:
Jake Ehrlichea07d3c2018-01-25 22:15:14 +0000519 StringRef FileName;
520 uint32_t CRC32;
521
522 void init(StringRef File, StringRef Data);
523
524public:
525 // If we add this section from an external source we can use this ctor.
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000526 explicit GnuDebugLinkSection(StringRef File);
Jake Ehrlich76e91102018-01-25 22:46:17 +0000527 void accept(SectionVisitor &Visitor) const override;
Jake Ehrlichea07d3c2018-01-25 22:15:14 +0000528};
529
Jake Ehrlich76e91102018-01-25 22:46:17 +0000530class Reader {
531public:
532 virtual ~Reader();
533 virtual std::unique_ptr<Object> create() const = 0;
534};
535
Jake Ehrlich76e91102018-01-25 22:46:17 +0000536using object::Binary;
537using object::ELFFile;
538using object::ELFObjectFile;
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000539using object::OwningBinary;
Jake Ehrlich76e91102018-01-25 22:46:17 +0000540
541template <class ELFT> class ELFBuilder {
542private:
Jake Ehrlich6452b112018-02-14 23:31:33 +0000543 using Elf_Addr = typename ELFT::Addr;
Jake Ehrlich76e91102018-01-25 22:46:17 +0000544 using Elf_Shdr = typename ELFT::Shdr;
Jake Ehrlich6452b112018-02-14 23:31:33 +0000545 using Elf_Ehdr = typename ELFT::Ehdr;
Jake Ehrlich76e91102018-01-25 22:46:17 +0000546
547 const ELFFile<ELFT> &ElfFile;
548 Object &Obj;
549
Jake Ehrlich6452b112018-02-14 23:31:33 +0000550 void setParentSegment(Segment &Child);
Jake Ehrlich76e91102018-01-25 22:46:17 +0000551 void readProgramHeaders();
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000552 void initGroupSection(GroupSection *GroupSec);
Jake Ehrlich76e91102018-01-25 22:46:17 +0000553 void initSymbolTable(SymbolTableSection *SymTab);
554 void readSectionHeaders();
555 SectionBase &makeSection(const Elf_Shdr &Shdr);
556
557public:
558 ELFBuilder(const ELFObjectFile<ELFT> &ElfObj, Object &Obj)
559 : ElfFile(*ElfObj.getELFFile()), Obj(Obj) {}
560
561 void build();
562};
563
564class ELFReader : public Reader {
565private:
Jake Ehrlich9634e182018-01-26 02:01:37 +0000566 std::unique_ptr<Binary> Bin;
Jake Ehrlich76e91102018-01-25 22:46:17 +0000567 std::shared_ptr<MemoryBuffer> Data;
568
569public:
570 ElfType getElfType() const;
571 std::unique_ptr<Object> create() const override;
572 ELFReader(StringRef File);
573};
574
575class Object {
Petr Hosek05a04cb2017-08-01 00:33:58 +0000576private:
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000577 using SecPtr = std::unique_ptr<SectionBase>;
578 using SegPtr = std::unique_ptr<Segment>;
Petr Hosek05a04cb2017-08-01 00:33:58 +0000579
Jake Ehrlich76e91102018-01-25 22:46:17 +0000580 std::shared_ptr<MemoryBuffer> OwnedData;
Petr Hosekc4df10e2017-08-04 21:09:26 +0000581 std::vector<SecPtr> Sections;
582 std::vector<SegPtr> Segments;
583
Petr Hosek05a04cb2017-08-01 00:33:58 +0000584public:
Jake Ehrlich76e91102018-01-25 22:46:17 +0000585 template <class T>
586 using Range = iterator_range<
587 pointee_iterator<typename std::vector<std::unique_ptr<T>>::iterator>>;
588
589 template <class T>
590 using ConstRange = iterator_range<pointee_iterator<
591 typename std::vector<std::unique_ptr<T>>::const_iterator>>;
592
Jake Ehrlich6452b112018-02-14 23:31:33 +0000593 // It is often the case that the ELF header and the program header table are
594 // not present in any segment. This could be a problem during file layout,
595 // because other segments may get assigned an offset where either of the
596 // two should reside, which will effectively corrupt the resulting binary.
597 // Other than that we use these segments to track program header offsets
598 // when they may not follow the ELF header.
599 Segment ElfHdrSegment;
600 Segment ProgramHdrSegment;
601
Petr Hosek05a04cb2017-08-01 00:33:58 +0000602 uint8_t Ident[16];
603 uint64_t Entry;
604 uint64_t SHOffset;
605 uint32_t Type;
606 uint32_t Machine;
607 uint32_t Version;
608 uint32_t Flags;
609
Jake Ehrlich76e91102018-01-25 22:46:17 +0000610 StringTableSection *SectionNames = nullptr;
611 SymbolTableSection *SymbolTable = nullptr;
612
Alexander Shaposhnikov6ecc6e62018-03-21 19:53:44 +0000613 explicit Object(std::shared_ptr<MemoryBuffer> Data)
614 : OwnedData(std::move(Data)) {}
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000615 virtual ~Object() = default;
616
Aaron Ballman09f46a72018-01-25 21:03:38 +0000617 void sortSections();
Jake Ehrlich76e91102018-01-25 22:46:17 +0000618 SectionTableRef sections() { return SectionTableRef(Sections); }
619 ConstRange<SectionBase> sections() const {
620 return make_pointee_range(Sections);
621 }
622 Range<Segment> segments() { return make_pointee_range(Segments); }
623 ConstRange<Segment> segments() const { return make_pointee_range(Segments); }
Aaron Ballman09f46a72018-01-25 21:03:38 +0000624
Jake Ehrlich76e91102018-01-25 22:46:17 +0000625 void removeSections(std::function<bool(const SectionBase &)> ToRemove);
Paul Semel4246a462018-05-09 21:36:54 +0000626 void removeSymbols(function_ref<bool(const Symbol &)> ToRemove);
Jake Ehrlich76e91102018-01-25 22:46:17 +0000627 template <class T, class... Ts> T &addSection(Ts &&... Args) {
628 auto Sec = llvm::make_unique<T>(std::forward<Ts>(Args)...);
629 auto Ptr = Sec.get();
630 Sections.emplace_back(std::move(Sec));
631 return *Ptr;
632 }
633 Segment &addSegment(ArrayRef<uint8_t> Data) {
634 Segments.emplace_back(llvm::make_unique<Segment>(Data));
635 return *Segments.back();
636 }
Petr Hosekc4df10e2017-08-04 21:09:26 +0000637};
Eugene Zelenko0ad18f82017-11-01 21:16:06 +0000638} // end namespace llvm
639
640#endif // LLVM_TOOLS_OBJCOPY_OBJECT_H