blob: 59a1164406c0ebe2cada55386d8811e9a06fc751 [file] [log] [blame]
Alexander Shaposhnikovd911ed12019-02-02 00:38:07 +00001//===- MachOWriter.cpp ------------------------------------------*- C++ -*-===//
2//
Chandler Carruth127252b2019-02-11 08:25:19 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Alexander Shaposhnikovd911ed12019-02-02 00:38:07 +00006//
7//===----------------------------------------------------------------------===//
8
9#include "MachOWriter.h"
Alexander Shaposhnikovd911ed12019-02-02 00:38:07 +000010#include "Object.h"
11#include "llvm/ADT/STLExtras.h"
12#include "llvm/BinaryFormat/MachO.h"
13#include "llvm/Object/MachO.h"
14#include <memory>
15
16namespace llvm {
17namespace objcopy {
18namespace macho {
19
20size_t MachOWriter::headerSize() const {
21 return Is64Bit ? sizeof(MachO::mach_header_64) : sizeof(MachO::mach_header);
22}
23
24size_t MachOWriter::loadCommandsSize() const { return O.Header.SizeOfCmds; }
25
26size_t MachOWriter::symTableSize() const {
27 return O.SymTable.NameList.size() *
28 (Is64Bit ? sizeof(MachO::nlist_64) : sizeof(MachO::nlist));
29}
30
31size_t MachOWriter::strTableSize() const {
32 size_t S = 0;
33 for (const auto &Str : O.StrTable.Strings)
34 S += Str.size();
35 S += (O.StrTable.Strings.empty() ? 0 : O.StrTable.Strings.size() - 1);
36 return S;
37}
38
39size_t MachOWriter::totalSize() const {
40 // Going from tail to head and looking for an appropriate "anchor" to
41 // calculate the total size assuming that all the offsets are either valid
42 // ("true") or 0 (0 indicates that the corresponding part is missing).
43
44 SmallVector<size_t, 7> Ends;
45 if (O.SymTabCommandIndex) {
46 const MachO::symtab_command &SymTabCommand =
47 O.LoadCommands[*O.SymTabCommandIndex]
48 .MachOLoadCommand.symtab_command_data;
49 if (SymTabCommand.symoff) {
50 assert((SymTabCommand.nsyms == O.SymTable.NameList.size()) &&
51 "Incorrect number of symbols");
52 Ends.push_back(SymTabCommand.symoff + symTableSize());
53 }
54 if (SymTabCommand.stroff) {
55 assert((SymTabCommand.strsize == strTableSize()) &&
56 "Incorrect string table size");
57 Ends.push_back(SymTabCommand.stroff + SymTabCommand.strsize);
58 }
59 }
60 if (O.DyLdInfoCommandIndex) {
61 const MachO::dyld_info_command &DyLdInfoCommand =
62 O.LoadCommands[*O.DyLdInfoCommandIndex]
63 .MachOLoadCommand.dyld_info_command_data;
64 if (DyLdInfoCommand.rebase_off) {
65 assert((DyLdInfoCommand.rebase_size == O.Rebases.Opcodes.size()) &&
66 "Incorrect rebase opcodes size");
67 Ends.push_back(DyLdInfoCommand.rebase_off + DyLdInfoCommand.rebase_size);
68 }
69 if (DyLdInfoCommand.bind_off) {
70 assert((DyLdInfoCommand.bind_size == O.Binds.Opcodes.size()) &&
71 "Incorrect bind opcodes size");
72 Ends.push_back(DyLdInfoCommand.bind_off + DyLdInfoCommand.bind_size);
73 }
74 if (DyLdInfoCommand.weak_bind_off) {
75 assert((DyLdInfoCommand.weak_bind_size == O.WeakBinds.Opcodes.size()) &&
76 "Incorrect weak bind opcodes size");
77 Ends.push_back(DyLdInfoCommand.weak_bind_off +
78 DyLdInfoCommand.weak_bind_size);
79 }
80 if (DyLdInfoCommand.lazy_bind_off) {
81 assert((DyLdInfoCommand.lazy_bind_size == O.LazyBinds.Opcodes.size()) &&
82 "Incorrect lazy bind opcodes size");
83 Ends.push_back(DyLdInfoCommand.lazy_bind_off +
84 DyLdInfoCommand.lazy_bind_size);
85 }
86 if (DyLdInfoCommand.export_off) {
87 assert((DyLdInfoCommand.export_size == O.Exports.Trie.size()) &&
88 "Incorrect trie size");
89 Ends.push_back(DyLdInfoCommand.export_off + DyLdInfoCommand.export_size);
90 }
91 }
92
93 // Otherwise, use the last section / reloction.
94 for (const auto &LC : O.LoadCommands)
95 for (const auto &S : LC.Sections) {
96 Ends.push_back(S.Offset + S.Size);
97 if (S.RelOff)
98 Ends.push_back(S.RelOff +
99 S.NReloc * sizeof(MachO::any_relocation_info));
100 }
101
102 if (!Ends.empty())
103 return *std::max_element(Ends.begin(), Ends.end());
104
105 // Otherwise, we have only Mach header and load commands.
106 return headerSize() + loadCommandsSize();
107}
108
109void MachOWriter::writeHeader() {
110 MachO::mach_header_64 Header;
111
112 Header.magic = O.Header.Magic;
113 Header.cputype = O.Header.CPUType;
114 Header.cpusubtype = O.Header.CPUSubType;
115 Header.filetype = O.Header.FileType;
116 Header.ncmds = O.Header.NCmds;
117 Header.sizeofcmds = O.Header.SizeOfCmds;
118 Header.flags = O.Header.Flags;
119 Header.reserved = O.Header.Reserved;
120
121 if (IsLittleEndian != sys::IsLittleEndianHost)
122 MachO::swapStruct(Header);
123
124 auto HeaderSize =
125 Is64Bit ? sizeof(MachO::mach_header_64) : sizeof(MachO::mach_header);
126 memcpy(B.getBufferStart(), &Header, HeaderSize);
127}
128
129void MachOWriter::writeLoadCommands() {
130 uint8_t *Begin = B.getBufferStart() + headerSize();
131 MachO::macho_load_command MLC;
132 for (const auto &LC : O.LoadCommands) {
133#define HANDLE_LOAD_COMMAND(LCName, LCValue, LCStruct) \
134 case MachO::LCName: \
135 assert(sizeof(MachO::LCStruct) + LC.Payload.size() == \
136 LC.MachOLoadCommand.load_command_data.cmdsize); \
137 MLC = LC.MachOLoadCommand; \
138 if (IsLittleEndian != sys::IsLittleEndianHost) \
139 MachO::swapStruct(MLC.LCStruct##_data); \
140 memcpy(Begin, &MLC.LCStruct##_data, sizeof(MachO::LCStruct)); \
141 Begin += sizeof(MachO::LCStruct); \
142 memcpy(Begin, LC.Payload.data(), LC.Payload.size()); \
143 Begin += LC.Payload.size(); \
144 break;
145
146 switch (LC.MachOLoadCommand.load_command_data.cmd) {
147 default:
148 assert(sizeof(MachO::load_command) + LC.Payload.size() ==
149 LC.MachOLoadCommand.load_command_data.cmdsize);
150 MLC = LC.MachOLoadCommand;
151 if (IsLittleEndian != sys::IsLittleEndianHost)
152 MachO::swapStruct(MLC.load_command_data);
153 memcpy(Begin, &MLC.load_command_data, sizeof(MachO::load_command));
154 Begin += sizeof(MachO::load_command);
155 memcpy(Begin, LC.Payload.data(), LC.Payload.size());
156 Begin += LC.Payload.size();
157 break;
158#include "llvm/BinaryFormat/MachO.def"
159 }
160 }
161}
162
163void MachOWriter::writeSections() {
164 for (const auto &LC : O.LoadCommands)
165 for (const auto &Sec : LC.Sections) {
166 assert(Sec.Offset && "Section offset can not be zero");
167 assert((Sec.Size == Sec.Content.size()) && "Incorrect section size");
168 memcpy(B.getBufferStart() + Sec.Offset, Sec.Content.data(),
169 Sec.Content.size());
170 for (size_t Index = 0; Index < Sec.Relocations.size(); ++Index) {
171 MachO::any_relocation_info R = Sec.Relocations[Index];
172 if (IsLittleEndian != sys::IsLittleEndianHost)
173 MachO::swapStruct(R);
174 memcpy(B.getBufferStart() + Sec.RelOff +
175 Index * sizeof(MachO::any_relocation_info),
176 &R, sizeof(R));
177 }
178 }
179}
180
181template <typename NListType>
182void writeNListEntry(const NListEntry &NLE, bool IsLittleEndian, char *&Out) {
183 NListType ListEntry;
184 ListEntry.n_strx = NLE.n_strx;
185 ListEntry.n_type = NLE.n_type;
186 ListEntry.n_sect = NLE.n_sect;
187 ListEntry.n_desc = NLE.n_desc;
188 ListEntry.n_value = NLE.n_value;
189
190 if (IsLittleEndian != sys::IsLittleEndianHost)
191 MachO::swapStruct(ListEntry);
192 memcpy(Out, reinterpret_cast<const char *>(&ListEntry), sizeof(NListType));
193 Out += sizeof(NListType);
194}
195
196void MachOWriter::writeSymbolTable() {
197 if (!O.SymTabCommandIndex)
198 return;
199 const MachO::symtab_command &SymTabCommand =
200 O.LoadCommands[*O.SymTabCommandIndex]
201 .MachOLoadCommand.symtab_command_data;
202 assert((SymTabCommand.nsyms == O.SymTable.NameList.size()) &&
203 "Incorrect number of symbols");
204 char *Out = (char *)B.getBufferStart() + SymTabCommand.symoff;
205 for (auto NLE : O.SymTable.NameList) {
206 if (Is64Bit)
207 writeNListEntry<MachO::nlist_64>(NLE, IsLittleEndian, Out);
208 else
209 writeNListEntry<MachO::nlist>(NLE, IsLittleEndian, Out);
210 }
211}
212
213void MachOWriter::writeStringTable() {
214 if (!O.SymTabCommandIndex)
215 return;
216 const MachO::symtab_command &SymTabCommand =
217 O.LoadCommands[*O.SymTabCommandIndex]
218 .MachOLoadCommand.symtab_command_data;
219 char *Out = (char *)B.getBufferStart() + SymTabCommand.stroff;
220 assert((SymTabCommand.strsize == strTableSize()) &&
221 "Incorrect string table size");
222 for (size_t Index = 0; Index < O.StrTable.Strings.size(); ++Index) {
223 memcpy(Out, O.StrTable.Strings[Index].data(),
224 O.StrTable.Strings[Index].size());
225 Out += O.StrTable.Strings[Index].size();
226 if (Index + 1 != O.StrTable.Strings.size()) {
227 memcpy(Out, "\0", 1);
228 Out += 1;
229 }
230 }
231}
232
233void MachOWriter::writeRebaseInfo() {
234 if (!O.DyLdInfoCommandIndex)
235 return;
236 const MachO::dyld_info_command &DyLdInfoCommand =
237 O.LoadCommands[*O.DyLdInfoCommandIndex]
238 .MachOLoadCommand.dyld_info_command_data;
239 char *Out = (char *)B.getBufferStart() + DyLdInfoCommand.rebase_off;
240 assert((DyLdInfoCommand.rebase_size == O.Rebases.Opcodes.size()) &&
241 "Incorrect rebase opcodes size");
242 memcpy(Out, O.Rebases.Opcodes.data(), O.Rebases.Opcodes.size());
243}
244
245void MachOWriter::writeBindInfo() {
246 if (!O.DyLdInfoCommandIndex)
247 return;
248 const MachO::dyld_info_command &DyLdInfoCommand =
249 O.LoadCommands[*O.DyLdInfoCommandIndex]
250 .MachOLoadCommand.dyld_info_command_data;
251 char *Out = (char *)B.getBufferStart() + DyLdInfoCommand.bind_off;
252 assert((DyLdInfoCommand.bind_size == O.Binds.Opcodes.size()) &&
253 "Incorrect bind opcodes size");
254 memcpy(Out, O.Binds.Opcodes.data(), O.Binds.Opcodes.size());
255}
256
257void MachOWriter::writeWeakBindInfo() {
258 if (!O.DyLdInfoCommandIndex)
259 return;
260 const MachO::dyld_info_command &DyLdInfoCommand =
261 O.LoadCommands[*O.DyLdInfoCommandIndex]
262 .MachOLoadCommand.dyld_info_command_data;
263 char *Out = (char *)B.getBufferStart() + DyLdInfoCommand.weak_bind_off;
264 assert((DyLdInfoCommand.weak_bind_size == O.WeakBinds.Opcodes.size()) &&
265 "Incorrect weak bind opcodes size");
266 memcpy(Out, O.WeakBinds.Opcodes.data(), O.WeakBinds.Opcodes.size());
267}
268
269void MachOWriter::writeLazyBindInfo() {
270 if (!O.DyLdInfoCommandIndex)
271 return;
272 const MachO::dyld_info_command &DyLdInfoCommand =
273 O.LoadCommands[*O.DyLdInfoCommandIndex]
274 .MachOLoadCommand.dyld_info_command_data;
275 char *Out = (char *)B.getBufferStart() + DyLdInfoCommand.lazy_bind_off;
276 assert((DyLdInfoCommand.lazy_bind_size == O.LazyBinds.Opcodes.size()) &&
277 "Incorrect lazy bind opcodes size");
278 memcpy(Out, O.LazyBinds.Opcodes.data(), O.LazyBinds.Opcodes.size());
279}
280
281void MachOWriter::writeExportInfo() {
282 if (!O.DyLdInfoCommandIndex)
283 return;
284 const MachO::dyld_info_command &DyLdInfoCommand =
285 O.LoadCommands[*O.DyLdInfoCommandIndex]
286 .MachOLoadCommand.dyld_info_command_data;
287 char *Out = (char *)B.getBufferStart() + DyLdInfoCommand.export_off;
288 assert((DyLdInfoCommand.export_size == O.Exports.Trie.size()) &&
289 "Incorrect export trie size");
290 memcpy(Out, O.Exports.Trie.data(), O.Exports.Trie.size());
291}
292
293void MachOWriter::writeTail() {
294 typedef void (MachOWriter::*WriteHandlerType)(void);
295 typedef std::pair<uint64_t, WriteHandlerType> WriteOperation;
296 SmallVector<WriteOperation, 7> Queue;
297
298 if (O.SymTabCommandIndex) {
299 const MachO::symtab_command &SymTabCommand =
300 O.LoadCommands[*O.SymTabCommandIndex]
301 .MachOLoadCommand.symtab_command_data;
302 if (SymTabCommand.symoff)
303 Queue.push_back({SymTabCommand.symoff, &MachOWriter::writeSymbolTable});
304 if (SymTabCommand.stroff)
305 Queue.push_back({SymTabCommand.stroff, &MachOWriter::writeStringTable});
306 }
307
308 if (O.DyLdInfoCommandIndex) {
309 const MachO::dyld_info_command &DyLdInfoCommand =
310 O.LoadCommands[*O.DyLdInfoCommandIndex]
311 .MachOLoadCommand.dyld_info_command_data;
312 if (DyLdInfoCommand.rebase_off)
313 Queue.push_back(
314 {DyLdInfoCommand.rebase_off, &MachOWriter::writeRebaseInfo});
315 if (DyLdInfoCommand.bind_off)
316 Queue.push_back({DyLdInfoCommand.bind_off, &MachOWriter::writeBindInfo});
317 if (DyLdInfoCommand.weak_bind_off)
318 Queue.push_back(
319 {DyLdInfoCommand.weak_bind_off, &MachOWriter::writeWeakBindInfo});
320 if (DyLdInfoCommand.lazy_bind_off)
321 Queue.push_back(
322 {DyLdInfoCommand.lazy_bind_off, &MachOWriter::writeLazyBindInfo});
323 if (DyLdInfoCommand.export_off)
324 Queue.push_back(
325 {DyLdInfoCommand.export_off, &MachOWriter::writeExportInfo});
326 }
327
328 llvm::sort(Queue, [](const WriteOperation &LHS, const WriteOperation &RHS) {
329 return LHS.first < RHS.first;
330 });
331
332 for (auto WriteOp : Queue)
333 (this->*WriteOp.second)();
334}
335
336Error MachOWriter::write() {
337 if (Error E = B.allocate(totalSize()))
338 return E;
339 memset(B.getBufferStart(), 0, totalSize());
340 writeHeader();
341 writeLoadCommands();
342 writeSections();
343 writeTail();
Jordan Rupprecht2e862c72019-02-04 19:09:20 +0000344 return B.commit();
Alexander Shaposhnikovd911ed12019-02-02 00:38:07 +0000345}
346
347} // end namespace macho
348} // end namespace objcopy
349} // end namespace llvm