blob: 9cdac8681dddae9cb4f9eb66e0e08ae9a1570480 [file] [log] [blame]
Daniel Dunbarfbd25b72010-11-27 05:38:50 +00001//===- MachOObject.cpp - Mach-O Object File Wrapper -----------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#include "llvm/Object/MachOObject.h"
Daniel Dunbar95369162010-11-27 06:39:22 +000011#include "llvm/ADT/StringRef.h"
Benjamin Kramerd4522462011-08-30 22:10:58 +000012#include "llvm/ADT/SmallVector.h"
Daniel Dunbarfbd25b72010-11-27 05:38:50 +000013#include "llvm/Support/MemoryBuffer.h"
Michael J. Spencer1f6efa32010-11-29 18:16:10 +000014#include "llvm/Support/Host.h"
15#include "llvm/Support/SwapByteOrder.h"
Eric Christopher592cf782011-04-03 23:51:47 +000016#include "llvm/Support/raw_ostream.h"
17#include "llvm/Support/Debug.h"
Daniel Dunbarfbd25b72010-11-27 05:38:50 +000018
19using namespace llvm;
Daniel Dunbara956d8b2010-11-27 07:19:41 +000020using namespace llvm::object;
21
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +000022/* Translation Utilities */
23
Daniel Dunbara956d8b2010-11-27 07:19:41 +000024template<typename T>
25static void SwapValue(T &Value) {
26 Value = sys::SwapByteOrder(Value);
27}
Daniel Dunbarfbd25b72010-11-27 05:38:50 +000028
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +000029template<typename T>
30static void SwapStruct(T &Value);
31
32template<typename T>
33static void ReadInMemoryStruct(const MachOObject &MOO,
34 StringRef Buffer, uint64_t Base,
35 InMemoryStruct<T> &Res) {
36 typedef T struct_type;
37 uint64_t Size = sizeof(struct_type);
38
39 // Check that the buffer contains the expected data.
40 if (Base + Size > Buffer.size()) {
41 Res = 0;
42 return;
43 }
44
45 // Check whether we can return a direct pointer.
46 struct_type *Ptr = (struct_type *) (Buffer.data() + Base);
47 if (!MOO.isSwappedEndian()) {
48 Res = Ptr;
49 return;
50 }
51
52 // Otherwise, copy the struct and translate the values.
53 Res = *Ptr;
54 SwapStruct(*Res);
55}
56
57/* *** */
58
Daniel Dunbar95369162010-11-27 06:39:22 +000059MachOObject::MachOObject(MemoryBuffer *Buffer_, bool IsLittleEndian_,
60 bool Is64Bit_)
Daniel Dunbara956d8b2010-11-27 07:19:41 +000061 : Buffer(Buffer_), IsLittleEndian(IsLittleEndian_), Is64Bit(Is64Bit_),
62 IsSwappedEndian(IsLittleEndian != sys::isLittleEndianHost()),
Daniel Dunbarf2e2a5f2010-11-27 13:46:11 +000063 HasStringTable(false), LoadCommands(0), NumLoadedCommands(0) {
Daniel Dunbara956d8b2010-11-27 07:19:41 +000064 // Load the common header.
65 memcpy(&Header, Buffer->getBuffer().data(), sizeof(Header));
66 if (IsSwappedEndian) {
67 SwapValue(Header.Magic);
68 SwapValue(Header.CPUType);
69 SwapValue(Header.CPUSubtype);
70 SwapValue(Header.FileType);
71 SwapValue(Header.NumLoadCommands);
72 SwapValue(Header.SizeOfLoadCommands);
73 SwapValue(Header.Flags);
74 }
75
76 if (is64Bit()) {
77 memcpy(&Header64Ext, Buffer->getBuffer().data() + sizeof(Header),
78 sizeof(Header64Ext));
79 if (IsSwappedEndian) {
80 SwapValue(Header64Ext.Reserved);
81 }
82 }
83
84 // Create the load command array if sane.
85 if (getHeader().NumLoadCommands < (1 << 20))
86 LoadCommands = new LoadCommandInfo[getHeader().NumLoadCommands];
87}
88
89MachOObject::~MachOObject() {
Benjamin Kramer23dcd002010-12-17 09:56:50 +000090 delete [] LoadCommands;
Daniel Dunbarfbd25b72010-11-27 05:38:50 +000091}
92
93MachOObject *MachOObject::LoadFromBuffer(MemoryBuffer *Buffer,
94 std::string *ErrorStr) {
Daniel Dunbar95369162010-11-27 06:39:22 +000095 // First, check the magic value and initialize the basic object info.
96 bool IsLittleEndian = false, Is64Bit = false;
97 StringRef Magic = Buffer->getBuffer().slice(0, 4);
98 if (Magic == "\xFE\xED\xFA\xCE") {
99 } else if (Magic == "\xCE\xFA\xED\xFE") {
100 IsLittleEndian = true;
101 } else if (Magic == "\xFE\xED\xFA\xCF") {
102 Is64Bit = true;
103 } else if (Magic == "\xCF\xFA\xED\xFE") {
104 IsLittleEndian = true;
105 Is64Bit = true;
106 } else {
Daniel Dunbara956d8b2010-11-27 07:19:41 +0000107 if (ErrorStr) *ErrorStr = "not a Mach object file (invalid magic)";
108 return 0;
109 }
110
111 // Ensure that the at least the full header is present.
112 unsigned HeaderSize = Is64Bit ? macho::Header64Size : macho::Header32Size;
113 if (Buffer->getBufferSize() < HeaderSize) {
114 if (ErrorStr) *ErrorStr = "not a Mach object file (invalid header)";
Daniel Dunbar95369162010-11-27 06:39:22 +0000115 return 0;
116 }
117
118 OwningPtr<MachOObject> Object(new MachOObject(Buffer, IsLittleEndian,
119 Is64Bit));
120
Daniel Dunbara956d8b2010-11-27 07:19:41 +0000121 // Check for bogus number of load commands.
122 if (Object->getHeader().NumLoadCommands >= (1 << 20)) {
123 if (ErrorStr) *ErrorStr = "not a Mach object file (unreasonable header)";
124 return 0;
125 }
126
Daniel Dunbarfbd25b72010-11-27 05:38:50 +0000127 if (ErrorStr) *ErrorStr = "";
Daniel Dunbar95369162010-11-27 06:39:22 +0000128 return Object.take();
Daniel Dunbarfbd25b72010-11-27 05:38:50 +0000129}
Daniel Dunbara956d8b2010-11-27 07:19:41 +0000130
Daniel Dunbar71130f82010-11-27 13:58:16 +0000131StringRef MachOObject::getData(size_t Offset, size_t Size) const {
132 return Buffer->getBuffer().substr(Offset,Size);
133}
134
Daniel Dunbarf2e2a5f2010-11-27 13:46:11 +0000135void MachOObject::RegisterStringTable(macho::SymtabLoadCommand &SLC) {
136 HasStringTable = true;
137 StringTable = Buffer->getBuffer().substr(SLC.StringTableOffset,
138 SLC.StringTableSize);
139}
140
Daniel Dunbara956d8b2010-11-27 07:19:41 +0000141const MachOObject::LoadCommandInfo &
142MachOObject::getLoadCommandInfo(unsigned Index) const {
143 assert(Index < getHeader().NumLoadCommands && "Invalid index!");
144
145 // Load the command, if necessary.
146 if (Index >= NumLoadedCommands) {
147 uint64_t Offset;
148 if (Index == 0) {
149 Offset = getHeaderSize();
150 } else {
151 const LoadCommandInfo &Prev = getLoadCommandInfo(Index - 1);
152 Offset = Prev.Offset + Prev.Command.Size;
153 }
154
155 LoadCommandInfo &Info = LoadCommands[Index];
156 memcpy(&Info.Command, Buffer->getBuffer().data() + Offset,
157 sizeof(macho::LoadCommand));
158 if (IsSwappedEndian) {
159 SwapValue(Info.Command.Type);
160 SwapValue(Info.Command.Size);
161 }
162 Info.Offset = Offset;
163 NumLoadedCommands = Index + 1;
164 }
165
166 return LoadCommands[Index];
167}
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +0000168
169template<>
Benjamin Kramer3946e3b2010-11-27 09:08:25 +0000170void SwapStruct(macho::SegmentLoadCommand &Value) {
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +0000171 SwapValue(Value.Type);
172 SwapValue(Value.Size);
173 SwapValue(Value.VMAddress);
174 SwapValue(Value.VMSize);
175 SwapValue(Value.FileOffset);
176 SwapValue(Value.FileSize);
177 SwapValue(Value.MaxVMProtection);
178 SwapValue(Value.InitialVMProtection);
179 SwapValue(Value.NumSections);
180 SwapValue(Value.Flags);
181}
182void MachOObject::ReadSegmentLoadCommand(const LoadCommandInfo &LCI,
183 InMemoryStruct<macho::SegmentLoadCommand> &Res) const {
184 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
185}
186
187template<>
Benjamin Kramer3946e3b2010-11-27 09:08:25 +0000188void SwapStruct(macho::Segment64LoadCommand &Value) {
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +0000189 SwapValue(Value.Type);
190 SwapValue(Value.Size);
191 SwapValue(Value.VMAddress);
192 SwapValue(Value.VMSize);
193 SwapValue(Value.FileOffset);
194 SwapValue(Value.FileSize);
195 SwapValue(Value.MaxVMProtection);
196 SwapValue(Value.InitialVMProtection);
197 SwapValue(Value.NumSections);
198 SwapValue(Value.Flags);
199}
200void MachOObject::ReadSegment64LoadCommand(const LoadCommandInfo &LCI,
201 InMemoryStruct<macho::Segment64LoadCommand> &Res) const {
202 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
203}
Daniel Dunbarf879f142010-11-27 08:33:44 +0000204
205template<>
Benjamin Kramer3946e3b2010-11-27 09:08:25 +0000206void SwapStruct(macho::SymtabLoadCommand &Value) {
Daniel Dunbarf879f142010-11-27 08:33:44 +0000207 SwapValue(Value.Type);
208 SwapValue(Value.Size);
209 SwapValue(Value.SymbolTableOffset);
210 SwapValue(Value.NumSymbolTableEntries);
211 SwapValue(Value.StringTableOffset);
212 SwapValue(Value.StringTableSize);
213}
214void MachOObject::ReadSymtabLoadCommand(const LoadCommandInfo &LCI,
215 InMemoryStruct<macho::SymtabLoadCommand> &Res) const {
216 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
217}
218
219template<>
Benjamin Kramer3946e3b2010-11-27 09:08:25 +0000220void SwapStruct(macho::DysymtabLoadCommand &Value) {
Daniel Dunbarf879f142010-11-27 08:33:44 +0000221 SwapValue(Value.Type);
222 SwapValue(Value.Size);
Daniel Dunbara87d7ec2010-12-10 06:19:39 +0000223 SwapValue(Value.LocalSymbolsIndex);
Daniel Dunbarf879f142010-11-27 08:33:44 +0000224 SwapValue(Value.NumLocalSymbols);
225 SwapValue(Value.ExternalSymbolsIndex);
226 SwapValue(Value.NumExternalSymbols);
227 SwapValue(Value.UndefinedSymbolsIndex);
228 SwapValue(Value.NumUndefinedSymbols);
229 SwapValue(Value.TOCOffset);
230 SwapValue(Value.NumTOCEntries);
231 SwapValue(Value.ModuleTableOffset);
232 SwapValue(Value.NumModuleTableEntries);
233 SwapValue(Value.ReferenceSymbolTableOffset);
234 SwapValue(Value.NumReferencedSymbolTableEntries);
235 SwapValue(Value.IndirectSymbolTableOffset);
236 SwapValue(Value.NumIndirectSymbolTableEntries);
237 SwapValue(Value.ExternalRelocationTableOffset);
238 SwapValue(Value.NumExternalRelocationTableEntries);
239 SwapValue(Value.LocalRelocationTableOffset);
240 SwapValue(Value.NumLocalRelocationTableEntries);
241}
242void MachOObject::ReadDysymtabLoadCommand(const LoadCommandInfo &LCI,
243 InMemoryStruct<macho::DysymtabLoadCommand> &Res) const {
244 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
245}
Daniel Dunbar4c55e0d2010-11-27 13:26:12 +0000246
247template<>
Benjamin Kramer9942aca2011-08-30 18:33:37 +0000248void SwapStruct(macho::LinkeditDataLoadCommand &Value) {
249 SwapValue(Value.Type);
250 SwapValue(Value.Size);
251 SwapValue(Value.DataOffset);
252 SwapValue(Value.DataSize);
253}
254void MachOObject::ReadLinkeditDataLoadCommand(const LoadCommandInfo &LCI,
255 InMemoryStruct<macho::LinkeditDataLoadCommand> &Res) const {
256 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
257}
258
259template<>
Daniel Dunbar4c55e0d2010-11-27 13:26:12 +0000260void SwapStruct(macho::IndirectSymbolTableEntry &Value) {
261 SwapValue(Value.Index);
262}
263void
264MachOObject::ReadIndirectSymbolTableEntry(const macho::DysymtabLoadCommand &DLC,
265 unsigned Index,
266 InMemoryStruct<macho::IndirectSymbolTableEntry> &Res) const {
267 uint64_t Offset = (DLC.IndirectSymbolTableOffset +
268 Index * sizeof(macho::IndirectSymbolTableEntry));
269 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
270}
Daniel Dunbar2acadbd2010-11-27 13:33:15 +0000271
272
273template<>
274void SwapStruct(macho::Section &Value) {
275 SwapValue(Value.Address);
276 SwapValue(Value.Size);
277 SwapValue(Value.Offset);
278 SwapValue(Value.Align);
279 SwapValue(Value.RelocationTableOffset);
280 SwapValue(Value.NumRelocationTableEntries);
281 SwapValue(Value.Flags);
282 SwapValue(Value.Reserved1);
283 SwapValue(Value.Reserved2);
284}
285void MachOObject::ReadSection(const LoadCommandInfo &LCI,
286 unsigned Index,
287 InMemoryStruct<macho::Section> &Res) const {
288 assert(LCI.Command.Type == macho::LCT_Segment &&
289 "Unexpected load command info!");
290 uint64_t Offset = (LCI.Offset + sizeof(macho::SegmentLoadCommand) +
291 Index * sizeof(macho::Section));
292 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
293}
294
295template<>
296void SwapStruct(macho::Section64 &Value) {
297 SwapValue(Value.Address);
298 SwapValue(Value.Size);
299 SwapValue(Value.Offset);
300 SwapValue(Value.Align);
301 SwapValue(Value.RelocationTableOffset);
302 SwapValue(Value.NumRelocationTableEntries);
303 SwapValue(Value.Flags);
304 SwapValue(Value.Reserved1);
305 SwapValue(Value.Reserved2);
306 SwapValue(Value.Reserved3);
307}
308void MachOObject::ReadSection64(const LoadCommandInfo &LCI,
309 unsigned Index,
310 InMemoryStruct<macho::Section64> &Res) const {
311 assert(LCI.Command.Type == macho::LCT_Segment64 &&
312 "Unexpected load command info!");
313 uint64_t Offset = (LCI.Offset + sizeof(macho::Segment64LoadCommand) +
314 Index * sizeof(macho::Section64));
315 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
316}
Daniel Dunbar90e3e3a2010-11-27 13:39:48 +0000317
318template<>
319void SwapStruct(macho::RelocationEntry &Value) {
320 SwapValue(Value.Word0);
321 SwapValue(Value.Word1);
322}
323void MachOObject::ReadRelocationEntry(uint64_t RelocationTableOffset,
324 unsigned Index,
325 InMemoryStruct<macho::RelocationEntry> &Res) const {
326 uint64_t Offset = (RelocationTableOffset +
327 Index * sizeof(macho::RelocationEntry));
328 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
329}
Daniel Dunbar2208b582010-11-27 13:52:53 +0000330
331template<>
332void SwapStruct(macho::SymbolTableEntry &Value) {
333 SwapValue(Value.StringIndex);
334 SwapValue(Value.Flags);
335 SwapValue(Value.Value);
336}
337void MachOObject::ReadSymbolTableEntry(uint64_t SymbolTableOffset,
338 unsigned Index,
339 InMemoryStruct<macho::SymbolTableEntry> &Res) const {
340 uint64_t Offset = (SymbolTableOffset +
341 Index * sizeof(macho::SymbolTableEntry));
342 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
343}
344
345template<>
346void SwapStruct(macho::Symbol64TableEntry &Value) {
347 SwapValue(Value.StringIndex);
348 SwapValue(Value.Flags);
349 SwapValue(Value.Value);
350}
351void MachOObject::ReadSymbol64TableEntry(uint64_t SymbolTableOffset,
352 unsigned Index,
353 InMemoryStruct<macho::Symbol64TableEntry> &Res) const {
354 uint64_t Offset = (SymbolTableOffset +
355 Index * sizeof(macho::Symbol64TableEntry));
356 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
357}
Eric Christopher592cf782011-04-03 23:51:47 +0000358
Benjamin Kramerd4522462011-08-30 22:10:58 +0000359
360void MachOObject::ReadULEB128s(uint64_t Index,
361 SmallVectorImpl<uint64_t> &Out) const {
362 const char *ptr = Buffer->getBufferStart() + Index;
363 uint64_t data = 0;
364 uint64_t delta = 0;
365 uint32_t shift = 0;
366 while (true) {
367 assert(ptr < Buffer->getBufferEnd() && "index out of bounds");
368 assert(shift < 64 && "too big for uint64_t");
369
370 uint8_t byte = *ptr++;
371 delta |= ((byte & 0x7F) << shift);
372 shift += 7;
373 if (byte < 0x80) {
374 if (delta == 0)
375 break;
376 data += delta;
377 Out.push_back(data);
378 delta = 0;
379 shift = 0;
380 }
381 }
382}
383
Eric Christopher592cf782011-04-03 23:51:47 +0000384/* ** */
385// Object Dumping Facilities
386void MachOObject::dump() const { print(dbgs()); dbgs() << '\n'; }
387void MachOObject::dumpHeader() const { printHeader(dbgs()); dbgs() << '\n'; }
388
389void MachOObject::printHeader(raw_ostream &O) const {
390 O << "('cputype', " << Header.CPUType << ")\n";
391 O << "('cpusubtype', " << Header.CPUSubtype << ")\n";
392 O << "('filetype', " << Header.FileType << ")\n";
393 O << "('num_load_commands', " << Header.NumLoadCommands << ")\n";
394 O << "('load_commands_size', " << Header.SizeOfLoadCommands << ")\n";
395 O << "('flag', " << Header.Flags << ")\n";
396
397 // Print extended header if 64-bit.
398 if (is64Bit())
399 O << "('reserved', " << Header64Ext.Reserved << ")\n";
400}
401
402void MachOObject::print(raw_ostream &O) const {
403 O << "Header:\n";
404 printHeader(O);
405 O << "Load Commands:\n";
406
407 O << "Buffer:\n";
408}