blob: 339b12043ae9b49202ed85fa396e3fff290bf9e4 [file] [log] [blame]
Daniel Dunbarfbd25b72010-11-27 05:38:50 +00001//===- MachOObject.cpp - Mach-O Object File Wrapper -----------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#include "llvm/Object/MachOObject.h"
Daniel Dunbar95369162010-11-27 06:39:22 +000011#include "llvm/ADT/StringRef.h"
Daniel Dunbarfbd25b72010-11-27 05:38:50 +000012#include "llvm/Support/MemoryBuffer.h"
Michael J. Spencer1f6efa32010-11-29 18:16:10 +000013#include "llvm/Support/Host.h"
14#include "llvm/Support/SwapByteOrder.h"
Eric Christopher592cf782011-04-03 23:51:47 +000015#include "llvm/Support/raw_ostream.h"
16#include "llvm/Support/Debug.h"
Daniel Dunbarfbd25b72010-11-27 05:38:50 +000017
18using namespace llvm;
Daniel Dunbara956d8b2010-11-27 07:19:41 +000019using namespace llvm::object;
20
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +000021/* Translation Utilities */
22
Daniel Dunbara956d8b2010-11-27 07:19:41 +000023template<typename T>
24static void SwapValue(T &Value) {
25 Value = sys::SwapByteOrder(Value);
26}
Daniel Dunbarfbd25b72010-11-27 05:38:50 +000027
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +000028template<typename T>
29static void SwapStruct(T &Value);
30
31template<typename T>
32static void ReadInMemoryStruct(const MachOObject &MOO,
33 StringRef Buffer, uint64_t Base,
34 InMemoryStruct<T> &Res) {
35 typedef T struct_type;
36 uint64_t Size = sizeof(struct_type);
37
38 // Check that the buffer contains the expected data.
39 if (Base + Size > Buffer.size()) {
40 Res = 0;
41 return;
42 }
43
44 // Check whether we can return a direct pointer.
45 struct_type *Ptr = (struct_type *) (Buffer.data() + Base);
46 if (!MOO.isSwappedEndian()) {
47 Res = Ptr;
48 return;
49 }
50
51 // Otherwise, copy the struct and translate the values.
52 Res = *Ptr;
53 SwapStruct(*Res);
54}
55
56/* *** */
57
Daniel Dunbar95369162010-11-27 06:39:22 +000058MachOObject::MachOObject(MemoryBuffer *Buffer_, bool IsLittleEndian_,
59 bool Is64Bit_)
Daniel Dunbara956d8b2010-11-27 07:19:41 +000060 : Buffer(Buffer_), IsLittleEndian(IsLittleEndian_), Is64Bit(Is64Bit_),
61 IsSwappedEndian(IsLittleEndian != sys::isLittleEndianHost()),
Daniel Dunbarf2e2a5f2010-11-27 13:46:11 +000062 HasStringTable(false), LoadCommands(0), NumLoadedCommands(0) {
Daniel Dunbara956d8b2010-11-27 07:19:41 +000063 // Load the common header.
64 memcpy(&Header, Buffer->getBuffer().data(), sizeof(Header));
65 if (IsSwappedEndian) {
66 SwapValue(Header.Magic);
67 SwapValue(Header.CPUType);
68 SwapValue(Header.CPUSubtype);
69 SwapValue(Header.FileType);
70 SwapValue(Header.NumLoadCommands);
71 SwapValue(Header.SizeOfLoadCommands);
72 SwapValue(Header.Flags);
73 }
74
75 if (is64Bit()) {
76 memcpy(&Header64Ext, Buffer->getBuffer().data() + sizeof(Header),
77 sizeof(Header64Ext));
78 if (IsSwappedEndian) {
79 SwapValue(Header64Ext.Reserved);
80 }
81 }
82
83 // Create the load command array if sane.
84 if (getHeader().NumLoadCommands < (1 << 20))
85 LoadCommands = new LoadCommandInfo[getHeader().NumLoadCommands];
86}
87
88MachOObject::~MachOObject() {
Benjamin Kramer23dcd002010-12-17 09:56:50 +000089 delete [] LoadCommands;
Daniel Dunbarfbd25b72010-11-27 05:38:50 +000090}
91
92MachOObject *MachOObject::LoadFromBuffer(MemoryBuffer *Buffer,
93 std::string *ErrorStr) {
Daniel Dunbar95369162010-11-27 06:39:22 +000094 // First, check the magic value and initialize the basic object info.
95 bool IsLittleEndian = false, Is64Bit = false;
96 StringRef Magic = Buffer->getBuffer().slice(0, 4);
97 if (Magic == "\xFE\xED\xFA\xCE") {
98 } else if (Magic == "\xCE\xFA\xED\xFE") {
99 IsLittleEndian = true;
100 } else if (Magic == "\xFE\xED\xFA\xCF") {
101 Is64Bit = true;
102 } else if (Magic == "\xCF\xFA\xED\xFE") {
103 IsLittleEndian = true;
104 Is64Bit = true;
105 } else {
Daniel Dunbara956d8b2010-11-27 07:19:41 +0000106 if (ErrorStr) *ErrorStr = "not a Mach object file (invalid magic)";
107 return 0;
108 }
109
110 // Ensure that the at least the full header is present.
111 unsigned HeaderSize = Is64Bit ? macho::Header64Size : macho::Header32Size;
112 if (Buffer->getBufferSize() < HeaderSize) {
113 if (ErrorStr) *ErrorStr = "not a Mach object file (invalid header)";
Daniel Dunbar95369162010-11-27 06:39:22 +0000114 return 0;
115 }
116
117 OwningPtr<MachOObject> Object(new MachOObject(Buffer, IsLittleEndian,
118 Is64Bit));
119
Daniel Dunbara956d8b2010-11-27 07:19:41 +0000120 // Check for bogus number of load commands.
121 if (Object->getHeader().NumLoadCommands >= (1 << 20)) {
122 if (ErrorStr) *ErrorStr = "not a Mach object file (unreasonable header)";
123 return 0;
124 }
125
Daniel Dunbarfbd25b72010-11-27 05:38:50 +0000126 if (ErrorStr) *ErrorStr = "";
Daniel Dunbar95369162010-11-27 06:39:22 +0000127 return Object.take();
Daniel Dunbarfbd25b72010-11-27 05:38:50 +0000128}
Daniel Dunbara956d8b2010-11-27 07:19:41 +0000129
Daniel Dunbar71130f82010-11-27 13:58:16 +0000130StringRef MachOObject::getData(size_t Offset, size_t Size) const {
131 return Buffer->getBuffer().substr(Offset,Size);
132}
133
Daniel Dunbarf2e2a5f2010-11-27 13:46:11 +0000134void MachOObject::RegisterStringTable(macho::SymtabLoadCommand &SLC) {
135 HasStringTable = true;
136 StringTable = Buffer->getBuffer().substr(SLC.StringTableOffset,
137 SLC.StringTableSize);
138}
139
Daniel Dunbara956d8b2010-11-27 07:19:41 +0000140const MachOObject::LoadCommandInfo &
141MachOObject::getLoadCommandInfo(unsigned Index) const {
142 assert(Index < getHeader().NumLoadCommands && "Invalid index!");
143
144 // Load the command, if necessary.
145 if (Index >= NumLoadedCommands) {
146 uint64_t Offset;
147 if (Index == 0) {
148 Offset = getHeaderSize();
149 } else {
150 const LoadCommandInfo &Prev = getLoadCommandInfo(Index - 1);
151 Offset = Prev.Offset + Prev.Command.Size;
152 }
153
154 LoadCommandInfo &Info = LoadCommands[Index];
155 memcpy(&Info.Command, Buffer->getBuffer().data() + Offset,
156 sizeof(macho::LoadCommand));
157 if (IsSwappedEndian) {
158 SwapValue(Info.Command.Type);
159 SwapValue(Info.Command.Size);
160 }
161 Info.Offset = Offset;
162 NumLoadedCommands = Index + 1;
163 }
164
165 return LoadCommands[Index];
166}
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +0000167
168template<>
Benjamin Kramer3946e3b2010-11-27 09:08:25 +0000169void SwapStruct(macho::SegmentLoadCommand &Value) {
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +0000170 SwapValue(Value.Type);
171 SwapValue(Value.Size);
172 SwapValue(Value.VMAddress);
173 SwapValue(Value.VMSize);
174 SwapValue(Value.FileOffset);
175 SwapValue(Value.FileSize);
176 SwapValue(Value.MaxVMProtection);
177 SwapValue(Value.InitialVMProtection);
178 SwapValue(Value.NumSections);
179 SwapValue(Value.Flags);
180}
181void MachOObject::ReadSegmentLoadCommand(const LoadCommandInfo &LCI,
182 InMemoryStruct<macho::SegmentLoadCommand> &Res) const {
183 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
184}
185
186template<>
Benjamin Kramer3946e3b2010-11-27 09:08:25 +0000187void SwapStruct(macho::Segment64LoadCommand &Value) {
Daniel Dunbar4ba1f5e2010-11-27 08:22:29 +0000188 SwapValue(Value.Type);
189 SwapValue(Value.Size);
190 SwapValue(Value.VMAddress);
191 SwapValue(Value.VMSize);
192 SwapValue(Value.FileOffset);
193 SwapValue(Value.FileSize);
194 SwapValue(Value.MaxVMProtection);
195 SwapValue(Value.InitialVMProtection);
196 SwapValue(Value.NumSections);
197 SwapValue(Value.Flags);
198}
199void MachOObject::ReadSegment64LoadCommand(const LoadCommandInfo &LCI,
200 InMemoryStruct<macho::Segment64LoadCommand> &Res) const {
201 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
202}
Daniel Dunbarf879f142010-11-27 08:33:44 +0000203
204template<>
Benjamin Kramer3946e3b2010-11-27 09:08:25 +0000205void SwapStruct(macho::SymtabLoadCommand &Value) {
Daniel Dunbarf879f142010-11-27 08:33:44 +0000206 SwapValue(Value.Type);
207 SwapValue(Value.Size);
208 SwapValue(Value.SymbolTableOffset);
209 SwapValue(Value.NumSymbolTableEntries);
210 SwapValue(Value.StringTableOffset);
211 SwapValue(Value.StringTableSize);
212}
213void MachOObject::ReadSymtabLoadCommand(const LoadCommandInfo &LCI,
214 InMemoryStruct<macho::SymtabLoadCommand> &Res) const {
215 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
216}
217
218template<>
Benjamin Kramer3946e3b2010-11-27 09:08:25 +0000219void SwapStruct(macho::DysymtabLoadCommand &Value) {
Daniel Dunbarf879f142010-11-27 08:33:44 +0000220 SwapValue(Value.Type);
221 SwapValue(Value.Size);
Daniel Dunbara87d7ec2010-12-10 06:19:39 +0000222 SwapValue(Value.LocalSymbolsIndex);
Daniel Dunbarf879f142010-11-27 08:33:44 +0000223 SwapValue(Value.NumLocalSymbols);
224 SwapValue(Value.ExternalSymbolsIndex);
225 SwapValue(Value.NumExternalSymbols);
226 SwapValue(Value.UndefinedSymbolsIndex);
227 SwapValue(Value.NumUndefinedSymbols);
228 SwapValue(Value.TOCOffset);
229 SwapValue(Value.NumTOCEntries);
230 SwapValue(Value.ModuleTableOffset);
231 SwapValue(Value.NumModuleTableEntries);
232 SwapValue(Value.ReferenceSymbolTableOffset);
233 SwapValue(Value.NumReferencedSymbolTableEntries);
234 SwapValue(Value.IndirectSymbolTableOffset);
235 SwapValue(Value.NumIndirectSymbolTableEntries);
236 SwapValue(Value.ExternalRelocationTableOffset);
237 SwapValue(Value.NumExternalRelocationTableEntries);
238 SwapValue(Value.LocalRelocationTableOffset);
239 SwapValue(Value.NumLocalRelocationTableEntries);
240}
241void MachOObject::ReadDysymtabLoadCommand(const LoadCommandInfo &LCI,
242 InMemoryStruct<macho::DysymtabLoadCommand> &Res) const {
243 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
244}
Daniel Dunbar4c55e0d2010-11-27 13:26:12 +0000245
246template<>
Benjamin Kramer9942aca2011-08-30 18:33:37 +0000247void SwapStruct(macho::LinkeditDataLoadCommand &Value) {
248 SwapValue(Value.Type);
249 SwapValue(Value.Size);
250 SwapValue(Value.DataOffset);
251 SwapValue(Value.DataSize);
252}
253void MachOObject::ReadLinkeditDataLoadCommand(const LoadCommandInfo &LCI,
254 InMemoryStruct<macho::LinkeditDataLoadCommand> &Res) const {
255 ReadInMemoryStruct(*this, Buffer->getBuffer(), LCI.Offset, Res);
256}
257
258template<>
Daniel Dunbar4c55e0d2010-11-27 13:26:12 +0000259void SwapStruct(macho::IndirectSymbolTableEntry &Value) {
260 SwapValue(Value.Index);
261}
262void
263MachOObject::ReadIndirectSymbolTableEntry(const macho::DysymtabLoadCommand &DLC,
264 unsigned Index,
265 InMemoryStruct<macho::IndirectSymbolTableEntry> &Res) const {
266 uint64_t Offset = (DLC.IndirectSymbolTableOffset +
267 Index * sizeof(macho::IndirectSymbolTableEntry));
268 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
269}
Daniel Dunbar2acadbd2010-11-27 13:33:15 +0000270
271
272template<>
273void SwapStruct(macho::Section &Value) {
274 SwapValue(Value.Address);
275 SwapValue(Value.Size);
276 SwapValue(Value.Offset);
277 SwapValue(Value.Align);
278 SwapValue(Value.RelocationTableOffset);
279 SwapValue(Value.NumRelocationTableEntries);
280 SwapValue(Value.Flags);
281 SwapValue(Value.Reserved1);
282 SwapValue(Value.Reserved2);
283}
284void MachOObject::ReadSection(const LoadCommandInfo &LCI,
285 unsigned Index,
286 InMemoryStruct<macho::Section> &Res) const {
287 assert(LCI.Command.Type == macho::LCT_Segment &&
288 "Unexpected load command info!");
289 uint64_t Offset = (LCI.Offset + sizeof(macho::SegmentLoadCommand) +
290 Index * sizeof(macho::Section));
291 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
292}
293
294template<>
295void SwapStruct(macho::Section64 &Value) {
296 SwapValue(Value.Address);
297 SwapValue(Value.Size);
298 SwapValue(Value.Offset);
299 SwapValue(Value.Align);
300 SwapValue(Value.RelocationTableOffset);
301 SwapValue(Value.NumRelocationTableEntries);
302 SwapValue(Value.Flags);
303 SwapValue(Value.Reserved1);
304 SwapValue(Value.Reserved2);
305 SwapValue(Value.Reserved3);
306}
307void MachOObject::ReadSection64(const LoadCommandInfo &LCI,
308 unsigned Index,
309 InMemoryStruct<macho::Section64> &Res) const {
310 assert(LCI.Command.Type == macho::LCT_Segment64 &&
311 "Unexpected load command info!");
312 uint64_t Offset = (LCI.Offset + sizeof(macho::Segment64LoadCommand) +
313 Index * sizeof(macho::Section64));
314 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
315}
Daniel Dunbar90e3e3a2010-11-27 13:39:48 +0000316
317template<>
318void SwapStruct(macho::RelocationEntry &Value) {
319 SwapValue(Value.Word0);
320 SwapValue(Value.Word1);
321}
322void MachOObject::ReadRelocationEntry(uint64_t RelocationTableOffset,
323 unsigned Index,
324 InMemoryStruct<macho::RelocationEntry> &Res) const {
325 uint64_t Offset = (RelocationTableOffset +
326 Index * sizeof(macho::RelocationEntry));
327 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
328}
Daniel Dunbar2208b582010-11-27 13:52:53 +0000329
330template<>
331void SwapStruct(macho::SymbolTableEntry &Value) {
332 SwapValue(Value.StringIndex);
333 SwapValue(Value.Flags);
334 SwapValue(Value.Value);
335}
336void MachOObject::ReadSymbolTableEntry(uint64_t SymbolTableOffset,
337 unsigned Index,
338 InMemoryStruct<macho::SymbolTableEntry> &Res) const {
339 uint64_t Offset = (SymbolTableOffset +
340 Index * sizeof(macho::SymbolTableEntry));
341 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
342}
343
344template<>
345void SwapStruct(macho::Symbol64TableEntry &Value) {
346 SwapValue(Value.StringIndex);
347 SwapValue(Value.Flags);
348 SwapValue(Value.Value);
349}
350void MachOObject::ReadSymbol64TableEntry(uint64_t SymbolTableOffset,
351 unsigned Index,
352 InMemoryStruct<macho::Symbol64TableEntry> &Res) const {
353 uint64_t Offset = (SymbolTableOffset +
354 Index * sizeof(macho::Symbol64TableEntry));
355 ReadInMemoryStruct(*this, Buffer->getBuffer(), Offset, Res);
356}
Eric Christopher592cf782011-04-03 23:51:47 +0000357
358/* ** */
359// Object Dumping Facilities
360void MachOObject::dump() const { print(dbgs()); dbgs() << '\n'; }
361void MachOObject::dumpHeader() const { printHeader(dbgs()); dbgs() << '\n'; }
362
363void MachOObject::printHeader(raw_ostream &O) const {
364 O << "('cputype', " << Header.CPUType << ")\n";
365 O << "('cpusubtype', " << Header.CPUSubtype << ")\n";
366 O << "('filetype', " << Header.FileType << ")\n";
367 O << "('num_load_commands', " << Header.NumLoadCommands << ")\n";
368 O << "('load_commands_size', " << Header.SizeOfLoadCommands << ")\n";
369 O << "('flag', " << Header.Flags << ")\n";
370
371 // Print extended header if 64-bit.
372 if (is64Bit())
373 O << "('reserved', " << Header64Ext.Reserved << ")\n";
374}
375
376void MachOObject::print(raw_ostream &O) const {
377 O << "Header:\n";
378 printHeader(O);
379 O << "Load Commands:\n";
380
381 O << "Buffer:\n";
382}