blob: a1cbef2c281c0da6f987f94f0d1153e65f00454c [file] [log] [blame]
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00001//===- MachOObjectFile.cpp - Mach-O object file binding -------------------===//
Eric Christopher7b015c72011-04-22 03:19:48 +00002//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Eric Christopher7b015c72011-04-22 03:19:48 +00006//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the MachOObjectFile class, which binds the MachOObject
10// class to the generic ObjectFile wrapper.
11//
12//===----------------------------------------------------------------------===//
13
Eugene Zelenko9f5094d2017-04-21 22:03:05 +000014#include "llvm/ADT/ArrayRef.h"
15#include "llvm/ADT/None.h"
Tim Northover00ed9962014-03-29 10:18:08 +000016#include "llvm/ADT/STLExtras.h"
Chandler Carruth6bda14b2017-06-06 11:49:48 +000017#include "llvm/ADT/SmallVector.h"
Eugene Zelenko9f5094d2017-04-21 22:03:05 +000018#include "llvm/ADT/StringRef.h"
Rafael Espindola72318b42014-08-08 16:30:17 +000019#include "llvm/ADT/StringSwitch.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000020#include "llvm/ADT/Triple.h"
Eugene Zelenko9f5094d2017-04-21 22:03:05 +000021#include "llvm/ADT/Twine.h"
Zachary Turner264b5d92017-06-07 03:48:56 +000022#include "llvm/BinaryFormat/MachO.h"
Eugene Zelenko9f5094d2017-04-21 22:03:05 +000023#include "llvm/Object/Error.h"
24#include "llvm/Object/MachO.h"
25#include "llvm/Object/ObjectFile.h"
26#include "llvm/Object/SymbolicFile.h"
Rafael Espindola421305a2013-04-07 20:01:29 +000027#include "llvm/Support/DataExtractor.h"
Nick Kledzikac431442014-09-12 21:34:15 +000028#include "llvm/Support/Debug.h"
Eugene Zelenko9f5094d2017-04-21 22:03:05 +000029#include "llvm/Support/Error.h"
30#include "llvm/Support/ErrorHandling.h"
Owen Andersonbc14bd32011-10-26 20:42:54 +000031#include "llvm/Support/Format.h"
Rafael Espindola56f976f2013-04-18 18:08:55 +000032#include "llvm/Support/Host.h"
Nick Kledzikd04bc352014-08-30 00:20:14 +000033#include "llvm/Support/LEB128.h"
Eric Christopher7b015c72011-04-22 03:19:48 +000034#include "llvm/Support/MemoryBuffer.h"
Eugene Zelenko9f5094d2017-04-21 22:03:05 +000035#include "llvm/Support/SwapByteOrder.h"
Chandler Carruth6bda14b2017-06-06 11:49:48 +000036#include "llvm/Support/raw_ostream.h"
Eugene Zelenko9f5094d2017-04-21 22:03:05 +000037#include <algorithm>
38#include <cassert>
39#include <cstddef>
40#include <cstdint>
Eric Christopher7b015c72011-04-22 03:19:48 +000041#include <cstring>
42#include <limits>
Kevin Enderbyd5039402016-10-31 20:29:48 +000043#include <list>
Eugene Zelenko9f5094d2017-04-21 22:03:05 +000044#include <memory>
45#include <string>
46#include <system_error>
Eric Christopher7b015c72011-04-22 03:19:48 +000047
48using namespace llvm;
49using namespace object;
50
namespace {

// Two consecutive fixed-width 16-byte name buffers: the section name first,
// then the segment name. A name that fills all 16 bytes has no terminating
// NUL (parseSegmentOrSectionName in this file handles that case).
struct section_base {
  char sectname[16]; // section name
  char segname[16];  // segment name
};

} // end anonymous namespace
Rafael Espindola56f976f2013-04-18 18:08:55 +000059
Benjamin Kramer760e00b2017-08-20 15:13:39 +000060static Error malformedError(const Twine &Msg) {
61 return make_error<GenericBinaryError>("truncated or malformed object (" +
62 Msg + ")",
Kevin Enderby89134962016-05-05 23:41:05 +000063 object_error::parse_failed);
Lang Hames9e964f32016-03-25 17:25:34 +000064}
65
Alexey Samsonov9f336632015-06-04 19:45:22 +000066// FIXME: Replace all uses of this function with getStructOrErr.
Filipe Cabecinhas40139502015-01-15 22:52:38 +000067template <typename T>
Lang Hames697e7cd2016-12-04 01:56:10 +000068static T getStruct(const MachOObjectFile &O, const char *P) {
Filipe Cabecinhas40139502015-01-15 22:52:38 +000069 // Don't read before the beginning or past the end of the file
Lang Hames697e7cd2016-12-04 01:56:10 +000070 if (P < O.getData().begin() || P + sizeof(T) > O.getData().end())
Filipe Cabecinhas40139502015-01-15 22:52:38 +000071 report_fatal_error("Malformed MachO file.");
72
Rafael Espindola3cdeb172013-04-19 13:45:05 +000073 T Cmd;
74 memcpy(&Cmd, P, sizeof(T));
Lang Hames697e7cd2016-12-04 01:56:10 +000075 if (O.isLittleEndian() != sys::IsLittleEndianHost)
Artyom Skrobov78d5daf2014-07-18 09:26:16 +000076 MachO::swapStruct(Cmd);
Rafael Espindola3cdeb172013-04-19 13:45:05 +000077 return Cmd;
Rafael Espindola56f976f2013-04-18 18:08:55 +000078}
79
Alexey Samsonov9f336632015-06-04 19:45:22 +000080template <typename T>
Lang Hames697e7cd2016-12-04 01:56:10 +000081static Expected<T> getStructOrErr(const MachOObjectFile &O, const char *P) {
Alexey Samsonov9f336632015-06-04 19:45:22 +000082 // Don't read before the beginning or past the end of the file
Lang Hames697e7cd2016-12-04 01:56:10 +000083 if (P < O.getData().begin() || P + sizeof(T) > O.getData().end())
Kevin Enderbyd4e075b2016-05-06 20:16:28 +000084 return malformedError("Structure read out-of-range");
Alexey Samsonov9f336632015-06-04 19:45:22 +000085
86 T Cmd;
87 memcpy(&Cmd, P, sizeof(T));
Lang Hames697e7cd2016-12-04 01:56:10 +000088 if (O.isLittleEndian() != sys::IsLittleEndianHost)
Alexey Samsonov9f336632015-06-04 19:45:22 +000089 MachO::swapStruct(Cmd);
90 return Cmd;
91}
92
Rafael Espindola6e040c02013-04-26 20:07:33 +000093static const char *
Lang Hames697e7cd2016-12-04 01:56:10 +000094getSectionPtr(const MachOObjectFile &O, MachOObjectFile::LoadCommandInfo L,
Rafael Espindola6e040c02013-04-26 20:07:33 +000095 unsigned Sec) {
Rafael Espindola56f976f2013-04-18 18:08:55 +000096 uintptr_t CommandAddr = reinterpret_cast<uintptr_t>(L.Ptr);
97
Lang Hames697e7cd2016-12-04 01:56:10 +000098 bool Is64 = O.is64Bit();
Charles Davis8bdfafd2013-09-01 04:28:48 +000099 unsigned SegmentLoadSize = Is64 ? sizeof(MachO::segment_command_64) :
100 sizeof(MachO::segment_command);
101 unsigned SectionSize = Is64 ? sizeof(MachO::section_64) :
102 sizeof(MachO::section);
Rafael Espindola56f976f2013-04-18 18:08:55 +0000103
104 uintptr_t SectionAddr = CommandAddr + SegmentLoadSize + Sec * SectionSize;
Charles Davis1827bd82013-08-27 05:38:30 +0000105 return reinterpret_cast<const char*>(SectionAddr);
Rafael Espindola60689982013-04-07 19:05:30 +0000106}
107
Lang Hames697e7cd2016-12-04 01:56:10 +0000108static const char *getPtr(const MachOObjectFile &O, size_t Offset) {
Sam Clegg675a5172018-06-04 17:01:20 +0000109 assert(Offset <= O.getData().size());
Sam Clegga81fb842018-05-30 03:37:26 +0000110 return O.getData().data() + Offset;
Rafael Espindola60689982013-04-07 19:05:30 +0000111}
112
Artyom Skrobov78d5daf2014-07-18 09:26:16 +0000113static MachO::nlist_base
Lang Hames697e7cd2016-12-04 01:56:10 +0000114getSymbolTableEntryBase(const MachOObjectFile &O, DataRefImpl DRI) {
Rafael Espindola75c30362013-04-24 19:47:55 +0000115 const char *P = reinterpret_cast<const char *>(DRI.p);
Artyom Skrobov78d5daf2014-07-18 09:26:16 +0000116 return getStruct<MachO::nlist_base>(O, P);
Eric Christopher7b015c72011-04-22 03:19:48 +0000117}
118
Rafael Espindola56f976f2013-04-18 18:08:55 +0000119static StringRef parseSegmentOrSectionName(const char *P) {
Rafael Espindolaa9f810b2012-12-21 03:47:03 +0000120 if (P[15] == 0)
121 // Null terminated.
122 return P;
123 // Not null terminated, so this is a 16 char string.
124 return StringRef(P, 16);
125}
126
Lang Hames697e7cd2016-12-04 01:56:10 +0000127static unsigned getCPUType(const MachOObjectFile &O) {
128 return O.getHeader().cputype;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000129}
130
Charles Davis8bdfafd2013-09-01 04:28:48 +0000131static uint32_t
132getPlainRelocationAddress(const MachO::any_relocation_info &RE) {
133 return RE.r_word0;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000134}
135
136static unsigned
Charles Davis8bdfafd2013-09-01 04:28:48 +0000137getScatteredRelocationAddress(const MachO::any_relocation_info &RE) {
138 return RE.r_word0 & 0xffffff;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000139}
140
Lang Hames697e7cd2016-12-04 01:56:10 +0000141static bool getPlainRelocationPCRel(const MachOObjectFile &O,
Charles Davis8bdfafd2013-09-01 04:28:48 +0000142 const MachO::any_relocation_info &RE) {
Lang Hames697e7cd2016-12-04 01:56:10 +0000143 if (O.isLittleEndian())
Charles Davis8bdfafd2013-09-01 04:28:48 +0000144 return (RE.r_word1 >> 24) & 1;
145 return (RE.r_word1 >> 7) & 1;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000146}
147
148static bool
Lang Hames697e7cd2016-12-04 01:56:10 +0000149getScatteredRelocationPCRel(const MachO::any_relocation_info &RE) {
Charles Davis8bdfafd2013-09-01 04:28:48 +0000150 return (RE.r_word0 >> 30) & 1;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000151}
152
Lang Hames697e7cd2016-12-04 01:56:10 +0000153static unsigned getPlainRelocationLength(const MachOObjectFile &O,
Charles Davis8bdfafd2013-09-01 04:28:48 +0000154 const MachO::any_relocation_info &RE) {
Lang Hames697e7cd2016-12-04 01:56:10 +0000155 if (O.isLittleEndian())
Charles Davis8bdfafd2013-09-01 04:28:48 +0000156 return (RE.r_word1 >> 25) & 3;
157 return (RE.r_word1 >> 5) & 3;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000158}
159
160static unsigned
Charles Davis8bdfafd2013-09-01 04:28:48 +0000161getScatteredRelocationLength(const MachO::any_relocation_info &RE) {
162 return (RE.r_word0 >> 28) & 3;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000163}
164
Lang Hames697e7cd2016-12-04 01:56:10 +0000165static unsigned getPlainRelocationType(const MachOObjectFile &O,
Charles Davis8bdfafd2013-09-01 04:28:48 +0000166 const MachO::any_relocation_info &RE) {
Lang Hames697e7cd2016-12-04 01:56:10 +0000167 if (O.isLittleEndian())
Charles Davis8bdfafd2013-09-01 04:28:48 +0000168 return RE.r_word1 >> 28;
169 return RE.r_word1 & 0xf;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000170}
171
Lang Hames697e7cd2016-12-04 01:56:10 +0000172static uint32_t getSectionFlags(const MachOObjectFile &O,
Rafael Espindola56f976f2013-04-18 18:08:55 +0000173 DataRefImpl Sec) {
Lang Hames697e7cd2016-12-04 01:56:10 +0000174 if (O.is64Bit()) {
175 MachO::section_64 Sect = O.getSection64(Sec);
Charles Davis8bdfafd2013-09-01 04:28:48 +0000176 return Sect.flags;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000177 }
Lang Hames697e7cd2016-12-04 01:56:10 +0000178 MachO::section Sect = O.getSection(Sec);
Charles Davis8bdfafd2013-09-01 04:28:48 +0000179 return Sect.flags;
Rafael Espindola56f976f2013-04-18 18:08:55 +0000180}
181
Lang Hames9e964f32016-03-25 17:25:34 +0000182static Expected<MachOObjectFile::LoadCommandInfo>
Lang Hames697e7cd2016-12-04 01:56:10 +0000183getLoadCommandInfo(const MachOObjectFile &Obj, const char *Ptr,
Kevin Enderbya8e3ab02016-05-03 23:13:50 +0000184 uint32_t LoadCommandIndex) {
Lang Hames9e964f32016-03-25 17:25:34 +0000185 if (auto CmdOrErr = getStructOrErr<MachO::load_command>(Obj, Ptr)) {
Jonas Devlieghere81f5abe2017-09-13 13:43:01 +0000186 if (CmdOrErr->cmdsize + Ptr > Obj.getData().end())
187 return malformedError("load command " + Twine(LoadCommandIndex) +
188 " extends past end of file");
Lang Hames9e964f32016-03-25 17:25:34 +0000189 if (CmdOrErr->cmdsize < 8)
Kevin Enderbyd4e075b2016-05-06 20:16:28 +0000190 return malformedError("load command " + Twine(LoadCommandIndex) +
Kevin Enderby89134962016-05-05 23:41:05 +0000191 " with size less than 8 bytes");
Lang Hames9e964f32016-03-25 17:25:34 +0000192 return MachOObjectFile::LoadCommandInfo({Ptr, *CmdOrErr});
193 } else
194 return CmdOrErr.takeError();
Alexey Samsonov4fdbed32015-06-04 19:34:14 +0000195}
196
Lang Hames9e964f32016-03-25 17:25:34 +0000197static Expected<MachOObjectFile::LoadCommandInfo>
Lang Hames697e7cd2016-12-04 01:56:10 +0000198getFirstLoadCommandInfo(const MachOObjectFile &Obj) {
199 unsigned HeaderSize = Obj.is64Bit() ? sizeof(MachO::mach_header_64)
200 : sizeof(MachO::mach_header);
201 if (sizeof(MachO::load_command) > Obj.getHeader().sizeofcmds)
Kevin Enderbyd4e075b2016-05-06 20:16:28 +0000202 return malformedError("load command 0 extends past the end all load "
Kevin Enderby89134962016-05-05 23:41:05 +0000203 "commands in the file");
Kevin Enderbya8e3ab02016-05-03 23:13:50 +0000204 return getLoadCommandInfo(Obj, getPtr(Obj, HeaderSize), 0);
Alexey Samsonov4fdbed32015-06-04 19:34:14 +0000205}
206
Lang Hames9e964f32016-03-25 17:25:34 +0000207static Expected<MachOObjectFile::LoadCommandInfo>
Lang Hames697e7cd2016-12-04 01:56:10 +0000208getNextLoadCommandInfo(const MachOObjectFile &Obj, uint32_t LoadCommandIndex,
Alexey Samsonov4fdbed32015-06-04 19:34:14 +0000209 const MachOObjectFile::LoadCommandInfo &L) {
Lang Hames697e7cd2016-12-04 01:56:10 +0000210 unsigned HeaderSize = Obj.is64Bit() ? sizeof(MachO::mach_header_64)
211 : sizeof(MachO::mach_header);
Kevin Enderby9d0c9452016-08-31 17:57:46 +0000212 if (L.Ptr + L.C.cmdsize + sizeof(MachO::load_command) >
Lang Hames697e7cd2016-12-04 01:56:10 +0000213 Obj.getData().data() + HeaderSize + Obj.getHeader().sizeofcmds)
Kevin Enderbyd4e075b2016-05-06 20:16:28 +0000214 return malformedError("load command " + Twine(LoadCommandIndex + 1) +
Kevin Enderby89134962016-05-05 23:41:05 +0000215 " extends past the end all load commands in the file");
Kevin Enderbya8e3ab02016-05-03 23:13:50 +0000216 return getLoadCommandInfo(Obj, L.Ptr + L.C.cmdsize, LoadCommandIndex + 1);
Alexey Samsonov4fdbed32015-06-04 19:34:14 +0000217}
218
Alexey Samsonov9f336632015-06-04 19:45:22 +0000219template <typename T>
Lang Hames697e7cd2016-12-04 01:56:10 +0000220static void parseHeader(const MachOObjectFile &Obj, T &Header,
Lang Hames9e964f32016-03-25 17:25:34 +0000221 Error &Err) {
Lang Hames697e7cd2016-12-04 01:56:10 +0000222 if (sizeof(T) > Obj.getData().size()) {
Kevin Enderbyd4e075b2016-05-06 20:16:28 +0000223 Err = malformedError("the mach header extends past the end of the "
Kevin Enderby89134962016-05-05 23:41:05 +0000224 "file");
Kevin Enderby87025742016-04-13 21:17:58 +0000225 return;
226 }
Lang Hames9e964f32016-03-25 17:25:34 +0000227 if (auto HeaderOrErr = getStructOrErr<T>(Obj, getPtr(Obj, 0)))
228 Header = *HeaderOrErr;
Alexey Samsonov9f336632015-06-04 19:45:22 +0000229 else
Lang Hames9e964f32016-03-25 17:25:34 +0000230 Err = HeaderOrErr.takeError();
Alexey Samsonov9f336632015-06-04 19:45:22 +0000231}
232
// Describes one contiguous region of the file: where it starts, how many
// bytes it covers, and a human-readable label. checkOverlappingElement keeps
// a list of these to diagnose Mach-O elements that overlap each other.
// Deliberately a plain aggregate so it can be brace-initialized as
// {Offset, Size, Name}.
struct MachOElement {
  uint64_t Offset;  // file offset of the first byte
  uint64_t Size;    // length in bytes
  const char *Name; // label used in diagnostics; not owned
};
239
240static Error checkOverlappingElement(std::list<MachOElement> &Elements,
241 uint64_t Offset, uint64_t Size,
242 const char *Name) {
243 if (Size == 0)
244 return Error::success();
245
246 for (auto it=Elements.begin() ; it != Elements.end(); ++it) {
247 auto E = *it;
248 if ((Offset >= E.Offset && Offset < E.Offset + E.Size) ||
249 (Offset + Size > E.Offset && Offset + Size < E.Offset + E.Size) ||
250 (Offset <= E.Offset && Offset + Size >= E.Offset + E.Size))
251 return malformedError(Twine(Name) + " at offset " + Twine(Offset) +
252 " with a size of " + Twine(Size) + ", overlaps " +
253 E.Name + " at offset " + Twine(E.Offset) + " with "
254 "a size of " + Twine(E.Size));
255 auto nt = it;
256 nt++;
257 if (nt != Elements.end()) {
258 auto N = *nt;
259 if (Offset + Size <= N.Offset) {
260 Elements.insert(nt, {Offset, Size, Name});
261 return Error::success();
262 }
263 }
264 }
265 Elements.push_back({Offset, Size, Name});
266 return Error::success();
267}
268
Alexey Samsonove1a76ab2015-06-04 22:08:37 +0000269// Parses LC_SEGMENT or LC_SEGMENT_64 load command, adds addresses of all
270// sections to \param Sections, and optionally sets
271// \param IsPageZeroSegment to true.
Kevin Enderbyc614d282016-08-12 20:10:25 +0000272template <typename Segment, typename Section>
Lang Hames9e964f32016-03-25 17:25:34 +0000273static Error parseSegmentLoadCommand(
Lang Hames697e7cd2016-12-04 01:56:10 +0000274 const MachOObjectFile &Obj, const MachOObjectFile::LoadCommandInfo &Load,
Kevin Enderbyb34e3a12016-05-05 17:43:35 +0000275 SmallVectorImpl<const char *> &Sections, bool &IsPageZeroSegment,
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000276 uint32_t LoadCommandIndex, const char *CmdName, uint64_t SizeOfHeaders,
277 std::list<MachOElement> &Elements) {
Kevin Enderbyc614d282016-08-12 20:10:25 +0000278 const unsigned SegmentLoadSize = sizeof(Segment);
Alexey Samsonove1a76ab2015-06-04 22:08:37 +0000279 if (Load.C.cmdsize < SegmentLoadSize)
Kevin Enderbyd4e075b2016-05-06 20:16:28 +0000280 return malformedError("load command " + Twine(LoadCommandIndex) +
Kevin Enderby89134962016-05-05 23:41:05 +0000281 " " + CmdName + " cmdsize too small");
Kevin Enderbyc614d282016-08-12 20:10:25 +0000282 if (auto SegOrErr = getStructOrErr<Segment>(Obj, Load.Ptr)) {
283 Segment S = SegOrErr.get();
284 const unsigned SectionSize = sizeof(Section);
Lang Hames697e7cd2016-12-04 01:56:10 +0000285 uint64_t FileSize = Obj.getData().size();
Lang Hames9e964f32016-03-25 17:25:34 +0000286 if (S.nsects > std::numeric_limits<uint32_t>::max() / SectionSize ||
287 S.nsects * SectionSize > Load.C.cmdsize - SegmentLoadSize)
Kevin Enderbyd4e075b2016-05-06 20:16:28 +0000288 return malformedError("load command " + Twine(LoadCommandIndex) +
NAKAMURA Takumi9d0b5312016-08-22 00:58:47 +0000289 " inconsistent cmdsize in " + CmdName +
Kevin Enderby89134962016-05-05 23:41:05 +0000290 " for the number of sections");
Lang Hames9e964f32016-03-25 17:25:34 +0000291 for (unsigned J = 0; J < S.nsects; ++J) {
292 const char *Sec = getSectionPtr(Obj, Load, J);
293 Sections.push_back(Sec);
Kevin Enderbyc614d282016-08-12 20:10:25 +0000294 Section s = getStruct<Section>(Obj, Sec);
Lang Hames697e7cd2016-12-04 01:56:10 +0000295 if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
296 Obj.getHeader().filetype != MachO::MH_DSYM &&
Kevin Enderbyc614d282016-08-12 20:10:25 +0000297 s.flags != MachO::S_ZEROFILL &&
298 s.flags != MachO::S_THREAD_LOCAL_ZEROFILL &&
299 s.offset > FileSize)
300 return malformedError("offset field of section " + Twine(J) + " in " +
301 CmdName + " command " + Twine(LoadCommandIndex) +
302 " extends past the end of the file");
Lang Hames697e7cd2016-12-04 01:56:10 +0000303 if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
304 Obj.getHeader().filetype != MachO::MH_DSYM &&
Kevin Enderbyc614d282016-08-12 20:10:25 +0000305 s.flags != MachO::S_ZEROFILL &&
NAKAMURA Takumi59a20642016-08-22 00:58:04 +0000306 s.flags != MachO::S_THREAD_LOCAL_ZEROFILL && S.fileoff == 0 &&
307 s.offset < SizeOfHeaders && s.size != 0)
Kevin Enderbyc614d282016-08-12 20:10:25 +0000308 return malformedError("offset field of section " + Twine(J) + " in " +
309 CmdName + " command " + Twine(LoadCommandIndex) +
310 " not past the headers of the file");
311 uint64_t BigSize = s.offset;
312 BigSize += s.size;
Lang Hames697e7cd2016-12-04 01:56:10 +0000313 if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
314 Obj.getHeader().filetype != MachO::MH_DSYM &&
Kevin Enderbyc614d282016-08-12 20:10:25 +0000315 s.flags != MachO::S_ZEROFILL &&
316 s.flags != MachO::S_THREAD_LOCAL_ZEROFILL &&
317 BigSize > FileSize)
318 return malformedError("offset field plus size field of section " +
319 Twine(J) + " in " + CmdName + " command " +
320 Twine(LoadCommandIndex) +
321 " extends past the end of the file");
Lang Hames697e7cd2016-12-04 01:56:10 +0000322 if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
323 Obj.getHeader().filetype != MachO::MH_DSYM &&
Kevin Enderbyc614d282016-08-12 20:10:25 +0000324 s.flags != MachO::S_ZEROFILL &&
325 s.flags != MachO::S_THREAD_LOCAL_ZEROFILL &&
326 s.size > S.filesize)
327 return malformedError("size field of section " +
328 Twine(J) + " in " + CmdName + " command " +
329 Twine(LoadCommandIndex) +
330 " greater than the segment");
Lang Hames697e7cd2016-12-04 01:56:10 +0000331 if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
332 Obj.getHeader().filetype != MachO::MH_DSYM && s.size != 0 &&
NAKAMURA Takumi59a20642016-08-22 00:58:04 +0000333 s.addr < S.vmaddr)
334 return malformedError("addr field of section " + Twine(J) + " in " +
335 CmdName + " command " + Twine(LoadCommandIndex) +
336 " less than the segment's vmaddr");
Kevin Enderbyc614d282016-08-12 20:10:25 +0000337 BigSize = s.addr;
338 BigSize += s.size;
339 uint64_t BigEnd = S.vmaddr;
340 BigEnd += S.vmsize;
341 if (S.vmsize != 0 && s.size != 0 && BigSize > BigEnd)
NAKAMURA Takumi59a20642016-08-22 00:58:04 +0000342 return malformedError("addr field plus size of section " + Twine(J) +
343 " in " + CmdName + " command " +
344 Twine(LoadCommandIndex) +
345 " greater than than "
Kevin Enderbyc614d282016-08-12 20:10:25 +0000346 "the segment's vmaddr plus vmsize");
Lang Hames697e7cd2016-12-04 01:56:10 +0000347 if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
348 Obj.getHeader().filetype != MachO::MH_DSYM &&
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000349 s.flags != MachO::S_ZEROFILL &&
350 s.flags != MachO::S_THREAD_LOCAL_ZEROFILL)
351 if (Error Err = checkOverlappingElement(Elements, s.offset, s.size,
352 "section contents"))
353 return Err;
Kevin Enderbyc614d282016-08-12 20:10:25 +0000354 if (s.reloff > FileSize)
NAKAMURA Takumi59a20642016-08-22 00:58:04 +0000355 return malformedError("reloff field of section " + Twine(J) + " in " +
356 CmdName + " command " + Twine(LoadCommandIndex) +
Kevin Enderbyc614d282016-08-12 20:10:25 +0000357 " extends past the end of the file");
358 BigSize = s.nreloc;
359 BigSize *= sizeof(struct MachO::relocation_info);
360 BigSize += s.reloff;
361 if (BigSize > FileSize)
362 return malformedError("reloff field plus nreloc field times sizeof("
363 "struct relocation_info) of section " +
364 Twine(J) + " in " + CmdName + " command " +
NAKAMURA Takumi59a20642016-08-22 00:58:04 +0000365 Twine(LoadCommandIndex) +
Kevin Enderbyc614d282016-08-12 20:10:25 +0000366 " extends past the end of the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000367 if (Error Err = checkOverlappingElement(Elements, s.reloff, s.nreloc *
368 sizeof(struct
369 MachO::relocation_info),
370 "section relocation entries"))
371 return Err;
Lang Hames9e964f32016-03-25 17:25:34 +0000372 }
Kevin Enderby600fb3f2016-08-05 18:19:40 +0000373 if (S.fileoff > FileSize)
374 return malformedError("load command " + Twine(LoadCommandIndex) +
NAKAMURA Takumi9d0b5312016-08-22 00:58:47 +0000375 " fileoff field in " + CmdName +
Kevin Enderby600fb3f2016-08-05 18:19:40 +0000376 " extends past the end of the file");
Kevin Enderbyc614d282016-08-12 20:10:25 +0000377 uint64_t BigSize = S.fileoff;
378 BigSize += S.filesize;
379 if (BigSize > FileSize)
380 return malformedError("load command " + Twine(LoadCommandIndex) +
381 " fileoff field plus filesize field in " +
382 CmdName + " extends past the end of the file");
383 if (S.vmsize != 0 && S.filesize > S.vmsize)
384 return malformedError("load command " + Twine(LoadCommandIndex) +
Kevin Enderby86d8bd12017-02-07 21:20:44 +0000385 " filesize field in " + CmdName +
Kevin Enderbyc614d282016-08-12 20:10:25 +0000386 " greater than vmsize field");
Lang Hames9e964f32016-03-25 17:25:34 +0000387 IsPageZeroSegment |= StringRef("__PAGEZERO").equals(S.segname);
388 } else
389 return SegOrErr.takeError();
390
391 return Error::success();
Alexey Samsonove1a76ab2015-06-04 22:08:37 +0000392}
393
Lang Hames697e7cd2016-12-04 01:56:10 +0000394static Error checkSymtabCommand(const MachOObjectFile &Obj,
Kevin Enderby0e52c922016-08-26 19:34:07 +0000395 const MachOObjectFile::LoadCommandInfo &Load,
396 uint32_t LoadCommandIndex,
Kevin Enderbyd5039402016-10-31 20:29:48 +0000397 const char **SymtabLoadCmd,
398 std::list<MachOElement> &Elements) {
Kevin Enderby0e52c922016-08-26 19:34:07 +0000399 if (Load.C.cmdsize < sizeof(MachO::symtab_command))
400 return malformedError("load command " + Twine(LoadCommandIndex) +
401 " LC_SYMTAB cmdsize too small");
402 if (*SymtabLoadCmd != nullptr)
403 return malformedError("more than one LC_SYMTAB command");
404 MachO::symtab_command Symtab =
405 getStruct<MachO::symtab_command>(Obj, Load.Ptr);
406 if (Symtab.cmdsize != sizeof(MachO::symtab_command))
407 return malformedError("LC_SYMTAB command " + Twine(LoadCommandIndex) +
408 " has incorrect cmdsize");
Lang Hames697e7cd2016-12-04 01:56:10 +0000409 uint64_t FileSize = Obj.getData().size();
Kevin Enderby0e52c922016-08-26 19:34:07 +0000410 if (Symtab.symoff > FileSize)
411 return malformedError("symoff field of LC_SYMTAB command " +
412 Twine(LoadCommandIndex) + " extends past the end "
413 "of the file");
Kevin Enderbyd5039402016-10-31 20:29:48 +0000414 uint64_t SymtabSize = Symtab.nsyms;
Kevin Enderby0e52c922016-08-26 19:34:07 +0000415 const char *struct_nlist_name;
Lang Hames697e7cd2016-12-04 01:56:10 +0000416 if (Obj.is64Bit()) {
Kevin Enderbyd5039402016-10-31 20:29:48 +0000417 SymtabSize *= sizeof(MachO::nlist_64);
Kevin Enderby0e52c922016-08-26 19:34:07 +0000418 struct_nlist_name = "struct nlist_64";
419 } else {
Kevin Enderbyd5039402016-10-31 20:29:48 +0000420 SymtabSize *= sizeof(MachO::nlist);
Kevin Enderby0e52c922016-08-26 19:34:07 +0000421 struct_nlist_name = "struct nlist";
422 }
Kevin Enderbyd5039402016-10-31 20:29:48 +0000423 uint64_t BigSize = SymtabSize;
Kevin Enderby0e52c922016-08-26 19:34:07 +0000424 BigSize += Symtab.symoff;
425 if (BigSize > FileSize)
426 return malformedError("symoff field plus nsyms field times sizeof(" +
427 Twine(struct_nlist_name) + ") of LC_SYMTAB command " +
428 Twine(LoadCommandIndex) + " extends past the end "
429 "of the file");
Kevin Enderbyd5039402016-10-31 20:29:48 +0000430 if (Error Err = checkOverlappingElement(Elements, Symtab.symoff, SymtabSize,
431 "symbol table"))
432 return Err;
Kevin Enderby0e52c922016-08-26 19:34:07 +0000433 if (Symtab.stroff > FileSize)
434 return malformedError("stroff field of LC_SYMTAB command " +
435 Twine(LoadCommandIndex) + " extends past the end "
436 "of the file");
437 BigSize = Symtab.stroff;
438 BigSize += Symtab.strsize;
439 if (BigSize > FileSize)
440 return malformedError("stroff field plus strsize field of LC_SYMTAB "
441 "command " + Twine(LoadCommandIndex) + " extends "
442 "past the end of the file");
Kevin Enderbyd5039402016-10-31 20:29:48 +0000443 if (Error Err = checkOverlappingElement(Elements, Symtab.stroff,
444 Symtab.strsize, "string table"))
445 return Err;
Kevin Enderby0e52c922016-08-26 19:34:07 +0000446 *SymtabLoadCmd = Load.Ptr;
447 return Error::success();
448}
449
Lang Hames697e7cd2016-12-04 01:56:10 +0000450static Error checkDysymtabCommand(const MachOObjectFile &Obj,
451 const MachOObjectFile::LoadCommandInfo &Load,
452 uint32_t LoadCommandIndex,
453 const char **DysymtabLoadCmd,
454 std::list<MachOElement> &Elements) {
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000455 if (Load.C.cmdsize < sizeof(MachO::dysymtab_command))
456 return malformedError("load command " + Twine(LoadCommandIndex) +
457 " LC_DYSYMTAB cmdsize too small");
458 if (*DysymtabLoadCmd != nullptr)
459 return malformedError("more than one LC_DYSYMTAB command");
460 MachO::dysymtab_command Dysymtab =
461 getStruct<MachO::dysymtab_command>(Obj, Load.Ptr);
462 if (Dysymtab.cmdsize != sizeof(MachO::dysymtab_command))
463 return malformedError("LC_DYSYMTAB command " + Twine(LoadCommandIndex) +
464 " has incorrect cmdsize");
Lang Hames697e7cd2016-12-04 01:56:10 +0000465 uint64_t FileSize = Obj.getData().size();
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000466 if (Dysymtab.tocoff > FileSize)
467 return malformedError("tocoff field of LC_DYSYMTAB command " +
468 Twine(LoadCommandIndex) + " extends past the end of "
469 "the file");
470 uint64_t BigSize = Dysymtab.ntoc;
471 BigSize *= sizeof(MachO::dylib_table_of_contents);
472 BigSize += Dysymtab.tocoff;
473 if (BigSize > FileSize)
474 return malformedError("tocoff field plus ntoc field times sizeof(struct "
475 "dylib_table_of_contents) of LC_DYSYMTAB command " +
476 Twine(LoadCommandIndex) + " extends past the end of "
477 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000478 if (Error Err = checkOverlappingElement(Elements, Dysymtab.tocoff,
479 Dysymtab.ntoc * sizeof(struct
NAKAMURA Takumi6f43bd42017-10-18 13:31:28 +0000480 MachO::dylib_table_of_contents),
481 "table of contents"))
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000482 return Err;
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000483 if (Dysymtab.modtaboff > FileSize)
484 return malformedError("modtaboff field of LC_DYSYMTAB command " +
485 Twine(LoadCommandIndex) + " extends past the end of "
486 "the file");
487 BigSize = Dysymtab.nmodtab;
488 const char *struct_dylib_module_name;
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000489 uint64_t sizeof_modtab;
Lang Hames697e7cd2016-12-04 01:56:10 +0000490 if (Obj.is64Bit()) {
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000491 sizeof_modtab = sizeof(MachO::dylib_module_64);
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000492 struct_dylib_module_name = "struct dylib_module_64";
493 } else {
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000494 sizeof_modtab = sizeof(MachO::dylib_module);
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000495 struct_dylib_module_name = "struct dylib_module";
496 }
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000497 BigSize *= sizeof_modtab;
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000498 BigSize += Dysymtab.modtaboff;
499 if (BigSize > FileSize)
500 return malformedError("modtaboff field plus nmodtab field times sizeof(" +
501 Twine(struct_dylib_module_name) + ") of LC_DYSYMTAB "
502 "command " + Twine(LoadCommandIndex) + " extends "
503 "past the end of the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000504 if (Error Err = checkOverlappingElement(Elements, Dysymtab.modtaboff,
505 Dysymtab.nmodtab * sizeof_modtab,
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +0000506 "module table"))
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000507 return Err;
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000508 if (Dysymtab.extrefsymoff > FileSize)
509 return malformedError("extrefsymoff field of LC_DYSYMTAB command " +
510 Twine(LoadCommandIndex) + " extends past the end of "
511 "the file");
512 BigSize = Dysymtab.nextrefsyms;
513 BigSize *= sizeof(MachO::dylib_reference);
514 BigSize += Dysymtab.extrefsymoff;
515 if (BigSize > FileSize)
516 return malformedError("extrefsymoff field plus nextrefsyms field times "
517 "sizeof(struct dylib_reference) of LC_DYSYMTAB "
518 "command " + Twine(LoadCommandIndex) + " extends "
519 "past the end of the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000520 if (Error Err = checkOverlappingElement(Elements, Dysymtab.extrefsymoff,
521 Dysymtab.nextrefsyms *
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +0000522 sizeof(MachO::dylib_reference),
523 "reference table"))
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000524 return Err;
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000525 if (Dysymtab.indirectsymoff > FileSize)
526 return malformedError("indirectsymoff field of LC_DYSYMTAB command " +
527 Twine(LoadCommandIndex) + " extends past the end of "
528 "the file");
529 BigSize = Dysymtab.nindirectsyms;
530 BigSize *= sizeof(uint32_t);
531 BigSize += Dysymtab.indirectsymoff;
532 if (BigSize > FileSize)
533 return malformedError("indirectsymoff field plus nindirectsyms field times "
534 "sizeof(uint32_t) of LC_DYSYMTAB command " +
535 Twine(LoadCommandIndex) + " extends past the end of "
536 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000537 if (Error Err = checkOverlappingElement(Elements, Dysymtab.indirectsymoff,
538 Dysymtab.nindirectsyms *
539 sizeof(uint32_t),
NAKAMURA Takumi6f43bd42017-10-18 13:31:28 +0000540 "indirect table"))
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000541 return Err;
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000542 if (Dysymtab.extreloff > FileSize)
543 return malformedError("extreloff field of LC_DYSYMTAB command " +
544 Twine(LoadCommandIndex) + " extends past the end of "
545 "the file");
546 BigSize = Dysymtab.nextrel;
547 BigSize *= sizeof(MachO::relocation_info);
548 BigSize += Dysymtab.extreloff;
549 if (BigSize > FileSize)
550 return malformedError("extreloff field plus nextrel field times sizeof"
551 "(struct relocation_info) of LC_DYSYMTAB command " +
552 Twine(LoadCommandIndex) + " extends past the end of "
553 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000554 if (Error Err = checkOverlappingElement(Elements, Dysymtab.extreloff,
555 Dysymtab.nextrel *
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +0000556 sizeof(MachO::relocation_info),
557 "external relocation table"))
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000558 return Err;
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000559 if (Dysymtab.locreloff > FileSize)
560 return malformedError("locreloff field of LC_DYSYMTAB command " +
561 Twine(LoadCommandIndex) + " extends past the end of "
562 "the file");
563 BigSize = Dysymtab.nlocrel;
564 BigSize *= sizeof(MachO::relocation_info);
565 BigSize += Dysymtab.locreloff;
566 if (BigSize > FileSize)
567 return malformedError("locreloff field plus nlocrel field times sizeof"
568 "(struct relocation_info) of LC_DYSYMTAB command " +
569 Twine(LoadCommandIndex) + " extends past the end of "
570 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000571 if (Error Err = checkOverlappingElement(Elements, Dysymtab.locreloff,
572 Dysymtab.nlocrel *
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +0000573 sizeof(MachO::relocation_info),
574 "local relocation table"))
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000575 return Err;
Kevin Enderbydcbc5042016-08-30 21:28:30 +0000576 *DysymtabLoadCmd = Load.Ptr;
577 return Error::success();
578}
579
Lang Hames697e7cd2016-12-04 01:56:10 +0000580static Error checkLinkeditDataCommand(const MachOObjectFile &Obj,
Kevin Enderby9d0c9452016-08-31 17:57:46 +0000581 const MachOObjectFile::LoadCommandInfo &Load,
582 uint32_t LoadCommandIndex,
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000583 const char **LoadCmd, const char *CmdName,
584 std::list<MachOElement> &Elements,
585 const char *ElementName) {
Kevin Enderby9d0c9452016-08-31 17:57:46 +0000586 if (Load.C.cmdsize < sizeof(MachO::linkedit_data_command))
587 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
588 CmdName + " cmdsize too small");
589 if (*LoadCmd != nullptr)
590 return malformedError("more than one " + Twine(CmdName) + " command");
591 MachO::linkedit_data_command LinkData =
592 getStruct<MachO::linkedit_data_command>(Obj, Load.Ptr);
593 if (LinkData.cmdsize != sizeof(MachO::linkedit_data_command))
594 return malformedError(Twine(CmdName) + " command " +
595 Twine(LoadCommandIndex) + " has incorrect cmdsize");
Lang Hames697e7cd2016-12-04 01:56:10 +0000596 uint64_t FileSize = Obj.getData().size();
Kevin Enderby9d0c9452016-08-31 17:57:46 +0000597 if (LinkData.dataoff > FileSize)
598 return malformedError("dataoff field of " + Twine(CmdName) + " command " +
599 Twine(LoadCommandIndex) + " extends past the end of "
600 "the file");
601 uint64_t BigSize = LinkData.dataoff;
602 BigSize += LinkData.datasize;
603 if (BigSize > FileSize)
604 return malformedError("dataoff field plus datasize field of " +
605 Twine(CmdName) + " command " +
606 Twine(LoadCommandIndex) + " extends past the end of "
607 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000608 if (Error Err = checkOverlappingElement(Elements, LinkData.dataoff,
609 LinkData.datasize, ElementName))
610 return Err;
Kevin Enderby9d0c9452016-08-31 17:57:46 +0000611 *LoadCmd = Load.Ptr;
612 return Error::success();
613}
614
Lang Hames697e7cd2016-12-04 01:56:10 +0000615static Error checkDyldInfoCommand(const MachOObjectFile &Obj,
Kevin Enderbyf76b56c2016-09-13 21:42:28 +0000616 const MachOObjectFile::LoadCommandInfo &Load,
617 uint32_t LoadCommandIndex,
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000618 const char **LoadCmd, const char *CmdName,
619 std::list<MachOElement> &Elements) {
Kevin Enderbyf76b56c2016-09-13 21:42:28 +0000620 if (Load.C.cmdsize < sizeof(MachO::dyld_info_command))
621 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
622 CmdName + " cmdsize too small");
623 if (*LoadCmd != nullptr)
624 return malformedError("more than one LC_DYLD_INFO and or LC_DYLD_INFO_ONLY "
625 "command");
626 MachO::dyld_info_command DyldInfo =
627 getStruct<MachO::dyld_info_command>(Obj, Load.Ptr);
628 if (DyldInfo.cmdsize != sizeof(MachO::dyld_info_command))
629 return malformedError(Twine(CmdName) + " command " +
630 Twine(LoadCommandIndex) + " has incorrect cmdsize");
Lang Hames697e7cd2016-12-04 01:56:10 +0000631 uint64_t FileSize = Obj.getData().size();
Kevin Enderbyf76b56c2016-09-13 21:42:28 +0000632 if (DyldInfo.rebase_off > FileSize)
633 return malformedError("rebase_off field of " + Twine(CmdName) +
634 " command " + Twine(LoadCommandIndex) + " extends "
635 "past the end of the file");
636 uint64_t BigSize = DyldInfo.rebase_off;
637 BigSize += DyldInfo.rebase_size;
638 if (BigSize > FileSize)
639 return malformedError("rebase_off field plus rebase_size field of " +
640 Twine(CmdName) + " command " +
641 Twine(LoadCommandIndex) + " extends past the end of "
642 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000643 if (Error Err = checkOverlappingElement(Elements, DyldInfo.rebase_off,
644 DyldInfo.rebase_size,
645 "dyld rebase info"))
646 return Err;
Kevin Enderbyf76b56c2016-09-13 21:42:28 +0000647 if (DyldInfo.bind_off > FileSize)
648 return malformedError("bind_off field of " + Twine(CmdName) +
649 " command " + Twine(LoadCommandIndex) + " extends "
650 "past the end of the file");
651 BigSize = DyldInfo.bind_off;
652 BigSize += DyldInfo.bind_size;
653 if (BigSize > FileSize)
654 return malformedError("bind_off field plus bind_size field of " +
655 Twine(CmdName) + " command " +
656 Twine(LoadCommandIndex) + " extends past the end of "
657 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000658 if (Error Err = checkOverlappingElement(Elements, DyldInfo.bind_off,
659 DyldInfo.bind_size,
660 "dyld bind info"))
661 return Err;
Kevin Enderbyf76b56c2016-09-13 21:42:28 +0000662 if (DyldInfo.weak_bind_off > FileSize)
663 return malformedError("weak_bind_off field of " + Twine(CmdName) +
664 " command " + Twine(LoadCommandIndex) + " extends "
665 "past the end of the file");
666 BigSize = DyldInfo.weak_bind_off;
667 BigSize += DyldInfo.weak_bind_size;
668 if (BigSize > FileSize)
669 return malformedError("weak_bind_off field plus weak_bind_size field of " +
670 Twine(CmdName) + " command " +
671 Twine(LoadCommandIndex) + " extends past the end of "
672 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000673 if (Error Err = checkOverlappingElement(Elements, DyldInfo.weak_bind_off,
674 DyldInfo.weak_bind_size,
675 "dyld weak bind info"))
676 return Err;
Kevin Enderbyf76b56c2016-09-13 21:42:28 +0000677 if (DyldInfo.lazy_bind_off > FileSize)
678 return malformedError("lazy_bind_off field of " + Twine(CmdName) +
679 " command " + Twine(LoadCommandIndex) + " extends "
680 "past the end of the file");
681 BigSize = DyldInfo.lazy_bind_off;
682 BigSize += DyldInfo.lazy_bind_size;
683 if (BigSize > FileSize)
684 return malformedError("lazy_bind_off field plus lazy_bind_size field of " +
685 Twine(CmdName) + " command " +
686 Twine(LoadCommandIndex) + " extends past the end of "
687 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000688 if (Error Err = checkOverlappingElement(Elements, DyldInfo.lazy_bind_off,
689 DyldInfo.lazy_bind_size,
690 "dyld lazy bind info"))
691 return Err;
Kevin Enderbyf76b56c2016-09-13 21:42:28 +0000692 if (DyldInfo.export_off > FileSize)
693 return malformedError("export_off field of " + Twine(CmdName) +
694 " command " + Twine(LoadCommandIndex) + " extends "
695 "past the end of the file");
696 BigSize = DyldInfo.export_off;
697 BigSize += DyldInfo.export_size;
698 if (BigSize > FileSize)
699 return malformedError("export_off field plus export_size field of " +
700 Twine(CmdName) + " command " +
701 Twine(LoadCommandIndex) + " extends past the end of "
702 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +0000703 if (Error Err = checkOverlappingElement(Elements, DyldInfo.export_off,
704 DyldInfo.export_size,
705 "dyld export info"))
706 return Err;
Kevin Enderbyf76b56c2016-09-13 21:42:28 +0000707 *LoadCmd = Load.Ptr;
708 return Error::success();
709}
710
Lang Hames697e7cd2016-12-04 01:56:10 +0000711static Error checkDylibCommand(const MachOObjectFile &Obj,
Kevin Enderbyfc0929a2016-09-20 20:14:14 +0000712 const MachOObjectFile::LoadCommandInfo &Load,
713 uint32_t LoadCommandIndex, const char *CmdName) {
714 if (Load.C.cmdsize < sizeof(MachO::dylib_command))
715 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
716 CmdName + " cmdsize too small");
717 MachO::dylib_command D = getStruct<MachO::dylib_command>(Obj, Load.Ptr);
718 if (D.dylib.name < sizeof(MachO::dylib_command))
719 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
720 CmdName + " name.offset field too small, not past "
721 "the end of the dylib_command struct");
722 if (D.dylib.name >= D.cmdsize)
723 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
724 CmdName + " name.offset field extends past the end "
725 "of the load command");
726 // Make sure there is a null between the starting offset of the name and
727 // the end of the load command.
728 uint32_t i;
729 const char *P = (const char *)Load.Ptr;
730 for (i = D.dylib.name; i < D.cmdsize; i++)
731 if (P[i] == '\0')
732 break;
733 if (i >= D.cmdsize)
734 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
735 CmdName + " library name extends past the end of the "
736 "load command");
737 return Error::success();
738}
739
Lang Hames697e7cd2016-12-04 01:56:10 +0000740static Error checkDylibIdCommand(const MachOObjectFile &Obj,
Kevin Enderbyfc0929a2016-09-20 20:14:14 +0000741 const MachOObjectFile::LoadCommandInfo &Load,
742 uint32_t LoadCommandIndex,
743 const char **LoadCmd) {
744 if (Error Err = checkDylibCommand(Obj, Load, LoadCommandIndex,
745 "LC_ID_DYLIB"))
746 return Err;
747 if (*LoadCmd != nullptr)
748 return malformedError("more than one LC_ID_DYLIB command");
Lang Hames697e7cd2016-12-04 01:56:10 +0000749 if (Obj.getHeader().filetype != MachO::MH_DYLIB &&
750 Obj.getHeader().filetype != MachO::MH_DYLIB_STUB)
Kevin Enderbyfc0929a2016-09-20 20:14:14 +0000751 return malformedError("LC_ID_DYLIB load command in non-dynamic library "
752 "file type");
753 *LoadCmd = Load.Ptr;
754 return Error::success();
755}
756
Lang Hames697e7cd2016-12-04 01:56:10 +0000757static Error checkDyldCommand(const MachOObjectFile &Obj,
Kevin Enderby3e490ef2016-09-27 23:24:13 +0000758 const MachOObjectFile::LoadCommandInfo &Load,
759 uint32_t LoadCommandIndex, const char *CmdName) {
760 if (Load.C.cmdsize < sizeof(MachO::dylinker_command))
761 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
762 CmdName + " cmdsize too small");
763 MachO::dylinker_command D = getStruct<MachO::dylinker_command>(Obj, Load.Ptr);
764 if (D.name < sizeof(MachO::dylinker_command))
765 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
766 CmdName + " name.offset field too small, not past "
767 "the end of the dylinker_command struct");
768 if (D.name >= D.cmdsize)
769 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
770 CmdName + " name.offset field extends past the end "
771 "of the load command");
772 // Make sure there is a null between the starting offset of the name and
773 // the end of the load command.
774 uint32_t i;
775 const char *P = (const char *)Load.Ptr;
776 for (i = D.name; i < D.cmdsize; i++)
777 if (P[i] == '\0')
778 break;
779 if (i >= D.cmdsize)
780 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
781 CmdName + " dyld name extends past the end of the "
782 "load command");
783 return Error::success();
784}
785
Lang Hames697e7cd2016-12-04 01:56:10 +0000786static Error checkVersCommand(const MachOObjectFile &Obj,
Kevin Enderby32359db2016-09-28 21:20:45 +0000787 const MachOObjectFile::LoadCommandInfo &Load,
788 uint32_t LoadCommandIndex,
789 const char **LoadCmd, const char *CmdName) {
790 if (Load.C.cmdsize != sizeof(MachO::version_min_command))
791 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
792 CmdName + " has incorrect cmdsize");
793 if (*LoadCmd != nullptr)
794 return malformedError("more than one LC_VERSION_MIN_MACOSX, "
795 "LC_VERSION_MIN_IPHONEOS, LC_VERSION_MIN_TVOS or "
796 "LC_VERSION_MIN_WATCHOS command");
797 *LoadCmd = Load.Ptr;
798 return Error::success();
799}
800
Kevin Enderbya4579c42017-01-19 17:36:31 +0000801static Error checkNoteCommand(const MachOObjectFile &Obj,
802 const MachOObjectFile::LoadCommandInfo &Load,
803 uint32_t LoadCommandIndex,
804 std::list<MachOElement> &Elements) {
805 if (Load.C.cmdsize != sizeof(MachO::note_command))
Jonas Devlieghere81f5abe2017-09-13 13:43:01 +0000806 return malformedError("load command " + Twine(LoadCommandIndex) +
Kevin Enderbya4579c42017-01-19 17:36:31 +0000807 " LC_NOTE has incorrect cmdsize");
808 MachO::note_command Nt = getStruct<MachO::note_command>(Obj, Load.Ptr);
809 uint64_t FileSize = Obj.getData().size();
810 if (Nt.offset > FileSize)
811 return malformedError("offset field of LC_NOTE command " +
812 Twine(LoadCommandIndex) + " extends "
813 "past the end of the file");
814 uint64_t BigSize = Nt.offset;
815 BigSize += Nt.size;
816 if (BigSize > FileSize)
817 return malformedError("size field plus offset field of LC_NOTE command " +
818 Twine(LoadCommandIndex) + " extends past the end of "
819 "the file");
820 if (Error Err = checkOverlappingElement(Elements, Nt.offset, Nt.size,
821 "LC_NOTE data"))
822 return Err;
823 return Error::success();
824}
825
Steven Wu5b54a422017-01-23 20:07:55 +0000826static Error
827parseBuildVersionCommand(const MachOObjectFile &Obj,
828 const MachOObjectFile::LoadCommandInfo &Load,
829 SmallVectorImpl<const char*> &BuildTools,
830 uint32_t LoadCommandIndex) {
831 MachO::build_version_command BVC =
832 getStruct<MachO::build_version_command>(Obj, Load.Ptr);
833 if (Load.C.cmdsize !=
834 sizeof(MachO::build_version_command) +
835 BVC.ntools * sizeof(MachO::build_tool_version))
836 return malformedError("load command " + Twine(LoadCommandIndex) +
837 " LC_BUILD_VERSION_COMMAND has incorrect cmdsize");
838
839 auto Start = Load.Ptr + sizeof(MachO::build_version_command);
840 BuildTools.resize(BVC.ntools);
841 for (unsigned i = 0; i < BVC.ntools; ++i)
842 BuildTools[i] = Start + i * sizeof(MachO::build_tool_version);
843
844 return Error::success();
845}
846
Lang Hames697e7cd2016-12-04 01:56:10 +0000847static Error checkRpathCommand(const MachOObjectFile &Obj,
Kevin Enderby76966bf2016-09-28 23:16:01 +0000848 const MachOObjectFile::LoadCommandInfo &Load,
849 uint32_t LoadCommandIndex) {
850 if (Load.C.cmdsize < sizeof(MachO::rpath_command))
851 return malformedError("load command " + Twine(LoadCommandIndex) +
852 " LC_RPATH cmdsize too small");
853 MachO::rpath_command R = getStruct<MachO::rpath_command>(Obj, Load.Ptr);
854 if (R.path < sizeof(MachO::rpath_command))
855 return malformedError("load command " + Twine(LoadCommandIndex) +
856 " LC_RPATH path.offset field too small, not past "
857 "the end of the rpath_command struct");
858 if (R.path >= R.cmdsize)
859 return malformedError("load command " + Twine(LoadCommandIndex) +
860 " LC_RPATH path.offset field extends past the end "
861 "of the load command");
862 // Make sure there is a null between the starting offset of the path and
863 // the end of the load command.
864 uint32_t i;
865 const char *P = (const char *)Load.Ptr;
866 for (i = R.path; i < R.cmdsize; i++)
867 if (P[i] == '\0')
868 break;
869 if (i >= R.cmdsize)
870 return malformedError("load command " + Twine(LoadCommandIndex) +
871 " LC_RPATH library name extends past the end of the "
872 "load command");
873 return Error::success();
874}
875
Lang Hames697e7cd2016-12-04 01:56:10 +0000876static Error checkEncryptCommand(const MachOObjectFile &Obj,
Kevin Enderbyf993d6e2016-10-04 20:37:43 +0000877 const MachOObjectFile::LoadCommandInfo &Load,
878 uint32_t LoadCommandIndex,
879 uint64_t cryptoff, uint64_t cryptsize,
880 const char **LoadCmd, const char *CmdName) {
881 if (*LoadCmd != nullptr)
882 return malformedError("more than one LC_ENCRYPTION_INFO and or "
883 "LC_ENCRYPTION_INFO_64 command");
Lang Hames697e7cd2016-12-04 01:56:10 +0000884 uint64_t FileSize = Obj.getData().size();
Kevin Enderbyf993d6e2016-10-04 20:37:43 +0000885 if (cryptoff > FileSize)
886 return malformedError("cryptoff field of " + Twine(CmdName) +
887 " command " + Twine(LoadCommandIndex) + " extends "
888 "past the end of the file");
889 uint64_t BigSize = cryptoff;
890 BigSize += cryptsize;
891 if (BigSize > FileSize)
892 return malformedError("cryptoff field plus cryptsize field of " +
893 Twine(CmdName) + " command " +
894 Twine(LoadCommandIndex) + " extends past the end of "
895 "the file");
896 *LoadCmd = Load.Ptr;
897 return Error::success();
898}
899
Lang Hames697e7cd2016-12-04 01:56:10 +0000900static Error checkLinkerOptCommand(const MachOObjectFile &Obj,
Kevin Enderby68fffa82016-10-11 21:04:39 +0000901 const MachOObjectFile::LoadCommandInfo &Load,
902 uint32_t LoadCommandIndex) {
903 if (Load.C.cmdsize < sizeof(MachO::linker_option_command))
904 return malformedError("load command " + Twine(LoadCommandIndex) +
905 " LC_LINKER_OPTION cmdsize too small");
906 MachO::linker_option_command L =
907 getStruct<MachO::linker_option_command>(Obj, Load.Ptr);
908 // Make sure the count of strings is correct.
909 const char *string = (const char *)Load.Ptr +
910 sizeof(struct MachO::linker_option_command);
911 uint32_t left = L.cmdsize - sizeof(struct MachO::linker_option_command);
912 uint32_t i = 0;
913 while (left > 0) {
914 while (*string == '\0' && left > 0) {
915 string++;
916 left--;
917 }
918 if (left > 0) {
919 i++;
920 uint32_t NullPos = StringRef(string, left).find('\0');
921 uint32_t len = std::min(NullPos, left) + 1;
922 string += len;
923 left -= len;
924 }
925 }
926 if (L.count != i)
927 return malformedError("load command " + Twine(LoadCommandIndex) +
928 " LC_LINKER_OPTION string count " + Twine(L.count) +
929 " does not match number of strings");
930 return Error::success();
931}
932
Lang Hames697e7cd2016-12-04 01:56:10 +0000933static Error checkSubCommand(const MachOObjectFile &Obj,
Kevin Enderby2490de02016-10-17 22:09:25 +0000934 const MachOObjectFile::LoadCommandInfo &Load,
935 uint32_t LoadCommandIndex, const char *CmdName,
936 size_t SizeOfCmd, const char *CmdStructName,
937 uint32_t PathOffset, const char *PathFieldName) {
938 if (PathOffset < SizeOfCmd)
939 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
940 CmdName + " " + PathFieldName + ".offset field too "
941 "small, not past the end of the " + CmdStructName);
942 if (PathOffset >= Load.C.cmdsize)
943 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
944 CmdName + " " + PathFieldName + ".offset field "
945 "extends past the end of the load command");
946 // Make sure there is a null between the starting offset of the path and
947 // the end of the load command.
948 uint32_t i;
949 const char *P = (const char *)Load.Ptr;
950 for (i = PathOffset; i < Load.C.cmdsize; i++)
951 if (P[i] == '\0')
952 break;
953 if (i >= Load.C.cmdsize)
954 return malformedError("load command " + Twine(LoadCommandIndex) + " " +
955 CmdName + " " + PathFieldName + " name extends past "
956 "the end of the load command");
957 return Error::success();
958}
959
Lang Hames697e7cd2016-12-04 01:56:10 +0000960static Error checkThreadCommand(const MachOObjectFile &Obj,
Kevin Enderby210030b2016-10-19 23:44:34 +0000961 const MachOObjectFile::LoadCommandInfo &Load,
962 uint32_t LoadCommandIndex,
963 const char *CmdName) {
964 if (Load.C.cmdsize < sizeof(MachO::thread_command))
965 return malformedError("load command " + Twine(LoadCommandIndex) +
966 CmdName + " cmdsize too small");
967 MachO::thread_command T =
968 getStruct<MachO::thread_command>(Obj, Load.Ptr);
969 const char *state = Load.Ptr + sizeof(MachO::thread_command);
970 const char *end = Load.Ptr + T.cmdsize;
971 uint32_t nflavor = 0;
972 uint32_t cputype = getCPUType(Obj);
973 while (state < end) {
974 if(state + sizeof(uint32_t) > end)
975 return malformedError("load command " + Twine(LoadCommandIndex) +
976 "flavor in " + CmdName + " extends past end of "
977 "command");
978 uint32_t flavor;
979 memcpy(&flavor, state, sizeof(uint32_t));
Lang Hames697e7cd2016-12-04 01:56:10 +0000980 if (Obj.isLittleEndian() != sys::IsLittleEndianHost)
Kevin Enderby210030b2016-10-19 23:44:34 +0000981 sys::swapByteOrder(flavor);
982 state += sizeof(uint32_t);
983
984 if(state + sizeof(uint32_t) > end)
985 return malformedError("load command " + Twine(LoadCommandIndex) +
986 " count in " + CmdName + " extends past end of "
987 "command");
988 uint32_t count;
989 memcpy(&count, state, sizeof(uint32_t));
Lang Hames697e7cd2016-12-04 01:56:10 +0000990 if (Obj.isLittleEndian() != sys::IsLittleEndianHost)
Kevin Enderby210030b2016-10-19 23:44:34 +0000991 sys::swapByteOrder(count);
992 state += sizeof(uint32_t);
993
Kevin Enderbyc3a035d2017-01-23 21:13:29 +0000994 if (cputype == MachO::CPU_TYPE_I386) {
995 if (flavor == MachO::x86_THREAD_STATE32) {
996 if (count != MachO::x86_THREAD_STATE32_COUNT)
997 return malformedError("load command " + Twine(LoadCommandIndex) +
998 " count not x86_THREAD_STATE32_COUNT for "
999 "flavor number " + Twine(nflavor) + " which is "
1000 "a x86_THREAD_STATE32 flavor in " + CmdName +
1001 " command");
1002 if (state + sizeof(MachO::x86_thread_state32_t) > end)
1003 return malformedError("load command " + Twine(LoadCommandIndex) +
1004 " x86_THREAD_STATE32 extends past end of "
1005 "command in " + CmdName + " command");
1006 state += sizeof(MachO::x86_thread_state32_t);
1007 } else {
1008 return malformedError("load command " + Twine(LoadCommandIndex) +
1009 " unknown flavor (" + Twine(flavor) + ") for "
1010 "flavor number " + Twine(nflavor) + " in " +
1011 CmdName + " command");
1012 }
1013 } else if (cputype == MachO::CPU_TYPE_X86_64) {
Kevin Enderby299cd892018-03-08 23:10:38 +00001014 if (flavor == MachO::x86_THREAD_STATE) {
1015 if (count != MachO::x86_THREAD_STATE_COUNT)
1016 return malformedError("load command " + Twine(LoadCommandIndex) +
1017 " count not x86_THREAD_STATE_COUNT for "
1018 "flavor number " + Twine(nflavor) + " which is "
1019 "a x86_THREAD_STATE flavor in " + CmdName +
1020 " command");
1021 if (state + sizeof(MachO::x86_thread_state_t) > end)
1022 return malformedError("load command " + Twine(LoadCommandIndex) +
1023 " x86_THREAD_STATE extends past end of "
1024 "command in " + CmdName + " command");
1025 state += sizeof(MachO::x86_thread_state_t);
1026 } else if (flavor == MachO::x86_FLOAT_STATE) {
1027 if (count != MachO::x86_FLOAT_STATE_COUNT)
1028 return malformedError("load command " + Twine(LoadCommandIndex) +
1029 " count not x86_FLOAT_STATE_COUNT for "
1030 "flavor number " + Twine(nflavor) + " which is "
1031 "a x86_FLOAT_STATE flavor in " + CmdName +
1032 " command");
1033 if (state + sizeof(MachO::x86_float_state_t) > end)
1034 return malformedError("load command " + Twine(LoadCommandIndex) +
1035 " x86_FLOAT_STATE extends past end of "
1036 "command in " + CmdName + " command");
1037 state += sizeof(MachO::x86_float_state_t);
1038 } else if (flavor == MachO::x86_EXCEPTION_STATE) {
1039 if (count != MachO::x86_EXCEPTION_STATE_COUNT)
1040 return malformedError("load command " + Twine(LoadCommandIndex) +
1041 " count not x86_EXCEPTION_STATE_COUNT for "
1042 "flavor number " + Twine(nflavor) + " which is "
1043 "a x86_EXCEPTION_STATE flavor in " + CmdName +
1044 " command");
1045 if (state + sizeof(MachO::x86_exception_state_t) > end)
1046 return malformedError("load command " + Twine(LoadCommandIndex) +
1047 " x86_EXCEPTION_STATE extends past end of "
1048 "command in " + CmdName + " command");
1049 state += sizeof(MachO::x86_exception_state_t);
1050 } else if (flavor == MachO::x86_THREAD_STATE64) {
Kevin Enderby210030b2016-10-19 23:44:34 +00001051 if (count != MachO::x86_THREAD_STATE64_COUNT)
1052 return malformedError("load command " + Twine(LoadCommandIndex) +
1053 " count not x86_THREAD_STATE64_COUNT for "
1054 "flavor number " + Twine(nflavor) + " which is "
1055 "a x86_THREAD_STATE64 flavor in " + CmdName +
1056 " command");
1057 if (state + sizeof(MachO::x86_thread_state64_t) > end)
1058 return malformedError("load command " + Twine(LoadCommandIndex) +
1059 " x86_THREAD_STATE64 extends past end of "
1060 "command in " + CmdName + " command");
1061 state += sizeof(MachO::x86_thread_state64_t);
Kevin Enderby299cd892018-03-08 23:10:38 +00001062 } else if (flavor == MachO::x86_EXCEPTION_STATE64) {
1063 if (count != MachO::x86_EXCEPTION_STATE64_COUNT)
1064 return malformedError("load command " + Twine(LoadCommandIndex) +
1065 " count not x86_EXCEPTION_STATE64_COUNT for "
1066 "flavor number " + Twine(nflavor) + " which is "
1067 "a x86_EXCEPTION_STATE64 flavor in " + CmdName +
1068 " command");
1069 if (state + sizeof(MachO::x86_exception_state64_t) > end)
1070 return malformedError("load command " + Twine(LoadCommandIndex) +
1071 " x86_EXCEPTION_STATE64 extends past end of "
1072 "command in " + CmdName + " command");
1073 state += sizeof(MachO::x86_exception_state64_t);
Kevin Enderby210030b2016-10-19 23:44:34 +00001074 } else {
1075 return malformedError("load command " + Twine(LoadCommandIndex) +
1076 " unknown flavor (" + Twine(flavor) + ") for "
1077 "flavor number " + Twine(nflavor) + " in " +
1078 CmdName + " command");
1079 }
1080 } else if (cputype == MachO::CPU_TYPE_ARM) {
1081 if (flavor == MachO::ARM_THREAD_STATE) {
1082 if (count != MachO::ARM_THREAD_STATE_COUNT)
1083 return malformedError("load command " + Twine(LoadCommandIndex) +
1084 " count not ARM_THREAD_STATE_COUNT for "
1085 "flavor number " + Twine(nflavor) + " which is "
1086 "a ARM_THREAD_STATE flavor in " + CmdName +
1087 " command");
1088 if (state + sizeof(MachO::arm_thread_state32_t) > end)
1089 return malformedError("load command " + Twine(LoadCommandIndex) +
1090 " ARM_THREAD_STATE extends past end of "
1091 "command in " + CmdName + " command");
1092 state += sizeof(MachO::arm_thread_state32_t);
1093 } else {
1094 return malformedError("load command " + Twine(LoadCommandIndex) +
1095 " unknown flavor (" + Twine(flavor) + ") for "
1096 "flavor number " + Twine(nflavor) + " in " +
1097 CmdName + " command");
1098 }
Kevin Enderby7747cb52016-11-03 20:51:28 +00001099 } else if (cputype == MachO::CPU_TYPE_ARM64) {
1100 if (flavor == MachO::ARM_THREAD_STATE64) {
1101 if (count != MachO::ARM_THREAD_STATE64_COUNT)
1102 return malformedError("load command " + Twine(LoadCommandIndex) +
1103 " count not ARM_THREAD_STATE64_COUNT for "
1104 "flavor number " + Twine(nflavor) + " which is "
1105 "a ARM_THREAD_STATE64 flavor in " + CmdName +
1106 " command");
1107 if (state + sizeof(MachO::arm_thread_state64_t) > end)
1108 return malformedError("load command " + Twine(LoadCommandIndex) +
1109 " ARM_THREAD_STATE64 extends past end of "
1110 "command in " + CmdName + " command");
1111 state += sizeof(MachO::arm_thread_state64_t);
1112 } else {
1113 return malformedError("load command " + Twine(LoadCommandIndex) +
1114 " unknown flavor (" + Twine(flavor) + ") for "
1115 "flavor number " + Twine(nflavor) + " in " +
1116 CmdName + " command");
1117 }
Kevin Enderby210030b2016-10-19 23:44:34 +00001118 } else if (cputype == MachO::CPU_TYPE_POWERPC) {
1119 if (flavor == MachO::PPC_THREAD_STATE) {
1120 if (count != MachO::PPC_THREAD_STATE_COUNT)
1121 return malformedError("load command " + Twine(LoadCommandIndex) +
1122 " count not PPC_THREAD_STATE_COUNT for "
1123 "flavor number " + Twine(nflavor) + " which is "
1124 "a PPC_THREAD_STATE flavor in " + CmdName +
1125 " command");
1126 if (state + sizeof(MachO::ppc_thread_state32_t) > end)
1127 return malformedError("load command " + Twine(LoadCommandIndex) +
1128 " PPC_THREAD_STATE extends past end of "
1129 "command in " + CmdName + " command");
1130 state += sizeof(MachO::ppc_thread_state32_t);
1131 } else {
1132 return malformedError("load command " + Twine(LoadCommandIndex) +
1133 " unknown flavor (" + Twine(flavor) + ") for "
1134 "flavor number " + Twine(nflavor) + " in " +
1135 CmdName + " command");
1136 }
1137 } else {
1138 return malformedError("unknown cputype (" + Twine(cputype) + ") load "
1139 "command " + Twine(LoadCommandIndex) + " for " +
1140 CmdName + " command can't be checked");
1141 }
1142 nflavor++;
1143 }
1144 return Error::success();
1145}
1146
Lang Hames697e7cd2016-12-04 01:56:10 +00001147static Error checkTwoLevelHintsCommand(const MachOObjectFile &Obj,
Kevin Enderbyc8bb4222016-10-20 20:10:30 +00001148 const MachOObjectFile::LoadCommandInfo
1149 &Load,
1150 uint32_t LoadCommandIndex,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001151 const char **LoadCmd,
1152 std::list<MachOElement> &Elements) {
Kevin Enderbyc8bb4222016-10-20 20:10:30 +00001153 if (Load.C.cmdsize != sizeof(MachO::twolevel_hints_command))
1154 return malformedError("load command " + Twine(LoadCommandIndex) +
1155 " LC_TWOLEVEL_HINTS has incorrect cmdsize");
1156 if (*LoadCmd != nullptr)
1157 return malformedError("more than one LC_TWOLEVEL_HINTS command");
1158 MachO::twolevel_hints_command Hints =
1159 getStruct<MachO::twolevel_hints_command>(Obj, Load.Ptr);
Lang Hames697e7cd2016-12-04 01:56:10 +00001160 uint64_t FileSize = Obj.getData().size();
Kevin Enderbyc8bb4222016-10-20 20:10:30 +00001161 if (Hints.offset > FileSize)
1162 return malformedError("offset field of LC_TWOLEVEL_HINTS command " +
1163 Twine(LoadCommandIndex) + " extends past the end of "
1164 "the file");
1165 uint64_t BigSize = Hints.nhints;
Jessica Paquette1a81dfb2017-10-17 20:43:33 +00001166 BigSize *= sizeof(MachO::twolevel_hint);
Kevin Enderbyc8bb4222016-10-20 20:10:30 +00001167 BigSize += Hints.offset;
1168 if (BigSize > FileSize)
1169 return malformedError("offset field plus nhints times sizeof(struct "
1170 "twolevel_hint) field of LC_TWOLEVEL_HINTS command " +
1171 Twine(LoadCommandIndex) + " extends past the end of "
1172 "the file");
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001173 if (Error Err = checkOverlappingElement(Elements, Hints.offset, Hints.nhints *
1174 sizeof(MachO::twolevel_hint),
1175 "two level hints"))
1176 return Err;
Kevin Enderbyc8bb4222016-10-20 20:10:30 +00001177 *LoadCmd = Load.Ptr;
1178 return Error::success();
1179}
1180
Kevin Enderbybc5c29a2016-10-27 20:59:10 +00001181// Returns true if the libObject code does not support the load command and its
1182// contents. The cmd value it is treated as an unknown load command but with
1183// an error message that says the cmd value is obsolete.
1184static bool isLoadCommandObsolete(uint32_t cmd) {
1185 if (cmd == MachO::LC_SYMSEG ||
1186 cmd == MachO::LC_LOADFVMLIB ||
1187 cmd == MachO::LC_IDFVMLIB ||
1188 cmd == MachO::LC_IDENT ||
1189 cmd == MachO::LC_FVMFILE ||
1190 cmd == MachO::LC_PREPAGE ||
1191 cmd == MachO::LC_PREBOUND_DYLIB ||
1192 cmd == MachO::LC_TWOLEVEL_HINTS ||
1193 cmd == MachO::LC_PREBIND_CKSUM)
1194 return true;
1195 return false;
1196}
1197
Lang Hames82627642016-03-25 21:59:14 +00001198Expected<std::unique_ptr<MachOObjectFile>>
1199MachOObjectFile::create(MemoryBufferRef Object, bool IsLittleEndian,
Kevin Enderby79d6c632016-10-24 21:15:11 +00001200 bool Is64Bits, uint32_t UniversalCputype,
1201 uint32_t UniversalIndex) {
Mehdi Amini41af4302016-11-11 04:28:40 +00001202 Error Err = Error::success();
Lang Hames82627642016-03-25 21:59:14 +00001203 std::unique_ptr<MachOObjectFile> Obj(
1204 new MachOObjectFile(std::move(Object), IsLittleEndian,
Kevin Enderby79d6c632016-10-24 21:15:11 +00001205 Is64Bits, Err, UniversalCputype,
1206 UniversalIndex));
Lang Hames82627642016-03-25 21:59:14 +00001207 if (Err)
1208 return std::move(Err);
1209 return std::move(Obj);
1210}
1211
Rafael Espindola48af1c22014-08-19 18:44:46 +00001212MachOObjectFile::MachOObjectFile(MemoryBufferRef Object, bool IsLittleEndian,
Kevin Enderby79d6c632016-10-24 21:15:11 +00001213 bool Is64bits, Error &Err,
1214 uint32_t UniversalCputype,
1215 uint32_t UniversalIndex)
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00001216 : ObjectFile(getMachOType(IsLittleEndian, Is64bits), Object) {
Lang Hames5e51a2e2016-07-22 16:11:25 +00001217 ErrorAsOutParameter ErrAsOutParam(&Err);
Kevin Enderbyc614d282016-08-12 20:10:25 +00001218 uint64_t SizeOfHeaders;
Kevin Enderby79d6c632016-10-24 21:15:11 +00001219 uint32_t cputype;
Kevin Enderby87025742016-04-13 21:17:58 +00001220 if (is64Bit()) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001221 parseHeader(*this, Header64, Err);
Kevin Enderbyc614d282016-08-12 20:10:25 +00001222 SizeOfHeaders = sizeof(MachO::mach_header_64);
Kevin Enderby79d6c632016-10-24 21:15:11 +00001223 cputype = Header64.cputype;
Kevin Enderby87025742016-04-13 21:17:58 +00001224 } else {
Lang Hames697e7cd2016-12-04 01:56:10 +00001225 parseHeader(*this, Header, Err);
Kevin Enderbyc614d282016-08-12 20:10:25 +00001226 SizeOfHeaders = sizeof(MachO::mach_header);
Kevin Enderby79d6c632016-10-24 21:15:11 +00001227 cputype = Header.cputype;
Kevin Enderby87025742016-04-13 21:17:58 +00001228 }
Lang Hames9e964f32016-03-25 17:25:34 +00001229 if (Err)
Alexey Samsonov9f336632015-06-04 19:45:22 +00001230 return;
Kevin Enderbyc614d282016-08-12 20:10:25 +00001231 SizeOfHeaders += getHeader().sizeofcmds;
1232 if (getData().data() + SizeOfHeaders > getData().end()) {
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00001233 Err = malformedError("load commands extend past the end of the file");
Kevin Enderby87025742016-04-13 21:17:58 +00001234 return;
1235 }
Kevin Enderby79d6c632016-10-24 21:15:11 +00001236 if (UniversalCputype != 0 && cputype != UniversalCputype) {
1237 Err = malformedError("universal header architecture: " +
1238 Twine(UniversalIndex) + "'s cputype does not match "
1239 "object file's mach header");
1240 return;
1241 }
Kevin Enderbyd5039402016-10-31 20:29:48 +00001242 std::list<MachOElement> Elements;
1243 Elements.push_back({0, SizeOfHeaders, "Mach-O headers"});
Alexey Samsonov13415ed2015-06-04 19:22:03 +00001244
1245 uint32_t LoadCommandCount = getHeader().ncmds;
Lang Hames9e964f32016-03-25 17:25:34 +00001246 LoadCommandInfo Load;
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001247 if (LoadCommandCount != 0) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001248 if (auto LoadOrErr = getFirstLoadCommandInfo(*this))
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001249 Load = *LoadOrErr;
1250 else {
1251 Err = LoadOrErr.takeError();
1252 return;
1253 }
Alexey Samsonovde5a94a2015-06-04 19:57:46 +00001254 }
Lang Hames9e964f32016-03-25 17:25:34 +00001255
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001256 const char *DyldIdLoadCmd = nullptr;
Kevin Enderby90986e62016-09-26 21:11:03 +00001257 const char *FuncStartsLoadCmd = nullptr;
1258 const char *SplitInfoLoadCmd = nullptr;
1259 const char *CodeSignDrsLoadCmd = nullptr;
Kevin Enderby89baf992016-10-18 20:24:12 +00001260 const char *CodeSignLoadCmd = nullptr;
Kevin Enderby32359db2016-09-28 21:20:45 +00001261 const char *VersLoadCmd = nullptr;
Kevin Enderby245be3e2016-09-29 17:45:23 +00001262 const char *SourceLoadCmd = nullptr;
Kevin Enderby4f229d82016-09-29 21:07:29 +00001263 const char *EntryPointLoadCmd = nullptr;
Kevin Enderbyf993d6e2016-10-04 20:37:43 +00001264 const char *EncryptLoadCmd = nullptr;
Kevin Enderby6f695822016-10-18 17:54:17 +00001265 const char *RoutinesLoadCmd = nullptr;
Kevin Enderby210030b2016-10-19 23:44:34 +00001266 const char *UnixThreadLoadCmd = nullptr;
Kevin Enderbyc8bb4222016-10-20 20:10:30 +00001267 const char *TwoLevelHintsLoadCmd = nullptr;
Alexey Samsonovd319c4f2015-06-03 22:19:36 +00001268 for (unsigned I = 0; I < LoadCommandCount; ++I) {
Kevin Enderby1851a822016-07-07 22:11:42 +00001269 if (is64Bit()) {
1270 if (Load.C.cmdsize % 8 != 0) {
1271 // We have a hack here to allow 64-bit Mach-O core files to have
1272 // LC_THREAD commands that are only a multiple of 4 and not 8 to be
1273 // allowed since the macOS kernel produces them.
1274 if (getHeader().filetype != MachO::MH_CORE ||
1275 Load.C.cmd != MachO::LC_THREAD || Load.C.cmdsize % 4) {
1276 Err = malformedError("load command " + Twine(I) + " cmdsize not a "
1277 "multiple of 8");
1278 return;
1279 }
1280 }
1281 } else {
1282 if (Load.C.cmdsize % 4 != 0) {
1283 Err = malformedError("load command " + Twine(I) + " cmdsize not a "
1284 "multiple of 4");
1285 return;
1286 }
1287 }
Alexey Samsonovd319c4f2015-06-03 22:19:36 +00001288 LoadCommands.push_back(Load);
Charles Davis8bdfafd2013-09-01 04:28:48 +00001289 if (Load.C.cmd == MachO::LC_SYMTAB) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001290 if ((Err = checkSymtabCommand(*this, Load, I, &SymtabLoadCmd, Elements)))
David Majnemer73cc6ff2014-11-13 19:48:56 +00001291 return;
Charles Davis8bdfafd2013-09-01 04:28:48 +00001292 } else if (Load.C.cmd == MachO::LC_DYSYMTAB) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001293 if ((Err = checkDysymtabCommand(*this, Load, I, &DysymtabLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001294 Elements)))
David Majnemer73cc6ff2014-11-13 19:48:56 +00001295 return;
Charles Davis8bdfafd2013-09-01 04:28:48 +00001296 } else if (Load.C.cmd == MachO::LC_DATA_IN_CODE) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001297 if ((Err = checkLinkeditDataCommand(*this, Load, I, &DataInCodeLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001298 "LC_DATA_IN_CODE", Elements,
1299 "data in code info")))
David Majnemer73cc6ff2014-11-13 19:48:56 +00001300 return;
Kevin Enderby9a509442015-01-27 21:28:24 +00001301 } else if (Load.C.cmd == MachO::LC_LINKER_OPTIMIZATION_HINT) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001302 if ((Err = checkLinkeditDataCommand(*this, Load, I, &LinkOptHintsLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001303 "LC_LINKER_OPTIMIZATION_HINT",
1304 Elements, "linker optimization "
1305 "hints")))
Kevin Enderby9a509442015-01-27 21:28:24 +00001306 return;
Kevin Enderby90986e62016-09-26 21:11:03 +00001307 } else if (Load.C.cmd == MachO::LC_FUNCTION_STARTS) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001308 if ((Err = checkLinkeditDataCommand(*this, Load, I, &FuncStartsLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001309 "LC_FUNCTION_STARTS", Elements,
1310 "function starts data")))
Kevin Enderby90986e62016-09-26 21:11:03 +00001311 return;
1312 } else if (Load.C.cmd == MachO::LC_SEGMENT_SPLIT_INFO) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001313 if ((Err = checkLinkeditDataCommand(*this, Load, I, &SplitInfoLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001314 "LC_SEGMENT_SPLIT_INFO", Elements,
1315 "split info data")))
Kevin Enderby90986e62016-09-26 21:11:03 +00001316 return;
1317 } else if (Load.C.cmd == MachO::LC_DYLIB_CODE_SIGN_DRS) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001318 if ((Err = checkLinkeditDataCommand(*this, Load, I, &CodeSignDrsLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001319 "LC_DYLIB_CODE_SIGN_DRS", Elements,
1320 "code signing RDs data")))
Kevin Enderby90986e62016-09-26 21:11:03 +00001321 return;
Kevin Enderby89baf992016-10-18 20:24:12 +00001322 } else if (Load.C.cmd == MachO::LC_CODE_SIGNATURE) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001323 if ((Err = checkLinkeditDataCommand(*this, Load, I, &CodeSignLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001324 "LC_CODE_SIGNATURE", Elements,
1325 "code signature data")))
Kevin Enderby89baf992016-10-18 20:24:12 +00001326 return;
Kevin Enderbyf76b56c2016-09-13 21:42:28 +00001327 } else if (Load.C.cmd == MachO::LC_DYLD_INFO) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001328 if ((Err = checkDyldInfoCommand(*this, Load, I, &DyldInfoLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001329 "LC_DYLD_INFO", Elements)))
David Majnemer73cc6ff2014-11-13 19:48:56 +00001330 return;
Kevin Enderbyf76b56c2016-09-13 21:42:28 +00001331 } else if (Load.C.cmd == MachO::LC_DYLD_INFO_ONLY) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001332 if ((Err = checkDyldInfoCommand(*this, Load, I, &DyldInfoLoadCmd,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001333 "LC_DYLD_INFO_ONLY", Elements)))
Kevin Enderbyf76b56c2016-09-13 21:42:28 +00001334 return;
Alexander Potapenko6909b5b2014-10-15 23:35:45 +00001335 } else if (Load.C.cmd == MachO::LC_UUID) {
Kevin Enderbye71e13c2016-09-21 20:03:09 +00001336 if (Load.C.cmdsize != sizeof(MachO::uuid_command)) {
1337 Err = malformedError("LC_UUID command " + Twine(I) + " has incorrect "
1338 "cmdsize");
1339 return;
1340 }
David Majnemer73cc6ff2014-11-13 19:48:56 +00001341 if (UuidLoadCmd) {
Kevin Enderbye71e13c2016-09-21 20:03:09 +00001342 Err = malformedError("more than one LC_UUID command");
David Majnemer73cc6ff2014-11-13 19:48:56 +00001343 return;
1344 }
Alexander Potapenko6909b5b2014-10-15 23:35:45 +00001345 UuidLoadCmd = Load.Ptr;
Alexey Samsonove1a76ab2015-06-04 22:08:37 +00001346 } else if (Load.C.cmd == MachO::LC_SEGMENT_64) {
Kevin Enderbyc614d282016-08-12 20:10:25 +00001347 if ((Err = parseSegmentLoadCommand<MachO::segment_command_64,
1348 MachO::section_64>(
Lang Hames697e7cd2016-12-04 01:56:10 +00001349 *this, Load, Sections, HasPageZeroSegment, I,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001350 "LC_SEGMENT_64", SizeOfHeaders, Elements)))
Alexey Samsonov074da9b2015-06-04 20:08:52 +00001351 return;
Alexey Samsonove1a76ab2015-06-04 22:08:37 +00001352 } else if (Load.C.cmd == MachO::LC_SEGMENT) {
Kevin Enderbyc614d282016-08-12 20:10:25 +00001353 if ((Err = parseSegmentLoadCommand<MachO::segment_command,
1354 MachO::section>(
Lang Hames697e7cd2016-12-04 01:56:10 +00001355 *this, Load, Sections, HasPageZeroSegment, I,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001356 "LC_SEGMENT", SizeOfHeaders, Elements)))
Alexey Samsonov074da9b2015-06-04 20:08:52 +00001357 return;
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001358 } else if (Load.C.cmd == MachO::LC_ID_DYLIB) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001359 if ((Err = checkDylibIdCommand(*this, Load, I, &DyldIdLoadCmd)))
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001360 return;
1361 } else if (Load.C.cmd == MachO::LC_LOAD_DYLIB) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001362 if ((Err = checkDylibCommand(*this, Load, I, "LC_LOAD_DYLIB")))
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001363 return;
1364 Libraries.push_back(Load.Ptr);
1365 } else if (Load.C.cmd == MachO::LC_LOAD_WEAK_DYLIB) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001366 if ((Err = checkDylibCommand(*this, Load, I, "LC_LOAD_WEAK_DYLIB")))
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001367 return;
1368 Libraries.push_back(Load.Ptr);
1369 } else if (Load.C.cmd == MachO::LC_LAZY_LOAD_DYLIB) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001370 if ((Err = checkDylibCommand(*this, Load, I, "LC_LAZY_LOAD_DYLIB")))
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001371 return;
1372 Libraries.push_back(Load.Ptr);
1373 } else if (Load.C.cmd == MachO::LC_REEXPORT_DYLIB) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001374 if ((Err = checkDylibCommand(*this, Load, I, "LC_REEXPORT_DYLIB")))
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001375 return;
1376 Libraries.push_back(Load.Ptr);
1377 } else if (Load.C.cmd == MachO::LC_LOAD_UPWARD_DYLIB) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001378 if ((Err = checkDylibCommand(*this, Load, I, "LC_LOAD_UPWARD_DYLIB")))
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001379 return;
Kevin Enderby980b2582014-06-05 21:21:57 +00001380 Libraries.push_back(Load.Ptr);
Kevin Enderby3e490ef2016-09-27 23:24:13 +00001381 } else if (Load.C.cmd == MachO::LC_ID_DYLINKER) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001382 if ((Err = checkDyldCommand(*this, Load, I, "LC_ID_DYLINKER")))
Kevin Enderby3e490ef2016-09-27 23:24:13 +00001383 return;
1384 } else if (Load.C.cmd == MachO::LC_LOAD_DYLINKER) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001385 if ((Err = checkDyldCommand(*this, Load, I, "LC_LOAD_DYLINKER")))
Kevin Enderby3e490ef2016-09-27 23:24:13 +00001386 return;
1387 } else if (Load.C.cmd == MachO::LC_DYLD_ENVIRONMENT) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001388 if ((Err = checkDyldCommand(*this, Load, I, "LC_DYLD_ENVIRONMENT")))
Kevin Enderby3e490ef2016-09-27 23:24:13 +00001389 return;
Kevin Enderby32359db2016-09-28 21:20:45 +00001390 } else if (Load.C.cmd == MachO::LC_VERSION_MIN_MACOSX) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001391 if ((Err = checkVersCommand(*this, Load, I, &VersLoadCmd,
Kevin Enderby32359db2016-09-28 21:20:45 +00001392 "LC_VERSION_MIN_MACOSX")))
1393 return;
1394 } else if (Load.C.cmd == MachO::LC_VERSION_MIN_IPHONEOS) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001395 if ((Err = checkVersCommand(*this, Load, I, &VersLoadCmd,
Kevin Enderby32359db2016-09-28 21:20:45 +00001396 "LC_VERSION_MIN_IPHONEOS")))
1397 return;
1398 } else if (Load.C.cmd == MachO::LC_VERSION_MIN_TVOS) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001399 if ((Err = checkVersCommand(*this, Load, I, &VersLoadCmd,
Kevin Enderby32359db2016-09-28 21:20:45 +00001400 "LC_VERSION_MIN_TVOS")))
1401 return;
1402 } else if (Load.C.cmd == MachO::LC_VERSION_MIN_WATCHOS) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001403 if ((Err = checkVersCommand(*this, Load, I, &VersLoadCmd,
Kevin Enderby32359db2016-09-28 21:20:45 +00001404 "LC_VERSION_MIN_WATCHOS")))
1405 return;
Kevin Enderbya4579c42017-01-19 17:36:31 +00001406 } else if (Load.C.cmd == MachO::LC_NOTE) {
1407 if ((Err = checkNoteCommand(*this, Load, I, Elements)))
1408 return;
Steven Wu5b54a422017-01-23 20:07:55 +00001409 } else if (Load.C.cmd == MachO::LC_BUILD_VERSION) {
1410 if ((Err = parseBuildVersionCommand(*this, Load, BuildTools, I)))
1411 return;
Kevin Enderby76966bf2016-09-28 23:16:01 +00001412 } else if (Load.C.cmd == MachO::LC_RPATH) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001413 if ((Err = checkRpathCommand(*this, Load, I)))
Kevin Enderby76966bf2016-09-28 23:16:01 +00001414 return;
Kevin Enderby245be3e2016-09-29 17:45:23 +00001415 } else if (Load.C.cmd == MachO::LC_SOURCE_VERSION) {
1416 if (Load.C.cmdsize != sizeof(MachO::source_version_command)) {
1417 Err = malformedError("LC_SOURCE_VERSION command " + Twine(I) +
1418 " has incorrect cmdsize");
1419 return;
1420 }
1421 if (SourceLoadCmd) {
1422 Err = malformedError("more than one LC_SOURCE_VERSION command");
1423 return;
1424 }
1425 SourceLoadCmd = Load.Ptr;
Kevin Enderby4f229d82016-09-29 21:07:29 +00001426 } else if (Load.C.cmd == MachO::LC_MAIN) {
1427 if (Load.C.cmdsize != sizeof(MachO::entry_point_command)) {
1428 Err = malformedError("LC_MAIN command " + Twine(I) +
1429 " has incorrect cmdsize");
1430 return;
1431 }
1432 if (EntryPointLoadCmd) {
1433 Err = malformedError("more than one LC_MAIN command");
1434 return;
1435 }
1436 EntryPointLoadCmd = Load.Ptr;
Kevin Enderbyf993d6e2016-10-04 20:37:43 +00001437 } else if (Load.C.cmd == MachO::LC_ENCRYPTION_INFO) {
1438 if (Load.C.cmdsize != sizeof(MachO::encryption_info_command)) {
1439 Err = malformedError("LC_ENCRYPTION_INFO command " + Twine(I) +
1440 " has incorrect cmdsize");
1441 return;
1442 }
1443 MachO::encryption_info_command E =
Lang Hames697e7cd2016-12-04 01:56:10 +00001444 getStruct<MachO::encryption_info_command>(*this, Load.Ptr);
1445 if ((Err = checkEncryptCommand(*this, Load, I, E.cryptoff, E.cryptsize,
Kevin Enderbyf993d6e2016-10-04 20:37:43 +00001446 &EncryptLoadCmd, "LC_ENCRYPTION_INFO")))
1447 return;
1448 } else if (Load.C.cmd == MachO::LC_ENCRYPTION_INFO_64) {
1449 if (Load.C.cmdsize != sizeof(MachO::encryption_info_command_64)) {
1450 Err = malformedError("LC_ENCRYPTION_INFO_64 command " + Twine(I) +
1451 " has incorrect cmdsize");
1452 return;
1453 }
1454 MachO::encryption_info_command_64 E =
Lang Hames697e7cd2016-12-04 01:56:10 +00001455 getStruct<MachO::encryption_info_command_64>(*this, Load.Ptr);
1456 if ((Err = checkEncryptCommand(*this, Load, I, E.cryptoff, E.cryptsize,
Kevin Enderbyf993d6e2016-10-04 20:37:43 +00001457 &EncryptLoadCmd, "LC_ENCRYPTION_INFO_64")))
1458 return;
Kevin Enderby68fffa82016-10-11 21:04:39 +00001459 } else if (Load.C.cmd == MachO::LC_LINKER_OPTION) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001460 if ((Err = checkLinkerOptCommand(*this, Load, I)))
Kevin Enderby68fffa82016-10-11 21:04:39 +00001461 return;
Kevin Enderby2490de02016-10-17 22:09:25 +00001462 } else if (Load.C.cmd == MachO::LC_SUB_FRAMEWORK) {
1463 if (Load.C.cmdsize < sizeof(MachO::sub_framework_command)) {
1464 Err = malformedError("load command " + Twine(I) +
1465 " LC_SUB_FRAMEWORK cmdsize too small");
1466 return;
1467 }
1468 MachO::sub_framework_command S =
Lang Hames697e7cd2016-12-04 01:56:10 +00001469 getStruct<MachO::sub_framework_command>(*this, Load.Ptr);
1470 if ((Err = checkSubCommand(*this, Load, I, "LC_SUB_FRAMEWORK",
Kevin Enderby2490de02016-10-17 22:09:25 +00001471 sizeof(MachO::sub_framework_command),
1472 "sub_framework_command", S.umbrella,
1473 "umbrella")))
1474 return;
1475 } else if (Load.C.cmd == MachO::LC_SUB_UMBRELLA) {
1476 if (Load.C.cmdsize < sizeof(MachO::sub_umbrella_command)) {
1477 Err = malformedError("load command " + Twine(I) +
1478 " LC_SUB_UMBRELLA cmdsize too small");
1479 return;
1480 }
1481 MachO::sub_umbrella_command S =
Lang Hames697e7cd2016-12-04 01:56:10 +00001482 getStruct<MachO::sub_umbrella_command>(*this, Load.Ptr);
1483 if ((Err = checkSubCommand(*this, Load, I, "LC_SUB_UMBRELLA",
Kevin Enderby2490de02016-10-17 22:09:25 +00001484 sizeof(MachO::sub_umbrella_command),
1485 "sub_umbrella_command", S.sub_umbrella,
1486 "sub_umbrella")))
1487 return;
1488 } else if (Load.C.cmd == MachO::LC_SUB_LIBRARY) {
1489 if (Load.C.cmdsize < sizeof(MachO::sub_library_command)) {
1490 Err = malformedError("load command " + Twine(I) +
1491 " LC_SUB_LIBRARY cmdsize too small");
1492 return;
1493 }
1494 MachO::sub_library_command S =
Lang Hames697e7cd2016-12-04 01:56:10 +00001495 getStruct<MachO::sub_library_command>(*this, Load.Ptr);
1496 if ((Err = checkSubCommand(*this, Load, I, "LC_SUB_LIBRARY",
Kevin Enderby2490de02016-10-17 22:09:25 +00001497 sizeof(MachO::sub_library_command),
1498 "sub_library_command", S.sub_library,
1499 "sub_library")))
1500 return;
1501 } else if (Load.C.cmd == MachO::LC_SUB_CLIENT) {
1502 if (Load.C.cmdsize < sizeof(MachO::sub_client_command)) {
1503 Err = malformedError("load command " + Twine(I) +
1504 " LC_SUB_CLIENT cmdsize too small");
1505 return;
1506 }
1507 MachO::sub_client_command S =
Lang Hames697e7cd2016-12-04 01:56:10 +00001508 getStruct<MachO::sub_client_command>(*this, Load.Ptr);
1509 if ((Err = checkSubCommand(*this, Load, I, "LC_SUB_CLIENT",
Kevin Enderby2490de02016-10-17 22:09:25 +00001510 sizeof(MachO::sub_client_command),
1511 "sub_client_command", S.client, "client")))
1512 return;
Kevin Enderby6f695822016-10-18 17:54:17 +00001513 } else if (Load.C.cmd == MachO::LC_ROUTINES) {
1514 if (Load.C.cmdsize != sizeof(MachO::routines_command)) {
1515 Err = malformedError("LC_ROUTINES command " + Twine(I) +
1516 " has incorrect cmdsize");
1517 return;
1518 }
1519 if (RoutinesLoadCmd) {
1520 Err = malformedError("more than one LC_ROUTINES and or LC_ROUTINES_64 "
1521 "command");
1522 return;
1523 }
1524 RoutinesLoadCmd = Load.Ptr;
1525 } else if (Load.C.cmd == MachO::LC_ROUTINES_64) {
1526 if (Load.C.cmdsize != sizeof(MachO::routines_command_64)) {
1527 Err = malformedError("LC_ROUTINES_64 command " + Twine(I) +
1528 " has incorrect cmdsize");
1529 return;
1530 }
1531 if (RoutinesLoadCmd) {
1532 Err = malformedError("more than one LC_ROUTINES_64 and or LC_ROUTINES "
1533 "command");
1534 return;
1535 }
1536 RoutinesLoadCmd = Load.Ptr;
Kevin Enderby210030b2016-10-19 23:44:34 +00001537 } else if (Load.C.cmd == MachO::LC_UNIXTHREAD) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001538 if ((Err = checkThreadCommand(*this, Load, I, "LC_UNIXTHREAD")))
Kevin Enderby210030b2016-10-19 23:44:34 +00001539 return;
1540 if (UnixThreadLoadCmd) {
1541 Err = malformedError("more than one LC_UNIXTHREAD command");
1542 return;
1543 }
1544 UnixThreadLoadCmd = Load.Ptr;
1545 } else if (Load.C.cmd == MachO::LC_THREAD) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001546 if ((Err = checkThreadCommand(*this, Load, I, "LC_THREAD")))
Kevin Enderby210030b2016-10-19 23:44:34 +00001547 return;
Kevin Enderbybc5c29a2016-10-27 20:59:10 +00001548 // Note: LC_TWOLEVEL_HINTS is really obsolete and is not supported.
Kevin Enderbyc8bb4222016-10-20 20:10:30 +00001549 } else if (Load.C.cmd == MachO::LC_TWOLEVEL_HINTS) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001550 if ((Err = checkTwoLevelHintsCommand(*this, Load, I,
Kevin Enderbyfbebe162016-11-02 21:08:39 +00001551 &TwoLevelHintsLoadCmd, Elements)))
Kevin Enderbyc8bb4222016-10-20 20:10:30 +00001552 return;
Kevin Enderbybc5c29a2016-10-27 20:59:10 +00001553 } else if (isLoadCommandObsolete(Load.C.cmd)) {
1554 Err = malformedError("load command " + Twine(I) + " for cmd value of: " +
1555 Twine(Load.C.cmd) + " is obsolete and not "
1556 "supported");
1557 return;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001558 }
Kevin Enderbybc5c29a2016-10-27 20:59:10 +00001559 // TODO: generate a error for unknown load commands by default. But still
1560 // need work out an approach to allow or not allow unknown values like this
1561 // as an option for some uses like lldb.
Alexey Samsonovde5a94a2015-06-04 19:57:46 +00001562 if (I < LoadCommandCount - 1) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001563 if (auto LoadOrErr = getNextLoadCommandInfo(*this, I, Load))
Lang Hames9e964f32016-03-25 17:25:34 +00001564 Load = *LoadOrErr;
1565 else {
1566 Err = LoadOrErr.takeError();
Alexey Samsonovde5a94a2015-06-04 19:57:46 +00001567 return;
1568 }
Alexey Samsonovde5a94a2015-06-04 19:57:46 +00001569 }
Rafael Espindola56f976f2013-04-18 18:08:55 +00001570 }
Kevin Enderby1829c682016-01-22 22:49:55 +00001571 if (!SymtabLoadCmd) {
1572 if (DysymtabLoadCmd) {
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00001573 Err = malformedError("contains LC_DYSYMTAB load command without a "
Kevin Enderby89134962016-05-05 23:41:05 +00001574 "LC_SYMTAB load command");
Kevin Enderby1829c682016-01-22 22:49:55 +00001575 return;
1576 }
1577 } else if (DysymtabLoadCmd) {
1578 MachO::symtab_command Symtab =
Lang Hames697e7cd2016-12-04 01:56:10 +00001579 getStruct<MachO::symtab_command>(*this, SymtabLoadCmd);
Kevin Enderby1829c682016-01-22 22:49:55 +00001580 MachO::dysymtab_command Dysymtab =
Lang Hames697e7cd2016-12-04 01:56:10 +00001581 getStruct<MachO::dysymtab_command>(*this, DysymtabLoadCmd);
Kevin Enderby1829c682016-01-22 22:49:55 +00001582 if (Dysymtab.nlocalsym != 0 && Dysymtab.ilocalsym > Symtab.nsyms) {
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00001583 Err = malformedError("ilocalsym in LC_DYSYMTAB load command "
Kevin Enderby89134962016-05-05 23:41:05 +00001584 "extends past the end of the symbol table");
Kevin Enderby1829c682016-01-22 22:49:55 +00001585 return;
1586 }
Kevin Enderby5e55d172016-04-21 20:29:49 +00001587 uint64_t BigSize = Dysymtab.ilocalsym;
1588 BigSize += Dysymtab.nlocalsym;
1589 if (Dysymtab.nlocalsym != 0 && BigSize > Symtab.nsyms) {
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00001590 Err = malformedError("ilocalsym plus nlocalsym in LC_DYSYMTAB load "
Kevin Enderby89134962016-05-05 23:41:05 +00001591 "command extends past the end of the symbol table");
Kevin Enderby1829c682016-01-22 22:49:55 +00001592 return;
1593 }
Francis Visoiu Mistrih7690af42018-09-04 16:31:48 +00001594 if (Dysymtab.nextdefsym != 0 && Dysymtab.iextdefsym > Symtab.nsyms) {
Francis Visoiu Mistrih2d3f01c2018-09-04 16:31:53 +00001595 Err = malformedError("iextdefsym in LC_DYSYMTAB load command "
Kevin Enderby89134962016-05-05 23:41:05 +00001596 "extends past the end of the symbol table");
Kevin Enderby1829c682016-01-22 22:49:55 +00001597 return;
1598 }
Kevin Enderby5e55d172016-04-21 20:29:49 +00001599 BigSize = Dysymtab.iextdefsym;
1600 BigSize += Dysymtab.nextdefsym;
1601 if (Dysymtab.nextdefsym != 0 && BigSize > Symtab.nsyms) {
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00001602 Err = malformedError("iextdefsym plus nextdefsym in LC_DYSYMTAB "
Kevin Enderby89134962016-05-05 23:41:05 +00001603 "load command extends past the end of the symbol "
1604 "table");
Kevin Enderby1829c682016-01-22 22:49:55 +00001605 return;
1606 }
1607 if (Dysymtab.nundefsym != 0 && Dysymtab.iundefsym > Symtab.nsyms) {
Francis Visoiu Mistrih2d3f01c2018-09-04 16:31:53 +00001608 Err = malformedError("iundefsym in LC_DYSYMTAB load command "
Kevin Enderby89134962016-05-05 23:41:05 +00001609 "extends past the end of the symbol table");
Kevin Enderby1829c682016-01-22 22:49:55 +00001610 return;
1611 }
Kevin Enderby5e55d172016-04-21 20:29:49 +00001612 BigSize = Dysymtab.iundefsym;
1613 BigSize += Dysymtab.nundefsym;
1614 if (Dysymtab.nundefsym != 0 && BigSize > Symtab.nsyms) {
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00001615 Err = malformedError("iundefsym plus nundefsym in LC_DYSYMTAB load "
Kevin Enderby89134962016-05-05 23:41:05 +00001616 " command extends past the end of the symbol table");
Kevin Enderby1829c682016-01-22 22:49:55 +00001617 return;
1618 }
1619 }
Kevin Enderbyfc0929a2016-09-20 20:14:14 +00001620 if ((getHeader().filetype == MachO::MH_DYLIB ||
1621 getHeader().filetype == MachO::MH_DYLIB_STUB) &&
1622 DyldIdLoadCmd == nullptr) {
1623 Err = malformedError("no LC_ID_DYLIB load command in dynamic library "
1624 "filetype");
1625 return;
1626 }
Alexey Samsonovd319c4f2015-06-03 22:19:36 +00001627 assert(LoadCommands.size() == LoadCommandCount);
Lang Hames9e964f32016-03-25 17:25:34 +00001628
1629 Err = Error::success();
Rafael Espindola56f976f2013-04-18 18:08:55 +00001630}
1631
Kevin Enderby22fc0072016-11-14 20:57:04 +00001632Error MachOObjectFile::checkSymbolTable() const {
1633 uint32_t Flags = 0;
1634 if (is64Bit()) {
1635 MachO::mach_header_64 H_64 = MachOObjectFile::getHeader64();
1636 Flags = H_64.flags;
1637 } else {
1638 MachO::mach_header H = MachOObjectFile::getHeader();
1639 Flags = H.flags;
1640 }
1641 uint8_t NType = 0;
1642 uint8_t NSect = 0;
1643 uint16_t NDesc = 0;
1644 uint32_t NStrx = 0;
1645 uint64_t NValue = 0;
1646 uint32_t SymbolIndex = 0;
1647 MachO::symtab_command S = getSymtabLoadCommand();
1648 for (const SymbolRef &Symbol : symbols()) {
1649 DataRefImpl SymDRI = Symbol.getRawDataRefImpl();
1650 if (is64Bit()) {
1651 MachO::nlist_64 STE_64 = getSymbol64TableEntry(SymDRI);
1652 NType = STE_64.n_type;
1653 NSect = STE_64.n_sect;
1654 NDesc = STE_64.n_desc;
1655 NStrx = STE_64.n_strx;
1656 NValue = STE_64.n_value;
1657 } else {
1658 MachO::nlist STE = getSymbolTableEntry(SymDRI);
1659 NType = STE.n_type;
1660 NType = STE.n_type;
1661 NSect = STE.n_sect;
1662 NDesc = STE.n_desc;
1663 NStrx = STE.n_strx;
1664 NValue = STE.n_value;
1665 }
1666 if ((NType & MachO::N_STAB) == 0 &&
1667 (NType & MachO::N_TYPE) == MachO::N_SECT) {
1668 if (NSect == 0 || NSect > Sections.size())
1669 return malformedError("bad section index: " + Twine((int)NSect) +
1670 " for symbol at index " + Twine(SymbolIndex));
1671 }
1672 if ((NType & MachO::N_STAB) == 0 &&
1673 (NType & MachO::N_TYPE) == MachO::N_INDR) {
1674 if (NValue >= S.strsize)
1675 return malformedError("bad n_value: " + Twine((int)NValue) + " past "
1676 "the end of string table, for N_INDR symbol at "
1677 "index " + Twine(SymbolIndex));
1678 }
1679 if ((Flags & MachO::MH_TWOLEVEL) == MachO::MH_TWOLEVEL &&
1680 (((NType & MachO::N_TYPE) == MachO::N_UNDF && NValue == 0) ||
1681 (NType & MachO::N_TYPE) == MachO::N_PBUD)) {
1682 uint32_t LibraryOrdinal = MachO::GET_LIBRARY_ORDINAL(NDesc);
1683 if (LibraryOrdinal != 0 &&
1684 LibraryOrdinal != MachO::EXECUTABLE_ORDINAL &&
1685 LibraryOrdinal != MachO::DYNAMIC_LOOKUP_ORDINAL &&
1686 LibraryOrdinal - 1 >= Libraries.size() ) {
1687 return malformedError("bad library ordinal: " + Twine(LibraryOrdinal) +
1688 " for symbol at index " + Twine(SymbolIndex));
1689 }
1690 }
1691 if (NStrx >= S.strsize)
1692 return malformedError("bad string table index: " + Twine((int)NStrx) +
1693 " past the end of string table, for symbol at "
1694 "index " + Twine(SymbolIndex));
1695 SymbolIndex++;
1696 }
1697 return Error::success();
1698}
1699
Rafael Espindola5e812af2014-01-30 02:49:50 +00001700void MachOObjectFile::moveSymbolNext(DataRefImpl &Symb) const {
Rafael Espindola75c30362013-04-24 19:47:55 +00001701 unsigned SymbolTableEntrySize = is64Bit() ?
Charles Davis8bdfafd2013-09-01 04:28:48 +00001702 sizeof(MachO::nlist_64) :
1703 sizeof(MachO::nlist);
Rafael Espindola75c30362013-04-24 19:47:55 +00001704 Symb.p += SymbolTableEntrySize;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001705}
1706
Kevin Enderby81e8b7d2016-04-20 21:24:34 +00001707Expected<StringRef> MachOObjectFile::getSymbolName(DataRefImpl Symb) const {
Rafael Espindola6e040c02013-04-26 20:07:33 +00001708 StringRef StringTable = getStringTableData();
Lang Hames697e7cd2016-12-04 01:56:10 +00001709 MachO::nlist_base Entry = getSymbolTableEntryBase(*this, Symb);
Michael Trentca309022018-01-03 23:28:32 +00001710 if (Entry.n_strx == 0)
1711 // A n_strx value of 0 indicates that no name is associated with a
1712 // particular symbol table entry.
1713 return StringRef();
Charles Davis8bdfafd2013-09-01 04:28:48 +00001714 const char *Start = &StringTable.data()[Entry.n_strx];
Kevin Enderby81e8b7d2016-04-20 21:24:34 +00001715 if (Start < getData().begin() || Start >= getData().end()) {
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00001716 return malformedError("bad string index: " + Twine(Entry.n_strx) +
Kevin Enderby89134962016-05-05 23:41:05 +00001717 " for symbol at index " + Twine(getSymbolIndex(Symb)));
Kevin Enderby81e8b7d2016-04-20 21:24:34 +00001718 }
Rafael Espindola5d0c2ff2015-07-02 20:55:21 +00001719 return StringRef(Start);
Rafael Espindola56f976f2013-04-18 18:08:55 +00001720}
1721
Rafael Espindola0e77a942014-12-10 20:46:55 +00001722unsigned MachOObjectFile::getSectionType(SectionRef Sec) const {
1723 DataRefImpl DRI = Sec.getRawDataRefImpl();
Lang Hames697e7cd2016-12-04 01:56:10 +00001724 uint32_t Flags = getSectionFlags(*this, DRI);
Rafael Espindola0e77a942014-12-10 20:46:55 +00001725 return Flags & MachO::SECTION_TYPE;
1726}
1727
Rafael Espindola59128922015-06-24 18:14:41 +00001728uint64_t MachOObjectFile::getNValue(DataRefImpl Sym) const {
1729 if (is64Bit()) {
1730 MachO::nlist_64 Entry = getSymbol64TableEntry(Sym);
1731 return Entry.n_value;
1732 }
1733 MachO::nlist Entry = getSymbolTableEntry(Sym);
1734 return Entry.n_value;
1735}
1736
Kevin Enderby980b2582014-06-05 21:21:57 +00001737// getIndirectName() returns the name of the alias'ed symbol who's string table
1738// index is in the n_value field.
Rafael Espindola3acea392014-06-12 21:46:39 +00001739std::error_code MachOObjectFile::getIndirectName(DataRefImpl Symb,
1740 StringRef &Res) const {
Kevin Enderby980b2582014-06-05 21:21:57 +00001741 StringRef StringTable = getStringTableData();
Lang Hames697e7cd2016-12-04 01:56:10 +00001742 MachO::nlist_base Entry = getSymbolTableEntryBase(*this, Symb);
Rafael Espindola59128922015-06-24 18:14:41 +00001743 if ((Entry.n_type & MachO::N_TYPE) != MachO::N_INDR)
1744 return object_error::parse_failed;
1745 uint64_t NValue = getNValue(Symb);
Kevin Enderby980b2582014-06-05 21:21:57 +00001746 if (NValue >= StringTable.size())
1747 return object_error::parse_failed;
1748 const char *Start = &StringTable.data()[NValue];
1749 Res = StringRef(Start);
Rui Ueyama7d099192015-06-09 15:20:42 +00001750 return std::error_code();
Kevin Enderby980b2582014-06-05 21:21:57 +00001751}
1752
Rafael Espindolabe8b0ea2015-07-07 17:12:59 +00001753uint64_t MachOObjectFile::getSymbolValueImpl(DataRefImpl Sym) const {
Rafael Espindola7e7be922015-07-07 15:05:09 +00001754 return getNValue(Sym);
Rafael Espindola991af662015-06-24 19:11:10 +00001755}
1756
Kevin Enderby931cb652016-06-24 18:24:42 +00001757Expected<uint64_t> MachOObjectFile::getSymbolAddress(DataRefImpl Sym) const {
Rafael Espindolaed067c42015-07-03 18:19:00 +00001758 return getSymbolValue(Sym);
Rafael Espindola56f976f2013-04-18 18:08:55 +00001759}
1760
Rafael Espindolaa4d224722015-05-31 23:52:50 +00001761uint32_t MachOObjectFile::getSymbolAlignment(DataRefImpl DRI) const {
Rafael Espindola20122a42014-01-31 20:57:12 +00001762 uint32_t flags = getSymbolFlags(DRI);
Rafael Espindolae4dd2e02013-04-29 22:24:22 +00001763 if (flags & SymbolRef::SF_Common) {
Lang Hames697e7cd2016-12-04 01:56:10 +00001764 MachO::nlist_base Entry = getSymbolTableEntryBase(*this, DRI);
Rafael Espindolaa4d224722015-05-31 23:52:50 +00001765 return 1 << MachO::GET_COMM_ALIGN(Entry.n_desc);
Rafael Espindolae4dd2e02013-04-29 22:24:22 +00001766 }
Rafael Espindolaa4d224722015-05-31 23:52:50 +00001767 return 0;
Rafael Espindolae4dd2e02013-04-29 22:24:22 +00001768}
1769
Rafael Espindolad7a32ea2015-06-24 10:20:30 +00001770uint64_t MachOObjectFile::getCommonSymbolSizeImpl(DataRefImpl DRI) const {
Rafael Espindola05cbccc2015-07-07 13:58:32 +00001771 return getNValue(DRI);
Rafael Espindola56f976f2013-04-18 18:08:55 +00001772}
1773
Kevin Enderby7bd8d992016-05-02 20:28:12 +00001774Expected<SymbolRef::Type>
Kevin Enderby5afbc1c2016-03-23 20:27:00 +00001775MachOObjectFile::getSymbolType(DataRefImpl Symb) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00001776 MachO::nlist_base Entry = getSymbolTableEntryBase(*this, Symb);
Charles Davis8bdfafd2013-09-01 04:28:48 +00001777 uint8_t n_type = Entry.n_type;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001778
Rafael Espindola56f976f2013-04-18 18:08:55 +00001779 // If this is a STAB debugging symbol, we can do nothing more.
Rafael Espindola2fa80cc2015-06-26 12:18:49 +00001780 if (n_type & MachO::N_STAB)
1781 return SymbolRef::ST_Debug;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001782
Charles Davis74ec8b02013-08-27 05:00:13 +00001783 switch (n_type & MachO::N_TYPE) {
1784 case MachO::N_UNDF :
Rafael Espindola2fa80cc2015-06-26 12:18:49 +00001785 return SymbolRef::ST_Unknown;
Charles Davis74ec8b02013-08-27 05:00:13 +00001786 case MachO::N_SECT :
Kevin Enderby7bd8d992016-05-02 20:28:12 +00001787 Expected<section_iterator> SecOrError = getSymbolSection(Symb);
Kevin Enderby5afbc1c2016-03-23 20:27:00 +00001788 if (!SecOrError)
Kevin Enderby7bd8d992016-05-02 20:28:12 +00001789 return SecOrError.takeError();
Kevin Enderby5afbc1c2016-03-23 20:27:00 +00001790 section_iterator Sec = *SecOrError;
Kuba Breckade833222015-11-12 09:40:29 +00001791 if (Sec->isData() || Sec->isBSS())
1792 return SymbolRef::ST_Data;
Rafael Espindola2fa80cc2015-06-26 12:18:49 +00001793 return SymbolRef::ST_Function;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001794 }
Rafael Espindola2fa80cc2015-06-26 12:18:49 +00001795 return SymbolRef::ST_Other;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001796}
1797
Rafael Espindola20122a42014-01-31 20:57:12 +00001798uint32_t MachOObjectFile::getSymbolFlags(DataRefImpl DRI) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00001799 MachO::nlist_base Entry = getSymbolTableEntryBase(*this, DRI);
Rafael Espindola56f976f2013-04-18 18:08:55 +00001800
Charles Davis8bdfafd2013-09-01 04:28:48 +00001801 uint8_t MachOType = Entry.n_type;
1802 uint16_t MachOFlags = Entry.n_desc;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001803
Rafael Espindola20122a42014-01-31 20:57:12 +00001804 uint32_t Result = SymbolRef::SF_None;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001805
Tim Northovereaef0742014-05-30 13:22:59 +00001806 if ((MachOType & MachO::N_TYPE) == MachO::N_INDR)
1807 Result |= SymbolRef::SF_Indirect;
1808
Rafael Espindolaa1356322013-11-02 05:03:24 +00001809 if (MachOType & MachO::N_STAB)
Rafael Espindola56f976f2013-04-18 18:08:55 +00001810 Result |= SymbolRef::SF_FormatSpecific;
1811
Charles Davis74ec8b02013-08-27 05:00:13 +00001812 if (MachOType & MachO::N_EXT) {
Rafael Espindola56f976f2013-04-18 18:08:55 +00001813 Result |= SymbolRef::SF_Global;
Charles Davis74ec8b02013-08-27 05:00:13 +00001814 if ((MachOType & MachO::N_TYPE) == MachO::N_UNDF) {
Rafael Espindola05cbccc2015-07-07 13:58:32 +00001815 if (getNValue(DRI))
Rafael Espindolae4dd2e02013-04-29 22:24:22 +00001816 Result |= SymbolRef::SF_Common;
Rafael Espindolad8247722015-07-07 14:26:39 +00001817 else
1818 Result |= SymbolRef::SF_Undefined;
Rafael Espindolae4dd2e02013-04-29 22:24:22 +00001819 }
Lang Hames7e0692b2015-01-15 22:33:30 +00001820
1821 if (!(MachOType & MachO::N_PEXT))
1822 Result |= SymbolRef::SF_Exported;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001823 }
1824
Charles Davis74ec8b02013-08-27 05:00:13 +00001825 if (MachOFlags & (MachO::N_WEAK_REF | MachO::N_WEAK_DEF))
Rafael Espindola56f976f2013-04-18 18:08:55 +00001826 Result |= SymbolRef::SF_Weak;
1827
Kevin Enderbyec5ca032014-08-18 20:21:02 +00001828 if (MachOFlags & (MachO::N_ARM_THUMB_DEF))
1829 Result |= SymbolRef::SF_Thumb;
1830
Charles Davis74ec8b02013-08-27 05:00:13 +00001831 if ((MachOType & MachO::N_TYPE) == MachO::N_ABS)
Rafael Espindola56f976f2013-04-18 18:08:55 +00001832 Result |= SymbolRef::SF_Absolute;
1833
Rafael Espindola20122a42014-01-31 20:57:12 +00001834 return Result;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001835}
1836
Kevin Enderby7bd8d992016-05-02 20:28:12 +00001837Expected<section_iterator>
Rafael Espindola8bab8892015-08-07 23:27:14 +00001838MachOObjectFile::getSymbolSection(DataRefImpl Symb) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00001839 MachO::nlist_base Entry = getSymbolTableEntryBase(*this, Symb);
Charles Davis8bdfafd2013-09-01 04:28:48 +00001840 uint8_t index = Entry.n_sect;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001841
Rafael Espindola8bab8892015-08-07 23:27:14 +00001842 if (index == 0)
1843 return section_end();
1844 DataRefImpl DRI;
1845 DRI.d.a = index - 1;
Kevin Enderby5afbc1c2016-03-23 20:27:00 +00001846 if (DRI.d.a >= Sections.size()){
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00001847 return malformedError("bad section index: " + Twine((int)index) +
Kevin Enderby89134962016-05-05 23:41:05 +00001848 " for symbol at index " + Twine(getSymbolIndex(Symb)));
Kevin Enderby5afbc1c2016-03-23 20:27:00 +00001849 }
Rafael Espindola8bab8892015-08-07 23:27:14 +00001850 return section_iterator(SectionRef(DRI, this));
Rafael Espindola56f976f2013-04-18 18:08:55 +00001851}
1852
Rafael Espindola6bf32212015-06-24 19:57:32 +00001853unsigned MachOObjectFile::getSymbolSectionID(SymbolRef Sym) const {
1854 MachO::nlist_base Entry =
Lang Hames697e7cd2016-12-04 01:56:10 +00001855 getSymbolTableEntryBase(*this, Sym.getRawDataRefImpl());
Rafael Espindola6bf32212015-06-24 19:57:32 +00001856 return Entry.n_sect - 1;
1857}
1858
Rafael Espindola5e812af2014-01-30 02:49:50 +00001859void MachOObjectFile::moveSectionNext(DataRefImpl &Sec) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00001860 Sec.d.a++;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001861}
1862
Rafael Espindola3acea392014-06-12 21:46:39 +00001863std::error_code MachOObjectFile::getSectionName(DataRefImpl Sec,
1864 StringRef &Result) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00001865 ArrayRef<char> Raw = getSectionRawName(Sec);
1866 Result = parseSegmentOrSectionName(Raw.data());
Rui Ueyama7d099192015-06-09 15:20:42 +00001867 return std::error_code();
Rafael Espindola56f976f2013-04-18 18:08:55 +00001868}
1869
Rafael Espindola80291272014-10-08 15:28:58 +00001870uint64_t MachOObjectFile::getSectionAddress(DataRefImpl Sec) const {
1871 if (is64Bit())
1872 return getSection64(Sec).addr;
1873 return getSection(Sec).addr;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001874}
1875
George Rimara25d3292017-05-27 18:10:23 +00001876uint64_t MachOObjectFile::getSectionIndex(DataRefImpl Sec) const {
1877 return Sec.d.a;
1878}
1879
Rafael Espindola80291272014-10-08 15:28:58 +00001880uint64_t MachOObjectFile::getSectionSize(DataRefImpl Sec) const {
Kevin Enderby46e642f2015-10-08 22:50:55 +00001881 // In the case if a malformed Mach-O file where the section offset is past
1882 // the end of the file or some part of the section size is past the end of
1883 // the file return a size of zero or a size that covers the rest of the file
1884 // but does not extend past the end of the file.
1885 uint32_t SectOffset, SectType;
1886 uint64_t SectSize;
1887
1888 if (is64Bit()) {
1889 MachO::section_64 Sect = getSection64(Sec);
1890 SectOffset = Sect.offset;
1891 SectSize = Sect.size;
1892 SectType = Sect.flags & MachO::SECTION_TYPE;
1893 } else {
1894 MachO::section Sect = getSection(Sec);
1895 SectOffset = Sect.offset;
1896 SectSize = Sect.size;
1897 SectType = Sect.flags & MachO::SECTION_TYPE;
1898 }
1899 if (SectType == MachO::S_ZEROFILL || SectType == MachO::S_GB_ZEROFILL)
1900 return SectSize;
1901 uint64_t FileSize = getData().size();
1902 if (SectOffset > FileSize)
1903 return 0;
1904 if (FileSize - SectOffset < SectSize)
1905 return FileSize - SectOffset;
1906 return SectSize;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001907}
1908
Rafael Espindola3acea392014-06-12 21:46:39 +00001909std::error_code MachOObjectFile::getSectionContents(DataRefImpl Sec,
1910 StringRef &Res) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00001911 uint32_t Offset;
1912 uint64_t Size;
1913
1914 if (is64Bit()) {
Charles Davis8bdfafd2013-09-01 04:28:48 +00001915 MachO::section_64 Sect = getSection64(Sec);
1916 Offset = Sect.offset;
1917 Size = Sect.size;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001918 } else {
Charles Davis8bdfafd2013-09-01 04:28:48 +00001919 MachO::section Sect = getSection(Sec);
1920 Offset = Sect.offset;
1921 Size = Sect.size;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001922 }
1923
1924 Res = this->getData().substr(Offset, Size);
Rui Ueyama7d099192015-06-09 15:20:42 +00001925 return std::error_code();
Rafael Espindola56f976f2013-04-18 18:08:55 +00001926}
1927
Rafael Espindola80291272014-10-08 15:28:58 +00001928uint64_t MachOObjectFile::getSectionAlignment(DataRefImpl Sec) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00001929 uint32_t Align;
1930 if (is64Bit()) {
Charles Davis8bdfafd2013-09-01 04:28:48 +00001931 MachO::section_64 Sect = getSection64(Sec);
1932 Align = Sect.align;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001933 } else {
Charles Davis8bdfafd2013-09-01 04:28:48 +00001934 MachO::section Sect = getSection(Sec);
1935 Align = Sect.align;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001936 }
1937
Rafael Espindola80291272014-10-08 15:28:58 +00001938 return uint64_t(1) << Align;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001939}
1940
Paul Semelb98f5042018-07-11 10:00:29 +00001941Expected<SectionRef> MachOObjectFile::getSection(unsigned SectionIndex) const {
1942 if (SectionIndex < 1 || SectionIndex > Sections.size())
1943 return malformedError("bad section index: " + Twine((int)SectionIndex));
1944
1945 DataRefImpl DRI;
1946 DRI.d.a = SectionIndex - 1;
1947 return SectionRef(DRI, this);
1948}
1949
1950Expected<SectionRef> MachOObjectFile::getSection(StringRef SectionName) const {
1951 StringRef SecName;
1952 for (const SectionRef &Section : sections()) {
1953 if (std::error_code E = Section.getName(SecName))
1954 return errorCodeToError(E);
1955 if (SecName == SectionName) {
1956 return Section;
1957 }
1958 }
1959 return errorCodeToError(object_error::parse_failed);
1960}
1961
George Rimar401e4e52016-05-24 12:48:46 +00001962bool MachOObjectFile::isSectionCompressed(DataRefImpl Sec) const {
1963 return false;
1964}
1965
Rafael Espindola80291272014-10-08 15:28:58 +00001966bool MachOObjectFile::isSectionText(DataRefImpl Sec) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00001967 uint32_t Flags = getSectionFlags(*this, Sec);
Rafael Espindola80291272014-10-08 15:28:58 +00001968 return Flags & MachO::S_ATTR_PURE_INSTRUCTIONS;
Rafael Espindola56f976f2013-04-18 18:08:55 +00001969}
1970
Rafael Espindola80291272014-10-08 15:28:58 +00001971bool MachOObjectFile::isSectionData(DataRefImpl Sec) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00001972 uint32_t Flags = getSectionFlags(*this, Sec);
Kevin Enderby403258f2014-05-19 20:36:02 +00001973 unsigned SectionType = Flags & MachO::SECTION_TYPE;
Rafael Espindola80291272014-10-08 15:28:58 +00001974 return !(Flags & MachO::S_ATTR_PURE_INSTRUCTIONS) &&
1975 !(SectionType == MachO::S_ZEROFILL ||
1976 SectionType == MachO::S_GB_ZEROFILL);
Michael J. Spencer800619f2011-09-28 20:57:30 +00001977}
1978
Rafael Espindola80291272014-10-08 15:28:58 +00001979bool MachOObjectFile::isSectionBSS(DataRefImpl Sec) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00001980 uint32_t Flags = getSectionFlags(*this, Sec);
Kevin Enderby403258f2014-05-19 20:36:02 +00001981 unsigned SectionType = Flags & MachO::SECTION_TYPE;
Rafael Espindola80291272014-10-08 15:28:58 +00001982 return !(Flags & MachO::S_ATTR_PURE_INSTRUCTIONS) &&
1983 (SectionType == MachO::S_ZEROFILL ||
1984 SectionType == MachO::S_GB_ZEROFILL);
Preston Gurd2138ef62012-04-12 20:13:57 +00001985}
1986
Rafael Espindola6bf32212015-06-24 19:57:32 +00001987unsigned MachOObjectFile::getSectionID(SectionRef Sec) const {
1988 return Sec.getRawDataRefImpl().d.a;
1989}
1990
Rafael Espindola80291272014-10-08 15:28:58 +00001991bool MachOObjectFile::isSectionVirtual(DataRefImpl Sec) const {
Francis Visoiu Mistrih18346822018-04-19 17:02:57 +00001992 uint32_t Flags = getSectionFlags(*this, Sec);
1993 unsigned SectionType = Flags & MachO::SECTION_TYPE;
1994 return SectionType == MachO::S_ZEROFILL ||
1995 SectionType == MachO::S_GB_ZEROFILL;
Rafael Espindolac2413f52013-04-09 14:49:08 +00001996}
1997
Steven Wuf2fe0142016-02-29 19:40:10 +00001998bool MachOObjectFile::isSectionBitcode(DataRefImpl Sec) const {
1999 StringRef SegmentName = getSectionFinalSegmentName(Sec);
2000 StringRef SectName;
2001 if (!getSectionName(Sec, SectName))
2002 return (SegmentName == "__LLVM" && SectName == "__bitcode");
2003 return false;
2004}
2005
Jonas Devlieghere8af23872017-09-26 14:22:35 +00002006bool MachOObjectFile::isSectionStripped(DataRefImpl Sec) const {
2007 if (is64Bit())
2008 return getSection64(Sec).offset == 0;
2009 return getSection(Sec).offset == 0;
2010}
2011
Rui Ueyamabc654b12013-09-27 21:47:05 +00002012relocation_iterator MachOObjectFile::section_rel_begin(DataRefImpl Sec) const {
Rafael Espindola04d3f492013-04-25 12:45:46 +00002013 DataRefImpl Ret;
Rafael Espindola128b8112014-04-03 23:51:28 +00002014 Ret.d.a = Sec.d.a;
2015 Ret.d.b = 0;
Rafael Espindola04d3f492013-04-25 12:45:46 +00002016 return relocation_iterator(RelocationRef(Ret, this));
Michael J. Spencere5fd0042011-10-07 19:25:32 +00002017}
Rafael Espindolac0406e12013-04-08 20:45:01 +00002018
Rafael Espindola56f976f2013-04-18 18:08:55 +00002019relocation_iterator
Rui Ueyamabc654b12013-09-27 21:47:05 +00002020MachOObjectFile::section_rel_end(DataRefImpl Sec) const {
Rafael Espindola04d3f492013-04-25 12:45:46 +00002021 uint32_t Num;
Rafael Espindola56f976f2013-04-18 18:08:55 +00002022 if (is64Bit()) {
Charles Davis8bdfafd2013-09-01 04:28:48 +00002023 MachO::section_64 Sect = getSection64(Sec);
Charles Davis8bdfafd2013-09-01 04:28:48 +00002024 Num = Sect.nreloc;
Rafael Espindola56f976f2013-04-18 18:08:55 +00002025 } else {
Charles Davis8bdfafd2013-09-01 04:28:48 +00002026 MachO::section Sect = getSection(Sec);
Charles Davis8bdfafd2013-09-01 04:28:48 +00002027 Num = Sect.nreloc;
Rafael Espindola56f976f2013-04-18 18:08:55 +00002028 }
Eric Christopher7b015c72011-04-22 03:19:48 +00002029
Rafael Espindola56f976f2013-04-18 18:08:55 +00002030 DataRefImpl Ret;
Rafael Espindola128b8112014-04-03 23:51:28 +00002031 Ret.d.a = Sec.d.a;
2032 Ret.d.b = Num;
Rafael Espindola56f976f2013-04-18 18:08:55 +00002033 return relocation_iterator(RelocationRef(Ret, this));
2034}
Benjamin Kramer022ecdf2011-09-08 20:52:17 +00002035
Kevin Enderbyabf10f22017-06-22 17:41:22 +00002036relocation_iterator MachOObjectFile::extrel_begin() const {
2037 DataRefImpl Ret;
Michael Trenta1703b12017-12-15 17:57:40 +00002038 // for DYSYMTAB symbols, Ret.d.a == 0 for external relocations
Kevin Enderbyabf10f22017-06-22 17:41:22 +00002039 Ret.d.a = 0; // Would normally be a section index.
2040 Ret.d.b = 0; // Index into the external relocations
2041 return relocation_iterator(RelocationRef(Ret, this));
2042}
2043
2044relocation_iterator MachOObjectFile::extrel_end() const {
2045 MachO::dysymtab_command DysymtabLoadCmd = getDysymtabLoadCommand();
2046 DataRefImpl Ret;
Michael Trenta1703b12017-12-15 17:57:40 +00002047 // for DYSYMTAB symbols, Ret.d.a == 0 for external relocations
Kevin Enderbyabf10f22017-06-22 17:41:22 +00002048 Ret.d.a = 0; // Would normally be a section index.
2049 Ret.d.b = DysymtabLoadCmd.nextrel; // Index into the external relocations
2050 return relocation_iterator(RelocationRef(Ret, this));
2051}
2052
Michael Trenta1703b12017-12-15 17:57:40 +00002053relocation_iterator MachOObjectFile::locrel_begin() const {
2054 DataRefImpl Ret;
2055 // for DYSYMTAB symbols, Ret.d.a == 1 for local relocations
2056 Ret.d.a = 1; // Would normally be a section index.
2057 Ret.d.b = 0; // Index into the local relocations
2058 return relocation_iterator(RelocationRef(Ret, this));
2059}
2060
2061relocation_iterator MachOObjectFile::locrel_end() const {
2062 MachO::dysymtab_command DysymtabLoadCmd = getDysymtabLoadCommand();
2063 DataRefImpl Ret;
2064 // for DYSYMTAB symbols, Ret.d.a == 1 for local relocations
2065 Ret.d.a = 1; // Would normally be a section index.
2066 Ret.d.b = DysymtabLoadCmd.nlocrel; // Index into the local relocations
2067 return relocation_iterator(RelocationRef(Ret, this));
2068}
2069
Rafael Espindola5e812af2014-01-30 02:49:50 +00002070void MachOObjectFile::moveRelocationNext(DataRefImpl &Rel) const {
Rafael Espindola128b8112014-04-03 23:51:28 +00002071 ++Rel.d.b;
Benjamin Kramer022ecdf2011-09-08 20:52:17 +00002072}
Owen Anderson171f4852011-10-24 23:20:07 +00002073
Rafael Espindola96d071c2015-06-29 23:29:12 +00002074uint64_t MachOObjectFile::getRelocationOffset(DataRefImpl Rel) const {
Kevin Enderbyabf10f22017-06-22 17:41:22 +00002075 assert((getHeader().filetype == MachO::MH_OBJECT ||
2076 getHeader().filetype == MachO::MH_KEXT_BUNDLE) &&
2077 "Only implemented for MH_OBJECT && MH_KEXT_BUNDLE");
Charles Davis8bdfafd2013-09-01 04:28:48 +00002078 MachO::any_relocation_info RE = getRelocation(Rel);
Rafael Espindola96d071c2015-06-29 23:29:12 +00002079 return getAnyRelocationAddress(RE);
David Meyer2fc34c52012-03-01 01:36:50 +00002080}
2081
Rafael Espindola806f0062013-06-05 01:33:53 +00002082symbol_iterator
2083MachOObjectFile::getRelocationSymbol(DataRefImpl Rel) const {
Charles Davis8bdfafd2013-09-01 04:28:48 +00002084 MachO::any_relocation_info RE = getRelocation(Rel);
Tim Northover07f99fb2014-07-04 10:57:56 +00002085 if (isRelocationScattered(RE))
2086 return symbol_end();
2087
Rafael Espindola56f976f2013-04-18 18:08:55 +00002088 uint32_t SymbolIdx = getPlainRelocationSymbolNum(RE);
2089 bool isExtern = getPlainRelocationExternal(RE);
Rafael Espindola806f0062013-06-05 01:33:53 +00002090 if (!isExtern)
Rafael Espindolab5155a52014-02-10 20:24:04 +00002091 return symbol_end();
Rafael Espindola75c30362013-04-24 19:47:55 +00002092
Charles Davis8bdfafd2013-09-01 04:28:48 +00002093 MachO::symtab_command S = getSymtabLoadCommand();
Rafael Espindola75c30362013-04-24 19:47:55 +00002094 unsigned SymbolTableEntrySize = is64Bit() ?
Charles Davis8bdfafd2013-09-01 04:28:48 +00002095 sizeof(MachO::nlist_64) :
2096 sizeof(MachO::nlist);
2097 uint64_t Offset = S.symoff + SymbolIdx * SymbolTableEntrySize;
Rafael Espindola75c30362013-04-24 19:47:55 +00002098 DataRefImpl Sym;
Lang Hames697e7cd2016-12-04 01:56:10 +00002099 Sym.p = reinterpret_cast<uintptr_t>(getPtr(*this, Offset));
Rafael Espindola806f0062013-06-05 01:33:53 +00002100 return symbol_iterator(SymbolRef(Sym, this));
Rafael Espindola56f976f2013-04-18 18:08:55 +00002101}
2102
Keno Fischerc780e8e2015-05-21 21:24:32 +00002103section_iterator
2104MachOObjectFile::getRelocationSection(DataRefImpl Rel) const {
2105 return section_iterator(getAnyRelocationSection(getRelocation(Rel)));
2106}
2107
Rafael Espindola99c041b2015-06-30 01:53:01 +00002108uint64_t MachOObjectFile::getRelocationType(DataRefImpl Rel) const {
Charles Davis8bdfafd2013-09-01 04:28:48 +00002109 MachO::any_relocation_info RE = getRelocation(Rel);
Rafael Espindola99c041b2015-06-30 01:53:01 +00002110 return getAnyRelocationType(RE);
Rafael Espindola56f976f2013-04-18 18:08:55 +00002111}
2112
Rafael Espindola41bb4322015-06-30 04:08:37 +00002113void MachOObjectFile::getRelocationTypeName(
2114 DataRefImpl Rel, SmallVectorImpl<char> &Result) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00002115 StringRef res;
Rafael Espindola99c041b2015-06-30 01:53:01 +00002116 uint64_t RType = getRelocationType(Rel);
Rafael Espindola56f976f2013-04-18 18:08:55 +00002117
2118 unsigned Arch = this->getArch();
2119
2120 switch (Arch) {
2121 case Triple::x86: {
2122 static const char *const Table[] = {
2123 "GENERIC_RELOC_VANILLA",
2124 "GENERIC_RELOC_PAIR",
2125 "GENERIC_RELOC_SECTDIFF",
2126 "GENERIC_RELOC_PB_LA_PTR",
2127 "GENERIC_RELOC_LOCAL_SECTDIFF",
2128 "GENERIC_RELOC_TLV" };
2129
Eric Christopher13250cb2013-12-06 02:33:38 +00002130 if (RType > 5)
Rafael Espindola56f976f2013-04-18 18:08:55 +00002131 res = "Unknown";
2132 else
2133 res = Table[RType];
2134 break;
2135 }
2136 case Triple::x86_64: {
2137 static const char *const Table[] = {
2138 "X86_64_RELOC_UNSIGNED",
2139 "X86_64_RELOC_SIGNED",
2140 "X86_64_RELOC_BRANCH",
2141 "X86_64_RELOC_GOT_LOAD",
2142 "X86_64_RELOC_GOT",
2143 "X86_64_RELOC_SUBTRACTOR",
2144 "X86_64_RELOC_SIGNED_1",
2145 "X86_64_RELOC_SIGNED_2",
2146 "X86_64_RELOC_SIGNED_4",
2147 "X86_64_RELOC_TLV" };
2148
2149 if (RType > 9)
2150 res = "Unknown";
2151 else
2152 res = Table[RType];
2153 break;
2154 }
2155 case Triple::arm: {
2156 static const char *const Table[] = {
2157 "ARM_RELOC_VANILLA",
2158 "ARM_RELOC_PAIR",
2159 "ARM_RELOC_SECTDIFF",
2160 "ARM_RELOC_LOCAL_SECTDIFF",
2161 "ARM_RELOC_PB_LA_PTR",
2162 "ARM_RELOC_BR24",
2163 "ARM_THUMB_RELOC_BR22",
2164 "ARM_THUMB_32BIT_BRANCH",
2165 "ARM_RELOC_HALF",
2166 "ARM_RELOC_HALF_SECTDIFF" };
2167
2168 if (RType > 9)
2169 res = "Unknown";
2170 else
2171 res = Table[RType];
2172 break;
2173 }
Tim Northover00ed9962014-03-29 10:18:08 +00002174 case Triple::aarch64: {
2175 static const char *const Table[] = {
2176 "ARM64_RELOC_UNSIGNED", "ARM64_RELOC_SUBTRACTOR",
2177 "ARM64_RELOC_BRANCH26", "ARM64_RELOC_PAGE21",
2178 "ARM64_RELOC_PAGEOFF12", "ARM64_RELOC_GOT_LOAD_PAGE21",
2179 "ARM64_RELOC_GOT_LOAD_PAGEOFF12", "ARM64_RELOC_POINTER_TO_GOT",
2180 "ARM64_RELOC_TLVP_LOAD_PAGE21", "ARM64_RELOC_TLVP_LOAD_PAGEOFF12",
2181 "ARM64_RELOC_ADDEND"
2182 };
2183
2184 if (RType >= array_lengthof(Table))
2185 res = "Unknown";
2186 else
2187 res = Table[RType];
2188 break;
2189 }
Rafael Espindola56f976f2013-04-18 18:08:55 +00002190 case Triple::ppc: {
2191 static const char *const Table[] = {
2192 "PPC_RELOC_VANILLA",
2193 "PPC_RELOC_PAIR",
2194 "PPC_RELOC_BR14",
2195 "PPC_RELOC_BR24",
2196 "PPC_RELOC_HI16",
2197 "PPC_RELOC_LO16",
2198 "PPC_RELOC_HA16",
2199 "PPC_RELOC_LO14",
2200 "PPC_RELOC_SECTDIFF",
2201 "PPC_RELOC_PB_LA_PTR",
2202 "PPC_RELOC_HI16_SECTDIFF",
2203 "PPC_RELOC_LO16_SECTDIFF",
2204 "PPC_RELOC_HA16_SECTDIFF",
2205 "PPC_RELOC_JBSR",
2206 "PPC_RELOC_LO14_SECTDIFF",
2207 "PPC_RELOC_LOCAL_SECTDIFF" };
2208
Eric Christopher13250cb2013-12-06 02:33:38 +00002209 if (RType > 15)
2210 res = "Unknown";
2211 else
2212 res = Table[RType];
Rafael Espindola56f976f2013-04-18 18:08:55 +00002213 break;
2214 }
2215 case Triple::UnknownArch:
2216 res = "Unknown";
2217 break;
2218 }
2219 Result.append(res.begin(), res.end());
Rafael Espindola56f976f2013-04-18 18:08:55 +00002220}
2221
Keno Fischer281b6942015-05-30 19:44:53 +00002222uint8_t MachOObjectFile::getRelocationLength(DataRefImpl Rel) const {
2223 MachO::any_relocation_info RE = getRelocation(Rel);
2224 return getAnyRelocationLength(RE);
2225}
2226
Kevin Enderby980b2582014-06-05 21:21:57 +00002227//
2228// guessLibraryShortName() is passed a name of a dynamic library and returns a
2229// guess on what the short name is. Then name is returned as a substring of the
2230// StringRef Name passed in. The name of the dynamic library is recognized as
2231// a framework if it has one of the two following forms:
2232// Foo.framework/Versions/A/Foo
2233// Foo.framework/Foo
2234// Where A and Foo can be any string. And may contain a trailing suffix
2235// starting with an underbar. If the Name is recognized as a framework then
2236// isFramework is set to true else it is set to false. If the Name has a
2237// suffix then Suffix is set to the substring in Name that contains the suffix
2238// else it is set to a NULL StringRef.
2239//
2240// The Name of the dynamic library is recognized as a library name if it has
2241// one of the two following forms:
2242// libFoo.A.dylib
2243// libFoo.dylib
2244// The library may have a suffix trailing the name Foo of the form:
2245// libFoo_profile.A.dylib
2246// libFoo_profile.dylib
2247//
2248// The Name of the dynamic library is also recognized as a library name if it
2249// has the following form:
2250// Foo.qtx
2251//
2252// If the Name of the dynamic library is none of the forms above then a NULL
2253// StringRef is returned.
2254//
2255StringRef MachOObjectFile::guessLibraryShortName(StringRef Name,
2256 bool &isFramework,
2257 StringRef &Suffix) {
2258 StringRef Foo, F, DotFramework, V, Dylib, Lib, Dot, Qtx;
2259 size_t a, b, c, d, Idx;
2260
2261 isFramework = false;
2262 Suffix = StringRef();
2263
2264 // Pull off the last component and make Foo point to it
2265 a = Name.rfind('/');
2266 if (a == Name.npos || a == 0)
2267 goto guess_library;
2268 Foo = Name.slice(a+1, Name.npos);
2269
2270 // Look for a suffix starting with a '_'
2271 Idx = Foo.rfind('_');
2272 if (Idx != Foo.npos && Foo.size() >= 2) {
2273 Suffix = Foo.slice(Idx, Foo.npos);
2274 Foo = Foo.slice(0, Idx);
2275 }
2276
2277 // First look for the form Foo.framework/Foo
2278 b = Name.rfind('/', a);
2279 if (b == Name.npos)
2280 Idx = 0;
2281 else
2282 Idx = b+1;
2283 F = Name.slice(Idx, Idx + Foo.size());
2284 DotFramework = Name.slice(Idx + Foo.size(),
2285 Idx + Foo.size() + sizeof(".framework/")-1);
2286 if (F == Foo && DotFramework == ".framework/") {
2287 isFramework = true;
2288 return Foo;
2289 }
2290
2291 // Next look for the form Foo.framework/Versions/A/Foo
2292 if (b == Name.npos)
2293 goto guess_library;
2294 c = Name.rfind('/', b);
2295 if (c == Name.npos || c == 0)
2296 goto guess_library;
2297 V = Name.slice(c+1, Name.npos);
2298 if (!V.startswith("Versions/"))
2299 goto guess_library;
2300 d = Name.rfind('/', c);
2301 if (d == Name.npos)
2302 Idx = 0;
2303 else
2304 Idx = d+1;
2305 F = Name.slice(Idx, Idx + Foo.size());
2306 DotFramework = Name.slice(Idx + Foo.size(),
2307 Idx + Foo.size() + sizeof(".framework/")-1);
2308 if (F == Foo && DotFramework == ".framework/") {
2309 isFramework = true;
2310 return Foo;
2311 }
2312
2313guess_library:
2314 // pull off the suffix after the "." and make a point to it
2315 a = Name.rfind('.');
2316 if (a == Name.npos || a == 0)
2317 return StringRef();
2318 Dylib = Name.slice(a, Name.npos);
2319 if (Dylib != ".dylib")
2320 goto guess_qtx;
2321
2322 // First pull off the version letter for the form Foo.A.dylib if any.
2323 if (a >= 3) {
2324 Dot = Name.slice(a-2, a-1);
2325 if (Dot == ".")
2326 a = a - 2;
2327 }
2328
2329 b = Name.rfind('/', a);
2330 if (b == Name.npos)
2331 b = 0;
2332 else
2333 b = b+1;
2334 // ignore any suffix after an underbar like Foo_profile.A.dylib
2335 Idx = Name.find('_', b);
2336 if (Idx != Name.npos && Idx != b) {
2337 Lib = Name.slice(b, Idx);
2338 Suffix = Name.slice(Idx, a);
2339 }
2340 else
2341 Lib = Name.slice(b, a);
2342 // There are incorrect library names of the form:
2343 // libATS.A_profile.dylib so check for these.
2344 if (Lib.size() >= 3) {
2345 Dot = Lib.slice(Lib.size()-2, Lib.size()-1);
2346 if (Dot == ".")
2347 Lib = Lib.slice(0, Lib.size()-2);
2348 }
2349 return Lib;
2350
2351guess_qtx:
2352 Qtx = Name.slice(a, Name.npos);
2353 if (Qtx != ".qtx")
2354 return StringRef();
2355 b = Name.rfind('/', a);
2356 if (b == Name.npos)
2357 Lib = Name.slice(0, a);
2358 else
2359 Lib = Name.slice(b+1, a);
2360 // There are library names of the form: QT.A.qtx so check for these.
2361 if (Lib.size() >= 3) {
2362 Dot = Lib.slice(Lib.size()-2, Lib.size()-1);
2363 if (Dot == ".")
2364 Lib = Lib.slice(0, Lib.size()-2);
2365 }
2366 return Lib;
2367}
2368
2369// getLibraryShortNameByIndex() is used to get the short name of the library
2370// for an undefined symbol in a linked Mach-O binary that was linked with the
2371// normal two-level namespace default (that is MH_TWOLEVEL in the header).
2372// It is passed the index (0 - based) of the library as translated from
2373// GET_LIBRARY_ORDINAL (1 - based).
Rafael Espindola3acea392014-06-12 21:46:39 +00002374std::error_code MachOObjectFile::getLibraryShortNameByIndex(unsigned Index,
Nick Kledzikd04bc352014-08-30 00:20:14 +00002375 StringRef &Res) const {
Kevin Enderby980b2582014-06-05 21:21:57 +00002376 if (Index >= Libraries.size())
2377 return object_error::parse_failed;
2378
Kevin Enderby980b2582014-06-05 21:21:57 +00002379 // If the cache of LibrariesShortNames is not built up do that first for
2380 // all the Libraries.
2381 if (LibrariesShortNames.size() == 0) {
2382 for (unsigned i = 0; i < Libraries.size(); i++) {
2383 MachO::dylib_command D =
Lang Hames697e7cd2016-12-04 01:56:10 +00002384 getStruct<MachO::dylib_command>(*this, Libraries[i]);
Nick Kledzik30061302014-09-17 00:25:22 +00002385 if (D.dylib.name >= D.cmdsize)
2386 return object_error::parse_failed;
Kevin Enderby4eff6cd2014-06-20 18:07:34 +00002387 const char *P = (const char *)(Libraries[i]) + D.dylib.name;
Kevin Enderby980b2582014-06-05 21:21:57 +00002388 StringRef Name = StringRef(P);
Nick Kledzik30061302014-09-17 00:25:22 +00002389 if (D.dylib.name+Name.size() >= D.cmdsize)
2390 return object_error::parse_failed;
Kevin Enderby980b2582014-06-05 21:21:57 +00002391 StringRef Suffix;
2392 bool isFramework;
2393 StringRef shortName = guessLibraryShortName(Name, isFramework, Suffix);
Nick Kledzik30061302014-09-17 00:25:22 +00002394 if (shortName.empty())
Kevin Enderby980b2582014-06-05 21:21:57 +00002395 LibrariesShortNames.push_back(Name);
2396 else
2397 LibrariesShortNames.push_back(shortName);
2398 }
2399 }
2400
2401 Res = LibrariesShortNames[Index];
Rui Ueyama7d099192015-06-09 15:20:42 +00002402 return std::error_code();
Kevin Enderby980b2582014-06-05 21:21:57 +00002403}
2404
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00002405uint32_t MachOObjectFile::getLibraryCount() const {
2406 return Libraries.size();
2407}
2408
Rafael Espindola76ad2322015-07-06 14:55:37 +00002409section_iterator
2410MachOObjectFile::getRelocationRelocatedSection(relocation_iterator Rel) const {
2411 DataRefImpl Sec;
2412 Sec.d.a = Rel->getRawDataRefImpl().d.a;
2413 return section_iterator(SectionRef(Sec, this));
2414}
2415
Peter Collingbourne435890a2016-11-22 03:38:40 +00002416basic_symbol_iterator MachOObjectFile::symbol_begin() const {
Kevin Enderby1829c682016-01-22 22:49:55 +00002417 DataRefImpl DRI;
2418 MachO::symtab_command Symtab = getSymtabLoadCommand();
2419 if (!SymtabLoadCmd || Symtab.nsyms == 0)
2420 return basic_symbol_iterator(SymbolRef(DRI, this));
2421
Lang Hames36072da2014-05-12 21:39:59 +00002422 return getSymbolByIndex(0);
Rafael Espindola56f976f2013-04-18 18:08:55 +00002423}
2424
Peter Collingbourne435890a2016-11-22 03:38:40 +00002425basic_symbol_iterator MachOObjectFile::symbol_end() const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00002426 DataRefImpl DRI;
Kevin Enderby1829c682016-01-22 22:49:55 +00002427 MachO::symtab_command Symtab = getSymtabLoadCommand();
2428 if (!SymtabLoadCmd || Symtab.nsyms == 0)
Rafael Espindolaf12b8282014-02-21 20:10:59 +00002429 return basic_symbol_iterator(SymbolRef(DRI, this));
Rafael Espindola75c30362013-04-24 19:47:55 +00002430
Rafael Espindola75c30362013-04-24 19:47:55 +00002431 unsigned SymbolTableEntrySize = is64Bit() ?
Charles Davis8bdfafd2013-09-01 04:28:48 +00002432 sizeof(MachO::nlist_64) :
2433 sizeof(MachO::nlist);
2434 unsigned Offset = Symtab.symoff +
2435 Symtab.nsyms * SymbolTableEntrySize;
Lang Hames697e7cd2016-12-04 01:56:10 +00002436 DRI.p = reinterpret_cast<uintptr_t>(getPtr(*this, Offset));
Rafael Espindolaf12b8282014-02-21 20:10:59 +00002437 return basic_symbol_iterator(SymbolRef(DRI, this));
Rafael Espindola56f976f2013-04-18 18:08:55 +00002438}
2439
Lang Hames46f0a972019-01-14 22:05:12 +00002440symbol_iterator MachOObjectFile::getSymbolByIndex(unsigned Index) const {
Lang Hames36072da2014-05-12 21:39:59 +00002441 MachO::symtab_command Symtab = getSymtabLoadCommand();
Kevin Enderby1829c682016-01-22 22:49:55 +00002442 if (!SymtabLoadCmd || Index >= Symtab.nsyms)
Filipe Cabecinhas40139502015-01-15 22:52:38 +00002443 report_fatal_error("Requested symbol index is out of range.");
Lang Hames36072da2014-05-12 21:39:59 +00002444 unsigned SymbolTableEntrySize =
2445 is64Bit() ? sizeof(MachO::nlist_64) : sizeof(MachO::nlist);
Kevin Enderby1829c682016-01-22 22:49:55 +00002446 DataRefImpl DRI;
Lang Hames697e7cd2016-12-04 01:56:10 +00002447 DRI.p = reinterpret_cast<uintptr_t>(getPtr(*this, Symtab.symoff));
Lang Hames36072da2014-05-12 21:39:59 +00002448 DRI.p += Index * SymbolTableEntrySize;
2449 return basic_symbol_iterator(SymbolRef(DRI, this));
2450}
2451
Kevin Enderby81e8b7d2016-04-20 21:24:34 +00002452uint64_t MachOObjectFile::getSymbolIndex(DataRefImpl Symb) const {
2453 MachO::symtab_command Symtab = getSymtabLoadCommand();
2454 if (!SymtabLoadCmd)
2455 report_fatal_error("getSymbolIndex() called with no symbol table symbol");
2456 unsigned SymbolTableEntrySize =
2457 is64Bit() ? sizeof(MachO::nlist_64) : sizeof(MachO::nlist);
2458 DataRefImpl DRIstart;
Lang Hames697e7cd2016-12-04 01:56:10 +00002459 DRIstart.p = reinterpret_cast<uintptr_t>(getPtr(*this, Symtab.symoff));
Kevin Enderby81e8b7d2016-04-20 21:24:34 +00002460 uint64_t Index = (Symb.p - DRIstart.p) / SymbolTableEntrySize;
2461 return Index;
2462}
2463
Rafael Espindolab5155a52014-02-10 20:24:04 +00002464section_iterator MachOObjectFile::section_begin() const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00002465 DataRefImpl DRI;
2466 return section_iterator(SectionRef(DRI, this));
2467}
2468
Rafael Espindolab5155a52014-02-10 20:24:04 +00002469section_iterator MachOObjectFile::section_end() const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00002470 DataRefImpl DRI;
2471 DRI.d.a = Sections.size();
2472 return section_iterator(SectionRef(DRI, this));
2473}
2474
Rafael Espindola56f976f2013-04-18 18:08:55 +00002475uint8_t MachOObjectFile::getBytesInAddress() const {
Rafael Espindola60689982013-04-07 19:05:30 +00002476 return is64Bit() ? 8 : 4;
Eric Christopher7b015c72011-04-22 03:19:48 +00002477}
2478
Rafael Espindola56f976f2013-04-18 18:08:55 +00002479StringRef MachOObjectFile::getFileFormatName() const {
Lang Hames697e7cd2016-12-04 01:56:10 +00002480 unsigned CPUType = getCPUType(*this);
Rafael Espindola56f976f2013-04-18 18:08:55 +00002481 if (!is64Bit()) {
2482 switch (CPUType) {
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002483 case MachO::CPU_TYPE_I386:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002484 return "Mach-O 32-bit i386";
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002485 case MachO::CPU_TYPE_ARM:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002486 return "Mach-O arm";
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002487 case MachO::CPU_TYPE_POWERPC:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002488 return "Mach-O 32-bit ppc";
2489 default:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002490 return "Mach-O 32-bit unknown";
2491 }
2492 }
2493
Rafael Espindola56f976f2013-04-18 18:08:55 +00002494 switch (CPUType) {
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002495 case MachO::CPU_TYPE_X86_64:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002496 return "Mach-O 64-bit x86-64";
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002497 case MachO::CPU_TYPE_ARM64:
Tim Northover00ed9962014-03-29 10:18:08 +00002498 return "Mach-O arm64";
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002499 case MachO::CPU_TYPE_POWERPC64:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002500 return "Mach-O 64-bit ppc64";
2501 default:
2502 return "Mach-O 64-bit unknown";
2503 }
2504}
2505
Alexey Samsonove6388e62013-06-18 15:03:28 +00002506Triple::ArchType MachOObjectFile::getArch(uint32_t CPUType) {
2507 switch (CPUType) {
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002508 case MachO::CPU_TYPE_I386:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002509 return Triple::x86;
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002510 case MachO::CPU_TYPE_X86_64:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002511 return Triple::x86_64;
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002512 case MachO::CPU_TYPE_ARM:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002513 return Triple::arm;
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002514 case MachO::CPU_TYPE_ARM64:
Tim Northovere19bed72014-07-23 12:32:47 +00002515 return Triple::aarch64;
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002516 case MachO::CPU_TYPE_POWERPC:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002517 return Triple::ppc;
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002518 case MachO::CPU_TYPE_POWERPC64:
Rafael Espindola56f976f2013-04-18 18:08:55 +00002519 return Triple::ppc64;
2520 default:
2521 return Triple::UnknownArch;
2522 }
2523}
2524
Tim Northover9e8eb412016-04-22 23:21:13 +00002525Triple MachOObjectFile::getArchTriple(uint32_t CPUType, uint32_t CPUSubType,
Kevin Enderby59343a92016-12-16 22:54:02 +00002526 const char **McpuDefault,
2527 const char **ArchFlag) {
Kevin Enderbyec5ca032014-08-18 20:21:02 +00002528 if (McpuDefault)
2529 *McpuDefault = nullptr;
Kevin Enderby59343a92016-12-16 22:54:02 +00002530 if (ArchFlag)
2531 *ArchFlag = nullptr;
Kevin Enderbyec5ca032014-08-18 20:21:02 +00002532
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002533 switch (CPUType) {
2534 case MachO::CPU_TYPE_I386:
2535 switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
2536 case MachO::CPU_SUBTYPE_I386_ALL:
Kevin Enderby59343a92016-12-16 22:54:02 +00002537 if (ArchFlag)
2538 *ArchFlag = "i386";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002539 return Triple("i386-apple-darwin");
2540 default:
2541 return Triple();
2542 }
2543 case MachO::CPU_TYPE_X86_64:
2544 switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
2545 case MachO::CPU_SUBTYPE_X86_64_ALL:
Kevin Enderby59343a92016-12-16 22:54:02 +00002546 if (ArchFlag)
2547 *ArchFlag = "x86_64";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002548 return Triple("x86_64-apple-darwin");
2549 case MachO::CPU_SUBTYPE_X86_64_H:
Kevin Enderby59343a92016-12-16 22:54:02 +00002550 if (ArchFlag)
2551 *ArchFlag = "x86_64h";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002552 return Triple("x86_64h-apple-darwin");
2553 default:
2554 return Triple();
2555 }
2556 case MachO::CPU_TYPE_ARM:
2557 switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
2558 case MachO::CPU_SUBTYPE_ARM_V4T:
Kevin Enderby59343a92016-12-16 22:54:02 +00002559 if (ArchFlag)
2560 *ArchFlag = "armv4t";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002561 return Triple("armv4t-apple-darwin");
2562 case MachO::CPU_SUBTYPE_ARM_V5TEJ:
Kevin Enderby59343a92016-12-16 22:54:02 +00002563 if (ArchFlag)
2564 *ArchFlag = "armv5e";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002565 return Triple("armv5e-apple-darwin");
Kevin Enderbyae2a9a22014-08-07 21:30:25 +00002566 case MachO::CPU_SUBTYPE_ARM_XSCALE:
Kevin Enderby59343a92016-12-16 22:54:02 +00002567 if (ArchFlag)
2568 *ArchFlag = "xscale";
Kevin Enderbyae2a9a22014-08-07 21:30:25 +00002569 return Triple("xscale-apple-darwin");
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002570 case MachO::CPU_SUBTYPE_ARM_V6:
Kevin Enderby59343a92016-12-16 22:54:02 +00002571 if (ArchFlag)
2572 *ArchFlag = "armv6";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002573 return Triple("armv6-apple-darwin");
2574 case MachO::CPU_SUBTYPE_ARM_V6M:
Kevin Enderbyec5ca032014-08-18 20:21:02 +00002575 if (McpuDefault)
2576 *McpuDefault = "cortex-m0";
Kevin Enderby59343a92016-12-16 22:54:02 +00002577 if (ArchFlag)
2578 *ArchFlag = "armv6m";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002579 return Triple("armv6m-apple-darwin");
Kevin Enderbyae2a9a22014-08-07 21:30:25 +00002580 case MachO::CPU_SUBTYPE_ARM_V7:
Kevin Enderby59343a92016-12-16 22:54:02 +00002581 if (ArchFlag)
2582 *ArchFlag = "armv7";
Kevin Enderbyae2a9a22014-08-07 21:30:25 +00002583 return Triple("armv7-apple-darwin");
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002584 case MachO::CPU_SUBTYPE_ARM_V7EM:
Kevin Enderbyec5ca032014-08-18 20:21:02 +00002585 if (McpuDefault)
2586 *McpuDefault = "cortex-m4";
Kevin Enderby59343a92016-12-16 22:54:02 +00002587 if (ArchFlag)
2588 *ArchFlag = "armv7em";
Tim Northover9e8eb412016-04-22 23:21:13 +00002589 return Triple("thumbv7em-apple-darwin");
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002590 case MachO::CPU_SUBTYPE_ARM_V7K:
Kevin Enderby7a165752017-01-24 23:41:04 +00002591 if (McpuDefault)
2592 *McpuDefault = "cortex-a7";
Kevin Enderby59343a92016-12-16 22:54:02 +00002593 if (ArchFlag)
2594 *ArchFlag = "armv7k";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002595 return Triple("armv7k-apple-darwin");
2596 case MachO::CPU_SUBTYPE_ARM_V7M:
Kevin Enderbyec5ca032014-08-18 20:21:02 +00002597 if (McpuDefault)
2598 *McpuDefault = "cortex-m3";
Kevin Enderby59343a92016-12-16 22:54:02 +00002599 if (ArchFlag)
2600 *ArchFlag = "armv7m";
Tim Northover9e8eb412016-04-22 23:21:13 +00002601 return Triple("thumbv7m-apple-darwin");
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002602 case MachO::CPU_SUBTYPE_ARM_V7S:
Kevin Enderby7a165752017-01-24 23:41:04 +00002603 if (McpuDefault)
2604 *McpuDefault = "cortex-a7";
Kevin Enderby59343a92016-12-16 22:54:02 +00002605 if (ArchFlag)
2606 *ArchFlag = "armv7s";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002607 return Triple("armv7s-apple-darwin");
2608 default:
2609 return Triple();
2610 }
2611 case MachO::CPU_TYPE_ARM64:
2612 switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
2613 case MachO::CPU_SUBTYPE_ARM64_ALL:
Kevin Enderbydc412cc2017-02-10 19:27:10 +00002614 if (McpuDefault)
2615 *McpuDefault = "cyclone";
Kevin Enderby59343a92016-12-16 22:54:02 +00002616 if (ArchFlag)
2617 *ArchFlag = "arm64";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002618 return Triple("arm64-apple-darwin");
2619 default:
2620 return Triple();
2621 }
2622 case MachO::CPU_TYPE_POWERPC:
2623 switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
2624 case MachO::CPU_SUBTYPE_POWERPC_ALL:
Kevin Enderby59343a92016-12-16 22:54:02 +00002625 if (ArchFlag)
2626 *ArchFlag = "ppc";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002627 return Triple("ppc-apple-darwin");
2628 default:
2629 return Triple();
2630 }
2631 case MachO::CPU_TYPE_POWERPC64:
Reid Kleckner4da3d572014-06-30 20:12:59 +00002632 switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002633 case MachO::CPU_SUBTYPE_POWERPC_ALL:
Kevin Enderby59343a92016-12-16 22:54:02 +00002634 if (ArchFlag)
2635 *ArchFlag = "ppc64";
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002636 return Triple("ppc64-apple-darwin");
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002637 default:
2638 return Triple();
2639 }
2640 default:
2641 return Triple();
2642 }
2643}
2644
2645Triple MachOObjectFile::getHostArch() {
2646 return Triple(sys::getDefaultTargetTriple());
2647}
2648
Rafael Espindola72318b42014-08-08 16:30:17 +00002649bool MachOObjectFile::isValidArch(StringRef ArchFlag) {
2650 return StringSwitch<bool>(ArchFlag)
2651 .Case("i386", true)
2652 .Case("x86_64", true)
2653 .Case("x86_64h", true)
2654 .Case("armv4t", true)
2655 .Case("arm", true)
2656 .Case("armv5e", true)
2657 .Case("armv6", true)
2658 .Case("armv6m", true)
Frederic Riss40baa0a2015-06-16 17:37:03 +00002659 .Case("armv7", true)
Rafael Espindola72318b42014-08-08 16:30:17 +00002660 .Case("armv7em", true)
2661 .Case("armv7k", true)
2662 .Case("armv7m", true)
2663 .Case("armv7s", true)
2664 .Case("arm64", true)
2665 .Case("ppc", true)
2666 .Case("ppc64", true)
2667 .Default(false);
Kevin Enderby4c8dfe42014-06-30 18:45:23 +00002668}
2669
Zachary Turner260fe3e2017-12-14 22:07:03 +00002670Triple::ArchType MachOObjectFile::getArch() const {
Lang Hames697e7cd2016-12-04 01:56:10 +00002671 return getArch(getCPUType(*this));
Alexey Samsonove6388e62013-06-18 15:03:28 +00002672}
2673
Tim Northover9e8eb412016-04-22 23:21:13 +00002674Triple MachOObjectFile::getArchTriple(const char **McpuDefault) const {
2675 return getArchTriple(Header.cputype, Header.cpusubtype, McpuDefault);
Kevin Enderbyec5ca032014-08-18 20:21:02 +00002676}
2677
Rui Ueyamabc654b12013-09-27 21:47:05 +00002678relocation_iterator MachOObjectFile::section_rel_begin(unsigned Index) const {
Rafael Espindola6e040c02013-04-26 20:07:33 +00002679 DataRefImpl DRI;
2680 DRI.d.a = Index;
Rui Ueyamabc654b12013-09-27 21:47:05 +00002681 return section_rel_begin(DRI);
Rafael Espindola6e040c02013-04-26 20:07:33 +00002682}
2683
Rui Ueyamabc654b12013-09-27 21:47:05 +00002684relocation_iterator MachOObjectFile::section_rel_end(unsigned Index) const {
Rafael Espindola6e040c02013-04-26 20:07:33 +00002685 DataRefImpl DRI;
2686 DRI.d.a = Index;
Rui Ueyamabc654b12013-09-27 21:47:05 +00002687 return section_rel_end(DRI);
Rafael Espindola6e040c02013-04-26 20:07:33 +00002688}
2689
Kevin Enderby273ae012013-06-06 17:20:50 +00002690dice_iterator MachOObjectFile::begin_dices() const {
2691 DataRefImpl DRI;
2692 if (!DataInCodeLoadCmd)
2693 return dice_iterator(DiceRef(DRI, this));
2694
Charles Davis8bdfafd2013-09-01 04:28:48 +00002695 MachO::linkedit_data_command DicLC = getDataInCodeLoadCommand();
Lang Hames697e7cd2016-12-04 01:56:10 +00002696 DRI.p = reinterpret_cast<uintptr_t>(getPtr(*this, DicLC.dataoff));
Kevin Enderby273ae012013-06-06 17:20:50 +00002697 return dice_iterator(DiceRef(DRI, this));
2698}
2699
2700dice_iterator MachOObjectFile::end_dices() const {
2701 DataRefImpl DRI;
2702 if (!DataInCodeLoadCmd)
2703 return dice_iterator(DiceRef(DRI, this));
2704
Charles Davis8bdfafd2013-09-01 04:28:48 +00002705 MachO::linkedit_data_command DicLC = getDataInCodeLoadCommand();
2706 unsigned Offset = DicLC.dataoff + DicLC.datasize;
Lang Hames697e7cd2016-12-04 01:56:10 +00002707 DRI.p = reinterpret_cast<uintptr_t>(getPtr(*this, Offset));
Kevin Enderby273ae012013-06-06 17:20:50 +00002708 return dice_iterator(DiceRef(DRI, this));
2709}
2710
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002711ExportEntry::ExportEntry(Error *E, const MachOObjectFile *O,
2712 ArrayRef<uint8_t> T) : E(E), O(O), Trie(T) {}
Nick Kledzikd04bc352014-08-30 00:20:14 +00002713
2714void ExportEntry::moveToFirst() {
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002715 ErrorAsOutParameter ErrAsOutParam(E);
Nick Kledzikd04bc352014-08-30 00:20:14 +00002716 pushNode(0);
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002717 if (*E)
2718 return;
Nick Kledzikd04bc352014-08-30 00:20:14 +00002719 pushDownUntilBottom();
2720}
2721
2722void ExportEntry::moveToEnd() {
2723 Stack.clear();
2724 Done = true;
2725}
2726
2727bool ExportEntry::operator==(const ExportEntry &Other) const {
NAKAMURA Takumi84965032015-09-22 11:14:12 +00002728 // Common case, one at end, other iterating from begin.
Nick Kledzikd04bc352014-08-30 00:20:14 +00002729 if (Done || Other.Done)
2730 return (Done == Other.Done);
2731 // Not equal if different stack sizes.
2732 if (Stack.size() != Other.Stack.size())
2733 return false;
2734 // Not equal if different cumulative strings.
Yaron Keren075759a2015-03-30 15:42:36 +00002735 if (!CumulativeString.equals(Other.CumulativeString))
Nick Kledzikd04bc352014-08-30 00:20:14 +00002736 return false;
2737 // Equal if all nodes in both stacks match.
2738 for (unsigned i=0; i < Stack.size(); ++i) {
2739 if (Stack[i].Start != Other.Stack[i].Start)
2740 return false;
2741 }
NAKAMURA Takumi10c80e72015-09-22 11:19:03 +00002742 return true;
Nick Kledzikd04bc352014-08-30 00:20:14 +00002743}
2744
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002745uint64_t ExportEntry::readULEB128(const uint8_t *&Ptr, const char **error) {
Nick Kledzikac7cbdc2014-09-02 18:50:24 +00002746 unsigned Count;
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002747 uint64_t Result = decodeULEB128(Ptr, &Count, Trie.end(), error);
Nick Kledzikac7cbdc2014-09-02 18:50:24 +00002748 Ptr += Count;
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002749 if (Ptr > Trie.end())
Nick Kledzikac7cbdc2014-09-02 18:50:24 +00002750 Ptr = Trie.end();
Nick Kledzikac7cbdc2014-09-02 18:50:24 +00002751 return Result;
Nick Kledzikd04bc352014-08-30 00:20:14 +00002752}
2753
2754StringRef ExportEntry::name() const {
Yaron Keren075759a2015-03-30 15:42:36 +00002755 return CumulativeString;
Nick Kledzikd04bc352014-08-30 00:20:14 +00002756}
2757
2758uint64_t ExportEntry::flags() const {
2759 return Stack.back().Flags;
2760}
2761
2762uint64_t ExportEntry::address() const {
2763 return Stack.back().Address;
2764}
2765
2766uint64_t ExportEntry::other() const {
2767 return Stack.back().Other;
2768}
2769
2770StringRef ExportEntry::otherName() const {
2771 const char* ImportName = Stack.back().ImportName;
2772 if (ImportName)
2773 return StringRef(ImportName);
2774 return StringRef();
2775}
2776
2777uint32_t ExportEntry::nodeOffset() const {
2778 return Stack.back().Start - Trie.begin();
2779}
2780
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00002781ExportEntry::NodeState::NodeState(const uint8_t *Ptr)
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00002782 : Start(Ptr), Current(Ptr) {}
Nick Kledzikd04bc352014-08-30 00:20:14 +00002783
2784void ExportEntry::pushNode(uint64_t offset) {
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002785 ErrorAsOutParameter ErrAsOutParam(E);
Nick Kledzikd04bc352014-08-30 00:20:14 +00002786 const uint8_t *Ptr = Trie.begin() + offset;
2787 NodeState State(Ptr);
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002788 const char *error;
2789 uint64_t ExportInfoSize = readULEB128(State.Current, &error);
2790 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002791 *E = malformedError("export info size " + Twine(error) +
2792 " in export trie data at node: 0x" +
2793 Twine::utohexstr(offset));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002794 moveToEnd();
2795 return;
2796 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002797 State.IsExportNode = (ExportInfoSize != 0);
2798 const uint8_t* Children = State.Current + ExportInfoSize;
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002799 if (Children > Trie.end()) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002800 *E = malformedError(
2801 "export info size: 0x" + Twine::utohexstr(ExportInfoSize) +
2802 " in export trie data at node: 0x" + Twine::utohexstr(offset) +
2803 " too big and extends past end of trie data");
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002804 moveToEnd();
2805 return;
2806 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002807 if (State.IsExportNode) {
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002808 const uint8_t *ExportStart = State.Current;
2809 State.Flags = readULEB128(State.Current, &error);
2810 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002811 *E = malformedError("flags " + Twine(error) +
2812 " in export trie data at node: 0x" +
2813 Twine::utohexstr(offset));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002814 moveToEnd();
2815 return;
2816 }
2817 uint64_t Kind = State.Flags & MachO::EXPORT_SYMBOL_FLAGS_KIND_MASK;
2818 if (State.Flags != 0 &&
2819 (Kind != MachO::EXPORT_SYMBOL_FLAGS_KIND_REGULAR &&
2820 Kind != MachO::EXPORT_SYMBOL_FLAGS_KIND_ABSOLUTE &&
2821 Kind != MachO::EXPORT_SYMBOL_FLAGS_KIND_THREAD_LOCAL)) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002822 *E = malformedError(
2823 "unsupported exported symbol kind: " + Twine((int)Kind) +
2824 " in flags: 0x" + Twine::utohexstr(State.Flags) +
2825 " in export trie data at node: 0x" + Twine::utohexstr(offset));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002826 moveToEnd();
2827 return;
2828 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002829 if (State.Flags & MachO::EXPORT_SYMBOL_FLAGS_REEXPORT) {
2830 State.Address = 0;
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002831 State.Other = readULEB128(State.Current, &error); // dylib ordinal
2832 if (error) {
2833 *E = malformedError("dylib ordinal of re-export " + Twine(error) +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002834 " in export trie data at node: 0x" +
2835 Twine::utohexstr(offset));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002836 moveToEnd();
2837 return;
2838 }
2839 if (O != nullptr) {
2840 if (State.Other > O->getLibraryCount()) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002841 *E = malformedError(
2842 "bad library ordinal: " + Twine((int)State.Other) + " (max " +
2843 Twine((int)O->getLibraryCount()) +
2844 ") in export trie data at node: 0x" + Twine::utohexstr(offset));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002845 moveToEnd();
2846 return;
2847 }
2848 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002849 State.ImportName = reinterpret_cast<const char*>(State.Current);
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002850 if (*State.ImportName == '\0') {
2851 State.Current++;
2852 } else {
2853 const uint8_t *End = State.Current + 1;
2854 if (End >= Trie.end()) {
2855 *E = malformedError("import name of re-export in export trie data at "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002856 "node: 0x" +
2857 Twine::utohexstr(offset) +
2858 " starts past end of trie data");
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002859 moveToEnd();
2860 return;
2861 }
2862 while(*End != '\0' && End < Trie.end())
2863 End++;
2864 if (*End != '\0') {
2865 *E = malformedError("import name of re-export in export trie data at "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002866 "node: 0x" +
2867 Twine::utohexstr(offset) +
2868 " extends past end of trie data");
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002869 moveToEnd();
2870 return;
2871 }
2872 State.Current = End + 1;
2873 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002874 } else {
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002875 State.Address = readULEB128(State.Current, &error);
2876 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002877 *E = malformedError("address " + Twine(error) +
2878 " in export trie data at node: 0x" +
2879 Twine::utohexstr(offset));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002880 moveToEnd();
2881 return;
2882 }
2883 if (State.Flags & MachO::EXPORT_SYMBOL_FLAGS_STUB_AND_RESOLVER) {
2884 State.Other = readULEB128(State.Current, &error);
2885 if (error) {
2886 *E = malformedError("resolver of stub and resolver " + Twine(error) +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002887 " in export trie data at node: 0x" +
2888 Twine::utohexstr(offset));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002889 moveToEnd();
2890 return;
2891 }
2892 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002893 }
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002894 if(ExportStart + ExportInfoSize != State.Current) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002895 *E = malformedError(
2896 "inconsistant export info size: 0x" +
2897 Twine::utohexstr(ExportInfoSize) + " where actual size was: 0x" +
2898 Twine::utohexstr(State.Current - ExportStart) +
2899 " in export trie data at node: 0x" + Twine::utohexstr(offset));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002900 moveToEnd();
2901 return;
2902 }
2903 }
Kevin Enderby8100cde2017-07-24 20:33:41 +00002904 State.ChildCount = *Children;
2905 if (State.ChildCount != 0 && Children + 1 >= Trie.end()) {
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002906 *E = malformedError("byte for count of childern in export trie data at "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002907 "node: 0x" +
2908 Twine::utohexstr(offset) +
2909 " extends past end of trie data");
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002910 moveToEnd();
2911 return;
Nick Kledzikd04bc352014-08-30 00:20:14 +00002912 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002913 State.Current = Children + 1;
2914 State.NextChildIndex = 0;
2915 State.ParentStringLength = CumulativeString.size();
2916 Stack.push_back(State);
2917}
2918
2919void ExportEntry::pushDownUntilBottom() {
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002920 ErrorAsOutParameter ErrAsOutParam(E);
2921 const char *error;
Nick Kledzikd04bc352014-08-30 00:20:14 +00002922 while (Stack.back().NextChildIndex < Stack.back().ChildCount) {
2923 NodeState &Top = Stack.back();
2924 CumulativeString.resize(Top.ParentStringLength);
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002925 for (;*Top.Current != 0 && Top.Current < Trie.end(); Top.Current++) {
Nick Kledzikac7cbdc2014-09-02 18:50:24 +00002926 char C = *Top.Current;
2927 CumulativeString.push_back(C);
Nick Kledzikd04bc352014-08-30 00:20:14 +00002928 }
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002929 if (Top.Current >= Trie.end()) {
2930 *E = malformedError("edge sub-string in export trie data at node: 0x" +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002931 Twine::utohexstr(Top.Start - Trie.begin()) +
2932 " for child #" + Twine((int)Top.NextChildIndex) +
2933 " extends past end of trie data");
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002934 moveToEnd();
2935 return;
2936 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002937 Top.Current += 1;
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002938 uint64_t childNodeIndex = readULEB128(Top.Current, &error);
2939 if (error) {
2940 *E = malformedError("child node offset " + Twine(error) +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002941 " in export trie data at node: 0x" +
2942 Twine::utohexstr(Top.Start - Trie.begin()));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002943 moveToEnd();
2944 return;
2945 }
2946 for (const NodeState &node : nodes()) {
2947 if (node.Start == Trie.begin() + childNodeIndex){
2948 *E = malformedError("loop in childern in export trie data at node: 0x" +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002949 Twine::utohexstr(Top.Start - Trie.begin()) +
2950 " back to node: 0x" +
2951 Twine::utohexstr(childNodeIndex));
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002952 moveToEnd();
2953 return;
2954 }
2955 }
Nick Kledzikd04bc352014-08-30 00:20:14 +00002956 Top.NextChildIndex += 1;
2957 pushNode(childNodeIndex);
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002958 if (*E)
2959 return;
Nick Kledzikd04bc352014-08-30 00:20:14 +00002960 }
2961 if (!Stack.back().IsExportNode) {
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002962 *E = malformedError("node is not an export node in export trie data at "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002963 "node: 0x" +
2964 Twine::utohexstr(Stack.back().Start - Trie.begin()));
Nick Kledzikd04bc352014-08-30 00:20:14 +00002965 moveToEnd();
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002966 return;
Nick Kledzikd04bc352014-08-30 00:20:14 +00002967 }
2968}
2969
2970// We have a trie data structure and need a way to walk it that is compatible
2971// with the C++ iterator model. The solution is a non-recursive depth first
2972// traversal where the iterator contains a stack of parent nodes along with a
2973// string that is the accumulation of all edge strings along the parent chain
2974// to this point.
2975//
NAKAMURA Takumi59c74b222014-10-27 08:08:18 +00002976// There is one "export" node for each exported symbol. But because some
Nick Kledzikd04bc352014-08-30 00:20:14 +00002977// symbols may be a prefix of another symbol (e.g. _dup and _dup2), an export
NAKAMURA Takumi84965032015-09-22 11:14:12 +00002978// node may have child nodes too.
Nick Kledzikd04bc352014-08-30 00:20:14 +00002979//
2980// The algorithm for moveNext() is to keep moving down the leftmost unvisited
2981// child until hitting a node with no children (which is an export node or
2982// else the trie is malformed). On the way down, each node is pushed on the
2983// stack ivar. If there is no more ways down, it pops up one and tries to go
2984// down a sibling path until a childless node is reached.
2985void ExportEntry::moveNext() {
Kevin Enderby3e95bd22017-07-20 23:08:41 +00002986 assert(!Stack.empty() && "ExportEntry::moveNext() with empty node stack");
2987 if (!Stack.back().IsExportNode) {
2988 *E = malformedError("node is not an export node in export trie data at "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00002989 "node: 0x" +
2990 Twine::utohexstr(Stack.back().Start - Trie.begin()));
Nick Kledzikd04bc352014-08-30 00:20:14 +00002991 moveToEnd();
2992 return;
2993 }
2994
2995 Stack.pop_back();
2996 while (!Stack.empty()) {
2997 NodeState &Top = Stack.back();
2998 if (Top.NextChildIndex < Top.ChildCount) {
2999 pushDownUntilBottom();
3000 // Now at the next export node.
3001 return;
3002 } else {
3003 if (Top.IsExportNode) {
3004 // This node has no children but is itself an export node.
3005 CumulativeString.resize(Top.ParentStringLength);
3006 return;
3007 }
3008 Stack.pop_back();
3009 }
3010 }
3011 Done = true;
3012}
3013
NAKAMURA Takumi10c80e72015-09-22 11:19:03 +00003014iterator_range<export_iterator>
Kevin Enderby3e95bd22017-07-20 23:08:41 +00003015MachOObjectFile::exports(Error &E, ArrayRef<uint8_t> Trie,
3016 const MachOObjectFile *O) {
3017 ExportEntry Start(&E, O, Trie);
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003018 if (Trie.empty())
Juergen Ributzka4d7f70d2014-12-19 02:31:01 +00003019 Start.moveToEnd();
3020 else
3021 Start.moveToFirst();
Nick Kledzikd04bc352014-08-30 00:20:14 +00003022
Kevin Enderby3e95bd22017-07-20 23:08:41 +00003023 ExportEntry Finish(&E, O, Trie);
Nick Kledzikd04bc352014-08-30 00:20:14 +00003024 Finish.moveToEnd();
3025
Craig Topper15576e12015-12-06 05:08:07 +00003026 return make_range(export_iterator(Start), export_iterator(Finish));
Nick Kledzikd04bc352014-08-30 00:20:14 +00003027}
3028
Alexander Shaposhnikove5740342017-07-29 00:30:45 +00003029iterator_range<export_iterator> MachOObjectFile::exports(Error &Err) const {
3030 return exports(Err, getDyldInfoExportsTrie(), this);
Nick Kledzikd04bc352014-08-30 00:20:14 +00003031}
3032
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003033MachORebaseEntry::MachORebaseEntry(Error *E, const MachOObjectFile *O,
3034 ArrayRef<uint8_t> Bytes, bool is64Bit)
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003035 : E(E), O(O), Opcodes(Bytes), Ptr(Bytes.begin()),
3036 PointerSize(is64Bit ? 8 : 4) {}
Nick Kledzikac431442014-09-12 21:34:15 +00003037
3038void MachORebaseEntry::moveToFirst() {
3039 Ptr = Opcodes.begin();
3040 moveNext();
3041}
3042
3043void MachORebaseEntry::moveToEnd() {
3044 Ptr = Opcodes.end();
3045 RemainingLoopCount = 0;
3046 Done = true;
3047}
3048
3049void MachORebaseEntry::moveNext() {
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003050 ErrorAsOutParameter ErrAsOutParam(E);
Nick Kledzikac431442014-09-12 21:34:15 +00003051 // If in the middle of some loop, move to next rebasing in loop.
3052 SegmentOffset += AdvanceAmount;
3053 if (RemainingLoopCount) {
3054 --RemainingLoopCount;
3055 return;
3056 }
Juergen Ributzkacad12492017-03-30 19:56:50 +00003057 // REBASE_OPCODE_DONE is only used for padding if we are not aligned to
3058 // pointer size. Therefore it is possible to reach the end without ever having
3059 // seen REBASE_OPCODE_DONE.
3060 if (Ptr == Opcodes.end()) {
Nick Kledzikac431442014-09-12 21:34:15 +00003061 Done = true;
3062 return;
3063 }
3064 bool More = true;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003065 while (More) {
Nick Kledzikac431442014-09-12 21:34:15 +00003066 // Parse next opcode and set up next loop.
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003067 const uint8_t *OpcodeStart = Ptr;
Nick Kledzikac431442014-09-12 21:34:15 +00003068 uint8_t Byte = *Ptr++;
3069 uint8_t ImmValue = Byte & MachO::REBASE_IMMEDIATE_MASK;
3070 uint8_t Opcode = Byte & MachO::REBASE_OPCODE_MASK;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003071 uint32_t Count, Skip;
3072 const char *error = nullptr;
Nick Kledzikac431442014-09-12 21:34:15 +00003073 switch (Opcode) {
3074 case MachO::REBASE_OPCODE_DONE:
3075 More = false;
3076 Done = true;
3077 moveToEnd();
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003078 DEBUG_WITH_TYPE("mach-o-rebase", dbgs() << "REBASE_OPCODE_DONE\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003079 break;
3080 case MachO::REBASE_OPCODE_SET_TYPE_IMM:
3081 RebaseType = ImmValue;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003082 if (RebaseType > MachO::REBASE_TYPE_TEXT_PCREL32) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003083 *E = malformedError("for REBASE_OPCODE_SET_TYPE_IMM bad bind type: " +
3084 Twine((int)RebaseType) + " for opcode at: 0x" +
3085 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
3086 moveToEnd();
3087 return;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003088 }
Nick Kledzikac431442014-09-12 21:34:15 +00003089 DEBUG_WITH_TYPE(
3090 "mach-o-rebase",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003091 dbgs() << "REBASE_OPCODE_SET_TYPE_IMM: "
3092 << "RebaseType=" << (int) RebaseType << "\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003093 break;
3094 case MachO::REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB:
3095 SegmentIndex = ImmValue;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003096 SegmentOffset = readULEB128(&error);
3097 if (error) {
3098 *E = malformedError("for REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003099 Twine(error) + " for opcode at: 0x" +
3100 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003101 moveToEnd();
3102 return;
3103 }
3104 error = O->RebaseEntryCheckSegAndOffset(SegmentIndex, SegmentOffset,
3105 true);
3106 if (error) {
3107 *E = malformedError("for REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003108 Twine(error) + " for opcode at: 0x" +
3109 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003110 moveToEnd();
3111 return;
3112 }
Nick Kledzikac431442014-09-12 21:34:15 +00003113 DEBUG_WITH_TYPE(
3114 "mach-o-rebase",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003115 dbgs() << "REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB: "
3116 << "SegmentIndex=" << SegmentIndex << ", "
3117 << format("SegmentOffset=0x%06X", SegmentOffset)
3118 << "\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003119 break;
3120 case MachO::REBASE_OPCODE_ADD_ADDR_ULEB:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003121 SegmentOffset += readULEB128(&error);
3122 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003123 *E = malformedError("for REBASE_OPCODE_ADD_ADDR_ULEB " + Twine(error) +
3124 " for opcode at: 0x" +
3125 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003126 moveToEnd();
3127 return;
3128 }
3129 error = O->RebaseEntryCheckSegAndOffset(SegmentIndex, SegmentOffset,
3130 true);
3131 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003132 *E = malformedError("for REBASE_OPCODE_ADD_ADDR_ULEB " + Twine(error) +
3133 " for opcode at: 0x" +
3134 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003135 moveToEnd();
3136 return;
3137 }
Nick Kledzikac431442014-09-12 21:34:15 +00003138 DEBUG_WITH_TYPE("mach-o-rebase",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003139 dbgs() << "REBASE_OPCODE_ADD_ADDR_ULEB: "
3140 << format("SegmentOffset=0x%06X",
3141 SegmentOffset) << "\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003142 break;
3143 case MachO::REBASE_OPCODE_ADD_ADDR_IMM_SCALED:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003144 error = O->RebaseEntryCheckSegAndOffset(SegmentIndex, SegmentOffset,
3145 true);
3146 if (error) {
3147 *E = malformedError("for REBASE_OPCODE_ADD_ADDR_IMM_SCALED " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003148 Twine(error) + " for opcode at: 0x" +
3149 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003150 moveToEnd();
3151 return;
3152 }
Nick Kledzikac431442014-09-12 21:34:15 +00003153 SegmentOffset += ImmValue * PointerSize;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003154 error = O->RebaseEntryCheckSegAndOffset(SegmentIndex, SegmentOffset,
3155 false);
3156 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003157 *E =
3158 malformedError("for REBASE_OPCODE_ADD_ADDR_IMM_SCALED "
3159 " (after adding immediate times the pointer size) " +
3160 Twine(error) + " for opcode at: 0x" +
3161 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003162 moveToEnd();
3163 return;
3164 }
Nick Kledzikac431442014-09-12 21:34:15 +00003165 DEBUG_WITH_TYPE("mach-o-rebase",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003166 dbgs() << "REBASE_OPCODE_ADD_ADDR_IMM_SCALED: "
3167 << format("SegmentOffset=0x%06X",
3168 SegmentOffset) << "\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003169 break;
3170 case MachO::REBASE_OPCODE_DO_REBASE_IMM_TIMES:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003171 error = O->RebaseEntryCheckSegAndOffset(SegmentIndex, SegmentOffset,
3172 true);
3173 if (error) {
3174 *E = malformedError("for REBASE_OPCODE_DO_REBASE_IMM_TIMES " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003175 Twine(error) + " for opcode at: 0x" +
3176 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003177 moveToEnd();
3178 return;
3179 }
Nick Kledzikac431442014-09-12 21:34:15 +00003180 AdvanceAmount = PointerSize;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003181 Skip = 0;
3182 Count = ImmValue;
3183 if (ImmValue != 0)
3184 RemainingLoopCount = ImmValue - 1;
3185 else
3186 RemainingLoopCount = 0;
3187 error = O->RebaseEntryCheckCountAndSkip(Count, Skip, PointerSize,
3188 SegmentIndex, SegmentOffset);
3189 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003190 *E = malformedError("for REBASE_OPCODE_DO_REBASE_IMM_TIMES " +
3191 Twine(error) + " for opcode at: 0x" +
3192 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003193 moveToEnd();
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +00003194 return;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003195 }
Nick Kledzikac431442014-09-12 21:34:15 +00003196 DEBUG_WITH_TYPE(
3197 "mach-o-rebase",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003198 dbgs() << "REBASE_OPCODE_DO_REBASE_IMM_TIMES: "
3199 << format("SegmentOffset=0x%06X", SegmentOffset)
3200 << ", AdvanceAmount=" << AdvanceAmount
3201 << ", RemainingLoopCount=" << RemainingLoopCount
3202 << "\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003203 return;
3204 case MachO::REBASE_OPCODE_DO_REBASE_ULEB_TIMES:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003205 error = O->RebaseEntryCheckSegAndOffset(SegmentIndex, SegmentOffset,
3206 true);
3207 if (error) {
3208 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003209 Twine(error) + " for opcode at: 0x" +
3210 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003211 moveToEnd();
3212 return;
3213 }
Nick Kledzikac431442014-09-12 21:34:15 +00003214 AdvanceAmount = PointerSize;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003215 Skip = 0;
3216 Count = readULEB128(&error);
3217 if (error) {
3218 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003219 Twine(error) + " for opcode at: 0x" +
3220 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003221 moveToEnd();
3222 return;
3223 }
3224 if (Count != 0)
3225 RemainingLoopCount = Count - 1;
3226 else
3227 RemainingLoopCount = 0;
3228 error = O->RebaseEntryCheckCountAndSkip(Count, Skip, PointerSize,
3229 SegmentIndex, SegmentOffset);
3230 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003231 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES " +
3232 Twine(error) + " for opcode at: 0x" +
3233 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003234 moveToEnd();
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +00003235 return;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003236 }
Nick Kledzikac431442014-09-12 21:34:15 +00003237 DEBUG_WITH_TYPE(
3238 "mach-o-rebase",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003239 dbgs() << "REBASE_OPCODE_DO_REBASE_ULEB_TIMES: "
3240 << format("SegmentOffset=0x%06X", SegmentOffset)
3241 << ", AdvanceAmount=" << AdvanceAmount
3242 << ", RemainingLoopCount=" << RemainingLoopCount
3243 << "\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003244 return;
3245 case MachO::REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003246 error = O->RebaseEntryCheckSegAndOffset(SegmentIndex, SegmentOffset,
3247 true);
3248 if (error) {
3249 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003250 Twine(error) + " for opcode at: 0x" +
3251 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003252 moveToEnd();
3253 return;
3254 }
3255 Skip = readULEB128(&error);
3256 if (error) {
3257 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003258 Twine(error) + " for opcode at: 0x" +
3259 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003260 moveToEnd();
3261 return;
3262 }
3263 AdvanceAmount = Skip + PointerSize;
3264 Count = 1;
Nick Kledzikac431442014-09-12 21:34:15 +00003265 RemainingLoopCount = 0;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003266 error = O->RebaseEntryCheckCountAndSkip(Count, Skip, PointerSize,
3267 SegmentIndex, SegmentOffset);
3268 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003269 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB " +
3270 Twine(error) + " for opcode at: 0x" +
3271 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003272 moveToEnd();
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +00003273 return;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003274 }
Nick Kledzikac431442014-09-12 21:34:15 +00003275 DEBUG_WITH_TYPE(
3276 "mach-o-rebase",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003277 dbgs() << "REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB: "
3278 << format("SegmentOffset=0x%06X", SegmentOffset)
3279 << ", AdvanceAmount=" << AdvanceAmount
3280 << ", RemainingLoopCount=" << RemainingLoopCount
3281 << "\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003282 return;
3283 case MachO::REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_ULEB:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003284 error = O->RebaseEntryCheckSegAndOffset(SegmentIndex, SegmentOffset,
3285 true);
3286 if (error) {
3287 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_"
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003288 "ULEB " +
3289 Twine(error) + " for opcode at: 0x" +
3290 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003291 moveToEnd();
3292 return;
3293 }
3294 Count = readULEB128(&error);
3295 if (error) {
3296 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_"
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003297 "ULEB " +
3298 Twine(error) + " for opcode at: 0x" +
3299 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003300 moveToEnd();
3301 return;
3302 }
3303 if (Count != 0)
3304 RemainingLoopCount = Count - 1;
3305 else
3306 RemainingLoopCount = 0;
3307 Skip = readULEB128(&error);
3308 if (error) {
3309 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_"
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003310 "ULEB " +
3311 Twine(error) + " for opcode at: 0x" +
3312 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003313 moveToEnd();
3314 return;
3315 }
3316 AdvanceAmount = Skip + PointerSize;
3317
3318 error = O->RebaseEntryCheckCountAndSkip(Count, Skip, PointerSize,
3319 SegmentIndex, SegmentOffset);
3320 if (error) {
3321 *E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_"
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003322 "ULEB " +
3323 Twine(error) + " for opcode at: 0x" +
3324 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003325 moveToEnd();
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +00003326 return;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003327 }
Nick Kledzikac431442014-09-12 21:34:15 +00003328 DEBUG_WITH_TYPE(
3329 "mach-o-rebase",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003330 dbgs() << "REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_ULEB: "
3331 << format("SegmentOffset=0x%06X", SegmentOffset)
3332 << ", AdvanceAmount=" << AdvanceAmount
3333 << ", RemainingLoopCount=" << RemainingLoopCount
3334 << "\n");
Nick Kledzikac431442014-09-12 21:34:15 +00003335 return;
3336 default:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003337 *E = malformedError("bad rebase info (bad opcode value 0x" +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003338 Twine::utohexstr(Opcode) + " for opcode at: 0x" +
3339 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003340 moveToEnd();
3341 return;
Nick Kledzikac431442014-09-12 21:34:15 +00003342 }
3343 }
3344}
3345
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003346uint64_t MachORebaseEntry::readULEB128(const char **error) {
Nick Kledzikac431442014-09-12 21:34:15 +00003347 unsigned Count;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003348 uint64_t Result = decodeULEB128(Ptr, &Count, Opcodes.end(), error);
Nick Kledzikac431442014-09-12 21:34:15 +00003349 Ptr += Count;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003350 if (Ptr > Opcodes.end())
Nick Kledzikac431442014-09-12 21:34:15 +00003351 Ptr = Opcodes.end();
Nick Kledzikac431442014-09-12 21:34:15 +00003352 return Result;
3353}
3354
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003355int32_t MachORebaseEntry::segmentIndex() const { return SegmentIndex; }
Nick Kledzikac431442014-09-12 21:34:15 +00003356
3357uint64_t MachORebaseEntry::segmentOffset() const { return SegmentOffset; }
3358
3359StringRef MachORebaseEntry::typeName() const {
3360 switch (RebaseType) {
3361 case MachO::REBASE_TYPE_POINTER:
3362 return "pointer";
3363 case MachO::REBASE_TYPE_TEXT_ABSOLUTE32:
3364 return "text abs32";
3365 case MachO::REBASE_TYPE_TEXT_PCREL32:
3366 return "text rel32";
3367 }
3368 return "unknown";
3369}
3370
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003371// For use with the SegIndex of a checked Mach-O Rebase entry
3372// to get the segment name.
3373StringRef MachORebaseEntry::segmentName() const {
3374 return O->BindRebaseSegmentName(SegmentIndex);
3375}
3376
3377// For use with a SegIndex,SegOffset pair from a checked Mach-O Rebase entry
3378// to get the section name.
3379StringRef MachORebaseEntry::sectionName() const {
3380 return O->BindRebaseSectionName(SegmentIndex, SegmentOffset);
3381}
3382
3383// For use with a SegIndex,SegOffset pair from a checked Mach-O Rebase entry
3384// to get the address.
3385uint64_t MachORebaseEntry::address() const {
3386 return O->BindRebaseAddress(SegmentIndex, SegmentOffset);
3387}
3388
Nick Kledzikac431442014-09-12 21:34:15 +00003389bool MachORebaseEntry::operator==(const MachORebaseEntry &Other) const {
Saleem Abdulrasool1d84d9a2017-01-08 19:14:15 +00003390#ifdef EXPENSIVE_CHECKS
Nick Kledzikac431442014-09-12 21:34:15 +00003391 assert(Opcodes == Other.Opcodes && "compare iterators of different files");
Saleem Abdulrasool1d84d9a2017-01-08 19:14:15 +00003392#else
3393 assert(Opcodes.data() == Other.Opcodes.data() && "compare iterators of different files");
3394#endif
Nick Kledzikac431442014-09-12 21:34:15 +00003395 return (Ptr == Other.Ptr) &&
3396 (RemainingLoopCount == Other.RemainingLoopCount) &&
3397 (Done == Other.Done);
3398}
3399
3400iterator_range<rebase_iterator>
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003401MachOObjectFile::rebaseTable(Error &Err, MachOObjectFile *O,
3402 ArrayRef<uint8_t> Opcodes, bool is64) {
3403 if (O->BindRebaseSectionTable == nullptr)
3404 O->BindRebaseSectionTable = llvm::make_unique<BindRebaseSegInfo>(O);
3405 MachORebaseEntry Start(&Err, O, Opcodes, is64);
Nick Kledzikac431442014-09-12 21:34:15 +00003406 Start.moveToFirst();
3407
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003408 MachORebaseEntry Finish(&Err, O, Opcodes, is64);
Nick Kledzikac431442014-09-12 21:34:15 +00003409 Finish.moveToEnd();
3410
Craig Topper15576e12015-12-06 05:08:07 +00003411 return make_range(rebase_iterator(Start), rebase_iterator(Finish));
Nick Kledzikac431442014-09-12 21:34:15 +00003412}
3413
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003414iterator_range<rebase_iterator> MachOObjectFile::rebaseTable(Error &Err) {
3415 return rebaseTable(Err, this, getDyldInfoRebaseOpcodes(), is64Bit());
Nick Kledzikac431442014-09-12 21:34:15 +00003416}
3417
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00003418MachOBindEntry::MachOBindEntry(Error *E, const MachOObjectFile *O,
3419 ArrayRef<uint8_t> Bytes, bool is64Bit, Kind BK)
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003420 : E(E), O(O), Opcodes(Bytes), Ptr(Bytes.begin()),
3421 PointerSize(is64Bit ? 8 : 4), TableKind(BK) {}
Nick Kledzik56ebef42014-09-16 01:41:51 +00003422
3423void MachOBindEntry::moveToFirst() {
3424 Ptr = Opcodes.begin();
3425 moveNext();
3426}
3427
3428void MachOBindEntry::moveToEnd() {
3429 Ptr = Opcodes.end();
3430 RemainingLoopCount = 0;
3431 Done = true;
3432}
3433
3434void MachOBindEntry::moveNext() {
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00003435 ErrorAsOutParameter ErrAsOutParam(E);
Nick Kledzik56ebef42014-09-16 01:41:51 +00003436 // If in the middle of some loop, move to next binding in loop.
3437 SegmentOffset += AdvanceAmount;
3438 if (RemainingLoopCount) {
3439 --RemainingLoopCount;
3440 return;
3441 }
Juergen Ributzkacad12492017-03-30 19:56:50 +00003442 // BIND_OPCODE_DONE is only used for padding if we are not aligned to
3443 // pointer size. Therefore it is possible to reach the end without ever having
3444 // seen BIND_OPCODE_DONE.
3445 if (Ptr == Opcodes.end()) {
Nick Kledzik56ebef42014-09-16 01:41:51 +00003446 Done = true;
3447 return;
3448 }
3449 bool More = true;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003450 while (More) {
Nick Kledzik56ebef42014-09-16 01:41:51 +00003451 // Parse next opcode and set up next loop.
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00003452 const uint8_t *OpcodeStart = Ptr;
Nick Kledzik56ebef42014-09-16 01:41:51 +00003453 uint8_t Byte = *Ptr++;
3454 uint8_t ImmValue = Byte & MachO::BIND_IMMEDIATE_MASK;
3455 uint8_t Opcode = Byte & MachO::BIND_OPCODE_MASK;
3456 int8_t SignExtended;
3457 const uint8_t *SymStart;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003458 uint32_t Count, Skip;
3459 const char *error = nullptr;
Nick Kledzik56ebef42014-09-16 01:41:51 +00003460 switch (Opcode) {
3461 case MachO::BIND_OPCODE_DONE:
3462 if (TableKind == Kind::Lazy) {
3463 // Lazying bindings have a DONE opcode between entries. Need to ignore
3464 // it to advance to next entry. But need not if this is last entry.
3465 bool NotLastEntry = false;
3466 for (const uint8_t *P = Ptr; P < Opcodes.end(); ++P) {
3467 if (*P) {
3468 NotLastEntry = true;
3469 }
3470 }
3471 if (NotLastEntry)
3472 break;
3473 }
3474 More = false;
Nick Kledzik56ebef42014-09-16 01:41:51 +00003475 moveToEnd();
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003476 DEBUG_WITH_TYPE("mach-o-bind", dbgs() << "BIND_OPCODE_DONE\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003477 break;
3478 case MachO::BIND_OPCODE_SET_DYLIB_ORDINAL_IMM:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003479 if (TableKind == Kind::Weak) {
3480 *E = malformedError("BIND_OPCODE_SET_DYLIB_ORDINAL_IMM not allowed in "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003481 "weak bind table for opcode at: 0x" +
3482 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003483 moveToEnd();
3484 return;
3485 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003486 Ordinal = ImmValue;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003487 LibraryOrdinalSet = true;
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00003488 if (ImmValue > O->getLibraryCount()) {
3489 *E = malformedError("for BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB bad "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003490 "library ordinal: " +
3491 Twine((int)ImmValue) + " (max " +
3492 Twine((int)O->getLibraryCount()) +
3493 ") for opcode at: 0x" +
3494 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00003495 moveToEnd();
3496 return;
3497 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003498 DEBUG_WITH_TYPE(
3499 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003500 dbgs() << "BIND_OPCODE_SET_DYLIB_ORDINAL_IMM: "
3501 << "Ordinal=" << Ordinal << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003502 break;
3503 case MachO::BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003504 if (TableKind == Kind::Weak) {
3505 *E = malformedError("BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB not allowed in "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003506 "weak bind table for opcode at: 0x" +
3507 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003508 moveToEnd();
3509 return;
3510 }
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003511 Ordinal = readULEB128(&error);
3512 LibraryOrdinalSet = true;
3513 if (error) {
3514 *E = malformedError("for BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003515 Twine(error) + " for opcode at: 0x" +
3516 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003517 moveToEnd();
3518 return;
3519 }
3520 if (Ordinal > (int)O->getLibraryCount()) {
3521 *E = malformedError("for BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB bad "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003522 "library ordinal: " +
3523 Twine((int)Ordinal) + " (max " +
3524 Twine((int)O->getLibraryCount()) +
3525 ") for opcode at: 0x" +
3526 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003527 moveToEnd();
3528 return;
3529 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003530 DEBUG_WITH_TYPE(
3531 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003532 dbgs() << "BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB: "
3533 << "Ordinal=" << Ordinal << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003534 break;
3535 case MachO::BIND_OPCODE_SET_DYLIB_SPECIAL_IMM:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003536 if (TableKind == Kind::Weak) {
3537 *E = malformedError("BIND_OPCODE_SET_DYLIB_SPECIAL_IMM not allowed in "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003538 "weak bind table for opcode at: 0x" +
3539 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003540 moveToEnd();
3541 return;
3542 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003543 if (ImmValue) {
3544 SignExtended = MachO::BIND_OPCODE_MASK | ImmValue;
3545 Ordinal = SignExtended;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003546 if (Ordinal < MachO::BIND_SPECIAL_DYLIB_FLAT_LOOKUP) {
3547 *E = malformedError("for BIND_OPCODE_SET_DYLIB_SPECIAL_IMM unknown "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003548 "special ordinal: " +
3549 Twine((int)Ordinal) + " for opcode at: 0x" +
3550 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003551 moveToEnd();
3552 return;
3553 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003554 } else
3555 Ordinal = 0;
Steven Wu97e2cf82017-05-31 22:17:43 +00003556 LibraryOrdinalSet = true;
Nick Kledzik56ebef42014-09-16 01:41:51 +00003557 DEBUG_WITH_TYPE(
3558 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003559 dbgs() << "BIND_OPCODE_SET_DYLIB_SPECIAL_IMM: "
3560 << "Ordinal=" << Ordinal << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003561 break;
3562 case MachO::BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM:
3563 Flags = ImmValue;
3564 SymStart = Ptr;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003565 while (*Ptr && (Ptr < Opcodes.end())) {
Nick Kledzik56ebef42014-09-16 01:41:51 +00003566 ++Ptr;
3567 }
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003568 if (Ptr == Opcodes.end()) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003569 *E = malformedError(
3570 "for BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM "
3571 "symbol name extends past opcodes for opcode at: 0x" +
3572 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
3573 moveToEnd();
3574 return;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003575 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003576 SymbolName = StringRef(reinterpret_cast<const char*>(SymStart),
3577 Ptr-SymStart);
Nick Kledzika6375362014-09-17 01:51:43 +00003578 ++Ptr;
Nick Kledzik56ebef42014-09-16 01:41:51 +00003579 DEBUG_WITH_TYPE(
3580 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003581 dbgs() << "BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM: "
3582 << "SymbolName=" << SymbolName << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003583 if (TableKind == Kind::Weak) {
3584 if (ImmValue & MachO::BIND_SYMBOL_FLAGS_NON_WEAK_DEFINITION)
3585 return;
3586 }
3587 break;
3588 case MachO::BIND_OPCODE_SET_TYPE_IMM:
3589 BindType = ImmValue;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003590 if (ImmValue > MachO::BIND_TYPE_TEXT_PCREL32) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003591 *E = malformedError("for BIND_OPCODE_SET_TYPE_IMM bad bind type: " +
3592 Twine((int)ImmValue) + " for opcode at: 0x" +
3593 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
3594 moveToEnd();
3595 return;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003596 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003597 DEBUG_WITH_TYPE(
3598 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003599 dbgs() << "BIND_OPCODE_SET_TYPE_IMM: "
3600 << "BindType=" << (int)BindType << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003601 break;
3602 case MachO::BIND_OPCODE_SET_ADDEND_SLEB:
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003603 Addend = readSLEB128(&error);
3604 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003605 *E = malformedError("for BIND_OPCODE_SET_ADDEND_SLEB " + Twine(error) +
3606 " for opcode at: 0x" +
3607 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003608 moveToEnd();
3609 return;
3610 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003611 DEBUG_WITH_TYPE(
3612 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003613 dbgs() << "BIND_OPCODE_SET_ADDEND_SLEB: "
3614 << "Addend=" << Addend << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003615 break;
3616 case MachO::BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB:
3617 SegmentIndex = ImmValue;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003618 SegmentOffset = readULEB128(&error);
3619 if (error) {
3620 *E = malformedError("for BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003621 Twine(error) + " for opcode at: 0x" +
3622 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003623 moveToEnd();
3624 return;
3625 }
3626 error = O->BindEntryCheckSegAndOffset(SegmentIndex, SegmentOffset, true);
3627 if (error) {
3628 *E = malformedError("for BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003629 Twine(error) + " for opcode at: 0x" +
3630 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003631 moveToEnd();
3632 return;
3633 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003634 DEBUG_WITH_TYPE(
3635 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003636 dbgs() << "BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB: "
3637 << "SegmentIndex=" << SegmentIndex << ", "
3638 << format("SegmentOffset=0x%06X", SegmentOffset)
3639 << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003640 break;
3641 case MachO::BIND_OPCODE_ADD_ADDR_ULEB:
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003642 SegmentOffset += readULEB128(&error);
3643 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003644 *E = malformedError("for BIND_OPCODE_ADD_ADDR_ULEB " + Twine(error) +
3645 " for opcode at: 0x" +
3646 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003647 moveToEnd();
3648 return;
3649 }
3650 error = O->BindEntryCheckSegAndOffset(SegmentIndex, SegmentOffset, true);
3651 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003652 *E = malformedError("for BIND_OPCODE_ADD_ADDR_ULEB " + Twine(error) +
3653 " for opcode at: 0x" +
3654 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003655 moveToEnd();
3656 return;
3657 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003658 DEBUG_WITH_TYPE("mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003659 dbgs() << "BIND_OPCODE_ADD_ADDR_ULEB: "
3660 << format("SegmentOffset=0x%06X",
3661 SegmentOffset) << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003662 break;
3663 case MachO::BIND_OPCODE_DO_BIND:
3664 AdvanceAmount = PointerSize;
3665 RemainingLoopCount = 0;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003666 error = O->BindEntryCheckSegAndOffset(SegmentIndex, SegmentOffset, true);
3667 if (error) {
3668 *E = malformedError("for BIND_OPCODE_DO_BIND " + Twine(error) +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003669 " for opcode at: 0x" +
3670 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003671 moveToEnd();
3672 return;
3673 }
3674 if (SymbolName == StringRef()) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003675 *E = malformedError(
3676 "for BIND_OPCODE_DO_BIND missing preceding "
3677 "BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM for opcode at: 0x" +
3678 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003679 moveToEnd();
3680 return;
3681 }
3682 if (!LibraryOrdinalSet && TableKind != Kind::Weak) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003683 *E =
3684 malformedError("for BIND_OPCODE_DO_BIND missing preceding "
3685 "BIND_OPCODE_SET_DYLIB_ORDINAL_* for opcode at: 0x" +
3686 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003687 moveToEnd();
3688 return;
3689 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003690 DEBUG_WITH_TYPE("mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003691 dbgs() << "BIND_OPCODE_DO_BIND: "
3692 << format("SegmentOffset=0x%06X",
3693 SegmentOffset) << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003694 return;
3695 case MachO::BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003696 if (TableKind == Kind::Lazy) {
3697 *E = malformedError("BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB not allowed in "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003698 "lazy bind table for opcode at: 0x" +
3699 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003700 moveToEnd();
3701 return;
3702 }
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003703 error = O->BindEntryCheckSegAndOffset(SegmentIndex, SegmentOffset, true);
3704 if (error) {
3705 *E = malformedError("for BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003706 Twine(error) + " for opcode at: 0x" +
3707 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003708 moveToEnd();
3709 return;
3710 }
3711 if (SymbolName == StringRef()) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003712 *E = malformedError(
3713 "for BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB missing "
3714 "preceding BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM for opcode "
3715 "at: 0x" +
3716 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003717 moveToEnd();
3718 return;
3719 }
3720 if (!LibraryOrdinalSet && TableKind != Kind::Weak) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003721 *E = malformedError(
3722 "for BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB missing "
3723 "preceding BIND_OPCODE_SET_DYLIB_ORDINAL_* for opcode at: 0x" +
3724 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003725 moveToEnd();
3726 return;
3727 }
3728 AdvanceAmount = readULEB128(&error) + PointerSize;
3729 if (error) {
3730 *E = malformedError("for BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003731 Twine(error) + " for opcode at: 0x" +
3732 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003733 moveToEnd();
3734 return;
3735 }
3736 // Note, this is not really an error until the next bind but make no sense
3737 // for a BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB to not be followed by another
3738 // bind operation.
3739 error = O->BindEntryCheckSegAndOffset(SegmentIndex, SegmentOffset +
3740 AdvanceAmount, false);
3741 if (error) {
3742 *E = malformedError("for BIND_OPCODE_ADD_ADDR_ULEB (after adding "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003743 "ULEB) " +
3744 Twine(error) + " for opcode at: 0x" +
3745 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003746 moveToEnd();
3747 return;
3748 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003749 RemainingLoopCount = 0;
Nick Kledzik56ebef42014-09-16 01:41:51 +00003750 DEBUG_WITH_TYPE(
3751 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003752 dbgs() << "BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB: "
3753 << format("SegmentOffset=0x%06X", SegmentOffset)
3754 << ", AdvanceAmount=" << AdvanceAmount
3755 << ", RemainingLoopCount=" << RemainingLoopCount
3756 << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003757 return;
3758 case MachO::BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003759 if (TableKind == Kind::Lazy) {
3760 *E = malformedError("BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED not "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003761 "allowed in lazy bind table for opcode at: 0x" +
3762 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003763 moveToEnd();
3764 return;
3765 }
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003766 error = O->BindEntryCheckSegAndOffset(SegmentIndex, SegmentOffset, true);
3767 if (error) {
3768 *E = malformedError("for BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED " +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003769 Twine(error) + " for opcode at: 0x" +
3770 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003771 moveToEnd();
3772 return;
3773 }
3774 if (SymbolName == StringRef()) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003775 *E = malformedError(
3776 "for BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED "
3777 "missing preceding BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM for "
3778 "opcode at: 0x" +
3779 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003780 moveToEnd();
3781 return;
3782 }
3783 if (!LibraryOrdinalSet && TableKind != Kind::Weak) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003784 *E = malformedError(
3785 "for BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED "
3786 "missing preceding BIND_OPCODE_SET_DYLIB_ORDINAL_* for opcode "
3787 "at: 0x" +
3788 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003789 moveToEnd();
3790 return;
3791 }
Nick Kledzik3b2aa052014-10-18 01:21:02 +00003792 AdvanceAmount = ImmValue * PointerSize + PointerSize;
Nick Kledzik56ebef42014-09-16 01:41:51 +00003793 RemainingLoopCount = 0;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003794 error = O->BindEntryCheckSegAndOffset(SegmentIndex, SegmentOffset +
3795 AdvanceAmount, false);
3796 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003797 *E =
3798 malformedError("for BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED "
3799 " (after adding immediate times the pointer size) " +
3800 Twine(error) + " for opcode at: 0x" +
3801 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003802 moveToEnd();
3803 return;
3804 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003805 DEBUG_WITH_TYPE("mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003806 dbgs()
Nick Kledzik56ebef42014-09-16 01:41:51 +00003807 << "BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED: "
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003808 << format("SegmentOffset=0x%06X", SegmentOffset) << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003809 return;
3810 case MachO::BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB:
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003811 if (TableKind == Kind::Lazy) {
3812 *E = malformedError("BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB not "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003813 "allowed in lazy bind table for opcode at: 0x" +
3814 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003815 moveToEnd();
3816 return;
3817 }
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003818 Count = readULEB128(&error);
3819 if (Count != 0)
3820 RemainingLoopCount = Count - 1;
3821 else
3822 RemainingLoopCount = 0;
3823 if (error) {
3824 *E = malformedError("for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003825 " (count value) " +
3826 Twine(error) + " for opcode at: 0x" +
3827 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003828 moveToEnd();
3829 return;
3830 }
3831 Skip = readULEB128(&error);
3832 AdvanceAmount = Skip + PointerSize;
3833 if (error) {
3834 *E = malformedError("for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB "
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003835 " (skip value) " +
3836 Twine(error) + " for opcode at: 0x" +
3837 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003838 moveToEnd();
3839 return;
3840 }
3841 error = O->BindEntryCheckSegAndOffset(SegmentIndex, SegmentOffset, true);
3842 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003843 *E =
3844 malformedError("for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB " +
3845 Twine(error) + " for opcode at: 0x" +
3846 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003847 moveToEnd();
3848 return;
3849 }
3850 if (SymbolName == StringRef()) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003851 *E = malformedError(
3852 "for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB "
3853 "missing preceding BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM for "
3854 "opcode at: 0x" +
3855 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003856 moveToEnd();
3857 return;
3858 }
3859 if (!LibraryOrdinalSet && TableKind != Kind::Weak) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003860 *E = malformedError(
3861 "for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB "
3862 "missing preceding BIND_OPCODE_SET_DYLIB_ORDINAL_* for opcode "
3863 "at: 0x" +
3864 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003865 moveToEnd();
3866 return;
3867 }
3868 error = O->BindEntryCheckCountAndSkip(Count, Skip, PointerSize,
3869 SegmentIndex, SegmentOffset);
3870 if (error) {
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003871 *E =
3872 malformedError("for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB " +
3873 Twine(error) + " for opcode at: 0x" +
3874 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003875 moveToEnd();
NAKAMURA Takumia1e97a72017-08-28 06:47:47 +00003876 return;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003877 }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003878 DEBUG_WITH_TYPE(
3879 "mach-o-bind",
Eugene Zelenko9f5094d2017-04-21 22:03:05 +00003880 dbgs() << "BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB: "
3881 << format("SegmentOffset=0x%06X", SegmentOffset)
3882 << ", AdvanceAmount=" << AdvanceAmount
3883 << ", RemainingLoopCount=" << RemainingLoopCount
3884 << "\n");
Nick Kledzik56ebef42014-09-16 01:41:51 +00003885 return;
3886 default:
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003887 *E = malformedError("bad bind info (bad opcode value 0x" +
Benjamin Kramer760e00b2017-08-20 15:13:39 +00003888 Twine::utohexstr(Opcode) + " for opcode at: 0x" +
3889 Twine::utohexstr(OpcodeStart - Opcodes.begin()));
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003890 moveToEnd();
3891 return;
Nick Kledzik56ebef42014-09-16 01:41:51 +00003892 }
3893 }
3894}
3895
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003896uint64_t MachOBindEntry::readULEB128(const char **error) {
Nick Kledzik56ebef42014-09-16 01:41:51 +00003897 unsigned Count;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003898 uint64_t Result = decodeULEB128(Ptr, &Count, Opcodes.end(), error);
Nick Kledzik56ebef42014-09-16 01:41:51 +00003899 Ptr += Count;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003900 if (Ptr > Opcodes.end())
Nick Kledzik56ebef42014-09-16 01:41:51 +00003901 Ptr = Opcodes.end();
Nick Kledzik56ebef42014-09-16 01:41:51 +00003902 return Result;
3903}
3904
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003905int64_t MachOBindEntry::readSLEB128(const char **error) {
Nick Kledzik56ebef42014-09-16 01:41:51 +00003906 unsigned Count;
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003907 int64_t Result = decodeSLEB128(Ptr, &Count, Opcodes.end(), error);
Nick Kledzik56ebef42014-09-16 01:41:51 +00003908 Ptr += Count;
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003909 if (Ptr > Opcodes.end())
Nick Kledzik56ebef42014-09-16 01:41:51 +00003910 Ptr = Opcodes.end();
Nick Kledzik56ebef42014-09-16 01:41:51 +00003911 return Result;
3912}
3913
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003914int32_t MachOBindEntry::segmentIndex() const { return SegmentIndex; }
Nick Kledzik56ebef42014-09-16 01:41:51 +00003915
3916uint64_t MachOBindEntry::segmentOffset() const { return SegmentOffset; }
3917
3918StringRef MachOBindEntry::typeName() const {
3919 switch (BindType) {
3920 case MachO::BIND_TYPE_POINTER:
3921 return "pointer";
3922 case MachO::BIND_TYPE_TEXT_ABSOLUTE32:
3923 return "text abs32";
3924 case MachO::BIND_TYPE_TEXT_PCREL32:
3925 return "text rel32";
3926 }
3927 return "unknown";
3928}
3929
3930StringRef MachOBindEntry::symbolName() const { return SymbolName; }
3931
3932int64_t MachOBindEntry::addend() const { return Addend; }
3933
3934uint32_t MachOBindEntry::flags() const { return Flags; }
3935
3936int MachOBindEntry::ordinal() const { return Ordinal; }
3937
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003938// For use with the SegIndex of a checked Mach-O Bind entry
3939// to get the segment name.
3940StringRef MachOBindEntry::segmentName() const {
3941 return O->BindRebaseSegmentName(SegmentIndex);
3942}
3943
3944// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind entry
3945// to get the section name.
3946StringRef MachOBindEntry::sectionName() const {
3947 return O->BindRebaseSectionName(SegmentIndex, SegmentOffset);
3948}
3949
3950// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind entry
3951// to get the address.
3952uint64_t MachOBindEntry::address() const {
3953 return O->BindRebaseAddress(SegmentIndex, SegmentOffset);
3954}
3955
Nick Kledzik56ebef42014-09-16 01:41:51 +00003956bool MachOBindEntry::operator==(const MachOBindEntry &Other) const {
Saleem Abdulrasool1d84d9a2017-01-08 19:14:15 +00003957#ifdef EXPENSIVE_CHECKS
Nick Kledzik56ebef42014-09-16 01:41:51 +00003958 assert(Opcodes == Other.Opcodes && "compare iterators of different files");
Saleem Abdulrasool1d84d9a2017-01-08 19:14:15 +00003959#else
3960 assert(Opcodes.data() == Other.Opcodes.data() && "compare iterators of different files");
3961#endif
Nick Kledzik56ebef42014-09-16 01:41:51 +00003962 return (Ptr == Other.Ptr) &&
3963 (RemainingLoopCount == Other.RemainingLoopCount) &&
3964 (Done == Other.Done);
3965}
3966
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003967// Build table of sections so SegIndex/SegOffset pairs can be translated.
3968BindRebaseSegInfo::BindRebaseSegInfo(const object::MachOObjectFile *Obj) {
3969 uint32_t CurSegIndex = Obj->hasPageZeroSegment() ? 1 : 0;
3970 StringRef CurSegName;
3971 uint64_t CurSegAddress;
3972 for (const SectionRef &Section : Obj->sections()) {
3973 SectionInfo Info;
3974 Section.getName(Info.SectionName);
3975 Info.Address = Section.getAddress();
3976 Info.Size = Section.getSize();
3977 Info.SegmentName =
3978 Obj->getSectionFinalSegmentName(Section.getRawDataRefImpl());
3979 if (!Info.SegmentName.equals(CurSegName)) {
3980 ++CurSegIndex;
3981 CurSegName = Info.SegmentName;
3982 CurSegAddress = Info.Address;
3983 }
3984 Info.SegmentIndex = CurSegIndex - 1;
3985 Info.OffsetInSegment = Info.Address - CurSegAddress;
3986 Info.SegmentStartAddress = CurSegAddress;
3987 Sections.push_back(Info);
3988 }
3989 MaxSegIndex = CurSegIndex;
3990}
3991
3992// For use with a SegIndex,SegOffset pair in MachOBindEntry::moveNext() to
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003993// validate a MachOBindEntry or MachORebaseEntry.
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003994const char * BindRebaseSegInfo::checkSegAndOffset(int32_t SegIndex,
3995 uint64_t SegOffset,
3996 bool endInvalid) {
3997 if (SegIndex == -1)
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00003998 return "missing preceding *_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB";
Kevin Enderbya8d256c2017-03-20 19:46:55 +00003999 if (SegIndex >= MaxSegIndex)
4000 return "bad segIndex (too large)";
4001 for (const SectionInfo &SI : Sections) {
4002 if (SI.SegmentIndex != SegIndex)
4003 continue;
4004 if (SI.OffsetInSegment > SegOffset)
4005 continue;
4006 if (SegOffset > (SI.OffsetInSegment + SI.Size))
4007 continue;
4008 if (endInvalid && SegOffset >= (SI.OffsetInSegment + SI.Size))
4009 continue;
4010 return nullptr;
4011 }
4012 return "bad segOffset, too large";
4013}
4014
4015// For use in MachOBindEntry::moveNext() to validate a MachOBindEntry for
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00004016// the BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB opcode and for use in
4017// MachORebaseEntry::moveNext() to validate a MachORebaseEntry for
4018// REBASE_OPCODE_DO_*_TIMES* opcodes. The SegIndex and SegOffset must have
4019// been already checked.
Kevin Enderbya8d256c2017-03-20 19:46:55 +00004020const char * BindRebaseSegInfo::checkCountAndSkip(uint32_t Count, uint32_t Skip,
4021 uint8_t PointerSize,
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00004022 int32_t SegIndex,
4023 uint64_t SegOffset) {
Kevin Enderbya8d256c2017-03-20 19:46:55 +00004024 const SectionInfo &SI = findSection(SegIndex, SegOffset);
4025 uint64_t addr = SI.SegmentStartAddress + SegOffset;
4026 if (addr >= SI.Address + SI.Size)
4027 return "bad segOffset, too large";
4028 uint64_t i = 0;
4029 if (Count > 1)
4030 i = (Skip + PointerSize) * (Count - 1);
Kevin Enderby6c1d2b42017-03-27 20:09:23 +00004031 else if (Count == 1)
4032 i = Skip + PointerSize;
4033 if (addr + i >= SI.Address + SI.Size) {
4034 // For rebase opcodes they can step from one section to another.
4035 uint64_t TrailingSegOffset = (addr + i) - SI.SegmentStartAddress;
4036 const char *error = checkSegAndOffset(SegIndex, TrailingSegOffset, false);
4037 if (error)
4038 return "bad count and skip, too large";
4039 }
Kevin Enderbya8d256c2017-03-20 19:46:55 +00004040 return nullptr;
4041}
4042
4043// For use with the SegIndex of a checked Mach-O Bind or Rebase entry
4044// to get the segment name.
4045StringRef BindRebaseSegInfo::segmentName(int32_t SegIndex) {
4046 for (const SectionInfo &SI : Sections) {
4047 if (SI.SegmentIndex == SegIndex)
4048 return SI.SegmentName;
4049 }
4050 llvm_unreachable("invalid SegIndex");
4051}
4052
4053// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind or Rebase
4054// to get the SectionInfo.
4055const BindRebaseSegInfo::SectionInfo &BindRebaseSegInfo::findSection(
4056 int32_t SegIndex, uint64_t SegOffset) {
4057 for (const SectionInfo &SI : Sections) {
4058 if (SI.SegmentIndex != SegIndex)
4059 continue;
4060 if (SI.OffsetInSegment > SegOffset)
4061 continue;
4062 if (SegOffset >= (SI.OffsetInSegment + SI.Size))
4063 continue;
4064 return SI;
4065 }
4066 llvm_unreachable("SegIndex and SegOffset not in any section");
4067}
4068
4069// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind or Rebase
4070// entry to get the section name.
4071StringRef BindRebaseSegInfo::sectionName(int32_t SegIndex,
4072 uint64_t SegOffset) {
4073 return findSection(SegIndex, SegOffset).SectionName;
4074}
4075
4076// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind or Rebase
4077// entry to get the address.
4078uint64_t BindRebaseSegInfo::address(uint32_t SegIndex, uint64_t OffsetInSeg) {
4079 const SectionInfo &SI = findSection(SegIndex, OffsetInSeg);
4080 return SI.SegmentStartAddress + OffsetInSeg;
4081}
4082
Nick Kledzik56ebef42014-09-16 01:41:51 +00004083iterator_range<bind_iterator>
Kevin Enderbya8d256c2017-03-20 19:46:55 +00004084MachOObjectFile::bindTable(Error &Err, MachOObjectFile *O,
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00004085 ArrayRef<uint8_t> Opcodes, bool is64,
Nick Kledzik56ebef42014-09-16 01:41:51 +00004086 MachOBindEntry::Kind BKind) {
Kevin Enderbya8d256c2017-03-20 19:46:55 +00004087 if (O->BindRebaseSectionTable == nullptr)
4088 O->BindRebaseSectionTable = llvm::make_unique<BindRebaseSegInfo>(O);
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00004089 MachOBindEntry Start(&Err, O, Opcodes, is64, BKind);
Nick Kledzik56ebef42014-09-16 01:41:51 +00004090 Start.moveToFirst();
4091
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00004092 MachOBindEntry Finish(&Err, O, Opcodes, is64, BKind);
Nick Kledzik56ebef42014-09-16 01:41:51 +00004093 Finish.moveToEnd();
4094
Craig Topper15576e12015-12-06 05:08:07 +00004095 return make_range(bind_iterator(Start), bind_iterator(Finish));
Nick Kledzik56ebef42014-09-16 01:41:51 +00004096}
4097
Kevin Enderbya8d256c2017-03-20 19:46:55 +00004098iterator_range<bind_iterator> MachOObjectFile::bindTable(Error &Err) {
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00004099 return bindTable(Err, this, getDyldInfoBindOpcodes(), is64Bit(),
Nick Kledzik56ebef42014-09-16 01:41:51 +00004100 MachOBindEntry::Kind::Regular);
4101}
4102
Kevin Enderbya8d256c2017-03-20 19:46:55 +00004103iterator_range<bind_iterator> MachOObjectFile::lazyBindTable(Error &Err) {
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00004104 return bindTable(Err, this, getDyldInfoLazyBindOpcodes(), is64Bit(),
Nick Kledzik56ebef42014-09-16 01:41:51 +00004105 MachOBindEntry::Kind::Lazy);
4106}
4107
Kevin Enderbya8d256c2017-03-20 19:46:55 +00004108iterator_range<bind_iterator> MachOObjectFile::weakBindTable(Error &Err) {
Kevin Enderbyfeb63b92017-02-28 21:47:07 +00004109 return bindTable(Err, this, getDyldInfoWeakBindOpcodes(), is64Bit(),
Nick Kledzik56ebef42014-09-16 01:41:51 +00004110 MachOBindEntry::Kind::Weak);
4111}
4112
Alexey Samsonovd319c4f2015-06-03 22:19:36 +00004113MachOObjectFile::load_command_iterator
4114MachOObjectFile::begin_load_commands() const {
4115 return LoadCommands.begin();
4116}
4117
4118MachOObjectFile::load_command_iterator
4119MachOObjectFile::end_load_commands() const {
4120 return LoadCommands.end();
4121}
4122
4123iterator_range<MachOObjectFile::load_command_iterator>
4124MachOObjectFile::load_commands() const {
Craig Topper15576e12015-12-06 05:08:07 +00004125 return make_range(begin_load_commands(), end_load_commands());
Alexey Samsonovd319c4f2015-06-03 22:19:36 +00004126}
4127
Rafael Espindola56f976f2013-04-18 18:08:55 +00004128StringRef
4129MachOObjectFile::getSectionFinalSegmentName(DataRefImpl Sec) const {
4130 ArrayRef<char> Raw = getSectionRawFinalSegmentName(Sec);
4131 return parseSegmentOrSectionName(Raw.data());
4132}
4133
4134ArrayRef<char>
4135MachOObjectFile::getSectionRawName(DataRefImpl Sec) const {
Rafael Espindola0d85d102015-05-22 14:59:27 +00004136 assert(Sec.d.a < Sections.size() && "Should have detected this earlier");
Charles Davis8bdfafd2013-09-01 04:28:48 +00004137 const section_base *Base =
4138 reinterpret_cast<const section_base *>(Sections[Sec.d.a]);
Craig Toppere1d12942014-08-27 05:25:25 +00004139 return makeArrayRef(Base->sectname);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004140}
4141
4142ArrayRef<char>
4143MachOObjectFile::getSectionRawFinalSegmentName(DataRefImpl Sec) const {
Rafael Espindola0d85d102015-05-22 14:59:27 +00004144 assert(Sec.d.a < Sections.size() && "Should have detected this earlier");
Charles Davis8bdfafd2013-09-01 04:28:48 +00004145 const section_base *Base =
4146 reinterpret_cast<const section_base *>(Sections[Sec.d.a]);
Craig Toppere1d12942014-08-27 05:25:25 +00004147 return makeArrayRef(Base->segname);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004148}
4149
4150bool
Charles Davis8bdfafd2013-09-01 04:28:48 +00004151MachOObjectFile::isRelocationScattered(const MachO::any_relocation_info &RE)
Rafael Espindola56f976f2013-04-18 18:08:55 +00004152 const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004153 if (getCPUType(*this) == MachO::CPU_TYPE_X86_64)
Rafael Espindola56f976f2013-04-18 18:08:55 +00004154 return false;
Charles Davis8bdfafd2013-09-01 04:28:48 +00004155 return getPlainRelocationAddress(RE) & MachO::R_SCATTERED;
Rafael Espindola56f976f2013-04-18 18:08:55 +00004156}
4157
Eric Christopher1d62c252013-07-22 22:25:07 +00004158unsigned MachOObjectFile::getPlainRelocationSymbolNum(
Charles Davis8bdfafd2013-09-01 04:28:48 +00004159 const MachO::any_relocation_info &RE) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00004160 if (isLittleEndian())
Charles Davis8bdfafd2013-09-01 04:28:48 +00004161 return RE.r_word1 & 0xffffff;
4162 return RE.r_word1 >> 8;
Rafael Espindola56f976f2013-04-18 18:08:55 +00004163}
4164
Eric Christopher1d62c252013-07-22 22:25:07 +00004165bool MachOObjectFile::getPlainRelocationExternal(
Charles Davis8bdfafd2013-09-01 04:28:48 +00004166 const MachO::any_relocation_info &RE) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00004167 if (isLittleEndian())
Charles Davis8bdfafd2013-09-01 04:28:48 +00004168 return (RE.r_word1 >> 27) & 1;
4169 return (RE.r_word1 >> 4) & 1;
Rafael Espindola56f976f2013-04-18 18:08:55 +00004170}
4171
Eric Christopher1d62c252013-07-22 22:25:07 +00004172bool MachOObjectFile::getScatteredRelocationScattered(
Charles Davis8bdfafd2013-09-01 04:28:48 +00004173 const MachO::any_relocation_info &RE) const {
4174 return RE.r_word0 >> 31;
Rafael Espindola56f976f2013-04-18 18:08:55 +00004175}
4176
Eric Christopher1d62c252013-07-22 22:25:07 +00004177uint32_t MachOObjectFile::getScatteredRelocationValue(
Charles Davis8bdfafd2013-09-01 04:28:48 +00004178 const MachO::any_relocation_info &RE) const {
4179 return RE.r_word1;
Rafael Espindola56f976f2013-04-18 18:08:55 +00004180}
4181
Kevin Enderby9907d0a2014-11-04 00:43:16 +00004182uint32_t MachOObjectFile::getScatteredRelocationType(
4183 const MachO::any_relocation_info &RE) const {
4184 return (RE.r_word0 >> 24) & 0xf;
4185}
4186
Eric Christopher1d62c252013-07-22 22:25:07 +00004187unsigned MachOObjectFile::getAnyRelocationAddress(
Charles Davis8bdfafd2013-09-01 04:28:48 +00004188 const MachO::any_relocation_info &RE) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00004189 if (isRelocationScattered(RE))
4190 return getScatteredRelocationAddress(RE);
4191 return getPlainRelocationAddress(RE);
4192}
4193
Charles Davis8bdfafd2013-09-01 04:28:48 +00004194unsigned MachOObjectFile::getAnyRelocationPCRel(
4195 const MachO::any_relocation_info &RE) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00004196 if (isRelocationScattered(RE))
Lang Hames697e7cd2016-12-04 01:56:10 +00004197 return getScatteredRelocationPCRel(RE);
4198 return getPlainRelocationPCRel(*this, RE);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004199}
4200
Eric Christopher1d62c252013-07-22 22:25:07 +00004201unsigned MachOObjectFile::getAnyRelocationLength(
Charles Davis8bdfafd2013-09-01 04:28:48 +00004202 const MachO::any_relocation_info &RE) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00004203 if (isRelocationScattered(RE))
4204 return getScatteredRelocationLength(RE);
Lang Hames697e7cd2016-12-04 01:56:10 +00004205 return getPlainRelocationLength(*this, RE);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004206}
4207
4208unsigned
Charles Davis8bdfafd2013-09-01 04:28:48 +00004209MachOObjectFile::getAnyRelocationType(
4210 const MachO::any_relocation_info &RE) const {
Rafael Espindola56f976f2013-04-18 18:08:55 +00004211 if (isRelocationScattered(RE))
4212 return getScatteredRelocationType(RE);
Lang Hames697e7cd2016-12-04 01:56:10 +00004213 return getPlainRelocationType(*this, RE);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004214}
4215
Rafael Espindola52501032013-04-30 15:40:54 +00004216SectionRef
Keno Fischerc780e8e2015-05-21 21:24:32 +00004217MachOObjectFile::getAnyRelocationSection(
Charles Davis8bdfafd2013-09-01 04:28:48 +00004218 const MachO::any_relocation_info &RE) const {
Rafael Espindola52501032013-04-30 15:40:54 +00004219 if (isRelocationScattered(RE) || getPlainRelocationExternal(RE))
Rafael Espindolab5155a52014-02-10 20:24:04 +00004220 return *section_end();
Rafael Espindola9ac06a02015-06-18 22:38:20 +00004221 unsigned SecNum = getPlainRelocationSymbolNum(RE);
4222 if (SecNum == MachO::R_ABS || SecNum > Sections.size())
4223 return *section_end();
Rafael Espindola52501032013-04-30 15:40:54 +00004224 DataRefImpl DRI;
Rafael Espindola9ac06a02015-06-18 22:38:20 +00004225 DRI.d.a = SecNum - 1;
Rafael Espindola52501032013-04-30 15:40:54 +00004226 return SectionRef(DRI, this);
4227}
4228
Charles Davis8bdfafd2013-09-01 04:28:48 +00004229MachO::section MachOObjectFile::getSection(DataRefImpl DRI) const {
Rafael Espindola62a07cb2015-05-22 15:43:00 +00004230 assert(DRI.d.a < Sections.size() && "Should have detected this earlier");
Lang Hames697e7cd2016-12-04 01:56:10 +00004231 return getStruct<MachO::section>(*this, Sections[DRI.d.a]);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004232}
4233
Charles Davis8bdfafd2013-09-01 04:28:48 +00004234MachO::section_64 MachOObjectFile::getSection64(DataRefImpl DRI) const {
Rafael Espindola62a07cb2015-05-22 15:43:00 +00004235 assert(DRI.d.a < Sections.size() && "Should have detected this earlier");
Lang Hames697e7cd2016-12-04 01:56:10 +00004236 return getStruct<MachO::section_64>(*this, Sections[DRI.d.a]);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004237}
4238
Charles Davis8bdfafd2013-09-01 04:28:48 +00004239MachO::section MachOObjectFile::getSection(const LoadCommandInfo &L,
Rafael Espindola6e040c02013-04-26 20:07:33 +00004240 unsigned Index) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004241 const char *Sec = getSectionPtr(*this, L, Index);
4242 return getStruct<MachO::section>(*this, Sec);
Rafael Espindola6e040c02013-04-26 20:07:33 +00004243}
4244
Charles Davis8bdfafd2013-09-01 04:28:48 +00004245MachO::section_64 MachOObjectFile::getSection64(const LoadCommandInfo &L,
4246 unsigned Index) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004247 const char *Sec = getSectionPtr(*this, L, Index);
4248 return getStruct<MachO::section_64>(*this, Sec);
Rafael Espindola6e040c02013-04-26 20:07:33 +00004249}
4250
Charles Davis8bdfafd2013-09-01 04:28:48 +00004251MachO::nlist
Rafael Espindola56f976f2013-04-18 18:08:55 +00004252MachOObjectFile::getSymbolTableEntry(DataRefImpl DRI) const {
Rafael Espindola75c30362013-04-24 19:47:55 +00004253 const char *P = reinterpret_cast<const char *>(DRI.p);
Lang Hames697e7cd2016-12-04 01:56:10 +00004254 return getStruct<MachO::nlist>(*this, P);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004255}
4256
Charles Davis8bdfafd2013-09-01 04:28:48 +00004257MachO::nlist_64
Rafael Espindola56f976f2013-04-18 18:08:55 +00004258MachOObjectFile::getSymbol64TableEntry(DataRefImpl DRI) const {
Rafael Espindola75c30362013-04-24 19:47:55 +00004259 const char *P = reinterpret_cast<const char *>(DRI.p);
Lang Hames697e7cd2016-12-04 01:56:10 +00004260 return getStruct<MachO::nlist_64>(*this, P);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004261}
4262
Charles Davis8bdfafd2013-09-01 04:28:48 +00004263MachO::linkedit_data_command
4264MachOObjectFile::getLinkeditDataLoadCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004265 return getStruct<MachO::linkedit_data_command>(*this, L.Ptr);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004266}
4267
Charles Davis8bdfafd2013-09-01 04:28:48 +00004268MachO::segment_command
Rafael Espindola6e040c02013-04-26 20:07:33 +00004269MachOObjectFile::getSegmentLoadCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004270 return getStruct<MachO::segment_command>(*this, L.Ptr);
Rafael Espindola6e040c02013-04-26 20:07:33 +00004271}
4272
Charles Davis8bdfafd2013-09-01 04:28:48 +00004273MachO::segment_command_64
Rafael Espindola6e040c02013-04-26 20:07:33 +00004274MachOObjectFile::getSegment64LoadCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004275 return getStruct<MachO::segment_command_64>(*this, L.Ptr);
Rafael Espindola6e040c02013-04-26 20:07:33 +00004276}
4277
Kevin Enderbyd0b6b7f2014-12-18 00:53:40 +00004278MachO::linker_option_command
4279MachOObjectFile::getLinkerOptionLoadCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004280 return getStruct<MachO::linker_option_command>(*this, L.Ptr);
Rafael Espindola6e040c02013-04-26 20:07:33 +00004281}
4282
Jim Grosbach448334a2014-03-18 22:09:05 +00004283MachO::version_min_command
4284MachOObjectFile::getVersionMinLoadCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004285 return getStruct<MachO::version_min_command>(*this, L.Ptr);
Jim Grosbach448334a2014-03-18 22:09:05 +00004286}
4287
Kevin Enderbya4579c42017-01-19 17:36:31 +00004288MachO::note_command
4289MachOObjectFile::getNoteLoadCommand(const LoadCommandInfo &L) const {
4290 return getStruct<MachO::note_command>(*this, L.Ptr);
4291}
4292
Steven Wu5b54a422017-01-23 20:07:55 +00004293MachO::build_version_command
4294MachOObjectFile::getBuildVersionLoadCommand(const LoadCommandInfo &L) const {
4295 return getStruct<MachO::build_version_command>(*this, L.Ptr);
4296}
4297
4298MachO::build_tool_version
4299MachOObjectFile::getBuildToolVersion(unsigned index) const {
4300 return getStruct<MachO::build_tool_version>(*this, BuildTools[index]);
4301}
4302
Tim Northover8f9590b2014-06-30 14:40:57 +00004303MachO::dylib_command
4304MachOObjectFile::getDylibIDLoadCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004305 return getStruct<MachO::dylib_command>(*this, L.Ptr);
Tim Northover8f9590b2014-06-30 14:40:57 +00004306}
4307
Kevin Enderby8ae63c12014-09-04 16:54:47 +00004308MachO::dyld_info_command
4309MachOObjectFile::getDyldInfoLoadCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004310 return getStruct<MachO::dyld_info_command>(*this, L.Ptr);
Kevin Enderby8ae63c12014-09-04 16:54:47 +00004311}
4312
4313MachO::dylinker_command
4314MachOObjectFile::getDylinkerCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004315 return getStruct<MachO::dylinker_command>(*this, L.Ptr);
Kevin Enderby8ae63c12014-09-04 16:54:47 +00004316}
4317
4318MachO::uuid_command
4319MachOObjectFile::getUuidCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004320 return getStruct<MachO::uuid_command>(*this, L.Ptr);
Kevin Enderby8ae63c12014-09-04 16:54:47 +00004321}
4322
Jean-Daniel Dupas00cc1f52014-12-04 07:37:02 +00004323MachO::rpath_command
4324MachOObjectFile::getRpathCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004325 return getStruct<MachO::rpath_command>(*this, L.Ptr);
Jean-Daniel Dupas00cc1f52014-12-04 07:37:02 +00004326}
4327
Kevin Enderby8ae63c12014-09-04 16:54:47 +00004328MachO::source_version_command
4329MachOObjectFile::getSourceVersionCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004330 return getStruct<MachO::source_version_command>(*this, L.Ptr);
Kevin Enderby8ae63c12014-09-04 16:54:47 +00004331}
4332
4333MachO::entry_point_command
4334MachOObjectFile::getEntryPointCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004335 return getStruct<MachO::entry_point_command>(*this, L.Ptr);
Kevin Enderby8ae63c12014-09-04 16:54:47 +00004336}
4337
Kevin Enderby0804f4672014-12-16 23:25:52 +00004338MachO::encryption_info_command
4339MachOObjectFile::getEncryptionInfoCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004340 return getStruct<MachO::encryption_info_command>(*this, L.Ptr);
Kevin Enderby0804f4672014-12-16 23:25:52 +00004341}
4342
Kevin Enderby57538292014-12-17 01:01:30 +00004343MachO::encryption_info_command_64
4344MachOObjectFile::getEncryptionInfoCommand64(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004345 return getStruct<MachO::encryption_info_command_64>(*this, L.Ptr);
Kevin Enderby57538292014-12-17 01:01:30 +00004346}
4347
Kevin Enderbyb4b79312014-12-18 19:24:35 +00004348MachO::sub_framework_command
4349MachOObjectFile::getSubFrameworkCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004350 return getStruct<MachO::sub_framework_command>(*this, L.Ptr);
Kevin Enderbyb4b79312014-12-18 19:24:35 +00004351}
Tim Northover8f9590b2014-06-30 14:40:57 +00004352
Kevin Enderbya2bd8d92014-12-18 23:13:26 +00004353MachO::sub_umbrella_command
4354MachOObjectFile::getSubUmbrellaCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004355 return getStruct<MachO::sub_umbrella_command>(*this, L.Ptr);
Kevin Enderbya2bd8d92014-12-18 23:13:26 +00004356}
4357
Kevin Enderby36c8d3a2014-12-19 19:48:16 +00004358MachO::sub_library_command
4359MachOObjectFile::getSubLibraryCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004360 return getStruct<MachO::sub_library_command>(*this, L.Ptr);
Kevin Enderby36c8d3a2014-12-19 19:48:16 +00004361}
4362
Kevin Enderby186eac32014-12-19 21:06:24 +00004363MachO::sub_client_command
4364MachOObjectFile::getSubClientCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004365 return getStruct<MachO::sub_client_command>(*this, L.Ptr);
Kevin Enderby186eac32014-12-19 21:06:24 +00004366}
4367
Kevin Enderby52e4ce42014-12-19 22:25:22 +00004368MachO::routines_command
4369MachOObjectFile::getRoutinesCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004370 return getStruct<MachO::routines_command>(*this, L.Ptr);
Kevin Enderby52e4ce42014-12-19 22:25:22 +00004371}
4372
4373MachO::routines_command_64
4374MachOObjectFile::getRoutinesCommand64(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004375 return getStruct<MachO::routines_command_64>(*this, L.Ptr);
Kevin Enderby52e4ce42014-12-19 22:25:22 +00004376}
4377
Kevin Enderby48ef5342014-12-23 22:56:39 +00004378MachO::thread_command
4379MachOObjectFile::getThreadCommand(const LoadCommandInfo &L) const {
Lang Hames697e7cd2016-12-04 01:56:10 +00004380 return getStruct<MachO::thread_command>(*this, L.Ptr);
Kevin Enderby48ef5342014-12-23 22:56:39 +00004381}
4382
Charles Davis8bdfafd2013-09-01 04:28:48 +00004383MachO::any_relocation_info
Rafael Espindola56f976f2013-04-18 18:08:55 +00004384MachOObjectFile::getRelocation(DataRefImpl Rel) const {
Rafael Espindola128b8112014-04-03 23:51:28 +00004385 uint32_t Offset;
Kevin Enderbyabf10f22017-06-22 17:41:22 +00004386 if (getHeader().filetype == MachO::MH_OBJECT) {
4387 DataRefImpl Sec;
4388 Sec.d.a = Rel.d.a;
4389 if (is64Bit()) {
4390 MachO::section_64 Sect = getSection64(Sec);
4391 Offset = Sect.reloff;
4392 } else {
4393 MachO::section Sect = getSection(Sec);
4394 Offset = Sect.reloff;
4395 }
Rafael Espindola128b8112014-04-03 23:51:28 +00004396 } else {
Kevin Enderbyabf10f22017-06-22 17:41:22 +00004397 MachO::dysymtab_command DysymtabLoadCmd = getDysymtabLoadCommand();
Michael Trenta1703b12017-12-15 17:57:40 +00004398 if (Rel.d.a == 0)
4399 Offset = DysymtabLoadCmd.extreloff; // Offset to the external relocations
4400 else
4401 Offset = DysymtabLoadCmd.locreloff; // Offset to the local relocations
Rafael Espindola128b8112014-04-03 23:51:28 +00004402 }
4403
4404 auto P = reinterpret_cast<const MachO::any_relocation_info *>(
Lang Hames697e7cd2016-12-04 01:56:10 +00004405 getPtr(*this, Offset)) + Rel.d.b;
Rafael Espindola128b8112014-04-03 23:51:28 +00004406 return getStruct<MachO::any_relocation_info>(
Lang Hames697e7cd2016-12-04 01:56:10 +00004407 *this, reinterpret_cast<const char *>(P));
Rafael Espindola56f976f2013-04-18 18:08:55 +00004408}
4409
Charles Davis8bdfafd2013-09-01 04:28:48 +00004410MachO::data_in_code_entry
Kevin Enderby273ae012013-06-06 17:20:50 +00004411MachOObjectFile::getDice(DataRefImpl Rel) const {
4412 const char *P = reinterpret_cast<const char *>(Rel.p);
Lang Hames697e7cd2016-12-04 01:56:10 +00004413 return getStruct<MachO::data_in_code_entry>(*this, P);
Kevin Enderby273ae012013-06-06 17:20:50 +00004414}
4415
Alexey Samsonov13415ed2015-06-04 19:22:03 +00004416const MachO::mach_header &MachOObjectFile::getHeader() const {
Alexey Samsonovfa5edc52015-06-04 22:49:55 +00004417 return Header;
Rafael Espindola56f976f2013-04-18 18:08:55 +00004418}
4419
Alexey Samsonov13415ed2015-06-04 19:22:03 +00004420const MachO::mach_header_64 &MachOObjectFile::getHeader64() const {
4421 assert(is64Bit());
4422 return Header64;
Rafael Espindola6e040c02013-04-26 20:07:33 +00004423}
4424
Charles Davis8bdfafd2013-09-01 04:28:48 +00004425uint32_t MachOObjectFile::getIndirectSymbolTableEntry(
4426 const MachO::dysymtab_command &DLC,
4427 unsigned Index) const {
4428 uint64_t Offset = DLC.indirectsymoff + Index * sizeof(uint32_t);
Lang Hames697e7cd2016-12-04 01:56:10 +00004429 return getStruct<uint32_t>(*this, getPtr(*this, Offset));
Rafael Espindola6e040c02013-04-26 20:07:33 +00004430}
4431
Charles Davis8bdfafd2013-09-01 04:28:48 +00004432MachO::data_in_code_entry
Rafael Espindola6e040c02013-04-26 20:07:33 +00004433MachOObjectFile::getDataInCodeTableEntry(uint32_t DataOffset,
4434 unsigned Index) const {
Charles Davis8bdfafd2013-09-01 04:28:48 +00004435 uint64_t Offset = DataOffset + Index * sizeof(MachO::data_in_code_entry);
Lang Hames697e7cd2016-12-04 01:56:10 +00004436 return getStruct<MachO::data_in_code_entry>(*this, getPtr(*this, Offset));
Rafael Espindola6e040c02013-04-26 20:07:33 +00004437}
4438
Charles Davis8bdfafd2013-09-01 04:28:48 +00004439MachO::symtab_command MachOObjectFile::getSymtabLoadCommand() const {
Kevin Enderby6f326ce2014-10-23 19:37:31 +00004440 if (SymtabLoadCmd)
Lang Hames697e7cd2016-12-04 01:56:10 +00004441 return getStruct<MachO::symtab_command>(*this, SymtabLoadCmd);
Kevin Enderby6f326ce2014-10-23 19:37:31 +00004442
4443 // If there is no SymtabLoadCmd return a load command with zero'ed fields.
4444 MachO::symtab_command Cmd;
4445 Cmd.cmd = MachO::LC_SYMTAB;
4446 Cmd.cmdsize = sizeof(MachO::symtab_command);
4447 Cmd.symoff = 0;
4448 Cmd.nsyms = 0;
4449 Cmd.stroff = 0;
4450 Cmd.strsize = 0;
4451 return Cmd;
Rafael Espindola56f976f2013-04-18 18:08:55 +00004452}
4453
Charles Davis8bdfafd2013-09-01 04:28:48 +00004454MachO::dysymtab_command MachOObjectFile::getDysymtabLoadCommand() const {
Kevin Enderby6f326ce2014-10-23 19:37:31 +00004455 if (DysymtabLoadCmd)
Lang Hames697e7cd2016-12-04 01:56:10 +00004456 return getStruct<MachO::dysymtab_command>(*this, DysymtabLoadCmd);
Kevin Enderby6f326ce2014-10-23 19:37:31 +00004457
4458 // If there is no DysymtabLoadCmd return a load command with zero'ed fields.
4459 MachO::dysymtab_command Cmd;
4460 Cmd.cmd = MachO::LC_DYSYMTAB;
4461 Cmd.cmdsize = sizeof(MachO::dysymtab_command);
4462 Cmd.ilocalsym = 0;
4463 Cmd.nlocalsym = 0;
4464 Cmd.iextdefsym = 0;
4465 Cmd.nextdefsym = 0;
4466 Cmd.iundefsym = 0;
4467 Cmd.nundefsym = 0;
4468 Cmd.tocoff = 0;
4469 Cmd.ntoc = 0;
4470 Cmd.modtaboff = 0;
4471 Cmd.nmodtab = 0;
4472 Cmd.extrefsymoff = 0;
4473 Cmd.nextrefsyms = 0;
4474 Cmd.indirectsymoff = 0;
4475 Cmd.nindirectsyms = 0;
4476 Cmd.extreloff = 0;
4477 Cmd.nextrel = 0;
4478 Cmd.locreloff = 0;
4479 Cmd.nlocrel = 0;
4480 return Cmd;
Rafael Espindola6e040c02013-04-26 20:07:33 +00004481}
4482
Charles Davis8bdfafd2013-09-01 04:28:48 +00004483MachO::linkedit_data_command
Kevin Enderby273ae012013-06-06 17:20:50 +00004484MachOObjectFile::getDataInCodeLoadCommand() const {
4485 if (DataInCodeLoadCmd)
Lang Hames697e7cd2016-12-04 01:56:10 +00004486 return getStruct<MachO::linkedit_data_command>(*this, DataInCodeLoadCmd);
Kevin Enderby273ae012013-06-06 17:20:50 +00004487
4488 // If there is no DataInCodeLoadCmd return a load command with zero'ed fields.
Charles Davis8bdfafd2013-09-01 04:28:48 +00004489 MachO::linkedit_data_command Cmd;
4490 Cmd.cmd = MachO::LC_DATA_IN_CODE;
4491 Cmd.cmdsize = sizeof(MachO::linkedit_data_command);
4492 Cmd.dataoff = 0;
4493 Cmd.datasize = 0;
Kevin Enderby273ae012013-06-06 17:20:50 +00004494 return Cmd;
4495}
4496
Kevin Enderby9a509442015-01-27 21:28:24 +00004497MachO::linkedit_data_command
4498MachOObjectFile::getLinkOptHintsLoadCommand() const {
4499 if (LinkOptHintsLoadCmd)
Lang Hames697e7cd2016-12-04 01:56:10 +00004500 return getStruct<MachO::linkedit_data_command>(*this, LinkOptHintsLoadCmd);
Kevin Enderby9a509442015-01-27 21:28:24 +00004501
4502 // If there is no LinkOptHintsLoadCmd return a load command with zero'ed
4503 // fields.
4504 MachO::linkedit_data_command Cmd;
4505 Cmd.cmd = MachO::LC_LINKER_OPTIMIZATION_HINT;
4506 Cmd.cmdsize = sizeof(MachO::linkedit_data_command);
4507 Cmd.dataoff = 0;
4508 Cmd.datasize = 0;
4509 return Cmd;
4510}
4511
Nick Kledzikd04bc352014-08-30 00:20:14 +00004512ArrayRef<uint8_t> MachOObjectFile::getDyldInfoRebaseOpcodes() const {
NAKAMURA Takumi10c80e72015-09-22 11:19:03 +00004513 if (!DyldInfoLoadCmd)
Craig Topper0013be12015-09-21 05:32:41 +00004514 return None;
Nick Kledzikd04bc352014-08-30 00:20:14 +00004515
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004516 MachO::dyld_info_command DyldInfo =
Lang Hames697e7cd2016-12-04 01:56:10 +00004517 getStruct<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004518 const uint8_t *Ptr =
Lang Hames697e7cd2016-12-04 01:56:10 +00004519 reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.rebase_off));
Craig Topper0013be12015-09-21 05:32:41 +00004520 return makeArrayRef(Ptr, DyldInfo.rebase_size);
Nick Kledzikd04bc352014-08-30 00:20:14 +00004521}
4522
4523ArrayRef<uint8_t> MachOObjectFile::getDyldInfoBindOpcodes() const {
NAKAMURA Takumi10c80e72015-09-22 11:19:03 +00004524 if (!DyldInfoLoadCmd)
Craig Topper0013be12015-09-21 05:32:41 +00004525 return None;
Nick Kledzikd04bc352014-08-30 00:20:14 +00004526
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004527 MachO::dyld_info_command DyldInfo =
Lang Hames697e7cd2016-12-04 01:56:10 +00004528 getStruct<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004529 const uint8_t *Ptr =
Lang Hames697e7cd2016-12-04 01:56:10 +00004530 reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.bind_off));
Craig Topper0013be12015-09-21 05:32:41 +00004531 return makeArrayRef(Ptr, DyldInfo.bind_size);
Nick Kledzikd04bc352014-08-30 00:20:14 +00004532}
4533
4534ArrayRef<uint8_t> MachOObjectFile::getDyldInfoWeakBindOpcodes() const {
NAKAMURA Takumi10c80e72015-09-22 11:19:03 +00004535 if (!DyldInfoLoadCmd)
Craig Topper0013be12015-09-21 05:32:41 +00004536 return None;
Nick Kledzikd04bc352014-08-30 00:20:14 +00004537
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004538 MachO::dyld_info_command DyldInfo =
Lang Hames697e7cd2016-12-04 01:56:10 +00004539 getStruct<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004540 const uint8_t *Ptr =
Lang Hames697e7cd2016-12-04 01:56:10 +00004541 reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.weak_bind_off));
Craig Topper0013be12015-09-21 05:32:41 +00004542 return makeArrayRef(Ptr, DyldInfo.weak_bind_size);
Nick Kledzikd04bc352014-08-30 00:20:14 +00004543}
4544
4545ArrayRef<uint8_t> MachOObjectFile::getDyldInfoLazyBindOpcodes() const {
NAKAMURA Takumi10c80e72015-09-22 11:19:03 +00004546 if (!DyldInfoLoadCmd)
Craig Topper0013be12015-09-21 05:32:41 +00004547 return None;
Nick Kledzikd04bc352014-08-30 00:20:14 +00004548
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004549 MachO::dyld_info_command DyldInfo =
Lang Hames697e7cd2016-12-04 01:56:10 +00004550 getStruct<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004551 const uint8_t *Ptr =
Lang Hames697e7cd2016-12-04 01:56:10 +00004552 reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.lazy_bind_off));
Craig Topper0013be12015-09-21 05:32:41 +00004553 return makeArrayRef(Ptr, DyldInfo.lazy_bind_size);
Nick Kledzikd04bc352014-08-30 00:20:14 +00004554}
4555
4556ArrayRef<uint8_t> MachOObjectFile::getDyldInfoExportsTrie() const {
NAKAMURA Takumi10c80e72015-09-22 11:19:03 +00004557 if (!DyldInfoLoadCmd)
Craig Topper0013be12015-09-21 05:32:41 +00004558 return None;
Nick Kledzikd04bc352014-08-30 00:20:14 +00004559
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004560 MachO::dyld_info_command DyldInfo =
Lang Hames697e7cd2016-12-04 01:56:10 +00004561 getStruct<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
NAKAMURA Takumi70ad98a2015-09-22 11:13:55 +00004562 const uint8_t *Ptr =
Lang Hames697e7cd2016-12-04 01:56:10 +00004563 reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.export_off));
Craig Topper0013be12015-09-21 05:32:41 +00004564 return makeArrayRef(Ptr, DyldInfo.export_size);
Nick Kledzikd04bc352014-08-30 00:20:14 +00004565}
4566
Alexander Potapenko6909b5b2014-10-15 23:35:45 +00004567ArrayRef<uint8_t> MachOObjectFile::getUuid() const {
4568 if (!UuidLoadCmd)
Craig Topper0013be12015-09-21 05:32:41 +00004569 return None;
Benjamin Kramer014601d2014-10-24 15:52:05 +00004570 // Returning a pointer is fine as uuid doesn't need endian swapping.
4571 const char *Ptr = UuidLoadCmd + offsetof(MachO::uuid_command, uuid);
Craig Topper0013be12015-09-21 05:32:41 +00004572 return makeArrayRef(reinterpret_cast<const uint8_t *>(Ptr), 16);
Alexander Potapenko6909b5b2014-10-15 23:35:45 +00004573}
Nick Kledzikd04bc352014-08-30 00:20:14 +00004574
Rafael Espindola6e040c02013-04-26 20:07:33 +00004575StringRef MachOObjectFile::getStringTableData() const {
Charles Davis8bdfafd2013-09-01 04:28:48 +00004576 MachO::symtab_command S = getSymtabLoadCommand();
4577 return getData().substr(S.stroff, S.strsize);
Rafael Espindola6e040c02013-04-26 20:07:33 +00004578}
4579
Rafael Espindola56f976f2013-04-18 18:08:55 +00004580bool MachOObjectFile::is64Bit() const {
4581 return getType() == getMachOType(false, true) ||
Lang Hames84bc8182014-07-15 19:35:22 +00004582 getType() == getMachOType(true, true);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004583}
4584
4585void MachOObjectFile::ReadULEB128s(uint64_t Index,
4586 SmallVectorImpl<uint64_t> &Out) const {
4587 DataExtractor extractor(ObjectFile::getData(), true, 0);
4588
4589 uint32_t offset = Index;
4590 uint64_t data = 0;
4591 while (uint64_t delta = extractor.getULEB128(&offset)) {
4592 data += delta;
4593 Out.push_back(data);
4594 }
4595}
4596
Rafael Espindolac66d7612014-08-17 19:09:37 +00004597bool MachOObjectFile::isRelocatableObject() const {
4598 return getHeader().filetype == MachO::MH_OBJECT;
4599}
4600
Lang Hamesff044b12016-03-25 23:11:52 +00004601Expected<std::unique_ptr<MachOObjectFile>>
Kevin Enderby79d6c632016-10-24 21:15:11 +00004602ObjectFile::createMachOObjectFile(MemoryBufferRef Buffer,
4603 uint32_t UniversalCputype,
4604 uint32_t UniversalIndex) {
Rafael Espindola48af1c22014-08-19 18:44:46 +00004605 StringRef Magic = Buffer.getBuffer().slice(0, 4);
Lang Hames82627642016-03-25 21:59:14 +00004606 if (Magic == "\xFE\xED\xFA\xCE")
Kevin Enderby79d6c632016-10-24 21:15:11 +00004607 return MachOObjectFile::create(Buffer, false, false,
4608 UniversalCputype, UniversalIndex);
David Blaikieb805f732016-03-28 17:45:48 +00004609 if (Magic == "\xCE\xFA\xED\xFE")
Kevin Enderby79d6c632016-10-24 21:15:11 +00004610 return MachOObjectFile::create(Buffer, true, false,
4611 UniversalCputype, UniversalIndex);
David Blaikieb805f732016-03-28 17:45:48 +00004612 if (Magic == "\xFE\xED\xFA\xCF")
Kevin Enderby79d6c632016-10-24 21:15:11 +00004613 return MachOObjectFile::create(Buffer, false, true,
4614 UniversalCputype, UniversalIndex);
David Blaikieb805f732016-03-28 17:45:48 +00004615 if (Magic == "\xCF\xFA\xED\xFE")
Kevin Enderby79d6c632016-10-24 21:15:11 +00004616 return MachOObjectFile::create(Buffer, true, true,
4617 UniversalCputype, UniversalIndex);
Kevin Enderbyd4e075b2016-05-06 20:16:28 +00004618 return make_error<GenericBinaryError>("Unrecognized MachO magic number",
Justin Bogner2a42da92016-05-05 23:59:57 +00004619 object_error::invalid_file_type);
Rafael Espindola56f976f2013-04-18 18:08:55 +00004620}
Wolfgang Pieb77d3e932017-06-06 01:22:34 +00004621
4622StringRef MachOObjectFile::mapDebugSectionName(StringRef Name) const {
4623 return StringSwitch<StringRef>(Name)
4624 .Case("debug_str_offs", "debug_str_offsets")
4625 .Default(Name);
4626}