blob: b17eefd220b8504dacd3fadf8f05f34e60887099 [file] [log] [blame]
Eugene Zelenkod341c932017-04-19 23:02:10 +00001//===- Archive.cpp - ar File Format implementation ------------------------===//
Michael J. Spencerd3b7b122011-09-27 19:36:55 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
// This file implements the Archive, Archive::Child and ArchiveMemberHeader
// classes.
11//
12//===----------------------------------------------------------------------===//
13
Chandler Carruth6bda14b2017-06-06 11:49:48 +000014#include "llvm/Object/Archive.h"
Eugene Zelenkod341c932017-04-19 23:02:10 +000015#include "llvm/ADT/Optional.h"
Rafael Espindola747bc072013-07-09 03:39:35 +000016#include "llvm/ADT/SmallString.h"
Eugene Zelenkod341c932017-04-19 23:02:10 +000017#include "llvm/ADT/StringRef.h"
Rafael Espindola747bc072013-07-09 03:39:35 +000018#include "llvm/ADT/Twine.h"
Eugene Zelenkod341c932017-04-19 23:02:10 +000019#include "llvm/Object/Binary.h"
20#include "llvm/Object/Error.h"
21#include "llvm/Support/Chrono.h"
Michael J. Spencere03ea9c2011-11-02 19:33:12 +000022#include "llvm/Support/Endian.h"
Eugene Zelenkod341c932017-04-19 23:02:10 +000023#include "llvm/Support/Error.h"
24#include "llvm/Support/ErrorOr.h"
25#include "llvm/Support/FileSystem.h"
Michael J. Spencerd3b7b122011-09-27 19:36:55 +000026#include "llvm/Support/MemoryBuffer.h"
Rafael Espindola4b83cb52015-07-14 22:18:43 +000027#include "llvm/Support/Path.h"
Eugene Zelenkod341c932017-04-19 23:02:10 +000028#include "llvm/Support/raw_ostream.h"
29#include <algorithm>
30#include <cassert>
31#include <cstddef>
32#include <cstdint>
33#include <cstring>
34#include <memory>
35#include <string>
36#include <system_error>
Michael J. Spencerd3b7b122011-09-27 19:36:55 +000037
38using namespace llvm;
39using namespace object;
Rui Ueyama3206b792015-03-02 21:19:12 +000040using namespace llvm::support::endian;
Michael J. Spencerd3b7b122011-09-27 19:36:55 +000041
// Signature bytes that open a regular ar archive.
static constexpr const char *Magic = "!<arch>\n";
// Signature bytes that open a thin archive.
static constexpr const char *ThinMagic = "!<thin>\n";
Michael J. Spencerd3b7b122011-09-27 19:36:55 +000044
Eugene Zelenkod341c932017-04-19 23:02:10 +000045void Archive::anchor() {}
David Blaikiea379b1812011-12-20 02:50:00 +000046
Kevin Enderby6524bd82016-07-19 20:47:07 +000047static Error
48malformedError(Twine Msg) {
49 std::string StringMsg = "truncated or malformed archive (" + Msg.str() + ")";
50 return make_error<GenericBinaryError>(std::move(StringMsg),
51 object_error::parse_failed);
52}
53
Kevin Enderby95b08422016-07-25 20:36:36 +000054ArchiveMemberHeader::ArchiveMemberHeader(const Archive *Parent,
55 const char *RawHeaderPtr,
56 uint64_t Size, Error *Err)
57 : Parent(Parent),
58 ArMemHdr(reinterpret_cast<const ArMemHdrType *>(RawHeaderPtr)) {
59 if (RawHeaderPtr == nullptr)
60 return;
61 ErrorAsOutParameter ErrAsOutParam(Err);
62
Kevin Enderby95b08422016-07-25 20:36:36 +000063 if (Size < sizeof(ArMemHdrType)) {
64 if (Err) {
Kevin Enderby31b07f12016-07-29 22:32:02 +000065 std::string Msg("remaining size of archive too small for next archive "
66 "member header ");
Kevin Enderbyf4586032016-07-29 17:44:13 +000067 Expected<StringRef> NameOrErr = getName(Size);
68 if (!NameOrErr) {
69 consumeError(NameOrErr.takeError());
70 uint64_t Offset = RawHeaderPtr - Parent->getData().data();
71 *Err = malformedError(Msg + "at offset " + Twine(Offset));
72 } else
Kevin Enderby31b07f12016-07-29 22:32:02 +000073 *Err = malformedError(Msg + "for " + NameOrErr.get());
Kevin Enderby95b08422016-07-25 20:36:36 +000074 }
75 return;
76 }
77 if (ArMemHdr->Terminator[0] != '`' || ArMemHdr->Terminator[1] != '\n') {
78 if (Err) {
79 std::string Buf;
80 raw_string_ostream OS(Buf);
Eugene Zelenkod341c932017-04-19 23:02:10 +000081 OS.write_escaped(StringRef(ArMemHdr->Terminator,
82 sizeof(ArMemHdr->Terminator)));
Kevin Enderby95b08422016-07-25 20:36:36 +000083 OS.flush();
Kevin Enderby31b07f12016-07-29 22:32:02 +000084 std::string Msg("terminator characters in archive member \"" + Buf +
85 "\" not the correct \"`\\n\" values for the archive "
86 "member header ");
Kevin Enderbyf4586032016-07-29 17:44:13 +000087 Expected<StringRef> NameOrErr = getName(Size);
88 if (!NameOrErr) {
89 consumeError(NameOrErr.takeError());
90 uint64_t Offset = RawHeaderPtr - Parent->getData().data();
91 *Err = malformedError(Msg + "at offset " + Twine(Offset));
92 } else
Kevin Enderby31b07f12016-07-29 22:32:02 +000093 *Err = malformedError(Msg + "for " + NameOrErr.get());
Kevin Enderby95b08422016-07-25 20:36:36 +000094 }
95 return;
96 }
97}
98
Kevin Enderbyf4586032016-07-29 17:44:13 +000099// This gets the raw name from the ArMemHdr->Name field and checks that it is
100// valid for the kind of archive. If it is not valid it returns an Error.
101Expected<StringRef> ArchiveMemberHeader::getRawName() const {
Rafael Espindola747bc072013-07-09 03:39:35 +0000102 char EndCond;
Kevin Enderbyf4586032016-07-29 17:44:13 +0000103 auto Kind = Parent->kind();
104 if (Kind == Archive::K_BSD || Kind == Archive::K_DARWIN64) {
105 if (ArMemHdr->Name[0] == ' ') {
106 uint64_t Offset = reinterpret_cast<const char *>(ArMemHdr) -
107 Parent->getData().data();
108 return malformedError("name contains a leading space for archive member "
109 "header at offset " + Twine(Offset));
110 }
111 EndCond = ' ';
112 }
113 else if (ArMemHdr->Name[0] == '/' || ArMemHdr->Name[0] == '#')
Rafael Espindola747bc072013-07-09 03:39:35 +0000114 EndCond = ' ';
115 else
116 EndCond = '/';
Eugene Zelenkod341c932017-04-19 23:02:10 +0000117 StringRef::size_type end =
118 StringRef(ArMemHdr->Name, sizeof(ArMemHdr->Name)).find(EndCond);
119 if (end == StringRef::npos)
Kevin Enderby95b08422016-07-25 20:36:36 +0000120 end = sizeof(ArMemHdr->Name);
121 assert(end <= sizeof(ArMemHdr->Name) && end > 0);
Rafael Espindola747bc072013-07-09 03:39:35 +0000122 // Don't include the EndCond if there is one.
Eugene Zelenkod341c932017-04-19 23:02:10 +0000123 return StringRef(ArMemHdr->Name, end);
Rafael Espindola747bc072013-07-09 03:39:35 +0000124}
125
Kevin Enderbyf4586032016-07-29 17:44:13 +0000126// This gets the name looking up long names. Size is the size of the archive
127// member including the header, so the size of any name following the header
128// is checked to make sure it does not overflow.
129Expected<StringRef> ArchiveMemberHeader::getName(uint64_t Size) const {
130
131 // This can be called from the ArchiveMemberHeader constructor when the
132 // archive header is truncated to produce an error message with the name.
133 // Make sure the name field is not truncated.
134 if (Size < offsetof(ArMemHdrType, Name) + sizeof(ArMemHdr->Name)) {
135 uint64_t ArchiveOffset = reinterpret_cast<const char *>(ArMemHdr) -
136 Parent->getData().data();
137 return malformedError("archive header truncated before the name field "
138 "for archive member header at offset " +
139 Twine(ArchiveOffset));
140 }
141
142 // The raw name itself can be invalid.
143 Expected<StringRef> NameOrErr = getRawName();
144 if (!NameOrErr)
145 return NameOrErr.takeError();
146 StringRef Name = NameOrErr.get();
147
148 // Check if it's a special name.
149 if (Name[0] == '/') {
150 if (Name.size() == 1) // Linker member.
151 return Name;
152 if (Name.size() == 2 && Name[1] == '/') // String table.
153 return Name;
154 // It's a long name.
155 // Get the string table offset.
156 std::size_t StringOffset;
157 if (Name.substr(1).rtrim(' ').getAsInteger(10, StringOffset)) {
158 std::string Buf;
159 raw_string_ostream OS(Buf);
Kevin Enderby31b07f12016-07-29 22:32:02 +0000160 OS.write_escaped(Name.substr(1).rtrim(' '));
Kevin Enderbyf4586032016-07-29 17:44:13 +0000161 OS.flush();
162 uint64_t ArchiveOffset = reinterpret_cast<const char *>(ArMemHdr) -
163 Parent->getData().data();
164 return malformedError("long name offset characters after the '/' are "
165 "not all decimal numbers: '" + Buf + "' for "
166 "archive member header at offset " +
167 Twine(ArchiveOffset));
168 }
169
170 // Verify it.
171 if (StringOffset >= Parent->getStringTable().size()) {
172 uint64_t ArchiveOffset = reinterpret_cast<const char *>(ArMemHdr) -
173 Parent->getData().data();
174 return malformedError("long name offset " + Twine(StringOffset) + " past "
175 "the end of the string table for archive member "
176 "header at offset " + Twine(ArchiveOffset));
177 }
178 const char *addr = Parent->getStringTable().begin() + StringOffset;
179
180 // GNU long file names end with a "/\n".
181 if (Parent->kind() == Archive::K_GNU ||
Jake Ehrlich1b30d632017-09-20 18:23:01 +0000182 Parent->kind() == Archive::K_GNU64) {
Kevin Enderbyf4586032016-07-29 17:44:13 +0000183 StringRef::size_type End = StringRef(addr).find('\n');
184 return StringRef(addr, End - 1);
185 }
David Blaikiecd842ec2016-08-01 21:50:43 +0000186 return addr;
187 }
188
189 if (Name.startswith("#1/")) {
Kevin Enderbyf4586032016-07-29 17:44:13 +0000190 uint64_t NameLength;
191 if (Name.substr(3).rtrim(' ').getAsInteger(10, NameLength)) {
192 std::string Buf;
193 raw_string_ostream OS(Buf);
Kevin Enderby31b07f12016-07-29 22:32:02 +0000194 OS.write_escaped(Name.substr(3).rtrim(' '));
Kevin Enderbyf4586032016-07-29 17:44:13 +0000195 OS.flush();
196 uint64_t ArchiveOffset = reinterpret_cast<const char *>(ArMemHdr) -
197 Parent->getData().data();
198 return malformedError("long name length characters after the #1/ are "
199 "not all decimal numbers: '" + Buf + "' for "
200 "archive member header at offset " +
201 Twine(ArchiveOffset));
202 }
203 if (getSizeOf() + NameLength > Size) {
204 uint64_t ArchiveOffset = reinterpret_cast<const char *>(ArMemHdr) -
205 Parent->getData().data();
206 return malformedError("long name length: " + Twine(NameLength) +
207 " extends past the end of the member or archive "
208 "for archive member header at offset " +
209 Twine(ArchiveOffset));
210 }
211 return StringRef(reinterpret_cast<const char *>(ArMemHdr) + getSizeOf(),
212 NameLength).rtrim('\0');
Kevin Enderbyf4586032016-07-29 17:44:13 +0000213 }
David Blaikiecd842ec2016-08-01 21:50:43 +0000214
215 // It is not a long name so trim the blanks at the end of the name.
216 if (Name[Name.size() - 1] != '/')
217 return Name.rtrim(' ');
218
Kevin Enderbyf4586032016-07-29 17:44:13 +0000219 // It's a simple name.
David Blaikiecd842ec2016-08-01 21:50:43 +0000220 return Name.drop_back(1);
Kevin Enderbyf4586032016-07-29 17:44:13 +0000221}
222
Kevin Enderby6524bd82016-07-19 20:47:07 +0000223Expected<uint32_t> ArchiveMemberHeader::getSize() const {
Rafael Espindola8e9385e2013-07-09 12:45:11 +0000224 uint32_t Ret;
Eugene Zelenkod341c932017-04-19 23:02:10 +0000225 if (StringRef(ArMemHdr->Size,
226 sizeof(ArMemHdr->Size)).rtrim(" ").getAsInteger(10, Ret)) {
Kevin Enderby6524bd82016-07-19 20:47:07 +0000227 std::string Buf;
228 raw_string_ostream OS(Buf);
Eugene Zelenkod341c932017-04-19 23:02:10 +0000229 OS.write_escaped(StringRef(ArMemHdr->Size,
230 sizeof(ArMemHdr->Size)).rtrim(" "));
Kevin Enderby6524bd82016-07-19 20:47:07 +0000231 OS.flush();
Kevin Enderby95b08422016-07-25 20:36:36 +0000232 uint64_t Offset = reinterpret_cast<const char *>(ArMemHdr) -
233 Parent->getData().data();
Kevin Enderby6524bd82016-07-19 20:47:07 +0000234 return malformedError("characters in size field in archive header are not "
Kevin Enderby95b08422016-07-25 20:36:36 +0000235 "all decimal numbers: '" + Buf + "' for archive "
236 "member header at offset " + Twine(Offset));
Kevin Enderby6524bd82016-07-19 20:47:07 +0000237 }
Rafael Espindola8e9385e2013-07-09 12:45:11 +0000238 return Ret;
Rafael Espindola747bc072013-07-09 03:39:35 +0000239}
240
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000241Expected<sys::fs::perms> ArchiveMemberHeader::getAccessMode() const {
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000242 unsigned Ret;
Kevin Enderby95b08422016-07-25 20:36:36 +0000243 if (StringRef(ArMemHdr->AccessMode,
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000244 sizeof(ArMemHdr->AccessMode)).rtrim(' ').getAsInteger(8, Ret)) {
245 std::string Buf;
246 raw_string_ostream OS(Buf);
Eugene Zelenkod341c932017-04-19 23:02:10 +0000247 OS.write_escaped(StringRef(ArMemHdr->AccessMode,
248 sizeof(ArMemHdr->AccessMode)).rtrim(" "));
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000249 OS.flush();
250 uint64_t Offset = reinterpret_cast<const char *>(ArMemHdr) -
251 Parent->getData().data();
252 return malformedError("characters in AccessMode field in archive header "
253 "are not all decimal numbers: '" + Buf + "' for the "
254 "archive member header at offset " + Twine(Offset));
255 }
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000256 return static_cast<sys::fs::perms>(Ret);
257}
258
Pavel Labathbff47b52016-10-24 13:38:27 +0000259Expected<sys::TimePoint<std::chrono::seconds>>
260ArchiveMemberHeader::getLastModified() const {
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000261 unsigned Seconds;
Kevin Enderby95b08422016-07-25 20:36:36 +0000262 if (StringRef(ArMemHdr->LastModified,
263 sizeof(ArMemHdr->LastModified)).rtrim(' ')
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000264 .getAsInteger(10, Seconds)) {
265 std::string Buf;
266 raw_string_ostream OS(Buf);
Eugene Zelenkod341c932017-04-19 23:02:10 +0000267 OS.write_escaped(StringRef(ArMemHdr->LastModified,
268 sizeof(ArMemHdr->LastModified)).rtrim(" "));
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000269 OS.flush();
270 uint64_t Offset = reinterpret_cast<const char *>(ArMemHdr) -
271 Parent->getData().data();
272 return malformedError("characters in LastModified field in archive header "
273 "are not all decimal numbers: '" + Buf + "' for the "
274 "archive member header at offset " + Twine(Offset));
275 }
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000276
Pavel Labathbff47b52016-10-24 13:38:27 +0000277 return sys::toTimePoint(Seconds);
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000278}
279
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000280Expected<unsigned> ArchiveMemberHeader::getUID() const {
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000281 unsigned Ret;
Kevin Enderby95b08422016-07-25 20:36:36 +0000282 StringRef User = StringRef(ArMemHdr->UID, sizeof(ArMemHdr->UID)).rtrim(' ');
Saleem Abdulrasoolaecbdf72016-07-05 00:23:05 +0000283 if (User.empty())
284 return 0;
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000285 if (User.getAsInteger(10, Ret)) {
286 std::string Buf;
287 raw_string_ostream OS(Buf);
288 OS.write_escaped(User);
289 OS.flush();
290 uint64_t Offset = reinterpret_cast<const char *>(ArMemHdr) -
291 Parent->getData().data();
292 return malformedError("characters in UID field in archive header "
293 "are not all decimal numbers: '" + Buf + "' for the "
294 "archive member header at offset " + Twine(Offset));
295 }
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000296 return Ret;
297}
298
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000299Expected<unsigned> ArchiveMemberHeader::getGID() const {
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000300 unsigned Ret;
Kevin Enderby95b08422016-07-25 20:36:36 +0000301 StringRef Group = StringRef(ArMemHdr->GID, sizeof(ArMemHdr->GID)).rtrim(' ');
Saleem Abdulrasoolaecbdf72016-07-05 00:23:05 +0000302 if (Group.empty())
303 return 0;
Vedant Kumar4031d9f2016-08-03 19:02:50 +0000304 if (Group.getAsInteger(10, Ret)) {
305 std::string Buf;
306 raw_string_ostream OS(Buf);
307 OS.write_escaped(Group);
308 OS.flush();
309 uint64_t Offset = reinterpret_cast<const char *>(ArMemHdr) -
310 Parent->getData().data();
311 return malformedError("characters in GID field in archive header "
312 "are not all decimal numbers: '" + Buf + "' for the "
313 "archive member header at offset " + Twine(Offset));
314 }
Rafael Espindola8115e1d2013-07-09 12:49:24 +0000315 return Ret;
316}
317
Rafael Espindola43358762015-10-31 21:44:42 +0000318Archive::Child::Child(const Archive *Parent, StringRef Data,
319 uint16_t StartOfFile)
Kevin Enderby95b08422016-07-25 20:36:36 +0000320 : Parent(Parent), Header(Parent, Data.data(), Data.size(), nullptr),
321 Data(Data), StartOfFile(StartOfFile) {
322}
Rafael Espindola43358762015-10-31 21:44:42 +0000323
Kevin Enderby6524bd82016-07-19 20:47:07 +0000324Archive::Child::Child(const Archive *Parent, const char *Start, Error *Err)
Lang Hamesa5e873e2016-10-05 21:20:00 +0000325 : Parent(Parent),
326 Header(Parent, Start,
327 Parent
328 ? Parent->getData().size() - (Start - Parent->getData().data())
329 : 0, Err) {
Rafael Espindola0f3de642013-07-09 05:26:25 +0000330 if (!Start)
Rafael Espindola747bc072013-07-09 03:39:35 +0000331 return;
Kevin Enderby2c182702016-08-04 21:54:19 +0000332
333 // If we are pointed to real data, Start is not a nullptr, then there must be
334 // a non-null Err pointer available to report malformed data on. Only in
335 // the case sentinel value is being constructed is Err is permitted to be a
336 // nullptr.
337 assert(Err && "Err can't be nullptr if Start is not a nullptr");
338
Lang Hames5e51a2e2016-07-22 16:11:25 +0000339 ErrorAsOutParameter ErrAsOutParam(Err);
Rafael Espindola0f3de642013-07-09 05:26:25 +0000340
Jake Ehrlich1b30d632017-09-20 18:23:01 +0000341 // If there was an error in the construction of the Header
Kevin Enderby2c182702016-08-04 21:54:19 +0000342 // then just return with the error now set.
343 if (*Err)
Kevin Enderby95b08422016-07-25 20:36:36 +0000344 return;
345
346 uint64_t Size = Header.getSizeOf();
Rafael Espindola9d102062014-12-16 01:43:41 +0000347 Data = StringRef(Start, Size);
Kevin Enderbyf4586032016-07-29 17:44:13 +0000348 Expected<bool> isThinOrErr = isThinMember();
349 if (!isThinOrErr) {
Kevin Enderby2c182702016-08-04 21:54:19 +0000350 *Err = isThinOrErr.takeError();
Kevin Enderbyf4586032016-07-29 17:44:13 +0000351 return;
352 }
353 bool isThin = isThinOrErr.get();
354 if (!isThin) {
Kevin Enderby6524bd82016-07-19 20:47:07 +0000355 Expected<uint64_t> MemberSize = getRawSize();
356 if (!MemberSize) {
Kevin Enderby2c182702016-08-04 21:54:19 +0000357 *Err = MemberSize.takeError();
Kevin Enderby7a969422015-11-05 19:24:56 +0000358 return;
Kevin Enderby6524bd82016-07-19 20:47:07 +0000359 }
Kevin Enderby7a969422015-11-05 19:24:56 +0000360 Size += MemberSize.get();
Rafael Espindolabe9ab262015-07-22 19:34:26 +0000361 Data = StringRef(Start, Size);
362 }
Rafael Espindola0f3de642013-07-09 05:26:25 +0000363
Rafael Espindola747bc072013-07-09 03:39:35 +0000364 // Setup StartOfFile and PaddingBytes.
Kevin Enderby95b08422016-07-25 20:36:36 +0000365 StartOfFile = Header.getSizeOf();
Rafael Espindola747bc072013-07-09 03:39:35 +0000366 // Don't include attached name.
Kevin Enderbyf4586032016-07-29 17:44:13 +0000367 Expected<StringRef> NameOrErr = getRawName();
368 if (!NameOrErr){
Kevin Enderby2c182702016-08-04 21:54:19 +0000369 *Err = NameOrErr.takeError();
Kevin Enderbyf4586032016-07-29 17:44:13 +0000370 return;
371 }
372 StringRef Name = NameOrErr.get();
Rafael Espindola747bc072013-07-09 03:39:35 +0000373 if (Name.startswith("#1/")) {
374 uint64_t NameSize;
Kevin Enderbyf4586032016-07-29 17:44:13 +0000375 if (Name.substr(3).rtrim(' ').getAsInteger(10, NameSize)) {
Kevin Enderby2c182702016-08-04 21:54:19 +0000376 std::string Buf;
377 raw_string_ostream OS(Buf);
378 OS.write_escaped(Name.substr(3).rtrim(' '));
379 OS.flush();
380 uint64_t Offset = Start - Parent->getData().data();
381 *Err = malformedError("long name length characters after the #1/ are "
382 "not all decimal numbers: '" + Buf + "' for "
383 "archive member header at offset " +
384 Twine(Offset));
385 return;
Kevin Enderbyf4586032016-07-29 17:44:13 +0000386 }
Rafael Espindola747bc072013-07-09 03:39:35 +0000387 StartOfFile += NameSize;
388 }
389}
390
Kevin Enderby6524bd82016-07-19 20:47:07 +0000391Expected<uint64_t> Archive::Child::getSize() const {
Kevin Enderby1c1add42015-10-13 20:48:04 +0000392 if (Parent->IsThin) {
Kevin Enderby95b08422016-07-25 20:36:36 +0000393 Expected<uint32_t> Size = Header.getSize();
Kevin Enderby6524bd82016-07-19 20:47:07 +0000394 if (!Size)
395 return Size.takeError();
Kevin Enderby1c1add42015-10-13 20:48:04 +0000396 return Size.get();
397 }
Rafael Espindola9d102062014-12-16 01:43:41 +0000398 return Data.size() - StartOfFile;
399}
400
Kevin Enderby6524bd82016-07-19 20:47:07 +0000401Expected<uint64_t> Archive::Child::getRawSize() const {
Kevin Enderby95b08422016-07-25 20:36:36 +0000402 return Header.getSize();
Kevin Enderby13023a12015-01-15 23:19:11 +0000403}
404
Kevin Enderbyf4586032016-07-29 17:44:13 +0000405Expected<bool> Archive::Child::isThinMember() const {
406 Expected<StringRef> NameOrErr = Header.getRawName();
407 if (!NameOrErr)
408 return NameOrErr.takeError();
409 StringRef Name = NameOrErr.get();
Rafael Espindolabe9ab262015-07-22 19:34:26 +0000410 return Parent->IsThin && Name != "/" && Name != "//";
411}
412
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000413Expected<std::string> Archive::Child::getFullName() const {
Kevin Enderbyf4586032016-07-29 17:44:13 +0000414 Expected<bool> isThin = isThinMember();
415 if (!isThin)
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000416 return isThin.takeError();
Kevin Enderbyf4586032016-07-29 17:44:13 +0000417 assert(isThin.get());
418 Expected<StringRef> NameOrErr = getName();
419 if (!NameOrErr)
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000420 return NameOrErr.takeError();
Rafael Espindola694210c2016-05-02 13:45:06 +0000421 StringRef Name = *NameOrErr;
422 if (sys::path::is_absolute(Name))
423 return Name;
424
425 SmallString<128> FullName = sys::path::parent_path(
426 Parent->getMemoryBufferRef().getBufferIdentifier());
427 sys::path::append(FullName, Name);
428 return StringRef(FullName);
429}
430
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000431Expected<StringRef> Archive::Child::getBuffer() const {
Kevin Enderbyf4586032016-07-29 17:44:13 +0000432 Expected<bool> isThinOrErr = isThinMember();
433 if (!isThinOrErr)
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000434 return isThinOrErr.takeError();
Kevin Enderbyf4586032016-07-29 17:44:13 +0000435 bool isThin = isThinOrErr.get();
436 if (!isThin) {
Kevin Enderby6524bd82016-07-19 20:47:07 +0000437 Expected<uint32_t> Size = getSize();
438 if (!Size)
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000439 return Size.takeError();
Kevin Enderby7a969422015-11-05 19:24:56 +0000440 return StringRef(Data.data() + StartOfFile, Size.get());
441 }
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000442 Expected<std::string> FullNameOrErr = getFullName();
443 if (!FullNameOrErr)
444 return FullNameOrErr.takeError();
445 const std::string &FullName = *FullNameOrErr;
Rafael Espindola4b83cb52015-07-14 22:18:43 +0000446 ErrorOr<std::unique_ptr<MemoryBuffer>> Buf = MemoryBuffer::getFile(FullName);
447 if (std::error_code EC = Buf.getError())
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000448 return errorCodeToError(EC);
Rafael Espindola4b83cb52015-07-14 22:18:43 +0000449 Parent->ThinBuffers.push_back(std::move(*Buf));
450 return Parent->ThinBuffers.back()->getBuffer();
451}
452
Kevin Enderby6524bd82016-07-19 20:47:07 +0000453Expected<Archive::Child> Archive::Child::getNext() const {
Rafael Espindola747bc072013-07-09 03:39:35 +0000454 size_t SpaceToSkip = Data.size();
455 // If it's odd, add 1 to make it even.
456 if (SpaceToSkip & 1)
Kevin Enderbyda9dd052015-10-21 17:13:20 +0000457 ++SpaceToSkip;
Rafael Espindola747bc072013-07-09 03:39:35 +0000458
Kevin Enderbyda9dd052015-10-21 17:13:20 +0000459 const char *NextLoc = Data.data() + SpaceToSkip;
Rafael Espindola747bc072013-07-09 03:39:35 +0000460
Kevin Enderby7a969422015-11-05 19:24:56 +0000461 // Check to see if this is at the end of the archive.
462 if (NextLoc == Parent->Data.getBufferEnd())
Lang Hamesa5e873e2016-10-05 21:20:00 +0000463 return Child(nullptr, nullptr, nullptr);
Rafael Espindola747bc072013-07-09 03:39:35 +0000464
Kevin Enderby7a969422015-11-05 19:24:56 +0000465 // Check to see if this is past the end of the archive.
Kevin Enderby95b08422016-07-25 20:36:36 +0000466 if (NextLoc > Parent->Data.getBufferEnd()) {
Kevin Enderby31b07f12016-07-29 22:32:02 +0000467 std::string Msg("offset to next archive member past the end of the archive "
468 "after member ");
Kevin Enderbyf4586032016-07-29 17:44:13 +0000469 Expected<StringRef> NameOrErr = getName();
470 if (!NameOrErr) {
471 consumeError(NameOrErr.takeError());
Kevin Enderby95b08422016-07-25 20:36:36 +0000472 uint64_t Offset = Data.data() - Parent->getData().data();
473 return malformedError(Msg + "at offset " + Twine(Offset));
474 } else
Kevin Enderby31b07f12016-07-29 22:32:02 +0000475 return malformedError(Msg + NameOrErr.get());
Kevin Enderby95b08422016-07-25 20:36:36 +0000476 }
Kevin Enderby7a969422015-11-05 19:24:56 +0000477
Mehdi Amini41af4302016-11-11 04:28:40 +0000478 Error Err = Error::success();
Kevin Enderby6524bd82016-07-19 20:47:07 +0000479 Child Ret(Parent, NextLoc, &Err);
480 if (Err)
481 return std::move(Err);
Kevin Enderby7a969422015-11-05 19:24:56 +0000482 return Ret;
Rafael Espindola747bc072013-07-09 03:39:35 +0000483}
484
Kevin Enderby13023a12015-01-15 23:19:11 +0000485uint64_t Archive::Child::getChildOffset() const {
486 const char *a = Parent->Data.getBuffer().data();
487 const char *c = Data.data();
488 uint64_t offset = c - a;
489 return offset;
490}
491
Kevin Enderbyf4586032016-07-29 17:44:13 +0000492Expected<StringRef> Archive::Child::getName() const {
493 Expected<uint64_t> RawSizeOrErr = getRawSize();
494 if (!RawSizeOrErr)
495 return RawSizeOrErr.takeError();
496 uint64_t RawSize = RawSizeOrErr.get();
497 Expected<StringRef> NameOrErr = Header.getName(Header.getSizeOf() + RawSize);
498 if (!NameOrErr)
499 return NameOrErr.takeError();
500 StringRef Name = NameOrErr.get();
501 return Name;
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000502}
503
Kevin Enderbyf4586032016-07-29 17:44:13 +0000504Expected<MemoryBufferRef> Archive::Child::getMemoryBufferRef() const {
505 Expected<StringRef> NameOrErr = getName();
506 if (!NameOrErr)
507 return NameOrErr.takeError();
Rafael Espindolaae460022014-06-16 16:08:36 +0000508 StringRef Name = NameOrErr.get();
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000509 Expected<StringRef> Buf = getBuffer();
510 if (!Buf)
511 return Buf.takeError();
Rafael Espindola4b83cb52015-07-14 22:18:43 +0000512 return MemoryBufferRef(*Buf, Name);
Rafael Espindolaae460022014-06-16 16:08:36 +0000513}
514
Kevin Enderbyac9e1552016-05-17 17:10:12 +0000515Expected<std::unique_ptr<Binary>>
Rafael Espindolaae460022014-06-16 16:08:36 +0000516Archive::Child::getAsBinary(LLVMContext *Context) const {
Kevin Enderbyf4586032016-07-29 17:44:13 +0000517 Expected<MemoryBufferRef> BuffOrErr = getMemoryBufferRef();
518 if (!BuffOrErr)
519 return BuffOrErr.takeError();
Rafael Espindolac3f9b5a2014-06-23 21:53:12 +0000520
Kevin Enderby3fcdf6a2016-04-06 22:14:09 +0000521 auto BinaryOrErr = createBinary(BuffOrErr.get(), Context);
522 if (BinaryOrErr)
523 return std::move(*BinaryOrErr);
Kevin Enderbyac9e1552016-05-17 17:10:12 +0000524 return BinaryOrErr.takeError();
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000525}
526
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000527Expected<std::unique_ptr<Archive>> Archive::create(MemoryBufferRef Source) {
Mehdi Amini41af4302016-11-11 04:28:40 +0000528 Error Err = Error::success();
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000529 std::unique_ptr<Archive> Ret(new Archive(Source, Err));
530 if (Err)
531 return std::move(Err);
Rafael Espindolaf5577132014-07-31 03:36:00 +0000532 return std::move(Ret);
Rafael Espindola692410e2014-01-21 23:06:54 +0000533}
534
Rafael Espindola43358762015-10-31 21:44:42 +0000535void Archive::setFirstRegular(const Child &C) {
536 FirstRegularData = C.Data;
537 FirstRegularStartOfFile = C.StartOfFile;
538}
539
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000540Archive::Archive(MemoryBufferRef Source, Error &Err)
Rafael Espindola43358762015-10-31 21:44:42 +0000541 : Binary(Binary::ID_Archive, Source) {
Lang Hames5e51a2e2016-07-22 16:11:25 +0000542 ErrorAsOutParameter ErrAsOutParam(&Err);
Rafael Espindola9d102062014-12-16 01:43:41 +0000543 StringRef Buffer = Data.getBuffer();
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000544 // Check for sufficient magic.
Rafael Espindola9d102062014-12-16 01:43:41 +0000545 if (Buffer.startswith(ThinMagic)) {
546 IsThin = true;
547 } else if (Buffer.startswith(Magic)) {
548 IsThin = false;
549 } else {
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000550 Err = make_error<GenericBinaryError>("File too small to be an archive",
551 object_error::invalid_file_type);
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000552 return;
553 }
554
Kevin Enderbyf4586032016-07-29 17:44:13 +0000555 // Make sure Format is initialized before any call to
556 // ArchiveMemberHeader::getName() is made. This could be a valid empty
557 // archive which is the same in all formats. So claiming it to be gnu to is
558 // fine if not totally correct before we look for a string table or table of
559 // contents.
560 Format = K_GNU;
561
Michael J. Spencere03ea9c2011-11-02 19:33:12 +0000562 // Get the special members.
Lang Hamesfc209622016-07-14 02:24:01 +0000563 child_iterator I = child_begin(Err, false);
564 if (Err)
Kevin Enderby7a969422015-11-05 19:24:56 +0000565 return;
566 child_iterator E = child_end();
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000567
Kevin Enderbyf4586032016-07-29 17:44:13 +0000568 // See if this is a valid empty archive and if so return.
Kevin Enderby7a969422015-11-05 19:24:56 +0000569 if (I == E) {
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000570 Err = Error::success();
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000571 return;
572 }
Lang Hamesfc209622016-07-14 02:24:01 +0000573 const Child *C = &*I;
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000574
Kevin Enderby7a969422015-11-05 19:24:56 +0000575 auto Increment = [&]() {
576 ++I;
Lang Hamesfc209622016-07-14 02:24:01 +0000577 if (Err)
Kevin Enderby7a969422015-11-05 19:24:56 +0000578 return true;
Lang Hamesfc209622016-07-14 02:24:01 +0000579 C = &*I;
Kevin Enderby7a969422015-11-05 19:24:56 +0000580 return false;
581 };
582
Kevin Enderbyf4586032016-07-29 17:44:13 +0000583 Expected<StringRef> NameOrErr = C->getRawName();
584 if (!NameOrErr) {
585 Err = NameOrErr.takeError();
586 return;
587 }
588 StringRef Name = NameOrErr.get();
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000589
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000590 // Below is the pattern that is used to figure out the archive format
591 // GNU archive format
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000592 // First member : / (may exist, if it exists, points to the symbol table )
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000593 // Second member : // (may exist, if it exists, points to the string table)
594 // Note : The string table is used if the filename exceeds 15 characters
595 // BSD archive format
Rafael Espindola55509922013-07-10 22:07:59 +0000596 // First member : __.SYMDEF or "__.SYMDEF SORTED" (the symbol table)
597 // There is no string table, if the filename exceeds 15 characters or has a
598 // embedded space, the filename has #1/<size>, The size represents the size
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000599 // of the filename that needs to be read after the archive header
600 // COFF archive format
601 // First member : /
602 // Second member : / (provides a directory of symbols)
Rui Ueyamaf4d0a8c2013-06-03 00:27:03 +0000603 // Third member : // (may exist, if it exists, contains the string table)
604 // Note: Microsoft PE/COFF Spec 8.3 says that the third member is present
605 // even if the string table is empty. However, lib.exe does not in fact
606 // seem to create the third member if there's no member whose filename
607 // exceeds 15 characters. So the third member is optional.
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000608
Kevin Enderbyae108ff2016-06-17 22:16:06 +0000609 if (Name == "__.SYMDEF" || Name == "__.SYMDEF_64") {
610 if (Name == "__.SYMDEF")
611 Format = K_BSD;
612 else // Name == "__.SYMDEF_64"
613 Format = K_DARWIN64;
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000614 // We know that the symbol table is not an external file, but we still must
615 // check any Expected<> return value.
616 Expected<StringRef> BufOrErr = C->getBuffer();
617 if (!BufOrErr) {
618 Err = BufOrErr.takeError();
619 return;
620 }
621 SymbolTable = BufOrErr.get();
Kevin Enderby7a969422015-11-05 19:24:56 +0000622 if (Increment())
623 return;
624 setFirstRegular(*C);
625
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000626 Err = Error::success();
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000627 return;
628 }
629
Rafael Espindola55509922013-07-10 22:07:59 +0000630 if (Name.startswith("#1/")) {
631 Format = K_BSD;
632 // We know this is BSD, so getName will work since there is no string table.
Kevin Enderbyf4586032016-07-29 17:44:13 +0000633 Expected<StringRef> NameOrErr = C->getName();
634 if (!NameOrErr) {
635 Err = NameOrErr.takeError();
Rafael Espindola55509922013-07-10 22:07:59 +0000636 return;
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000637 }
Rafael Espindolaae460022014-06-16 16:08:36 +0000638 Name = NameOrErr.get();
Nick Kledzikf44dbda2014-11-12 01:37:45 +0000639 if (Name == "__.SYMDEF SORTED" || Name == "__.SYMDEF") {
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000640 // We know that the symbol table is not an external file, but we still
641 // must check any Expected<> return value.
642 Expected<StringRef> BufOrErr = C->getBuffer();
643 if (!BufOrErr) {
644 Err = BufOrErr.takeError();
645 return;
646 }
647 SymbolTable = BufOrErr.get();
Kevin Enderby7a969422015-11-05 19:24:56 +0000648 if (Increment())
649 return;
Rafael Espindola3e2b21c2013-07-12 20:21:39 +0000650 }
Kevin Enderbyae108ff2016-06-17 22:16:06 +0000651 else if (Name == "__.SYMDEF_64 SORTED" || Name == "__.SYMDEF_64") {
652 Format = K_DARWIN64;
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000653 // We know that the symbol table is not an external file, but we still
654 // must check any Expected<> return value.
655 Expected<StringRef> BufOrErr = C->getBuffer();
656 if (!BufOrErr) {
657 Err = BufOrErr.takeError();
658 return;
659 }
660 SymbolTable = BufOrErr.get();
Kevin Enderbyae108ff2016-06-17 22:16:06 +0000661 if (Increment())
662 return;
663 }
Kevin Enderby7a969422015-11-05 19:24:56 +0000664 setFirstRegular(*C);
Rafael Espindola55509922013-07-10 22:07:59 +0000665 return;
666 }
667
Simon Atanasyan1d902b72015-02-17 18:54:22 +0000668 // MIPS 64-bit ELF archives use a special format of a symbol table.
669 // This format is marked by `ar_name` field equals to "/SYM64/".
670 // For detailed description see page 96 in the following document:
671 // http://techpubs.sgi.com/library/manuals/4000/007-4658-001/pdf/007-4658-001.pdf
672
673 bool has64SymTable = false;
674 if (Name == "/" || Name == "/SYM64/") {
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000675 // We know that the symbol table is not an external file, but we still
676 // must check any Expected<> return value.
677 Expected<StringRef> BufOrErr = C->getBuffer();
678 if (!BufOrErr) {
679 Err = BufOrErr.takeError();
680 return;
681 }
682 SymbolTable = BufOrErr.get();
Simon Atanasyan1d902b72015-02-17 18:54:22 +0000683 if (Name == "/SYM64/")
684 has64SymTable = true;
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000685
Kevin Enderby7a969422015-11-05 19:24:56 +0000686 if (Increment())
687 return;
688 if (I == E) {
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000689 Err = Error::success();
Michael J. Spencer04614ff2013-01-10 00:07:38 +0000690 return;
691 }
Kevin Enderbyf4586032016-07-29 17:44:13 +0000692 Expected<StringRef> NameOrErr = C->getRawName();
693 if (!NameOrErr) {
694 Err = NameOrErr.takeError();
695 return;
696 }
697 Name = NameOrErr.get();
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000698 }
699
Rafael Espindola6cc2dc72013-07-05 03:35:15 +0000700 if (Name == "//") {
Jake Ehrlich1b30d632017-09-20 18:23:01 +0000701 Format = has64SymTable ? K_GNU64 : K_GNU;
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000702 // The string table is never an external member, but we still
703 // must check any Expected<> return value.
704 Expected<StringRef> BufOrErr = C->getBuffer();
705 if (!BufOrErr) {
706 Err = BufOrErr.takeError();
707 return;
708 }
709 StringTable = BufOrErr.get();
Kevin Enderby7a969422015-11-05 19:24:56 +0000710 if (Increment())
711 return;
712 setFirstRegular(*C);
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000713 Err = Error::success();
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000714 return;
715 }
716
Rafael Espindola6cc2dc72013-07-05 03:35:15 +0000717 if (Name[0] != '/') {
Jake Ehrlich1b30d632017-09-20 18:23:01 +0000718 Format = has64SymTable ? K_GNU64 : K_GNU;
Kevin Enderby7a969422015-11-05 19:24:56 +0000719 setFirstRegular(*C);
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000720 Err = Error::success();
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000721 return;
722 }
723
Rafael Espindola6cc2dc72013-07-05 03:35:15 +0000724 if (Name != "/") {
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000725 Err = errorCodeToError(object_error::parse_failed);
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000726 return;
727 }
728
729 Format = K_COFF;
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000730 // We know that the symbol table is not an external file, but we still
731 // must check any Expected<> return value.
732 Expected<StringRef> BufOrErr = C->getBuffer();
733 if (!BufOrErr) {
734 Err = BufOrErr.takeError();
735 return;
736 }
737 SymbolTable = BufOrErr.get();
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000738
Kevin Enderby7a969422015-11-05 19:24:56 +0000739 if (Increment())
740 return;
741
742 if (I == E) {
743 setFirstRegular(*C);
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000744 Err = Error::success();
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000745 return;
746 }
747
Kevin Enderbyf4586032016-07-29 17:44:13 +0000748 NameOrErr = C->getRawName();
749 if (!NameOrErr) {
750 Err = NameOrErr.takeError();
751 return;
752 }
753 Name = NameOrErr.get();
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000754
Rafael Espindola3e2b21c2013-07-12 20:21:39 +0000755 if (Name == "//") {
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000756 // The string table is never an external member, but we still
757 // must check any Expected<> return value.
758 Expected<StringRef> BufOrErr = C->getBuffer();
759 if (!BufOrErr) {
760 Err = BufOrErr.takeError();
761 return;
762 }
763 StringTable = BufOrErr.get();
Kevin Enderby7a969422015-11-05 19:24:56 +0000764 if (Increment())
765 return;
Rafael Espindola3e2b21c2013-07-12 20:21:39 +0000766 }
Rafael Espindola88ae7dd2013-07-03 15:57:14 +0000767
Kevin Enderby7a969422015-11-05 19:24:56 +0000768 setFirstRegular(*C);
Kevin Enderbyc60a3212016-06-29 20:35:44 +0000769 Err = Error::success();
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000770}
771
Lang Hamesfc209622016-07-14 02:24:01 +0000772Archive::child_iterator Archive::child_begin(Error &Err,
773 bool SkipInternal) const {
Rui Ueyama14a5ca02016-09-30 17:54:31 +0000774 if (isEmpty())
Rafael Espindola23a97502014-01-21 16:09:45 +0000775 return child_end();
Rafael Espindola3e2b21c2013-07-12 20:21:39 +0000776
777 if (SkipInternal)
Lang Hamesfc209622016-07-14 02:24:01 +0000778 return child_iterator(Child(this, FirstRegularData,
779 FirstRegularStartOfFile),
780 &Err);
Rafael Espindola3e2b21c2013-07-12 20:21:39 +0000781
Rafael Espindola48af1c22014-08-19 18:44:46 +0000782 const char *Loc = Data.getBufferStart() + strlen(Magic);
Kevin Enderby6524bd82016-07-19 20:47:07 +0000783 Child C(this, Loc, &Err);
784 if (Err)
Lang Hamesfc209622016-07-14 02:24:01 +0000785 return child_end();
Lang Hamesfc209622016-07-14 02:24:01 +0000786 return child_iterator(C, &Err);
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000787}
788
Rafael Espindola23a97502014-01-21 16:09:45 +0000789Archive::child_iterator Archive::child_end() const {
Lang Hamesa5e873e2016-10-05 21:20:00 +0000790 return child_iterator(Child(nullptr, nullptr, nullptr), nullptr);
Michael J. Spencerd3b7b122011-09-27 19:36:55 +0000791}
Michael J. Spencere03ea9c2011-11-02 19:33:12 +0000792
Rafael Espindolaae460022014-06-16 16:08:36 +0000793StringRef Archive::Symbol::getName() const {
Rafael Espindola2b054162015-07-14 01:06:16 +0000794 return Parent->getSymbolTable().begin() + StringIndex;
Michael J. Spencere03ea9c2011-11-02 19:33:12 +0000795}
796
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000797Expected<Archive::Child> Archive::Symbol::getMember() const {
Rafael Espindola2b054162015-07-14 01:06:16 +0000798 const char *Buf = Parent->getSymbolTable().begin();
Simon Atanasyan1d902b72015-02-17 18:54:22 +0000799 const char *Offsets = Buf;
Jake Ehrlich1b30d632017-09-20 18:23:01 +0000800 if (Parent->kind() == K_GNU64 || Parent->kind() == K_DARWIN64)
Simon Atanasyan1d902b72015-02-17 18:54:22 +0000801 Offsets += sizeof(uint64_t);
802 else
803 Offsets += sizeof(uint32_t);
Jake Ehrlichde370412017-10-27 21:47:38 +0000804 uint64_t Offset = 0;
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000805 if (Parent->kind() == K_GNU) {
Rui Ueyama3206b792015-03-02 21:19:12 +0000806 Offset = read32be(Offsets + SymbolIndex * 4);
Jake Ehrlich1b30d632017-09-20 18:23:01 +0000807 } else if (Parent->kind() == K_GNU64) {
Rui Ueyama3206b792015-03-02 21:19:12 +0000808 Offset = read64be(Offsets + SymbolIndex * 8);
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000809 } else if (Parent->kind() == K_BSD) {
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000810 // The SymbolIndex is an index into the ranlib structs that start at
811 // Offsets (the first uint32_t is the number of bytes of the ranlib
812 // structs). The ranlib structs are a pair of uint32_t's the first
813 // being a string table offset and the second being the offset into
814 // the archive of the member that defines the symbol. Which is what
815 // is needed here.
Rui Ueyama3206b792015-03-02 21:19:12 +0000816 Offset = read32le(Offsets + SymbolIndex * 8 + 4);
Kevin Enderbyae108ff2016-06-17 22:16:06 +0000817 } else if (Parent->kind() == K_DARWIN64) {
818 // The SymbolIndex is an index into the ranlib_64 structs that start at
819 // Offsets (the first uint64_t is the number of bytes of the ranlib_64
820 // structs). The ranlib_64 structs are a pair of uint64_t's the first
821 // being a string table offset and the second being the offset into
822 // the archive of the member that defines the symbol. Which is what
823 // is needed here.
824 Offset = read64le(Offsets + SymbolIndex * 16 + 8);
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000825 } else {
Michael J. Spencer4e92d5b2012-11-14 00:04:13 +0000826 // Skip offsets.
Rui Ueyama3206b792015-03-02 21:19:12 +0000827 uint32_t MemberCount = read32le(Buf);
828 Buf += MemberCount * 4 + 4;
Michael J. Spencer4e92d5b2012-11-14 00:04:13 +0000829
Rui Ueyama3206b792015-03-02 21:19:12 +0000830 uint32_t SymbolCount = read32le(Buf);
Michael J. Spencer4e92d5b2012-11-14 00:04:13 +0000831 if (SymbolIndex >= SymbolCount)
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000832 return errorCodeToError(object_error::parse_failed);
Michael J. Spencer4e92d5b2012-11-14 00:04:13 +0000833
Matt Beaumont-Gay68e0b6a2012-11-14 00:21:27 +0000834 // Skip SymbolCount to get to the indices table.
Rui Ueyama3206b792015-03-02 21:19:12 +0000835 const char *Indices = Buf + 4;
Michael J. Spencer4e92d5b2012-11-14 00:04:13 +0000836
837 // Get the index of the offset in the file member offset table for this
838 // symbol.
Rui Ueyama3206b792015-03-02 21:19:12 +0000839 uint16_t OffsetIndex = read16le(Indices + SymbolIndex * 2);
Michael J. Spencer4e92d5b2012-11-14 00:04:13 +0000840 // Subtract 1 since OffsetIndex is 1 based.
841 --OffsetIndex;
842
843 if (OffsetIndex >= MemberCount)
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000844 return errorCodeToError(object_error::parse_failed);
Michael J. Spencer4e92d5b2012-11-14 00:04:13 +0000845
Rui Ueyama3206b792015-03-02 21:19:12 +0000846 Offset = read32le(Offsets + OffsetIndex * 4);
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000847 }
Michael J. Spencere03ea9c2011-11-02 19:33:12 +0000848
Michael J. Spencer4e92d5b2012-11-14 00:04:13 +0000849 const char *Loc = Parent->getData().begin() + Offset;
Mehdi Amini41af4302016-11-11 04:28:40 +0000850 Error Err = Error::success();
Kevin Enderby6524bd82016-07-19 20:47:07 +0000851 Child C(Parent, Loc, &Err);
852 if (Err)
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000853 return std::move(Err);
Kevin Enderby7a969422015-11-05 19:24:56 +0000854 return C;
Michael J. Spencere03ea9c2011-11-02 19:33:12 +0000855}
856
857Archive::Symbol Archive::Symbol::getNext() const {
858 Symbol t(*this);
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000859 if (Parent->kind() == K_BSD) {
860 // t.StringIndex is an offset from the start of the __.SYMDEF or
861 // "__.SYMDEF SORTED" member into the string table for the ranlib
862 // struct indexed by t.SymbolIndex . To change t.StringIndex to the
863 // offset in the string table for t.SymbolIndex+1 we subtract the
864 // its offset from the start of the string table for t.SymbolIndex
865 // and add the offset of the string table for t.SymbolIndex+1.
866
867 // The __.SYMDEF or "__.SYMDEF SORTED" member starts with a uint32_t
868 // which is the number of bytes of ranlib structs that follow. The ranlib
869 // structs are a pair of uint32_t's the first being a string table offset
870 // and the second being the offset into the archive of the member that
871 // define the symbol. After that the next uint32_t is the byte count of
872 // the string table followed by the string table.
Rafael Espindola2b054162015-07-14 01:06:16 +0000873 const char *Buf = Parent->getSymbolTable().begin();
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000874 uint32_t RanlibCount = 0;
Rui Ueyama3206b792015-03-02 21:19:12 +0000875 RanlibCount = read32le(Buf) / 8;
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000876 // If t.SymbolIndex + 1 will be past the count of symbols (the RanlibCount)
877 // don't change the t.StringIndex as we don't want to reference a ranlib
878 // past RanlibCount.
879 if (t.SymbolIndex + 1 < RanlibCount) {
880 const char *Ranlibs = Buf + 4;
881 uint32_t CurRanStrx = 0;
882 uint32_t NextRanStrx = 0;
Rui Ueyama3206b792015-03-02 21:19:12 +0000883 CurRanStrx = read32le(Ranlibs + t.SymbolIndex * 8);
884 NextRanStrx = read32le(Ranlibs + (t.SymbolIndex + 1) * 8);
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000885 t.StringIndex -= CurRanStrx;
886 t.StringIndex += NextRanStrx;
887 }
888 } else {
889 // Go to one past next null.
Rafael Espindola2b054162015-07-14 01:06:16 +0000890 t.StringIndex = Parent->getSymbolTable().find('\0', t.StringIndex) + 1;
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000891 }
Michael J. Spencere03ea9c2011-11-02 19:33:12 +0000892 ++t.SymbolIndex;
893 return t;
894}
895
Rafael Espindola23a97502014-01-21 16:09:45 +0000896Archive::symbol_iterator Archive::symbol_begin() const {
Rafael Espindolab6b5f52e2013-07-29 12:40:31 +0000897 if (!hasSymbolTable())
Rafael Espindolafbcafc02013-07-10 20:14:22 +0000898 return symbol_iterator(Symbol(this, 0, 0));
899
Rafael Espindola2b054162015-07-14 01:06:16 +0000900 const char *buf = getSymbolTable().begin();
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000901 if (kind() == K_GNU) {
902 uint32_t symbol_count = 0;
Rui Ueyama3206b792015-03-02 21:19:12 +0000903 symbol_count = read32be(buf);
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000904 buf += sizeof(uint32_t) + (symbol_count * (sizeof(uint32_t)));
Jake Ehrlich1b30d632017-09-20 18:23:01 +0000905 } else if (kind() == K_GNU64) {
Rui Ueyama3206b792015-03-02 21:19:12 +0000906 uint64_t symbol_count = read64be(buf);
Simon Atanasyan1d902b72015-02-17 18:54:22 +0000907 buf += sizeof(uint64_t) + (symbol_count * (sizeof(uint64_t)));
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000908 } else if (kind() == K_BSD) {
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000909 // The __.SYMDEF or "__.SYMDEF SORTED" member starts with a uint32_t
910 // which is the number of bytes of ranlib structs that follow. The ranlib
911 // structs are a pair of uint32_t's the first being a string table offset
912 // and the second being the offset into the archive of the member that
913 // define the symbol. After that the next uint32_t is the byte count of
914 // the string table followed by the string table.
915 uint32_t ranlib_count = 0;
Rui Ueyama3206b792015-03-02 21:19:12 +0000916 ranlib_count = read32le(buf) / 8;
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000917 const char *ranlibs = buf + 4;
918 uint32_t ran_strx = 0;
Rui Ueyama3206b792015-03-02 21:19:12 +0000919 ran_strx = read32le(ranlibs);
Kevin Enderby8c50dbb2014-07-08 22:10:02 +0000920 buf += sizeof(uint32_t) + (ranlib_count * (2 * (sizeof(uint32_t))));
921 // Skip the byte count of the string table.
922 buf += sizeof(uint32_t);
923 buf += ran_strx;
Kevin Enderbyae108ff2016-06-17 22:16:06 +0000924 } else if (kind() == K_DARWIN64) {
925 // The __.SYMDEF_64 or "__.SYMDEF_64 SORTED" member starts with a uint64_t
926 // which is the number of bytes of ranlib_64 structs that follow. The
927 // ranlib_64 structs are a pair of uint64_t's the first being a string
928 // table offset and the second being the offset into the archive of the
929 // member that define the symbol. After that the next uint64_t is the byte
930 // count of the string table followed by the string table.
931 uint64_t ranlib_count = 0;
932 ranlib_count = read64le(buf) / 16;
933 const char *ranlibs = buf + 8;
934 uint64_t ran_strx = 0;
935 ran_strx = read64le(ranlibs);
936 buf += sizeof(uint64_t) + (ranlib_count * (2 * (sizeof(uint64_t))));
937 // Skip the byte count of the string table.
938 buf += sizeof(uint64_t);
939 buf += ran_strx;
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000940 } else {
941 uint32_t member_count = 0;
942 uint32_t symbol_count = 0;
Rui Ueyama3206b792015-03-02 21:19:12 +0000943 member_count = read32le(buf);
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000944 buf += 4 + (member_count * 4); // Skip offsets.
Rui Ueyama3206b792015-03-02 21:19:12 +0000945 symbol_count = read32le(buf);
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000946 buf += 4 + (symbol_count * 2); // Skip indices.
947 }
Rafael Espindola2b054162015-07-14 01:06:16 +0000948 uint32_t string_start_offset = buf - getSymbolTable().begin();
Michael J. Spencere03ea9c2011-11-02 19:33:12 +0000949 return symbol_iterator(Symbol(this, 0, string_start_offset));
950}
951
Rafael Espindola23a97502014-01-21 16:09:45 +0000952Archive::symbol_iterator Archive::symbol_end() const {
Rui Ueyama407e0972015-05-26 16:20:40 +0000953 return symbol_iterator(Symbol(this, getNumberOfSymbols(), 0));
954}
Rafael Espindolafbcafc02013-07-10 20:14:22 +0000955
Rui Ueyama407e0972015-05-26 16:20:40 +0000956uint32_t Archive::getNumberOfSymbols() const {
Rafael Espindola483ad202015-10-08 18:06:20 +0000957 if (!hasSymbolTable())
958 return 0;
Rafael Espindola2b054162015-07-14 01:06:16 +0000959 const char *buf = getSymbolTable().begin();
Rui Ueyama407e0972015-05-26 16:20:40 +0000960 if (kind() == K_GNU)
961 return read32be(buf);
Jake Ehrlich1b30d632017-09-20 18:23:01 +0000962 if (kind() == K_GNU64)
Rui Ueyama407e0972015-05-26 16:20:40 +0000963 return read64be(buf);
964 if (kind() == K_BSD)
965 return read32le(buf) / 8;
Kevin Enderbyae108ff2016-06-17 22:16:06 +0000966 if (kind() == K_DARWIN64)
967 return read64le(buf) / 16;
Rui Ueyama407e0972015-05-26 16:20:40 +0000968 uint32_t member_count = 0;
969 member_count = read32le(buf);
970 buf += 4 + (member_count * 4); // Skip offsets.
971 return read32le(buf);
Michael J. Spencere03ea9c2011-11-02 19:33:12 +0000972}
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000973
Lang Hames69f49022016-07-14 20:44:27 +0000974Expected<Optional<Archive::Child>> Archive::findSym(StringRef name) const {
Rafael Espindola23a97502014-01-21 16:09:45 +0000975 Archive::symbol_iterator bs = symbol_begin();
976 Archive::symbol_iterator es = symbol_end();
Rafael Espindolaae460022014-06-16 16:08:36 +0000977
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000978 for (; bs != es; ++bs) {
Rafael Espindolaae460022014-06-16 16:08:36 +0000979 StringRef SymName = bs->getName();
980 if (SymName == name) {
Lang Hames69f49022016-07-14 20:44:27 +0000981 if (auto MemberOrErr = bs->getMember())
982 return Child(*MemberOrErr);
983 else
Kevin Enderby27e85bd2016-08-03 21:57:47 +0000984 return MemberOrErr.takeError();
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000985 }
986 }
Lang Hames69f49022016-07-14 20:44:27 +0000987 return Optional<Child>();
Shankar Easwaran15b28be2012-11-13 18:38:42 +0000988}
Rafael Espindolab6b5f52e2013-07-29 12:40:31 +0000989
Rui Ueyama14a5ca02016-09-30 17:54:31 +0000990// Returns true if archive file contains no member file.
991bool Archive::isEmpty() const { return Data.getBufferSize() == 8; }
992
Rafael Espindola4a782fb2015-10-31 21:03:29 +0000993bool Archive::hasSymbolTable() const { return !SymbolTable.empty(); }