Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 1 | //===- Archive.cpp - ar File Format implementation --------------*- C++ -*-===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements the Archive, Archive::Child and ArchiveMemberHeader classes. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "llvm/Object/Archive.h" |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 15 | #include "llvm/ADT/SmallString.h" |
| 16 | #include "llvm/ADT/Twine.h" |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 17 | #include "llvm/Support/Endian.h" |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 18 | #include "llvm/Support/MemoryBuffer.h" |
Rafael Espindola | 4b83cb5 | 2015-07-14 22:18:43 +0000 | [diff] [blame] | 19 | #include "llvm/Support/Path.h" |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 20 | |
| 21 | using namespace llvm; |
| 22 | using namespace object; |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 23 | using namespace llvm::support::endian; |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 24 | |
/// Signature bytes expected at the very start of a regular archive.
static const char *const Magic = "!<arch>\n";
/// Signature bytes expected at the very start of a thin archive.
static const char *const ThinMagic = "!<thin>\n";
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 27 | |
David Blaikie | a379b181 | 2011-12-20 02:50:00 +0000 | [diff] [blame] | 28 | void Archive::anchor() { } |
| 29 | |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 30 | static Error |
| 31 | malformedError(Twine Msg) { |
| 32 | std::string StringMsg = "truncated or malformed archive (" + Msg.str() + ")"; |
| 33 | return make_error<GenericBinaryError>(std::move(StringMsg), |
| 34 | object_error::parse_failed); |
| 35 | } |
| 36 | |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 37 | ArchiveMemberHeader::ArchiveMemberHeader(const Archive *Parent, |
| 38 | const char *RawHeaderPtr, |
| 39 | uint64_t Size, Error *Err) |
| 40 | : Parent(Parent), |
| 41 | ArMemHdr(reinterpret_cast<const ArMemHdrType *>(RawHeaderPtr)) { |
| 42 | if (RawHeaderPtr == nullptr) |
| 43 | return; |
| 44 | ErrorAsOutParameter ErrAsOutParam(Err); |
| 45 | |
| 46 | // TODO: For errors messages with the ArchiveMemberHeader class use the |
| 47 | // archive member name instead of the the offset to the archive member header. |
| 48 | // When there is also error getting the member name then use the offset to |
| 49 | // the member in the message. |
| 50 | |
| 51 | if (Size < sizeof(ArMemHdrType)) { |
| 52 | if (Err) { |
| 53 | uint64_t Offset = RawHeaderPtr - Parent->getData().data(); |
| 54 | *Err = malformedError("remaining size of archive too small for next " |
| 55 | "archive member header at offset " + |
| 56 | Twine(Offset)); |
| 57 | } |
| 58 | return; |
| 59 | } |
| 60 | if (ArMemHdr->Terminator[0] != '`' || ArMemHdr->Terminator[1] != '\n') { |
| 61 | if (Err) { |
| 62 | std::string Buf; |
| 63 | raw_string_ostream OS(Buf); |
| 64 | OS.write_escaped(llvm::StringRef(ArMemHdr->Terminator, |
| 65 | sizeof(ArMemHdr->Terminator))); |
| 66 | OS.flush(); |
| 67 | uint64_t Offset = RawHeaderPtr - Parent->getData().data(); |
| 68 | *Err = malformedError("terminator characters in archive member \"" + Buf + |
| 69 | "\" not the correct \"`\\n\" values for the " |
| 70 | "archive member header at offset " + Twine(Offset)); |
| 71 | } |
| 72 | return; |
| 73 | } |
| 74 | } |
| 75 | |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 76 | StringRef ArchiveMemberHeader::getName() const { |
| 77 | char EndCond; |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 78 | if (ArMemHdr->Name[0] == '/' || ArMemHdr->Name[0] == '#') |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 79 | EndCond = ' '; |
| 80 | else |
| 81 | EndCond = '/'; |
| 82 | llvm::StringRef::size_type end = |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 83 | llvm::StringRef(ArMemHdr->Name, sizeof(ArMemHdr->Name)).find(EndCond); |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 84 | if (end == llvm::StringRef::npos) |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 85 | end = sizeof(ArMemHdr->Name); |
| 86 | assert(end <= sizeof(ArMemHdr->Name) && end > 0); |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 87 | // Don't include the EndCond if there is one. |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 88 | return llvm::StringRef(ArMemHdr->Name, end); |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 89 | } |
| 90 | |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 91 | Expected<uint32_t> ArchiveMemberHeader::getSize() const { |
Rafael Espindola | 8e9385e | 2013-07-09 12:45:11 +0000 | [diff] [blame] | 92 | uint32_t Ret; |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 93 | if (llvm::StringRef(ArMemHdr->Size, |
| 94 | sizeof(ArMemHdr->Size)).rtrim(" ").getAsInteger(10, Ret)) { |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 95 | std::string Buf; |
| 96 | raw_string_ostream OS(Buf); |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 97 | OS.write_escaped(llvm::StringRef(ArMemHdr->Size, |
| 98 | sizeof(ArMemHdr->Size)).rtrim(" ")); |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 99 | OS.flush(); |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 100 | uint64_t Offset = reinterpret_cast<const char *>(ArMemHdr) - |
| 101 | Parent->getData().data(); |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 102 | return malformedError("characters in size field in archive header are not " |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 103 | "all decimal numbers: '" + Buf + "' for archive " |
| 104 | "member header at offset " + Twine(Offset)); |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 105 | } |
Rafael Espindola | 8e9385e | 2013-07-09 12:45:11 +0000 | [diff] [blame] | 106 | return Ret; |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 107 | } |
| 108 | |
Rafael Espindola | 8115e1d | 2013-07-09 12:49:24 +0000 | [diff] [blame] | 109 | sys::fs::perms ArchiveMemberHeader::getAccessMode() const { |
| 110 | unsigned Ret; |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 111 | if (StringRef(ArMemHdr->AccessMode, |
| 112 | sizeof(ArMemHdr->AccessMode)).rtrim(' ').getAsInteger(8, Ret)) |
Rafael Espindola | 8115e1d | 2013-07-09 12:49:24 +0000 | [diff] [blame] | 113 | llvm_unreachable("Access mode is not an octal number."); |
| 114 | return static_cast<sys::fs::perms>(Ret); |
| 115 | } |
| 116 | |
| 117 | sys::TimeValue ArchiveMemberHeader::getLastModified() const { |
| 118 | unsigned Seconds; |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 119 | if (StringRef(ArMemHdr->LastModified, |
| 120 | sizeof(ArMemHdr->LastModified)).rtrim(' ') |
Rafael Espindola | 8115e1d | 2013-07-09 12:49:24 +0000 | [diff] [blame] | 121 | .getAsInteger(10, Seconds)) |
| 122 | llvm_unreachable("Last modified time not a decimal number."); |
| 123 | |
| 124 | sys::TimeValue Ret; |
| 125 | Ret.fromEpochTime(Seconds); |
| 126 | return Ret; |
| 127 | } |
| 128 | |
| 129 | unsigned ArchiveMemberHeader::getUID() const { |
| 130 | unsigned Ret; |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 131 | StringRef User = StringRef(ArMemHdr->UID, sizeof(ArMemHdr->UID)).rtrim(' '); |
Saleem Abdulrasool | aecbdf7 | 2016-07-05 00:23:05 +0000 | [diff] [blame] | 132 | if (User.empty()) |
| 133 | return 0; |
| 134 | if (User.getAsInteger(10, Ret)) |
Rafael Espindola | 8115e1d | 2013-07-09 12:49:24 +0000 | [diff] [blame] | 135 | llvm_unreachable("UID time not a decimal number."); |
| 136 | return Ret; |
| 137 | } |
| 138 | |
| 139 | unsigned ArchiveMemberHeader::getGID() const { |
| 140 | unsigned Ret; |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 141 | StringRef Group = StringRef(ArMemHdr->GID, sizeof(ArMemHdr->GID)).rtrim(' '); |
Saleem Abdulrasool | aecbdf7 | 2016-07-05 00:23:05 +0000 | [diff] [blame] | 142 | if (Group.empty()) |
| 143 | return 0; |
| 144 | if (Group.getAsInteger(10, Ret)) |
Rafael Espindola | 8115e1d | 2013-07-09 12:49:24 +0000 | [diff] [blame] | 145 | llvm_unreachable("GID time not a decimal number."); |
| 146 | return Ret; |
| 147 | } |
| 148 | |
Rafael Espindola | 4335876 | 2015-10-31 21:44:42 +0000 | [diff] [blame] | 149 | Archive::Child::Child(const Archive *Parent, StringRef Data, |
| 150 | uint16_t StartOfFile) |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 151 | : Parent(Parent), Header(Parent, Data.data(), Data.size(), nullptr), |
| 152 | Data(Data), StartOfFile(StartOfFile) { |
| 153 | } |
Rafael Espindola | 4335876 | 2015-10-31 21:44:42 +0000 | [diff] [blame] | 154 | |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 155 | Archive::Child::Child(const Archive *Parent, const char *Start, Error *Err) |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 156 | : Parent(Parent), Header(Parent, Start, Parent->getData().size() - |
| 157 | (Start - Parent->getData().data()), Err) { |
Rafael Espindola | 0f3de64 | 2013-07-09 05:26:25 +0000 | [diff] [blame] | 158 | if (!Start) |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 159 | return; |
Lang Hames | 5e51a2e | 2016-07-22 16:11:25 +0000 | [diff] [blame] | 160 | ErrorAsOutParameter ErrAsOutParam(Err); |
Rafael Espindola | 0f3de64 | 2013-07-09 05:26:25 +0000 | [diff] [blame] | 161 | |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 162 | // If there was an error in the construction of the Header and we were passed |
| 163 | // Err that is not nullptr then just return with the error now set. |
| 164 | if (Err && *Err) |
| 165 | return; |
| 166 | |
| 167 | uint64_t Size = Header.getSizeOf(); |
Rafael Espindola | 9d10206 | 2014-12-16 01:43:41 +0000 | [diff] [blame] | 168 | Data = StringRef(Start, Size); |
Rafael Espindola | be9ab26 | 2015-07-22 19:34:26 +0000 | [diff] [blame] | 169 | if (!isThinMember()) { |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 170 | Expected<uint64_t> MemberSize = getRawSize(); |
| 171 | if (!MemberSize) { |
Lang Hames | 5e51a2e | 2016-07-22 16:11:25 +0000 | [diff] [blame] | 172 | if (Err) |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 173 | *Err = MemberSize.takeError(); |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 174 | return; |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 175 | } |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 176 | Size += MemberSize.get(); |
Rafael Espindola | be9ab26 | 2015-07-22 19:34:26 +0000 | [diff] [blame] | 177 | Data = StringRef(Start, Size); |
| 178 | } |
Rafael Espindola | 0f3de64 | 2013-07-09 05:26:25 +0000 | [diff] [blame] | 179 | |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 180 | // Setup StartOfFile and PaddingBytes. |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 181 | StartOfFile = Header.getSizeOf(); |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 182 | // Don't include attached name. |
Rafael Espindola | be9ab26 | 2015-07-22 19:34:26 +0000 | [diff] [blame] | 183 | StringRef Name = getRawName(); |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 184 | if (Name.startswith("#1/")) { |
| 185 | uint64_t NameSize; |
Vedant Kumar | 98372e3 | 2016-02-16 02:06:01 +0000 | [diff] [blame] | 186 | if (Name.substr(3).rtrim(' ').getAsInteger(10, NameSize)) |
Kevin Enderby | da9dd05 | 2015-10-21 17:13:20 +0000 | [diff] [blame] | 187 | llvm_unreachable("Long name length is not an integer"); |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 188 | StartOfFile += NameSize; |
| 189 | } |
| 190 | } |
| 191 | |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 192 | Expected<uint64_t> Archive::Child::getSize() const { |
Kevin Enderby | 1c1add4 | 2015-10-13 20:48:04 +0000 | [diff] [blame] | 193 | if (Parent->IsThin) { |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 194 | Expected<uint32_t> Size = Header.getSize(); |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 195 | if (!Size) |
| 196 | return Size.takeError(); |
Kevin Enderby | 1c1add4 | 2015-10-13 20:48:04 +0000 | [diff] [blame] | 197 | return Size.get(); |
| 198 | } |
Rafael Espindola | 9d10206 | 2014-12-16 01:43:41 +0000 | [diff] [blame] | 199 | return Data.size() - StartOfFile; |
| 200 | } |
| 201 | |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 202 | Expected<uint64_t> Archive::Child::getRawSize() const { |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 203 | return Header.getSize(); |
Kevin Enderby | 13023a1 | 2015-01-15 23:19:11 +0000 | [diff] [blame] | 204 | } |
| 205 | |
Rafael Espindola | be9ab26 | 2015-07-22 19:34:26 +0000 | [diff] [blame] | 206 | bool Archive::Child::isThinMember() const { |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 207 | StringRef Name = Header.getName(); |
Rafael Espindola | be9ab26 | 2015-07-22 19:34:26 +0000 | [diff] [blame] | 208 | return Parent->IsThin && Name != "/" && Name != "//"; |
| 209 | } |
| 210 | |
Rafael Espindola | 694210c | 2016-05-02 13:45:06 +0000 | [diff] [blame] | 211 | ErrorOr<std::string> Archive::Child::getFullName() const { |
| 212 | assert(isThinMember()); |
| 213 | ErrorOr<StringRef> NameOrErr = getName(); |
| 214 | if (std::error_code EC = NameOrErr.getError()) |
| 215 | return EC; |
| 216 | StringRef Name = *NameOrErr; |
| 217 | if (sys::path::is_absolute(Name)) |
| 218 | return Name; |
| 219 | |
| 220 | SmallString<128> FullName = sys::path::parent_path( |
| 221 | Parent->getMemoryBufferRef().getBufferIdentifier()); |
| 222 | sys::path::append(FullName, Name); |
| 223 | return StringRef(FullName); |
| 224 | } |
| 225 | |
Rafael Espindola | 4b83cb5 | 2015-07-14 22:18:43 +0000 | [diff] [blame] | 226 | ErrorOr<StringRef> Archive::Child::getBuffer() const { |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 227 | if (!isThinMember()) { |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 228 | Expected<uint32_t> Size = getSize(); |
| 229 | if (!Size) |
| 230 | return errorToErrorCode(Size.takeError()); |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 231 | return StringRef(Data.data() + StartOfFile, Size.get()); |
| 232 | } |
Rafael Espindola | 694210c | 2016-05-02 13:45:06 +0000 | [diff] [blame] | 233 | ErrorOr<std::string> FullNameOrEr = getFullName(); |
| 234 | if (std::error_code EC = FullNameOrEr.getError()) |
Rafael Espindola | 4b83cb5 | 2015-07-14 22:18:43 +0000 | [diff] [blame] | 235 | return EC; |
Rafael Espindola | 694210c | 2016-05-02 13:45:06 +0000 | [diff] [blame] | 236 | const std::string &FullName = *FullNameOrEr; |
Rafael Espindola | 4b83cb5 | 2015-07-14 22:18:43 +0000 | [diff] [blame] | 237 | ErrorOr<std::unique_ptr<MemoryBuffer>> Buf = MemoryBuffer::getFile(FullName); |
| 238 | if (std::error_code EC = Buf.getError()) |
| 239 | return EC; |
| 240 | Parent->ThinBuffers.push_back(std::move(*Buf)); |
| 241 | return Parent->ThinBuffers.back()->getBuffer(); |
| 242 | } |
| 243 | |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 244 | Expected<Archive::Child> Archive::Child::getNext() const { |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 245 | size_t SpaceToSkip = Data.size(); |
| 246 | // If it's odd, add 1 to make it even. |
| 247 | if (SpaceToSkip & 1) |
Kevin Enderby | da9dd05 | 2015-10-21 17:13:20 +0000 | [diff] [blame] | 248 | ++SpaceToSkip; |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 249 | |
Kevin Enderby | da9dd05 | 2015-10-21 17:13:20 +0000 | [diff] [blame] | 250 | const char *NextLoc = Data.data() + SpaceToSkip; |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 251 | |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 252 | // Check to see if this is at the end of the archive. |
| 253 | if (NextLoc == Parent->Data.getBufferEnd()) |
| 254 | return Child(Parent, nullptr, nullptr); |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 255 | |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 256 | // Check to see if this is past the end of the archive. |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 257 | if (NextLoc > Parent->Data.getBufferEnd()) { |
| 258 | Twine Msg("offset to next archive member past the end of the archive after " |
| 259 | "member "); |
| 260 | ErrorOr<StringRef> NameOrErr = getName(); |
| 261 | if (NameOrErr.getError()) { |
| 262 | uint64_t Offset = Data.data() - Parent->getData().data(); |
| 263 | return malformedError(Msg + "at offset " + Twine(Offset)); |
| 264 | } else |
| 265 | return malformedError(Msg + Twine(NameOrErr.get())); |
| 266 | } |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 267 | |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 268 | Error Err; |
| 269 | Child Ret(Parent, NextLoc, &Err); |
| 270 | if (Err) |
| 271 | return std::move(Err); |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 272 | return Ret; |
Rafael Espindola | 747bc07 | 2013-07-09 03:39:35 +0000 | [diff] [blame] | 273 | } |
| 274 | |
Kevin Enderby | 13023a1 | 2015-01-15 23:19:11 +0000 | [diff] [blame] | 275 | uint64_t Archive::Child::getChildOffset() const { |
| 276 | const char *a = Parent->Data.getBuffer().data(); |
| 277 | const char *c = Data.data(); |
| 278 | uint64_t offset = c - a; |
| 279 | return offset; |
| 280 | } |
| 281 | |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 282 | ErrorOr<StringRef> Archive::Child::getName() const { |
Rafael Espindola | 6cc2dc7 | 2013-07-05 03:35:15 +0000 | [diff] [blame] | 283 | StringRef name = getRawName(); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 284 | // Check if it's a special name. |
| 285 | if (name[0] == '/') { |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 286 | if (name.size() == 1) // Linker member. |
| 287 | return name; |
| 288 | if (name.size() == 2 && name[1] == '/') // String table. |
| 289 | return name; |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 290 | // It's a long name. |
| 291 | // Get the offset. |
Michael J. Spencer | 04614ff | 2013-01-10 00:07:38 +0000 | [diff] [blame] | 292 | std::size_t offset; |
Vedant Kumar | 98372e3 | 2016-02-16 02:06:01 +0000 | [diff] [blame] | 293 | if (name.substr(1).rtrim(' ').getAsInteger(10, offset)) |
Kevin Enderby | da9dd05 | 2015-10-21 17:13:20 +0000 | [diff] [blame] | 294 | llvm_unreachable("Long name offset is not an integer"); |
Rafael Espindola | 8f23882 | 2015-10-31 20:06:13 +0000 | [diff] [blame] | 295 | |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 296 | // Verify it. |
Rafael Espindola | 8f23882 | 2015-10-31 20:06:13 +0000 | [diff] [blame] | 297 | if (offset >= Parent->StringTable.size()) |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 298 | return object_error::parse_failed; |
Rafael Espindola | 8f23882 | 2015-10-31 20:06:13 +0000 | [diff] [blame] | 299 | const char *addr = Parent->StringTable.begin() + offset; |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 300 | |
Rafael Espindola | c60d0d2 | 2015-07-13 23:07:05 +0000 | [diff] [blame] | 301 | // GNU long file names end with a "/\n". |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 302 | if (Parent->kind() == K_GNU || Parent->kind() == K_MIPS64) { |
Rafael Espindola | c60d0d2 | 2015-07-13 23:07:05 +0000 | [diff] [blame] | 303 | StringRef::size_type End = StringRef(addr).find('\n'); |
| 304 | return StringRef(addr, End - 1); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 305 | } |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 306 | return StringRef(addr); |
Michael J. Spencer | 9aaa852 | 2011-10-25 22:30:42 +0000 | [diff] [blame] | 307 | } else if (name.startswith("#1/")) { |
Michael J. Spencer | 751fd88 | 2013-01-09 22:58:43 +0000 | [diff] [blame] | 308 | uint64_t name_size; |
Vedant Kumar | 98372e3 | 2016-02-16 02:06:01 +0000 | [diff] [blame] | 309 | if (name.substr(3).rtrim(' ').getAsInteger(10, name_size)) |
Kevin Enderby | da9dd05 | 2015-10-21 17:13:20 +0000 | [diff] [blame] | 310 | llvm_unreachable("Long name length is not an ingeter"); |
Kevin Enderby | 95b0842 | 2016-07-25 20:36:36 +0000 | [diff] [blame] | 311 | return Data.substr(Header.getSizeOf(), name_size).rtrim('\0'); |
Kevin Enderby | ac9e155 | 2016-05-17 17:10:12 +0000 | [diff] [blame] | 312 | } else { |
| 313 | // It is not a long name so trim the blanks at the end of the name. |
| 314 | if (name[name.size() - 1] != '/') { |
| 315 | return name.rtrim(' '); |
| 316 | } |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 317 | } |
| 318 | // It's a simple name. |
| 319 | if (name[name.size() - 1] == '/') |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 320 | return name.substr(0, name.size() - 1); |
| 321 | return name; |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 322 | } |
| 323 | |
Rafael Espindola | 48af1c2 | 2014-08-19 18:44:46 +0000 | [diff] [blame] | 324 | ErrorOr<MemoryBufferRef> Archive::Child::getMemoryBufferRef() const { |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 325 | ErrorOr<StringRef> NameOrErr = getName(); |
| 326 | if (std::error_code EC = NameOrErr.getError()) |
Rafael Espindola | 63da295 | 2014-01-15 19:37:43 +0000 | [diff] [blame] | 327 | return EC; |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 328 | StringRef Name = NameOrErr.get(); |
Rafael Espindola | 4b83cb5 | 2015-07-14 22:18:43 +0000 | [diff] [blame] | 329 | ErrorOr<StringRef> Buf = getBuffer(); |
| 330 | if (std::error_code EC = Buf.getError()) |
| 331 | return EC; |
| 332 | return MemoryBufferRef(*Buf, Name); |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 333 | } |
| 334 | |
Kevin Enderby | ac9e155 | 2016-05-17 17:10:12 +0000 | [diff] [blame] | 335 | Expected<std::unique_ptr<Binary>> |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 336 | Archive::Child::getAsBinary(LLVMContext *Context) const { |
Rafael Espindola | 48af1c2 | 2014-08-19 18:44:46 +0000 | [diff] [blame] | 337 | ErrorOr<MemoryBufferRef> BuffOrErr = getMemoryBufferRef(); |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 338 | if (std::error_code EC = BuffOrErr.getError()) |
Kevin Enderby | ac9e155 | 2016-05-17 17:10:12 +0000 | [diff] [blame] | 339 | return errorCodeToError(EC); |
Rafael Espindola | c3f9b5a | 2014-06-23 21:53:12 +0000 | [diff] [blame] | 340 | |
Kevin Enderby | 3fcdf6a | 2016-04-06 22:14:09 +0000 | [diff] [blame] | 341 | auto BinaryOrErr = createBinary(BuffOrErr.get(), Context); |
| 342 | if (BinaryOrErr) |
| 343 | return std::move(*BinaryOrErr); |
Kevin Enderby | ac9e155 | 2016-05-17 17:10:12 +0000 | [diff] [blame] | 344 | return BinaryOrErr.takeError(); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 345 | } |
| 346 | |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 347 | Expected<std::unique_ptr<Archive>> Archive::create(MemoryBufferRef Source) { |
| 348 | Error Err; |
| 349 | std::unique_ptr<Archive> Ret(new Archive(Source, Err)); |
| 350 | if (Err) |
| 351 | return std::move(Err); |
Rafael Espindola | f557713 | 2014-07-31 03:36:00 +0000 | [diff] [blame] | 352 | return std::move(Ret); |
Rafael Espindola | 692410e | 2014-01-21 23:06:54 +0000 | [diff] [blame] | 353 | } |
| 354 | |
Rafael Espindola | 4335876 | 2015-10-31 21:44:42 +0000 | [diff] [blame] | 355 | void Archive::setFirstRegular(const Child &C) { |
| 356 | FirstRegularData = C.Data; |
| 357 | FirstRegularStartOfFile = C.StartOfFile; |
| 358 | } |
| 359 | |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 360 | Archive::Archive(MemoryBufferRef Source, Error &Err) |
Rafael Espindola | 4335876 | 2015-10-31 21:44:42 +0000 | [diff] [blame] | 361 | : Binary(Binary::ID_Archive, Source) { |
Lang Hames | 5e51a2e | 2016-07-22 16:11:25 +0000 | [diff] [blame] | 362 | ErrorAsOutParameter ErrAsOutParam(&Err); |
Rafael Espindola | 9d10206 | 2014-12-16 01:43:41 +0000 | [diff] [blame] | 363 | StringRef Buffer = Data.getBuffer(); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 364 | // Check for sufficient magic. |
Rafael Espindola | 9d10206 | 2014-12-16 01:43:41 +0000 | [diff] [blame] | 365 | if (Buffer.startswith(ThinMagic)) { |
| 366 | IsThin = true; |
| 367 | } else if (Buffer.startswith(Magic)) { |
| 368 | IsThin = false; |
| 369 | } else { |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 370 | Err = make_error<GenericBinaryError>("File too small to be an archive", |
| 371 | object_error::invalid_file_type); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 372 | return; |
| 373 | } |
| 374 | |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 375 | // Get the special members. |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 376 | child_iterator I = child_begin(Err, false); |
| 377 | if (Err) |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 378 | return; |
| 379 | child_iterator E = child_end(); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 380 | |
Rafael Espindola | cc37120 | 2016-06-24 13:47:29 +0000 | [diff] [blame] | 381 | // This is at least a valid empty archive. Since an empty archive is the |
| 382 | // same in all formats, just claim it to be gnu to make sure Format is |
| 383 | // initialized. |
| 384 | Format = K_GNU; |
| 385 | |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 386 | if (I == E) { |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 387 | Err = Error::success(); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 388 | return; |
| 389 | } |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 390 | const Child *C = &*I; |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 391 | |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 392 | auto Increment = [&]() { |
| 393 | ++I; |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 394 | if (Err) |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 395 | return true; |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 396 | C = &*I; |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 397 | return false; |
| 398 | }; |
| 399 | |
| 400 | StringRef Name = C->getRawName(); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 401 | |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 402 | // Below is the pattern that is used to figure out the archive format |
| 403 | // GNU archive format |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 404 | // First member : / (may exist, if it exists, points to the symbol table ) |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 405 | // Second member : // (may exist, if it exists, points to the string table) |
| 406 | // Note : The string table is used if the filename exceeds 15 characters |
| 407 | // BSD archive format |
Rafael Espindola | 5550992 | 2013-07-10 22:07:59 +0000 | [diff] [blame] | 408 | // First member : __.SYMDEF or "__.SYMDEF SORTED" (the symbol table) |
| 409 | // There is no string table, if the filename exceeds 15 characters or has a |
| 410 | // embedded space, the filename has #1/<size>, The size represents the size |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 411 | // of the filename that needs to be read after the archive header |
| 412 | // COFF archive format |
| 413 | // First member : / |
| 414 | // Second member : / (provides a directory of symbols) |
Rui Ueyama | f4d0a8c | 2013-06-03 00:27:03 +0000 | [diff] [blame] | 415 | // Third member : // (may exist, if it exists, contains the string table) |
| 416 | // Note: Microsoft PE/COFF Spec 8.3 says that the third member is present |
| 417 | // even if the string table is empty. However, lib.exe does not in fact |
| 418 | // seem to create the third member if there's no member whose filename |
| 419 | // exceeds 15 characters. So the third member is optional. |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 420 | |
Kevin Enderby | ae108ff | 2016-06-17 22:16:06 +0000 | [diff] [blame] | 421 | if (Name == "__.SYMDEF" || Name == "__.SYMDEF_64") { |
| 422 | if (Name == "__.SYMDEF") |
| 423 | Format = K_BSD; |
| 424 | else // Name == "__.SYMDEF_64" |
| 425 | Format = K_DARWIN64; |
Rafael Espindola | 4a782fb | 2015-10-31 21:03:29 +0000 | [diff] [blame] | 426 | // We know that the symbol table is not an external file, so we just assert |
| 427 | // there is no error. |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 428 | SymbolTable = *C->getBuffer(); |
| 429 | if (Increment()) |
| 430 | return; |
| 431 | setFirstRegular(*C); |
| 432 | |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 433 | Err = Error::success(); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 434 | return; |
| 435 | } |
| 436 | |
Rafael Espindola | 5550992 | 2013-07-10 22:07:59 +0000 | [diff] [blame] | 437 | if (Name.startswith("#1/")) { |
| 438 | Format = K_BSD; |
| 439 | // We know this is BSD, so getName will work since there is no string table. |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 440 | ErrorOr<StringRef> NameOrErr = C->getName(); |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 441 | if (auto ec = NameOrErr.getError()) { |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 442 | Err = errorCodeToError(ec); |
Rafael Espindola | 5550992 | 2013-07-10 22:07:59 +0000 | [diff] [blame] | 443 | return; |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 444 | } |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 445 | Name = NameOrErr.get(); |
Nick Kledzik | f44dbda | 2014-11-12 01:37:45 +0000 | [diff] [blame] | 446 | if (Name == "__.SYMDEF SORTED" || Name == "__.SYMDEF") { |
Rafael Espindola | 4a782fb | 2015-10-31 21:03:29 +0000 | [diff] [blame] | 447 | // We know that the symbol table is not an external file, so we just |
| 448 | // assert there is no error. |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 449 | SymbolTable = *C->getBuffer(); |
| 450 | if (Increment()) |
| 451 | return; |
Rafael Espindola | 3e2b21c | 2013-07-12 20:21:39 +0000 | [diff] [blame] | 452 | } |
Kevin Enderby | ae108ff | 2016-06-17 22:16:06 +0000 | [diff] [blame] | 453 | else if (Name == "__.SYMDEF_64 SORTED" || Name == "__.SYMDEF_64") { |
| 454 | Format = K_DARWIN64; |
| 455 | // We know that the symbol table is not an external file, so we just |
| 456 | // assert there is no error. |
| 457 | SymbolTable = *C->getBuffer(); |
| 458 | if (Increment()) |
| 459 | return; |
| 460 | } |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 461 | setFirstRegular(*C); |
Rafael Espindola | 5550992 | 2013-07-10 22:07:59 +0000 | [diff] [blame] | 462 | return; |
| 463 | } |
| 464 | |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 465 | // MIPS 64-bit ELF archives use a special format of a symbol table. |
| 466 | // This format is marked by `ar_name` field equals to "/SYM64/". |
| 467 | // For detailed description see page 96 in the following document: |
| 468 | // http://techpubs.sgi.com/library/manuals/4000/007-4658-001/pdf/007-4658-001.pdf |
| 469 | |
| 470 | bool has64SymTable = false; |
| 471 | if (Name == "/" || Name == "/SYM64/") { |
Rafael Espindola | 4a782fb | 2015-10-31 21:03:29 +0000 | [diff] [blame] | 472 | // We know that the symbol table is not an external file, so we just assert |
| 473 | // there is no error. |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 474 | SymbolTable = *C->getBuffer(); |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 475 | if (Name == "/SYM64/") |
| 476 | has64SymTable = true; |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 477 | |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 478 | if (Increment()) |
| 479 | return; |
| 480 | if (I == E) { |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 481 | Err = Error::success(); |
Michael J. Spencer | 04614ff | 2013-01-10 00:07:38 +0000 | [diff] [blame] | 482 | return; |
| 483 | } |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 484 | Name = C->getRawName(); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 485 | } |
| 486 | |
Rafael Espindola | 6cc2dc7 | 2013-07-05 03:35:15 +0000 | [diff] [blame] | 487 | if (Name == "//") { |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 488 | Format = has64SymTable ? K_MIPS64 : K_GNU; |
Rafael Espindola | 8f23882 | 2015-10-31 20:06:13 +0000 | [diff] [blame] | 489 | // The string table is never an external member, so we just assert on the |
| 490 | // ErrorOr. |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 491 | StringTable = *C->getBuffer(); |
| 492 | if (Increment()) |
| 493 | return; |
| 494 | setFirstRegular(*C); |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 495 | Err = Error::success(); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 496 | return; |
| 497 | } |
| 498 | |
Rafael Espindola | 6cc2dc7 | 2013-07-05 03:35:15 +0000 | [diff] [blame] | 499 | if (Name[0] != '/') { |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 500 | Format = has64SymTable ? K_MIPS64 : K_GNU; |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 501 | setFirstRegular(*C); |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 502 | Err = Error::success(); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 503 | return; |
| 504 | } |
| 505 | |
Rafael Espindola | 6cc2dc7 | 2013-07-05 03:35:15 +0000 | [diff] [blame] | 506 | if (Name != "/") { |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 507 | Err = errorCodeToError(object_error::parse_failed); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 508 | return; |
| 509 | } |
| 510 | |
| 511 | Format = K_COFF; |
Rafael Espindola | 4a782fb | 2015-10-31 21:03:29 +0000 | [diff] [blame] | 512 | // We know that the symbol table is not an external file, so we just assert |
| 513 | // there is no error. |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 514 | SymbolTable = *C->getBuffer(); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 515 | |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 516 | if (Increment()) |
| 517 | return; |
| 518 | |
| 519 | if (I == E) { |
| 520 | setFirstRegular(*C); |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 521 | Err = Error::success(); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 522 | return; |
| 523 | } |
| 524 | |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 525 | Name = C->getRawName(); |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 526 | |
Rafael Espindola | 3e2b21c | 2013-07-12 20:21:39 +0000 | [diff] [blame] | 527 | if (Name == "//") { |
Rafael Espindola | 8f23882 | 2015-10-31 20:06:13 +0000 | [diff] [blame] | 528 | // The string table is never an external member, so we just assert on the |
| 529 | // ErrorOr. |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 530 | StringTable = *C->getBuffer(); |
| 531 | if (Increment()) |
| 532 | return; |
Rafael Espindola | 3e2b21c | 2013-07-12 20:21:39 +0000 | [diff] [blame] | 533 | } |
Rafael Espindola | 88ae7dd | 2013-07-03 15:57:14 +0000 | [diff] [blame] | 534 | |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 535 | setFirstRegular(*C); |
Kevin Enderby | c60a321 | 2016-06-29 20:35:44 +0000 | [diff] [blame] | 536 | Err = Error::success(); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 537 | } |
| 538 | |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 539 | Archive::child_iterator Archive::child_begin(Error &Err, |
| 540 | bool SkipInternal) const { |
Rafael Espindola | 48af1c2 | 2014-08-19 18:44:46 +0000 | [diff] [blame] | 541 | if (Data.getBufferSize() == 8) // empty archive. |
Rafael Espindola | 23a9750 | 2014-01-21 16:09:45 +0000 | [diff] [blame] | 542 | return child_end(); |
Rafael Espindola | 3e2b21c | 2013-07-12 20:21:39 +0000 | [diff] [blame] | 543 | |
| 544 | if (SkipInternal) |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 545 | return child_iterator(Child(this, FirstRegularData, |
| 546 | FirstRegularStartOfFile), |
| 547 | &Err); |
Rafael Espindola | 3e2b21c | 2013-07-12 20:21:39 +0000 | [diff] [blame] | 548 | |
Rafael Espindola | 48af1c2 | 2014-08-19 18:44:46 +0000 | [diff] [blame] | 549 | const char *Loc = Data.getBufferStart() + strlen(Magic); |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 550 | Child C(this, Loc, &Err); |
| 551 | if (Err) |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 552 | return child_end(); |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 553 | return child_iterator(C, &Err); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 554 | } |
| 555 | |
Rafael Espindola | 23a9750 | 2014-01-21 16:09:45 +0000 | [diff] [blame] | 556 | Archive::child_iterator Archive::child_end() const { |
Lang Hames | fc20962 | 2016-07-14 02:24:01 +0000 | [diff] [blame] | 557 | return child_iterator(Child(this, nullptr, nullptr), nullptr); |
Michael J. Spencer | d3b7b12 | 2011-09-27 19:36:55 +0000 | [diff] [blame] | 558 | } |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 559 | |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 560 | StringRef Archive::Symbol::getName() const { |
Rafael Espindola | 2b05416 | 2015-07-14 01:06:16 +0000 | [diff] [blame] | 561 | return Parent->getSymbolTable().begin() + StringIndex; |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 562 | } |
| 563 | |
Rafael Espindola | cc86d82 | 2015-11-03 01:20:44 +0000 | [diff] [blame] | 564 | ErrorOr<Archive::Child> Archive::Symbol::getMember() const { |
Rafael Espindola | 2b05416 | 2015-07-14 01:06:16 +0000 | [diff] [blame] | 565 | const char *Buf = Parent->getSymbolTable().begin(); |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 566 | const char *Offsets = Buf; |
Kevin Enderby | ae108ff | 2016-06-17 22:16:06 +0000 | [diff] [blame] | 567 | if (Parent->kind() == K_MIPS64 || Parent->kind() == K_DARWIN64) |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 568 | Offsets += sizeof(uint64_t); |
| 569 | else |
| 570 | Offsets += sizeof(uint32_t); |
Michael J. Spencer | 4e92d5b | 2012-11-14 00:04:13 +0000 | [diff] [blame] | 571 | uint32_t Offset = 0; |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 572 | if (Parent->kind() == K_GNU) { |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 573 | Offset = read32be(Offsets + SymbolIndex * 4); |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 574 | } else if (Parent->kind() == K_MIPS64) { |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 575 | Offset = read64be(Offsets + SymbolIndex * 8); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 576 | } else if (Parent->kind() == K_BSD) { |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 577 | // The SymbolIndex is an index into the ranlib structs that start at |
| 578 | // Offsets (the first uint32_t is the number of bytes of the ranlib |
| 579 | // structs). The ranlib structs are a pair of uint32_t's the first |
| 580 | // being a string table offset and the second being the offset into |
| 581 | // the archive of the member that defines the symbol. Which is what |
| 582 | // is needed here. |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 583 | Offset = read32le(Offsets + SymbolIndex * 8 + 4); |
Kevin Enderby | ae108ff | 2016-06-17 22:16:06 +0000 | [diff] [blame] | 584 | } else if (Parent->kind() == K_DARWIN64) { |
| 585 | // The SymbolIndex is an index into the ranlib_64 structs that start at |
| 586 | // Offsets (the first uint64_t is the number of bytes of the ranlib_64 |
| 587 | // structs). The ranlib_64 structs are a pair of uint64_t's the first |
| 588 | // being a string table offset and the second being the offset into |
| 589 | // the archive of the member that defines the symbol. Which is what |
| 590 | // is needed here. |
| 591 | Offset = read64le(Offsets + SymbolIndex * 16 + 8); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 592 | } else { |
Michael J. Spencer | 4e92d5b | 2012-11-14 00:04:13 +0000 | [diff] [blame] | 593 | // Skip offsets. |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 594 | uint32_t MemberCount = read32le(Buf); |
| 595 | Buf += MemberCount * 4 + 4; |
Michael J. Spencer | 4e92d5b | 2012-11-14 00:04:13 +0000 | [diff] [blame] | 596 | |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 597 | uint32_t SymbolCount = read32le(Buf); |
Michael J. Spencer | 4e92d5b | 2012-11-14 00:04:13 +0000 | [diff] [blame] | 598 | if (SymbolIndex >= SymbolCount) |
| 599 | return object_error::parse_failed; |
| 600 | |
Matt Beaumont-Gay | 68e0b6a | 2012-11-14 00:21:27 +0000 | [diff] [blame] | 601 | // Skip SymbolCount to get to the indices table. |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 602 | const char *Indices = Buf + 4; |
Michael J. Spencer | 4e92d5b | 2012-11-14 00:04:13 +0000 | [diff] [blame] | 603 | |
| 604 | // Get the index of the offset in the file member offset table for this |
| 605 | // symbol. |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 606 | uint16_t OffsetIndex = read16le(Indices + SymbolIndex * 2); |
Michael J. Spencer | 4e92d5b | 2012-11-14 00:04:13 +0000 | [diff] [blame] | 607 | // Subtract 1 since OffsetIndex is 1 based. |
| 608 | --OffsetIndex; |
| 609 | |
| 610 | if (OffsetIndex >= MemberCount) |
| 611 | return object_error::parse_failed; |
| 612 | |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 613 | Offset = read32le(Offsets + OffsetIndex * 4); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 614 | } |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 615 | |
Michael J. Spencer | 4e92d5b | 2012-11-14 00:04:13 +0000 | [diff] [blame] | 616 | const char *Loc = Parent->getData().begin() + Offset; |
Kevin Enderby | 6524bd8 | 2016-07-19 20:47:07 +0000 | [diff] [blame] | 617 | Error Err; |
| 618 | Child C(Parent, Loc, &Err); |
| 619 | if (Err) |
| 620 | return errorToErrorCode(std::move(Err)); |
Kevin Enderby | 7a96942 | 2015-11-05 19:24:56 +0000 | [diff] [blame] | 621 | return C; |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 622 | } |
| 623 | |
| 624 | Archive::Symbol Archive::Symbol::getNext() const { |
| 625 | Symbol t(*this); |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 626 | if (Parent->kind() == K_BSD) { |
| 627 | // t.StringIndex is an offset from the start of the __.SYMDEF or |
| 628 | // "__.SYMDEF SORTED" member into the string table for the ranlib |
| 629 | // struct indexed by t.SymbolIndex . To change t.StringIndex to the |
| 630 | // offset in the string table for t.SymbolIndex+1 we subtract the |
| 631 | // its offset from the start of the string table for t.SymbolIndex |
| 632 | // and add the offset of the string table for t.SymbolIndex+1. |
| 633 | |
| 634 | // The __.SYMDEF or "__.SYMDEF SORTED" member starts with a uint32_t |
| 635 | // which is the number of bytes of ranlib structs that follow. The ranlib |
| 636 | // structs are a pair of uint32_t's the first being a string table offset |
| 637 | // and the second being the offset into the archive of the member that |
| 638 | // define the symbol. After that the next uint32_t is the byte count of |
| 639 | // the string table followed by the string table. |
Rafael Espindola | 2b05416 | 2015-07-14 01:06:16 +0000 | [diff] [blame] | 640 | const char *Buf = Parent->getSymbolTable().begin(); |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 641 | uint32_t RanlibCount = 0; |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 642 | RanlibCount = read32le(Buf) / 8; |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 643 | // If t.SymbolIndex + 1 will be past the count of symbols (the RanlibCount) |
| 644 | // don't change the t.StringIndex as we don't want to reference a ranlib |
| 645 | // past RanlibCount. |
| 646 | if (t.SymbolIndex + 1 < RanlibCount) { |
| 647 | const char *Ranlibs = Buf + 4; |
| 648 | uint32_t CurRanStrx = 0; |
| 649 | uint32_t NextRanStrx = 0; |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 650 | CurRanStrx = read32le(Ranlibs + t.SymbolIndex * 8); |
| 651 | NextRanStrx = read32le(Ranlibs + (t.SymbolIndex + 1) * 8); |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 652 | t.StringIndex -= CurRanStrx; |
| 653 | t.StringIndex += NextRanStrx; |
| 654 | } |
| 655 | } else { |
| 656 | // Go to one past next null. |
Rafael Espindola | 2b05416 | 2015-07-14 01:06:16 +0000 | [diff] [blame] | 657 | t.StringIndex = Parent->getSymbolTable().find('\0', t.StringIndex) + 1; |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 658 | } |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 659 | ++t.SymbolIndex; |
| 660 | return t; |
| 661 | } |
| 662 | |
Rafael Espindola | 23a9750 | 2014-01-21 16:09:45 +0000 | [diff] [blame] | 663 | Archive::symbol_iterator Archive::symbol_begin() const { |
Rafael Espindola | b6b5f52e | 2013-07-29 12:40:31 +0000 | [diff] [blame] | 664 | if (!hasSymbolTable()) |
Rafael Espindola | fbcafc0 | 2013-07-10 20:14:22 +0000 | [diff] [blame] | 665 | return symbol_iterator(Symbol(this, 0, 0)); |
| 666 | |
Rafael Espindola | 2b05416 | 2015-07-14 01:06:16 +0000 | [diff] [blame] | 667 | const char *buf = getSymbolTable().begin(); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 668 | if (kind() == K_GNU) { |
| 669 | uint32_t symbol_count = 0; |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 670 | symbol_count = read32be(buf); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 671 | buf += sizeof(uint32_t) + (symbol_count * (sizeof(uint32_t))); |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 672 | } else if (kind() == K_MIPS64) { |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 673 | uint64_t symbol_count = read64be(buf); |
Simon Atanasyan | 1d902b7 | 2015-02-17 18:54:22 +0000 | [diff] [blame] | 674 | buf += sizeof(uint64_t) + (symbol_count * (sizeof(uint64_t))); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 675 | } else if (kind() == K_BSD) { |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 676 | // The __.SYMDEF or "__.SYMDEF SORTED" member starts with a uint32_t |
| 677 | // which is the number of bytes of ranlib structs that follow. The ranlib |
| 678 | // structs are a pair of uint32_t's the first being a string table offset |
| 679 | // and the second being the offset into the archive of the member that |
| 680 | // define the symbol. After that the next uint32_t is the byte count of |
| 681 | // the string table followed by the string table. |
| 682 | uint32_t ranlib_count = 0; |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 683 | ranlib_count = read32le(buf) / 8; |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 684 | const char *ranlibs = buf + 4; |
| 685 | uint32_t ran_strx = 0; |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 686 | ran_strx = read32le(ranlibs); |
Kevin Enderby | 8c50dbb | 2014-07-08 22:10:02 +0000 | [diff] [blame] | 687 | buf += sizeof(uint32_t) + (ranlib_count * (2 * (sizeof(uint32_t)))); |
| 688 | // Skip the byte count of the string table. |
| 689 | buf += sizeof(uint32_t); |
| 690 | buf += ran_strx; |
Kevin Enderby | ae108ff | 2016-06-17 22:16:06 +0000 | [diff] [blame] | 691 | } else if (kind() == K_DARWIN64) { |
| 692 | // The __.SYMDEF_64 or "__.SYMDEF_64 SORTED" member starts with a uint64_t |
| 693 | // which is the number of bytes of ranlib_64 structs that follow. The |
| 694 | // ranlib_64 structs are a pair of uint64_t's the first being a string |
| 695 | // table offset and the second being the offset into the archive of the |
| 696 | // member that define the symbol. After that the next uint64_t is the byte |
| 697 | // count of the string table followed by the string table. |
| 698 | uint64_t ranlib_count = 0; |
| 699 | ranlib_count = read64le(buf) / 16; |
| 700 | const char *ranlibs = buf + 8; |
| 701 | uint64_t ran_strx = 0; |
| 702 | ran_strx = read64le(ranlibs); |
| 703 | buf += sizeof(uint64_t) + (ranlib_count * (2 * (sizeof(uint64_t)))); |
| 704 | // Skip the byte count of the string table. |
| 705 | buf += sizeof(uint64_t); |
| 706 | buf += ran_strx; |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 707 | } else { |
| 708 | uint32_t member_count = 0; |
| 709 | uint32_t symbol_count = 0; |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 710 | member_count = read32le(buf); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 711 | buf += 4 + (member_count * 4); // Skip offsets. |
Rui Ueyama | 3206b79 | 2015-03-02 21:19:12 +0000 | [diff] [blame] | 712 | symbol_count = read32le(buf); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 713 | buf += 4 + (symbol_count * 2); // Skip indices. |
| 714 | } |
Rafael Espindola | 2b05416 | 2015-07-14 01:06:16 +0000 | [diff] [blame] | 715 | uint32_t string_start_offset = buf - getSymbolTable().begin(); |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 716 | return symbol_iterator(Symbol(this, 0, string_start_offset)); |
| 717 | } |
| 718 | |
Rafael Espindola | 23a9750 | 2014-01-21 16:09:45 +0000 | [diff] [blame] | 719 | Archive::symbol_iterator Archive::symbol_end() const { |
Rui Ueyama | 407e097 | 2015-05-26 16:20:40 +0000 | [diff] [blame] | 720 | return symbol_iterator(Symbol(this, getNumberOfSymbols(), 0)); |
| 721 | } |
Rafael Espindola | fbcafc0 | 2013-07-10 20:14:22 +0000 | [diff] [blame] | 722 | |
Rui Ueyama | 407e097 | 2015-05-26 16:20:40 +0000 | [diff] [blame] | 723 | uint32_t Archive::getNumberOfSymbols() const { |
Rafael Espindola | 483ad20 | 2015-10-08 18:06:20 +0000 | [diff] [blame] | 724 | if (!hasSymbolTable()) |
| 725 | return 0; |
Rafael Espindola | 2b05416 | 2015-07-14 01:06:16 +0000 | [diff] [blame] | 726 | const char *buf = getSymbolTable().begin(); |
Rui Ueyama | 407e097 | 2015-05-26 16:20:40 +0000 | [diff] [blame] | 727 | if (kind() == K_GNU) |
| 728 | return read32be(buf); |
| 729 | if (kind() == K_MIPS64) |
| 730 | return read64be(buf); |
| 731 | if (kind() == K_BSD) |
| 732 | return read32le(buf) / 8; |
Kevin Enderby | ae108ff | 2016-06-17 22:16:06 +0000 | [diff] [blame] | 733 | if (kind() == K_DARWIN64) |
| 734 | return read64le(buf) / 16; |
Rui Ueyama | 407e097 | 2015-05-26 16:20:40 +0000 | [diff] [blame] | 735 | uint32_t member_count = 0; |
| 736 | member_count = read32le(buf); |
| 737 | buf += 4 + (member_count * 4); // Skip offsets. |
| 738 | return read32le(buf); |
Michael J. Spencer | e03ea9c | 2011-11-02 19:33:12 +0000 | [diff] [blame] | 739 | } |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 740 | |
Lang Hames | 69f4902 | 2016-07-14 20:44:27 +0000 | [diff] [blame] | 741 | Expected<Optional<Archive::Child>> Archive::findSym(StringRef name) const { |
Rafael Espindola | 23a9750 | 2014-01-21 16:09:45 +0000 | [diff] [blame] | 742 | Archive::symbol_iterator bs = symbol_begin(); |
| 743 | Archive::symbol_iterator es = symbol_end(); |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 744 | |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 745 | for (; bs != es; ++bs) { |
Rafael Espindola | ae46002 | 2014-06-16 16:08:36 +0000 | [diff] [blame] | 746 | StringRef SymName = bs->getName(); |
| 747 | if (SymName == name) { |
Lang Hames | 69f4902 | 2016-07-14 20:44:27 +0000 | [diff] [blame] | 748 | if (auto MemberOrErr = bs->getMember()) |
| 749 | return Child(*MemberOrErr); |
| 750 | else |
| 751 | return errorCodeToError(MemberOrErr.getError()); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 752 | } |
| 753 | } |
Lang Hames | 69f4902 | 2016-07-14 20:44:27 +0000 | [diff] [blame] | 754 | return Optional<Child>(); |
Shankar Easwaran | 15b28be | 2012-11-13 18:38:42 +0000 | [diff] [blame] | 755 | } |
Rafael Espindola | b6b5f52e | 2013-07-29 12:40:31 +0000 | [diff] [blame] | 756 | |
Rafael Espindola | 4a782fb | 2015-10-31 21:03:29 +0000 | [diff] [blame] | 757 | bool Archive::hasSymbolTable() const { return !SymbolTable.empty(); } |