Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 1 | //===-- ArchiveReader.cpp - Read LLVM archive files -------------*- C++ -*-===// |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 2 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 4ee451d | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 7 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 9 | // |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 10 | // Reads standard unix archive files (.a) containing LLVM bitcode. |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 14 | #include "llvm/Bitcode/Archive.h" |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 15 | #include "ArchiveInternals.h" |
Rafael Espindola | 603d6b5 | 2012-01-23 03:41:53 +0000 | [diff] [blame] | 16 | #include "llvm/ADT/SmallPtrSet.h" |
Chris Lattner | e07c15c | 2007-05-06 06:18:07 +0000 | [diff] [blame] | 17 | #include "llvm/Bitcode/ReaderWriter.h" |
Chandler Carruth | 0b8c9a8 | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 18 | #include "llvm/IR/Module.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 19 | #include "llvm/Support/MemoryBuffer.h" |
Benjamin Kramer | 901b858 | 2012-03-23 11:35:30 +0000 | [diff] [blame] | 20 | #include <cstdio> |
Dan Gohman | d68a076 | 2009-01-05 17:59:02 +0000 | [diff] [blame] | 21 | #include <cstdlib> |
Duraid Madina | 8748746 | 2005-12-26 14:31:26 +0000 | [diff] [blame] | 22 | #include <memory> |
Chris Lattner | 3446ae8 | 2004-01-10 19:00:15 +0000 | [diff] [blame] | 23 | using namespace llvm; |
Brian Gaeke | d0fde30 | 2003-11-11 22:41:34 +0000 | [diff] [blame] | 24 | |
/// Read a variable-bit-rate encoded unsigned integer.
///
/// Each byte contributes its low 7 bits, least significant group first; a set
/// high bit (0x80) means another byte follows. \p At is advanced past every
/// byte consumed. If \p End is reached before the terminating byte, the value
/// accumulated so far is returned and \p At is left equal to \p End, which is
/// how callers detect truncation.
///
/// Groups that would land at or beyond the width of 'unsigned' are still
/// consumed but contribute nothing: shifting by >= the type width is undefined
/// behavior, and the input comes straight from the archive file.
static inline unsigned readInteger(const char*&At, const char*End) {
  const unsigned MaxShift = sizeof(unsigned) * 8;
  unsigned Shift = 0;
  unsigned Result = 0;

  do {
    if (At == End)
      return Result;
    const unsigned Group = (unsigned)((*At++) & 0x7F);
    if (Shift < MaxShift) {
      Result |= Group << Shift;
      Shift += 7;
    }
  } while (At[-1] & 0x80);
  return Result;
}
| 38 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 39 | // Completely parse the Archive's symbol table and populate symTab member var. |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 40 | bool |
| 41 | Archive::parseSymbolTable(const void* data, unsigned size, std::string* error) { |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 42 | const char* At = (const char*) data; |
| 43 | const char* End = At + size; |
| 44 | while (At < End) { |
| 45 | unsigned offset = readInteger(At, End); |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 46 | if (At == End) { |
| 47 | if (error) |
| 48 | *error = "Ran out of data reading vbr_uint for symtab offset!"; |
| 49 | return false; |
| 50 | } |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 51 | unsigned length = readInteger(At, End); |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 52 | if (At == End) { |
| 53 | if (error) |
| 54 | *error = "Ran out of data reading vbr_uint for symtab length!"; |
| 55 | return false; |
| 56 | } |
| 57 | if (At + length > End) { |
| 58 | if (error) |
| 59 | *error = "Malformed symbol table: length not consistent with size"; |
| 60 | return false; |
| 61 | } |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 62 | // we don't care if it can't be inserted (duplicate entry) |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 63 | symTab.insert(std::make_pair(std::string(At, length), offset)); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 64 | At += length; |
| 65 | } |
| 66 | symTabSize = size; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 67 | return true; |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 68 | } |
| 69 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 70 | // This member parses an ArchiveMemberHeader that is presumed to be pointed to |
| 71 | // by At. The At pointer is updated to the byte just after the header, which |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 72 | // can be variable in size. |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 73 | ArchiveMember* |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 74 | Archive::parseMemberHeader(const char*& At, const char* End, std::string* error) |
| 75 | { |
Reid Spencer | cd5561a | 2006-12-15 19:44:51 +0000 | [diff] [blame] | 76 | if (At + sizeof(ArchiveMemberHeader) >= End) { |
| 77 | if (error) |
| 78 | *error = "Unexpected end of file"; |
| 79 | return 0; |
| 80 | } |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 81 | |
| 82 | // Cast archive member header |
Roman Divacky | 651e800 | 2012-09-05 22:09:23 +0000 | [diff] [blame] | 83 | const ArchiveMemberHeader* Hdr = (const ArchiveMemberHeader*)At; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 84 | At += sizeof(ArchiveMemberHeader); |
| 85 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 86 | int flags = 0; |
| 87 | int MemberSize = atoi(Hdr->size); |
Rafael Espindola | 94bc246 | 2012-08-10 01:57:52 +0000 | [diff] [blame] | 88 | assert(MemberSize >= 0); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 89 | |
| 90 | // Check the size of the member for sanity |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 91 | if (At + MemberSize > End) { |
| 92 | if (error) |
| 93 | *error = "invalid member length in archive file"; |
| 94 | return 0; |
| 95 | } |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 96 | |
| 97 | // Check the member signature |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 98 | if (!Hdr->checkSignature()) { |
| 99 | if (error) |
| 100 | *error = "invalid file member signature"; |
| 101 | return 0; |
| 102 | } |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 103 | |
| 104 | // Convert and check the member name |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 105 | // The empty name ( '/' and 15 blanks) is for a foreign (non-LLVM) symbol |
| 106 | // table. The special name "//" and 14 blanks is for a string table, used |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 107 | // for long file names. This library doesn't generate either of those but |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 108 | // it will accept them. If the name starts with #1/ and the remainder is |
| 109 | // digits, then those digits specify the length of the name that is |
| 110 | // stored immediately following the header. The special name |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 111 | // __LLVM_SYM_TAB__ identifies the symbol table for LLVM bitcode. |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 112 | // Anything else is a regular, short filename that is terminated with |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 113 | // a '/' and blanks. |
| 114 | |
| 115 | std::string pathname; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 116 | switch (Hdr->name[0]) { |
| 117 | case '#': |
| 118 | if (Hdr->name[1] == '1' && Hdr->name[2] == '/') { |
| 119 | if (isdigit(Hdr->name[3])) { |
| 120 | unsigned len = atoi(&Hdr->name[3]); |
Chris Lattner | 4633306 | 2010-02-04 06:19:43 +0000 | [diff] [blame] | 121 | const char *nulp = (const char *)memchr(At, '\0', len); |
Chris Lattner | 7338242 | 2010-04-25 04:44:26 +0000 | [diff] [blame] | 122 | pathname.assign(At, nulp != 0 ? (uintptr_t)(nulp - At) : len); |
Reid Spencer | dd95e8d | 2004-11-17 16:13:11 +0000 | [diff] [blame] | 123 | At += len; |
| 124 | MemberSize -= len; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 125 | flags |= ArchiveMember::HasLongFilenameFlag; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 126 | } else { |
| 127 | if (error) |
| 128 | *error = "invalid long filename"; |
| 129 | return 0; |
| 130 | } |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 131 | } else if (Hdr->name[1] == '_' && |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 132 | (0 == memcmp(Hdr->name, ARFILE_LLVM_SYMTAB_NAME, 16))) { |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 133 | // The member is using a long file name (>15 chars) format. |
| 134 | // This format is standard for 4.4BSD and Mac OSX operating |
| 135 | // systems. LLVM uses it similarly. In this format, the |
| 136 | // remainder of the name field (after #1/) specifies the |
| 137 | // length of the file name which occupy the first bytes of |
| 138 | // the member's data. The pathname already has the #1/ stripped. |
| 139 | pathname.assign(ARFILE_LLVM_SYMTAB_NAME); |
| 140 | flags |= ArchiveMember::LLVMSymbolTableFlag; |
| 141 | } |
| 142 | break; |
| 143 | case '/': |
| 144 | if (Hdr->name[1]== '/') { |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 145 | if (0 == memcmp(Hdr->name, ARFILE_STRTAB_NAME, 16)) { |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 146 | pathname.assign(ARFILE_STRTAB_NAME); |
| 147 | flags |= ArchiveMember::StringTableFlag; |
| 148 | } else { |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 149 | if (error) |
| 150 | *error = "invalid string table name"; |
| 151 | return 0; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 152 | } |
| 153 | } else if (Hdr->name[1] == ' ') { |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 154 | if (0 == memcmp(Hdr->name, ARFILE_SVR4_SYMTAB_NAME, 16)) { |
| 155 | pathname.assign(ARFILE_SVR4_SYMTAB_NAME); |
| 156 | flags |= ArchiveMember::SVR4SymbolTableFlag; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 157 | } else { |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 158 | if (error) |
| 159 | *error = "invalid SVR4 symbol table name"; |
| 160 | return 0; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 161 | } |
| 162 | } else if (isdigit(Hdr->name[1])) { |
| 163 | unsigned index = atoi(&Hdr->name[1]); |
| 164 | if (index < strtab.length()) { |
| 165 | const char* namep = strtab.c_str() + index; |
| 166 | const char* endp = strtab.c_str() + strtab.length(); |
| 167 | const char* p = namep; |
| 168 | const char* last_p = p; |
| 169 | while (p < endp) { |
| 170 | if (*p == '\n' && *last_p == '/') { |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 171 | pathname.assign(namep, last_p - namep); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 172 | flags |= ArchiveMember::HasLongFilenameFlag; |
| 173 | break; |
| 174 | } |
| 175 | last_p = p; |
| 176 | p++; |
| 177 | } |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 178 | if (p >= endp) { |
| 179 | if (error) |
Matt Arsenault | d06c9cb | 2013-02-26 20:13:09 +0000 | [diff] [blame] | 180 | *error = "missing name terminator in string table"; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 181 | return 0; |
| 182 | } |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 183 | } else { |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 184 | if (error) |
| 185 | *error = "name index beyond string table"; |
| 186 | return 0; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 187 | } |
| 188 | } |
| 189 | break; |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 190 | case '_': |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 191 | if (Hdr->name[1] == '_' && |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 192 | (0 == memcmp(Hdr->name, ARFILE_BSD4_SYMTAB_NAME, 16))) { |
| 193 | pathname.assign(ARFILE_BSD4_SYMTAB_NAME); |
| 194 | flags |= ArchiveMember::BSD4SymbolTableFlag; |
Reid Spencer | 84b9ced | 2004-11-23 22:35:39 +0000 | [diff] [blame] | 195 | break; |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 196 | } |
Reid Spencer | 84b9ced | 2004-11-23 22:35:39 +0000 | [diff] [blame] | 197 | /* FALL THROUGH */ |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 198 | |
| 199 | default: |
Roman Divacky | 651e800 | 2012-09-05 22:09:23 +0000 | [diff] [blame] | 200 | const char* slash = (const char*) memchr(Hdr->name, '/', 16); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 201 | if (slash == 0) |
Reid Spencer | dd95e8d | 2004-11-17 16:13:11 +0000 | [diff] [blame] | 202 | slash = Hdr->name + 16; |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 203 | pathname.assign(Hdr->name, slash - Hdr->name); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 204 | break; |
| 205 | } |
| 206 | |
Gabor Greif | db5565a | 2007-07-06 20:28:40 +0000 | [diff] [blame] | 207 | // Determine if this is a bitcode file |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 208 | switch (sys::IdentifyFileType(At, 4)) { |
Chris Lattner | e07c15c | 2007-05-06 06:18:07 +0000 | [diff] [blame] | 209 | case sys::Bitcode_FileType: |
Gabor Greif | e75ca3d | 2007-07-06 13:38:17 +0000 | [diff] [blame] | 210 | flags |= ArchiveMember::BitcodeFlag; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 211 | break; |
| 212 | default: |
Gabor Greif | e75ca3d | 2007-07-06 13:38:17 +0000 | [diff] [blame] | 213 | flags &= ~ArchiveMember::BitcodeFlag; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 214 | break; |
| 215 | } |
| 216 | |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 217 | // Instantiate the ArchiveMember to be filled |
| 218 | ArchiveMember* member = new ArchiveMember(this); |
| 219 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 220 | // Fill in fields of the ArchiveMember |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 221 | member->parent = this; |
Reid Spencer | dd04df0 | 2005-07-07 23:21:43 +0000 | [diff] [blame] | 222 | member->path.set(pathname); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 223 | member->info.fileSize = MemberSize; |
| 224 | member->info.modTime.fromEpochTime(atoi(Hdr->date)); |
Reid Spencer | 5612762 | 2004-12-29 01:20:24 +0000 | [diff] [blame] | 225 | unsigned int mode; |
| 226 | sscanf(Hdr->mode, "%o", &mode); |
| 227 | member->info.mode = mode; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 228 | member->info.user = atoi(Hdr->uid); |
| 229 | member->info.group = atoi(Hdr->gid); |
| 230 | member->flags = flags; |
| 231 | member->data = At; |
| 232 | |
| 233 | return member; |
| 234 | } |
| 235 | |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 236 | bool |
| 237 | Archive::checkSignature(std::string* error) { |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 238 | // Check the magic string at file's header |
Chris Lattner | 7f6b447 | 2008-04-01 04:26:46 +0000 | [diff] [blame] | 239 | if (mapfile->getBufferSize() < 8 || memcmp(base, ARFILE_MAGIC, 8)) { |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 240 | if (error) |
| 241 | *error = "invalid signature for an archive file"; |
| 242 | return false; |
| 243 | } |
| 244 | return true; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 245 | } |
| 246 | |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 247 | // This function loads the entire archive and fully populates its ilist with |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 248 | // the members of the archive file. This is typically used in preparation for |
| 249 | // editing the contents of the archive. |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 250 | bool |
| 251 | Archive::loadArchive(std::string* error) { |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 252 | |
| 253 | // Set up parsing |
| 254 | members.clear(); |
| 255 | symTab.clear(); |
| 256 | const char *At = base; |
Chris Lattner | 7f6b447 | 2008-04-01 04:26:46 +0000 | [diff] [blame] | 257 | const char *End = mapfile->getBufferEnd(); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 258 | |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 259 | if (!checkSignature(error)) |
| 260 | return false; |
| 261 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 262 | At += 8; // Skip the magic string. |
| 263 | |
| 264 | bool seenSymbolTable = false; |
| 265 | bool foundFirstFile = false; |
| 266 | while (At < End) { |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 267 | // parse the member header |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 268 | const char* Save = At; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 269 | ArchiveMember* mbr = parseMemberHeader(At, End, error); |
| 270 | if (!mbr) |
| 271 | return false; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 272 | |
| 273 | // check if this is the foreign symbol table |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 274 | if (mbr->isSVR4SymbolTable() || mbr->isBSD4SymbolTable()) { |
Reid Spencer | 4a980d1 | 2004-11-16 06:47:19 +0000 | [diff] [blame] | 275 | // We just save this but don't do anything special |
| 276 | // with it. It doesn't count as the "first file". |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 277 | if (foreignST) { |
| 278 | // What? Multiple foreign symbol tables? Just chuck it |
| 279 | // and retain the last one found. |
| 280 | delete foreignST; |
| 281 | } |
Reid Spencer | 4a980d1 | 2004-11-16 06:47:19 +0000 | [diff] [blame] | 282 | foreignST = mbr; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 283 | At += mbr->getSize(); |
Reid Spencer | 6405c9e | 2004-11-19 17:08:00 +0000 | [diff] [blame] | 284 | if ((intptr_t(At) & 1) == 1) |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 285 | At++; |
| 286 | } else if (mbr->isStringTable()) { |
Reid Spencer | 4a980d1 | 2004-11-16 06:47:19 +0000 | [diff] [blame] | 287 | // Simply suck the entire string table into a string |
| 288 | // variable. This will be used to get the names of the |
| 289 | // members that use the "/ddd" format for their names |
| 290 | // (SVR4 style long names). |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 291 | strtab.assign(At, mbr->getSize()); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 292 | At += mbr->getSize(); |
Reid Spencer | 6405c9e | 2004-11-19 17:08:00 +0000 | [diff] [blame] | 293 | if ((intptr_t(At) & 1) == 1) |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 294 | At++; |
| 295 | delete mbr; |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 296 | } else if (mbr->isLLVMSymbolTable()) { |
Reid Spencer | 4a980d1 | 2004-11-16 06:47:19 +0000 | [diff] [blame] | 297 | // This is the LLVM symbol table for the archive. If we've seen it |
| 298 | // already, its an error. Otherwise, parse the symbol table and move on. |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 299 | if (seenSymbolTable) { |
| 300 | if (error) |
| 301 | *error = "invalid archive: multiple symbol tables"; |
| 302 | return false; |
| 303 | } |
| 304 | if (!parseSymbolTable(mbr->getData(), mbr->getSize(), error)) |
| 305 | return false; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 306 | seenSymbolTable = true; |
| 307 | At += mbr->getSize(); |
Reid Spencer | 6405c9e | 2004-11-19 17:08:00 +0000 | [diff] [blame] | 308 | if ((intptr_t(At) & 1) == 1) |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 309 | At++; |
Reid Spencer | 4a980d1 | 2004-11-16 06:47:19 +0000 | [diff] [blame] | 310 | delete mbr; // We don't need this member in the list of members. |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 311 | } else { |
Reid Spencer | 4a980d1 | 2004-11-16 06:47:19 +0000 | [diff] [blame] | 312 | // This is just a regular file. If its the first one, save its offset. |
| 313 | // Otherwise just push it on the list and move on to the next file. |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 314 | if (!foundFirstFile) { |
| 315 | firstFileOffset = Save - base; |
| 316 | foundFirstFile = true; |
| 317 | } |
| 318 | members.push_back(mbr); |
| 319 | At += mbr->getSize(); |
Reid Spencer | 6405c9e | 2004-11-19 17:08:00 +0000 | [diff] [blame] | 320 | if ((intptr_t(At) & 1) == 1) |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 321 | At++; |
| 322 | } |
| 323 | } |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 324 | return true; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 325 | } |
| 326 | |
| 327 | // Open and completely load the archive file. |
| 328 | Archive* |
Owen Anderson | 4434ed4 | 2009-07-01 23:13:44 +0000 | [diff] [blame] | 329 | Archive::OpenAndLoad(const sys::Path& file, LLVMContext& C, |
Owen Anderson | 8b477ed | 2009-07-01 16:58:40 +0000 | [diff] [blame] | 330 | std::string* ErrorMessage) { |
| 331 | std::auto_ptr<Archive> result ( new Archive(file, C)); |
Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 332 | if (result->mapToMemory(ErrorMessage)) |
| 333 | return 0; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 334 | if (!result->loadArchive(ErrorMessage)) |
Reid Spencer | 5af4688 | 2004-12-13 02:59:03 +0000 | [diff] [blame] | 335 | return 0; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 336 | return result.release(); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 337 | } |
| 338 | |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 339 | // Get all the bitcode modules from the archive |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 340 | bool |
Owen Anderson | 8b477ed | 2009-07-01 16:58:40 +0000 | [diff] [blame] | 341 | Archive::getAllModules(std::vector<Module*>& Modules, |
| 342 | std::string* ErrMessage) { |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 343 | |
| 344 | for (iterator I=begin(), E=end(); I != E; ++I) { |
Gabor Greif | e75ca3d | 2007-07-06 13:38:17 +0000 | [diff] [blame] | 345 | if (I->isBitcode()) { |
Chris Lattner | 74382b7 | 2009-08-23 22:45:37 +0000 | [diff] [blame] | 346 | std::string FullMemberName = archPath.str() + |
| 347 | "(" + I->getPath().str() + ")"; |
Chris Lattner | c1d5624 | 2007-05-06 09:28:33 +0000 | [diff] [blame] | 348 | MemoryBuffer *Buffer = |
Benjamin Kramer | 9d44e70 | 2010-04-19 16:15:31 +0000 | [diff] [blame] | 349 | MemoryBuffer::getMemBufferCopy(StringRef(I->getData(), I->getSize()), |
| 350 | FullMemberName.c_str()); |
Chris Lattner | e07c15c | 2007-05-06 06:18:07 +0000 | [diff] [blame] | 351 | |
Owen Anderson | 8b477ed | 2009-07-01 16:58:40 +0000 | [diff] [blame] | 352 | Module *M = ParseBitcodeFile(Buffer, Context, ErrMessage); |
Chris Lattner | c1d5624 | 2007-05-06 09:28:33 +0000 | [diff] [blame] | 353 | delete Buffer; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 354 | if (!M) |
| 355 | return true; |
| 356 | |
| 357 | Modules.push_back(M); |
| 358 | } |
| 359 | } |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 360 | return false; |
| 361 | } |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 362 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 363 | // Load just the symbol table from the archive file |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 364 | bool |
| 365 | Archive::loadSymbolTable(std::string* ErrorMsg) { |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 366 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 367 | // Set up parsing |
| 368 | members.clear(); |
| 369 | symTab.clear(); |
| 370 | const char *At = base; |
Chris Lattner | 7f6b447 | 2008-04-01 04:26:46 +0000 | [diff] [blame] | 371 | const char *End = mapfile->getBufferEnd(); |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 372 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 373 | // Make sure we're dealing with an archive |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 374 | if (!checkSignature(ErrorMsg)) |
| 375 | return false; |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 376 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 377 | At += 8; // Skip signature |
| 378 | |
| 379 | // Parse the first file member header |
| 380 | const char* FirstFile = At; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 381 | ArchiveMember* mbr = parseMemberHeader(At, End, ErrorMsg); |
| 382 | if (!mbr) |
| 383 | return false; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 384 | |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 385 | if (mbr->isSVR4SymbolTable() || mbr->isBSD4SymbolTable()) { |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 386 | // Skip the foreign symbol table, we don't do anything with it |
| 387 | At += mbr->getSize(); |
Reid Spencer | 6405c9e | 2004-11-19 17:08:00 +0000 | [diff] [blame] | 388 | if ((intptr_t(At) & 1) == 1) |
Reid Spencer | b323113 | 2004-11-15 01:40:20 +0000 | [diff] [blame] | 389 | At++; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 390 | delete mbr; |
| 391 | |
Reid Spencer | b323113 | 2004-11-15 01:40:20 +0000 | [diff] [blame] | 392 | // Read the next one |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 393 | FirstFile = At; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 394 | mbr = parseMemberHeader(At, End, ErrorMsg); |
| 395 | if (!mbr) { |
| 396 | delete mbr; |
| 397 | return false; |
| 398 | } |
Reid Spencer | b323113 | 2004-11-15 01:40:20 +0000 | [diff] [blame] | 399 | } |
| 400 | |
| 401 | if (mbr->isStringTable()) { |
| 402 | // Process the string table entry |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 403 | strtab.assign((const char*)mbr->getData(), mbr->getSize()); |
Reid Spencer | b323113 | 2004-11-15 01:40:20 +0000 | [diff] [blame] | 404 | At += mbr->getSize(); |
Reid Spencer | 6405c9e | 2004-11-19 17:08:00 +0000 | [diff] [blame] | 405 | if ((intptr_t(At) & 1) == 1) |
Reid Spencer | b323113 | 2004-11-15 01:40:20 +0000 | [diff] [blame] | 406 | At++; |
| 407 | delete mbr; |
| 408 | // Get the next one |
| 409 | FirstFile = At; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 410 | mbr = parseMemberHeader(At, End, ErrorMsg); |
| 411 | if (!mbr) { |
| 412 | delete mbr; |
| 413 | return false; |
| 414 | } |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 415 | } |
| 416 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 417 | // See if its the symbol table |
| 418 | if (mbr->isLLVMSymbolTable()) { |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 419 | if (!parseSymbolTable(mbr->getData(), mbr->getSize(), ErrorMsg)) { |
| 420 | delete mbr; |
| 421 | return false; |
| 422 | } |
| 423 | |
Reid Spencer | 8dde18f | 2004-11-28 03:13:02 +0000 | [diff] [blame] | 424 | At += mbr->getSize(); |
Reid Spencer | 6405c9e | 2004-11-19 17:08:00 +0000 | [diff] [blame] | 425 | if ((intptr_t(At) & 1) == 1) |
Reid Spencer | 8dde18f | 2004-11-28 03:13:02 +0000 | [diff] [blame] | 426 | At++; |
Reid Spencer | ffb4d62 | 2006-05-12 17:56:20 +0000 | [diff] [blame] | 427 | delete mbr; |
| 428 | // Can't be any more symtab headers so just advance |
Reid Spencer | 8dde18f | 2004-11-28 03:13:02 +0000 | [diff] [blame] | 429 | FirstFile = At; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 430 | } else { |
| 431 | // There's no symbol table in the file. We have to rebuild it from scratch |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 432 | // because the intent of this method is to get the symbol table loaded so |
| 433 | // it can be searched efficiently. |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 434 | // Add the member to the members list |
| 435 | members.push_back(mbr); |
| 436 | } |
| 437 | |
| 438 | firstFileOffset = FirstFile - base; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 439 | return true; |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 440 | } |
| 441 | |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 442 | // Open the archive and load just the symbol tables |
Owen Anderson | 31895e7 | 2009-07-01 21:22:36 +0000 | [diff] [blame] | 443 | Archive* Archive::OpenAndLoadSymbols(const sys::Path& file, |
Owen Anderson | 4434ed4 | 2009-07-01 23:13:44 +0000 | [diff] [blame] | 444 | LLVMContext& C, |
Owen Anderson | 8b477ed | 2009-07-01 16:58:40 +0000 | [diff] [blame] | 445 | std::string* ErrorMessage) { |
| 446 | std::auto_ptr<Archive> result ( new Archive(file, C) ); |
Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 447 | if (result->mapToMemory(ErrorMessage)) |
| 448 | return 0; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 449 | if (!result->loadSymbolTable(ErrorMessage)) |
Reid Spencer | 5af4688 | 2004-12-13 02:59:03 +0000 | [diff] [blame] | 450 | return 0; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 451 | return result.release(); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 452 | } |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 453 | |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 454 | // Look up one symbol in the symbol table and return the module that defines |
| 455 | // that symbol. |
| 456 | Module* |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 457 | Archive::findModuleDefiningSymbol(const std::string& symbol, |
| 458 | std::string* ErrMsg) { |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 459 | SymTabType::iterator SI = symTab.find(symbol); |
| 460 | if (SI == symTab.end()) |
| 461 | return 0; |
| 462 | |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 463 | // The symbol table was previously constructed assuming that the members were |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 464 | // written without the symbol table header. Because VBR encoding is used, the |
| 465 | // values could not be adjusted to account for the offset of the symbol table |
| 466 | // because that could affect the size of the symbol table due to VBR encoding. |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 467 | // We now have to account for this by adjusting the offset by the size of the |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 468 | // symbol table and its header. |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 469 | unsigned fileOffset = |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 470 | SI->second + // offset in symbol-table-less file |
| 471 | firstFileOffset; // add offset to first "real" file in archive |
| 472 | |
| 473 | // See if the module is already loaded |
| 474 | ModuleMap::iterator MI = modules.find(fileOffset); |
| 475 | if (MI != modules.end()) |
| 476 | return MI->second.first; |
| 477 | |
| 478 | // Module hasn't been loaded yet, we need to load it |
| 479 | const char* modptr = base + fileOffset; |
Chris Lattner | 7f6b447 | 2008-04-01 04:26:46 +0000 | [diff] [blame] | 480 | ArchiveMember* mbr = parseMemberHeader(modptr, mapfile->getBufferEnd(), |
| 481 | ErrMsg); |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 482 | if (!mbr) |
Reid Spencer | 0b5a504 | 2006-08-25 17:43:11 +0000 | [diff] [blame] | 483 | return 0; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 484 | |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 485 | // Now, load the bitcode module to get the Module. |
Chris Lattner | 74382b7 | 2009-08-23 22:45:37 +0000 | [diff] [blame] | 486 | std::string FullMemberName = archPath.str() + "(" + |
| 487 | mbr->getPath().str() + ")"; |
Benjamin Kramer | 9d44e70 | 2010-04-19 16:15:31 +0000 | [diff] [blame] | 488 | MemoryBuffer *Buffer = |
| 489 | MemoryBuffer::getMemBufferCopy(StringRef(mbr->getData(), mbr->getSize()), |
| 490 | FullMemberName.c_str()); |
Chris Lattner | c1d5624 | 2007-05-06 09:28:33 +0000 | [diff] [blame] | 491 | |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 492 | Module *m = getLazyBitcodeModule(Buffer, Context, ErrMsg); |
| 493 | if (!m) |
Reid Spencer | 0b5a504 | 2006-08-25 17:43:11 +0000 | [diff] [blame] | 494 | return 0; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 495 | |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 496 | modules.insert(std::make_pair(fileOffset, std::make_pair(m, mbr))); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 497 | |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 498 | return m; |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 499 | } |
| 500 | |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 501 | // Look up multiple symbols in the symbol table and return a set of |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 502 | // Modules that define those symbols. |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 503 | bool |
Reid Spencer | 7783e8a | 2004-11-19 03:18:22 +0000 | [diff] [blame] | 504 | Archive::findModulesDefiningSymbols(std::set<std::string>& symbols, |
Rafael Espindola | 603d6b5 | 2012-01-23 03:41:53 +0000 | [diff] [blame] | 505 | SmallVectorImpl<Module*>& result, |
Chris Lattner | f2e292c | 2007-02-07 21:41:02 +0000 | [diff] [blame] | 506 | std::string* error) { |
Reid Spencer | cd5561a | 2006-12-15 19:44:51 +0000 | [diff] [blame] | 507 | if (!mapfile || !base) { |
| 508 | if (error) |
| 509 | *error = "Empty archive invalid for finding modules defining symbols"; |
| 510 | return false; |
| 511 | } |
| 512 | |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 513 | if (symTab.empty()) { |
| 514 | // We don't have a symbol table, so we must build it now but lets also |
| 515 | // make sure that we populate the modules table as we do this to ensure |
| 516 | // that we don't load them twice when findModuleDefiningSymbol is called |
| 517 | // below. |
| 518 | |
| 519 | // Get a pointer to the first file |
Chris Lattner | 7f6b447 | 2008-04-01 04:26:46 +0000 | [diff] [blame] | 520 | const char* At = base + firstFileOffset; |
| 521 | const char* End = mapfile->getBufferEnd(); |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 522 | |
| 523 | while ( At < End) { |
| 524 | // Compute the offset to be put in the symbol table |
| 525 | unsigned offset = At - base - firstFileOffset; |
| 526 | |
| 527 | // Parse the file's header |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 528 | ArchiveMember* mbr = parseMemberHeader(At, End, error); |
| 529 | if (!mbr) |
| 530 | return false; |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 531 | |
| 532 | // If it contains symbols |
Gabor Greif | e75ca3d | 2007-07-06 13:38:17 +0000 | [diff] [blame] | 533 | if (mbr->isBitcode()) { |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 534 | // Get the symbols |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 535 | std::vector<std::string> symbols; |
Chris Lattner | 74382b7 | 2009-08-23 22:45:37 +0000 | [diff] [blame] | 536 | std::string FullMemberName = archPath.str() + "(" + |
| 537 | mbr->getPath().str() + ")"; |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 538 | Module* M = |
Benjamin Kramer | 9d44e70 | 2010-04-19 16:15:31 +0000 | [diff] [blame] | 539 | GetBitcodeSymbols(At, mbr->getSize(), FullMemberName, Context, |
| 540 | symbols, error); |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 541 | |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 542 | if (M) { |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 543 | // Insert the module's symbols into the symbol table |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 544 | for (std::vector<std::string>::iterator I = symbols.begin(), |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 545 | E=symbols.end(); I != E; ++I ) { |
Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 546 | symTab.insert(std::make_pair(*I, offset)); |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 547 | } |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 548 | // Insert the Module and the ArchiveMember into the table of |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 549 | // modules. |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 550 | modules.insert(std::make_pair(offset, std::make_pair(M, mbr))); |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 551 | } else { |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 552 | if (error) |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 553 | *error = "Can't parse bitcode member: " + |
Chris Lattner | 74382b7 | 2009-08-23 22:45:37 +0000 | [diff] [blame] | 554 | mbr->getPath().str() + ": " + *error; |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 555 | delete mbr; |
| 556 | return false; |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 557 | } |
| 558 | } |
Reid Spencer | b323113 | 2004-11-15 01:40:20 +0000 | [diff] [blame] | 559 | |
| 560 | // Go to the next file location |
| 561 | At += mbr->getSize(); |
Reid Spencer | 6405c9e | 2004-11-19 17:08:00 +0000 | [diff] [blame] | 562 | if ((intptr_t(At) & 1) == 1) |
Reid Spencer | b323113 | 2004-11-15 01:40:20 +0000 | [diff] [blame] | 563 | At++; |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 564 | } |
| 565 | } |
| 566 | |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 567 | // At this point we have a valid symbol table (one way or another) so we |
Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 568 | // just use it to quickly find the symbols requested. |
| 569 | |
Rafael Espindola | 603d6b5 | 2012-01-23 03:41:53 +0000 | [diff] [blame] | 570 | SmallPtrSet<Module*, 16> Added; |
Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 571 | for (std::set<std::string>::iterator I=symbols.begin(), |
Rafael Espindola | 4254df3 | 2012-01-23 05:07:16 +0000 | [diff] [blame] | 572 | Next = I, |
| 573 | E=symbols.end(); I != E; I = Next) { |
| 574 | // Increment Next before we invalidate it. |
| 575 | ++Next; |
| 576 | |
Reid Spencer | 7783e8a | 2004-11-19 03:18:22 +0000 | [diff] [blame] | 577 | // See if this symbol exists |
Jeffrey Yasskin | f0356fe | 2010-01-27 20:34:15 +0000 | [diff] [blame] | 578 | Module* m = findModuleDefiningSymbol(*I,error); |
Rafael Espindola | 603d6b5 | 2012-01-23 03:41:53 +0000 | [diff] [blame] | 579 | if (!m) |
| 580 | continue; |
| 581 | bool NewMember = Added.insert(m); |
| 582 | if (!NewMember) |
| 583 | continue; |
Reid Spencer | 7783e8a | 2004-11-19 03:18:22 +0000 | [diff] [blame] | 584 | |
Rafael Espindola | 603d6b5 | 2012-01-23 03:41:53 +0000 | [diff] [blame] | 585 | // The symbol exists, insert the Module into our result. |
| 586 | result.push_back(m); |
| 587 | |
| 588 | // Remove the symbol now that its been resolved. |
| 589 | symbols.erase(I); |
Reid Spencer | f9d7a51 | 2004-11-14 21:58:33 +0000 | [diff] [blame] | 590 | } |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 591 | return true; |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 592 | } |
Reid Spencer | eaa06bb | 2005-02-26 22:00:32 +0000 | [diff] [blame] | 593 | |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 594 | bool Archive::isBitcodeArchive() { |
Chris Lattner | 7c43992 | 2005-09-23 06:22:58 +0000 | [diff] [blame] | 595 | // Make sure the symTab has been loaded. In most cases this should have been |
| 596 | // done when the archive was constructed, but still, this is just in case. |
Dan Gohman | 3035959 | 2008-01-29 13:02:09 +0000 | [diff] [blame] | 597 | if (symTab.empty()) |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 598 | if (!loadSymbolTable(0)) |
| 599 | return false; |
Reid Spencer | eaa06bb | 2005-02-26 22:00:32 +0000 | [diff] [blame] | 600 | |
Chris Lattner | 7c43992 | 2005-09-23 06:22:58 +0000 | [diff] [blame] | 601 | // Now that we know it's been loaded, return true |
| 602 | // if it has a size |
| 603 | if (symTab.size()) return true; |
Reid Spencer | eaa06bb | 2005-02-26 22:00:32 +0000 | [diff] [blame] | 604 | |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 605 | // We still can't be sure it isn't a bitcode archive |
Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 606 | if (!loadArchive(0)) |
| 607 | return false; |
Reid Spencer | eaa06bb | 2005-02-26 22:00:32 +0000 | [diff] [blame] | 608 | |
| 609 | std::vector<Module *> Modules; |
| 610 | std::string ErrorMessage; |
| 611 | |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 612 | // Scan the archive, trying to load a bitcode member. We only load one to |
Chris Lattner | 7c43992 | 2005-09-23 06:22:58 +0000 | [diff] [blame] | 613 | // see if this works. |
| 614 | for (iterator I = begin(), E = end(); I != E; ++I) { |
Gabor Greif | e75ca3d | 2007-07-06 13:38:17 +0000 | [diff] [blame] | 615 | if (!I->isBitcode()) |
Chris Lattner | 7c43992 | 2005-09-23 06:22:58 +0000 | [diff] [blame] | 616 | continue; |
| 617 | |
| 618 | std::string FullMemberName = |
Chris Lattner | 74382b7 | 2009-08-23 22:45:37 +0000 | [diff] [blame] | 619 | archPath.str() + "(" + I->getPath().str() + ")"; |
Chris Lattner | c1d5624 | 2007-05-06 09:28:33 +0000 | [diff] [blame] | 620 | |
| 621 | MemoryBuffer *Buffer = |
Benjamin Kramer | 9d44e70 | 2010-04-19 16:15:31 +0000 | [diff] [blame] | 622 | MemoryBuffer::getMemBufferCopy(StringRef(I->getData(), I->getSize()), |
| 623 | FullMemberName.c_str()); |
Owen Anderson | 8b477ed | 2009-07-01 16:58:40 +0000 | [diff] [blame] | 624 | Module *M = ParseBitcodeFile(Buffer, Context); |
Chris Lattner | c1d5624 | 2007-05-06 09:28:33 +0000 | [diff] [blame] | 625 | delete Buffer; |
Chris Lattner | 7c43992 | 2005-09-23 06:22:58 +0000 | [diff] [blame] | 626 | if (!M) |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 627 | return false; // Couldn't parse bitcode, not a bitcode archive. |
Chris Lattner | 7c43992 | 2005-09-23 06:22:58 +0000 | [diff] [blame] | 628 | delete M; |
| 629 | return true; |
| 630 | } |
| 631 | |
| 632 | return false; |
Reid Spencer | eaa06bb | 2005-02-26 22:00:32 +0000 | [diff] [blame] | 633 | } |