Chris Lattner | 23219d1 | 2003-09-22 23:42:00 +0000 | [diff] [blame] | 1 | //===- ArchiveReader.cpp - Code to read LLVM bytecode from .a files -------===// |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file was developed by the LLVM research group and is distributed under |
| 6 | // the University of Illinois Open Source License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 9 | // |
| 10 | // This file implements the ReadArchiveFile interface, which allows a linker to |
| 11 | // read all of the LLVM bytecode files contained in a .a file. This file |
| 12 | // understands the standard system .a file format. This can only handle the .a |
Misha Brukman | 09ff150 | 2003-04-23 02:59:05 +0000 | [diff] [blame] | 13 | // variant prevalent on Linux systems so far, but may be extended. See |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 14 | // information in this source file for more information: |
| 15 | // http://sources.redhat.com/cgi-bin/cvsweb.cgi/src/bfd/archive.c?cvsroot=src |
| 16 | // |
| 17 | //===----------------------------------------------------------------------===// |
| 18 | |
| 19 | #include "llvm/Bytecode/Reader.h" |
| 20 | #include "llvm/Module.h" |
Chris Lattner | b70abe1 | 2003-12-30 07:40:35 +0000 | [diff] [blame] | 21 | #include "Support/FileUtilities.h" |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 22 | #include <cstdlib> |
Chris Lattner | 3446ae8 | 2004-01-10 19:00:15 +0000 | [diff] [blame] | 23 | using namespace llvm; |
Brian Gaeke | d0fde30 | 2003-11-11 22:41:34 +0000 | [diff] [blame] | 24 | |
namespace {

/// ar_hdr - Fixed-size header that precedes every member of a .a archive.
/// ReadArchiveBuffer overlays this struct directly on the raw file bytes, so
/// the field order and widths must not be changed.  Every field is a
/// fixed-width character array; none of them is NUL terminated.
struct ar_hdr {
  char name[16];   // Member name, or an encoded reference to a long name
  char date[12];   // Not interpreted by this file
  char uid[6];     // Not interpreted by this file
  char gid[6];     // Not interpreted by this file
  char mode[8];    // Not interpreted by this file
  char size[10];   // Size of the member data, as ASCII decimal digits
  char fmag[2];    // Always equal to '`\n'
};

/// ObjectType - Classification of one archive member, as computed by
/// getObjectType.
enum ObjectType {
  UserObject         = 0,  // A user .o/.bc file
  Unknown            = 1,  // Unknown file, just ignore it
  SVR4LongFilename   = 2,  // A "//" section used for long file names
  ArchiveSymbolTable = 3   // Symbol table produced by ranlib
};

} // end anonymous namespace
| 43 | |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 44 | /// getObjectType - Determine the type of object that this header represents. |
| 45 | /// This is capable of parsing the variety of special sections used for various |
| 46 | /// purposes. |
| 47 | /// |
Brian Gaeke | 60d6e54 | 2004-03-31 19:51:00 +0000 | [diff] [blame] | 48 | static enum ObjectType getObjectType(ar_hdr *H, std::string MemberName, |
| 49 | unsigned char *MemberData, unsigned Size) { |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 50 | // Check for sections with special names... |
Brian Gaeke | 60d6e54 | 2004-03-31 19:51:00 +0000 | [diff] [blame] | 51 | if (MemberName == "__.SYMDEF " || MemberName == "__.SYMDEF SORTED") |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 52 | return ArchiveSymbolTable; |
Brian Gaeke | 60d6e54 | 2004-03-31 19:51:00 +0000 | [diff] [blame] | 53 | else if (MemberName == "// ") |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 54 | return SVR4LongFilename; |
| 55 | |
| 56 | // Check to see if it looks like an llvm object file... |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 57 | if (Size >= 4 && !memcmp(MemberData, "llvm", 4)) |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 58 | return UserObject; |
| 59 | |
| 60 | return Unknown; |
| 61 | } |
| 62 | |
/// Error - Store Message into *ErrorStr when the caller supplied a place for
/// it, and return true.  The constant return value lets call sites report a
/// failure with a single "return Error(...)" statement.
static inline bool Error(std::string *ErrorStr, const char *Message) {
  if (ErrorStr != 0)
    ErrorStr->assign(Message);
  return true;
}
| 67 | |
/// ParseSymbolTableSection - Placeholder for reading an archive symbol table
/// member.  Symbol tables are not interpreted yet: none of the arguments is
/// examined, and the function always reports success by returning false.
static bool ParseSymbolTableSection(unsigned char *Buffer, unsigned Size,
                                    std::string *S) {
  (void)Buffer;
  (void)Size;
  (void)S;

  // Currently not supported (succeeds without doing anything)
  const bool Failed = false;
  return Failed;
}
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 73 | |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 74 | static bool ReadArchiveBuffer(const std::string &ArchiveName, |
Chris Lattner | 75f2053 | 2003-04-22 18:02:52 +0000 | [diff] [blame] | 75 | unsigned char *Buffer, unsigned Length, |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 76 | std::vector<Module*> &Objects, |
| 77 | std::string *ErrorStr) { |
| 78 | if (Length < 8 || memcmp(Buffer, "!<arch>\n", 8)) |
| 79 | return Error(ErrorStr, "signature incorrect for an archive file!"); |
| 80 | Buffer += 8; Length -= 8; // Skip the magic string. |
| 81 | |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 82 | std::vector<char> LongFilenames; |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 83 | |
| 84 | while (Length >= sizeof(ar_hdr)) { |
| 85 | ar_hdr *Hdr = (ar_hdr*)Buffer; |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 86 | unsigned SizeFromHeader = atoi(Hdr->size); |
| 87 | if (SizeFromHeader + sizeof(ar_hdr) > Length) |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 88 | return Error(ErrorStr, "invalid record length in archive file!"); |
| 89 | |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 90 | unsigned char *MemberData = Buffer + sizeof(ar_hdr); |
| 91 | unsigned MemberSize = SizeFromHeader; |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 92 | // Get name of archive member. |
| 93 | char *startp = Hdr->name; |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 94 | char *endp = (char *) memchr (startp, '/', sizeof(ar_hdr)); |
| 95 | if (memcmp (Hdr->name, "#1/", 3) == 0) { |
| 96 | // 4.4BSD/MacOSX long filenames are abbreviated as "#1/L", where L is an |
| 97 | // ASCII-coded decimal number representing the length of the name buffer, |
| 98 | // which is prepended to the archive member's contents. |
| 99 | unsigned NameLength = atoi (&Hdr->name[3]); |
| 100 | startp = (char *) MemberData; |
| 101 | endp = startp + NameLength; |
| 102 | MemberData += NameLength; |
| 103 | MemberSize -= NameLength; |
| 104 | } else if (startp == endp && isdigit (Hdr->name[1])) { |
| 105 | // SVR4 long filenames are abbreviated as "/I", where I is |
| 106 | // an ASCII-coded decimal index into the LongFilenames vector. |
| 107 | unsigned NameIndex = atoi (&Hdr->name[1]); |
| 108 | assert (LongFilenames.size () > NameIndex |
| 109 | && "SVR4-style long filename for archive member not found"); |
| 110 | startp = &LongFilenames[NameIndex]; |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 111 | endp = strchr (startp, '/'); |
Brian Gaeke | 60d6e54 | 2004-03-31 19:51:00 +0000 | [diff] [blame] | 112 | } else if (startp == endp && Hdr->name[1] == '/') { |
| 113 | // This is for the SVR4 long filename table (there might be other |
| 114 | // names starting with // but I don't know about them). Make sure that |
| 115 | // getObjectType sees it. |
| 116 | endp = &Hdr->name[sizeof (Hdr->name)]; |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 117 | } |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 118 | if (!endp) { |
| 119 | // 4.4BSD/MacOSX *short* filenames are not guaranteed to have a |
| 120 | // terminator. Start at the end of the field and backtrack over spaces. |
| 121 | endp = startp + sizeof(Hdr->name); |
| 122 | while (endp[-1] == ' ') |
| 123 | --endp; |
| 124 | } |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 125 | std::string MemberName (startp, endp); |
John Criswell | 9059158 | 2003-12-22 16:22:49 +0000 | [diff] [blame] | 126 | std::string FullMemberName = ArchiveName + "(" + MemberName + ")"; |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 127 | |
Brian Gaeke | 60d6e54 | 2004-03-31 19:51:00 +0000 | [diff] [blame] | 128 | switch (getObjectType(Hdr, MemberName, MemberData, MemberSize)) { |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 129 | case SVR4LongFilename: |
| 130 | // If this is a long filename section, read all of the file names into the |
| 131 | // LongFilenames vector. |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 132 | LongFilenames.assign (MemberData, MemberData + MemberSize); |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 133 | break; |
| 134 | case UserObject: { |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 135 | Module *M = ParseBytecodeBuffer(MemberData, MemberSize, |
John Criswell | 9059158 | 2003-12-22 16:22:49 +0000 | [diff] [blame] | 136 | FullMemberName, ErrorStr); |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 137 | if (!M) return true; |
| 138 | Objects.push_back(M); |
| 139 | break; |
| 140 | } |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 141 | case ArchiveSymbolTable: |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 142 | if (ParseSymbolTableSection(MemberData, MemberSize, ErrorStr)) |
Brian Gaeke | 2c61d7b | 2003-11-16 23:08:48 +0000 | [diff] [blame] | 143 | return true; |
| 144 | break; |
| 145 | default: |
| 146 | std::cerr << "ReadArchiveBuffer: WARNING: Skipping unknown file: " |
John Criswell | 9059158 | 2003-12-22 16:22:49 +0000 | [diff] [blame] | 147 | << FullMemberName << "\n"; |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 148 | break; // Just ignore unknown files. |
| 149 | } |
| 150 | |
Brian Gaeke | 3c09636 | 2003-12-11 00:38:04 +0000 | [diff] [blame] | 151 | // Round SizeFromHeader up to an even number... |
| 152 | SizeFromHeader = (SizeFromHeader+1)/2*2; |
| 153 | Buffer += sizeof(ar_hdr)+SizeFromHeader; // Move to the next entry |
| 154 | Length -= sizeof(ar_hdr)+SizeFromHeader; |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 155 | } |
| 156 | |
| 157 | return Length != 0; |
| 158 | } |
| 159 | |
| 160 | |
Misha Brukman | 37f92e2 | 2003-09-11 22:34:13 +0000 | [diff] [blame] | 161 | // ReadArchiveFile - Read bytecode files from the specified .a file, returning |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 162 | // true on error, or false on success. This does not support reading files from |
| 163 | // standard input. |
| 164 | // |
Chris Lattner | 3446ae8 | 2004-01-10 19:00:15 +0000 | [diff] [blame] | 165 | bool llvm::ReadArchiveFile(const std::string &Filename, |
| 166 | std::vector<Module*> &Objects,std::string *ErrorStr){ |
Chris Lattner | fb777c2 | 2004-05-28 00:24:41 +0000 | [diff] [blame^] | 167 | unsigned Length; |
Chris Lattner | b70abe1 | 2003-12-30 07:40:35 +0000 | [diff] [blame] | 168 | |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 169 | // mmap in the file all at once... |
Chris Lattner | fb777c2 | 2004-05-28 00:24:41 +0000 | [diff] [blame^] | 170 | unsigned char *Buffer = |
| 171 | (unsigned char*)ReadFileIntoAddressSpace(Filename, Length); |
| 172 | if (Buffer == 0) { |
| 173 | if (ErrorStr) *ErrorStr = "Error reading file '" + Filename + "'!"; |
| 174 | return true; |
| 175 | } |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 176 | |
| 177 | // Parse the archive files we mmap'ped in |
Chris Lattner | 75f2053 | 2003-04-22 18:02:52 +0000 | [diff] [blame] | 178 | bool Result = ReadArchiveBuffer(Filename, Buffer, Length, Objects, ErrorStr); |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 179 | |
| 180 | // Unmmap the archive... |
Chris Lattner | fb777c2 | 2004-05-28 00:24:41 +0000 | [diff] [blame^] | 181 | UnmapFileFromAddressSpace(Buffer, Length); |
Chris Lattner | 968cfd0 | 2003-04-19 21:45:34 +0000 | [diff] [blame] | 182 | |
| 183 | if (Result) // Free any loaded objects |
| 184 | while (!Objects.empty()) { |
| 185 | delete Objects.back(); |
| 186 | Objects.pop_back(); |
| 187 | } |
| 188 | |
| 189 | return Result; |
| 190 | } |