blob: e12648386525ad5ee55a86fdc984e481de800b63 [file] [log] [blame]
Chris Lattner23219d12003-09-22 23:42:00 +00001//===- ArchiveReader.cpp - Code to read LLVM bytecode from .a files -------===//
John Criswellb576c942003-10-20 19:43:21 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by the LLVM research group and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
Chris Lattner968cfd02003-04-19 21:45:34 +00009//
// This file implements the ReadArchiveFile interface, which allows a linker to
// read all of the LLVM bytecode files contained in a .a file.  This file
// understands the standard system .a file format.  So far it handles the
// variant prevalent on Linux systems along with 4.4BSD/MacOSX-style long
// filenames, and it may be extended further.  See the BFD archive reader for
// more information on the format:
// http://sources.redhat.com/cgi-bin/cvsweb.cgi/src/bfd/archive.c?cvsroot=src
16//
17//===----------------------------------------------------------------------===//
18
19#include "llvm/Bytecode/Reader.h"
20#include "llvm/Module.h"
Reid Spencer551ccae2004-09-01 22:55:40 +000021#include "llvm/Support/FileUtilities.h"
Brian Gaeke2c61d7b2003-11-16 23:08:48 +000022#include <cstdlib>
Reid Spencer77cf2962004-07-04 11:01:27 +000023#include <iostream>
Chris Lattner3446ae82004-01-10 19:00:15 +000024using namespace llvm;
Brian Gaeked0fde302003-11-11 22:41:34 +000025
namespace {
  /// ar_hdr - The fixed-size header that is overlaid on the raw archive bytes
  /// in front of every member.  The field order and sizes define the layout,
  /// so they must not be rearranged.
  struct ar_hdr {
    char name[16];  // Member name (or an encoded reference to a long name)
    char date[12];  // Not examined by this reader
    char uid[6];    // Not examined by this reader
    char gid[6];    // Not examined by this reader
    char mode[8];   // Not examined by this reader
    char size[10];  // Member size in bytes, as ASCII decimal digits
    char fmag[2];   // Always equal to '`\n'
  };

  /// ObjectType - The classification that getObjectType assigns to each
  /// archive member.
  enum ObjectType {
    UserObject,          // A user .o/.bc file
    Unknown,             // Unknown file, just ignore it
    SVR4LongFilename,    // a "//" section used for long file names
    ArchiveSymbolTable   // Symbol table produced by ranlib.
  };
}
44
Brian Gaeke3c096362003-12-11 00:38:04 +000045/// getObjectType - Determine the type of object that this header represents.
46/// This is capable of parsing the variety of special sections used for various
47/// purposes.
48///
Brian Gaeke60d6e542004-03-31 19:51:00 +000049static enum ObjectType getObjectType(ar_hdr *H, std::string MemberName,
50 unsigned char *MemberData, unsigned Size) {
Chris Lattner968cfd02003-04-19 21:45:34 +000051 // Check for sections with special names...
Brian Gaeke60d6e542004-03-31 19:51:00 +000052 if (MemberName == "__.SYMDEF " || MemberName == "__.SYMDEF SORTED")
Brian Gaeke2c61d7b2003-11-16 23:08:48 +000053 return ArchiveSymbolTable;
Brian Gaeke60d6e542004-03-31 19:51:00 +000054 else if (MemberName == "// ")
Chris Lattner968cfd02003-04-19 21:45:34 +000055 return SVR4LongFilename;
56
57 // Check to see if it looks like an llvm object file...
Brian Gaeke3c096362003-12-11 00:38:04 +000058 if (Size >= 4 && !memcmp(MemberData, "llvm", 4))
Chris Lattner968cfd02003-04-19 21:45:34 +000059 return UserObject;
60
John Criswellb5810282004-11-09 19:37:07 +000061 if (Size >= 4 && !memcmp(MemberData, "llvc", 4))
62 return UserObject;
63
Chris Lattner968cfd02003-04-19 21:45:34 +000064 return Unknown;
65}
66
/// Error - Store Message into *ErrorStr when the caller supplied a string to
/// receive it, then return true so that callers can simply write
/// "return Error(...)" on a failure path.
///
static inline bool Error(std::string *ErrorStr, const char *Message) {
  if (ErrorStr != 0)
    ErrorStr->assign(Message);
  return true;
}
71
/// ParseSymbolTableSection - Placeholder for parsing an archive symbol table
/// member.  Nothing is read from Buffer and nothing is written to S; the
/// function always reports success by returning false.
///
static bool ParseSymbolTableSection(unsigned char *Buffer, unsigned Size,
                                    std::string *S) {
  // Currently not supported (succeeds without doing anything)
  (void)Buffer;
  (void)Size;
  (void)S;
  const bool HadError = false;
  return HadError;
}
Chris Lattner968cfd02003-04-19 21:45:34 +000077
Brian Gaeke2c61d7b2003-11-16 23:08:48 +000078static bool ReadArchiveBuffer(const std::string &ArchiveName,
Chris Lattner75f20532003-04-22 18:02:52 +000079 unsigned char *Buffer, unsigned Length,
Chris Lattner968cfd02003-04-19 21:45:34 +000080 std::vector<Module*> &Objects,
81 std::string *ErrorStr) {
82 if (Length < 8 || memcmp(Buffer, "!<arch>\n", 8))
83 return Error(ErrorStr, "signature incorrect for an archive file!");
84 Buffer += 8; Length -= 8; // Skip the magic string.
85
Brian Gaeke2c61d7b2003-11-16 23:08:48 +000086 std::vector<char> LongFilenames;
Chris Lattner968cfd02003-04-19 21:45:34 +000087
88 while (Length >= sizeof(ar_hdr)) {
89 ar_hdr *Hdr = (ar_hdr*)Buffer;
Brian Gaeke3c096362003-12-11 00:38:04 +000090 unsigned SizeFromHeader = atoi(Hdr->size);
91 if (SizeFromHeader + sizeof(ar_hdr) > Length)
Chris Lattner968cfd02003-04-19 21:45:34 +000092 return Error(ErrorStr, "invalid record length in archive file!");
93
Brian Gaeke3c096362003-12-11 00:38:04 +000094 unsigned char *MemberData = Buffer + sizeof(ar_hdr);
95 unsigned MemberSize = SizeFromHeader;
Brian Gaeke2c61d7b2003-11-16 23:08:48 +000096 // Get name of archive member.
97 char *startp = Hdr->name;
Brian Gaeke3c096362003-12-11 00:38:04 +000098 char *endp = (char *) memchr (startp, '/', sizeof(ar_hdr));
99 if (memcmp (Hdr->name, "#1/", 3) == 0) {
100 // 4.4BSD/MacOSX long filenames are abbreviated as "#1/L", where L is an
101 // ASCII-coded decimal number representing the length of the name buffer,
102 // which is prepended to the archive member's contents.
103 unsigned NameLength = atoi (&Hdr->name[3]);
104 startp = (char *) MemberData;
105 endp = startp + NameLength;
106 MemberData += NameLength;
107 MemberSize -= NameLength;
108 } else if (startp == endp && isdigit (Hdr->name[1])) {
109 // SVR4 long filenames are abbreviated as "/I", where I is
110 // an ASCII-coded decimal index into the LongFilenames vector.
111 unsigned NameIndex = atoi (&Hdr->name[1]);
112 assert (LongFilenames.size () > NameIndex
113 && "SVR4-style long filename for archive member not found");
114 startp = &LongFilenames[NameIndex];
Brian Gaeke2c61d7b2003-11-16 23:08:48 +0000115 endp = strchr (startp, '/');
Brian Gaeke60d6e542004-03-31 19:51:00 +0000116 } else if (startp == endp && Hdr->name[1] == '/') {
117 // This is for the SVR4 long filename table (there might be other
118 // names starting with // but I don't know about them). Make sure that
119 // getObjectType sees it.
120 endp = &Hdr->name[sizeof (Hdr->name)];
Brian Gaeke2c61d7b2003-11-16 23:08:48 +0000121 }
Brian Gaeke3c096362003-12-11 00:38:04 +0000122 if (!endp) {
123 // 4.4BSD/MacOSX *short* filenames are not guaranteed to have a
124 // terminator. Start at the end of the field and backtrack over spaces.
125 endp = startp + sizeof(Hdr->name);
126 while (endp[-1] == ' ')
127 --endp;
128 }
Brian Gaeke2c61d7b2003-11-16 23:08:48 +0000129 std::string MemberName (startp, endp);
John Criswell90591582003-12-22 16:22:49 +0000130 std::string FullMemberName = ArchiveName + "(" + MemberName + ")";
Brian Gaeke2c61d7b2003-11-16 23:08:48 +0000131
Brian Gaeke60d6e542004-03-31 19:51:00 +0000132 switch (getObjectType(Hdr, MemberName, MemberData, MemberSize)) {
Chris Lattner968cfd02003-04-19 21:45:34 +0000133 case SVR4LongFilename:
134 // If this is a long filename section, read all of the file names into the
135 // LongFilenames vector.
Brian Gaeke3c096362003-12-11 00:38:04 +0000136 LongFilenames.assign (MemberData, MemberData + MemberSize);
Chris Lattner968cfd02003-04-19 21:45:34 +0000137 break;
138 case UserObject: {
Brian Gaeke3c096362003-12-11 00:38:04 +0000139 Module *M = ParseBytecodeBuffer(MemberData, MemberSize,
John Criswell90591582003-12-22 16:22:49 +0000140 FullMemberName, ErrorStr);
Chris Lattner968cfd02003-04-19 21:45:34 +0000141 if (!M) return true;
142 Objects.push_back(M);
143 break;
144 }
Brian Gaeke2c61d7b2003-11-16 23:08:48 +0000145 case ArchiveSymbolTable:
Brian Gaeke3c096362003-12-11 00:38:04 +0000146 if (ParseSymbolTableSection(MemberData, MemberSize, ErrorStr))
Brian Gaeke2c61d7b2003-11-16 23:08:48 +0000147 return true;
148 break;
149 default:
150 std::cerr << "ReadArchiveBuffer: WARNING: Skipping unknown file: "
John Criswell90591582003-12-22 16:22:49 +0000151 << FullMemberName << "\n";
Chris Lattner968cfd02003-04-19 21:45:34 +0000152 break; // Just ignore unknown files.
153 }
154
Brian Gaeke3c096362003-12-11 00:38:04 +0000155 // Round SizeFromHeader up to an even number...
156 SizeFromHeader = (SizeFromHeader+1)/2*2;
157 Buffer += sizeof(ar_hdr)+SizeFromHeader; // Move to the next entry
158 Length -= sizeof(ar_hdr)+SizeFromHeader;
Chris Lattner968cfd02003-04-19 21:45:34 +0000159 }
160
161 return Length != 0;
162}
163
164
Misha Brukman37f92e22003-09-11 22:34:13 +0000165// ReadArchiveFile - Read bytecode files from the specified .a file, returning
Chris Lattner968cfd02003-04-19 21:45:34 +0000166// true on error, or false on success. This does not support reading files from
167// standard input.
168//
Chris Lattner3446ae82004-01-10 19:00:15 +0000169bool llvm::ReadArchiveFile(const std::string &Filename,
170 std::vector<Module*> &Objects,std::string *ErrorStr){
Chris Lattnerfb777c22004-05-28 00:24:41 +0000171 unsigned Length;
Chris Lattnerb70abe12003-12-30 07:40:35 +0000172
Chris Lattner968cfd02003-04-19 21:45:34 +0000173 // mmap in the file all at once...
Chris Lattnerfb777c22004-05-28 00:24:41 +0000174 unsigned char *Buffer =
175 (unsigned char*)ReadFileIntoAddressSpace(Filename, Length);
176 if (Buffer == 0) {
177 if (ErrorStr) *ErrorStr = "Error reading file '" + Filename + "'!";
178 return true;
179 }
Chris Lattner968cfd02003-04-19 21:45:34 +0000180
181 // Parse the archive files we mmap'ped in
Chris Lattner75f20532003-04-22 18:02:52 +0000182 bool Result = ReadArchiveBuffer(Filename, Buffer, Length, Objects, ErrorStr);
Chris Lattner968cfd02003-04-19 21:45:34 +0000183
184 // Unmmap the archive...
Chris Lattnerfb777c22004-05-28 00:24:41 +0000185 UnmapFileFromAddressSpace(Buffer, Length);
Chris Lattner968cfd02003-04-19 21:45:34 +0000186
187 if (Result) // Free any loaded objects
188 while (!Objects.empty()) {
189 delete Objects.back();
190 Objects.pop_back();
191 }
192
193 return Result;
194}