blob: aff7ab8f1e6bc1450196c63991e89f563f36b746 [file] [log] [blame]
Reid Spencer362cbf02004-11-06 08:51:45 +00001//===-- Archive.cpp - Generic LLVM archive functions ------------*- C++ -*-===//
Misha Brukman2b37d7c2005-04-21 21:13:18 +00002//
Reid Spencer362cbf02004-11-06 08:51:45 +00003// The LLVM Compiler Infrastructure
4//
Misha Brukman2b37d7c2005-04-21 21:13:18 +00005// This file was developed by Reid Spencer and is distributed under the
Reid Spencer362cbf02004-11-06 08:51:45 +00006// University of Illinois Open Source License. See LICENSE.TXT for details.
Misha Brukman2b37d7c2005-04-21 21:13:18 +00007//
Reid Spencer362cbf02004-11-06 08:51:45 +00008//===----------------------------------------------------------------------===//
9//
// This file contains the implementation of the parts of the Archive and
// ArchiveMember classes that are common to both reading and writing archives.
Reid Spencer362cbf02004-11-06 08:51:45 +000012//
13//===----------------------------------------------------------------------===//
14
15#include "ArchiveInternals.h"
Reid Spencercf6afc62004-11-14 21:56:59 +000016#include "llvm/ModuleProvider.h"
Chris Lattnerf36c7b82007-02-07 23:53:17 +000017#include "llvm/Module.h"
18#include "llvm/Bytecode/Reader.h"
Reid Spencer8e827e82005-04-21 17:49:57 +000019#include "llvm/System/Process.h"
Reid Spencer362cbf02004-11-06 08:51:45 +000020using namespace llvm;
21
Reid Spencercf6afc62004-11-14 21:56:59 +000022// getMemberSize - compute the actual physical size of the file member as seen
23// on disk. This isn't the size of member's payload. Use getSize() for that.
24unsigned
25ArchiveMember::getMemberSize() const {
26 // Basically its the file size plus the header size
27 unsigned result = info.fileSize + sizeof(ArchiveMemberHeader);
28
29 // If it has a long filename, include the name length
30 if (hasLongFilename())
Reid Spencer1fce0912004-12-11 00:14:15 +000031 result += path.toString().length() + 1;
Reid Spencercf6afc62004-11-14 21:56:59 +000032
33 // If its now odd lengthed, include the padding byte
Misha Brukman2b37d7c2005-04-21 21:13:18 +000034 if (result % 2 != 0 )
Reid Spencercf6afc62004-11-14 21:56:59 +000035 result++;
36
37 return result;
Reid Spencer362cbf02004-11-06 08:51:45 +000038}
39
Reid Spencercf6afc62004-11-14 21:56:59 +000040// This default constructor is only use by the ilist when it creates its
41// sentry node. We give it specific static values to make it stand out a bit.
Misha Brukman2b37d7c2005-04-21 21:13:18 +000042ArchiveMember::ArchiveMember()
Jeff Cohen943b9b62006-05-06 23:25:53 +000043 : next(0), prev(0), parent(0), path("--invalid--"), flags(0), data(0)
Reid Spencercf6afc62004-11-14 21:56:59 +000044{
Reid Spencer8e827e82005-04-21 17:49:57 +000045 info.user = sys::Process::GetCurrentUserId();
Misha Brukman2b37d7c2005-04-21 21:13:18 +000046 info.group = sys::Process::GetCurrentGroupId();
47 info.mode = 0777;
48 info.fileSize = 0;
Reid Spencercf6afc62004-11-14 21:56:59 +000049 info.modTime = sys::TimeValue::now();
50}
51
52// This is the constructor that the Archive class uses when it is building or
53// reading an archive. It just defaults a few things and ensures the parent is
Misha Brukman2b37d7c2005-04-21 21:13:18 +000054// set for the iplist. The Archive class fills in the ArchiveMember's data.
55// This is required because correctly setting the data may depend on other
Reid Spencercf6afc62004-11-14 21:56:59 +000056// things in the Archive.
57ArchiveMember::ArchiveMember(Archive* PAR)
58 : next(0), prev(0), parent(PAR), path(), flags(0), data(0)
59{
60}
61
Misha Brukman2b37d7c2005-04-21 21:13:18 +000062// This method allows an ArchiveMember to be replaced with the data for a
Reid Spencercf6afc62004-11-14 21:56:59 +000063// different file, presumably as an update to the member. It also makes sure
64// the flags are reset correctly.
Reid Spencer0ff2d312006-08-24 23:45:08 +000065bool ArchiveMember::replaceWith(const sys::Path& newFile, std::string* ErrMsg) {
Reid Spencercd5561a2006-12-15 19:44:51 +000066 if (!newFile.exists()) {
67 if (ErrMsg)
68 *ErrMsg = "Can not replace an archive member with a non-existent file";
69 return true;
70 }
71
Reid Spencercf6afc62004-11-14 21:56:59 +000072 data = 0;
73 path = newFile;
74
Reid Spencer9a29db42004-11-20 07:29:40 +000075 // SVR4 symbol tables have an empty name
Reid Spencer1fce0912004-12-11 00:14:15 +000076 if (path.toString() == ARFILE_SVR4_SYMTAB_NAME)
Reid Spencer9a29db42004-11-20 07:29:40 +000077 flags |= SVR4SymbolTableFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +000078 else
Reid Spencer9a29db42004-11-20 07:29:40 +000079 flags &= ~SVR4SymbolTableFlag;
80
81 // BSD4.4 symbol tables have a special name
Reid Spencer1fce0912004-12-11 00:14:15 +000082 if (path.toString() == ARFILE_BSD4_SYMTAB_NAME)
Reid Spencer9a29db42004-11-20 07:29:40 +000083 flags |= BSD4SymbolTableFlag;
84 else
85 flags &= ~BSD4SymbolTableFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +000086
87 // LLVM symbol tables have a very specific name
Reid Spencer1fce0912004-12-11 00:14:15 +000088 if (path.toString() == ARFILE_LLVM_SYMTAB_NAME)
Reid Spencercf6afc62004-11-14 21:56:59 +000089 flags |= LLVMSymbolTableFlag;
90 else
91 flags &= ~LLVMSymbolTableFlag;
92
93 // String table name
Reid Spencer1fce0912004-12-11 00:14:15 +000094 if (path.toString() == ARFILE_STRTAB_NAME)
Reid Spencercf6afc62004-11-14 21:56:59 +000095 flags |= StringTableFlag;
96 else
97 flags &= ~StringTableFlag;
98
99 // If it has a slash then it has a path
Reid Spencer1fce0912004-12-11 00:14:15 +0000100 bool hasSlash = path.toString().find('/') != std::string::npos;
Reid Spencercf6afc62004-11-14 21:56:59 +0000101 if (hasSlash)
102 flags |= HasPathFlag;
103 else
104 flags &= ~HasPathFlag;
105
106 // If it has a slash or its over 15 chars then its a long filename format
Reid Spencer1fce0912004-12-11 00:14:15 +0000107 if (hasSlash || path.toString().length() > 15)
Reid Spencercf6afc62004-11-14 21:56:59 +0000108 flags |= HasLongFilenameFlag;
109 else
110 flags &= ~HasLongFilenameFlag;
111
112 // Get the signature and status info
Reid Spencercf6afc62004-11-14 21:56:59 +0000113 const char* signature = (const char*) data;
Chris Lattner252ad032006-07-28 22:03:44 +0000114 std::string magic;
Reid Spencercf6afc62004-11-14 21:56:59 +0000115 if (!signature) {
116 path.getMagicNumber(magic,4);
117 signature = magic.c_str();
Chris Lattner252ad032006-07-28 22:03:44 +0000118 std::string err;
Reid Spencer5ba2b702007-03-29 16:48:16 +0000119 if (path.getFileStatus(info, false, ErrMsg))
Reid Spencer0ff2d312006-08-24 23:45:08 +0000120 return true;
Reid Spencercf6afc62004-11-14 21:56:59 +0000121 }
122
123 // Determine what kind of file it is
124 switch (sys::IdentifyFileType(signature,4)) {
125 case sys::BytecodeFileType:
126 flags |= BytecodeFlag;
127 break;
128 case sys::CompressedBytecodeFileType:
129 flags |= CompressedBytecodeFlag;
130 flags &= ~CompressedFlag;
131 break;
132 default:
133 flags &= ~(BytecodeFlag|CompressedBytecodeFlag);
134 break;
135 }
Reid Spencer0ff2d312006-08-24 23:45:08 +0000136 return false;
Reid Spencercf6afc62004-11-14 21:56:59 +0000137}
138
139// Archive constructor - this is the only constructor that gets used for the
Misha Brukman2b37d7c2005-04-21 21:13:18 +0000140// Archive class. Everything else (default,copy) is deprecated. This just
Reid Spencercf6afc62004-11-14 21:56:59 +0000141// initializes and maps the file into memory, if requested.
Chris Lattnerf2e292c2007-02-07 21:41:02 +0000142Archive::Archive(const sys::Path& filename, BCDecompressor_t *BCDC)
Reid Spencer1f465802004-11-16 06:47:07 +0000143 : archPath(filename), members(), mapfile(0), base(0), symTab(), strtab(),
Chris Lattnerf2e292c2007-02-07 21:41:02 +0000144 symTabSize(0), firstFileOffset(0), modules(), foreignST(0),
145 Decompressor(BCDC) {
Reid Spencer0ff2d312006-08-24 23:45:08 +0000146}
147
148bool
149Archive::mapToMemory(std::string* ErrMsg)
150{
151 mapfile = new sys::MappedFile();
152 if (mapfile->open(archPath, sys::MappedFile::READ_ACCESS, ErrMsg))
153 return true;
154 if (!(base = (char*) mapfile->map(ErrMsg)))
155 return true;
156 return false;
Reid Spencercf6afc62004-11-14 21:56:59 +0000157}
158
Reid Spencer6ff72402005-11-30 05:21:10 +0000159void Archive::cleanUpMemory() {
Reid Spencercf6afc62004-11-14 21:56:59 +0000160 // Shutdown the file mapping
161 if (mapfile) {
Jeff Cohend19d89a2005-01-28 01:17:07 +0000162 mapfile->close();
Reid Spencercf6afc62004-11-14 21:56:59 +0000163 delete mapfile;
Reid Spencer6ff72402005-11-30 05:21:10 +0000164
165 mapfile = 0;
166 base = 0;
Reid Spencercf6afc62004-11-14 21:56:59 +0000167 }
Reid Spencer6ff72402005-11-30 05:21:10 +0000168
169 // Forget the entire symbol table
170 symTab.clear();
171 symTabSize = 0;
172
173 firstFileOffset = 0;
174
175 // Free the foreign symbol table member
176 if (foreignST) {
177 delete foreignST;
178 foreignST = 0;
179 }
180
Reid Spencercf6afc62004-11-14 21:56:59 +0000181 // Delete any ModuleProviders and ArchiveMember's we've allocated as a result
182 // of symbol table searches.
183 for (ModuleMap::iterator I=modules.begin(), E=modules.end(); I != E; ++I ) {
184 delete I->second.first;
185 delete I->second.second;
186 }
Reid Spencer362cbf02004-11-06 08:51:45 +0000187}
188
Reid Spencer6ff72402005-11-30 05:21:10 +0000189// Archive destructor - just clean up memory
190Archive::~Archive() {
191 cleanUpMemory();
192}
193
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000194
195
196static void getSymbols(Module*M, std::vector<std::string>& symbols) {
197 // Loop over global variables
198 for (Module::global_iterator GI = M->global_begin(), GE=M->global_end(); GI != GE; ++GI)
199 if (!GI->isDeclaration() && !GI->hasInternalLinkage())
200 if (!GI->getName().empty())
201 symbols.push_back(GI->getName());
202
203 // Loop over functions.
204 for (Module::iterator FI = M->begin(), FE = M->end(); FI != FE; ++FI)
205 if (!FI->isDeclaration() && !FI->hasInternalLinkage())
206 if (!FI->getName().empty())
207 symbols.push_back(FI->getName());
208}
209
210// Get just the externally visible defined symbols from the bytecode
211bool llvm::GetBytecodeSymbols(const sys::Path& fName,
212 std::vector<std::string>& symbols,
213 BCDecompressor_t *BCDC,
214 std::string* ErrMsg) {
215 ModuleProvider *MP = getBytecodeModuleProvider(fName.toString(), BCDC,ErrMsg);
216 if (!MP)
217 return true;
218
219 // Get the module from the provider
220 Module* M = MP->materializeModule();
221 if (M == 0) {
222 delete MP;
223 return true;
224 }
225
226 // Get the symbols
227 getSymbols(M, symbols);
228
229 // Done with the module.
230 delete MP;
231 return true;
232}
233
234ModuleProvider*
235llvm::GetBytecodeSymbols(const unsigned char*Buffer, unsigned Length,
236 const std::string& ModuleID,
237 std::vector<std::string>& symbols,
238 BCDecompressor_t *BCDC,
239 std::string* ErrMsg) {
240 // Get the module provider
241 ModuleProvider* MP =
242 getBytecodeBufferModuleProvider(Buffer, Length, ModuleID, BCDC, ErrMsg, 0);
243 if (!MP)
244 return 0;
245
246 // Get the module from the provider
247 Module* M = MP->materializeModule();
248 if (M == 0) {
249 delete MP;
250 return 0;
251 }
252
253 // Get the symbols
254 getSymbols(M, symbols);
255
256 // Done with the module. Note that ModuleProvider will delete the
257 // Module when it is deleted. Also note that its the caller's responsibility
258 // to delete the ModuleProvider.
259 return MP;
260}