blob: f9fa80748bcc8360b41185eb000f5170ee1f6868 [file] [log] [blame]
Reid Spencer362cbf02004-11-06 08:51:45 +00001//===-- Archive.cpp - Generic LLVM archive functions ------------*- C++ -*-===//
Misha Brukman2b37d7c2005-04-21 21:13:18 +00002//
Reid Spencer362cbf02004-11-06 08:51:45 +00003// The LLVM Compiler Infrastructure
4//
Misha Brukman2b37d7c2005-04-21 21:13:18 +00005// This file was developed by Reid Spencer and is distributed under the
Reid Spencer362cbf02004-11-06 08:51:45 +00006// University of Illinois Open Source License. See LICENSE.TXT for details.
Misha Brukman2b37d7c2005-04-21 21:13:18 +00007//
Reid Spencer362cbf02004-11-06 08:51:45 +00008//===----------------------------------------------------------------------===//
9//
// This file contains the implementation of the Archive and ArchiveMember
// classes that is common to both reading and writing archives.
Reid Spencer362cbf02004-11-06 08:51:45 +000012//
13//===----------------------------------------------------------------------===//
14
15#include "ArchiveInternals.h"
Reid Spencercf6afc62004-11-14 21:56:59 +000016#include "llvm/ModuleProvider.h"
Chris Lattnerf36c7b82007-02-07 23:53:17 +000017#include "llvm/Module.h"
18#include "llvm/Bytecode/Reader.h"
Reid Spencer8e827e82005-04-21 17:49:57 +000019#include "llvm/System/Process.h"
Reid Spencer362cbf02004-11-06 08:51:45 +000020using namespace llvm;
21
Reid Spencercf6afc62004-11-14 21:56:59 +000022// getMemberSize - compute the actual physical size of the file member as seen
23// on disk. This isn't the size of member's payload. Use getSize() for that.
24unsigned
25ArchiveMember::getMemberSize() const {
26 // Basically its the file size plus the header size
27 unsigned result = info.fileSize + sizeof(ArchiveMemberHeader);
28
29 // If it has a long filename, include the name length
30 if (hasLongFilename())
Reid Spencer1fce0912004-12-11 00:14:15 +000031 result += path.toString().length() + 1;
Reid Spencercf6afc62004-11-14 21:56:59 +000032
33 // If its now odd lengthed, include the padding byte
Misha Brukman2b37d7c2005-04-21 21:13:18 +000034 if (result % 2 != 0 )
Reid Spencercf6afc62004-11-14 21:56:59 +000035 result++;
36
37 return result;
Reid Spencer362cbf02004-11-06 08:51:45 +000038}
39
Reid Spencercf6afc62004-11-14 21:56:59 +000040// This default constructor is only use by the ilist when it creates its
41// sentry node. We give it specific static values to make it stand out a bit.
Misha Brukman2b37d7c2005-04-21 21:13:18 +000042ArchiveMember::ArchiveMember()
Jeff Cohen943b9b62006-05-06 23:25:53 +000043 : next(0), prev(0), parent(0), path("--invalid--"), flags(0), data(0)
Reid Spencercf6afc62004-11-14 21:56:59 +000044{
Reid Spencer8e827e82005-04-21 17:49:57 +000045 info.user = sys::Process::GetCurrentUserId();
Misha Brukman2b37d7c2005-04-21 21:13:18 +000046 info.group = sys::Process::GetCurrentGroupId();
47 info.mode = 0777;
48 info.fileSize = 0;
Reid Spencercf6afc62004-11-14 21:56:59 +000049 info.modTime = sys::TimeValue::now();
50}
51
52// This is the constructor that the Archive class uses when it is building or
53// reading an archive. It just defaults a few things and ensures the parent is
Misha Brukman2b37d7c2005-04-21 21:13:18 +000054// set for the iplist. The Archive class fills in the ArchiveMember's data.
55// This is required because correctly setting the data may depend on other
Reid Spencercf6afc62004-11-14 21:56:59 +000056// things in the Archive.
57ArchiveMember::ArchiveMember(Archive* PAR)
58 : next(0), prev(0), parent(PAR), path(), flags(0), data(0)
59{
60}
61
Misha Brukman2b37d7c2005-04-21 21:13:18 +000062// This method allows an ArchiveMember to be replaced with the data for a
Reid Spencercf6afc62004-11-14 21:56:59 +000063// different file, presumably as an update to the member. It also makes sure
64// the flags are reset correctly.
Reid Spencer0ff2d312006-08-24 23:45:08 +000065bool ArchiveMember::replaceWith(const sys::Path& newFile, std::string* ErrMsg) {
Reid Spencercd5561a2006-12-15 19:44:51 +000066 if (!newFile.exists()) {
67 if (ErrMsg)
68 *ErrMsg = "Can not replace an archive member with a non-existent file";
69 return true;
70 }
71
Reid Spencercf6afc62004-11-14 21:56:59 +000072 data = 0;
73 path = newFile;
74
Reid Spencer9a29db42004-11-20 07:29:40 +000075 // SVR4 symbol tables have an empty name
Reid Spencer1fce0912004-12-11 00:14:15 +000076 if (path.toString() == ARFILE_SVR4_SYMTAB_NAME)
Reid Spencer9a29db42004-11-20 07:29:40 +000077 flags |= SVR4SymbolTableFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +000078 else
Reid Spencer9a29db42004-11-20 07:29:40 +000079 flags &= ~SVR4SymbolTableFlag;
80
81 // BSD4.4 symbol tables have a special name
Reid Spencer1fce0912004-12-11 00:14:15 +000082 if (path.toString() == ARFILE_BSD4_SYMTAB_NAME)
Reid Spencer9a29db42004-11-20 07:29:40 +000083 flags |= BSD4SymbolTableFlag;
84 else
85 flags &= ~BSD4SymbolTableFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +000086
87 // LLVM symbol tables have a very specific name
Reid Spencer1fce0912004-12-11 00:14:15 +000088 if (path.toString() == ARFILE_LLVM_SYMTAB_NAME)
Reid Spencercf6afc62004-11-14 21:56:59 +000089 flags |= LLVMSymbolTableFlag;
90 else
91 flags &= ~LLVMSymbolTableFlag;
92
93 // String table name
Reid Spencer1fce0912004-12-11 00:14:15 +000094 if (path.toString() == ARFILE_STRTAB_NAME)
Reid Spencercf6afc62004-11-14 21:56:59 +000095 flags |= StringTableFlag;
96 else
97 flags &= ~StringTableFlag;
98
99 // If it has a slash then it has a path
Reid Spencer1fce0912004-12-11 00:14:15 +0000100 bool hasSlash = path.toString().find('/') != std::string::npos;
Reid Spencercf6afc62004-11-14 21:56:59 +0000101 if (hasSlash)
102 flags |= HasPathFlag;
103 else
104 flags &= ~HasPathFlag;
105
106 // If it has a slash or its over 15 chars then its a long filename format
Reid Spencer1fce0912004-12-11 00:14:15 +0000107 if (hasSlash || path.toString().length() > 15)
Reid Spencercf6afc62004-11-14 21:56:59 +0000108 flags |= HasLongFilenameFlag;
109 else
110 flags &= ~HasLongFilenameFlag;
111
112 // Get the signature and status info
Reid Spencercf6afc62004-11-14 21:56:59 +0000113 const char* signature = (const char*) data;
Chris Lattner252ad032006-07-28 22:03:44 +0000114 std::string magic;
Reid Spencercf6afc62004-11-14 21:56:59 +0000115 if (!signature) {
116 path.getMagicNumber(magic,4);
117 signature = magic.c_str();
Chris Lattner252ad032006-07-28 22:03:44 +0000118 std::string err;
Reid Spencer8475ec02007-03-29 19:05:44 +0000119 const sys::FileStatus *FSinfo = path.getFileStatus(false, ErrMsg);
120 if (FSinfo)
121 info = *FSinfo;
122 else
Reid Spencer0ff2d312006-08-24 23:45:08 +0000123 return true;
Reid Spencercf6afc62004-11-14 21:56:59 +0000124 }
125
126 // Determine what kind of file it is
127 switch (sys::IdentifyFileType(signature,4)) {
128 case sys::BytecodeFileType:
129 flags |= BytecodeFlag;
130 break;
131 case sys::CompressedBytecodeFileType:
132 flags |= CompressedBytecodeFlag;
133 flags &= ~CompressedFlag;
134 break;
135 default:
136 flags &= ~(BytecodeFlag|CompressedBytecodeFlag);
137 break;
138 }
Reid Spencer0ff2d312006-08-24 23:45:08 +0000139 return false;
Reid Spencercf6afc62004-11-14 21:56:59 +0000140}
141
142// Archive constructor - this is the only constructor that gets used for the
Misha Brukman2b37d7c2005-04-21 21:13:18 +0000143// Archive class. Everything else (default,copy) is deprecated. This just
Reid Spencercf6afc62004-11-14 21:56:59 +0000144// initializes and maps the file into memory, if requested.
Chris Lattnerf2e292c2007-02-07 21:41:02 +0000145Archive::Archive(const sys::Path& filename, BCDecompressor_t *BCDC)
Reid Spencer1f465802004-11-16 06:47:07 +0000146 : archPath(filename), members(), mapfile(0), base(0), symTab(), strtab(),
Chris Lattnerf2e292c2007-02-07 21:41:02 +0000147 symTabSize(0), firstFileOffset(0), modules(), foreignST(0),
148 Decompressor(BCDC) {
Reid Spencer0ff2d312006-08-24 23:45:08 +0000149}
150
151bool
152Archive::mapToMemory(std::string* ErrMsg)
153{
154 mapfile = new sys::MappedFile();
155 if (mapfile->open(archPath, sys::MappedFile::READ_ACCESS, ErrMsg))
156 return true;
157 if (!(base = (char*) mapfile->map(ErrMsg)))
158 return true;
159 return false;
Reid Spencercf6afc62004-11-14 21:56:59 +0000160}
161
Reid Spencer6ff72402005-11-30 05:21:10 +0000162void Archive::cleanUpMemory() {
Reid Spencercf6afc62004-11-14 21:56:59 +0000163 // Shutdown the file mapping
164 if (mapfile) {
Jeff Cohend19d89a2005-01-28 01:17:07 +0000165 mapfile->close();
Reid Spencercf6afc62004-11-14 21:56:59 +0000166 delete mapfile;
Reid Spencer6ff72402005-11-30 05:21:10 +0000167
168 mapfile = 0;
169 base = 0;
Reid Spencercf6afc62004-11-14 21:56:59 +0000170 }
Reid Spencer6ff72402005-11-30 05:21:10 +0000171
172 // Forget the entire symbol table
173 symTab.clear();
174 symTabSize = 0;
175
176 firstFileOffset = 0;
177
178 // Free the foreign symbol table member
179 if (foreignST) {
180 delete foreignST;
181 foreignST = 0;
182 }
183
Reid Spencercf6afc62004-11-14 21:56:59 +0000184 // Delete any ModuleProviders and ArchiveMember's we've allocated as a result
185 // of symbol table searches.
186 for (ModuleMap::iterator I=modules.begin(), E=modules.end(); I != E; ++I ) {
187 delete I->second.first;
188 delete I->second.second;
189 }
Reid Spencer362cbf02004-11-06 08:51:45 +0000190}
191
Reid Spencer6ff72402005-11-30 05:21:10 +0000192// Archive destructor - just clean up memory
193Archive::~Archive() {
194 cleanUpMemory();
195}
196
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000197
198
199static void getSymbols(Module*M, std::vector<std::string>& symbols) {
200 // Loop over global variables
201 for (Module::global_iterator GI = M->global_begin(), GE=M->global_end(); GI != GE; ++GI)
202 if (!GI->isDeclaration() && !GI->hasInternalLinkage())
203 if (!GI->getName().empty())
204 symbols.push_back(GI->getName());
205
206 // Loop over functions.
207 for (Module::iterator FI = M->begin(), FE = M->end(); FI != FE; ++FI)
208 if (!FI->isDeclaration() && !FI->hasInternalLinkage())
209 if (!FI->getName().empty())
210 symbols.push_back(FI->getName());
211}
212
213// Get just the externally visible defined symbols from the bytecode
214bool llvm::GetBytecodeSymbols(const sys::Path& fName,
215 std::vector<std::string>& symbols,
216 BCDecompressor_t *BCDC,
217 std::string* ErrMsg) {
218 ModuleProvider *MP = getBytecodeModuleProvider(fName.toString(), BCDC,ErrMsg);
219 if (!MP)
220 return true;
221
222 // Get the module from the provider
223 Module* M = MP->materializeModule();
224 if (M == 0) {
225 delete MP;
226 return true;
227 }
228
229 // Get the symbols
230 getSymbols(M, symbols);
231
232 // Done with the module.
233 delete MP;
234 return true;
235}
236
237ModuleProvider*
238llvm::GetBytecodeSymbols(const unsigned char*Buffer, unsigned Length,
239 const std::string& ModuleID,
240 std::vector<std::string>& symbols,
241 BCDecompressor_t *BCDC,
242 std::string* ErrMsg) {
243 // Get the module provider
244 ModuleProvider* MP =
245 getBytecodeBufferModuleProvider(Buffer, Length, ModuleID, BCDC, ErrMsg, 0);
246 if (!MP)
247 return 0;
248
249 // Get the module from the provider
250 Module* M = MP->materializeModule();
251 if (M == 0) {
252 delete MP;
253 return 0;
254 }
255
256 // Get the symbols
257 getSymbols(M, symbols);
258
259 // Done with the module. Note that ModuleProvider will delete the
260 // Module when it is deleted. Also note that its the caller's responsibility
261 // to delete the ModuleProvider.
262 return MP;
263}