blob: 7fbd15e59fcb11f11109a12ca62adbd24d69a50f [file] [log] [blame]
Reid Spencer362cbf02004-11-06 08:51:45 +00001//===-- Archive.cpp - Generic LLVM archive functions ------------*- C++ -*-===//
Misha Brukman2b37d7c2005-04-21 21:13:18 +00002//
Reid Spencer362cbf02004-11-06 08:51:45 +00003// The LLVM Compiler Infrastructure
4//
Misha Brukman2b37d7c2005-04-21 21:13:18 +00005// This file was developed by Reid Spencer and is distributed under the
Reid Spencer362cbf02004-11-06 08:51:45 +00006// University of Illinois Open Source License. See LICENSE.TXT for details.
Misha Brukman2b37d7c2005-04-21 21:13:18 +00007//
Reid Spencer362cbf02004-11-06 08:51:45 +00008//===----------------------------------------------------------------------===//
9//
// This file contains the implementation of the Archive and ArchiveMember
// classes that is common to both reading and writing archives.
Reid Spencer362cbf02004-11-06 08:51:45 +000012//
13//===----------------------------------------------------------------------===//
14
15#include "ArchiveInternals.h"
Reid Spencercf6afc62004-11-14 21:56:59 +000016#include "llvm/ModuleProvider.h"
Chris Lattnerf36c7b82007-02-07 23:53:17 +000017#include "llvm/Module.h"
18#include "llvm/Bytecode/Reader.h"
Reid Spencer8e827e82005-04-21 17:49:57 +000019#include "llvm/System/Process.h"
Reid Spencer362cbf02004-11-06 08:51:45 +000020using namespace llvm;
21
Reid Spencercf6afc62004-11-14 21:56:59 +000022// getMemberSize - compute the actual physical size of the file member as seen
23// on disk. This isn't the size of member's payload. Use getSize() for that.
24unsigned
25ArchiveMember::getMemberSize() const {
26 // Basically its the file size plus the header size
27 unsigned result = info.fileSize + sizeof(ArchiveMemberHeader);
28
29 // If it has a long filename, include the name length
30 if (hasLongFilename())
Reid Spencer1fce0912004-12-11 00:14:15 +000031 result += path.toString().length() + 1;
Reid Spencercf6afc62004-11-14 21:56:59 +000032
33 // If its now odd lengthed, include the padding byte
Misha Brukman2b37d7c2005-04-21 21:13:18 +000034 if (result % 2 != 0 )
Reid Spencercf6afc62004-11-14 21:56:59 +000035 result++;
36
37 return result;
Reid Spencer362cbf02004-11-06 08:51:45 +000038}
39
Reid Spencercf6afc62004-11-14 21:56:59 +000040// This default constructor is only use by the ilist when it creates its
41// sentry node. We give it specific static values to make it stand out a bit.
Misha Brukman2b37d7c2005-04-21 21:13:18 +000042ArchiveMember::ArchiveMember()
Jeff Cohen943b9b62006-05-06 23:25:53 +000043 : next(0), prev(0), parent(0), path("--invalid--"), flags(0), data(0)
Reid Spencercf6afc62004-11-14 21:56:59 +000044{
Reid Spencer8e827e82005-04-21 17:49:57 +000045 info.user = sys::Process::GetCurrentUserId();
Misha Brukman2b37d7c2005-04-21 21:13:18 +000046 info.group = sys::Process::GetCurrentGroupId();
47 info.mode = 0777;
48 info.fileSize = 0;
Reid Spencercf6afc62004-11-14 21:56:59 +000049 info.modTime = sys::TimeValue::now();
50}
51
52// This is the constructor that the Archive class uses when it is building or
53// reading an archive. It just defaults a few things and ensures the parent is
Misha Brukman2b37d7c2005-04-21 21:13:18 +000054// set for the iplist. The Archive class fills in the ArchiveMember's data.
55// This is required because correctly setting the data may depend on other
Reid Spencercf6afc62004-11-14 21:56:59 +000056// things in the Archive.
57ArchiveMember::ArchiveMember(Archive* PAR)
58 : next(0), prev(0), parent(PAR), path(), flags(0), data(0)
59{
60}
61
Misha Brukman2b37d7c2005-04-21 21:13:18 +000062// This method allows an ArchiveMember to be replaced with the data for a
Reid Spencercf6afc62004-11-14 21:56:59 +000063// different file, presumably as an update to the member. It also makes sure
64// the flags are reset correctly.
Reid Spencer0ff2d312006-08-24 23:45:08 +000065bool ArchiveMember::replaceWith(const sys::Path& newFile, std::string* ErrMsg) {
Reid Spencercd5561a2006-12-15 19:44:51 +000066 if (!newFile.exists()) {
67 if (ErrMsg)
68 *ErrMsg = "Can not replace an archive member with a non-existent file";
69 return true;
70 }
71
Reid Spencercf6afc62004-11-14 21:56:59 +000072 data = 0;
73 path = newFile;
74
Reid Spencer9a29db42004-11-20 07:29:40 +000075 // SVR4 symbol tables have an empty name
Reid Spencer1fce0912004-12-11 00:14:15 +000076 if (path.toString() == ARFILE_SVR4_SYMTAB_NAME)
Reid Spencer9a29db42004-11-20 07:29:40 +000077 flags |= SVR4SymbolTableFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +000078 else
Reid Spencer9a29db42004-11-20 07:29:40 +000079 flags &= ~SVR4SymbolTableFlag;
80
81 // BSD4.4 symbol tables have a special name
Reid Spencer1fce0912004-12-11 00:14:15 +000082 if (path.toString() == ARFILE_BSD4_SYMTAB_NAME)
Reid Spencer9a29db42004-11-20 07:29:40 +000083 flags |= BSD4SymbolTableFlag;
84 else
85 flags &= ~BSD4SymbolTableFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +000086
87 // LLVM symbol tables have a very specific name
Reid Spencer1fce0912004-12-11 00:14:15 +000088 if (path.toString() == ARFILE_LLVM_SYMTAB_NAME)
Reid Spencercf6afc62004-11-14 21:56:59 +000089 flags |= LLVMSymbolTableFlag;
90 else
91 flags &= ~LLVMSymbolTableFlag;
92
93 // String table name
Reid Spencer1fce0912004-12-11 00:14:15 +000094 if (path.toString() == ARFILE_STRTAB_NAME)
Reid Spencercf6afc62004-11-14 21:56:59 +000095 flags |= StringTableFlag;
96 else
97 flags &= ~StringTableFlag;
98
99 // If it has a slash then it has a path
Reid Spencer1fce0912004-12-11 00:14:15 +0000100 bool hasSlash = path.toString().find('/') != std::string::npos;
Reid Spencercf6afc62004-11-14 21:56:59 +0000101 if (hasSlash)
102 flags |= HasPathFlag;
103 else
104 flags &= ~HasPathFlag;
105
106 // If it has a slash or its over 15 chars then its a long filename format
Reid Spencer1fce0912004-12-11 00:14:15 +0000107 if (hasSlash || path.toString().length() > 15)
Reid Spencercf6afc62004-11-14 21:56:59 +0000108 flags |= HasLongFilenameFlag;
109 else
110 flags &= ~HasLongFilenameFlag;
111
112 // Get the signature and status info
Reid Spencercf6afc62004-11-14 21:56:59 +0000113 const char* signature = (const char*) data;
Chris Lattner252ad032006-07-28 22:03:44 +0000114 std::string magic;
Reid Spencercf6afc62004-11-14 21:56:59 +0000115 if (!signature) {
116 path.getMagicNumber(magic,4);
117 signature = magic.c_str();
Chris Lattner252ad032006-07-28 22:03:44 +0000118 std::string err;
Reid Spencer44218f92007-04-07 19:45:30 +0000119 const sys::FileStatus *FSinfo =
120 sys::PathWithStatus(path).getFileStatus(false, ErrMsg);
Reid Spencer8475ec02007-03-29 19:05:44 +0000121 if (FSinfo)
122 info = *FSinfo;
123 else
Reid Spencer0ff2d312006-08-24 23:45:08 +0000124 return true;
Reid Spencercf6afc62004-11-14 21:56:59 +0000125 }
126
127 // Determine what kind of file it is
128 switch (sys::IdentifyFileType(signature,4)) {
Reid Spencer20c34892007-04-04 06:31:04 +0000129 case sys::Bytecode_FileType:
Reid Spencercf6afc62004-11-14 21:56:59 +0000130 flags |= BytecodeFlag;
131 break;
Reid Spencer20c34892007-04-04 06:31:04 +0000132 case sys::CompressedBytecode_FileType:
Reid Spencercf6afc62004-11-14 21:56:59 +0000133 flags |= CompressedBytecodeFlag;
134 flags &= ~CompressedFlag;
135 break;
136 default:
137 flags &= ~(BytecodeFlag|CompressedBytecodeFlag);
138 break;
139 }
Reid Spencer0ff2d312006-08-24 23:45:08 +0000140 return false;
Reid Spencercf6afc62004-11-14 21:56:59 +0000141}
142
143// Archive constructor - this is the only constructor that gets used for the
Misha Brukman2b37d7c2005-04-21 21:13:18 +0000144// Archive class. Everything else (default,copy) is deprecated. This just
Reid Spencercf6afc62004-11-14 21:56:59 +0000145// initializes and maps the file into memory, if requested.
Chris Lattnerf2e292c2007-02-07 21:41:02 +0000146Archive::Archive(const sys::Path& filename, BCDecompressor_t *BCDC)
Reid Spencer1f465802004-11-16 06:47:07 +0000147 : archPath(filename), members(), mapfile(0), base(0), symTab(), strtab(),
Chris Lattnerf2e292c2007-02-07 21:41:02 +0000148 symTabSize(0), firstFileOffset(0), modules(), foreignST(0),
149 Decompressor(BCDC) {
Reid Spencer0ff2d312006-08-24 23:45:08 +0000150}
151
152bool
153Archive::mapToMemory(std::string* ErrMsg)
154{
155 mapfile = new sys::MappedFile();
156 if (mapfile->open(archPath, sys::MappedFile::READ_ACCESS, ErrMsg))
157 return true;
158 if (!(base = (char*) mapfile->map(ErrMsg)))
159 return true;
160 return false;
Reid Spencercf6afc62004-11-14 21:56:59 +0000161}
162
Reid Spencer6ff72402005-11-30 05:21:10 +0000163void Archive::cleanUpMemory() {
Reid Spencercf6afc62004-11-14 21:56:59 +0000164 // Shutdown the file mapping
165 if (mapfile) {
Jeff Cohend19d89a2005-01-28 01:17:07 +0000166 mapfile->close();
Reid Spencercf6afc62004-11-14 21:56:59 +0000167 delete mapfile;
Reid Spencer6ff72402005-11-30 05:21:10 +0000168
169 mapfile = 0;
170 base = 0;
Reid Spencercf6afc62004-11-14 21:56:59 +0000171 }
Reid Spencer6ff72402005-11-30 05:21:10 +0000172
173 // Forget the entire symbol table
174 symTab.clear();
175 symTabSize = 0;
176
177 firstFileOffset = 0;
178
179 // Free the foreign symbol table member
180 if (foreignST) {
181 delete foreignST;
182 foreignST = 0;
183 }
184
Reid Spencercf6afc62004-11-14 21:56:59 +0000185 // Delete any ModuleProviders and ArchiveMember's we've allocated as a result
186 // of symbol table searches.
187 for (ModuleMap::iterator I=modules.begin(), E=modules.end(); I != E; ++I ) {
188 delete I->second.first;
189 delete I->second.second;
190 }
Reid Spencer362cbf02004-11-06 08:51:45 +0000191}
192
Reid Spencer6ff72402005-11-30 05:21:10 +0000193// Archive destructor - just clean up memory
194Archive::~Archive() {
195 cleanUpMemory();
196}
197
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000198
199
200static void getSymbols(Module*M, std::vector<std::string>& symbols) {
201 // Loop over global variables
202 for (Module::global_iterator GI = M->global_begin(), GE=M->global_end(); GI != GE; ++GI)
203 if (!GI->isDeclaration() && !GI->hasInternalLinkage())
204 if (!GI->getName().empty())
205 symbols.push_back(GI->getName());
206
207 // Loop over functions.
208 for (Module::iterator FI = M->begin(), FE = M->end(); FI != FE; ++FI)
209 if (!FI->isDeclaration() && !FI->hasInternalLinkage())
210 if (!FI->getName().empty())
211 symbols.push_back(FI->getName());
212}
213
214// Get just the externally visible defined symbols from the bytecode
215bool llvm::GetBytecodeSymbols(const sys::Path& fName,
216 std::vector<std::string>& symbols,
217 BCDecompressor_t *BCDC,
218 std::string* ErrMsg) {
219 ModuleProvider *MP = getBytecodeModuleProvider(fName.toString(), BCDC,ErrMsg);
220 if (!MP)
221 return true;
222
223 // Get the module from the provider
224 Module* M = MP->materializeModule();
225 if (M == 0) {
226 delete MP;
227 return true;
228 }
229
230 // Get the symbols
231 getSymbols(M, symbols);
232
233 // Done with the module.
234 delete MP;
235 return true;
236}
237
238ModuleProvider*
239llvm::GetBytecodeSymbols(const unsigned char*Buffer, unsigned Length,
240 const std::string& ModuleID,
241 std::vector<std::string>& symbols,
242 BCDecompressor_t *BCDC,
243 std::string* ErrMsg) {
244 // Get the module provider
245 ModuleProvider* MP =
246 getBytecodeBufferModuleProvider(Buffer, Length, ModuleID, BCDC, ErrMsg, 0);
247 if (!MP)
248 return 0;
249
250 // Get the module from the provider
251 Module* M = MP->materializeModule();
252 if (M == 0) {
253 delete MP;
254 return 0;
255 }
256
257 // Get the symbols
258 getSymbols(M, symbols);
259
260 // Done with the module. Note that ModuleProvider will delete the
261 // Module when it is deleted. Also note that its the caller's responsibility
262 // to delete the ModuleProvider.
263 return MP;
264}