blob: a0e5eedc9c94a2369f13db9b02f22a6c42f6e035 [file] [log] [blame]
Reid Spencer362cbf02004-11-06 08:51:45 +00001//===-- Archive.cpp - Generic LLVM archive functions ------------*- C++ -*-===//
Misha Brukman2b37d7c2005-04-21 21:13:18 +00002//
Reid Spencer362cbf02004-11-06 08:51:45 +00003// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Misha Brukman2b37d7c2005-04-21 21:13:18 +00007//
Reid Spencer362cbf02004-11-06 08:51:45 +00008//===----------------------------------------------------------------------===//
9//
// This file contains the implementation of the Archive and ArchiveMember
// classes that is common to both reading and writing archives.
Reid Spencer362cbf02004-11-06 08:51:45 +000012//
13//===----------------------------------------------------------------------===//
14
15#include "ArchiveInternals.h"
Chris Lattnerc1d56242007-05-06 09:28:33 +000016#include "llvm/Bitcode/ReaderWriter.h"
Reid Spencercf6afc62004-11-14 21:56:59 +000017#include "llvm/ModuleProvider.h"
Chris Lattnerf36c7b82007-02-07 23:53:17 +000018#include "llvm/Module.h"
Chris Lattnerc1d56242007-05-06 09:28:33 +000019#include "llvm/Support/MemoryBuffer.h"
Reid Spencer8e827e82005-04-21 17:49:57 +000020#include "llvm/System/Process.h"
Anton Korobeynikovae9f3a32008-02-20 11:08:44 +000021#include <memory>
22#include <cstring>
Reid Spencer362cbf02004-11-06 08:51:45 +000023using namespace llvm;
24
Reid Spencercf6afc62004-11-14 21:56:59 +000025// getMemberSize - compute the actual physical size of the file member as seen
26// on disk. This isn't the size of member's payload. Use getSize() for that.
27unsigned
28ArchiveMember::getMemberSize() const {
29 // Basically its the file size plus the header size
30 unsigned result = info.fileSize + sizeof(ArchiveMemberHeader);
31
32 // If it has a long filename, include the name length
33 if (hasLongFilename())
Reid Spencer1fce0912004-12-11 00:14:15 +000034 result += path.toString().length() + 1;
Reid Spencercf6afc62004-11-14 21:56:59 +000035
36 // If its now odd lengthed, include the padding byte
Misha Brukman2b37d7c2005-04-21 21:13:18 +000037 if (result % 2 != 0 )
Reid Spencercf6afc62004-11-14 21:56:59 +000038 result++;
39
40 return result;
Reid Spencer362cbf02004-11-06 08:51:45 +000041}
42
Reid Spencercf6afc62004-11-14 21:56:59 +000043// This default constructor is only use by the ilist when it creates its
44// sentry node. We give it specific static values to make it stand out a bit.
Misha Brukman2b37d7c2005-04-21 21:13:18 +000045ArchiveMember::ArchiveMember()
Jeff Cohen943b9b62006-05-06 23:25:53 +000046 : next(0), prev(0), parent(0), path("--invalid--"), flags(0), data(0)
Reid Spencercf6afc62004-11-14 21:56:59 +000047{
Reid Spencer8e827e82005-04-21 17:49:57 +000048 info.user = sys::Process::GetCurrentUserId();
Misha Brukman2b37d7c2005-04-21 21:13:18 +000049 info.group = sys::Process::GetCurrentGroupId();
50 info.mode = 0777;
51 info.fileSize = 0;
Reid Spencercf6afc62004-11-14 21:56:59 +000052 info.modTime = sys::TimeValue::now();
53}
54
55// This is the constructor that the Archive class uses when it is building or
56// reading an archive. It just defaults a few things and ensures the parent is
Misha Brukman2b37d7c2005-04-21 21:13:18 +000057// set for the iplist. The Archive class fills in the ArchiveMember's data.
58// This is required because correctly setting the data may depend on other
Reid Spencercf6afc62004-11-14 21:56:59 +000059// things in the Archive.
60ArchiveMember::ArchiveMember(Archive* PAR)
61 : next(0), prev(0), parent(PAR), path(), flags(0), data(0)
62{
63}
64
Misha Brukman2b37d7c2005-04-21 21:13:18 +000065// This method allows an ArchiveMember to be replaced with the data for a
Reid Spencercf6afc62004-11-14 21:56:59 +000066// different file, presumably as an update to the member. It also makes sure
67// the flags are reset correctly.
Reid Spencer0ff2d312006-08-24 23:45:08 +000068bool ArchiveMember::replaceWith(const sys::Path& newFile, std::string* ErrMsg) {
Reid Spencercd5561a2006-12-15 19:44:51 +000069 if (!newFile.exists()) {
70 if (ErrMsg)
71 *ErrMsg = "Can not replace an archive member with a non-existent file";
72 return true;
73 }
74
Reid Spencercf6afc62004-11-14 21:56:59 +000075 data = 0;
76 path = newFile;
77
Reid Spencer9a29db42004-11-20 07:29:40 +000078 // SVR4 symbol tables have an empty name
Reid Spencer1fce0912004-12-11 00:14:15 +000079 if (path.toString() == ARFILE_SVR4_SYMTAB_NAME)
Reid Spencer9a29db42004-11-20 07:29:40 +000080 flags |= SVR4SymbolTableFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +000081 else
Reid Spencer9a29db42004-11-20 07:29:40 +000082 flags &= ~SVR4SymbolTableFlag;
83
84 // BSD4.4 symbol tables have a special name
Reid Spencer1fce0912004-12-11 00:14:15 +000085 if (path.toString() == ARFILE_BSD4_SYMTAB_NAME)
Reid Spencer9a29db42004-11-20 07:29:40 +000086 flags |= BSD4SymbolTableFlag;
87 else
88 flags &= ~BSD4SymbolTableFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +000089
90 // LLVM symbol tables have a very specific name
Reid Spencer1fce0912004-12-11 00:14:15 +000091 if (path.toString() == ARFILE_LLVM_SYMTAB_NAME)
Reid Spencercf6afc62004-11-14 21:56:59 +000092 flags |= LLVMSymbolTableFlag;
93 else
94 flags &= ~LLVMSymbolTableFlag;
95
96 // String table name
Reid Spencer1fce0912004-12-11 00:14:15 +000097 if (path.toString() == ARFILE_STRTAB_NAME)
Reid Spencercf6afc62004-11-14 21:56:59 +000098 flags |= StringTableFlag;
99 else
100 flags &= ~StringTableFlag;
101
102 // If it has a slash then it has a path
Reid Spencer1fce0912004-12-11 00:14:15 +0000103 bool hasSlash = path.toString().find('/') != std::string::npos;
Reid Spencercf6afc62004-11-14 21:56:59 +0000104 if (hasSlash)
105 flags |= HasPathFlag;
106 else
107 flags &= ~HasPathFlag;
108
109 // If it has a slash or its over 15 chars then its a long filename format
Reid Spencer1fce0912004-12-11 00:14:15 +0000110 if (hasSlash || path.toString().length() > 15)
Reid Spencercf6afc62004-11-14 21:56:59 +0000111 flags |= HasLongFilenameFlag;
112 else
113 flags &= ~HasLongFilenameFlag;
114
115 // Get the signature and status info
Reid Spencercf6afc62004-11-14 21:56:59 +0000116 const char* signature = (const char*) data;
Chris Lattner252ad032006-07-28 22:03:44 +0000117 std::string magic;
Reid Spencercf6afc62004-11-14 21:56:59 +0000118 if (!signature) {
119 path.getMagicNumber(magic,4);
120 signature = magic.c_str();
Chris Lattner252ad032006-07-28 22:03:44 +0000121 std::string err;
Reid Spencera021d5d2007-04-07 19:51:45 +0000122 const sys::FileStatus *FSinfo = path.getFileStatus(false, ErrMsg);
Reid Spencer8475ec02007-03-29 19:05:44 +0000123 if (FSinfo)
124 info = *FSinfo;
125 else
Reid Spencer0ff2d312006-08-24 23:45:08 +0000126 return true;
Reid Spencercf6afc62004-11-14 21:56:59 +0000127 }
128
129 // Determine what kind of file it is
130 switch (sys::IdentifyFileType(signature,4)) {
Reid Spencercf6afc62004-11-14 21:56:59 +0000131 default:
Gabor Greife75ca3d2007-07-06 13:38:17 +0000132 flags &= ~BitcodeFlag;
Reid Spencercf6afc62004-11-14 21:56:59 +0000133 break;
134 }
Reid Spencer0ff2d312006-08-24 23:45:08 +0000135 return false;
Reid Spencercf6afc62004-11-14 21:56:59 +0000136}
137
138// Archive constructor - this is the only constructor that gets used for the
Misha Brukman2b37d7c2005-04-21 21:13:18 +0000139// Archive class. Everything else (default,copy) is deprecated. This just
Reid Spencercf6afc62004-11-14 21:56:59 +0000140// initializes and maps the file into memory, if requested.
Chris Lattnerc1d56242007-05-06 09:28:33 +0000141Archive::Archive(const sys::Path& filename)
Reid Spencer1f465802004-11-16 06:47:07 +0000142 : archPath(filename), members(), mapfile(0), base(0), symTab(), strtab(),
Chris Lattnerc1d56242007-05-06 09:28:33 +0000143 symTabSize(0), firstFileOffset(0), modules(), foreignST(0) {
Reid Spencer0ff2d312006-08-24 23:45:08 +0000144}
145
146bool
Chris Lattner7f6b4472008-04-01 04:26:46 +0000147Archive::mapToMemory(std::string* ErrMsg) {
Chris Lattner038112a2008-04-01 18:04:03 +0000148 mapfile = MemoryBuffer::getFile(archPath.c_str(), ErrMsg);
Chris Lattner7f6b4472008-04-01 04:26:46 +0000149 if (mapfile == 0)
Reid Spencer0ff2d312006-08-24 23:45:08 +0000150 return true;
Chris Lattner7f6b4472008-04-01 04:26:46 +0000151 base = mapfile->getBufferStart();
Reid Spencer0ff2d312006-08-24 23:45:08 +0000152 return false;
Reid Spencercf6afc62004-11-14 21:56:59 +0000153}
154
Reid Spencer6ff72402005-11-30 05:21:10 +0000155void Archive::cleanUpMemory() {
Reid Spencercf6afc62004-11-14 21:56:59 +0000156 // Shutdown the file mapping
Chris Lattner7f6b4472008-04-01 04:26:46 +0000157 delete mapfile;
158 mapfile = 0;
159 base = 0;
Reid Spencer6ff72402005-11-30 05:21:10 +0000160
161 // Forget the entire symbol table
162 symTab.clear();
163 symTabSize = 0;
164
165 firstFileOffset = 0;
166
167 // Free the foreign symbol table member
168 if (foreignST) {
169 delete foreignST;
170 foreignST = 0;
171 }
172
Reid Spencercf6afc62004-11-14 21:56:59 +0000173 // Delete any ModuleProviders and ArchiveMember's we've allocated as a result
174 // of symbol table searches.
175 for (ModuleMap::iterator I=modules.begin(), E=modules.end(); I != E; ++I ) {
176 delete I->second.first;
177 delete I->second.second;
178 }
Reid Spencer362cbf02004-11-06 08:51:45 +0000179}
180
Reid Spencer6ff72402005-11-30 05:21:10 +0000181// Archive destructor - just clean up memory
182Archive::~Archive() {
183 cleanUpMemory();
184}
185
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000186
187
188static void getSymbols(Module*M, std::vector<std::string>& symbols) {
189 // Loop over global variables
190 for (Module::global_iterator GI = M->global_begin(), GE=M->global_end(); GI != GE; ++GI)
191 if (!GI->isDeclaration() && !GI->hasInternalLinkage())
192 if (!GI->getName().empty())
193 symbols.push_back(GI->getName());
194
Anton Korobeynikovd58ceb22008-03-04 20:15:35 +0000195 // Loop over functions
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000196 for (Module::iterator FI = M->begin(), FE = M->end(); FI != FE; ++FI)
197 if (!FI->isDeclaration() && !FI->hasInternalLinkage())
198 if (!FI->getName().empty())
199 symbols.push_back(FI->getName());
Anton Korobeynikovd58ceb22008-03-04 20:15:35 +0000200
201 // Loop over aliases
202 for (Module::alias_iterator AI = M->alias_begin(), AE = M->alias_end();
203 AI != AE; ++AI) {
Anton Korobeynikov7fcb6b62008-03-11 00:24:53 +0000204 if (AI->hasName())
205 symbols.push_back(AI->getName());
Anton Korobeynikovd58ceb22008-03-04 20:15:35 +0000206 }
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000207}
208
Gabor Greifa99be512007-07-05 17:07:56 +0000209// Get just the externally visible defined symbols from the bitcode
210bool llvm::GetBitcodeSymbols(const sys::Path& fName,
211 std::vector<std::string>& symbols,
212 std::string* ErrMsg) {
Chris Lattnerc1d56242007-05-06 09:28:33 +0000213 std::auto_ptr<MemoryBuffer> Buffer(
Chris Lattner038112a2008-04-01 18:04:03 +0000214 MemoryBuffer::getFileOrSTDIN(fName.c_str()));
Chris Lattnerc1d56242007-05-06 09:28:33 +0000215 if (!Buffer.get()) {
216 if (ErrMsg) *ErrMsg = "Could not open file '" + fName.toString() + "'";
217 return true;
218 }
219
220 ModuleProvider *MP = getBitcodeModuleProvider(Buffer.get(), ErrMsg);
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000221 if (!MP)
222 return true;
223
224 // Get the module from the provider
225 Module* M = MP->materializeModule();
226 if (M == 0) {
227 delete MP;
228 return true;
229 }
230
231 // Get the symbols
232 getSymbols(M, symbols);
233
234 // Done with the module.
235 delete MP;
236 return true;
237}
238
239ModuleProvider*
Gabor Greifa99be512007-07-05 17:07:56 +0000240llvm::GetBitcodeSymbols(const unsigned char *BufPtr, unsigned Length,
241 const std::string& ModuleID,
242 std::vector<std::string>& symbols,
243 std::string* ErrMsg) {
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000244 // Get the module provider
Chris Lattnerc1d56242007-05-06 09:28:33 +0000245 MemoryBuffer *Buffer =MemoryBuffer::getNewMemBuffer(Length, ModuleID.c_str());
246 memcpy((char*)Buffer->getBufferStart(), BufPtr, Length);
247
248 ModuleProvider *MP = getBitcodeModuleProvider(Buffer, ErrMsg);
Chris Lattnerf36c7b82007-02-07 23:53:17 +0000249 if (!MP)
250 return 0;
251
252 // Get the module from the provider
253 Module* M = MP->materializeModule();
254 if (M == 0) {
255 delete MP;
256 return 0;
257 }
258
259 // Get the symbols
260 getSymbols(M, symbols);
261
262 // Done with the module. Note that ModuleProvider will delete the
263 // Module when it is deleted. Also note that its the caller's responsibility
264 // to delete the ModuleProvider.
265 return MP;
266}