| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 1 | //===-- ArchiveWriter.cpp - Write LLVM archive files ----------------------===// | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 2 | // | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 3 | //                     The LLVM Compiler Infrastructure | 
|  | 4 | // | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 5 | // This file was developed by Reid Spencer and is distributed under the | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 6 | // University of Illinois Open Source License. See LICENSE.TXT for details. | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 7 | // | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// | 
|  | 9 | // | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 10 | // Builds up an LLVM archive file (.a) containing LLVM bytecode. | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 11 | // | 
|  | 12 | //===----------------------------------------------------------------------===// | 
|  | 13 |  | 
|  | 14 | #include "ArchiveInternals.h" | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 15 | #include "llvm/Bytecode/Reader.h" | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 16 | #include "llvm/Support/Compressor.h" | 
|  | 17 | #include "llvm/System/Signals.h" | 
| Reid Spencer | 3468e57 | 2005-04-21 16:15:19 +0000 | [diff] [blame] | 18 | #include "llvm/System/Process.h" | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 19 | #include <fstream> | 
| Bill Wendling | a21900d | 2006-11-28 22:49:32 +0000 | [diff] [blame] | 20 | #include <ostream> | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 21 | #include <iomanip> | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 22 | using namespace llvm; | 
|  | 23 |  | 
// Emit an unsigned integer to the archive stream in variable bit rate (VBR)
// form: seven payload bits per byte, least significant group first, with the
// high bit of a byte set whenever another byte follows. Small values (the
// common case in the symbol table) therefore cost a single byte.
inline void writeInteger(unsigned num, std::ofstream& ARFile) {
  // Every group except the last carries the continuation marker (0x80).
  for (; num >= 0x80; num >>= 7) {
    const unsigned char lowSeven = static_cast<unsigned char>(num & 0x7F);
    ARFile << static_cast<unsigned char>(lowSeven | 0x80);
  }

  // What is left fits in seven bits; write it with the high bit clear.
  ARFile << static_cast<unsigned char>(num);
}
|  | 39 |  | 
// Report how many bytes the VBR encoding of a value occupies (seven payload
// bits per byte). The symbol table's size has to be known before it is
// written, so this is used to pre-compute it.
inline unsigned numVbrBytes(unsigned num) {
  // The thresholds are tested roughly in binary-search order, splitting at
  // 2^14 first: file offsets are expected to fall in the 2^10..2^24 range and
  // symbol lengths in the 2^0..2^8 range, so most calls finish after two
  // comparisons.
  if (num < (1u << 14))
    return (num < (1u << 7)) ? 1 : 2;

  if (num < (1u << 21))
    return 3;

  // Anything at or above 2^28 needs the fifth byte.
  return (num < (1u << 28)) ? 4 : 5;
}
|  | 62 |  | 
|  | 63 | // Create an empty archive. | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 64 | Archive* | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 65 | Archive::CreateEmpty(const sys::Path& FilePath ) { | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 66 | Archive* result = new Archive(FilePath); | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 67 | return result; | 
|  | 68 | } | 
|  | 69 |  | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 70 | // Fill the ArchiveMemberHeader with the information from a member. If | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 71 | // TruncateNames is true, names are flattened to 15 chars or less. The sz field | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 72 | // is provided here instead of coming from the mbr because the member might be | 
|  | 73 | // stored compressed and the compressed size is not the ArchiveMember's size. | 
|  | 74 | // Furthermore compressed files have negative size fields to identify them as | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 75 | // compressed. | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 76 | bool | 
|  | 77 | Archive::fillHeader(const ArchiveMember &mbr, ArchiveMemberHeader& hdr, | 
|  | 78 | int sz, bool TruncateNames) const { | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 79 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 80 | // Set the permissions mode, uid and gid | 
|  | 81 | hdr.init(); | 
|  | 82 | char buffer[32]; | 
|  | 83 | sprintf(buffer, "%-8o", mbr.getMode()); | 
|  | 84 | memcpy(hdr.mode,buffer,8); | 
|  | 85 | sprintf(buffer,  "%-6u", mbr.getUser()); | 
|  | 86 | memcpy(hdr.uid,buffer,6); | 
|  | 87 | sprintf(buffer,  "%-6u", mbr.getGroup()); | 
|  | 88 | memcpy(hdr.gid,buffer,6); | 
|  | 89 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 90 | // Set the last modification date | 
|  | 91 | uint64_t secondsSinceEpoch = mbr.getModTime().toEpochTime(); | 
|  | 92 | sprintf(buffer,"%-12u", unsigned(secondsSinceEpoch)); | 
|  | 93 | memcpy(hdr.date,buffer,12); | 
|  | 94 |  | 
| Reid Spencer | d4543da | 2004-11-17 18:28:29 +0000 | [diff] [blame] | 95 | // Get rid of trailing blanks in the name | 
| Reid Spencer | 1fce091 | 2004-12-11 00:14:15 +0000 | [diff] [blame] | 96 | std::string mbrPath = mbr.getPath().toString(); | 
| Reid Spencer | d4543da | 2004-11-17 18:28:29 +0000 | [diff] [blame] | 97 | size_t mbrLen = mbrPath.length(); | 
|  | 98 | while (mbrLen > 0 && mbrPath[mbrLen-1] == ' ') { | 
|  | 99 | mbrPath.erase(mbrLen-1,1); | 
|  | 100 | mbrLen--; | 
|  | 101 | } | 
|  | 102 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 103 | // Set the name field in one of its various flavors. | 
|  | 104 | bool writeLongName = false; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 105 | if (mbr.isStringTable()) { | 
|  | 106 | memcpy(hdr.name,ARFILE_STRTAB_NAME,16); | 
| Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 107 | } else if (mbr.isSVR4SymbolTable()) { | 
|  | 108 | memcpy(hdr.name,ARFILE_SVR4_SYMTAB_NAME,16); | 
|  | 109 | } else if (mbr.isBSD4SymbolTable()) { | 
|  | 110 | memcpy(hdr.name,ARFILE_BSD4_SYMTAB_NAME,16); | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 111 | } else if (mbr.isLLVMSymbolTable()) { | 
|  | 112 | memcpy(hdr.name,ARFILE_LLVM_SYMTAB_NAME,16); | 
|  | 113 | } else if (TruncateNames) { | 
|  | 114 | const char* nm = mbrPath.c_str(); | 
|  | 115 | unsigned len = mbrPath.length(); | 
|  | 116 | size_t slashpos = mbrPath.rfind('/'); | 
|  | 117 | if (slashpos != std::string::npos) { | 
|  | 118 | nm += slashpos + 1; | 
|  | 119 | len -= slashpos +1; | 
|  | 120 | } | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 121 | if (len > 15) | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 122 | len = 15; | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 123 | memcpy(hdr.name,nm,len); | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 124 | hdr.name[len] = '/'; | 
|  | 125 | } else if (mbrPath.length() < 16 && mbrPath.find('/') == std::string::npos) { | 
| Reid Spencer | d4543da | 2004-11-17 18:28:29 +0000 | [diff] [blame] | 126 | memcpy(hdr.name,mbrPath.c_str(),mbrPath.length()); | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 127 | hdr.name[mbrPath.length()] = '/'; | 
|  | 128 | } else { | 
|  | 129 | std::string nm = "#1/"; | 
|  | 130 | nm += utostr(mbrPath.length()); | 
| Reid Spencer | d4543da | 2004-11-17 18:28:29 +0000 | [diff] [blame] | 131 | memcpy(hdr.name,nm.data(),nm.length()); | 
| Reid Spencer | 96ce335 | 2004-11-17 16:14:21 +0000 | [diff] [blame] | 132 | if (sz < 0) | 
|  | 133 | sz -= mbrPath.length(); | 
|  | 134 | else | 
|  | 135 | sz += mbrPath.length(); | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 136 | writeLongName = true; | 
|  | 137 | } | 
| Reid Spencer | 96ce335 | 2004-11-17 16:14:21 +0000 | [diff] [blame] | 138 |  | 
|  | 139 | // Set the size field | 
|  | 140 | if (sz < 0) { | 
|  | 141 | buffer[0] = '-'; | 
|  | 142 | sprintf(&buffer[1],"%-9u",(unsigned)-sz); | 
|  | 143 | } else { | 
|  | 144 | sprintf(buffer, "%-10u", (unsigned)sz); | 
|  | 145 | } | 
|  | 146 | memcpy(hdr.size,buffer,10); | 
|  | 147 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 148 | return writeLongName; | 
|  | 149 | } | 
|  | 150 |  | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 151 | // Insert a file into the archive before some other member. This also takes care | 
|  | 152 | // of extracting the necessary flags and information from the file. | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 153 | bool | 
|  | 154 | Archive::addFileBefore(const sys::Path& filePath, iterator where, | 
|  | 155 | std::string* ErrMsg) { | 
| Reid Spencer | cd5561a | 2006-12-15 19:44:51 +0000 | [diff] [blame] | 156 | if (!filePath.exists()) { | 
|  | 157 | if (ErrMsg) | 
|  | 158 | *ErrMsg = "Can not add a non-existent file to archive"; | 
|  | 159 | return true; | 
|  | 160 | } | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 161 |  | 
|  | 162 | ArchiveMember* mbr = new ArchiveMember(this); | 
|  | 163 |  | 
|  | 164 | mbr->data = 0; | 
|  | 165 | mbr->path = filePath; | 
| Reid Spencer | 8475ec0 | 2007-03-29 19:05:44 +0000 | [diff] [blame^] | 166 | const sys::FileStatus *FSInfo = mbr->path.getFileStatus(false, ErrMsg); | 
|  | 167 | if (FSInfo) | 
|  | 168 | mbr->info = *FSInfo; | 
|  | 169 | else | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 170 | return true; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 171 |  | 
|  | 172 | unsigned flags = 0; | 
| Reid Spencer | 1fce091 | 2004-12-11 00:14:15 +0000 | [diff] [blame] | 173 | bool hasSlash = filePath.toString().find('/') != std::string::npos; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 174 | if (hasSlash) | 
|  | 175 | flags |= ArchiveMember::HasPathFlag; | 
| Reid Spencer | 1fce091 | 2004-12-11 00:14:15 +0000 | [diff] [blame] | 176 | if (hasSlash || filePath.toString().length() > 15) | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 177 | flags |= ArchiveMember::HasLongFilenameFlag; | 
|  | 178 | std::string magic; | 
|  | 179 | mbr->path.getMagicNumber(magic,4); | 
|  | 180 | switch (sys::IdentifyFileType(magic.c_str(),4)) { | 
|  | 181 | case sys::BytecodeFileType: | 
|  | 182 | flags |= ArchiveMember::BytecodeFlag; | 
|  | 183 | break; | 
|  | 184 | case sys::CompressedBytecodeFileType: | 
|  | 185 | flags |= ArchiveMember::CompressedBytecodeFlag; | 
|  | 186 | break; | 
|  | 187 | default: | 
|  | 188 | break; | 
|  | 189 | } | 
|  | 190 | mbr->flags = flags; | 
|  | 191 | members.insert(where,mbr); | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 192 | return false; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 193 | } | 
|  | 194 |  | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 195 | // Write one member out to the file. | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 196 | bool | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 197 | Archive::writeMember( | 
|  | 198 | const ArchiveMember& member, | 
|  | 199 | std::ofstream& ARFile, | 
|  | 200 | bool CreateSymbolTable, | 
|  | 201 | bool TruncateNames, | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 202 | bool ShouldCompress, | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 203 | std::string* ErrMsg | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 204 | ) { | 
|  | 205 |  | 
|  | 206 | unsigned filepos = ARFile.tellp(); | 
|  | 207 | filepos -= 8; | 
|  | 208 |  | 
|  | 209 | // Get the data and its size either from the | 
|  | 210 | // member's in-memory data or directly from the file. | 
|  | 211 | size_t fSize = member.getSize(); | 
|  | 212 | const char* data = (const char*)member.getData(); | 
|  | 213 | sys::MappedFile* mFile = 0; | 
|  | 214 | if (!data) { | 
| Reid Spencer | 751ca6b | 2006-08-22 16:07:44 +0000 | [diff] [blame] | 215 | mFile = new sys::MappedFile(); | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 216 | if (mFile->open(member.getPath(), sys::MappedFile::READ_ACCESS, ErrMsg)) | 
|  | 217 | return true; | 
|  | 218 | if (!(data = (const char*) mFile->map(ErrMsg))) | 
|  | 219 | return true; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 220 | fSize = mFile->size(); | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 221 | } | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 222 |  | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 223 | // Now that we have the data in memory, update the | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 224 | // symbol table if its a bytecode file. | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 225 | if (CreateSymbolTable && | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 226 | (member.isBytecode() || member.isCompressedBytecode())) { | 
|  | 227 | std::vector<std::string> symbols; | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 228 | std::string FullMemberName = archPath.toString() + "(" + | 
|  | 229 | member.getPath().toString() | 
| Reid Spencer | d4543da | 2004-11-17 18:28:29 +0000 | [diff] [blame] | 230 | + ")"; | 
| Chris Lattner | f2e292c | 2007-02-07 21:41:02 +0000 | [diff] [blame] | 231 | ModuleProvider* MP = | 
|  | 232 | GetBytecodeSymbols((const unsigned char*)data,fSize, | 
|  | 233 | FullMemberName, symbols, | 
|  | 234 | Compressor::decompressToNewBuffer, ErrMsg); | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 235 |  | 
| Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 236 | // If the bytecode parsed successfully | 
|  | 237 | if ( MP ) { | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 238 | for (std::vector<std::string>::iterator SI = symbols.begin(), | 
| Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 239 | SE = symbols.end(); SI != SE; ++SI) { | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 240 |  | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 241 | std::pair<SymTabType::iterator,bool> Res = | 
| Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 242 | symTab.insert(std::make_pair(*SI,filepos)); | 
|  | 243 |  | 
|  | 244 | if (Res.second) { | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 245 | symTabSize += SI->length() + | 
|  | 246 | numVbrBytes(SI->length()) + | 
| Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 247 | numVbrBytes(filepos); | 
|  | 248 | } | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 249 | } | 
| Reid Spencer | 766b793 | 2004-11-15 01:20:11 +0000 | [diff] [blame] | 250 | // We don't need this module any more. | 
|  | 251 | delete MP; | 
|  | 252 | } else { | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 253 | if (mFile != 0) { | 
|  | 254 | mFile->close(); | 
|  | 255 | delete mFile; | 
|  | 256 | } | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 257 | if (ErrMsg) | 
| Reid Spencer | 0b5a504 | 2006-08-25 17:43:11 +0000 | [diff] [blame] | 258 | *ErrMsg = "Can't parse bytecode member: " + member.getPath().toString() | 
|  | 259 | + ": " + *ErrMsg; | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 260 | return true; | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 261 | } | 
|  | 262 | } | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 263 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 264 | // Determine if we actually should compress this member | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 265 | bool willCompress = | 
|  | 266 | (ShouldCompress && | 
|  | 267 | !member.isCompressed() && | 
| Reid Spencer | 9a29db4 | 2004-11-20 07:29:40 +0000 | [diff] [blame] | 268 | !member.isCompressedBytecode() && | 
|  | 269 | !member.isLLVMSymbolTable() && | 
|  | 270 | !member.isSVR4SymbolTable() && | 
|  | 271 | !member.isBSD4SymbolTable()); | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 272 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 273 | // Perform the compression. Note that if the file is uncompressed bytecode | 
|  | 274 | // then we turn the file into compressed bytecode rather than treating it as | 
|  | 275 | // compressed data. This is necessary since it allows us to determine that the | 
|  | 276 | // file contains bytecode instead of looking like a regular compressed data | 
|  | 277 | // member. A compressed bytecode file has its content compressed but has a | 
|  | 278 | // magic number of "llvc". This acounts for the +/-4 arithmetic in the code | 
|  | 279 | // below. | 
|  | 280 | int hdrSize; | 
|  | 281 | if (willCompress) { | 
|  | 282 | char* output = 0; | 
|  | 283 | if (member.isBytecode()) { | 
|  | 284 | data +=4; | 
|  | 285 | fSize -= 4; | 
|  | 286 | } | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 287 | fSize = Compressor::compressToNewBuffer(data,fSize,output,ErrMsg); | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 288 | if (fSize == 0) | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 289 | return true; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 290 | data = output; | 
|  | 291 | if (member.isBytecode()) | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 292 | hdrSize = -fSize-4; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 293 | else | 
|  | 294 | hdrSize = -fSize; | 
|  | 295 | } else { | 
|  | 296 | hdrSize = fSize; | 
|  | 297 | } | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 298 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 299 | // Compute the fields of the header | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 300 | ArchiveMemberHeader Hdr; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 301 | bool writeLongName = fillHeader(member,Hdr,hdrSize,TruncateNames); | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 302 |  | 
|  | 303 | // Write header to archive file | 
|  | 304 | ARFile.write((char*)&Hdr, sizeof(Hdr)); | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 305 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 306 | // Write the long filename if its long | 
|  | 307 | if (writeLongName) { | 
| Reid Spencer | 1fce091 | 2004-12-11 00:14:15 +0000 | [diff] [blame] | 308 | ARFile.write(member.getPath().toString().data(), | 
|  | 309 | member.getPath().toString().length()); | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 310 | } | 
|  | 311 |  | 
|  | 312 | // Make sure we write the compressed bytecode magic number if we should. | 
|  | 313 | if (willCompress && member.isBytecode()) | 
|  | 314 | ARFile.write("llvc",4); | 
|  | 315 |  | 
|  | 316 | // Write the (possibly compressed) member's content to the file. | 
|  | 317 | ARFile.write(data,fSize); | 
|  | 318 |  | 
|  | 319 | // Make sure the member is an even length | 
| Jeff Cohen | e133721 | 2004-12-20 03:23:46 +0000 | [diff] [blame] | 320 | if ((ARFile.tellp() & 1) == 1) | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 321 | ARFile << ARFILE_PAD; | 
|  | 322 |  | 
|  | 323 | // Free the compressed data, if necessary | 
|  | 324 | if (willCompress) { | 
|  | 325 | free((void*)data); | 
|  | 326 | } | 
|  | 327 |  | 
|  | 328 | // Close the mapped file if it was opened | 
|  | 329 | if (mFile != 0) { | 
| Jeff Cohen | d19d89a | 2005-01-28 01:17:07 +0000 | [diff] [blame] | 330 | mFile->close(); | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 331 | delete mFile; | 
|  | 332 | } | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 333 | return false; | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 334 | } | 
|  | 335 |  | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 336 | // Write out the LLVM symbol table as an archive member to the file. | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 337 | void | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 338 | Archive::writeSymbolTable(std::ofstream& ARFile) { | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 339 |  | 
|  | 340 | // Construct the symbol table's header | 
|  | 341 | ArchiveMemberHeader Hdr; | 
|  | 342 | Hdr.init(); | 
|  | 343 | memcpy(Hdr.name,ARFILE_LLVM_SYMTAB_NAME,16); | 
|  | 344 | uint64_t secondsSinceEpoch = sys::TimeValue::now().toEpochTime(); | 
|  | 345 | char buffer[32]; | 
| Misha Brukman | 4b2afe6 | 2005-04-20 03:55:35 +0000 | [diff] [blame] | 346 | sprintf(buffer, "%-8o", 0644); | 
|  | 347 | memcpy(Hdr.mode,buffer,8); | 
| Reid Spencer | 3468e57 | 2005-04-21 16:15:19 +0000 | [diff] [blame] | 348 | sprintf(buffer, "%-6u", sys::Process::GetCurrentUserId()); | 
| Misha Brukman | 4b2afe6 | 2005-04-20 03:55:35 +0000 | [diff] [blame] | 349 | memcpy(Hdr.uid,buffer,6); | 
| Reid Spencer | 3468e57 | 2005-04-21 16:15:19 +0000 | [diff] [blame] | 350 | sprintf(buffer, "%-6u", sys::Process::GetCurrentGroupId()); | 
| Misha Brukman | 4b2afe6 | 2005-04-20 03:55:35 +0000 | [diff] [blame] | 351 | memcpy(Hdr.gid,buffer,6); | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 352 | sprintf(buffer,"%-12u", unsigned(secondsSinceEpoch)); | 
|  | 353 | memcpy(Hdr.date,buffer,12); | 
|  | 354 | sprintf(buffer,"%-10u",symTabSize); | 
|  | 355 | memcpy(Hdr.size,buffer,10); | 
|  | 356 |  | 
|  | 357 | // Write the header | 
|  | 358 | ARFile.write((char*)&Hdr, sizeof(Hdr)); | 
|  | 359 |  | 
|  | 360 | // Save the starting position of the symbol tables data content. | 
|  | 361 | unsigned startpos = ARFile.tellp(); | 
|  | 362 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 363 | // Write out the symbols sequentially | 
|  | 364 | for ( Archive::SymTabType::iterator I = symTab.begin(), E = symTab.end(); | 
|  | 365 | I != E; ++I) | 
|  | 366 | { | 
|  | 367 | // Write out the file index | 
|  | 368 | writeInteger(I->second, ARFile); | 
|  | 369 | // Write out the length of the symbol | 
|  | 370 | writeInteger(I->first.length(), ARFile); | 
|  | 371 | // Write out the symbol | 
|  | 372 | ARFile.write(I->first.data(), I->first.length()); | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 373 | } | 
|  | 374 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 375 | // Now that we're done with the symbol table, get the ending file position | 
|  | 376 | unsigned endpos = ARFile.tellp(); | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 377 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 378 | // Make sure that the amount we wrote is what we pre-computed. This is | 
|  | 379 | // critical for file integrity purposes. | 
|  | 380 | assert(endpos - startpos == symTabSize && "Invalid symTabSize computation"); | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 381 |  | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 382 | // Make sure the symbol table is even sized | 
|  | 383 | if (symTabSize % 2 != 0 ) | 
|  | 384 | ARFile << ARFILE_PAD; | 
| Reid Spencer | 362cbf0 | 2004-11-06 08:51:45 +0000 | [diff] [blame] | 385 | } | 
|  | 386 |  | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 387 | // Write the entire archive to the file specified when the archive was created. | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 388 | // This writes to a temporary file first. Options are for creating a symbol | 
|  | 389 | // table, flattening the file names (no directories, 15 chars max) and | 
| Reid Spencer | 87f9072 | 2004-11-16 06:47:30 +0000 | [diff] [blame] | 390 | // compressing each archive member. | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 391 | bool | 
|  | 392 | Archive::writeToDisk(bool CreateSymbolTable, bool TruncateNames, bool Compress, | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 393 | std::string* ErrMsg) | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 394 | { | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 395 | // Make sure they haven't opened up the file, not loaded it, | 
|  | 396 | // but are now trying to write it which would wipe out the file. | 
| Reid Spencer | cd5561a | 2006-12-15 19:44:51 +0000 | [diff] [blame] | 397 | if (members.empty() && mapfile->size() > 8) { | 
|  | 398 | if (ErrMsg) | 
|  | 399 | *ErrMsg = "Can't write an archive not opened for writing"; | 
|  | 400 | return true; | 
|  | 401 | } | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 402 |  | 
|  | 403 | // Create a temporary file to store the archive in | 
|  | 404 | sys::Path TmpArchive = archPath; | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 405 | if (TmpArchive.createTemporaryFileOnDisk(ErrMsg)) | 
|  | 406 | return true; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 407 |  | 
|  | 408 | // Make sure the temporary gets removed if we crash | 
|  | 409 | sys::RemoveFileOnSignal(TmpArchive); | 
|  | 410 |  | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 411 | // Create archive file for output. | 
|  | 412 | std::ios::openmode io_mode = std::ios::out | std::ios::trunc | | 
|  | 413 | std::ios::binary; | 
|  | 414 | std::ofstream ArchiveFile(TmpArchive.c_str(), io_mode); | 
| Misha Brukman | 2b37d7c | 2005-04-21 21:13:18 +0000 | [diff] [blame] | 415 |  | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 416 | // Check for errors opening or creating archive file. | 
| Chris Lattner | 0c33231 | 2006-07-28 22:29:50 +0000 | [diff] [blame] | 417 | if (!ArchiveFile.is_open() || ArchiveFile.bad()) { | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 418 | if (TmpArchive.exists()) | 
| Reid Spencer | a229c5c | 2005-07-08 03:08:58 +0000 | [diff] [blame] | 419 | TmpArchive.eraseFromDisk(); | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 420 | if (ErrMsg) | 
|  | 421 | *ErrMsg = "Error opening archive file: " + archPath.toString(); | 
|  | 422 | return true; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 423 | } | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 424 |  | 
|  | 425 | // If we're creating a symbol table, reset it now | 
|  | 426 | if (CreateSymbolTable) { | 
|  | 427 | symTabSize = 0; | 
|  | 428 | symTab.clear(); | 
|  | 429 | } | 
|  | 430 |  | 
|  | 431 | // Write magic string to archive. | 
|  | 432 | ArchiveFile << ARFILE_MAGIC; | 
|  | 433 |  | 
|  | 434 | // Loop over all member files, and write them out. Note that this also | 
|  | 435 | // builds the symbol table, symTab. | 
| Chris Lattner | 0c33231 | 2006-07-28 22:29:50 +0000 | [diff] [blame] | 436 | for (MembersList::iterator I = begin(), E = end(); I != E; ++I) { | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 437 | if (writeMember(*I, ArchiveFile, CreateSymbolTable, | 
|  | 438 | TruncateNames, Compress, ErrMsg)) { | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 439 | if (TmpArchive.exists()) | 
|  | 440 | TmpArchive.eraseFromDisk(); | 
|  | 441 | ArchiveFile.close(); | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 442 | return true; | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 443 | } | 
|  | 444 | } | 
|  | 445 |  | 
|  | 446 | // Close archive file. | 
|  | 447 | ArchiveFile.close(); | 
|  | 448 |  | 
|  | 449 | // Write the symbol table | 
|  | 450 | if (CreateSymbolTable) { | 
|  | 451 | // At this point we have written a file that is a legal archive but it | 
|  | 452 | // doesn't have a symbol table in it. To aid in faster reading and to | 
|  | 453 | // ensure compatibility with other archivers we need to put the symbol | 
|  | 454 | // table first in the file. Unfortunately, this means mapping the file | 
|  | 455 | // we just wrote back in and copying it to the destination file. | 
|  | 456 |  | 
|  | 457 | // Map in the archive we just wrote. | 
| Reid Spencer | 751ca6b | 2006-08-22 16:07:44 +0000 | [diff] [blame] | 458 | sys::MappedFile arch; | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 459 | if (arch.open(TmpArchive, sys::MappedFile::READ_ACCESS, ErrMsg)) | 
|  | 460 | return true; | 
| Reid Spencer | 751ca6b | 2006-08-22 16:07:44 +0000 | [diff] [blame] | 461 | const char* base; | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 462 | if (!(base = (const char*) arch.map(ErrMsg))) | 
|  | 463 | return true; | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 464 |  | 
|  | 465 | // Open another temporary file in order to avoid invalidating the | 
|  | 466 | // mmapped data | 
|  | 467 | sys::Path FinalFilePath = archPath; | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 468 | if (FinalFilePath.createTemporaryFileOnDisk(ErrMsg)) | 
|  | 469 | return true; | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 470 | sys::RemoveFileOnSignal(FinalFilePath); | 
|  | 471 |  | 
|  | 472 | std::ofstream FinalFile(FinalFilePath.c_str(), io_mode); | 
| Chris Lattner | 0c33231 | 2006-07-28 22:29:50 +0000 | [diff] [blame] | 473 | if (!FinalFile.is_open() || FinalFile.bad()) { | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 474 | if (TmpArchive.exists()) | 
|  | 475 | TmpArchive.eraseFromDisk(); | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 476 | if (ErrMsg) | 
|  | 477 | *ErrMsg = "Error opening archive file: " + FinalFilePath.toString(); | 
|  | 478 | return true; | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 479 | } | 
|  | 480 |  | 
|  | 481 | // Write the file magic number | 
|  | 482 | FinalFile << ARFILE_MAGIC; | 
|  | 483 |  | 
|  | 484 | // If there is a foreign symbol table, put it into the file now. Most | 
|  | 485 | // ar(1) implementations require the symbol table to be first but llvm-ar | 
|  | 486 | // can deal with it being after a foreign symbol table. This ensures | 
|  | 487 | // compatibility with other ar(1) implementations as well as allowing the | 
|  | 488 | // archive to store both native .o and LLVM .bc files, both indexed. | 
|  | 489 | if (foreignST) { | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 490 | if (writeMember(*foreignST, FinalFile, false, false, false, ErrMsg)) { | 
| Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 491 | FinalFile.close(); | 
|  | 492 | if (TmpArchive.exists()) | 
|  | 493 | TmpArchive.eraseFromDisk(); | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 494 | return true; | 
| Reid Spencer | 8d8a7ff | 2006-07-07 20:56:50 +0000 | [diff] [blame] | 495 | } | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 496 | } | 
|  | 497 |  | 
|  | 498 | // Put out the LLVM symbol table now. | 
|  | 499 | writeSymbolTable(FinalFile); | 
|  | 500 |  | 
|  | 501 | // Copy the temporary file contents being sure to skip the file's magic | 
|  | 502 | // number. | 
|  | 503 | FinalFile.write(base + sizeof(ARFILE_MAGIC)-1, | 
|  | 504 | arch.size()-sizeof(ARFILE_MAGIC)+1); | 
|  | 505 |  | 
|  | 506 | // Close up shop | 
|  | 507 | FinalFile.close(); | 
|  | 508 | arch.close(); | 
|  | 509 |  | 
|  | 510 | // Move the final file over top of TmpArchive | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 511 | if (FinalFilePath.renamePathOnDisk(TmpArchive, ErrMsg)) | 
|  | 512 | return true; | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 513 | } | 
|  | 514 |  | 
|  | 515 | // Before we replace the actual archive, we need to forget all the | 
|  | 516 | // members, since they point to data in that old archive. We need to do | 
|  | 517 | // this because we cannot replace an open file on Windows. | 
|  | 518 | cleanUpMemory(); | 
|  | 519 |  | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 520 | if (TmpArchive.renamePathOnDisk(archPath, ErrMsg)) | 
|  | 521 | return true; | 
| Reid Spencer | 3039b99 | 2006-07-07 19:09:14 +0000 | [diff] [blame] | 522 |  | 
| Reid Spencer | 0ff2d31 | 2006-08-24 23:45:08 +0000 | [diff] [blame] | 523 | return false; | 
| Reid Spencer | cf6afc6 | 2004-11-14 21:56:59 +0000 | [diff] [blame] | 524 | } |