| /* |
| * Copyright (C) 2006 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| // |
| // Access to Zip archives. |
| // |
| |
| #define LOG_TAG "zip" |
| |
| #include "utils/ZipFile.h" |
| #include "utils/ZipUtils.h" |
| #include "utils/Log.h" |
| |
| #include <zlib.h> |
| #define DEF_MEM_LEVEL 8 // normally in zutil.h? |
| |
| #include <memory.h> |
| #include <sys/stat.h> |
| #include <errno.h> |
| #include <assert.h> |
| |
| using namespace android; |
| |
| /* |
| * Some environments require the "b", some choke on it. |
| */ |
| #define FILE_OPEN_RO "rb" |
| #define FILE_OPEN_RW "r+b" |
| #define FILE_OPEN_RW_CREATE "w+b" |
| |
| /* should live somewhere else? */ |
| static status_t errnoToStatus(int err) |
| { |
| if (err == ENOENT) |
| return NAME_NOT_FOUND; |
| else if (err == EACCES) |
| return PERMISSION_DENIED; |
| else |
| return UNKNOWN_ERROR; |
| } |
| |
| /* |
| * Open a file and parse its guts. |
| */ |
| status_t ZipFile::open(const char* zipFileName, int flags) |
| { |
| bool newArchive = false; |
| |
| assert(mZipFp == NULL); // no reopen |
| |
| if ((flags & kOpenTruncate)) |
| flags |= kOpenCreate; // trunc implies create |
| |
| if ((flags & kOpenReadOnly) && (flags & kOpenReadWrite)) |
| return INVALID_OPERATION; // not both |
| if (!((flags & kOpenReadOnly) || (flags & kOpenReadWrite))) |
| return INVALID_OPERATION; // not neither |
| if ((flags & kOpenCreate) && !(flags & kOpenReadWrite)) |
| return INVALID_OPERATION; // create requires write |
| |
| if (flags & kOpenTruncate) { |
| newArchive = true; |
| } else { |
| newArchive = (access(zipFileName, F_OK) != 0); |
| if (!(flags & kOpenCreate) && newArchive) { |
| /* not creating, must already exist */ |
| LOGD("File %s does not exist", zipFileName); |
| return NAME_NOT_FOUND; |
| } |
| } |
| |
| /* open the file */ |
| const char* openflags; |
| if (flags & kOpenReadWrite) { |
| if (newArchive) |
| openflags = FILE_OPEN_RW_CREATE; |
| else |
| openflags = FILE_OPEN_RW; |
| } else { |
| openflags = FILE_OPEN_RO; |
| } |
| mZipFp = fopen(zipFileName, openflags); |
| if (mZipFp == NULL) { |
| int err = errno; |
| LOGD("fopen failed: %d\n", err); |
| return errnoToStatus(err); |
| } |
| |
| status_t result; |
| if (!newArchive) { |
| /* |
| * Load the central directory. If that fails, then this probably |
| * isn't a Zip archive. |
| */ |
| result = readCentralDir(); |
| } else { |
| /* |
| * Newly-created. The EndOfCentralDir constructor actually |
| * sets everything to be the way we want it (all zeroes). We |
| * set mNeedCDRewrite so that we create *something* if the |
| * caller doesn't add any files. (We could also just unlink |
| * the file if it's brand new and nothing was added, but that's |
| * probably doing more than we really should -- the user might |
| * have a need for empty zip files.) |
| */ |
| mNeedCDRewrite = true; |
| result = NO_ERROR; |
| } |
| |
| if (flags & kOpenReadOnly) |
| mReadOnly = true; |
| else |
| assert(!mReadOnly); |
| |
| return result; |
| } |
| |
| /* |
| * Return the Nth entry in the archive. |
| */ |
| ZipEntry* ZipFile::getEntryByIndex(int idx) const |
| { |
| if (idx < 0 || idx >= (int) mEntries.size()) |
| return NULL; |
| |
| return mEntries[idx]; |
| } |
| |
| /* |
| * Find an entry by name. |
| */ |
| ZipEntry* ZipFile::getEntryByName(const char* fileName) const |
| { |
| /* |
| * Do a stupid linear string-compare search. |
| * |
| * There are various ways to speed this up, especially since it's rare |
| * to intermingle changes to the archive with "get by name" calls. We |
| * don't want to sort the mEntries vector itself, however, because |
| * it's used to recreate the Central Directory. |
| * |
| * (Hash table works, parallel list of pointers in sorted order is good.) |
| */ |
| int idx; |
| |
| for (idx = mEntries.size()-1; idx >= 0; idx--) { |
| ZipEntry* pEntry = mEntries[idx]; |
| if (!pEntry->getDeleted() && |
| strcmp(fileName, pEntry->getFileName()) == 0) |
| { |
| return pEntry; |
| } |
| } |
| |
| return NULL; |
| } |
| |
| /* |
| * Empty the mEntries vector. |
| */ |
| void ZipFile::discardEntries(void) |
| { |
| int count = mEntries.size(); |
| |
| while (--count >= 0) |
| delete mEntries[count]; |
| |
| mEntries.clear(); |
| } |
| |
| |
| /* |
| * Find the central directory and read the contents. |
| * |
| * The fun thing about ZIP archives is that they may or may not be |
| * readable from start to end. In some cases, notably for archives |
| * that were written to stdout, the only length information is in the |
| * central directory at the end of the file. |
| * |
| * Of course, the central directory can be followed by a variable-length |
| * comment field, so we have to scan through it backwards. The comment |
| * is at most 64K, plus we have 18 bytes for the end-of-central-dir stuff |
| * itself, plus apparently sometimes people throw random junk on the end |
| * just for the fun of it. |
| * |
| * This is all a little wobbly. If the wrong value ends up in the EOCD |
| * area, we're hosed. This appears to be the way that everbody handles |
| * it though, so we're in pretty good company if this fails. |
| */ |
| status_t ZipFile::readCentralDir(void) |
| { |
| status_t result = NO_ERROR; |
| unsigned char* buf = NULL; |
| off_t fileLength, seekStart; |
| long readAmount; |
| int i; |
| |
| fseek(mZipFp, 0, SEEK_END); |
| fileLength = ftell(mZipFp); |
| rewind(mZipFp); |
| |
| /* too small to be a ZIP archive? */ |
| if (fileLength < EndOfCentralDir::kEOCDLen) { |
| LOGD("Length is %ld -- too small\n", (long)fileLength); |
| result = INVALID_OPERATION; |
| goto bail; |
| } |
| |
| buf = new unsigned char[EndOfCentralDir::kMaxEOCDSearch]; |
| if (buf == NULL) { |
| LOGD("Failure allocating %d bytes for EOCD search", |
| EndOfCentralDir::kMaxEOCDSearch); |
| result = NO_MEMORY; |
| goto bail; |
| } |
| |
| if (fileLength > EndOfCentralDir::kMaxEOCDSearch) { |
| seekStart = fileLength - EndOfCentralDir::kMaxEOCDSearch; |
| readAmount = EndOfCentralDir::kMaxEOCDSearch; |
| } else { |
| seekStart = 0; |
| readAmount = (long) fileLength; |
| } |
| if (fseek(mZipFp, seekStart, SEEK_SET) != 0) { |
| LOGD("Failure seeking to end of zip at %ld", (long) seekStart); |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| /* read the last part of the file into the buffer */ |
| if (fread(buf, 1, readAmount, mZipFp) != (size_t) readAmount) { |
| LOGD("short file? wanted %ld\n", readAmount); |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| /* find the end-of-central-dir magic */ |
| for (i = readAmount - 4; i >= 0; i--) { |
| if (buf[i] == 0x50 && |
| ZipEntry::getLongLE(&buf[i]) == EndOfCentralDir::kSignature) |
| { |
| LOGV("+++ Found EOCD at buf+%d\n", i); |
| break; |
| } |
| } |
| if (i < 0) { |
| LOGD("EOCD not found, not Zip\n"); |
| result = INVALID_OPERATION; |
| goto bail; |
| } |
| |
| /* extract eocd values */ |
| result = mEOCD.readBuf(buf + i, readAmount - i); |
| if (result != NO_ERROR) { |
| LOGD("Failure reading %ld bytes of EOCD values", readAmount - i); |
| goto bail; |
| } |
| //mEOCD.dump(); |
| |
| if (mEOCD.mDiskNumber != 0 || mEOCD.mDiskWithCentralDir != 0 || |
| mEOCD.mNumEntries != mEOCD.mTotalNumEntries) |
| { |
| LOGD("Archive spanning not supported\n"); |
| result = INVALID_OPERATION; |
| goto bail; |
| } |
| |
| /* |
| * So far so good. "mCentralDirSize" is the size in bytes of the |
| * central directory, so we can just seek back that far to find it. |
| * We can also seek forward mCentralDirOffset bytes from the |
| * start of the file. |
| * |
| * We're not guaranteed to have the rest of the central dir in the |
| * buffer, nor are we guaranteed that the central dir will have any |
| * sort of convenient size. We need to skip to the start of it and |
| * read the header, then the other goodies. |
| * |
| * The only thing we really need right now is the file comment, which |
| * we're hoping to preserve. |
| */ |
| if (fseek(mZipFp, mEOCD.mCentralDirOffset, SEEK_SET) != 0) { |
| LOGD("Failure seeking to central dir offset %ld\n", |
| mEOCD.mCentralDirOffset); |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| /* |
| * Loop through and read the central dir entries. |
| */ |
| LOGV("Scanning %d entries...\n", mEOCD.mTotalNumEntries); |
| int entry; |
| for (entry = 0; entry < mEOCD.mTotalNumEntries; entry++) { |
| ZipEntry* pEntry = new ZipEntry; |
| |
| result = pEntry->initFromCDE(mZipFp); |
| if (result != NO_ERROR) { |
| LOGD("initFromCDE failed\n"); |
| delete pEntry; |
| goto bail; |
| } |
| |
| mEntries.add(pEntry); |
| } |
| |
| |
| /* |
| * If all went well, we should now be back at the EOCD. |
| */ |
| { |
| unsigned char checkBuf[4]; |
| if (fread(checkBuf, 1, 4, mZipFp) != 4) { |
| LOGD("EOCD check read failed\n"); |
| result = INVALID_OPERATION; |
| goto bail; |
| } |
| if (ZipEntry::getLongLE(checkBuf) != EndOfCentralDir::kSignature) { |
| LOGD("EOCD read check failed\n"); |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| LOGV("+++ EOCD read check passed\n"); |
| } |
| |
| bail: |
| delete[] buf; |
| return result; |
| } |
| |
| |
| /* |
| * Add a new file to the archive. |
| * |
| * This requires creating and populating a ZipEntry structure, and copying |
| * the data into the file at the appropriate position. The "appropriate |
| * position" is the current location of the central directory, which we |
| * casually overwrite (we can put it back later). |
| * |
| * If we were concerned about safety, we would want to make all changes |
| * in a temp file and then overwrite the original after everything was |
| * safely written. Not really a concern for us. |
| */ |
| status_t ZipFile::addCommon(const char* fileName, const void* data, size_t size, |
| const char* storageName, int sourceType, int compressionMethod, |
| ZipEntry** ppEntry) |
| { |
| ZipEntry* pEntry = NULL; |
| status_t result = NO_ERROR; |
| long lfhPosn, startPosn, endPosn, uncompressedLen; |
| FILE* inputFp = NULL; |
| unsigned long crc; |
| time_t modWhen; |
| |
| if (mReadOnly) |
| return INVALID_OPERATION; |
| |
| assert(compressionMethod == ZipEntry::kCompressDeflated || |
| compressionMethod == ZipEntry::kCompressStored); |
| |
| /* make sure we're in a reasonable state */ |
| assert(mZipFp != NULL); |
| assert(mEntries.size() == mEOCD.mTotalNumEntries); |
| |
| /* make sure it doesn't already exist */ |
| if (getEntryByName(storageName) != NULL) |
| return ALREADY_EXISTS; |
| |
| if (!data) { |
| inputFp = fopen(fileName, FILE_OPEN_RO); |
| if (inputFp == NULL) |
| return errnoToStatus(errno); |
| } |
| |
| if (fseek(mZipFp, mEOCD.mCentralDirOffset, SEEK_SET) != 0) { |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| pEntry = new ZipEntry; |
| pEntry->initNew(storageName, NULL); |
| |
| /* |
| * From here on out, failures are more interesting. |
| */ |
| mNeedCDRewrite = true; |
| |
| /* |
| * Write the LFH, even though it's still mostly blank. We need it |
| * as a place-holder. In theory the LFH isn't necessary, but in |
| * practice some utilities demand it. |
| */ |
| lfhPosn = ftell(mZipFp); |
| pEntry->mLFH.write(mZipFp); |
| startPosn = ftell(mZipFp); |
| |
| /* |
| * Copy the data in, possibly compressing it as we go. |
| */ |
| if (sourceType == ZipEntry::kCompressStored) { |
| if (compressionMethod == ZipEntry::kCompressDeflated) { |
| bool failed = false; |
| result = compressFpToFp(mZipFp, inputFp, data, size, &crc); |
| if (result != NO_ERROR) { |
| LOGD("compression failed, storing\n"); |
| failed = true; |
| } else { |
| /* |
| * Make sure it has compressed "enough". This probably ought |
| * to be set through an API call, but I don't expect our |
| * criteria to change over time. |
| */ |
| long src = inputFp ? ftell(inputFp) : size; |
| long dst = ftell(mZipFp) - startPosn; |
| if (dst + (dst / 10) > src) { |
| LOGD("insufficient compression (src=%ld dst=%ld), storing\n", |
| src, dst); |
| failed = true; |
| } |
| } |
| |
| if (failed) { |
| compressionMethod = ZipEntry::kCompressStored; |
| if (inputFp) rewind(inputFp); |
| fseek(mZipFp, startPosn, SEEK_SET); |
| /* fall through to kCompressStored case */ |
| } |
| } |
| /* handle "no compression" request, or failed compression from above */ |
| if (compressionMethod == ZipEntry::kCompressStored) { |
| if (inputFp) { |
| result = copyFpToFp(mZipFp, inputFp, &crc); |
| } else { |
| result = copyDataToFp(mZipFp, data, size, &crc); |
| } |
| if (result != NO_ERROR) { |
| // don't need to truncate; happens in CDE rewrite |
| LOGD("failed copying data in\n"); |
| goto bail; |
| } |
| } |
| |
| // currently seeked to end of file |
| uncompressedLen = inputFp ? ftell(inputFp) : size; |
| } else if (sourceType == ZipEntry::kCompressDeflated) { |
| /* we should support uncompressed-from-compressed, but it's not |
| * important right now */ |
| assert(compressionMethod == ZipEntry::kCompressDeflated); |
| |
| bool scanResult; |
| int method; |
| long compressedLen; |
| |
| scanResult = ZipUtils::examineGzip(inputFp, &method, &uncompressedLen, |
| &compressedLen, &crc); |
| if (!scanResult || method != ZipEntry::kCompressDeflated) { |
| LOGD("this isn't a deflated gzip file?"); |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| result = copyPartialFpToFp(mZipFp, inputFp, compressedLen, NULL); |
| if (result != NO_ERROR) { |
| LOGD("failed copying gzip data in\n"); |
| goto bail; |
| } |
| } else { |
| assert(false); |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| /* |
| * We could write the "Data Descriptor", but there doesn't seem to |
| * be any point since we're going to go back and write the LFH. |
| * |
| * Update file offsets. |
| */ |
| endPosn = ftell(mZipFp); // seeked to end of compressed data |
| |
| /* |
| * Success! Fill out new values. |
| */ |
| pEntry->setDataInfo(uncompressedLen, endPosn - startPosn, crc, |
| compressionMethod); |
| modWhen = getModTime(inputFp ? fileno(inputFp) : fileno(mZipFp)); |
| pEntry->setModWhen(modWhen); |
| pEntry->setLFHOffset(lfhPosn); |
| mEOCD.mNumEntries++; |
| mEOCD.mTotalNumEntries++; |
| mEOCD.mCentralDirSize = 0; // mark invalid; set by flush() |
| mEOCD.mCentralDirOffset = endPosn; |
| |
| /* |
| * Go back and write the LFH. |
| */ |
| if (fseek(mZipFp, lfhPosn, SEEK_SET) != 0) { |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| pEntry->mLFH.write(mZipFp); |
| |
| /* |
| * Add pEntry to the list. |
| */ |
| mEntries.add(pEntry); |
| if (ppEntry != NULL) |
| *ppEntry = pEntry; |
| pEntry = NULL; |
| |
| bail: |
| if (inputFp != NULL) |
| fclose(inputFp); |
| delete pEntry; |
| return result; |
| } |
| |
| /* |
| * Add an entry by copying it from another zip file. If "padding" is |
| * nonzero, the specified number of bytes will be added to the "extra" |
| * field in the header. |
| * |
| * If "ppEntry" is non-NULL, a pointer to the new entry will be returned. |
| */ |
| status_t ZipFile::add(const ZipFile* pSourceZip, const ZipEntry* pSourceEntry, |
| int padding, ZipEntry** ppEntry) |
| { |
| ZipEntry* pEntry = NULL; |
| status_t result; |
| long lfhPosn, endPosn; |
| |
| if (mReadOnly) |
| return INVALID_OPERATION; |
| |
| /* make sure we're in a reasonable state */ |
| assert(mZipFp != NULL); |
| assert(mEntries.size() == mEOCD.mTotalNumEntries); |
| |
| if (fseek(mZipFp, mEOCD.mCentralDirOffset, SEEK_SET) != 0) { |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| pEntry = new ZipEntry; |
| if (pEntry == NULL) { |
| result = NO_MEMORY; |
| goto bail; |
| } |
| |
| result = pEntry->initFromExternal(pSourceZip, pSourceEntry); |
| if (result != NO_ERROR) |
| goto bail; |
| if (padding != 0) { |
| result = pEntry->addPadding(padding); |
| if (result != NO_ERROR) |
| goto bail; |
| } |
| |
| /* |
| * From here on out, failures are more interesting. |
| */ |
| mNeedCDRewrite = true; |
| |
| /* |
| * Write the LFH. Since we're not recompressing the data, we already |
| * have all of the fields filled out. |
| */ |
| lfhPosn = ftell(mZipFp); |
| pEntry->mLFH.write(mZipFp); |
| |
| /* |
| * Copy the data over. |
| * |
| * If the "has data descriptor" flag is set, we want to copy the DD |
| * fields as well. This is a fixed-size area immediately following |
| * the data. |
| */ |
| if (fseek(pSourceZip->mZipFp, pSourceEntry->getFileOffset(), SEEK_SET) != 0) |
| { |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| off_t copyLen; |
| copyLen = pSourceEntry->getCompressedLen(); |
| if ((pSourceEntry->mLFH.mGPBitFlag & ZipEntry::kUsesDataDescr) != 0) |
| copyLen += ZipEntry::kDataDescriptorLen; |
| |
| if (copyPartialFpToFp(mZipFp, pSourceZip->mZipFp, copyLen, NULL) |
| != NO_ERROR) |
| { |
| LOGW("copy of '%s' failed\n", pEntry->mCDE.mFileName); |
| result = UNKNOWN_ERROR; |
| goto bail; |
| } |
| |
| /* |
| * Update file offsets. |
| */ |
| endPosn = ftell(mZipFp); |
| |
| /* |
| * Success! Fill out new values. |
| */ |
| pEntry->setLFHOffset(lfhPosn); // sets mCDE.mLocalHeaderRelOffset |
| mEOCD.mNumEntries++; |
| mEOCD.mTotalNumEntries++; |
| mEOCD.mCentralDirSize = 0; // mark invalid; set by flush() |
| mEOCD.mCentralDirOffset = endPosn; |
| |
| /* |
| * Add pEntry to the list. |
| */ |
| mEntries.add(pEntry); |
| if (ppEntry != NULL) |
| *ppEntry = pEntry; |
| pEntry = NULL; |
| |
| result = NO_ERROR; |
| |
| bail: |
| delete pEntry; |
| return result; |
| } |
| |
| /* |
| * Copy all of the bytes in "src" to "dst". |
| * |
| * On exit, "srcFp" will be seeked to the end of the file, and "dstFp" |
| * will be seeked immediately past the data. |
| */ |
| status_t ZipFile::copyFpToFp(FILE* dstFp, FILE* srcFp, unsigned long* pCRC32) |
| { |
| unsigned char tmpBuf[32768]; |
| size_t count; |
| |
| *pCRC32 = crc32(0L, Z_NULL, 0); |
| |
| while (1) { |
| count = fread(tmpBuf, 1, sizeof(tmpBuf), srcFp); |
| if (ferror(srcFp) || ferror(dstFp)) |
| return errnoToStatus(errno); |
| if (count == 0) |
| break; |
| |
| *pCRC32 = crc32(*pCRC32, tmpBuf, count); |
| |
| if (fwrite(tmpBuf, 1, count, dstFp) != count) { |
| LOGD("fwrite %d bytes failed\n", (int) count); |
| return UNKNOWN_ERROR; |
| } |
| } |
| |
| return NO_ERROR; |
| } |
| |
| /* |
| * Copy all of the bytes in "src" to "dst". |
| * |
| * On exit, "dstFp" will be seeked immediately past the data. |
| */ |
| status_t ZipFile::copyDataToFp(FILE* dstFp, |
| const void* data, size_t size, unsigned long* pCRC32) |
| { |
| size_t count; |
| |
| *pCRC32 = crc32(0L, Z_NULL, 0); |
| if (size > 0) { |
| *pCRC32 = crc32(*pCRC32, (const unsigned char*)data, size); |
| if (fwrite(data, 1, size, dstFp) != size) { |
| LOGD("fwrite %d bytes failed\n", (int) size); |
| return UNKNOWN_ERROR; |
| } |
| } |
| |
| return NO_ERROR; |
| } |
| |
| /* |
| * Copy some of the bytes in "src" to "dst". |
| * |
| * If "pCRC32" is NULL, the CRC will not be computed. |
| * |
| * On exit, "srcFp" will be seeked to the end of the file, and "dstFp" |
| * will be seeked immediately past the data just written. |
| */ |
| status_t ZipFile::copyPartialFpToFp(FILE* dstFp, FILE* srcFp, long length, |
| unsigned long* pCRC32) |
| { |
| unsigned char tmpBuf[32768]; |
| size_t count; |
| |
| if (pCRC32 != NULL) |
| *pCRC32 = crc32(0L, Z_NULL, 0); |
| |
| while (length) { |
| long readSize; |
| |
| readSize = sizeof(tmpBuf); |
| if (readSize > length) |
| readSize = length; |
| |
| count = fread(tmpBuf, 1, readSize, srcFp); |
| if ((long) count != readSize) { // error or unexpected EOF |
| LOGD("fread %d bytes failed\n", (int) readSize); |
| return UNKNOWN_ERROR; |
| } |
| |
| if (pCRC32 != NULL) |
| *pCRC32 = crc32(*pCRC32, tmpBuf, count); |
| |
| if (fwrite(tmpBuf, 1, count, dstFp) != count) { |
| LOGD("fwrite %d bytes failed\n", (int) count); |
| return UNKNOWN_ERROR; |
| } |
| |
| length -= readSize; |
| } |
| |
| return NO_ERROR; |
| } |
| |
| /* |
| * Compress all of the data in "srcFp" and write it to "dstFp". |
| * |
| * On exit, "srcFp" will be seeked to the end of the file, and "dstFp" |
| * will be seeked immediately past the compressed data. |
| */ |
| status_t ZipFile::compressFpToFp(FILE* dstFp, FILE* srcFp, |
| const void* data, size_t size, unsigned long* pCRC32) |
| { |
| status_t result = NO_ERROR; |
| const size_t kBufSize = 32768; |
| unsigned char* inBuf = NULL; |
| unsigned char* outBuf = NULL; |
| z_stream zstream; |
| bool atEof = false; // no feof() aviailable yet |
| unsigned long crc; |
| int zerr; |
| |
| /* |
| * Create an input buffer and an output buffer. |
| */ |
| inBuf = new unsigned char[kBufSize]; |
| outBuf = new unsigned char[kBufSize]; |
| if (inBuf == NULL || outBuf == NULL) { |
| result = NO_MEMORY; |
| goto bail; |
| } |
| |
| /* |
| * Initialize the zlib stream. |
| */ |
| memset(&zstream, 0, sizeof(zstream)); |
| zstream.zalloc = Z_NULL; |
| zstream.zfree = Z_NULL; |
| zstream.opaque = Z_NULL; |
| zstream.next_in = NULL; |
| zstream.avail_in = 0; |
| zstream.next_out = outBuf; |
| zstream.avail_out = kBufSize; |
| zstream.data_type = Z_UNKNOWN; |
| |
| zerr = deflateInit2(&zstream, Z_BEST_COMPRESSION, |
| Z_DEFLATED, -MAX_WBITS, DEF_MEM_LEVEL, Z_DEFAULT_STRATEGY); |
| if (zerr != Z_OK) { |
| result = UNKNOWN_ERROR; |
| if (zerr == Z_VERSION_ERROR) { |
| LOGE("Installed zlib is not compatible with linked version (%s)\n", |
| ZLIB_VERSION); |
| } else { |
| LOGD("Call to deflateInit2 failed (zerr=%d)\n", zerr); |
| } |
| goto bail; |
| } |
| |
| crc = crc32(0L, Z_NULL, 0); |
| |
| /* |
| * Loop while we have data. |
| */ |
| do { |
| size_t getSize; |
| int flush; |
| |
| /* only read if the input buffer is empty */ |
| if (zstream.avail_in == 0 && !atEof) { |
| LOGV("+++ reading %d bytes\n", (int)kBufSize); |
| if (data) { |
| getSize = size > kBufSize ? kBufSize : size; |
| memcpy(inBuf, data, getSize); |
| data = ((const char*)data) + getSize; |
| size -= getSize; |
| } else { |
| getSize = fread(inBuf, 1, kBufSize, srcFp); |
| if (ferror(srcFp)) { |
| LOGD("deflate read failed (errno=%d)\n", errno); |
| goto z_bail; |
| } |
| } |
| if (getSize < kBufSize) { |
| LOGV("+++ got %d bytes, EOF reached\n", |
| (int)getSize); |
| atEof = true; |
| } |
| |
| crc = crc32(crc, inBuf, getSize); |
| |
| zstream.next_in = inBuf; |
| zstream.avail_in = getSize; |
| } |
| |
| if (atEof) |
| flush = Z_FINISH; /* tell zlib that we're done */ |
| else |
| flush = Z_NO_FLUSH; /* more to come! */ |
| |
| zerr = deflate(&zstream, flush); |
| if (zerr != Z_OK && zerr != Z_STREAM_END) { |
| LOGD("zlib deflate call failed (zerr=%d)\n", zerr); |
| result = UNKNOWN_ERROR; |
| goto z_bail; |
| } |
| |
| /* write when we're full or when we're done */ |
| if (zstream.avail_out == 0 || |
| (zerr == Z_STREAM_END && zstream.avail_out != (uInt) kBufSize)) |
| { |
| LOGV("+++ writing %d bytes\n", (int) (zstream.next_out - outBuf)); |
| if (fwrite(outBuf, 1, zstream.next_out - outBuf, dstFp) != |
| (size_t)(zstream.next_out - outBuf)) |
| { |
| LOGD("write %d failed in deflate\n", |
| (int) (zstream.next_out - outBuf)); |
| goto z_bail; |
| } |
| |
| zstream.next_out = outBuf; |
| zstream.avail_out = kBufSize; |
| } |
| } while (zerr == Z_OK); |
| |
| assert(zerr == Z_STREAM_END); /* other errors should've been caught */ |
| |
| *pCRC32 = crc; |
| |
| z_bail: |
| deflateEnd(&zstream); /* free up any allocated structures */ |
| |
| bail: |
| delete[] inBuf; |
| delete[] outBuf; |
| |
| return result; |
| } |
| |
| /* |
| * Mark an entry as deleted. |
| * |
| * We will eventually need to crunch the file down, but if several files |
| * are being removed (perhaps as part of an "update" process) we can make |
| * things considerably faster by deferring the removal to "flush" time. |
| */ |
| status_t ZipFile::remove(ZipEntry* pEntry) |
| { |
| /* |
| * Should verify that pEntry is actually part of this archive, and |
| * not some stray ZipEntry from a different file. |
| */ |
| |
| /* mark entry as deleted, and mark archive as dirty */ |
| pEntry->setDeleted(); |
| mNeedCDRewrite = true; |
| return NO_ERROR; |
| } |
| |
| /* |
| * Flush any pending writes. |
| * |
| * In particular, this will crunch out deleted entries, and write the |
| * Central Directory and EOCD if we have stomped on them. |
| */ |
| status_t ZipFile::flush(void) |
| { |
| status_t result = NO_ERROR; |
| long eocdPosn; |
| int i, count; |
| |
| if (mReadOnly) |
| return INVALID_OPERATION; |
| if (!mNeedCDRewrite) |
| return NO_ERROR; |
| |
| assert(mZipFp != NULL); |
| |
| result = crunchArchive(); |
| if (result != NO_ERROR) |
| return result; |
| |
| if (fseek(mZipFp, mEOCD.mCentralDirOffset, SEEK_SET) != 0) |
| return UNKNOWN_ERROR; |
| |
| count = mEntries.size(); |
| for (i = 0; i < count; i++) { |
| ZipEntry* pEntry = mEntries[i]; |
| pEntry->mCDE.write(mZipFp); |
| } |
| |
| eocdPosn = ftell(mZipFp); |
| mEOCD.mCentralDirSize = eocdPosn - mEOCD.mCentralDirOffset; |
| |
| mEOCD.write(mZipFp); |
| |
| /* |
| * If we had some stuff bloat up during compression and get replaced |
| * with plain files, or if we deleted some entries, there's a lot |
| * of wasted space at the end of the file. Remove it now. |
| */ |
| if (ftruncate(fileno(mZipFp), ftell(mZipFp)) != 0) { |
| LOGW("ftruncate failed %ld: %s\n", ftell(mZipFp), strerror(errno)); |
| // not fatal |
| } |
| |
| /* should we clear the "newly added" flag in all entries now? */ |
| |
| mNeedCDRewrite = false; |
| return NO_ERROR; |
| } |
| |
| /* |
| * Crunch deleted files out of an archive by shifting the later files down. |
| * |
| * Because we're not using a temp file, we do the operation inside the |
| * current file. |
| */ |
| status_t ZipFile::crunchArchive(void) |
| { |
| status_t result = NO_ERROR; |
| int i, count; |
| long delCount, adjust; |
| |
| #if 0 |
| printf("CONTENTS:\n"); |
| for (i = 0; i < (int) mEntries.size(); i++) { |
| printf(" %d: lfhOff=%ld del=%d\n", |
| i, mEntries[i]->getLFHOffset(), mEntries[i]->getDeleted()); |
| } |
| printf(" END is %ld\n", (long) mEOCD.mCentralDirOffset); |
| #endif |
| |
| /* |
| * Roll through the set of files, shifting them as appropriate. We |
| * could probably get a slight performance improvement by sliding |
| * multiple files down at once (because we could use larger reads |
| * when operating on batches of small files), but it's not that useful. |
| */ |
| count = mEntries.size(); |
| delCount = adjust = 0; |
| for (i = 0; i < count; i++) { |
| ZipEntry* pEntry = mEntries[i]; |
| long span; |
| |
| if (pEntry->getLFHOffset() != 0) { |
| long nextOffset; |
| |
| /* Get the length of this entry by finding the offset |
| * of the next entry. Directory entries don't have |
| * file offsets, so we need to find the next non-directory |
| * entry. |
| */ |
| nextOffset = 0; |
| for (int ii = i+1; nextOffset == 0 && ii < count; ii++) |
| nextOffset = mEntries[ii]->getLFHOffset(); |
| if (nextOffset == 0) |
| nextOffset = mEOCD.mCentralDirOffset; |
| span = nextOffset - pEntry->getLFHOffset(); |
| |
| assert(span >= ZipEntry::LocalFileHeader::kLFHLen); |
| } else { |
| /* This is a directory entry. It doesn't have |
| * any actual file contents, so there's no need to |
| * move anything. |
| */ |
| span = 0; |
| } |
| |
| //printf("+++ %d: off=%ld span=%ld del=%d [count=%d]\n", |
| // i, pEntry->getLFHOffset(), span, pEntry->getDeleted(), count); |
| |
| if (pEntry->getDeleted()) { |
| adjust += span; |
| delCount++; |
| |
| delete pEntry; |
| mEntries.removeAt(i); |
| |
| /* adjust loop control */ |
| count--; |
| i--; |
| } else if (span != 0 && adjust > 0) { |
| /* shuffle this entry back */ |
| //printf("+++ Shuffling '%s' back %ld\n", |
| // pEntry->getFileName(), adjust); |
| result = filemove(mZipFp, pEntry->getLFHOffset() - adjust, |
| pEntry->getLFHOffset(), span); |
| if (result != NO_ERROR) { |
| /* this is why you use a temp file */ |
| LOGE("error during crunch - archive is toast\n"); |
| return result; |
| } |
| |
| pEntry->setLFHOffset(pEntry->getLFHOffset() - adjust); |
| } |
| } |
| |
| /* |
| * Fix EOCD info. We have to wait until the end to do some of this |
| * because we use mCentralDirOffset to determine "span" for the |
| * last entry. |
| */ |
| mEOCD.mCentralDirOffset -= adjust; |
| mEOCD.mNumEntries -= delCount; |
| mEOCD.mTotalNumEntries -= delCount; |
| mEOCD.mCentralDirSize = 0; // mark invalid; set by flush() |
| |
| assert(mEOCD.mNumEntries == mEOCD.mTotalNumEntries); |
| assert(mEOCD.mNumEntries == count); |
| |
| return result; |
| } |
| |
| /* |
| * Works like memmove(), but on pieces of a file. |
| */ |
| status_t ZipFile::filemove(FILE* fp, off_t dst, off_t src, size_t n) |
| { |
| if (dst == src || n <= 0) |
| return NO_ERROR; |
| |
| unsigned char readBuf[32768]; |
| |
| if (dst < src) { |
| /* shift stuff toward start of file; must read from start */ |
| while (n != 0) { |
| size_t getSize = sizeof(readBuf); |
| if (getSize > n) |
| getSize = n; |
| |
| if (fseek(fp, (long) src, SEEK_SET) != 0) { |
| LOGD("filemove src seek %ld failed\n", (long) src); |
| return UNKNOWN_ERROR; |
| } |
| |
| if (fread(readBuf, 1, getSize, fp) != getSize) { |
| LOGD("filemove read %ld off=%ld failed\n", |
| (long) getSize, (long) src); |
| return UNKNOWN_ERROR; |
| } |
| |
| if (fseek(fp, (long) dst, SEEK_SET) != 0) { |
| LOGD("filemove dst seek %ld failed\n", (long) dst); |
| return UNKNOWN_ERROR; |
| } |
| |
| if (fwrite(readBuf, 1, getSize, fp) != getSize) { |
| LOGD("filemove write %ld off=%ld failed\n", |
| (long) getSize, (long) dst); |
| return UNKNOWN_ERROR; |
| } |
| |
| src += getSize; |
| dst += getSize; |
| n -= getSize; |
| } |
| } else { |
| /* shift stuff toward end of file; must read from end */ |
| assert(false); // write this someday, maybe |
| return UNKNOWN_ERROR; |
| } |
| |
| return NO_ERROR; |
| } |
| |
| |
| /* |
| * Get the modification time from a file descriptor. |
| */ |
| time_t ZipFile::getModTime(int fd) |
| { |
| struct stat sb; |
| |
| if (fstat(fd, &sb) < 0) { |
| LOGD("HEY: fstat on fd %d failed\n", fd); |
| return (time_t) -1; |
| } |
| |
| return sb.st_mtime; |
| } |
| |
| |
| #if 0 /* this is a bad idea */ |
| /* |
| * Get a copy of the Zip file descriptor. |
| * |
| * We don't allow this if the file was opened read-write because we tend |
| * to leave the file contents in an uncertain state between calls to |
| * flush(). The duplicated file descriptor should only be valid for reads. |
| */ |
| int ZipFile::getZipFd(void) const |
| { |
| if (!mReadOnly) |
| return INVALID_OPERATION; |
| assert(mZipFp != NULL); |
| |
| int fd; |
| fd = dup(fileno(mZipFp)); |
| if (fd < 0) { |
| LOGD("didn't work, errno=%d\n", errno); |
| } |
| |
| return fd; |
| } |
| #endif |
| |
| |
| #if 0 |
| /* |
| * Expand data. |
| */ |
| bool ZipFile::uncompress(const ZipEntry* pEntry, void* buf) const |
| { |
| return false; |
| } |
| #endif |
| |
| // free the memory when you're done |
| void* ZipFile::uncompress(const ZipEntry* entry) |
| { |
| size_t unlen = entry->getUncompressedLen(); |
| size_t clen = entry->getCompressedLen(); |
| |
| void* buf = malloc(unlen); |
| if (buf == NULL) { |
| return NULL; |
| } |
| |
| fseek(mZipFp, 0, SEEK_SET); |
| |
| off_t offset = entry->getFileOffset(); |
| if (fseek(mZipFp, offset, SEEK_SET) != 0) { |
| goto bail; |
| } |
| |
| switch (entry->getCompressionMethod()) |
| { |
| case ZipEntry::kCompressStored: { |
| ssize_t amt = fread(buf, 1, unlen, mZipFp); |
| if (amt != (ssize_t)unlen) { |
| goto bail; |
| } |
| #if 0 |
| printf("data...\n"); |
| const unsigned char* p = (unsigned char*)buf; |
| const unsigned char* end = p+unlen; |
| for (int i=0; i<32 && p < end; i++) { |
| printf("0x%08x ", (int)(offset+(i*0x10))); |
| for (int j=0; j<0x10 && p < end; j++) { |
| printf(" %02x", *p); |
| p++; |
| } |
| printf("\n"); |
| } |
| #endif |
| |
| } |
| break; |
| case ZipEntry::kCompressDeflated: { |
| if (!ZipUtils::inflateToBuffer(mZipFp, buf, unlen, clen)) { |
| goto bail; |
| } |
| } |
| break; |
| default: |
| goto bail; |
| } |
| return buf; |
| |
| bail: |
| free(buf); |
| return NULL; |
| } |
| |
| |
| /* |
| * =========================================================================== |
| * ZipFile::EndOfCentralDir |
| * =========================================================================== |
| */ |
| |
| /* |
| * Read the end-of-central-dir fields. |
| * |
| * "buf" should be positioned at the EOCD signature, and should contain |
| * the entire EOCD area including the comment. |
| */ |
| status_t ZipFile::EndOfCentralDir::readBuf(const unsigned char* buf, int len) |
| { |
| /* don't allow re-use */ |
| assert(mComment == NULL); |
| |
| if (len < kEOCDLen) { |
| /* looks like ZIP file got truncated */ |
| LOGD(" Zip EOCD: expected >= %d bytes, found %d\n", |
| kEOCDLen, len); |
| return INVALID_OPERATION; |
| } |
| |
| /* this should probably be an assert() */ |
| if (ZipEntry::getLongLE(&buf[0x00]) != kSignature) |
| return UNKNOWN_ERROR; |
| |
| mDiskNumber = ZipEntry::getShortLE(&buf[0x04]); |
| mDiskWithCentralDir = ZipEntry::getShortLE(&buf[0x06]); |
| mNumEntries = ZipEntry::getShortLE(&buf[0x08]); |
| mTotalNumEntries = ZipEntry::getShortLE(&buf[0x0a]); |
| mCentralDirSize = ZipEntry::getLongLE(&buf[0x0c]); |
| mCentralDirOffset = ZipEntry::getLongLE(&buf[0x10]); |
| mCommentLen = ZipEntry::getShortLE(&buf[0x14]); |
| |
| // TODO: validate mCentralDirOffset |
| |
| if (mCommentLen > 0) { |
| if (kEOCDLen + mCommentLen > len) { |
| LOGD("EOCD(%d) + comment(%d) exceeds len (%d)\n", |
| kEOCDLen, mCommentLen, len); |
| return UNKNOWN_ERROR; |
| } |
| mComment = new unsigned char[mCommentLen]; |
| memcpy(mComment, buf + kEOCDLen, mCommentLen); |
| } |
| |
| return NO_ERROR; |
| } |
| |
| /* |
| * Write an end-of-central-directory section. |
| */ |
| status_t ZipFile::EndOfCentralDir::write(FILE* fp) |
| { |
| unsigned char buf[kEOCDLen]; |
| |
| ZipEntry::putLongLE(&buf[0x00], kSignature); |
| ZipEntry::putShortLE(&buf[0x04], mDiskNumber); |
| ZipEntry::putShortLE(&buf[0x06], mDiskWithCentralDir); |
| ZipEntry::putShortLE(&buf[0x08], mNumEntries); |
| ZipEntry::putShortLE(&buf[0x0a], mTotalNumEntries); |
| ZipEntry::putLongLE(&buf[0x0c], mCentralDirSize); |
| ZipEntry::putLongLE(&buf[0x10], mCentralDirOffset); |
| ZipEntry::putShortLE(&buf[0x14], mCommentLen); |
| |
| if (fwrite(buf, 1, kEOCDLen, fp) != kEOCDLen) |
| return UNKNOWN_ERROR; |
| if (mCommentLen > 0) { |
| assert(mComment != NULL); |
| if (fwrite(mComment, mCommentLen, 1, fp) != mCommentLen) |
| return UNKNOWN_ERROR; |
| } |
| |
| return NO_ERROR; |
| } |
| |
| /* |
| * Dump the contents of an EndOfCentralDir object. |
| */ |
| void ZipFile::EndOfCentralDir::dump(void) const |
| { |
| LOGD(" EndOfCentralDir contents:\n"); |
| LOGD(" diskNum=%u diskWCD=%u numEnt=%u totalNumEnt=%u\n", |
| mDiskNumber, mDiskWithCentralDir, mNumEntries, mTotalNumEntries); |
| LOGD(" centDirSize=%lu centDirOff=%lu commentLen=%u\n", |
| mCentralDirSize, mCentralDirOffset, mCommentLen); |
| } |
| |