blob: eca3ffee0c9b90680c8e6ac9cd6e3679c0d6af1f [file] [log] [blame]
Narayan Kamath7462f022013-11-21 13:05:04 +00001/*
2 * Copyright (C) 2008 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17/*
18 * Read-only access to Zip archives, with minimal heap allocation.
19 */
Narayan Kamath7462f022013-11-21 13:05:04 +000020
Mark Salyzyncfd5b082016-10-17 14:28:00 -070021#define LOG_TAG "ziparchive"
22
Narayan Kamath7462f022013-11-21 13:05:04 +000023#include <assert.h>
24#include <errno.h>
Mark Salyzyn99ef9912014-03-14 14:26:22 -070025#include <fcntl.h>
26#include <inttypes.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000027#include <limits.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000028#include <stdlib.h>
29#include <string.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000030#include <unistd.h>
31
Dan Albert1ae07642015-04-09 14:11:18 -070032#include <memory>
33#include <vector>
34
Mark Salyzynff2dcd92016-09-28 15:54:45 -070035#include <android-base/file.h>
36#include <android-base/logging.h>
37#include <android-base/macros.h> // TEMP_FAILURE_RETRY may or may not be in unistd
38#include <android-base/memory.h>
Mark Salyzyncfd5b082016-10-17 14:28:00 -070039#include <log/log.h>
Mark Salyzynff2dcd92016-09-28 15:54:45 -070040#include <utils/Compat.h>
41#include <utils/FileMap.h>
Christopher Ferrise6884ce2015-11-10 14:55:12 -080042#include "ziparchive/zip_archive.h"
Dan Albert1ae07642015-04-09 14:11:18 -070043#include "zlib.h"
Narayan Kamath7462f022013-11-21 13:05:04 +000044
Narayan Kamath044bc8e2014-12-03 18:22:53 +000045#include "entry_name_utils-inl.h"
Adam Lesinskiad4ad8c2015-10-05 18:16:18 -070046#include "zip_archive_common.h"
Christopher Ferrise6884ce2015-11-10 14:55:12 -080047#include "zip_archive_private.h"
Mark Salyzyn99ef9912014-03-14 14:26:22 -070048
Dan Albert1ae07642015-04-09 14:11:18 -070049using android::base::get_unaligned;
Narayan Kamath044bc8e2014-12-03 18:22:53 +000050
Narayan Kamath162b7052017-06-05 13:21:12 +010051// Used to turn on crc checks - verify that the content CRC matches the values
52// specified in the local file header and the central directory.
53static const bool kCrcChecksEnabled = false;
54
Narayan Kamath926973e2014-06-09 14:18:14 +010055// This is for windows. If we don't open a file in binary mode, weird
Narayan Kamath7462f022013-11-21 13:05:04 +000056// things will happen.
57#ifndef O_BINARY
58#define O_BINARY 0
59#endif
60
Narayan Kamath926973e2014-06-09 14:18:14 +010061// The maximum number of bytes to scan backwards for the EOCD start.
62static const uint32_t kMaxEOCDSearch = kMaxCommentLen + sizeof(EocdRecord);
63
// Human readable descriptions of the error codes declared below. The table is
// ordered so that the entry at index N corresponds to the code with value -N.
static const char* kErrorMessages[] = {
    "Unknown return code.",
    "Iteration ended",
    "Zlib error",
    "Invalid file",
    "Invalid handle",
    "Duplicate entries in archive",
    "Empty archive",
    "Entry not found",
    "Invalid offset",
    "Inconsistent information",
    "Invalid entry name",
    "I/O Error",
    "File mapping failed"
};

// Exclusive upper bound of the error code range.
static constexpr int32_t kErrorMessageUpperBound = 0;

// Iteration over the archive has ended.
static constexpr int32_t kIterationEnd = -1;

// Zlib reported an error while inflating a stream from this file. Usually
// indicates file corruption.
static constexpr int32_t kZlibError = -2;

// The input file cannot be processed as a zip archive, usually because it is
// too small, too large or does not have a valid signature.
static constexpr int32_t kInvalidFile = -3;

// An invalid iteration / ziparchive handle was passed in as an input
// argument.
static constexpr int32_t kInvalidHandle = -4;

// The zip archive contained two (or possibly more) entries with the same
// name.
static constexpr int32_t kDuplicateEntry = -5;

// The zip archive contains no entries.
static constexpr int32_t kEmptyArchive = -6;

// The specified entry was not found in the archive.
static constexpr int32_t kEntryNotFound = -7;

// The zip archive contained an invalid local file header pointer.
static constexpr int32_t kInvalidOffset = -8;

// The zip archive contained inconsistent entry information: either the
// central directory and the local file header did not agree, or the actual
// uncompressed length or crc32 did not match the declared values.
static constexpr int32_t kInconsistentInformation = -9;

// An invalid entry name was encountered.
static constexpr int32_t kInvalidEntryName = -10;

// An I/O related system call (read, lseek, ftruncate, map) failed.
static constexpr int32_t kIoError = -11;

// The central directory or the entry contents could not be mmapped.
static constexpr int32_t kMmapFailed = -12;

// Exclusive lower bound of the error code range.
static constexpr int32_t kErrorMessageLowerBound = -13;
Narayan Kamath7462f022013-11-21 13:05:04 +0000125
Narayan Kamath7462f022013-11-21 13:05:04 +0000126/*
127 * A Read-only Zip archive.
128 *
129 * We want "open" and "find entry by name" to be fast operations, and
130 * we want to use as little memory as possible. We memory-map the zip
131 * central directory, and load a hash table with pointers to the filenames
132 * (which aren't null-terminated). The other fields are at a fixed offset
133 * from the filename, so we don't need to extract those (but we do need
134 * to byte-read and endian-swap them every time we want them).
135 *
136 * It's possible that somebody has handed us a massive (~1GB) zip archive,
137 * so we can't expect to mmap the entire file.
138 *
139 * To speed comparisons when doing a lookup by name, we could make the mapping
140 * "private" (copy-on-write) and null-terminate the filenames after verifying
141 * the record structure. However, this requires a private mapping of
142 * every page that the Central Directory touches. Easier to tuck a copy
143 * of the string length into the hash table entry.
144 */
Narayan Kamath7462f022013-11-21 13:05:04 +0000145
/*
 * Returns the smallest power of 2 that is greater than or equal to |val|.
 * Inputs of 0 and inputs above 2^31 wrap around and yield 0.
 *
 * Technique from http://graphics.stanford.edu/~seander/bithacks.html.
 */
static uint32_t RoundUpPower2(uint32_t val) {
  // Copy the highest set bit of (val - 1) into every lower bit position by
  // or-ing in shifts of 1, 2, 4, 8 and 16; adding one then gives the result.
  uint32_t smeared = val - 1;
  for (uint32_t shift = 1; shift < 32; shift <<= 1) {
    smeared |= smeared >> shift;
  }
  return smeared + 1;
}
162
Yusuke Sato07447542015-06-25 14:39:19 -0700163static uint32_t ComputeHash(const ZipString& name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000164 uint32_t hash = 0;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100165 uint16_t len = name.name_length;
166 const uint8_t* str = name.name;
Narayan Kamath7462f022013-11-21 13:05:04 +0000167
168 while (len--) {
169 hash = hash * 31 + *str++;
170 }
171
172 return hash;
173}
174
175/*
176 * Convert a ZipEntry to a hash table index, verifying that it's in a
177 * valid range.
178 */
Yusuke Sato07447542015-06-25 14:39:19 -0700179static int64_t EntryToIndex(const ZipString* hash_table,
Narayan Kamath7462f022013-11-21 13:05:04 +0000180 const uint32_t hash_table_size,
Yusuke Sato07447542015-06-25 14:39:19 -0700181 const ZipString& name) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100182 const uint32_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000183
184 // NOTE: (hash_table_size - 1) is guaranteed to be non-negative.
185 uint32_t ent = hash & (hash_table_size - 1);
186 while (hash_table[ent].name != NULL) {
Yusuke Sato07447542015-06-25 14:39:19 -0700187 if (hash_table[ent] == name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000188 return ent;
189 }
190
191 ent = (ent + 1) & (hash_table_size - 1);
192 }
193
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100194 ALOGV("Zip: Unable to find entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000195 return kEntryNotFound;
196}
197
198/*
199 * Add a new entry to the hash table.
200 */
Yusuke Sato07447542015-06-25 14:39:19 -0700201static int32_t AddToHash(ZipString *hash_table, const uint64_t hash_table_size,
202 const ZipString& name) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100203 const uint64_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000204 uint32_t ent = hash & (hash_table_size - 1);
205
206 /*
207 * We over-allocated the table, so we're guaranteed to find an empty slot.
208 * Further, we guarantee that the hashtable size is not 0.
209 */
210 while (hash_table[ent].name != NULL) {
Yusuke Sato07447542015-06-25 14:39:19 -0700211 if (hash_table[ent] == name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000212 // We've found a duplicate entry. We don't accept it
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100213 ALOGW("Zip: Found duplicate entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000214 return kDuplicateEntry;
215 }
216 ent = (ent + 1) & (hash_table_size - 1);
217 }
218
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100219 hash_table[ent].name = name.name;
220 hash_table[ent].name_length = name.name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000221 return 0;
222}
223
Tianjie Xu18c25922016-09-29 15:27:41 -0700224static int32_t MapCentralDirectory0(const char* debug_file_name, ZipArchive* archive,
225 off64_t file_length, off64_t read_amount,
226 uint8_t* scan_buffer) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000227 const off64_t search_start = file_length - read_amount;
228
Tianjie Xu18c25922016-09-29 15:27:41 -0700229 if(!archive->mapped_zip.ReadAtOffset(scan_buffer, read_amount, search_start)) {
230 ALOGE("Zip: read %" PRId64 " from offset %" PRId64 " failed",
231 static_cast<int64_t>(read_amount), static_cast<int64_t>(search_start));
Narayan Kamath7462f022013-11-21 13:05:04 +0000232 return kIoError;
233 }
234
235 /*
236 * Scan backward for the EOCD magic. In an archive without a trailing
237 * comment, we'll find it on the first try. (We may want to consider
238 * doing an initial minimal read; if we don't find it, retry with a
239 * second read as above.)
240 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100241 int i = read_amount - sizeof(EocdRecord);
242 for (; i >= 0; i--) {
Dan Albert1ae07642015-04-09 14:11:18 -0700243 if (scan_buffer[i] == 0x50) {
244 uint32_t* sig_addr = reinterpret_cast<uint32_t*>(&scan_buffer[i]);
245 if (get_unaligned<uint32_t>(sig_addr) == EocdRecord::kSignature) {
246 ALOGV("+++ Found EOCD at buf+%d", i);
247 break;
248 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000249 }
250 }
251 if (i < 0) {
252 ALOGD("Zip: EOCD not found, %s is not zip", debug_file_name);
253 return kInvalidFile;
254 }
255
256 const off64_t eocd_offset = search_start + i;
Narayan Kamath926973e2014-06-09 14:18:14 +0100257 const EocdRecord* eocd = reinterpret_cast<const EocdRecord*>(scan_buffer + i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000258 /*
Narayan Kamath926973e2014-06-09 14:18:14 +0100259 * Verify that there's no trailing space at the end of the central directory
260 * and its comment.
Narayan Kamath7462f022013-11-21 13:05:04 +0000261 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100262 const off64_t calculated_length = eocd_offset + sizeof(EocdRecord)
263 + eocd->comment_length;
264 if (calculated_length != file_length) {
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100265 ALOGW("Zip: %" PRId64 " extraneous bytes at the end of the central directory",
Narayan Kamath926973e2014-06-09 14:18:14 +0100266 static_cast<int64_t>(file_length - calculated_length));
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100267 return kInvalidFile;
268 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000269
Narayan Kamath926973e2014-06-09 14:18:14 +0100270 /*
271 * Grab the CD offset and size, and the number of entries in the
272 * archive and verify that they look reasonable.
273 */
Tianjie Xu1ee48922016-09-21 14:58:11 -0700274 if (static_cast<off64_t>(eocd->cd_start_offset) + eocd->cd_size > eocd_offset) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100275 ALOGW("Zip: bad offsets (dir %" PRIu32 ", size %" PRIu32 ", eocd %" PRId64 ")",
276 eocd->cd_start_offset, eocd->cd_size, static_cast<int64_t>(eocd_offset));
Tianjie Xu1ee48922016-09-21 14:58:11 -0700277#if defined(__ANDROID__)
278 if (eocd->cd_start_offset + eocd->cd_size <= eocd_offset) {
279 android_errorWriteLog(0x534e4554, "31251826");
280 }
281#endif
Narayan Kamath7462f022013-11-21 13:05:04 +0000282 return kInvalidOffset;
283 }
Narayan Kamath926973e2014-06-09 14:18:14 +0100284 if (eocd->num_records == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000285 ALOGW("Zip: empty archive?");
286 return kEmptyArchive;
287 }
288
Elliott Hughese49236b2015-06-04 15:21:59 -0700289 ALOGV("+++ num_entries=%" PRIu32 " dir_size=%" PRIu32 " dir_offset=%" PRIu32,
Narayan Kamath926973e2014-06-09 14:18:14 +0100290 eocd->num_records, eocd->cd_size, eocd->cd_start_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000291
292 /*
293 * It all looks good. Create a mapping for the CD, and set the fields
294 * in archive.
295 */
Tianjie Xu18c25922016-09-29 15:27:41 -0700296
297 if (!archive->InitializeCentralDirectory(debug_file_name,
298 static_cast<off64_t>(eocd->cd_start_offset),
299 static_cast<size_t>(eocd->cd_size))) {
300 ALOGE("Zip: failed to intialize central directory.\n");
Narayan Kamatheaf98852013-12-11 14:51:51 +0000301 return kMmapFailed;
Narayan Kamath7462f022013-11-21 13:05:04 +0000302 }
303
Narayan Kamath926973e2014-06-09 14:18:14 +0100304 archive->num_entries = eocd->num_records;
305 archive->directory_offset = eocd->cd_start_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000306
307 return 0;
308}
309
310/*
311 * Find the zip Central Directory and memory-map it.
312 *
313 * On success, returns 0 after populating fields from the EOCD area:
314 * directory_offset
Tianjie Xu18c25922016-09-29 15:27:41 -0700315 * directory_ptr
Narayan Kamath7462f022013-11-21 13:05:04 +0000316 * num_entries
317 */
Tianjie Xu18c25922016-09-29 15:27:41 -0700318static int32_t MapCentralDirectory(const char* debug_file_name, ZipArchive* archive) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000319
320 // Test file length. We use lseek64 to make sure the file
321 // is small enough to be a zip file (Its size must be less than
322 // 0xffffffff bytes).
Tianjie Xu18c25922016-09-29 15:27:41 -0700323 off64_t file_length = archive->mapped_zip.GetFileLength();
Narayan Kamath7462f022013-11-21 13:05:04 +0000324 if (file_length == -1) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000325 return kInvalidFile;
326 }
327
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800328 if (file_length > static_cast<off64_t>(0xffffffff)) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100329 ALOGV("Zip: zip file too long %" PRId64, static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000330 return kInvalidFile;
331 }
332
Narayan Kamath926973e2014-06-09 14:18:14 +0100333 if (file_length < static_cast<off64_t>(sizeof(EocdRecord))) {
334 ALOGV("Zip: length %" PRId64 " is too small to be zip", static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000335 return kInvalidFile;
336 }
337
338 /*
339 * Perform the traditional EOCD snipe hunt.
340 *
341 * We're searching for the End of Central Directory magic number,
342 * which appears at the start of the EOCD block. It's followed by
343 * 18 bytes of EOCD stuff and up to 64KB of archive comment. We
344 * need to read the last part of the file into a buffer, dig through
345 * it to find the magic number, parse some values out, and use those
346 * to determine the extent of the CD.
347 *
348 * We start by pulling in the last part of the file.
349 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100350 off64_t read_amount = kMaxEOCDSearch;
351 if (file_length < read_amount) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000352 read_amount = file_length;
353 }
354
Tianjie Xu18c25922016-09-29 15:27:41 -0700355 std::vector<uint8_t> scan_buffer(read_amount);
356 int32_t result = MapCentralDirectory0(debug_file_name, archive, file_length, read_amount,
357 scan_buffer.data());
Narayan Kamath7462f022013-11-21 13:05:04 +0000358 return result;
359}
360
361/*
362 * Parses the Zip archive's Central Directory. Allocates and populates the
363 * hash table.
364 *
365 * Returns 0 on success.
366 */
367static int32_t ParseZipArchive(ZipArchive* archive) {
Tianjie Xu18c25922016-09-29 15:27:41 -0700368 const uint8_t* const cd_ptr = archive->central_directory.GetBasePtr();
369 const size_t cd_length = archive->central_directory.GetMapLength();
Narayan Kamath926973e2014-06-09 14:18:14 +0100370 const uint16_t num_entries = archive->num_entries;
Narayan Kamath7462f022013-11-21 13:05:04 +0000371
372 /*
373 * Create hash table. We have a minimum 75% load factor, possibly as
374 * low as 50% after we round off to a power of 2. There must be at
375 * least one unused entry to avoid an infinite loop during creation.
376 */
377 archive->hash_table_size = RoundUpPower2(1 + (num_entries * 4) / 3);
Yusuke Sato07447542015-06-25 14:39:19 -0700378 archive->hash_table = reinterpret_cast<ZipString*>(calloc(archive->hash_table_size,
379 sizeof(ZipString)));
Narayan Kamath7462f022013-11-21 13:05:04 +0000380
381 /*
382 * Walk through the central directory, adding entries to the hash
383 * table and verifying values.
384 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100385 const uint8_t* const cd_end = cd_ptr + cd_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000386 const uint8_t* ptr = cd_ptr;
387 for (uint16_t i = 0; i < num_entries; i++) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100388 const CentralDirectoryRecord* cdr =
389 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
390 if (cdr->record_signature != CentralDirectoryRecord::kSignature) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700391 ALOGW("Zip: missed a central dir sig (at %" PRIu16 ")", i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800392 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000393 }
394
Narayan Kamath926973e2014-06-09 14:18:14 +0100395 if (ptr + sizeof(CentralDirectoryRecord) > cd_end) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700396 ALOGW("Zip: ran off the end (at %" PRIu16 ")", i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800397 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000398 }
399
Narayan Kamath926973e2014-06-09 14:18:14 +0100400 const off64_t local_header_offset = cdr->local_file_header_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000401 if (local_header_offset >= archive->directory_offset) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800402 ALOGW("Zip: bad LFH offset %" PRId64 " at entry %" PRIu16,
403 static_cast<int64_t>(local_header_offset), i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800404 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000405 }
406
Narayan Kamath926973e2014-06-09 14:18:14 +0100407 const uint16_t file_name_length = cdr->file_name_length;
408 const uint16_t extra_length = cdr->extra_field_length;
409 const uint16_t comment_length = cdr->comment_length;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100410 const uint8_t* file_name = ptr + sizeof(CentralDirectoryRecord);
411
Narayan Kamath044bc8e2014-12-03 18:22:53 +0000412 /* check that file name is valid UTF-8 and doesn't contain NUL (U+0000) characters */
413 if (!IsValidEntryName(file_name, file_name_length)) {
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800414 return -1;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100415 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000416
417 /* add the CDE filename to the hash table */
Yusuke Sato07447542015-06-25 14:39:19 -0700418 ZipString entry_name;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100419 entry_name.name = file_name;
420 entry_name.name_length = file_name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000421 const int add_result = AddToHash(archive->hash_table,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100422 archive->hash_table_size, entry_name);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800423 if (add_result != 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000424 ALOGW("Zip: Error adding entry to hash table %d", add_result);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800425 return add_result;
Narayan Kamath7462f022013-11-21 13:05:04 +0000426 }
427
Narayan Kamath926973e2014-06-09 14:18:14 +0100428 ptr += sizeof(CentralDirectoryRecord) + file_name_length + extra_length + comment_length;
429 if ((ptr - cd_ptr) > static_cast<int64_t>(cd_length)) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700430 ALOGW("Zip: bad CD advance (%tu vs %zu) at entry %" PRIu16,
431 ptr - cd_ptr, cd_length, i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800432 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000433 }
434 }
Mark Salyzyn088bf902014-05-08 16:02:20 -0700435 ALOGV("+++ zip good scan %" PRIu16 " entries", num_entries);
Narayan Kamath7462f022013-11-21 13:05:04 +0000436
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800437 return 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000438}
439
440static int32_t OpenArchiveInternal(ZipArchive* archive,
441 const char* debug_file_name) {
442 int32_t result = -1;
Tianjie Xu18c25922016-09-29 15:27:41 -0700443 if ((result = MapCentralDirectory(debug_file_name, archive)) != 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000444 return result;
445 }
446
447 if ((result = ParseZipArchive(archive))) {
448 return result;
449 }
450
451 return 0;
452}
453
454int32_t OpenArchiveFd(int fd, const char* debug_file_name,
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700455 ZipArchiveHandle* handle, bool assume_ownership) {
456 ZipArchive* archive = new ZipArchive(fd, assume_ownership);
Narayan Kamath7462f022013-11-21 13:05:04 +0000457 *handle = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000458 return OpenArchiveInternal(archive, debug_file_name);
459}
460
461int32_t OpenArchive(const char* fileName, ZipArchiveHandle* handle) {
Neil Fullerb1a113f2014-07-25 14:43:04 +0100462 const int fd = open(fileName, O_RDONLY | O_BINARY, 0);
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700463 ZipArchive* archive = new ZipArchive(fd, true);
Narayan Kamath7462f022013-11-21 13:05:04 +0000464 *handle = archive;
465
Narayan Kamath7462f022013-11-21 13:05:04 +0000466 if (fd < 0) {
467 ALOGW("Unable to open '%s': %s", fileName, strerror(errno));
468 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000469 }
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700470
Narayan Kamath7462f022013-11-21 13:05:04 +0000471 return OpenArchiveInternal(archive, fileName);
472}
473
Tianjie Xu18c25922016-09-29 15:27:41 -0700474int32_t OpenArchiveFromMemory(void* address, size_t length, const char* debug_file_name,
475 ZipArchiveHandle *handle) {
476 ZipArchive* archive = new ZipArchive(address, length);
477 *handle = archive;
478 return OpenArchiveInternal(archive, debug_file_name);
479}
480
Narayan Kamath7462f022013-11-21 13:05:04 +0000481/*
482 * Close a ZipArchive, closing the file and freeing the contents.
483 */
484void CloseArchive(ZipArchiveHandle handle) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800485 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +0000486 ALOGV("Closing archive %p", archive);
Neil Fullerb1a113f2014-07-25 14:43:04 +0100487 delete archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000488}
489
Narayan Kamath162b7052017-06-05 13:21:12 +0100490static int32_t ValidateDataDescriptor(MappedZipFile& mapped_zip, ZipEntry* entry) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100491 uint8_t ddBuf[sizeof(DataDescriptor) + sizeof(DataDescriptor::kOptSignature)];
Tianjie Xu18c25922016-09-29 15:27:41 -0700492 if (!mapped_zip.ReadData(ddBuf, sizeof(ddBuf))) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000493 return kIoError;
494 }
495
Narayan Kamath926973e2014-06-09 14:18:14 +0100496 const uint32_t ddSignature = *(reinterpret_cast<const uint32_t*>(ddBuf));
497 const uint16_t offset = (ddSignature == DataDescriptor::kOptSignature) ? 4 : 0;
498 const DataDescriptor* descriptor = reinterpret_cast<const DataDescriptor*>(ddBuf + offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000499
Narayan Kamath162b7052017-06-05 13:21:12 +0100500 // Validate that the values in the data descriptor match those in the central
501 // directory.
502 if (entry->compressed_length != descriptor->compressed_size ||
503 entry->uncompressed_length != descriptor->uncompressed_size ||
504 entry->crc32 != descriptor->crc32) {
505 ALOGW("Zip: size/crc32 mismatch. expected {%" PRIu32 ", %" PRIu32 ", %" PRIx32
506 "}, was {%" PRIu32 ", %" PRIu32 ", %" PRIx32 "}",
507 entry->compressed_length, entry->uncompressed_length, entry->crc32,
508 descriptor->compressed_size, descriptor->uncompressed_size, descriptor->crc32);
509 return kInconsistentInformation;
510 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000511
512 return 0;
513}
514
Narayan Kamath7462f022013-11-21 13:05:04 +0000515static int32_t FindEntry(const ZipArchive* archive, const int ent,
516 ZipEntry* data) {
517 const uint16_t nameLen = archive->hash_table[ent].name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000518
519 // Recover the start of the central directory entry from the filename
520 // pointer. The filename is the first entry past the fixed-size data,
521 // so we can just subtract back from that.
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100522 const uint8_t* ptr = archive->hash_table[ent].name;
Narayan Kamath926973e2014-06-09 14:18:14 +0100523 ptr -= sizeof(CentralDirectoryRecord);
Narayan Kamath7462f022013-11-21 13:05:04 +0000524
525 // This is the base of our mmapped region, we have to sanity check that
526 // the name that's in the hash table is a pointer to a location within
527 // this mapped region.
Tianjie Xu18c25922016-09-29 15:27:41 -0700528 const uint8_t* base_ptr = archive->central_directory.GetBasePtr();
529 if (ptr < base_ptr || ptr > base_ptr + archive->central_directory.GetMapLength()) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000530 ALOGW("Zip: Invalid entry pointer");
531 return kInvalidOffset;
532 }
533
Narayan Kamath926973e2014-06-09 14:18:14 +0100534 const CentralDirectoryRecord *cdr =
535 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
536
Narayan Kamath7462f022013-11-21 13:05:04 +0000537 // The offset of the start of the central directory in the zipfile.
538 // We keep this lying around so that we can sanity check all our lengths
539 // and our per-file structures.
540 const off64_t cd_offset = archive->directory_offset;
541
542 // Fill out the compression method, modification time, crc32
543 // and other interesting attributes from the central directory. These
544 // will later be compared against values from the local file header.
Narayan Kamath926973e2014-06-09 14:18:14 +0100545 data->method = cdr->compression_method;
beonit0e99a2f2015-07-18 02:08:16 +0900546 data->mod_time = cdr->last_mod_date << 16 | cdr->last_mod_time;
Narayan Kamath926973e2014-06-09 14:18:14 +0100547 data->crc32 = cdr->crc32;
548 data->compressed_length = cdr->compressed_size;
549 data->uncompressed_length = cdr->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000550
551 // Figure out the local header offset from the central directory. The
552 // actual file data will begin after the local header and the name /
553 // extra comments.
Narayan Kamath926973e2014-06-09 14:18:14 +0100554 const off64_t local_header_offset = cdr->local_file_header_offset;
555 if (local_header_offset + static_cast<off64_t>(sizeof(LocalFileHeader)) >= cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000556 ALOGW("Zip: bad local hdr offset in zip");
557 return kInvalidOffset;
558 }
559
Narayan Kamath926973e2014-06-09 14:18:14 +0100560 uint8_t lfh_buf[sizeof(LocalFileHeader)];
Tianjie Xu18c25922016-09-29 15:27:41 -0700561 if (!archive->mapped_zip.ReadAtOffset(lfh_buf, sizeof(lfh_buf), local_header_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800562 ALOGW("Zip: failed reading lfh name from offset %" PRId64,
563 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000564 return kIoError;
565 }
566
Narayan Kamath926973e2014-06-09 14:18:14 +0100567 const LocalFileHeader *lfh = reinterpret_cast<const LocalFileHeader*>(lfh_buf);
568
569 if (lfh->lfh_signature != LocalFileHeader::kSignature) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -0700570 ALOGW("Zip: didn't find signature at start of lfh, offset=%" PRId64,
Narayan Kamath926973e2014-06-09 14:18:14 +0100571 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000572 return kInvalidOffset;
573 }
574
575 // Paranoia: Match the values specified in the local file header
576 // to those specified in the central directory.
Adam Lesinskid987c9d2017-04-06 18:55:47 -0700577
Narayan Kamath162b7052017-06-05 13:21:12 +0100578 // Warn if central directory and local file header don't agree on the use
579 // of a trailing Data Descriptor. The reference implementation is inconsistent
580 // and appears to use the LFH value during extraction (unzip) but the CD value
581 // while displaying information about archives (zipinfo). The spec remains
582 // silent on this inconsistency as well.
583 //
584 // For now, always use the version from the LFH but make sure that the values
585 // specified in the central directory match those in the data descriptor.
586 //
587 // NOTE: It's also worth noting that unzip *does* warn about inconsistencies in
588 // bit 11 (EFS: The language encoding flag, marking that filename and comment are
589 // encoded using UTF-8). This implementation does not check for the presence of
590 // that flag and always enforces that entry names are valid UTF-8.
591 if ((lfh->gpb_flags & kGPBDDFlagMask) != (cdr->gpb_flags & kGPBDDFlagMask)) {
592 ALOGW("Zip: gpb flag mismatch at bit 3. expected {%04" PRIx16 "}, was {%04" PRIx16 "}",
Adam Lesinskid987c9d2017-04-06 18:55:47 -0700593 cdr->gpb_flags, lfh->gpb_flags);
Adam Lesinskid987c9d2017-04-06 18:55:47 -0700594 }
595
596 // If there is no trailing data descriptor, verify that the central directory and local file
597 // header agree on the crc, compressed, and uncompressed sizes of the entry.
Narayan Kamath926973e2014-06-09 14:18:14 +0100598 if ((lfh->gpb_flags & kGPBDDFlagMask) == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000599 data->has_data_descriptor = 0;
Narayan Kamath926973e2014-06-09 14:18:14 +0100600 if (data->compressed_length != lfh->compressed_size
601 || data->uncompressed_length != lfh->uncompressed_size
602 || data->crc32 != lfh->crc32) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700603 ALOGW("Zip: size/crc32 mismatch. expected {%" PRIu32 ", %" PRIu32
604 ", %" PRIx32 "}, was {%" PRIu32 ", %" PRIu32 ", %" PRIx32 "}",
Narayan Kamath7462f022013-11-21 13:05:04 +0000605 data->compressed_length, data->uncompressed_length, data->crc32,
Narayan Kamath926973e2014-06-09 14:18:14 +0100606 lfh->compressed_size, lfh->uncompressed_size, lfh->crc32);
Narayan Kamath7462f022013-11-21 13:05:04 +0000607 return kInconsistentInformation;
608 }
609 } else {
610 data->has_data_descriptor = 1;
611 }
612
613 // Check that the local file header name matches the declared
614 // name in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100615 if (lfh->file_name_length == nameLen) {
616 const off64_t name_offset = local_header_offset + sizeof(LocalFileHeader);
Mykola Kondratenko50afc152014-09-08 12:46:37 +0200617 if (name_offset + lfh->file_name_length > cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000618 ALOGW("Zip: Invalid declared length");
619 return kInvalidOffset;
620 }
621
Tianjie Xu18c25922016-09-29 15:27:41 -0700622 std::vector<uint8_t> name_buf(nameLen);
623 if (!archive->mapped_zip.ReadAtOffset(name_buf.data(), nameLen, name_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800624 ALOGW("Zip: failed reading lfh name from offset %" PRId64, static_cast<int64_t>(name_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000625 return kIoError;
626 }
627
Tianjie Xu18c25922016-09-29 15:27:41 -0700628 if (memcmp(archive->hash_table[ent].name, name_buf.data(), nameLen)) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000629 return kInconsistentInformation;
630 }
631
Narayan Kamath7462f022013-11-21 13:05:04 +0000632 } else {
633 ALOGW("Zip: lfh name did not match central directory.");
634 return kInconsistentInformation;
635 }
636
Narayan Kamath926973e2014-06-09 14:18:14 +0100637 const off64_t data_offset = local_header_offset + sizeof(LocalFileHeader)
638 + lfh->file_name_length + lfh->extra_field_length;
Narayan Kamath48953a12014-01-24 12:32:39 +0000639 if (data_offset > cd_offset) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800640 ALOGW("Zip: bad data offset %" PRId64 " in zip", static_cast<int64_t>(data_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000641 return kInvalidOffset;
642 }
643
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800644 if (static_cast<off64_t>(data_offset + data->compressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700645 ALOGW("Zip: bad compressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800646 static_cast<int64_t>(data_offset), data->compressed_length, static_cast<int64_t>(cd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000647 return kInvalidOffset;
648 }
649
650 if (data->method == kCompressStored &&
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800651 static_cast<off64_t>(data_offset + data->uncompressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700652 ALOGW("Zip: bad uncompressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800653 static_cast<int64_t>(data_offset), data->uncompressed_length,
654 static_cast<int64_t>(cd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000655 return kInvalidOffset;
656 }
657
658 data->offset = data_offset;
659 return 0;
660}
661
662struct IterationHandle {
663 uint32_t position;
Piotr Jastrzebski10aa9a02014-08-19 09:01:20 +0100664 // We're not using vector here because this code is used in the Windows SDK
665 // where the STL is not available.
Yusuke Sato07447542015-06-25 14:39:19 -0700666 ZipString prefix;
667 ZipString suffix;
Narayan Kamath7462f022013-11-21 13:05:04 +0000668 ZipArchive* archive;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100669
Yusuke Sato07447542015-06-25 14:39:19 -0700670 IterationHandle(const ZipString* in_prefix,
671 const ZipString* in_suffix) {
672 if (in_prefix) {
673 uint8_t* name_copy = new uint8_t[in_prefix->name_length];
674 memcpy(name_copy, in_prefix->name, in_prefix->name_length);
675 prefix.name = name_copy;
676 prefix.name_length = in_prefix->name_length;
677 } else {
678 prefix.name = NULL;
679 prefix.name_length = 0;
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700680 }
Yusuke Sato07447542015-06-25 14:39:19 -0700681 if (in_suffix) {
682 uint8_t* name_copy = new uint8_t[in_suffix->name_length];
683 memcpy(name_copy, in_suffix->name, in_suffix->name_length);
684 suffix.name = name_copy;
685 suffix.name_length = in_suffix->name_length;
686 } else {
687 suffix.name = NULL;
688 suffix.name_length = 0;
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700689 }
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100690 }
691
692 ~IterationHandle() {
Yusuke Sato07447542015-06-25 14:39:19 -0700693 delete[] prefix.name;
694 delete[] suffix.name;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100695 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000696};
697
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100698int32_t StartIteration(ZipArchiveHandle handle, void** cookie_ptr,
Yusuke Sato07447542015-06-25 14:39:19 -0700699 const ZipString* optional_prefix,
700 const ZipString* optional_suffix) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800701 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +0000702
703 if (archive == NULL || archive->hash_table == NULL) {
704 ALOGW("Zip: Invalid ZipArchiveHandle");
705 return kInvalidHandle;
706 }
707
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700708 IterationHandle* cookie = new IterationHandle(optional_prefix, optional_suffix);
Narayan Kamath7462f022013-11-21 13:05:04 +0000709 cookie->position = 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000710 cookie->archive = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000711
712 *cookie_ptr = cookie ;
713 return 0;
714}
715
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100716void EndIteration(void* cookie) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100717 delete reinterpret_cast<IterationHandle*>(cookie);
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100718}
719
Yusuke Sato07447542015-06-25 14:39:19 -0700720int32_t FindEntry(const ZipArchiveHandle handle, const ZipString& entryName,
Narayan Kamath7462f022013-11-21 13:05:04 +0000721 ZipEntry* data) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800722 const ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100723 if (entryName.name_length == 0) {
724 ALOGW("Zip: Invalid filename %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000725 return kInvalidEntryName;
726 }
727
728 const int64_t ent = EntryToIndex(archive->hash_table,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100729 archive->hash_table_size, entryName);
Narayan Kamath7462f022013-11-21 13:05:04 +0000730
731 if (ent < 0) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100732 ALOGV("Zip: Could not find entry %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000733 return ent;
734 }
735
736 return FindEntry(archive, ent, data);
737}
738
Yusuke Sato07447542015-06-25 14:39:19 -0700739int32_t Next(void* cookie, ZipEntry* data, ZipString* name) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800740 IterationHandle* handle = reinterpret_cast<IterationHandle*>(cookie);
Narayan Kamath7462f022013-11-21 13:05:04 +0000741 if (handle == NULL) {
742 return kInvalidHandle;
743 }
744
745 ZipArchive* archive = handle->archive;
746 if (archive == NULL || archive->hash_table == NULL) {
747 ALOGW("Zip: Invalid ZipArchiveHandle");
748 return kInvalidHandle;
749 }
750
751 const uint32_t currentOffset = handle->position;
752 const uint32_t hash_table_length = archive->hash_table_size;
Yusuke Sato07447542015-06-25 14:39:19 -0700753 const ZipString* hash_table = archive->hash_table;
Narayan Kamath7462f022013-11-21 13:05:04 +0000754
755 for (uint32_t i = currentOffset; i < hash_table_length; ++i) {
756 if (hash_table[i].name != NULL &&
Yusuke Sato07447542015-06-25 14:39:19 -0700757 (handle->prefix.name_length == 0 ||
758 hash_table[i].StartsWith(handle->prefix)) &&
759 (handle->suffix.name_length == 0 ||
760 hash_table[i].EndsWith(handle->suffix))) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000761 handle->position = (i + 1);
762 const int error = FindEntry(archive, i, data);
763 if (!error) {
764 name->name = hash_table[i].name;
765 name->name_length = hash_table[i].name_length;
766 }
767
768 return error;
769 }
770 }
771
772 handle->position = 0;
773 return kIterationEnd;
774}
775
// Abstract sink for extracted entry data. Implementations receive the data
// in consecutive chunks through Append() and return false to signal that a
// chunk could not be consumed. Writers can only be created by subclasses and
// cannot be copied or assigned.
class Writer {
 public:
  virtual ~Writer() {}

  // Consumes |buf_size| bytes starting at |buf|. Returns true on success.
  virtual bool Append(uint8_t* buf, size_t buf_size) = 0;

 protected:
  Writer() = default;

 private:
  Writer(const Writer&) = delete;
  void operator=(const Writer&) = delete;
};
785
786// A Writer that writes data to a fixed size memory region.
787// The size of the memory region must be equal to the total size of
788// the data appended to it.
789class MemoryWriter : public Writer {
790 public:
791 MemoryWriter(uint8_t* buf, size_t size) : Writer(),
792 buf_(buf), size_(size), bytes_written_(0) {
793 }
794
795 virtual bool Append(uint8_t* buf, size_t buf_size) override {
796 if (bytes_written_ + buf_size > size_) {
797 ALOGW("Zip: Unexpected size " ZD " (declared) vs " ZD " (actual)",
798 size_, bytes_written_ + buf_size);
799 return false;
800 }
801
802 memcpy(buf_ + bytes_written_, buf, buf_size);
803 bytes_written_ += buf_size;
804 return true;
805 }
806
807 private:
808 uint8_t* const buf_;
809 const size_t size_;
810 size_t bytes_written_;
811};
812
813// A Writer that appends data to a file |fd| at its current position.
814// The file will be truncated to the end of the written data.
815class FileWriter : public Writer {
816 public:
817
818 // Creates a FileWriter for |fd| and prepare to write |entry| to it,
819 // guaranteeing that the file descriptor is valid and that there's enough
820 // space on the volume to write out the entry completely and that the file
Tao Baoa456c212016-11-15 10:08:07 -0800821 // is truncated to the correct length (no truncation if |fd| references a
822 // block device).
Narayan Kamathf899bd52015-04-17 11:53:14 +0100823 //
824 // Returns a valid FileWriter on success, |nullptr| if an error occurred.
825 static std::unique_ptr<FileWriter> Create(int fd, const ZipEntry* entry) {
826 const uint32_t declared_length = entry->uncompressed_length;
827 const off64_t current_offset = lseek64(fd, 0, SEEK_CUR);
828 if (current_offset == -1) {
829 ALOGW("Zip: unable to seek to current location on fd %d: %s", fd, strerror(errno));
830 return nullptr;
831 }
832
833 int result = 0;
834#if defined(__linux__)
835 if (declared_length > 0) {
836 // Make sure we have enough space on the volume to extract the compressed
837 // entry. Note that the call to ftruncate below will change the file size but
838 // will not allocate space on disk and this call to fallocate will not
839 // change the file size.
Badhri Jagan Sridharana68d0d12015-06-02 14:47:57 -0700840 // Note: fallocate is only supported by the following filesystems -
841 // btrfs, ext4, ocfs2, and xfs. Therefore fallocate might fail with
842 // EOPNOTSUPP error when issued in other filesystems.
843 // Hence, check for the return error code before concluding that the
844 // disk does not have enough space.
Narayan Kamathf899bd52015-04-17 11:53:14 +0100845 result = TEMP_FAILURE_RETRY(fallocate(fd, 0, current_offset, declared_length));
Badhri Jagan Sridharana68d0d12015-06-02 14:47:57 -0700846 if (result == -1 && errno == ENOSPC) {
Narayan Kamathd5d7abe2016-08-10 12:24:05 +0100847 ALOGW("Zip: unable to allocate %" PRId64 " bytes at offset %" PRId64 " : %s",
848 static_cast<int64_t>(declared_length), static_cast<int64_t>(current_offset),
849 strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100850 return std::unique_ptr<FileWriter>(nullptr);
851 }
852 }
853#endif // __linux__
854
Tao Baoa456c212016-11-15 10:08:07 -0800855 struct stat sb;
856 if (fstat(fd, &sb) == -1) {
857 ALOGW("Zip: unable to fstat file: %s", strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100858 return std::unique_ptr<FileWriter>(nullptr);
859 }
860
Tao Baoa456c212016-11-15 10:08:07 -0800861 // Block device doesn't support ftruncate(2).
862 if (!S_ISBLK(sb.st_mode)) {
863 result = TEMP_FAILURE_RETRY(ftruncate(fd, declared_length + current_offset));
864 if (result == -1) {
865 ALOGW("Zip: unable to truncate file to %" PRId64 ": %s",
866 static_cast<int64_t>(declared_length + current_offset), strerror(errno));
867 return std::unique_ptr<FileWriter>(nullptr);
868 }
869 }
870
Narayan Kamathf899bd52015-04-17 11:53:14 +0100871 return std::unique_ptr<FileWriter>(new FileWriter(fd, declared_length));
872 }
873
874 virtual bool Append(uint8_t* buf, size_t buf_size) override {
875 if (total_bytes_written_ + buf_size > declared_length_) {
876 ALOGW("Zip: Unexpected size " ZD " (declared) vs " ZD " (actual)",
877 declared_length_, total_bytes_written_ + buf_size);
878 return false;
879 }
880
Narayan Kamathe97e66e2015-04-27 16:25:53 +0100881 const bool result = android::base::WriteFully(fd_, buf, buf_size);
882 if (result) {
883 total_bytes_written_ += buf_size;
884 } else {
885 ALOGW("Zip: unable to write " ZD " bytes to file; %s", buf_size, strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100886 }
887
Narayan Kamathe97e66e2015-04-27 16:25:53 +0100888 return result;
Narayan Kamathf899bd52015-04-17 11:53:14 +0100889 }
890 private:
891 FileWriter(const int fd, const size_t declared_length) :
892 Writer(),
893 fd_(fd),
894 declared_length_(declared_length),
895 total_bytes_written_(0) {
896 }
897
898 const int fd_;
899 const size_t declared_length_;
900 size_t total_bytes_written_;
901};
902
Dmitriy Ivanovf94e1592015-03-06 13:27:59 -0800903// This method is using libz macros with old-style-casts
904#pragma GCC diagnostic push
905#pragma GCC diagnostic ignored "-Wold-style-cast"
906static inline int zlib_inflateInit2(z_stream* stream, int window_bits) {
907 return inflateInit2(stream, window_bits);
908}
909#pragma GCC diagnostic pop
910
Tianjie Xu18c25922016-09-29 15:27:41 -0700911static int32_t InflateEntryToWriter(MappedZipFile& mapped_zip, const ZipEntry* entry,
Narayan Kamathf899bd52015-04-17 11:53:14 +0100912 Writer* writer, uint64_t* crc_out) {
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700913 const size_t kBufSize = 32768;
914 std::vector<uint8_t> read_buf(kBufSize);
915 std::vector<uint8_t> write_buf(kBufSize);
Narayan Kamath7462f022013-11-21 13:05:04 +0000916 z_stream zstream;
917 int zerr;
918
919 /*
920 * Initialize the zlib stream struct.
921 */
922 memset(&zstream, 0, sizeof(zstream));
923 zstream.zalloc = Z_NULL;
924 zstream.zfree = Z_NULL;
925 zstream.opaque = Z_NULL;
926 zstream.next_in = NULL;
927 zstream.avail_in = 0;
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700928 zstream.next_out = &write_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000929 zstream.avail_out = kBufSize;
930 zstream.data_type = Z_UNKNOWN;
931
932 /*
933 * Use the undocumented "negative window bits" feature to tell zlib
934 * that there's no zlib header waiting for it.
935 */
Dmitriy Ivanovf94e1592015-03-06 13:27:59 -0800936 zerr = zlib_inflateInit2(&zstream, -MAX_WBITS);
Narayan Kamath7462f022013-11-21 13:05:04 +0000937 if (zerr != Z_OK) {
938 if (zerr == Z_VERSION_ERROR) {
939 ALOGE("Installed zlib is not compatible with linked version (%s)",
940 ZLIB_VERSION);
941 } else {
942 ALOGW("Call to inflateInit2 failed (zerr=%d)", zerr);
943 }
944
945 return kZlibError;
946 }
947
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800948 auto zstream_deleter = [](z_stream* stream) {
949 inflateEnd(stream); /* free up any allocated structures */
950 };
951
952 std::unique_ptr<z_stream, decltype(zstream_deleter)> zstream_guard(&zstream, zstream_deleter);
953
Narayan Kamath7462f022013-11-21 13:05:04 +0000954 const uint32_t uncompressed_length = entry->uncompressed_length;
955
Narayan Kamath162b7052017-06-05 13:21:12 +0100956 uint64_t crc = 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000957 uint32_t compressed_length = entry->compressed_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000958 do {
959 /* read as much as we can */
960 if (zstream.avail_in == 0) {
Yabin Cuib2a77002016-02-08 16:26:33 -0800961 const size_t getSize = (compressed_length > kBufSize) ? kBufSize : compressed_length;
Tianjie Xu18c25922016-09-29 15:27:41 -0700962 if (!mapped_zip.ReadData(read_buf.data(), getSize)) {
Yabin Cuib2a77002016-02-08 16:26:33 -0800963 ALOGW("Zip: inflate read failed, getSize = %zu: %s", getSize, strerror(errno));
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800964 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000965 }
966
967 compressed_length -= getSize;
968
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700969 zstream.next_in = &read_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000970 zstream.avail_in = getSize;
971 }
972
973 /* uncompress the data */
974 zerr = inflate(&zstream, Z_NO_FLUSH);
975 if (zerr != Z_OK && zerr != Z_STREAM_END) {
976 ALOGW("Zip: inflate zerr=%d (nIn=%p aIn=%u nOut=%p aOut=%u)",
977 zerr, zstream.next_in, zstream.avail_in,
978 zstream.next_out, zstream.avail_out);
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800979 return kZlibError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000980 }
981
982 /* write when we're full or when we're done */
983 if (zstream.avail_out == 0 ||
984 (zerr == Z_STREAM_END && zstream.avail_out != kBufSize)) {
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700985 const size_t write_size = zstream.next_out - &write_buf[0];
Narayan Kamathf899bd52015-04-17 11:53:14 +0100986 if (!writer->Append(&write_buf[0], write_size)) {
987 // The file might have declared a bogus length.
988 return kInconsistentInformation;
Narayan Kamath162b7052017-06-05 13:21:12 +0100989 } else {
990 crc = crc32(crc, &write_buf[0], write_size);
Narayan Kamath7462f022013-11-21 13:05:04 +0000991 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000992
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700993 zstream.next_out = &write_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000994 zstream.avail_out = kBufSize;
995 }
996 } while (zerr == Z_OK);
997
998 assert(zerr == Z_STREAM_END); /* other errors should've been caught */
999
Narayan Kamath162b7052017-06-05 13:21:12 +01001000 // NOTE: zstream.adler is always set to 0, because we're using the -MAX_WBITS
1001 // "feature" of zlib to tell it there won't be a zlib file header. zlib
1002 // doesn't bother calculating the checksum in that scenario. We just do
1003 // it ourselves above because there are no additional gains to be made by
1004 // having zlib calculate it for us, since they do it by calling crc32 in
1005 // the same manner that we have above.
1006 *crc_out = crc;
Narayan Kamath7462f022013-11-21 13:05:04 +00001007
1008 if (zstream.total_out != uncompressed_length || compressed_length != 0) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001009 ALOGW("Zip: size mismatch on inflated file (%lu vs %" PRIu32 ")",
Narayan Kamath7462f022013-11-21 13:05:04 +00001010 zstream.total_out, uncompressed_length);
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -08001011 return kInconsistentInformation;
Narayan Kamath7462f022013-11-21 13:05:04 +00001012 }
1013
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -08001014 return 0;
Narayan Kamath7462f022013-11-21 13:05:04 +00001015}
1016
Tianjie Xu18c25922016-09-29 15:27:41 -07001017static int32_t CopyEntryToWriter(MappedZipFile& mapped_zip, const ZipEntry* entry, Writer* writer,
Narayan Kamathf899bd52015-04-17 11:53:14 +01001018 uint64_t *crc_out) {
1019 static const uint32_t kBufSize = 32768;
1020 std::vector<uint8_t> buf(kBufSize);
1021
1022 const uint32_t length = entry->uncompressed_length;
1023 uint32_t count = 0;
1024 uint64_t crc = 0;
1025 while (count < length) {
1026 uint32_t remaining = length - count;
1027
1028 // Safe conversion because kBufSize is narrow enough for a 32 bit signed
1029 // value.
Yabin Cuib2a77002016-02-08 16:26:33 -08001030 const size_t block_size = (remaining > kBufSize) ? kBufSize : remaining;
Tianjie Xu18c25922016-09-29 15:27:41 -07001031 if (!mapped_zip.ReadData(buf.data(), block_size)) {
Yabin Cuib2a77002016-02-08 16:26:33 -08001032 ALOGW("CopyFileToFile: copy read failed, block_size = %zu: %s", block_size, strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +01001033 return kIoError;
1034 }
1035
1036 if (!writer->Append(&buf[0], block_size)) {
1037 return kIoError;
1038 }
1039 crc = crc32(crc, &buf[0], block_size);
1040 count += block_size;
1041 }
1042
1043 *crc_out = crc;
1044
1045 return 0;
1046}
1047
1048int32_t ExtractToWriter(ZipArchiveHandle handle,
1049 ZipEntry* entry, Writer* writer) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -08001050 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +00001051 const uint16_t method = entry->method;
1052 off64_t data_offset = entry->offset;
1053
Tianjie Xu18c25922016-09-29 15:27:41 -07001054 if (!archive->mapped_zip.SeekToOffset(data_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -08001055 ALOGW("Zip: lseek to data at %" PRId64 " failed", static_cast<int64_t>(data_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +00001056 return kIoError;
1057 }
1058
1059 // this should default to kUnknownCompressionMethod.
1060 int32_t return_value = -1;
1061 uint64_t crc = 0;
1062 if (method == kCompressStored) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001063 return_value = CopyEntryToWriter(archive->mapped_zip, entry, writer, &crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001064 } else if (method == kCompressDeflated) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001065 return_value = InflateEntryToWriter(archive->mapped_zip, entry, writer, &crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001066 }
1067
1068 if (!return_value && entry->has_data_descriptor) {
Narayan Kamath162b7052017-06-05 13:21:12 +01001069 return_value = ValidateDataDescriptor(archive->mapped_zip, entry);
Narayan Kamath7462f022013-11-21 13:05:04 +00001070 if (return_value) {
1071 return return_value;
1072 }
1073 }
1074
Narayan Kamath162b7052017-06-05 13:21:12 +01001075 // Validate that the CRC matches the calculated value.
1076 if (kCrcChecksEnabled && (entry->crc32 != static_cast<uint32_t>(crc))) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001077 ALOGW("Zip: crc mismatch: expected %" PRIu32 ", was %" PRIu64, entry->crc32, crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001078 return kInconsistentInformation;
1079 }
1080
1081 return return_value;
1082}
1083
Narayan Kamathf899bd52015-04-17 11:53:14 +01001084int32_t ExtractToMemory(ZipArchiveHandle handle, ZipEntry* entry,
1085 uint8_t* begin, uint32_t size) {
1086 std::unique_ptr<Writer> writer(new MemoryWriter(begin, size));
1087 return ExtractToWriter(handle, entry, writer.get());
1088}
1089
Narayan Kamath7462f022013-11-21 13:05:04 +00001090int32_t ExtractEntryToFile(ZipArchiveHandle handle,
1091 ZipEntry* entry, int fd) {
Narayan Kamathf899bd52015-04-17 11:53:14 +01001092 std::unique_ptr<Writer> writer(FileWriter::Create(fd, entry));
1093 if (writer.get() == nullptr) {
Narayan Kamath7462f022013-11-21 13:05:04 +00001094 return kIoError;
1095 }
1096
Narayan Kamathf899bd52015-04-17 11:53:14 +01001097 return ExtractToWriter(handle, entry, writer.get());
Narayan Kamath7462f022013-11-21 13:05:04 +00001098}
1099
1100const char* ErrorCodeString(int32_t error_code) {
1101 if (error_code > kErrorMessageLowerBound && error_code < kErrorMessageUpperBound) {
1102 return kErrorMessages[error_code * -1];
1103 }
1104
1105 return kErrorMessages[0];
1106}
1107
1108int GetFileDescriptor(const ZipArchiveHandle handle) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001109 return reinterpret_cast<ZipArchive*>(handle)->mapped_zip.GetFileDescriptor();
Narayan Kamath7462f022013-11-21 13:05:04 +00001110}
Colin Cross7c6c7f02016-09-16 10:15:51 -07001111
1112ZipString::ZipString(const char* entry_name)
1113 : name(reinterpret_cast<const uint8_t*>(entry_name)) {
1114 size_t len = strlen(entry_name);
1115 CHECK_LE(len, static_cast<size_t>(UINT16_MAX));
1116 name_length = static_cast<uint16_t>(len);
1117}
Tianjie Xu18c25922016-09-29 15:27:41 -07001118
1119#if !defined(_WIN32)
1120class ProcessWriter : public Writer {
1121 public:
1122 ProcessWriter(ProcessZipEntryFunction func, void* cookie) : Writer(),
1123 proc_function_(func),
1124 cookie_(cookie) {
1125 }
1126
1127 virtual bool Append(uint8_t* buf, size_t buf_size) override {
1128 return proc_function_(buf, buf_size, cookie_);
1129 }
1130
1131 private:
1132 ProcessZipEntryFunction proc_function_;
1133 void* cookie_;
1134};
1135
1136int32_t ProcessZipEntryContents(ZipArchiveHandle handle, ZipEntry* entry,
1137 ProcessZipEntryFunction func, void* cookie) {
1138 ProcessWriter writer(func, cookie);
1139 return ExtractToWriter(handle, entry, &writer);
1140}
1141
1142#endif //!defined(_WIN32)
1143
1144int MappedZipFile::GetFileDescriptor() const {
1145 if (!has_fd_) {
1146 ALOGW("Zip: MappedZipFile doesn't have a file descriptor.");
1147 return -1;
1148 }
1149 return fd_;
1150}
1151
1152void* MappedZipFile::GetBasePtr() const {
1153 if (has_fd_) {
1154 ALOGW("Zip: MappedZipFile doesn't have a base pointer.");
1155 return nullptr;
1156 }
1157 return base_ptr_;
1158}
1159
1160off64_t MappedZipFile::GetFileLength() const {
1161 if (has_fd_) {
1162 off64_t result = lseek64(fd_, 0, SEEK_END);
1163 if (result == -1) {
1164 ALOGE("Zip: lseek on fd %d failed: %s", fd_, strerror(errno));
1165 }
1166 return result;
1167 } else {
1168 if (base_ptr_ == nullptr) {
1169 ALOGE("Zip: invalid file map\n");
1170 return -1;
1171 }
1172 return static_cast<off64_t>(data_length_);
1173 }
1174}
1175
1176bool MappedZipFile::SeekToOffset(off64_t offset) {
1177 if (has_fd_) {
1178 if (lseek64(fd_, offset, SEEK_SET) != offset) {
1179 ALOGE("Zip: lseek to %" PRId64 " failed: %s\n", offset, strerror(errno));
1180 return false;
1181 }
1182 return true;
1183 } else {
1184 if (offset < 0 || offset > static_cast<off64_t>(data_length_)) {
1185 ALOGE("Zip: invalid offset: %" PRId64 ", data length: %" PRId64 "\n" , offset,
1186 data_length_);
1187 return false;
1188 }
1189
1190 read_pos_ = offset;
1191 return true;
1192 }
1193}
1194
1195bool MappedZipFile::ReadData(uint8_t* buffer, size_t read_amount) {
1196 if (has_fd_) {
1197 if(!android::base::ReadFully(fd_, buffer, read_amount)) {
1198 ALOGE("Zip: read from %d failed\n", fd_);
1199 return false;
1200 }
1201 } else {
1202 memcpy(buffer, static_cast<uint8_t*>(base_ptr_) + read_pos_, read_amount);
1203 read_pos_ += read_amount;
1204 }
1205 return true;
1206}
1207
1208// Attempts to read |len| bytes into |buf| at offset |off|.
1209bool MappedZipFile::ReadAtOffset(uint8_t* buf, size_t len, off64_t off) {
1210#if !defined(_WIN32)
1211 if (has_fd_) {
1212 if (static_cast<size_t>(TEMP_FAILURE_RETRY(pread64(fd_, buf, len, off))) != len) {
1213 ALOGE("Zip: failed to read at offset %" PRId64 "\n", off);
1214 return false;
1215 }
1216 return true;
1217 }
1218#endif
1219 if (!SeekToOffset(off)) {
1220 return false;
1221 }
1222 return ReadData(buf, len);
1223
1224}
1225
1226void CentralDirectory::Initialize(void* map_base_ptr, off64_t cd_start_offset, size_t cd_size) {
1227 base_ptr_ = static_cast<uint8_t*>(map_base_ptr) + cd_start_offset;
1228 length_ = cd_size;
1229}
1230
1231bool ZipArchive::InitializeCentralDirectory(const char* debug_file_name, off64_t cd_start_offset,
1232 size_t cd_size) {
1233 if (mapped_zip.HasFd()) {
1234 if (!directory_map->create(debug_file_name, mapped_zip.GetFileDescriptor(),
1235 cd_start_offset, cd_size, true /* read only */)) {
1236 return false;
1237 }
1238
1239 CHECK_EQ(directory_map->getDataLength(), cd_size);
1240 central_directory.Initialize(directory_map->getDataPtr(), 0/*offset*/, cd_size);
1241 } else {
1242 if (mapped_zip.GetBasePtr() == nullptr) {
1243 ALOGE("Zip: Failed to map central directory, bad mapped_zip base pointer\n");
1244 return false;
1245 }
1246 if (static_cast<off64_t>(cd_start_offset) + static_cast<off64_t>(cd_size) >
1247 mapped_zip.GetFileLength()) {
1248 ALOGE("Zip: Failed to map central directory, offset exceeds mapped memory region ("
1249 "start_offset %" PRId64 ", cd_size %zu, mapped_region_size %" PRId64 ")",
1250 static_cast<int64_t>(cd_start_offset), cd_size, mapped_zip.GetFileLength());
1251 return false;
1252 }
1253
1254 central_directory.Initialize(mapped_zip.GetBasePtr(), cd_start_offset, cd_size);
1255 }
1256 return true;
1257}