/*
 * Copyright (C) 2015 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "ziparchive/zip_writer.h"

#include <sys/param.h>
#include <sys/stat.h>
#include <zlib.h>
#define DEF_MEM_LEVEL 8  // normally in zutil.h?

#include <cstdint>
#include <cstdio>
#include <memory>
#include <vector>

#include "android-base/logging.h"

#include "entry_name_utils-inl.h"
#include "zip_archive_common.h"

// Replace any previously defined powerof2() (presumably the one pulled in via
// <sys/param.h>) with a version that evaluates its argument exactly once and
// performs the `x - 1` step through an overflow-checked builtin.
//
// Evaluates to non-zero when `x` has at most one bit set. When `x - 1` is not
// representable in the type of `x` (for example x == 0 with an unsigned type),
// the macro evaluates to 1, so 0 is accepted as well.
//
// Relies on the GNU statement-expression, __typeof__ and
// __builtin_add_overflow extensions.
#undef powerof2
#define powerof2(x)                                               \
  ({                                                              \
    __typeof__(x) _x = (x);                                       \
    __typeof__(x) _x2;                                            \
    __builtin_add_overflow(_x, -1, &_x2) ? 1 : ((_x2 & _x) == 0); \
  })

/* Zip compression methods we support */
enum {
  kCompressStored = 0,    // no compression
  kCompressDeflated = 8,  // standard deflate
};

// Size of the output buffer used for compression.
static const size_t kBufSize = 32768u;

// No error, operation completed successfully.
static const int32_t kNoError = 0;

// The ZipWriter is in a bad state.
static const int32_t kInvalidState = -1;

// There was an IO error while writing to disk.
static const int32_t kIoError = -2;

// The zip entry name was invalid.
static const int32_t kInvalidEntryName = -3;

// An error occurred in zlib.
static const int32_t kZlibError = -4;

// The start aligned function was called with the aligned flag.
static const int32_t kInvalidAlign32Flag = -5;

// The alignment parameter is not a power of 2.
static const int32_t kInvalidAlignment = -6;

Adam Lesinski622f3042015-10-05 18:16:18 -070071static const char* sErrorCodes[] = {
Jiyong Park6821cc82017-06-30 17:23:33 +090072 "Invalid state", "IO error", "Invalid entry name", "Zlib error",
Adam Lesinski622f3042015-10-05 18:16:18 -070073};
74
75const char* ZipWriter::ErrorCodeString(int32_t error_code) {
76 if (error_code < 0 && (-error_code) < static_cast<int32_t>(arraysize(sErrorCodes))) {
77 return sErrorCodes[-error_code];
78 }
79 return nullptr;
80}
81
// Deleter used for the z_stream smart pointer: ends the deflate session with
// deflateEnd() and then frees the heap-allocated stream object.
static void DeleteZStream(z_stream* stream) {
  deflateEnd(stream);
  delete stream;
}

Jiyong Park6821cc82017-06-30 17:23:33 +090087ZipWriter::ZipWriter(FILE* f)
88 : file_(f),
89 seekable_(false),
90 current_offset_(0),
91 state_(State::kWritingZip),
92 z_stream_(nullptr, DeleteZStream),
93 buffer_(kBufSize) {
Adam Lesinskif61aaf42017-03-29 16:10:11 -070094 // Check if the file is seekable (regular file). If fstat fails, that's fine, subsequent calls
95 // will fail as well.
96 struct stat file_stats;
97 if (fstat(fileno(f), &file_stats) == 0) {
98 seekable_ = S_ISREG(file_stats.st_mode);
99 }
Adam Lesinski622f3042015-10-05 18:16:18 -0700100}
101
Chih-Hung Hsiehbb79eac2018-09-25 11:16:22 -0700102ZipWriter::ZipWriter(ZipWriter&& writer) noexcept
Jiyong Park6821cc82017-06-30 17:23:33 +0900103 : file_(writer.file_),
104 seekable_(writer.seekable_),
105 current_offset_(writer.current_offset_),
106 state_(writer.state_),
107 files_(std::move(writer.files_)),
108 z_stream_(std::move(writer.z_stream_)),
109 buffer_(std::move(writer.buffer_)) {
Adam Lesinski622f3042015-10-05 18:16:18 -0700110 writer.file_ = nullptr;
111 writer.state_ = State::kError;
112}
113
Chih-Hung Hsiehbb79eac2018-09-25 11:16:22 -0700114ZipWriter& ZipWriter::operator=(ZipWriter&& writer) noexcept {
Adam Lesinski622f3042015-10-05 18:16:18 -0700115 file_ = writer.file_;
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700116 seekable_ = writer.seekable_;
Adam Lesinski622f3042015-10-05 18:16:18 -0700117 current_offset_ = writer.current_offset_;
118 state_ = writer.state_;
119 files_ = std::move(writer.files_);
Adam Lesinskic322b432015-10-06 15:23:46 -0700120 z_stream_ = std::move(writer.z_stream_);
121 buffer_ = std::move(writer.buffer_);
Adam Lesinski622f3042015-10-05 18:16:18 -0700122 writer.file_ = nullptr;
123 writer.state_ = State::kError;
124 return *this;
125}
126
127int32_t ZipWriter::HandleError(int32_t error_code) {
128 state_ = State::kError;
Adam Lesinskic322b432015-10-06 15:23:46 -0700129 z_stream_.reset();
Adam Lesinski622f3042015-10-05 18:16:18 -0700130 return error_code;
131}
132
Yurii Zubrytskyi5338b872019-06-17 14:26:30 -0700133int32_t ZipWriter::StartEntry(std::string_view path, size_t flags) {
Christopher Ferris72082ab2016-01-19 10:33:03 -0800134 uint32_t alignment = 0;
135 if (flags & kAlign32) {
136 flags &= ~kAlign32;
137 alignment = 4;
138 }
139 return StartAlignedEntryWithTime(path, flags, time_t(), alignment);
140}
141
Yurii Zubrytskyi5338b872019-06-17 14:26:30 -0700142int32_t ZipWriter::StartAlignedEntry(std::string_view path, size_t flags, uint32_t alignment) {
Christopher Ferris72082ab2016-01-19 10:33:03 -0800143 return StartAlignedEntryWithTime(path, flags, time_t(), alignment);
144}
145
Yurii Zubrytskyi5338b872019-06-17 14:26:30 -0700146int32_t ZipWriter::StartEntryWithTime(std::string_view path, size_t flags, time_t time) {
Christopher Ferris72082ab2016-01-19 10:33:03 -0800147 uint32_t alignment = 0;
148 if (flags & kAlign32) {
149 flags &= ~kAlign32;
150 alignment = 4;
151 }
152 return StartAlignedEntryWithTime(path, flags, time, alignment);
Adam Lesinski622f3042015-10-05 18:16:18 -0700153}
154
// Converts `when` (interpreted in the local time zone) into the packed 16-bit
// time and date fields stored in zip headers:
//   *out_date = (year - 1980) << 9 | month (1-12) << 5 | day of month
//   *out_time = hour << 11 | minute << 5 | seconds / 2
// Years before 1980 are clamped to 1980. If the time cannot be broken down
// (the C library returns null), 1980-01-01 00:00:00 is written instead.
static void ExtractTimeAndDate(time_t when, uint16_t* out_time, uint16_t* out_date) {
  /* round up to an even number of seconds */
  // Done in a fixed 64-bit unsigned type so the value is not truncated on
  // platforms where `unsigned long` is narrower than time_t.
  when = static_cast<time_t>((static_cast<uint64_t>(when) + 1) & ~uint64_t{1});

  struct tm* ptm;
#if !defined(_WIN32)
  struct tm tm_result;
  ptm = localtime_r(&when, &tm_result);
#else
  ptm = localtime(&when);
#endif

  if (ptm == nullptr) {
    // The conversion failed (e.g. the value is out of range for struct tm).
    // Fall back to the earliest representable stamp instead of dereferencing
    // a null pointer.
    *out_date = static_cast<uint16_t>(1 << 5 | 1);
    *out_time = 0;
    return;
  }

  // tm_year counts from 1900; the zip date field counts from 1980.
  int year = ptm->tm_year;
  if (year < 80) {
    year = 80;
  }

  *out_date = static_cast<uint16_t>((year - 80) << 9 | (ptm->tm_mon + 1) << 5 | ptm->tm_mday);
  *out_time = static_cast<uint16_t>(ptm->tm_hour << 11 | ptm->tm_min << 5 | ptm->tm_sec >> 1);
}

Adam Lesinskif61aaf42017-03-29 16:10:11 -0700176static void CopyFromFileEntry(const ZipWriter::FileEntry& src, bool use_data_descriptor,
177 LocalFileHeader* dst) {
178 dst->lfh_signature = LocalFileHeader::kSignature;
179 if (use_data_descriptor) {
180 // Set this flag to denote that a DataDescriptor struct will appear after the data,
181 // containing the crc and size fields.
182 dst->gpb_flags |= kGPBDDFlagMask;
183
184 // The size and crc fields must be 0.
185 dst->compressed_size = 0u;
186 dst->uncompressed_size = 0u;
187 dst->crc32 = 0u;
188 } else {
189 dst->compressed_size = src.compressed_size;
190 dst->uncompressed_size = src.uncompressed_size;
191 dst->crc32 = src.crc32;
192 }
193 dst->compression_method = src.compression_method;
194 dst->last_mod_time = src.last_mod_time;
195 dst->last_mod_date = src.last_mod_date;
Andreas Gampe5a5ffb52019-04-05 13:48:02 -0700196 DCHECK_LE(src.path.size(), std::numeric_limits<uint16_t>::max());
197 dst->file_name_length = static_cast<uint16_t>(src.path.size());
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700198 dst->extra_field_length = src.padding_length;
199}
200
Yurii Zubrytskyi5338b872019-06-17 14:26:30 -0700201int32_t ZipWriter::StartAlignedEntryWithTime(std::string_view path, size_t flags, time_t time,
Jiyong Park6821cc82017-06-30 17:23:33 +0900202 uint32_t alignment) {
Adam Lesinski622f3042015-10-05 18:16:18 -0700203 if (state_ != State::kWritingZip) {
204 return kInvalidState;
205 }
206
Andreas Gampe5a5ffb52019-04-05 13:48:02 -0700207 // Can only have 16535 entries because of zip records.
208 if (files_.size() == std::numeric_limits<uint16_t>::max()) {
209 return HandleError(kIoError);
210 }
211
Christopher Ferris72082ab2016-01-19 10:33:03 -0800212 if (flags & kAlign32) {
213 return kInvalidAlign32Flag;
214 }
215
216 if (powerof2(alignment) == 0) {
217 return kInvalidAlignment;
218 }
Andreas Gampe5a5ffb52019-04-05 13:48:02 -0700219 if (alignment > std::numeric_limits<uint16_t>::max()) {
220 return kInvalidAlignment;
221 }
Christopher Ferris72082ab2016-01-19 10:33:03 -0800222
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700223 FileEntry file_entry = {};
224 file_entry.local_file_header_offset = current_offset_;
225 file_entry.path = path;
Andreas Gampe5a5ffb52019-04-05 13:48:02 -0700226 // No support for larger than 4GB files.
227 if (file_entry.local_file_header_offset > std::numeric_limits<uint32_t>::max()) {
228 return HandleError(kIoError);
229 }
Adam Lesinski622f3042015-10-05 18:16:18 -0700230
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700231 if (!IsValidEntryName(reinterpret_cast<const uint8_t*>(file_entry.path.data()),
232 file_entry.path.size())) {
Adam Lesinski622f3042015-10-05 18:16:18 -0700233 return kInvalidEntryName;
234 }
235
Adam Lesinskic322b432015-10-06 15:23:46 -0700236 if (flags & ZipWriter::kCompress) {
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700237 file_entry.compression_method = kCompressDeflated;
Adam Lesinskic322b432015-10-06 15:23:46 -0700238
239 int32_t result = PrepareDeflate();
240 if (result != kNoError) {
241 return result;
242 }
243 } else {
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700244 file_entry.compression_method = kCompressStored;
Adam Lesinskic322b432015-10-06 15:23:46 -0700245 }
Adam Lesinski622f3042015-10-05 18:16:18 -0700246
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700247 ExtractTimeAndDate(time, &file_entry.last_mod_time, &file_entry.last_mod_date);
Adam Lesinski622f3042015-10-05 18:16:18 -0700248
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700249 off_t offset = current_offset_ + sizeof(LocalFileHeader) + file_entry.path.size();
Yurii Zubrytskyibb0e58f2019-06-17 15:43:16 -0700250 // prepare a pre-zeroed memory page in case when we need to pad some aligned data.
251 static constexpr auto kPageSize = 4096;
252 static constexpr char kSmallZeroPadding[kPageSize] = {};
253 // use this buffer if our preallocated one is too small
254 std::vector<char> zero_padding_big;
255 const char* zero_padding = nullptr;
256
Christopher Ferris72082ab2016-01-19 10:33:03 -0800257 if (alignment != 0 && (offset & (alignment - 1))) {
Adam Lesinski622f3042015-10-05 18:16:18 -0700258 // Pad the extra field so the data will be aligned.
Andreas Gampe5a5ffb52019-04-05 13:48:02 -0700259 uint16_t padding = static_cast<uint16_t>(alignment - (offset % alignment));
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700260 file_entry.padding_length = padding;
Adam Lesinski622f3042015-10-05 18:16:18 -0700261 offset += padding;
Yurii Zubrytskyibb0e58f2019-06-17 15:43:16 -0700262 if (padding <= std::size(kSmallZeroPadding)) {
263 zero_padding = kSmallZeroPadding;
264 } else {
265 zero_padding_big.resize(padding, 0);
266 zero_padding = zero_padding_big.data();
267 }
Adam Lesinski622f3042015-10-05 18:16:18 -0700268 }
269
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700270 LocalFileHeader header = {};
271 // Always start expecting a data descriptor. When the data has finished being written,
272 // if it is possible to seek back, the GPB flag will reset and the sizes written.
273 CopyFromFileEntry(file_entry, true /*use_data_descriptor*/, &header);
274
Adam Lesinski622f3042015-10-05 18:16:18 -0700275 if (fwrite(&header, sizeof(header), 1, file_) != 1) {
276 return HandleError(kIoError);
277 }
278
Yurii Zubrytskyi5338b872019-06-17 14:26:30 -0700279 if (fwrite(path.data(), 1, path.size(), file_) != path.size()) {
Adam Lesinski622f3042015-10-05 18:16:18 -0700280 return HandleError(kIoError);
281 }
282
Yurii Zubrytskyibb0e58f2019-06-17 15:43:16 -0700283 if (file_entry.padding_length != 0 && fwrite(zero_padding, 1, file_entry.padding_length,
Jiyong Park6821cc82017-06-30 17:23:33 +0900284 file_) != file_entry.padding_length) {
Adam Lesinski622f3042015-10-05 18:16:18 -0700285 return HandleError(kIoError);
286 }
287
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700288 current_file_entry_ = std::move(file_entry);
Adam Lesinski622f3042015-10-05 18:16:18 -0700289 current_offset_ = offset;
290 state_ = State::kWritingEntry;
291 return kNoError;
292}
293
Adam Lesinski2e216de2017-03-16 13:23:51 -0700294int32_t ZipWriter::DiscardLastEntry() {
295 if (state_ != State::kWritingZip || files_.empty()) {
296 return kInvalidState;
297 }
298
299 FileEntry& last_entry = files_.back();
300 current_offset_ = last_entry.local_file_header_offset;
301 if (fseeko(file_, current_offset_, SEEK_SET) != 0) {
302 return HandleError(kIoError);
303 }
304 files_.pop_back();
305 return kNoError;
306}
307
308int32_t ZipWriter::GetLastEntry(FileEntry* out_entry) {
309 CHECK(out_entry != nullptr);
310
311 if (files_.empty()) {
312 return kInvalidState;
313 }
314 *out_entry = files_.back();
315 return kNoError;
316}
317
// Creates a fresh raw-deflate stream (negative window bits, best compression)
// and points its output at the internal buffer. Must be called in the
// kWritingZip state. Returns kZlibError, entering the error state, when zlib
// initialization fails.
int32_t ZipWriter::PrepareDeflate() {
  CHECK(state_ == State::kWritingZip);

  // Initialize the z_stream for compression.
  z_stream_ = std::unique_ptr<z_stream, void (*)(z_stream*)>(new z_stream(), DeleteZStream);

#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wold-style-cast"
  int zerr = deflateInit2(z_stream_.get(), Z_BEST_COMPRESSION, Z_DEFLATED, -MAX_WBITS,
                          DEF_MEM_LEVEL, Z_DEFAULT_STRATEGY);
#pragma GCC diagnostic pop

  if (zerr != Z_OK) {
    // Both failure kinds map to the same error code; only the log differs.
    if (zerr == Z_VERSION_ERROR) {
      LOG(ERROR) << "Installed zlib is not compatible with linked version (" << ZLIB_VERSION << ")";
    } else {
      LOG(ERROR) << "deflateInit2 failed (zerr=" << zerr << ")";
    }
    return HandleError(kZlibError);
  }

  z_stream_->next_out = buffer_.data();
  DCHECK_EQ(buffer_.size(), kBufSize);
  z_stream_->avail_out = static_cast<uint32_t>(buffer_.size());
  return kNoError;
}

// Appends `len` bytes from `data` to the entry currently being written,
// compressing them if the entry uses deflate, and updates the entry's CRC-32
// and uncompressed size.
//
// Returns kInvalidState when no entry is open and kIoError when the entry's
// uncompressed size would no longer fit in 32 bits; both put the writer into
// the error state. Errors from the store/compress helpers are passed through.
int32_t ZipWriter::WriteBytes(const void* data, size_t len) {
  if (state_ != State::kWritingEntry) {
    return HandleError(kInvalidState);
  }
  // Need to be able to mark down data correctly.
  if (len + static_cast<uint64_t>(current_file_entry_.uncompressed_size) >
      std::numeric_limits<uint32_t>::max()) {
    return HandleError(kIoError);
  }
  // Safe: the check above bounds len by the 32-bit maximum.
  uint32_t len32 = static_cast<uint32_t>(len);

  int32_t result = kNoError;
  if (current_file_entry_.compression_method & kCompressDeflated) {
    result = CompressBytes(&current_file_entry_, data, len32);
  } else {
    result = StoreBytes(&current_file_entry_, data, len32);
  }

  if (result != kNoError) {
    return result;
  }

  current_file_entry_.crc32 = static_cast<uint32_t>(
      crc32(current_file_entry_.crc32, reinterpret_cast<const Bytef*>(data), len32));
  current_file_entry_.uncompressed_size += len32;
  return kNoError;
}

Andreas Gampe5a5ffb52019-04-05 13:48:02 -0700374int32_t ZipWriter::StoreBytes(FileEntry* file, const void* data, uint32_t len) {
Adam Lesinski2e216de2017-03-16 13:23:51 -0700375 CHECK(state_ == State::kWritingEntry);
Adam Lesinskic322b432015-10-06 15:23:46 -0700376
377 if (fwrite(data, 1, len, file_) != len) {
378 return HandleError(kIoError);
379 }
380 file->compressed_size += len;
381 current_offset_ += len;
382 return kNoError;
383}
384
// Feeds `len` bytes from `data` through the active deflate stream. Whenever
// the internal output buffer fills up it is written to the file and
// accounted for in `file->compressed_size` and the current offset; output
// that does not fill the buffer stays there until a later call or
// FlushCompressedBytes().
//
// Returns kZlibError if deflate() fails and kIoError on a short write; both
// put the writer into the error state.
int32_t ZipWriter::CompressBytes(FileEntry* file, const void* data, uint32_t len) {
  CHECK(state_ == State::kWritingEntry);
  CHECK(z_stream_);
  CHECK(z_stream_->next_out != nullptr);
  CHECK(z_stream_->avail_out != 0);

  // Prepare the input.
  z_stream_->next_in = reinterpret_cast<const uint8_t*>(data);
  z_stream_->avail_in = len;

  // Writes everything deflate() has produced so far and rewinds the output
  // buffer. Returns false on a short write.
  const auto drain_output = [this, file]() {
    size_t write_bytes = z_stream_->next_out - buffer_.data();
    if (fwrite(buffer_.data(), 1, write_bytes, file_) != write_bytes) {
      return false;
    }
    file->compressed_size += write_bytes;
    current_offset_ += write_bytes;

    // Reset the output buffer for the next input.
    z_stream_->next_out = buffer_.data();
    DCHECK_EQ(buffer_.size(), kBufSize);
    z_stream_->avail_out = static_cast<uint32_t>(buffer_.size());
    return true;
  };

  while (z_stream_->avail_in > 0) {
    // We have more data to compress.
    int zerr = deflate(z_stream_.get(), Z_NO_FLUSH);
    if (zerr != Z_OK) {
      return HandleError(kZlibError);
    }

    // The output is full, let's write it to disk.
    if (z_stream_->avail_out == 0 && !drain_output()) {
      return HandleError(kIoError);
    }
  }
  return kNoError;
}

// Finishes the active deflate stream: keeps calling deflate(Z_FINISH),
// writing out the buffer each time it fills, then writes the final partial
// buffer and releases the stream. Written bytes are accounted for in
// `file->compressed_size` and the current offset.
//
// Returns kZlibError if the stream does not end cleanly and kIoError on a
// short write; both put the writer into the error state.
int32_t ZipWriter::FlushCompressedBytes(FileEntry* file) {
  CHECK(state_ == State::kWritingEntry);
  CHECK(z_stream_);
  CHECK(z_stream_->next_out != nullptr);
  CHECK(z_stream_->avail_out != 0);

  // Keep deflating while there isn't enough space in the buffer
  // to complete the compress.
  int zerr;
  while ((zerr = deflate(z_stream_.get(), Z_FINISH)) == Z_OK) {
    // Z_OK from a Z_FINISH call means deflate ran out of output space.
    CHECK(z_stream_->avail_out == 0);
    size_t write_bytes = z_stream_->next_out - buffer_.data();
    if (fwrite(buffer_.data(), 1, write_bytes, file_) != write_bytes) {
      return HandleError(kIoError);
    }
    file->compressed_size += write_bytes;
    current_offset_ += write_bytes;

    z_stream_->next_out = buffer_.data();
    DCHECK_EQ(buffer_.size(), kBufSize);
    z_stream_->avail_out = static_cast<uint32_t>(buffer_.size());
  }
  if (zerr != Z_STREAM_END) {
    return HandleError(kZlibError);
  }

  // Write whatever is left in the (partially filled) buffer.
  size_t write_bytes = z_stream_->next_out - buffer_.data();
  if (write_bytes != 0) {
    if (fwrite(buffer_.data(), 1, write_bytes, file_) != write_bytes) {
      return HandleError(kIoError);
    }
    file->compressed_size += write_bytes;
    current_offset_ += write_bytes;
  }
  z_stream_.reset();
  return kNoError;
}

Donald Chai322a60b2019-07-02 17:25:03 -0700458bool ZipWriter::ShouldUseDataDescriptor() const {
459 // Only use a trailing "data descriptor" if the output isn't seekable.
460 return !seekable_;
461}
462
Adam Lesinski622f3042015-10-05 18:16:18 -0700463int32_t ZipWriter::FinishEntry() {
464 if (state_ != State::kWritingEntry) {
465 return kInvalidState;
466 }
467
Adam Lesinski2e216de2017-03-16 13:23:51 -0700468 if (current_file_entry_.compression_method & kCompressDeflated) {
469 int32_t result = FlushCompressedBytes(&current_file_entry_);
Adam Lesinskic322b432015-10-06 15:23:46 -0700470 if (result != kNoError) {
471 return result;
472 }
473 }
474
Donald Chai322a60b2019-07-02 17:25:03 -0700475 if (ShouldUseDataDescriptor()) {
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700476 // Some versions of ZIP don't allow STORED data to have a trailing DataDescriptor.
477 // If this file is not seekable, or if the data is compressed, write a DataDescriptor.
Tianjiecc924632020-03-26 12:34:44 -0700478 // We haven't supported zip64 format yet. Write both uncompressed size and compressed
479 // size as uint32_t.
480 std::vector<uint32_t> dataDescriptor = {
481 DataDescriptor::kOptSignature, current_file_entry_.crc32,
482 current_file_entry_.compressed_size, current_file_entry_.uncompressed_size};
483 if (fwrite(dataDescriptor.data(), dataDescriptor.size() * sizeof(uint32_t), 1, file_) != 1) {
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700484 return HandleError(kIoError);
485 }
Adam Lesinski622f3042015-10-05 18:16:18 -0700486
Tianjiecc924632020-03-26 12:34:44 -0700487 current_offset_ += sizeof(uint32_t) * dataDescriptor.size();
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700488 } else {
489 // Seek back to the header and rewrite to include the size.
490 if (fseeko(file_, current_file_entry_.local_file_header_offset, SEEK_SET) != 0) {
491 return HandleError(kIoError);
492 }
493
494 LocalFileHeader header = {};
495 CopyFromFileEntry(current_file_entry_, false /*use_data_descriptor*/, &header);
496
497 if (fwrite(&header, sizeof(header), 1, file_) != 1) {
498 return HandleError(kIoError);
499 }
500
501 if (fseeko(file_, current_offset_, SEEK_SET) != 0) {
502 return HandleError(kIoError);
503 }
Adam Lesinski622f3042015-10-05 18:16:18 -0700504 }
505
Adam Lesinski2e216de2017-03-16 13:23:51 -0700506 files_.emplace_back(std::move(current_file_entry_));
Adam Lesinski622f3042015-10-05 18:16:18 -0700507 state_ = State::kWritingZip;
508 return kNoError;
509}
510
511int32_t ZipWriter::Finish() {
512 if (state_ != State::kWritingZip) {
513 return kInvalidState;
514 }
515
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700516 off_t startOfCdr = current_offset_;
Adam Lesinski2e216de2017-03-16 13:23:51 -0700517 for (FileEntry& file : files_) {
Adam Lesinski622f3042015-10-05 18:16:18 -0700518 CentralDirectoryRecord cdr = {};
519 cdr.record_signature = CentralDirectoryRecord::kSignature;
Donald Chai322a60b2019-07-02 17:25:03 -0700520 if (ShouldUseDataDescriptor()) {
Adam Lesinski253cc062017-04-06 18:55:47 -0700521 cdr.gpb_flags |= kGPBDDFlagMask;
522 }
Adam Lesinski622f3042015-10-05 18:16:18 -0700523 cdr.compression_method = file.compression_method;
524 cdr.last_mod_time = file.last_mod_time;
525 cdr.last_mod_date = file.last_mod_date;
526 cdr.crc32 = file.crc32;
527 cdr.compressed_size = file.compressed_size;
528 cdr.uncompressed_size = file.uncompressed_size;
Andreas Gampe5a5ffb52019-04-05 13:48:02 -0700529 // Checked in IsValidEntryName.
530 DCHECK_LE(file.path.size(), std::numeric_limits<uint16_t>::max());
531 cdr.file_name_length = static_cast<uint16_t>(file.path.size());
532 // Checked in StartAlignedEntryWithTime.
533 DCHECK_LE(file.local_file_header_offset, std::numeric_limits<uint32_t>::max());
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700534 cdr.local_file_header_offset = static_cast<uint32_t>(file.local_file_header_offset);
Adam Lesinski622f3042015-10-05 18:16:18 -0700535 if (fwrite(&cdr, sizeof(cdr), 1, file_) != 1) {
536 return HandleError(kIoError);
537 }
538
539 if (fwrite(file.path.data(), 1, file.path.size(), file_) != file.path.size()) {
540 return HandleError(kIoError);
541 }
542
543 current_offset_ += sizeof(cdr) + file.path.size();
544 }
545
546 EocdRecord er = {};
547 er.eocd_signature = EocdRecord::kSignature;
Adam Lesinskia8d71d62015-10-20 12:41:49 -0700548 er.disk_num = 0;
549 er.cd_start_disk = 0;
Andreas Gampe5a5ffb52019-04-05 13:48:02 -0700550 // Checked when adding entries.
551 DCHECK_LE(files_.size(), std::numeric_limits<uint16_t>::max());
552 er.num_records_on_disk = static_cast<uint16_t>(files_.size());
553 er.num_records = static_cast<uint16_t>(files_.size());
554 if (current_offset_ > std::numeric_limits<uint32_t>::max()) {
555 return HandleError(kIoError);
556 }
557 er.cd_size = static_cast<uint32_t>(current_offset_ - startOfCdr);
558 er.cd_start_offset = static_cast<uint32_t>(startOfCdr);
Adam Lesinski622f3042015-10-05 18:16:18 -0700559
560 if (fwrite(&er, sizeof(er), 1, file_) != 1) {
561 return HandleError(kIoError);
562 }
563
Adam Lesinski2e216de2017-03-16 13:23:51 -0700564 current_offset_ += sizeof(er);
565
566 // Since we can BackUp() and potentially finish writing at an offset less than one we had
567 // already written at, we must truncate the file.
568
Adam Lesinskif61aaf42017-03-29 16:10:11 -0700569 if (ftruncate(fileno(file_), current_offset_) != 0) {
Adam Lesinski2e216de2017-03-16 13:23:51 -0700570 return HandleError(kIoError);
571 }
572
Adam Lesinski622f3042015-10-05 18:16:18 -0700573 if (fflush(file_) != 0) {
574 return HandleError(kIoError);
575 }
576
Adam Lesinski622f3042015-10-05 18:16:18 -0700577 state_ = State::kDone;
578 return kNoError;
579}