| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1 | """ | 
 | 2 | Read and write ZIP files. | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 3 |  | 
 | 4 | XXX references to utf-8 need further investigation. | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 5 | """ | 
| Christian Heimes | 790c823 | 2008-01-07 21:14:23 +0000 | [diff] [blame] | 6 | import struct, os, time, sys, shutil | 
| Guido van Rossum | 68937b4 | 2007-05-18 00:51:22 +0000 | [diff] [blame] | 7 | import binascii, io | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 8 |  | 
 | 9 | try: | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 10 |     import zlib # We may need its compression method | 
| Christian Heimes | d5e2b6f | 2008-03-19 21:50:51 +0000 | [diff] [blame] | 11 |     crc32 = zlib.crc32 | 
| Guido van Rossum | 9c673f3 | 2001-04-10 15:37:12 +0000 | [diff] [blame] | 12 | except ImportError: | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 13 |     zlib = None | 
| Christian Heimes | d5e2b6f | 2008-03-19 21:50:51 +0000 | [diff] [blame] | 14 |     crc32 = binascii.crc32 | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 15 |  | 
# Public names exported by a star-import of this module.
__all__ = ["BadZipfile", "error", "ZIP_STORED", "ZIP_DEFLATED", "is_zipfile",
           "ZipInfo", "ZipFile", "PyZipFile", "LargeZipFile" ]
| Skip Montanaro | 40fc160 | 2001-03-01 04:27:19 +0000 | [diff] [blame] | 18 |  | 
class BadZipfile(Exception):
    """The exception raised by this module for archives it cannot handle."""
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 21 |  | 
 | 22 |  | 
class LargeZipFile(Exception):
    """
    Raised when writing a zipfile that requires ZIP64 extensions while
    those extensions are disabled.
    """
 | 28 |  | 
# Module-level alias for BadZipfile.
error = BadZipfile      # The exception raised by this module
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 30 |  | 
# Sizes above ZIP64_LIMIT (the largest signed 32-bit value) make
# ZipInfo.FileHeader() fall back to the ZIP64 extension.
ZIP64_LIMIT = 0x7FFFFFFF
ZIP_FILECOUNT_LIMIT = 0x10000
ZIP_MAX_COMMENT = 0xFFFF

# constants for Zip file compression methods
ZIP_STORED, ZIP_DEFLATED = 0, 8
# Other ZIP compression methods not supported
 | 39 |  | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 40 | # Below are some formats and associated data for reading/writing headers using | 
 | 41 | # the struct module.  The names and structures of headers/records are those used | 
 | 42 | # in the PKWARE description of the ZIP file format: | 
 | 43 | #     http://www.pkware.com/documents/casestudies/APPNOTE.TXT | 
 | 44 | # (URL valid as of January 2008) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 45 |  | 
# The "end of central directory" structure, magic number, size, and indices
# (section V.I in the format document)
structEndArchive = b"<4s4H2LH"
stringEndArchive = b"PK\005\006"
sizeEndCentDir = struct.calcsize(structEndArchive)

# Positions of the fields in the unpacked record, in structure order.
(
    _ECD_SIGNATURE,
    _ECD_DISK_NUMBER,
    _ECD_DISK_START,
    _ECD_ENTRIES_THIS_DISK,
    _ECD_ENTRIES_TOTAL,
    _ECD_SIZE,
    _ECD_OFFSET,
    _ECD_COMMENT_SIZE,
    # These last two indices are not part of the structure as defined in the
    # spec, but they are used internally by this module as a convenience
    _ECD_COMMENT,
    _ECD_LOCATION,
) = range(10)
 | 64 |  | 
 | 65 | # The "central directory" structure, magic number, size, and indices | 
 | 66 | # of entries in the structure (section V.F in the format document) | 
 | 67 | structCentralDir = "<4s4B4HL2L5H2L" | 
| Georg Brandl | 2ee470f | 2008-07-16 12:55:28 +0000 | [diff] [blame] | 68 | stringCentralDir = b"PK\001\002" | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 69 | sizeCentralDir = struct.calcsize(structCentralDir) | 
 | 70 |  | 
| Fred Drake | 3e038e5 | 2001-02-28 17:56:26 +0000 | [diff] [blame] | 71 | # indexes of entries in the central directory structure | 
 | 72 | _CD_SIGNATURE = 0 | 
 | 73 | _CD_CREATE_VERSION = 1 | 
 | 74 | _CD_CREATE_SYSTEM = 2 | 
 | 75 | _CD_EXTRACT_VERSION = 3 | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 76 | _CD_EXTRACT_SYSTEM = 4 | 
| Fred Drake | 3e038e5 | 2001-02-28 17:56:26 +0000 | [diff] [blame] | 77 | _CD_FLAG_BITS = 5 | 
 | 78 | _CD_COMPRESS_TYPE = 6 | 
 | 79 | _CD_TIME = 7 | 
 | 80 | _CD_DATE = 8 | 
 | 81 | _CD_CRC = 9 | 
 | 82 | _CD_COMPRESSED_SIZE = 10 | 
 | 83 | _CD_UNCOMPRESSED_SIZE = 11 | 
 | 84 | _CD_FILENAME_LENGTH = 12 | 
 | 85 | _CD_EXTRA_FIELD_LENGTH = 13 | 
 | 86 | _CD_COMMENT_LENGTH = 14 | 
 | 87 | _CD_DISK_NUMBER_START = 15 | 
 | 88 | _CD_INTERNAL_FILE_ATTRIBUTES = 16 | 
 | 89 | _CD_EXTERNAL_FILE_ATTRIBUTES = 17 | 
 | 90 | _CD_LOCAL_HEADER_OFFSET = 18 | 
 | 91 |  | 
# The "local file header" structure, magic number, size, and indices
# (section V.A in the format document)
structFileHeader = "<4s2B4HL2L2H"
stringFileHeader = b"PK\003\004"
sizeFileHeader = struct.calcsize(structFileHeader)

# Positions of the fields in the unpacked header, in structure order.
(
    _FH_SIGNATURE,
    _FH_EXTRACT_VERSION,
    _FH_EXTRACT_SYSTEM,
    _FH_GENERAL_PURPOSE_FLAG_BITS,
    _FH_COMPRESSION_METHOD,
    _FH_LAST_MOD_TIME,
    _FH_LAST_MOD_DATE,
    _FH_CRC,
    _FH_COMPRESSED_SIZE,
    _FH_UNCOMPRESSED_SIZE,
    _FH_FILENAME_LENGTH,
    _FH_EXTRA_FIELD_LENGTH,
) = range(12)
 | 110 |  | 
# The "Zip64 end of central directory locator" structure, magic number, and size
structEndArchive64Locator = "<4sLQL"
stringEndArchive64Locator = b"PK\x06\x07"
sizeEndCentDir64Locator = struct.calcsize(structEndArchive64Locator)

# The "Zip64 end of central directory" record, magic number, size, and indices
# (section V.G in the format document)
structEndArchive64 = "<4sQ2H2L4Q"
stringEndArchive64 = b"PK\x06\x06"
sizeEndCentDir64 = struct.calcsize(structEndArchive64)

# Positions of the fields in the unpacked ZIP64 record, in structure order.
(
    _CD64_SIGNATURE,
    _CD64_DIRECTORY_RECSIZE,
    _CD64_CREATE_VERSION,
    _CD64_EXTRACT_VERSION,
    _CD64_DISK_NUMBER,
    _CD64_DISK_NUMBER_START,
    _CD64_NUMBER_ENTRIES_THIS_DISK,
    _CD64_NUMBER_ENTRIES_TOTAL,
    _CD64_DIRECTORY_SIZE,
    _CD64_OFFSET_START_CENTDIR,
) = range(10)
 | 132 |  | 
def is_zipfile(filename):
    """Quickly see if file is a ZIP file by checking the magic number.

    Return True when an "end of central directory" record can be located
    in the file named *filename*.  Return False otherwise, including when
    opening or reading the file raises IOError.
    """
    try:
        # The with-block closes the file even when _EndRecData() raises;
        # previously the handle leaked because close() was skipped.
        with io.open(filename, "rb") as fpin:
            endrec = _EndRecData(fpin)
    except IOError:
        return False
    # _EndRecData() yields a non-empty list on success and None otherwise.
    return bool(endrec)
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 144 |  | 
def _EndRecData64(fpin, offset, endrec):
    """
    Read the ZIP64 end-of-archive records and use them to update endrec.

    fpin   -- seekable binary file object positioned anywhere in the archive.
    offset -- position of the classic "end of central directory" record,
              relative to the end of the file (as passed to seek(..., 2)).
    endrec -- list produced by _EndRecData(); updated in place.

    Returns endrec.  It is returned unchanged when the ZIP64 locator or the
    ZIP64 record is missing, truncated, or carries an unexpected signature.
    Raises BadZipfile for archives that span multiple disks.
    """
    try:
        fpin.seek(offset - sizeEndCentDir64Locator, 2)
    except IOError:
        # The file is too small to hold a locator in front of the classic
        # record, so there is no ZIP64 data to merge.
        return endrec

    data = fpin.read(sizeEndCentDir64Locator)
    if len(data) != sizeEndCentDir64Locator:
        # Short read: unpacking would raise struct.error.
        return endrec
    sig, diskno, _reloff, disks = struct.unpack(structEndArchive64Locator, data)
    if sig != stringEndArchive64Locator:
        return endrec

    if diskno != 0 or disks != 1:
        raise BadZipfile("zipfiles that span multiple disks are not supported")

    # Assume no 'zip64 extensible data'
    fpin.seek(offset - sizeEndCentDir64Locator - sizeEndCentDir64, 2)
    data = fpin.read(sizeEndCentDir64)
    if len(data) != sizeEndCentDir64:
        return endrec
    sig, _sz, _create_version, _read_version, disk_num, disk_dir, \
            dircount, dircount2, dirsize, diroffset = \
            struct.unpack(structEndArchive64, data)
    if sig != stringEndArchive64:
        return endrec

    # Update the original endrec using data from the ZIP64 record
    endrec[_ECD_DISK_NUMBER] = disk_num
    endrec[_ECD_DISK_START] = disk_dir
    endrec[_ECD_ENTRIES_THIS_DISK] = dircount
    endrec[_ECD_ENTRIES_TOTAL] = dircount2
    endrec[_ECD_SIZE] = dirsize
    endrec[_ECD_OFFSET] = diroffset
    return endrec
 | 175 |  | 
 | 176 |  | 
def _EndRecData(fpin):
    """Return data from the "End of Central Directory" record, or None.

    The data is a list of the nine items in the ZIP "End of central dir"
    record followed by a tenth item, the file seek offset of this record.

    None is returned when no valid record can be found, including when the
    file is too short to contain one or the record found is truncated.
    """

    # Determine file size
    fpin.seek(0, 2)
    filesize = fpin.tell()

    # Check to see if this is ZIP file with no archive comment (the
    # "end of central directory" structure should be the last item in the
    # file if this is the case).
    try:
        fpin.seek(-sizeEndCentDir, 2)
    except IOError:
        # File is shorter than the record itself: cannot be a ZIP file.
        return None
    data = fpin.read()
    if (len(data) == sizeEndCentDir and
            data[0:4] == stringEndArchive and
            data[-2:] == b"\000\000"):
        # the signature is correct and there's no comment, unpack structure
        endrec = list(struct.unpack(structEndArchive, data))

        # Append a blank comment and record start offset
        endrec.append(b"")
        endrec.append(filesize - sizeEndCentDir)
        if endrec[_ECD_OFFSET] == 0xffffffff:
            # the value for the "offset of the start of the central directory"
            # indicates that there is a "Zip64 end of central directory"
            # structure present, so go look for it
            return _EndRecData64(fpin, -sizeEndCentDir, endrec)

        return endrec

    # Either this is not a ZIP file, or it is a ZIP file with an archive
    # comment.  Search the end of the file for the "end of central directory"
    # record signature. The comment is the last item in the ZIP file and may be
    # up to 64K long.  It is assumed that the "end of central directory" magic
    # number does not appear in the comment.
    maxCommentStart = max(filesize - (1 << 16) - sizeEndCentDir, 0)
    fpin.seek(maxCommentStart, 0)
    data = fpin.read()
    start = data.rfind(stringEndArchive)
    if start < 0:
        # Unable to find a valid end of central directory structure
        return None

    # found the magic number; attempt to unpack and interpret
    recData = data[start:start+sizeEndCentDir]
    if len(recData) != sizeEndCentDir:
        # Signature sits too close to the end of the file: truncated record.
        return None
    endrec = list(struct.unpack(structEndArchive, recData))
    comment = data[start+sizeEndCentDir:]
    # check that comment length is correct
    if endrec[_ECD_COMMENT_SIZE] != len(comment):
        return None

    # Append the archive comment and start offset
    endrec.append(comment)
    endrec.append(maxCommentStart + start)
    if endrec[_ECD_OFFSET] == 0xffffffff:
        # There is apparently a "Zip64 end of central directory"
        # structure present, so go look for it.  `start` is relative to
        # maxCommentStart, so add it back before converting the position
        # into an offset from the end of the file.
        return _EndRecData64(fpin, maxCommentStart + start - filesize, endrec)
    return endrec
| Martin v. Löwis | 6f6873b | 2002-10-13 13:54:50 +0000 | [diff] [blame] | 235 |  | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 236 |  | 
class ZipInfo(object):
    """Class with attributes describing each file in the ZIP archive."""

    __slots__ = (
            'orig_filename',
            'filename',
            'date_time',
            'compress_type',
            'comment',
            'extra',
            'create_system',
            'create_version',
            'extract_version',
            'reserved',
            'flag_bits',
            'volume',
            'internal_attr',
            'external_attr',
            'header_offset',
            'CRC',
            'compress_size',
            'file_size',
            '_raw_time',
        )

    def __init__(self, filename="NoName", date_time=(1980,1,1,0,0,0)):
        """Create an entry description with default attribute values.

        filename  -- member name; truncated at the first null character and
                     normalised to use "/" as the directory separator.
        date_time -- (year, month, day, hour, min, sec) tuple.
        """
        self.orig_filename = filename   # Original file name in archive

        # Terminate the file name at the first null byte.  Null bytes in file
        # names are used as tricks by viruses in archives.
        null_byte = filename.find(chr(0))
        if null_byte >= 0:
            filename = filename[0:null_byte]
        # This is used to ensure paths in generated ZIP files always use
        # forward slashes as the directory separator, as required by the
        # ZIP format specification.
        if os.sep != "/" and os.sep in filename:
            filename = filename.replace(os.sep, "/")

        self.filename = filename        # Normalized file name
        self.date_time = date_time      # year, month, day, hour, min, sec
        # Standard values:
        self.compress_type = ZIP_STORED # Type of compression for the file
        self.comment = b""              # Comment for each file
        self.extra = b""                # ZIP extra data
        if sys.platform == 'win32':
            self.create_system = 0          # System which created ZIP archive
        else:
            # Assume everything else is unix-y
            self.create_system = 3          # System which created ZIP archive
        self.create_version = 20        # Version which created ZIP archive
        self.extract_version = 20       # Version needed to extract archive
        self.reserved = 0               # Must be zero
        self.flag_bits = 0              # ZIP flag bits
        self.volume = 0                 # Volume number of file header
        self.internal_attr = 0          # Internal attributes
        self.external_attr = 0          # External file attributes
        # Other attributes are set by class ZipFile:
        # header_offset         Byte offset to the file header
        # CRC                   CRC-32 of the uncompressed file
        # compress_size         Size of the compressed file
        # file_size             Size of the uncompressed file

    def FileHeader(self):
        """Return the per-file header as a bytes object.

        The result is the packed local file header followed by the encoded
        file name and the extra field.  When either size exceeds ZIP64_LIMIT
        a ZIP64 extra record is appended and extract_version/create_version
        are raised to at least 45 on this instance.
        """
        dt = self.date_time
        dosdate = (dt[0] - 1980) << 9 | dt[1] << 5 | dt[2]
        dostime = dt[3] << 11 | dt[4] << 5 | (dt[5] // 2)
        if self.flag_bits & 0x08:
            # Set these to zero because we write them after the file data
            CRC = compress_size = file_size = 0
        else:
            CRC = self.CRC
            compress_size = self.compress_size
            file_size = self.file_size

        extra = self.extra

        if file_size > ZIP64_LIMIT or compress_size > ZIP64_LIMIT:
            # File is larger than what fits into a 4 byte integer,
            # fall back to the ZIP64 extension
            fmt = '<HHQQ'
            extra = extra + struct.pack(fmt,
                    1, struct.calcsize(fmt)-4, file_size, compress_size)
            file_size = 0xffffffff
            compress_size = 0xffffffff
            self.extract_version = max(45, self.extract_version)
            # Raise create_version from its own value; deriving it from
            # extract_version could lower a higher create_version.
            self.create_version = max(45, self.create_version)

        filename, flag_bits = self._encodeFilenameFlags()
        header = struct.pack(structFileHeader, stringFileHeader,
                 self.extract_version, self.reserved, flag_bits,
                 self.compress_type, dostime, dosdate, CRC,
                 compress_size, file_size,
                 len(filename), len(extra))
        return header + filename + extra

    def _encodeFilenameFlags(self):
        """Return (encoded file name, flag bits) for writing headers.

        ASCII is used when the name allows it; otherwise the name is encoded
        as UTF-8 and bit 0x800 is set in the returned flags.
        """
        try:
            return self.filename.encode('ascii'), self.flag_bits
        except UnicodeEncodeError:
            return self.filename.encode('utf-8'), self.flag_bits | 0x800

    def _decodeExtra(self):
        """Decode the extra field and apply any ZIP64 record it contains.

        Values in a type-1 (ZIP64) record replace file_size, compress_size
        and header_offset, in that order, for each attribute that currently
        holds the 0xffffffff placeholder.  Raises RuntimeError when a ZIP64
        record has an unsupported length.
        """
        extra = self.extra
        unpack = struct.unpack
        # Every record starts with a 4-byte (type, length) header; trailing
        # bytes too short to hold one are ignored instead of crashing unpack.
        while len(extra) >= 4:
            tp, ln = unpack('<HH', extra[:4])
            if tp == 1:
                if ln >= 24:
                    counts = unpack('<QQQ', extra[4:28])
                elif ln == 16:
                    counts = unpack('<QQ', extra[4:20])
                elif ln == 8:
                    counts = unpack('<Q', extra[4:12])
                elif ln == 0:
                    counts = ()
                else:
                    raise RuntimeError("Corrupt extra field %s"%(ln,))

                idx = 0

                # ZIP64 extension (large files and/or large archives)
                if self.file_size in (0xffffffffffffffff, 0xffffffff):
                    self.file_size = counts[idx]
                    idx += 1

                if self.compress_size == 0xFFFFFFFF:
                    self.compress_size = counts[idx]
                    idx += 1

                if self.header_offset == 0xffffffff:
                    self.header_offset = counts[idx]
                    idx += 1

            extra = extra[ln+4:]
 | 376 |  | 
class _ZipDecrypter:
    """Decrypt data stored with the password-based ZIP encryption.

    ZIP supports a password-based form of encryption. Even though known
    plaintext attacks have been found against it, it is still useful
    to be able to get data out of such a file.

    Usage:
        zd = _ZipDecrypter(mypwd)
        plain_char = zd(cypher_char)
        plain_text = map(zd, cypher_text)
    """

    def _GenerateCRCTable():
        """Build the 256-entry CRC-32 lookup table.

        ZIP encryption uses the CRC32 one-byte primitive for scrambling some
        internal keys. We noticed that a direct implementation is faster than
        relying on binascii.crc32().
        """
        poly = 0xedb88320
        table = []
        for value in range(256):
            # Eight shift steps per entry; fold in the polynomial whenever
            # the bit shifted out is set.
            for _ in range(8):
                shifted = (value >> 1) & 0x7FFFFFFF
                value = shifted ^ poly if value & 1 else shifted
            table.append(value)
        return table
    crctable = _GenerateCRCTable()

    def _crc32(self, ch, crc):
        """Compute the CRC32 primitive on one byte."""
        index = (crc ^ ch) & 0xff
        return ((crc >> 8) & 0xffffff) ^ self.crctable[index]

    def __init__(self, pwd):
        """Seed the three keys, then mix in each item of *pwd* in order."""
        self.key0, self.key1, self.key2 = 0x12345678, 0x23456789, 0x34567890
        for item in pwd:
            self._UpdateKeys(item)

    def _UpdateKeys(self, c):
        """Advance the three keys using the byte value *c*."""
        mask = 0xFFFFFFFF
        self.key0 = self._crc32(c, self.key0)
        summed = (self.key1 + (self.key0 & 0xFF)) & mask
        self.key1 = (summed * 0x08088405 + 1) & mask
        self.key2 = self._crc32((self.key1 >> 24) & 0xFF, self.key2)

    def __call__(self, c):
        """Decrypt a single character."""
        assert isinstance(c, int)
        k = self.key2 | 2
        plain = c ^ (((k * (k ^ 1)) >> 8) & 255)
        # The keys are advanced with the decrypted value, not the input.
        self._UpdateKeys(plain)
        return plain
 | 434 |  | 
class ZipExtFile:
    """File-like object for reading an archive member.
       Is returned by ZipFile.open().

       Data flows through three buffers: rawbuffer holds bytes read from the
       underlying file that the decompressor has not consumed yet, readbuffer
       holds decoded bytes not yet handed out by read(), and linebuffer holds
       bytes pulled through read() by readline() but not yet returned.
    """

    def __init__(self, fileobj, zipinfo, decrypt=None):
        """Wrap fileobj for reading the member described by zipinfo.

        fileobj is read from its current position.  decrypt, when given, is
        a callable applied to every raw byte (an int) before decompression.
        """
        self.fileobj = fileobj
        self.decrypter = decrypt
        self.bytes_read = 0
        self.rawbuffer = b''
        self.readbuffer = b''
        self.linebuffer = b''
        # NOTE(review): nothing inside this class sets eof to True, so the
        # flush branch in read() looks unreachable unless a caller sets it.
        self.eof = False
        self.univ_newlines = False
        self.nlSeps = (b"\n", )
        self.lastdiscard = b''

        self.compress_type = zipinfo.compress_type
        self.compress_size = zipinfo.compress_size

        self.closed  = False
        self.mode    = "r"
        self.name = zipinfo.filename

        # read from compressed files in 64k blocks
        self.compreadsize = 64*1024
        if self.compress_type == ZIP_DEFLATED:
            # negative window size: raw deflate stream without zlib header
            self.dc = zlib.decompressobj(-15)

    def set_univ_newlines(self, univ_newlines):
        """Enable or disable universal newline handling for readline()."""
        self.univ_newlines = univ_newlines

        # pick line separator char(s) based on universal newlines flag.
        # Longer separators must come first: _checkfornewline() keeps the
        # first-listed separator when two match at the same position.
        self.nlSeps = (b"\n", )
        if self.univ_newlines:
            self.nlSeps = (b"\r\n", b"\r", b"\n")

    def __iter__(self):
        return self

    def __next__(self):
        """Return the next line, raising StopIteration at end of data."""
        nextline = self.readline()
        if not nextline:
            raise StopIteration()

        return nextline

    def close(self):
        """Mark the object as closed (the underlying file is not touched)."""
        self.closed = True

    def _checkfornewline(self):
        """Locate the earliest line separator in linebuffer.

        Returns (position, separator length), or (-1, -1) when linebuffer
        holds no separator.
        """
        nl, nllen = -1, -1
        if self.linebuffer:
            # ugly check for cases where half of an \r\n pair was
            # read on the last pass, and the \r was discarded.  In this
            # case we just throw away the \n at the start of the buffer.
            if (self.lastdiscard, self.linebuffer[:1]) == (b'\r', b'\n'):
                self.linebuffer = self.linebuffer[1:]
                # the pair is complete now; forget the pending \r so that a
                # later, unrelated leading \n is not swallowed as well
                self.lastdiscard = b''

            # Pick the separator that occurs first in the buffer, not the
            # first separator type that happens to occur anywhere in it.
            for sep in self.nlSeps:
                pos = self.linebuffer.find(sep)
                if pos >= 0 and (nl < 0 or pos < nl):
                    nl, nllen = pos, len(sep)

        return nl, nllen

    def readline(self, size = -1):
        """Read a line with approx. size. If size is negative,
           read a whole line.

           A complete line is always returned terminated by b"\\n",
           whatever separator ended it in the data.  When the size limit is
           reached before the line separator, the bytes read so far are
           returned without a terminator and the rest of the line is kept
           for the next call.
        """
        if size < 0:
            size = sys.maxsize
        elif size == 0:
            return b''

        # check for a newline already in buffer
        nl, nllen = self._checkfornewline()

        if nl >= 0:
            # the next line was already in the buffer
            if nl > size:
                # the limit falls inside the line: hand out exactly size
                # bytes and leave everything else (separator included)
                # untouched in the buffer
                s = self.linebuffer[:size]
                self.linebuffer = self.linebuffer[size:]
                self.lastdiscard = b''
                return s
        else:
            # no line break in buffer - try to read more
            size -= len(self.linebuffer)
            while nl < 0 and size > 0:
                buf = self.read(min(size, 100))
                if not buf:
                    break
                self.linebuffer += buf
                size -= len(buf)

                # check for a newline in buffer
                nl, nllen = self._checkfornewline()

            # we either ran out of bytes in the file, or
            # met the specified size limit without finding a newline,
            # so return current buffer
            if nl < 0:
                s = self.linebuffer
                self.linebuffer = b''
                return s

        buf = self.linebuffer[:nl]
        # remember the separator so a \r\n pair split across two reads can
        # be recognised by _checkfornewline() on the next call
        self.lastdiscard = self.linebuffer[nl:nl + nllen]
        self.linebuffer = self.linebuffer[nl + nllen:]

        # line is always returned with \n as newline char (except possibly
        # for a final incomplete line in the file, which is handled above).
        return buf + b"\n"

    def readlines(self, sizehint = -1):
        """Return a list with all (following) lines. The sizehint parameter
        is ignored in this implementation.
        """
        result = []
        while True:
            line = self.readline()
            if not line: break
            result.append(line)
        return result

    def read(self, size = None):
        """Return up to size decoded bytes; everything available if size is
        None or negative.

        A call may return fewer bytes than requested; b'' is returned once
        no more data can be produced.
        """
        # act like file obj and return empty string if size is 0
        if size == 0:
            return b''

        # a negative size means "no limit", exactly like None; without this
        # the final slice below would silently drop the last byte
        if size is not None and size < 0:
            size = None

        # determine read size
        bytesToRead = self.compress_size - self.bytes_read

        # adjust read size for encrypted files since the first 12 bytes
        # are for the encryption/password information
        if self.decrypter is not None:
            bytesToRead -= 12

        if size is not None:
            if self.compress_type == ZIP_STORED:
                lr = len(self.readbuffer)
                bytesToRead = min(bytesToRead, size - lr)
            elif self.compress_type == ZIP_DEFLATED:
                if len(self.readbuffer) > size:
                    # the user has requested fewer bytes than we've already
                    # pulled through the decompressor; don't read any more
                    bytesToRead = 0
                else:
                    # user will use up the buffer, so read some more
                    lr = len(self.rawbuffer)
                    bytesToRead = min(bytesToRead, self.compreadsize - lr)

        # avoid reading past end of file contents
        if bytesToRead + self.bytes_read > self.compress_size:
            bytesToRead = self.compress_size - self.bytes_read

        # try to read from file (if necessary)
        if bytesToRead > 0:
            data = self.fileobj.read(bytesToRead)
            self.bytes_read += len(data)
            self.rawbuffer += data

            # handle contents of raw buffer
            if self.rawbuffer:
                newdata = self.rawbuffer
                self.rawbuffer = b''

                # decrypt new data if we were given an object to handle that
                if newdata and self.decrypter is not None:
                    newdata = bytes(map(self.decrypter, newdata))

                # decompress newly read data if necessary
                if newdata and self.compress_type == ZIP_DEFLATED:
                    newdata = self.dc.decompress(newdata)
                    self.rawbuffer = self.dc.unconsumed_tail
                    if self.eof and len(self.rawbuffer) == 0:
                        # we're out of raw bytes (both from the file and
                        # the local buffer); flush just to make sure the
                        # decompressor is done
                        newdata += self.dc.flush()
                        # prevent decompressor from being used again
                        self.dc = None

                self.readbuffer += newdata


        # return what the user asked for
        if size is None or len(self.readbuffer) <= size:
            data = self.readbuffer
            self.readbuffer = b''
        else:
            data = self.readbuffer[:size]
            self.readbuffer = self.readbuffer[size:]

        return data
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 632 |  | 
 | 633 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 634 | class ZipFile: | 
| Tim Peters | a19a168 | 2001-03-29 04:36:09 +0000 | [diff] [blame] | 635 |     """ Class with methods to open, read, write, close, list zip files. | 
 | 636 |  | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 637 |     z = ZipFile(file, mode="r", compression=ZIP_STORED, allowZip64=False) | 
| Tim Peters | a19a168 | 2001-03-29 04:36:09 +0000 | [diff] [blame] | 638 |  | 
| Fred Drake | 3d9091e | 2001-03-26 15:49:24 +0000 | [diff] [blame] | 639 |     file: Either the path to the file, or a file-like object. | 
 | 640 |           If it is a path, the file will be opened and closed by ZipFile. | 
 | 641 |     mode: The mode can be either read "r", write "w" or append "a". | 
 | 642 |     compression: ZIP_STORED (no compression) or ZIP_DEFLATED (requires zlib). | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 643 |     allowZip64: if True ZipFile will create files with ZIP64 extensions when | 
 | 644 |                 needed, otherwise it will raise an exception when this would | 
 | 645 |                 be necessary. | 
 | 646 |  | 
| Fred Drake | 3d9091e | 2001-03-26 15:49:24 +0000 | [diff] [blame] | 647 |     """ | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 648 |  | 
| Fred Drake | 90eac28 | 2001-02-28 05:29:34 +0000 | [diff] [blame] | 649 |     fp = None                   # Set here since __del__ checks it | 
 | 650 |  | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 651 |     def __init__(self, file, mode="r", compression=ZIP_STORED, allowZip64=False): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 652 |         """Open the ZIP file with mode read "r", write "w" or append "a".""" | 
| Guido van Rossum | b5a755e | 2007-07-18 18:15:48 +0000 | [diff] [blame] | 653 |         if mode not in ("r", "w", "a"): | 
 | 654 |             raise RuntimeError('ZipFile() requires mode "r", "w", or "a"') | 
 | 655 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 656 |         if compression == ZIP_STORED: | 
 | 657 |             pass | 
 | 658 |         elif compression == ZIP_DEFLATED: | 
 | 659 |             if not zlib: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 660 |                 raise RuntimeError( | 
 | 661 |                       "Compression requires the (missing) zlib module") | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 662 |         else: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 663 |             raise RuntimeError("That compression method is not supported") | 
| Guido van Rossum | b5a755e | 2007-07-18 18:15:48 +0000 | [diff] [blame] | 664 |  | 
 | 665 |         self._allowZip64 = allowZip64 | 
 | 666 |         self._didModify = False | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 667 |         self.debug = 0  # Level of printing: 0 through 3 | 
 | 668 |         self.NameToInfo = {}    # Find file info given name | 
 | 669 |         self.filelist = []      # List of ZipInfo instances for archive | 
 | 670 |         self.compression = compression  # Method of compression | 
| Raymond Hettinger | 2ca7c19 | 2005-02-16 09:27:49 +0000 | [diff] [blame] | 671 |         self.mode = key = mode.replace('b', '')[0] | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 672 |         self.pwd = None | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 673 |         self.comment = b'' | 
| Tim Peters | a19a168 | 2001-03-29 04:36:09 +0000 | [diff] [blame] | 674 |  | 
| Fred Drake | 3d9091e | 2001-03-26 15:49:24 +0000 | [diff] [blame] | 675 |         # Check if we were passed a file-like object | 
| Guido van Rossum | 3172c5d | 2007-10-16 18:12:55 +0000 | [diff] [blame] | 676 |         if isinstance(file, str): | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 677 |             # No, it's a filename | 
| Fred Drake | 3d9091e | 2001-03-26 15:49:24 +0000 | [diff] [blame] | 678 |             self._filePassed = 0 | 
 | 679 |             self.filename = file | 
 | 680 |             modeDict = {'r' : 'rb', 'w': 'wb', 'a' : 'r+b'} | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 681 |             try: | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 682 |                 self.fp = io.open(file, modeDict[mode]) | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 683 |             except IOError: | 
 | 684 |                 if mode == 'a': | 
 | 685 |                     mode = key = 'w' | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 686 |                     self.fp = io.open(file, modeDict[mode]) | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 687 |                 else: | 
 | 688 |                     raise | 
| Fred Drake | 3d9091e | 2001-03-26 15:49:24 +0000 | [diff] [blame] | 689 |         else: | 
 | 690 |             self._filePassed = 1 | 
 | 691 |             self.fp = file | 
 | 692 |             self.filename = getattr(file, 'name', None) | 
| Tim Peters | a19a168 | 2001-03-29 04:36:09 +0000 | [diff] [blame] | 693 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 694 |         if key == 'r': | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 695 |             self._GetContents() | 
 | 696 |         elif key == 'w': | 
| Fred Drake | 3d9091e | 2001-03-26 15:49:24 +0000 | [diff] [blame] | 697 |             pass | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 698 |         elif key == 'a': | 
| Martin v. Löwis | 6f6873b | 2002-10-13 13:54:50 +0000 | [diff] [blame] | 699 |             try:                        # See if file is a zip file | 
 | 700 |                 self._RealGetContents() | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 701 |                 # seek to start of directory and overwrite | 
| Martin v. Löwis | 6f6873b | 2002-10-13 13:54:50 +0000 | [diff] [blame] | 702 |                 self.fp.seek(self.start_dir, 0) | 
 | 703 |             except BadZipfile:          # file is not a zip file, just append | 
 | 704 |                 self.fp.seek(0, 2) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 705 |         else: | 
| Tim Peters | 7d3bad6 | 2001-04-04 18:56:49 +0000 | [diff] [blame] | 706 |             if not self._filePassed: | 
 | 707 |                 self.fp.close() | 
 | 708 |                 self.fp = None | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 709 |             raise RuntimeError('Mode must be "r", "w" or "a"') | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 710 |  | 
 | 711 |     def _GetContents(self): | 
| Tim Peters | 7d3bad6 | 2001-04-04 18:56:49 +0000 | [diff] [blame] | 712 |         """Read the directory, making sure we close the file if the format | 
 | 713 |         is bad.""" | 
 | 714 |         try: | 
 | 715 |             self._RealGetContents() | 
 | 716 |         except BadZipfile: | 
 | 717 |             if not self._filePassed: | 
 | 718 |                 self.fp.close() | 
 | 719 |                 self.fp = None | 
 | 720 |             raise | 
 | 721 |  | 
 | 722 |     def _RealGetContents(self): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 723 |         """Read in the table of contents for the ZIP file.""" | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 724 |         fp = self.fp | 
| Martin v. Löwis | 6f6873b | 2002-10-13 13:54:50 +0000 | [diff] [blame] | 725 |         endrec = _EndRecData(fp) | 
 | 726 |         if not endrec: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 727 |             raise BadZipfile("File is not a zip file") | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 728 |         if self.debug > 1: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 729 |             print(endrec) | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 730 |         size_cd = endrec[_ECD_SIZE]             # bytes in central directory | 
 | 731 |         offset_cd = endrec[_ECD_OFFSET]         # offset of central directory | 
 | 732 |         self.comment = endrec[_ECD_COMMENT]     # archive comment | 
 | 733 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 734 |         # "concat" is zero, unless zip was concatenated to another file | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 735 |         concat = endrec[_ECD_LOCATION] - size_cd - offset_cd | 
 | 736 |         if endrec[_ECD_LOCATION] > ZIP64_LIMIT: | 
 | 737 |             # If the offset of the "End of Central Dir" record requires Zip64 | 
 | 738 |             # extension structures, account for them | 
 | 739 |             concat -= (sizeEndCentDir64 + sizeEndCentDir64Locator) | 
 | 740 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 741 |         if self.debug > 2: | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 742 |             inferred = concat + offset_cd | 
 | 743 |             print("given, inferred, offset", offset_cd, inferred, concat) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 744 |         # self.start_dir:  Position of start of central directory | 
 | 745 |         self.start_dir = offset_cd + concat | 
 | 746 |         fp.seek(self.start_dir, 0) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 747 |         data = fp.read(size_cd) | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 748 |         fp = io.BytesIO(data) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 749 |         total = 0 | 
 | 750 |         while total < size_cd: | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 751 |             centdir = fp.read(sizeCentralDir) | 
| Georg Brandl | 2ee470f | 2008-07-16 12:55:28 +0000 | [diff] [blame] | 752 |             if centdir[0:4] != stringCentralDir: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 753 |                 raise BadZipfile("Bad magic number for central directory") | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 754 |             centdir = struct.unpack(structCentralDir, centdir) | 
 | 755 |             if self.debug > 2: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 756 |                 print(centdir) | 
| Fred Drake | 3e038e5 | 2001-02-28 17:56:26 +0000 | [diff] [blame] | 757 |             filename = fp.read(centdir[_CD_FILENAME_LENGTH]) | 
| Martin v. Löwis | 8570f6a | 2008-05-05 17:44:38 +0000 | [diff] [blame] | 758 |             flags = centdir[5] | 
 | 759 |             if flags & 0x800: | 
 | 760 |                 # UTF-8 file names extension | 
 | 761 |                 filename = filename.decode('utf-8') | 
 | 762 |             else: | 
 | 763 |                 # Historical ZIP filename encoding | 
 | 764 |                 filename = filename.decode('cp437') | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 765 |             # Create ZipInfo instance to store file information | 
| Martin v. Löwis | 8570f6a | 2008-05-05 17:44:38 +0000 | [diff] [blame] | 766 |             x = ZipInfo(filename) | 
| Fred Drake | 3e038e5 | 2001-02-28 17:56:26 +0000 | [diff] [blame] | 767 |             x.extra = fp.read(centdir[_CD_EXTRA_FIELD_LENGTH]) | 
 | 768 |             x.comment = fp.read(centdir[_CD_COMMENT_LENGTH]) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 769 |             x.header_offset = centdir[_CD_LOCAL_HEADER_OFFSET] | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 770 |             (x.create_version, x.create_system, x.extract_version, x.reserved, | 
 | 771 |                 x.flag_bits, x.compress_type, t, d, | 
 | 772 |                 x.CRC, x.compress_size, x.file_size) = centdir[1:12] | 
 | 773 |             x.volume, x.internal_attr, x.external_attr = centdir[15:18] | 
 | 774 |             # Convert date/time code to (year, month, day, hour, min, sec) | 
| Christian Heimes | fdab48e | 2008-01-20 09:06:41 +0000 | [diff] [blame] | 775 |             x._raw_time = t | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 776 |             x.date_time = ( (d>>9)+1980, (d>>5)&0xF, d&0x1F, | 
| Fred Drake | 414ca66 | 2000-06-13 18:49:53 +0000 | [diff] [blame] | 777 |                                      t>>11, (t>>5)&0x3F, (t&0x1F) * 2 ) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 778 |  | 
 | 779 |             x._decodeExtra() | 
 | 780 |             x.header_offset = x.header_offset + concat | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 781 |             self.filelist.append(x) | 
 | 782 |             self.NameToInfo[x.filename] = x | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 783 |  | 
 | 784 |             # update total bytes read from central directory | 
 | 785 |             total = (total + sizeCentralDir + centdir[_CD_FILENAME_LENGTH] | 
 | 786 |                      + centdir[_CD_EXTRA_FIELD_LENGTH] | 
 | 787 |                      + centdir[_CD_COMMENT_LENGTH]) | 
 | 788 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 789 |             if self.debug > 2: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 790 |                 print("total", total) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 791 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 792 |  | 
 | 793 |     def namelist(self): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 794 |         """Return a list of file names in the archive.""" | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 795 |         l = [] | 
 | 796 |         for data in self.filelist: | 
 | 797 |             l.append(data.filename) | 
 | 798 |         return l | 
 | 799 |  | 
 | 800 |     def infolist(self): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 801 |         """Return a list of class ZipInfo instances for files in the | 
 | 802 |         archive.""" | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 803 |         return self.filelist | 
 | 804 |  | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 805 |     def printdir(self, file=None): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 806 |         """Print a table of contents for the zip file.""" | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 807 |         print("%-46s %19s %12s" % ("File Name", "Modified    ", "Size"), | 
 | 808 |               file=file) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 809 |         for zinfo in self.filelist: | 
| Guido van Rossum | 7736b5b | 2008-01-15 21:44:53 +0000 | [diff] [blame] | 810 |             date = "%d-%02d-%02d %02d:%02d:%02d" % zinfo.date_time[:6] | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 811 |             print("%-46s %s %12d" % (zinfo.filename, date, zinfo.file_size), | 
 | 812 |                   file=file) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 813 |  | 
 | 814 |     def testzip(self): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 815 |         """Read all the files and check the CRC.""" | 
| Benjamin Peterson | 4cd6a95 | 2008-08-17 20:23:46 +0000 | [diff] [blame^] | 816 |         chunk_size = 2 ** 20 | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 817 |         for zinfo in self.filelist: | 
 | 818 |             try: | 
| Benjamin Peterson | 4cd6a95 | 2008-08-17 20:23:46 +0000 | [diff] [blame^] | 819 |                 # Read by chunks, to avoid an OverflowError or a | 
 | 820 |                 # MemoryError with very large embedded files. | 
 | 821 |                 f = self.open(zinfo.filename, "r") | 
 | 822 |                 while f.read(chunk_size):     # Check CRC-32 | 
 | 823 |                     pass | 
| Raymond Hettinger | c0fac96 | 2003-06-27 22:25:03 +0000 | [diff] [blame] | 824 |             except BadZipfile: | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 825 |                 return zinfo.filename | 
 | 826 |  | 
 | 827 |     def getinfo(self, name): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 828 |         """Return the instance of ZipInfo given 'name'.""" | 
| Guido van Rossum | b5a755e | 2007-07-18 18:15:48 +0000 | [diff] [blame] | 829 |         info = self.NameToInfo.get(name) | 
 | 830 |         if info is None: | 
 | 831 |             raise KeyError( | 
 | 832 |                 'There is no item named %r in the archive' % name) | 
 | 833 |  | 
 | 834 |         return info | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 835 |  | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 836 |     def setpassword(self, pwd): | 
 | 837 |         """Set default password for encrypted files.""" | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 838 |         assert isinstance(pwd, bytes) | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 839 |         self.pwd = pwd | 
 | 840 |  | 
 | 841 |     def read(self, name, pwd=None): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 842 |         """Return file bytes (as a string) for name.""" | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 843 |         return self.open(name, "r", pwd).read() | 
 | 844 |  | 
 | 845 |     def open(self, name, mode="r", pwd=None): | 
 | 846 |         """Return file-like object for 'name'.""" | 
 | 847 |         if mode not in ("r", "U", "rU"): | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 848 |             raise RuntimeError('open() requires mode "r", "U", or "rU"') | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 849 |         if not self.fp: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 850 |             raise RuntimeError( | 
 | 851 |                   "Attempt to read ZIP archive that was already closed") | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 852 |  | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 853 |         # Only open a new file for instances where we were not | 
 | 854 |         # given a file object in the constructor | 
 | 855 |         if self._filePassed: | 
 | 856 |             zef_file = self.fp | 
 | 857 |         else: | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 858 |             zef_file = io.open(self.filename, 'rb') | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 859 |  | 
| Georg Brandl | b533e26 | 2008-05-25 18:19:30 +0000 | [diff] [blame] | 860 |         # Make sure we have an info object | 
 | 861 |         if isinstance(name, ZipInfo): | 
 | 862 |             # 'name' is already an info object | 
 | 863 |             zinfo = name | 
 | 864 |         else: | 
 | 865 |             # Get info object for name | 
 | 866 |             zinfo = self.getinfo(name) | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 867 |  | 
 | 868 |         zef_file.seek(zinfo.header_offset, 0) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 869 |  | 
 | 870 |         # Skip the file header: | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 871 |         fheader = zef_file.read(sizeFileHeader) | 
| Georg Brandl | 2ee470f | 2008-07-16 12:55:28 +0000 | [diff] [blame] | 872 |         if fheader[0:4] != stringFileHeader: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 873 |             raise BadZipfile("Bad magic number for file header") | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 874 |  | 
 | 875 |         fheader = struct.unpack(structFileHeader, fheader) | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 876 |         fname = zef_file.read(fheader[_FH_FILENAME_LENGTH]) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 877 |         if fheader[_FH_EXTRA_FIELD_LENGTH]: | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 878 |             zef_file.read(fheader[_FH_EXTRA_FIELD_LENGTH]) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 879 |  | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 880 |         if fname != zinfo.orig_filename.encode("utf-8"): | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 881 |             raise BadZipfile( | 
 | 882 |                   'File name in directory %r and header %r differ.' | 
 | 883 |                   % (zinfo.orig_filename, fname)) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 884 |  | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 885 |         # check for encrypted flag & handle password | 
 | 886 |         is_encrypted = zinfo.flag_bits & 0x1 | 
 | 887 |         zd = None | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 888 |         if is_encrypted: | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 889 |             if not pwd: | 
 | 890 |                 pwd = self.pwd | 
 | 891 |             if not pwd: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 892 |                 raise RuntimeError("File %s is encrypted, " | 
 | 893 |                                    "password required for extraction" % name) | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 894 |  | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 895 |             zd = _ZipDecrypter(pwd) | 
 | 896 |             # The first 12 bytes in the cypher stream is an encryption header | 
 | 897 |             #  used to strengthen the algorithm. The first 11 bytes are | 
 | 898 |             #  completely random, while the 12th contains the MSB of the CRC, | 
| Christian Heimes | fdab48e | 2008-01-20 09:06:41 +0000 | [diff] [blame] | 899 |             #  or the MSB of the file time depending on the header type | 
| Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 900 |             #  and is used to check the correctness of the password. | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 901 |             bytes = zef_file.read(12) | 
| Guido van Rossum | c1f779c | 2007-07-03 08:25:58 +0000 | [diff] [blame] | 902 |             h = list(map(zd, bytes[0:12])) | 
| Christian Heimes | fdab48e | 2008-01-20 09:06:41 +0000 | [diff] [blame] | 903 |             if zinfo.flag_bits & 0x8: | 
 | 904 |                 # compare against the file type from extended local headers | 
 | 905 |                 check_byte = (zinfo._raw_time >> 8) & 0xff | 
 | 906 |             else: | 
 | 907 |                 # compare against the CRC otherwise | 
 | 908 |                 check_byte = (zinfo.CRC >> 24) & 0xff | 
 | 909 |             if h[11] != check_byte: | 
 | 910 |                 raise RuntimeError("Bad password for file", name) | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 911 |  | 
 | 912 |         # build and return a ZipExtFile | 
 | 913 |         if zd is None: | 
 | 914 |             zef = ZipExtFile(zef_file, zinfo) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 915 |         else: | 
| Guido van Rossum | d8faa36 | 2007-04-27 19:54:29 +0000 | [diff] [blame] | 916 |             zef = ZipExtFile(zef_file, zinfo, zd) | 
 | 917 |  | 
 | 918 |         # set universal newlines on ZipExtFile if necessary | 
 | 919 |         if "U" in mode: | 
 | 920 |             zef.set_univ_newlines(True) | 
 | 921 |         return zef | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 922 |  | 
| Christian Heimes | 790c823 | 2008-01-07 21:14:23 +0000 | [diff] [blame] | 923 |     def extract(self, member, path=None, pwd=None): | 
 | 924 |         """Extract a member from the archive to the current working directory, | 
 | 925 |            using its full name. Its file information is extracted as accurately | 
 | 926 |            as possible. `member' may be a filename or a ZipInfo object. You can | 
 | 927 |            specify a different directory using `path'. | 
 | 928 |         """ | 
 | 929 |         if not isinstance(member, ZipInfo): | 
 | 930 |             member = self.getinfo(member) | 
 | 931 |  | 
 | 932 |         if path is None: | 
 | 933 |             path = os.getcwd() | 
 | 934 |  | 
 | 935 |         return self._extract_member(member, path, pwd) | 
 | 936 |  | 
 | 937 |     def extractall(self, path=None, members=None, pwd=None): | 
 | 938 |         """Extract all members from the archive to the current working | 
 | 939 |            directory. `path' specifies a different directory to extract to. | 
 | 940 |            `members' is optional and must be a subset of the list returned | 
 | 941 |            by namelist(). | 
 | 942 |         """ | 
 | 943 |         if members is None: | 
 | 944 |             members = self.namelist() | 
 | 945 |  | 
 | 946 |         for zipinfo in members: | 
 | 947 |             self.extract(zipinfo, path, pwd) | 
 | 948 |  | 
 | 949 |     def _extract_member(self, member, targetpath, pwd): | 
 | 950 |         """Extract the ZipInfo object 'member' to a physical | 
 | 951 |            file on the path targetpath. | 
 | 952 |         """ | 
 | 953 |         # build the destination pathname, replacing | 
 | 954 |         # forward slashes to platform specific separators. | 
 | 955 |         if targetpath[-1:] == "/": | 
 | 956 |             targetpath = targetpath[:-1] | 
 | 957 |  | 
 | 958 |         # don't include leading "/" from file name if present | 
 | 959 |         if os.path.isabs(member.filename): | 
 | 960 |             targetpath = os.path.join(targetpath, member.filename[1:]) | 
 | 961 |         else: | 
 | 962 |             targetpath = os.path.join(targetpath, member.filename) | 
 | 963 |  | 
 | 964 |         targetpath = os.path.normpath(targetpath) | 
 | 965 |  | 
 | 966 |         # Create all upper directories if necessary. | 
 | 967 |         upperdirs = os.path.dirname(targetpath) | 
 | 968 |         if upperdirs and not os.path.exists(upperdirs): | 
 | 969 |             os.makedirs(upperdirs) | 
 | 970 |  | 
| Georg Brandl | b533e26 | 2008-05-25 18:19:30 +0000 | [diff] [blame] | 971 |         source = self.open(member, pwd=pwd) | 
| Christian Heimes | 790c823 | 2008-01-07 21:14:23 +0000 | [diff] [blame] | 972 |         target = open(targetpath, "wb") | 
 | 973 |         shutil.copyfileobj(source, target) | 
 | 974 |         source.close() | 
 | 975 |         target.close() | 
 | 976 |  | 
 | 977 |         return targetpath | 
 | 978 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 979 |     def _writecheck(self, zinfo): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 980 |         """Check for errors before writing a file to the archive.""" | 
| Raymond Hettinger | 54f0222 | 2002-06-01 14:18:47 +0000 | [diff] [blame] | 981 |         if zinfo.filename in self.NameToInfo: | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 982 |             if self.debug:      # Warning for duplicate names | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 983 |                 print("Duplicate name:", zinfo.filename) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 984 |         if self.mode not in ("w", "a"): | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 985 |             raise RuntimeError('write() requires mode "w" or "a"') | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 986 |         if not self.fp: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 987 |             raise RuntimeError( | 
 | 988 |                   "Attempt to write ZIP archive that was already closed") | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 989 |         if zinfo.compress_type == ZIP_DEFLATED and not zlib: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 990 |             raise RuntimeError( | 
 | 991 |                   "Compression requires the (missing) zlib module") | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 992 |         if zinfo.compress_type not in (ZIP_STORED, ZIP_DEFLATED): | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 993 |             raise RuntimeError("That compression method is not supported") | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 994 |         if zinfo.file_size > ZIP64_LIMIT: | 
 | 995 |             if not self._allowZip64: | 
 | 996 |                 raise LargeZipFile("Filesize would require ZIP64 extensions") | 
 | 997 |         if zinfo.header_offset > ZIP64_LIMIT: | 
 | 998 |             if not self._allowZip64: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 999 |                 raise LargeZipFile( | 
 | 1000 |                       "Zipfile size would require ZIP64 extensions") | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1001 |  | 
 | 1002 |     def write(self, filename, arcname=None, compress_type=None): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 1003 |         """Put the bytes from filename into the archive under the name | 
 | 1004 |         arcname.""" | 
| Guido van Rossum | b5a755e | 2007-07-18 18:15:48 +0000 | [diff] [blame] | 1005 |         if not self.fp: | 
 | 1006 |             raise RuntimeError( | 
 | 1007 |                   "Attempt to write to ZIP archive that was already closed") | 
 | 1008 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1009 |         st = os.stat(filename) | 
| Raymond Hettinger | 32200ae | 2002-06-01 19:51:15 +0000 | [diff] [blame] | 1010 |         mtime = time.localtime(st.st_mtime) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1011 |         date_time = mtime[0:6] | 
 | 1012 |         # Create ZipInfo instance to store file information | 
 | 1013 |         if arcname is None: | 
| Georg Brandl | 8f7c54e | 2006-02-20 08:40:38 +0000 | [diff] [blame] | 1014 |             arcname = filename | 
 | 1015 |         arcname = os.path.normpath(os.path.splitdrive(arcname)[1]) | 
 | 1016 |         while arcname[0] in (os.sep, os.altsep): | 
 | 1017 |             arcname = arcname[1:] | 
 | 1018 |         zinfo = ZipInfo(arcname, date_time) | 
| Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 1019 |         zinfo.external_attr = (st[0] & 0xFFFF) << 16      # Unix attributes | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1020 |         if compress_type is None: | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 1021 |             zinfo.compress_type = self.compression | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1022 |         else: | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 1023 |             zinfo.compress_type = compress_type | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1024 |  | 
 | 1025 |         zinfo.file_size = st.st_size | 
| Finn Bock | 03a3bb8 | 2001-09-05 18:40:33 +0000 | [diff] [blame] | 1026 |         zinfo.flag_bits = 0x00 | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 1027 |         zinfo.header_offset = self.fp.tell()    # Start of header bytes | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1028 |  | 
 | 1029 |         self._writecheck(zinfo) | 
 | 1030 |         self._didModify = True | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 1031 |         fp = io.open(filename, "rb") | 
| Finn Bock | 03a3bb8 | 2001-09-05 18:40:33 +0000 | [diff] [blame] | 1032 |         # Must overwrite CRC and sizes with correct data later | 
 | 1033 |         zinfo.CRC = CRC = 0 | 
 | 1034 |         zinfo.compress_size = compress_size = 0 | 
 | 1035 |         zinfo.file_size = file_size = 0 | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1036 |         self.fp.write(zinfo.FileHeader()) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1037 |         if zinfo.compress_type == ZIP_DEFLATED: | 
 | 1038 |             cmpr = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION, | 
 | 1039 |                  zlib.DEFLATED, -15) | 
 | 1040 |         else: | 
 | 1041 |             cmpr = None | 
 | 1042 |         while 1: | 
 | 1043 |             buf = fp.read(1024 * 8) | 
 | 1044 |             if not buf: | 
 | 1045 |                 break | 
 | 1046 |             file_size = file_size + len(buf) | 
| Christian Heimes | d5e2b6f | 2008-03-19 21:50:51 +0000 | [diff] [blame] | 1047 |             CRC = crc32(buf, CRC) & 0xffffffff | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1048 |             if cmpr: | 
 | 1049 |                 buf = cmpr.compress(buf) | 
 | 1050 |                 compress_size = compress_size + len(buf) | 
 | 1051 |             self.fp.write(buf) | 
 | 1052 |         fp.close() | 
 | 1053 |         if cmpr: | 
 | 1054 |             buf = cmpr.flush() | 
 | 1055 |             compress_size = compress_size + len(buf) | 
 | 1056 |             self.fp.write(buf) | 
 | 1057 |             zinfo.compress_size = compress_size | 
 | 1058 |         else: | 
 | 1059 |             zinfo.compress_size = file_size | 
 | 1060 |         zinfo.CRC = CRC | 
 | 1061 |         zinfo.file_size = file_size | 
| Finn Bock | 03a3bb8 | 2001-09-05 18:40:33 +0000 | [diff] [blame] | 1062 |         # Seek backwards and write CRC and file sizes | 
| Tim Peters | b64bec3 | 2001-09-18 02:26:39 +0000 | [diff] [blame] | 1063 |         position = self.fp.tell()       # Preserve current position in file | 
| Finn Bock | 03a3bb8 | 2001-09-05 18:40:33 +0000 | [diff] [blame] | 1064 |         self.fp.seek(zinfo.header_offset + 14, 0) | 
| Christian Heimes | d5e2b6f | 2008-03-19 21:50:51 +0000 | [diff] [blame] | 1065 |         self.fp.write(struct.pack("<LLL", zinfo.CRC, zinfo.compress_size, | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1066 |               zinfo.file_size)) | 
| Finn Bock | 03a3bb8 | 2001-09-05 18:40:33 +0000 | [diff] [blame] | 1067 |         self.fp.seek(position, 0) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1068 |         self.filelist.append(zinfo) | 
 | 1069 |         self.NameToInfo[zinfo.filename] = zinfo | 
 | 1070 |  | 
| Guido van Rossum | 85825dc | 2007-08-27 17:03:28 +0000 | [diff] [blame] | 1071 |     def writestr(self, zinfo_or_arcname, data): | 
 | 1072 |         """Write a file into the archive.  The contents is 'data', which | 
 | 1073 |         may be either a 'str' or a 'bytes' instance; if it is a 'str', | 
 | 1074 |         it is encoded as UTF-8 first. | 
 | 1075 |         'zinfo_or_arcname' is either a ZipInfo instance or | 
| Just van Rossum | b083cb3 | 2002-12-12 12:23:32 +0000 | [diff] [blame] | 1076 |         the name of the file in the archive.""" | 
| Guido van Rossum | 85825dc | 2007-08-27 17:03:28 +0000 | [diff] [blame] | 1077 |         if isinstance(data, str): | 
 | 1078 |             data = data.encode("utf-8") | 
| Just van Rossum | b083cb3 | 2002-12-12 12:23:32 +0000 | [diff] [blame] | 1079 |         if not isinstance(zinfo_or_arcname, ZipInfo): | 
 | 1080 |             zinfo = ZipInfo(filename=zinfo_or_arcname, | 
| Guido van Rossum | 7736b5b | 2008-01-15 21:44:53 +0000 | [diff] [blame] | 1081 |                             date_time=time.localtime(time.time())[:6]) | 
| Just van Rossum | b083cb3 | 2002-12-12 12:23:32 +0000 | [diff] [blame] | 1082 |             zinfo.compress_type = self.compression | 
| Antoine Pitrou | 6e1df8d | 2008-07-25 19:58:18 +0000 | [diff] [blame] | 1083 |             zinfo.external_attr = 0o600 << 16 | 
| Just van Rossum | b083cb3 | 2002-12-12 12:23:32 +0000 | [diff] [blame] | 1084 |         else: | 
 | 1085 |             zinfo = zinfo_or_arcname | 
| Guido van Rossum | b5a755e | 2007-07-18 18:15:48 +0000 | [diff] [blame] | 1086 |  | 
 | 1087 |         if not self.fp: | 
 | 1088 |             raise RuntimeError( | 
 | 1089 |                   "Attempt to write to ZIP archive that was already closed") | 
 | 1090 |  | 
| Guido van Rossum | 85825dc | 2007-08-27 17:03:28 +0000 | [diff] [blame] | 1091 |         zinfo.file_size = len(data)            # Uncompressed size | 
 | 1092 |         zinfo.header_offset = self.fp.tell()    # Start of header data | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1093 |         self._writecheck(zinfo) | 
 | 1094 |         self._didModify = True | 
| Christian Heimes | d5e2b6f | 2008-03-19 21:50:51 +0000 | [diff] [blame] | 1095 |         zinfo.CRC = crc32(data) & 0xffffffff       # CRC-32 checksum | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1096 |         if zinfo.compress_type == ZIP_DEFLATED: | 
 | 1097 |             co = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION, | 
 | 1098 |                  zlib.DEFLATED, -15) | 
| Guido van Rossum | 85825dc | 2007-08-27 17:03:28 +0000 | [diff] [blame] | 1099 |             data = co.compress(data) + co.flush() | 
 | 1100 |             zinfo.compress_size = len(data)    # Compressed size | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1101 |         else: | 
 | 1102 |             zinfo.compress_size = zinfo.file_size | 
| Guido van Rossum | 85825dc | 2007-08-27 17:03:28 +0000 | [diff] [blame] | 1103 |         zinfo.header_offset = self.fp.tell()    # Start of header data | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1104 |         self.fp.write(zinfo.FileHeader()) | 
| Guido van Rossum | 85825dc | 2007-08-27 17:03:28 +0000 | [diff] [blame] | 1105 |         self.fp.write(data) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1106 |         self.fp.flush() | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1107 |         if zinfo.flag_bits & 0x08: | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 1108 |             # Write CRC and file sizes after the file data | 
| Brett Cannon | ff450f7 | 2004-07-10 19:09:20 +0000 | [diff] [blame] | 1109 |             self.fp.write(struct.pack("<lLL", zinfo.CRC, zinfo.compress_size, | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 1110 |                   zinfo.file_size)) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1111 |         self.filelist.append(zinfo) | 
 | 1112 |         self.NameToInfo[zinfo.filename] = zinfo | 
 | 1113 |  | 
 | 1114 |     def __del__(self): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 1115 |         """Call the "close()" method in case the user forgot.""" | 
| Tim Peters | d15f8bb | 2001-11-28 23:16:40 +0000 | [diff] [blame] | 1116 |         self.close() | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1117 |  | 
 | 1118 |     def close(self): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 1119 |         """Close the file, and for mode "w" and "a" write the ending | 
 | 1120 |         records.""" | 
| Tim Peters | d15f8bb | 2001-11-28 23:16:40 +0000 | [diff] [blame] | 1121 |         if self.fp is None: | 
 | 1122 |             return | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1123 |  | 
 | 1124 |         if self.mode in ("w", "a") and self._didModify: # write ending records | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1125 |             count = 0 | 
 | 1126 |             pos1 = self.fp.tell() | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 1127 |             for zinfo in self.filelist:         # write central directory | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1128 |                 count = count + 1 | 
 | 1129 |                 dt = zinfo.date_time | 
 | 1130 |                 dosdate = (dt[0] - 1980) << 9 | dt[1] << 5 | dt[2] | 
| Tim Peters | 3caca23 | 2001-12-06 06:23:26 +0000 | [diff] [blame] | 1131 |                 dostime = dt[3] << 11 | dt[4] << 5 | (dt[5] // 2) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1132 |                 extra = [] | 
 | 1133 |                 if zinfo.file_size > ZIP64_LIMIT \ | 
 | 1134 |                         or zinfo.compress_size > ZIP64_LIMIT: | 
 | 1135 |                     extra.append(zinfo.file_size) | 
 | 1136 |                     extra.append(zinfo.compress_size) | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1137 |                     file_size = 0xffffffff | 
 | 1138 |                     compress_size = 0xffffffff | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1139 |                 else: | 
 | 1140 |                     file_size = zinfo.file_size | 
 | 1141 |                     compress_size = zinfo.compress_size | 
 | 1142 |  | 
 | 1143 |                 if zinfo.header_offset > ZIP64_LIMIT: | 
 | 1144 |                     extra.append(zinfo.header_offset) | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1145 |                     header_offset = 0xffffffff | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1146 |                 else: | 
 | 1147 |                     header_offset = zinfo.header_offset | 
 | 1148 |  | 
 | 1149 |                 extra_data = zinfo.extra | 
 | 1150 |                 if extra: | 
 | 1151 |                     # Append a ZIP64 field to the extra's | 
 | 1152 |                     extra_data = struct.pack( | 
| Christian Heimes | d5e2b6f | 2008-03-19 21:50:51 +0000 | [diff] [blame] | 1153 |                             '<HH' + 'Q'*len(extra), | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1154 |                             1, 8*len(extra), *extra) + extra_data | 
 | 1155 |  | 
 | 1156 |                     extract_version = max(45, zinfo.extract_version) | 
 | 1157 |                     create_version = max(45, zinfo.create_version) | 
 | 1158 |                 else: | 
 | 1159 |                     extract_version = zinfo.extract_version | 
 | 1160 |                     create_version = zinfo.create_version | 
 | 1161 |  | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1162 |                 try: | 
 | 1163 |                     filename, flag_bits = zinfo._encodeFilenameFlags() | 
 | 1164 |                     centdir = struct.pack(structCentralDir, | 
| Georg Brandl | 2ee470f | 2008-07-16 12:55:28 +0000 | [diff] [blame] | 1165 |                      stringCentralDir, create_version, | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1166 |                      zinfo.create_system, extract_version, zinfo.reserved, | 
 | 1167 |                      flag_bits, zinfo.compress_type, dostime, dosdate, | 
 | 1168 |                      zinfo.CRC, compress_size, file_size, | 
 | 1169 |                      len(filename), len(extra_data), len(zinfo.comment), | 
 | 1170 |                      0, zinfo.internal_attr, zinfo.external_attr, | 
 | 1171 |                      header_offset) | 
 | 1172 |                 except DeprecationWarning: | 
 | 1173 |                     print >>sys.stderr, (structCentralDir, | 
 | 1174 |                      stringCentralDir, create_version, | 
 | 1175 |                      zinfo.create_system, extract_version, zinfo.reserved, | 
 | 1176 |                      zinfo.flag_bits, zinfo.compress_type, dostime, dosdate, | 
 | 1177 |                      zinfo.CRC, compress_size, file_size, | 
 | 1178 |                      len(zinfo.filename), len(extra_data), len(zinfo.comment), | 
 | 1179 |                      0, zinfo.internal_attr, zinfo.external_attr, | 
 | 1180 |                      header_offset) | 
 | 1181 |                     raise | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1182 |                 self.fp.write(centdir) | 
| Martin v. Löwis | 8570f6a | 2008-05-05 17:44:38 +0000 | [diff] [blame] | 1183 |                 self.fp.write(filename) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1184 |                 self.fp.write(extra_data) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1185 |                 self.fp.write(zinfo.comment) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1186 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1187 |             pos2 = self.fp.tell() | 
 | 1188 |             # Write end-of-zip-archive record | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1189 |             centDirOffset = pos1 | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1190 |             if pos1 > ZIP64_LIMIT: | 
 | 1191 |                 # Need to write the ZIP64 end-of-archive records | 
 | 1192 |                 zip64endrec = struct.pack( | 
| Georg Brandl | 2ee470f | 2008-07-16 12:55:28 +0000 | [diff] [blame] | 1193 |                         structEndArchive64, stringEndArchive64, | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1194 |                         44, 45, 45, 0, 0, count, count, pos2 - pos1, pos1) | 
 | 1195 |                 self.fp.write(zip64endrec) | 
 | 1196 |  | 
 | 1197 |                 zip64locrec = struct.pack( | 
| Georg Brandl | 2ee470f | 2008-07-16 12:55:28 +0000 | [diff] [blame] | 1198 |                         structEndArchive64Locator, | 
 | 1199 |                         stringEndArchive64Locator, 0, pos2, 1) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1200 |                 self.fp.write(zip64locrec) | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1201 |                 centDirOffset = 0xFFFFFFFF | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1202 |  | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1203 |             # check for valid comment length | 
 | 1204 |             if len(self.comment) >= ZIP_MAX_COMMENT: | 
 | 1205 |                 if self.debug > 0: | 
 | 1206 |                     msg = 'Archive comment is too long; truncating to %d bytes' \ | 
 | 1207 |                           % ZIP_MAX_COMMENT | 
 | 1208 |                 self.comment = self.comment[:ZIP_MAX_COMMENT] | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1209 |  | 
| Georg Brandl | 2ee470f | 2008-07-16 12:55:28 +0000 | [diff] [blame] | 1210 |             endrec = struct.pack(structEndArchive, stringEndArchive, | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1211 |                                  0, 0, count % ZIP_FILECOUNT_LIMIT, | 
 | 1212 |                                  count % ZIP_FILECOUNT_LIMIT, pos2 - pos1, | 
 | 1213 |                                  centDirOffset, len(self.comment)) | 
 | 1214 |             self.fp.write(endrec) | 
 | 1215 |             self.fp.write(self.comment) | 
| Guido van Rossum | f85af61 | 2001-04-14 16:45:14 +0000 | [diff] [blame] | 1216 |             self.fp.flush() | 
| Martin v. Löwis | b09b844 | 2008-07-03 14:13:42 +0000 | [diff] [blame] | 1217 |  | 
| Fred Drake | 3d9091e | 2001-03-26 15:49:24 +0000 | [diff] [blame] | 1218 |         if not self._filePassed: | 
 | 1219 |             self.fp.close() | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1220 |         self.fp = None | 
 | 1221 |  | 
 | 1222 |  | 
 | 1223 | class PyZipFile(ZipFile): | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 1224 |     """Class to create ZIP archives with Python library files and packages.""" | 
 | 1225 |  | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1226 |     def writepy(self, pathname, basename = ""): | 
 | 1227 |         """Add all files from "pathname" to the ZIP archive. | 
 | 1228 |  | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 1229 |         If pathname is a package directory, search the directory and | 
 | 1230 |         all package subdirectories recursively for all *.py and enter | 
 | 1231 |         the modules into the archive.  If pathname is a plain | 
 | 1232 |         directory, listdir *.py and enter all modules.  Else, pathname | 
 | 1233 |         must be a Python *.py file and the module will be put into the | 
 | 1234 |         archive.  Added modules are always module.pyo or module.pyc. | 
 | 1235 |         This method will compile the module.py into module.pyc if | 
 | 1236 |         necessary. | 
 | 1237 |         """ | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1238 |         dir, name = os.path.split(pathname) | 
 | 1239 |         if os.path.isdir(pathname): | 
 | 1240 |             initname = os.path.join(pathname, "__init__.py") | 
 | 1241 |             if os.path.isfile(initname): | 
 | 1242 |                 # This is a package directory, add it | 
 | 1243 |                 if basename: | 
 | 1244 |                     basename = "%s/%s" % (basename, name) | 
 | 1245 |                 else: | 
 | 1246 |                     basename = name | 
 | 1247 |                 if self.debug: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1248 |                     print("Adding package in", pathname, "as", basename) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1249 |                 fname, arcname = self._get_codename(initname[0:-3], basename) | 
 | 1250 |                 if self.debug: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1251 |                     print("Adding", arcname) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1252 |                 self.write(fname, arcname) | 
 | 1253 |                 dirlist = os.listdir(pathname) | 
 | 1254 |                 dirlist.remove("__init__.py") | 
 | 1255 |                 # Add all *.py files and package subdirectories | 
 | 1256 |                 for filename in dirlist: | 
 | 1257 |                     path = os.path.join(pathname, filename) | 
 | 1258 |                     root, ext = os.path.splitext(filename) | 
 | 1259 |                     if os.path.isdir(path): | 
 | 1260 |                         if os.path.isfile(os.path.join(path, "__init__.py")): | 
 | 1261 |                             # This is a package directory, add it | 
 | 1262 |                             self.writepy(path, basename)  # Recursive call | 
 | 1263 |                     elif ext == ".py": | 
 | 1264 |                         fname, arcname = self._get_codename(path[0:-3], | 
 | 1265 |                                          basename) | 
 | 1266 |                         if self.debug: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1267 |                             print("Adding", arcname) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1268 |                         self.write(fname, arcname) | 
 | 1269 |             else: | 
 | 1270 |                 # This is NOT a package directory, add its files at top level | 
 | 1271 |                 if self.debug: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1272 |                     print("Adding files from directory", pathname) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1273 |                 for filename in os.listdir(pathname): | 
 | 1274 |                     path = os.path.join(pathname, filename) | 
 | 1275 |                     root, ext = os.path.splitext(filename) | 
 | 1276 |                     if ext == ".py": | 
 | 1277 |                         fname, arcname = self._get_codename(path[0:-3], | 
 | 1278 |                                          basename) | 
 | 1279 |                         if self.debug: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1280 |                             print("Adding", arcname) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1281 |                         self.write(fname, arcname) | 
 | 1282 |         else: | 
 | 1283 |             if pathname[-3:] != ".py": | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 1284 |                 raise RuntimeError( | 
 | 1285 |                       'Files added with writepy() must end with ".py"') | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1286 |             fname, arcname = self._get_codename(pathname[0:-3], basename) | 
 | 1287 |             if self.debug: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1288 |                 print("Adding file", arcname) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1289 |             self.write(fname, arcname) | 
 | 1290 |  | 
 | 1291 |     def _get_codename(self, pathname, basename): | 
 | 1292 |         """Return (filename, archivename) for the path. | 
 | 1293 |  | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 1294 |         Given a module name path, return the correct file path and | 
 | 1295 |         archive name, compiling if necessary.  For example, given | 
 | 1296 |         /python/lib/string, return (/python/lib/string.pyc, string). | 
 | 1297 |         """ | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1298 |         file_py  = pathname + ".py" | 
 | 1299 |         file_pyc = pathname + ".pyc" | 
 | 1300 |         file_pyo = pathname + ".pyo" | 
 | 1301 |         if os.path.isfile(file_pyo) and \ | 
| Raymond Hettinger | 32200ae | 2002-06-01 19:51:15 +0000 | [diff] [blame] | 1302 |                             os.stat(file_pyo).st_mtime >= os.stat(file_py).st_mtime: | 
| Tim Peters | e119006 | 2001-01-15 03:34:38 +0000 | [diff] [blame] | 1303 |             fname = file_pyo    # Use .pyo file | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1304 |         elif not os.path.isfile(file_pyc) or \ | 
| Raymond Hettinger | 32200ae | 2002-06-01 19:51:15 +0000 | [diff] [blame] | 1305 |              os.stat(file_pyc).st_mtime < os.stat(file_py).st_mtime: | 
| Fred Drake | 484d735 | 2000-10-02 21:14:52 +0000 | [diff] [blame] | 1306 |             import py_compile | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1307 |             if self.debug: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1308 |                 print("Compiling", file_py) | 
| Martin v. Löwis | 0c6774d | 2003-01-15 11:51:06 +0000 | [diff] [blame] | 1309 |             try: | 
 | 1310 |                 py_compile.compile(file_py, file_pyc, None, True) | 
| Guido van Rossum | b940e11 | 2007-01-10 16:19:56 +0000 | [diff] [blame] | 1311 |             except py_compile.PyCompileError as err: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1312 |                 print(err.msg) | 
| Guido van Rossum | 32abe6f | 2000-03-31 17:30:02 +0000 | [diff] [blame] | 1313 |             fname = file_pyc | 
 | 1314 |         else: | 
 | 1315 |             fname = file_pyc | 
 | 1316 |         archivename = os.path.split(fname)[1] | 
 | 1317 |         if basename: | 
 | 1318 |             archivename = "%s/%s" % (basename, archivename) | 
 | 1319 |         return (fname, archivename) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1320 |  | 
 | 1321 |  | 
 | 1322 | def main(args = None): | 
 | 1323 |     import textwrap | 
 | 1324 |     USAGE=textwrap.dedent("""\ | 
 | 1325 |         Usage: | 
 | 1326 |             zipfile.py -l zipfile.zip        # Show listing of a zipfile | 
 | 1327 |             zipfile.py -t zipfile.zip        # Test if a zipfile is valid | 
 | 1328 |             zipfile.py -e zipfile.zip target # Extract zipfile into target dir | 
 | 1329 |             zipfile.py -c zipfile.zip src ... # Create zipfile from sources | 
 | 1330 |         """) | 
 | 1331 |     if args is None: | 
 | 1332 |         args = sys.argv[1:] | 
 | 1333 |  | 
 | 1334 |     if not args or args[0] not in ('-l', '-c', '-e', '-t'): | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1335 |         print(USAGE) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1336 |         sys.exit(1) | 
 | 1337 |  | 
 | 1338 |     if args[0] == '-l': | 
 | 1339 |         if len(args) != 2: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1340 |             print(USAGE) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1341 |             sys.exit(1) | 
 | 1342 |         zf = ZipFile(args[1], 'r') | 
 | 1343 |         zf.printdir() | 
 | 1344 |         zf.close() | 
 | 1345 |  | 
 | 1346 |     elif args[0] == '-t': | 
 | 1347 |         if len(args) != 2: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1348 |             print(USAGE) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1349 |             sys.exit(1) | 
 | 1350 |         zf = ZipFile(args[1], 'r') | 
 | 1351 |         zf.testzip() | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1352 |         print("Done testing") | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1353 |  | 
 | 1354 |     elif args[0] == '-e': | 
 | 1355 |         if len(args) != 3: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1356 |             print(USAGE) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1357 |             sys.exit(1) | 
 | 1358 |  | 
 | 1359 |         zf = ZipFile(args[1], 'r') | 
 | 1360 |         out = args[2] | 
 | 1361 |         for path in zf.namelist(): | 
 | 1362 |             if path.startswith('./'): | 
 | 1363 |                 tgt = os.path.join(out, path[2:]) | 
 | 1364 |             else: | 
 | 1365 |                 tgt = os.path.join(out, path) | 
 | 1366 |  | 
 | 1367 |             tgtdir = os.path.dirname(tgt) | 
 | 1368 |             if not os.path.exists(tgtdir): | 
 | 1369 |                 os.makedirs(tgtdir) | 
| Guido van Rossum | d6ca546 | 2007-05-22 01:29:33 +0000 | [diff] [blame] | 1370 |             fp = io.open(tgt, 'wb') | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1371 |             fp.write(zf.read(path)) | 
 | 1372 |             fp.close() | 
 | 1373 |         zf.close() | 
 | 1374 |  | 
 | 1375 |     elif args[0] == '-c': | 
 | 1376 |         if len(args) < 3: | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 1377 |             print(USAGE) | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 1378 |             sys.exit(1) | 
 | 1379 |  | 
 | 1380 |         def addToZip(zf, path, zippath): | 
 | 1381 |             if os.path.isfile(path): | 
 | 1382 |                 zf.write(path, zippath, ZIP_DEFLATED) | 
 | 1383 |             elif os.path.isdir(path): | 
 | 1384 |                 for nm in os.listdir(path): | 
 | 1385 |                     addToZip(zf, | 
 | 1386 |                             os.path.join(path, nm), os.path.join(zippath, nm)) | 
 | 1387 |             # else: ignore | 
 | 1388 |  | 
 | 1389 |         zf = ZipFile(args[1], 'w', allowZip64=True) | 
 | 1390 |         for src in args[2:]: | 
 | 1391 |             addToZip(zf, src, os.path.basename(src)) | 
 | 1392 |  | 
 | 1393 |         zf.close() | 
 | 1394 |  | 
 | 1395 | if __name__ == "__main__": | 
 | 1396 |     main() |