Manual py3k backport: [svn r74155] Issue #6242: Fix deallocator of io.StringIO and...
[python.git] / Lib / zipfile.py
blob2aa4bffc4281c6f305d581e82ed6bd9a2428e2b9
1 """
2 Read and write ZIP files.
3 """
4 import struct, os, time, sys, shutil
5 import binascii, cStringIO, stat
7 try:
8 import zlib # We may need its compression method
9 crc32 = zlib.crc32
10 except ImportError:
11 zlib = None
12 crc32 = binascii.crc32
14 __all__ = ["BadZipfile", "error", "ZIP_STORED", "ZIP_DEFLATED", "is_zipfile",
15 "ZipInfo", "ZipFile", "PyZipFile", "LargeZipFile" ]
17 class BadZipfile(Exception):
18 pass
21 class LargeZipFile(Exception):
22 """
23 Raised when writing a zipfile, the zipfile requires ZIP64 extensions
24 and those extensions are disabled.
25 """
27 error = BadZipfile # The exception raised by this module
29 ZIP64_LIMIT = (1 << 31) - 1
30 ZIP_FILECOUNT_LIMIT = 1 << 16
31 ZIP_MAX_COMMENT = (1 << 16) - 1
33 # constants for Zip file compression methods
34 ZIP_STORED = 0
35 ZIP_DEFLATED = 8
36 # Other ZIP compression methods not supported
38 # Below are some formats and associated data for reading/writing headers using
39 # the struct module. The names and structures of headers/records are those used
40 # in the PKWARE description of the ZIP file format:
41 # http://www.pkware.com/documents/casestudies/APPNOTE.TXT
42 # (URL valid as of January 2008)
44 # The "end of central directory" structure, magic number, size, and indices
45 # (section V.I in the format document)
46 structEndArchive = "<4s4H2LH"
47 stringEndArchive = "PK\005\006"
48 sizeEndCentDir = struct.calcsize(structEndArchive)
50 _ECD_SIGNATURE = 0
51 _ECD_DISK_NUMBER = 1
52 _ECD_DISK_START = 2
53 _ECD_ENTRIES_THIS_DISK = 3
54 _ECD_ENTRIES_TOTAL = 4
55 _ECD_SIZE = 5
56 _ECD_OFFSET = 6
57 _ECD_COMMENT_SIZE = 7
58 # These last two indices are not part of the structure as defined in the
59 # spec, but they are used internally by this module as a convenience
60 _ECD_COMMENT = 8
61 _ECD_LOCATION = 9
63 # The "central directory" structure, magic number, size, and indices
64 # of entries in the structure (section V.F in the format document)
65 structCentralDir = "<4s4B4HL2L5H2L"
66 stringCentralDir = "PK\001\002"
67 sizeCentralDir = struct.calcsize(structCentralDir)
69 # indexes of entries in the central directory structure
70 _CD_SIGNATURE = 0
71 _CD_CREATE_VERSION = 1
72 _CD_CREATE_SYSTEM = 2
73 _CD_EXTRACT_VERSION = 3
74 _CD_EXTRACT_SYSTEM = 4
75 _CD_FLAG_BITS = 5
76 _CD_COMPRESS_TYPE = 6
77 _CD_TIME = 7
78 _CD_DATE = 8
79 _CD_CRC = 9
80 _CD_COMPRESSED_SIZE = 10
81 _CD_UNCOMPRESSED_SIZE = 11
82 _CD_FILENAME_LENGTH = 12
83 _CD_EXTRA_FIELD_LENGTH = 13
84 _CD_COMMENT_LENGTH = 14
85 _CD_DISK_NUMBER_START = 15
86 _CD_INTERNAL_FILE_ATTRIBUTES = 16
87 _CD_EXTERNAL_FILE_ATTRIBUTES = 17
88 _CD_LOCAL_HEADER_OFFSET = 18
90 # The "local file header" structure, magic number, size, and indices
91 # (section V.A in the format document)
92 structFileHeader = "<4s2B4HL2L2H"
93 stringFileHeader = "PK\003\004"
94 sizeFileHeader = struct.calcsize(structFileHeader)
96 _FH_SIGNATURE = 0
97 _FH_EXTRACT_VERSION = 1
98 _FH_EXTRACT_SYSTEM = 2
99 _FH_GENERAL_PURPOSE_FLAG_BITS = 3
100 _FH_COMPRESSION_METHOD = 4
101 _FH_LAST_MOD_TIME = 5
102 _FH_LAST_MOD_DATE = 6
103 _FH_CRC = 7
104 _FH_COMPRESSED_SIZE = 8
105 _FH_UNCOMPRESSED_SIZE = 9
106 _FH_FILENAME_LENGTH = 10
107 _FH_EXTRA_FIELD_LENGTH = 11
109 # The "Zip64 end of central directory locator" structure, magic number, and size
110 structEndArchive64Locator = "<4sLQL"
111 stringEndArchive64Locator = "PK\x06\x07"
112 sizeEndCentDir64Locator = struct.calcsize(structEndArchive64Locator)
114 # The "Zip64 end of central directory" record, magic number, size, and indices
115 # (section V.G in the format document)
116 structEndArchive64 = "<4sQ2H2L4Q"
117 stringEndArchive64 = "PK\x06\x06"
118 sizeEndCentDir64 = struct.calcsize(structEndArchive64)
120 _CD64_SIGNATURE = 0
121 _CD64_DIRECTORY_RECSIZE = 1
122 _CD64_CREATE_VERSION = 2
123 _CD64_EXTRACT_VERSION = 3
124 _CD64_DISK_NUMBER = 4
125 _CD64_DISK_NUMBER_START = 5
126 _CD64_NUMBER_ENTRIES_THIS_DISK = 6
127 _CD64_NUMBER_ENTRIES_TOTAL = 7
128 _CD64_DIRECTORY_SIZE = 8
129 _CD64_OFFSET_START_CENTDIR = 9
131 def _check_zipfile(fp):
132 try:
133 if _EndRecData(fp):
134 return True # file has correct magic number
135 except IOError:
136 pass
137 return False
139 def is_zipfile(filename):
140 """Quickly see if a file is a ZIP file by checking the magic number.
142 The filename argument may be a file or file-like object too.
144 result = False
145 try:
146 if hasattr(filename, "read"):
147 result = _check_zipfile(fp=filename)
148 else:
149 with open(filename, "rb") as fp:
150 result = _check_zipfile(fp)
151 except IOError:
152 pass
153 return result
155 def _EndRecData64(fpin, offset, endrec):
157 Read the ZIP64 end-of-archive records and use that to update endrec
159 fpin.seek(offset - sizeEndCentDir64Locator, 2)
160 data = fpin.read(sizeEndCentDir64Locator)
161 sig, diskno, reloff, disks = struct.unpack(structEndArchive64Locator, data)
162 if sig != stringEndArchive64Locator:
163 return endrec
165 if diskno != 0 or disks != 1:
166 raise BadZipfile("zipfiles that span multiple disks are not supported")
168 # Assume no 'zip64 extensible data'
169 fpin.seek(offset - sizeEndCentDir64Locator - sizeEndCentDir64, 2)
170 data = fpin.read(sizeEndCentDir64)
171 sig, sz, create_version, read_version, disk_num, disk_dir, \
172 dircount, dircount2, dirsize, diroffset = \
173 struct.unpack(structEndArchive64, data)
174 if sig != stringEndArchive64:
175 return endrec
177 # Update the original endrec using data from the ZIP64 record
178 endrec[_ECD_SIGNATURE] = sig
179 endrec[_ECD_DISK_NUMBER] = disk_num
180 endrec[_ECD_DISK_START] = disk_dir
181 endrec[_ECD_ENTRIES_THIS_DISK] = dircount
182 endrec[_ECD_ENTRIES_TOTAL] = dircount2
183 endrec[_ECD_SIZE] = dirsize
184 endrec[_ECD_OFFSET] = diroffset
185 return endrec
188 def _EndRecData(fpin):
189 """Return data from the "End of Central Directory" record, or None.
191 The data is a list of the nine items in the ZIP "End of central dir"
192 record followed by a tenth item, the file seek offset of this record."""
194 # Determine file size
195 fpin.seek(0, 2)
196 filesize = fpin.tell()
198 # Check to see if this is ZIP file with no archive comment (the
199 # "end of central directory" structure should be the last item in the
200 # file if this is the case).
201 try:
202 fpin.seek(-sizeEndCentDir, 2)
203 except IOError:
204 return None
205 data = fpin.read()
206 if data[0:4] == stringEndArchive and data[-2:] == "\000\000":
207 # the signature is correct and there's no comment, unpack structure
208 endrec = struct.unpack(structEndArchive, data)
209 endrec=list(endrec)
211 # Append a blank comment and record start offset
212 endrec.append("")
213 endrec.append(filesize - sizeEndCentDir)
215 # Try to read the "Zip64 end of central directory" structure
216 return _EndRecData64(fpin, -sizeEndCentDir, endrec)
218 # Either this is not a ZIP file, or it is a ZIP file with an archive
219 # comment. Search the end of the file for the "end of central directory"
220 # record signature. The comment is the last item in the ZIP file and may be
221 # up to 64K long. It is assumed that the "end of central directory" magic
222 # number does not appear in the comment.
223 maxCommentStart = max(filesize - (1 << 16) - sizeEndCentDir, 0)
224 fpin.seek(maxCommentStart, 0)
225 data = fpin.read()
226 start = data.rfind(stringEndArchive)
227 if start >= 0:
228 # found the magic number; attempt to unpack and interpret
229 recData = data[start:start+sizeEndCentDir]
230 endrec = list(struct.unpack(structEndArchive, recData))
231 comment = data[start+sizeEndCentDir:]
232 # check that comment length is correct
233 if endrec[_ECD_COMMENT_SIZE] == len(comment):
234 # Append the archive comment and start offset
235 endrec.append(comment)
236 endrec.append(maxCommentStart + start)
238 # Try to read the "Zip64 end of central directory" structure
239 return _EndRecData64(fpin, maxCommentStart + start - filesize,
240 endrec)
242 # Unable to find a valid end of central directory structure
243 return
246 class ZipInfo (object):
247 """Class with attributes describing each file in the ZIP archive."""
249 __slots__ = (
250 'orig_filename',
251 'filename',
252 'date_time',
253 'compress_type',
254 'comment',
255 'extra',
256 'create_system',
257 'create_version',
258 'extract_version',
259 'reserved',
260 'flag_bits',
261 'volume',
262 'internal_attr',
263 'external_attr',
264 'header_offset',
265 'CRC',
266 'compress_size',
267 'file_size',
268 '_raw_time',
271 def __init__(self, filename="NoName", date_time=(1980,1,1,0,0,0)):
272 self.orig_filename = filename # Original file name in archive
274 # Terminate the file name at the first null byte. Null bytes in file
275 # names are used as tricks by viruses in archives.
276 null_byte = filename.find(chr(0))
277 if null_byte >= 0:
278 filename = filename[0:null_byte]
279 # This is used to ensure paths in generated ZIP files always use
280 # forward slashes as the directory separator, as required by the
281 # ZIP format specification.
282 if os.sep != "/" and os.sep in filename:
283 filename = filename.replace(os.sep, "/")
285 self.filename = filename # Normalized file name
286 self.date_time = date_time # year, month, day, hour, min, sec
287 # Standard values:
288 self.compress_type = ZIP_STORED # Type of compression for the file
289 self.comment = "" # Comment for each file
290 self.extra = "" # ZIP extra data
291 if sys.platform == 'win32':
292 self.create_system = 0 # System which created ZIP archive
293 else:
294 # Assume everything else is unix-y
295 self.create_system = 3 # System which created ZIP archive
296 self.create_version = 20 # Version which created ZIP archive
297 self.extract_version = 20 # Version needed to extract archive
298 self.reserved = 0 # Must be zero
299 self.flag_bits = 0 # ZIP flag bits
300 self.volume = 0 # Volume number of file header
301 self.internal_attr = 0 # Internal attributes
302 self.external_attr = 0 # External file attributes
303 # Other attributes are set by class ZipFile:
304 # header_offset Byte offset to the file header
305 # CRC CRC-32 of the uncompressed file
306 # compress_size Size of the compressed file
307 # file_size Size of the uncompressed file
309 def FileHeader(self):
310 """Return the per-file header as a string."""
311 dt = self.date_time
312 dosdate = (dt[0] - 1980) << 9 | dt[1] << 5 | dt[2]
313 dostime = dt[3] << 11 | dt[4] << 5 | (dt[5] // 2)
314 if self.flag_bits & 0x08:
315 # Set these to zero because we write them after the file data
316 CRC = compress_size = file_size = 0
317 else:
318 CRC = self.CRC
319 compress_size = self.compress_size
320 file_size = self.file_size
322 extra = self.extra
324 if file_size > ZIP64_LIMIT or compress_size > ZIP64_LIMIT:
325 # File is larger than what fits into a 4 byte integer,
326 # fall back to the ZIP64 extension
327 fmt = '<HHQQ'
328 extra = extra + struct.pack(fmt,
329 1, struct.calcsize(fmt)-4, file_size, compress_size)
330 file_size = 0xffffffff
331 compress_size = 0xffffffff
332 self.extract_version = max(45, self.extract_version)
333 self.create_version = max(45, self.extract_version)
335 filename, flag_bits = self._encodeFilenameFlags()
336 header = struct.pack(structFileHeader, stringFileHeader,
337 self.extract_version, self.reserved, flag_bits,
338 self.compress_type, dostime, dosdate, CRC,
339 compress_size, file_size,
340 len(filename), len(extra))
341 return header + filename + extra
343 def _encodeFilenameFlags(self):
344 if isinstance(self.filename, unicode):
345 try:
346 return self.filename.encode('ascii'), self.flag_bits
347 except UnicodeEncodeError:
348 return self.filename.encode('utf-8'), self.flag_bits | 0x800
349 else:
350 return self.filename, self.flag_bits
352 def _decodeFilename(self):
353 if self.flag_bits & 0x800:
354 return self.filename.decode('utf-8')
355 else:
356 return self.filename
358 def _decodeExtra(self):
359 # Try to decode the extra field.
360 extra = self.extra
361 unpack = struct.unpack
362 while extra:
363 tp, ln = unpack('<HH', extra[:4])
364 if tp == 1:
365 if ln >= 24:
366 counts = unpack('<QQQ', extra[4:28])
367 elif ln == 16:
368 counts = unpack('<QQ', extra[4:20])
369 elif ln == 8:
370 counts = unpack('<Q', extra[4:12])
371 elif ln == 0:
372 counts = ()
373 else:
374 raise RuntimeError, "Corrupt extra field %s"%(ln,)
376 idx = 0
378 # ZIP64 extension (large files and/or large archives)
379 if self.file_size in (0xffffffffffffffffL, 0xffffffffL):
380 self.file_size = counts[idx]
381 idx += 1
383 if self.compress_size == 0xFFFFFFFFL:
384 self.compress_size = counts[idx]
385 idx += 1
387 if self.header_offset == 0xffffffffL:
388 old = self.header_offset
389 self.header_offset = counts[idx]
390 idx+=1
392 extra = extra[ln+4:]
395 class _ZipDecrypter:
396 """Class to handle decryption of files stored within a ZIP archive.
398 ZIP supports a password-based form of encryption. Even though known
399 plaintext attacks have been found against it, it is still useful
400 to be able to get data out of such a file.
402 Usage:
403 zd = _ZipDecrypter(mypwd)
404 plain_char = zd(cypher_char)
405 plain_text = map(zd, cypher_text)
408 def _GenerateCRCTable():
409 """Generate a CRC-32 table.
411 ZIP encryption uses the CRC32 one-byte primitive for scrambling some
412 internal keys. We noticed that a direct implementation is faster than
413 relying on binascii.crc32().
415 poly = 0xedb88320
416 table = [0] * 256
417 for i in range(256):
418 crc = i
419 for j in range(8):
420 if crc & 1:
421 crc = ((crc >> 1) & 0x7FFFFFFF) ^ poly
422 else:
423 crc = ((crc >> 1) & 0x7FFFFFFF)
424 table[i] = crc
425 return table
426 crctable = _GenerateCRCTable()
428 def _crc32(self, ch, crc):
429 """Compute the CRC32 primitive on one byte."""
430 return ((crc >> 8) & 0xffffff) ^ self.crctable[(crc ^ ord(ch)) & 0xff]
432 def __init__(self, pwd):
433 self.key0 = 305419896
434 self.key1 = 591751049
435 self.key2 = 878082192
436 for p in pwd:
437 self._UpdateKeys(p)
439 def _UpdateKeys(self, c):
440 self.key0 = self._crc32(c, self.key0)
441 self.key1 = (self.key1 + (self.key0 & 255)) & 4294967295
442 self.key1 = (self.key1 * 134775813 + 1) & 4294967295
443 self.key2 = self._crc32(chr((self.key1 >> 24) & 255), self.key2)
445 def __call__(self, c):
446 """Decrypt a single character."""
447 c = ord(c)
448 k = self.key2 | 2
449 c = c ^ (((k * (k^1)) >> 8) & 255)
450 c = chr(c)
451 self._UpdateKeys(c)
452 return c
454 class ZipExtFile:
455 """File-like object for reading an archive member.
456 Is returned by ZipFile.open().
459 def __init__(self, fileobj, zipinfo, decrypt=None):
460 self.fileobj = fileobj
461 self.decrypter = decrypt
462 self.bytes_read = 0L
463 self.rawbuffer = ''
464 self.readbuffer = ''
465 self.linebuffer = ''
466 self.eof = False
467 self.univ_newlines = False
468 self.nlSeps = ("\n", )
469 self.lastdiscard = ''
471 self.compress_type = zipinfo.compress_type
472 self.compress_size = zipinfo.compress_size
474 self.closed = False
475 self.mode = "r"
476 self.name = zipinfo.filename
478 # read from compressed files in 64k blocks
479 self.compreadsize = 64*1024
480 if self.compress_type == ZIP_DEFLATED:
481 self.dc = zlib.decompressobj(-15)
483 def set_univ_newlines(self, univ_newlines):
484 self.univ_newlines = univ_newlines
486 # pick line separator char(s) based on universal newlines flag
487 self.nlSeps = ("\n", )
488 if self.univ_newlines:
489 self.nlSeps = ("\r\n", "\r", "\n")
491 def __iter__(self):
492 return self
494 def next(self):
495 nextline = self.readline()
496 if not nextline:
497 raise StopIteration()
499 return nextline
501 def close(self):
502 self.closed = True
504 def _checkfornewline(self):
505 nl, nllen = -1, -1
506 if self.linebuffer:
507 # ugly check for cases where half of an \r\n pair was
508 # read on the last pass, and the \r was discarded. In this
509 # case we just throw away the \n at the start of the buffer.
510 if (self.lastdiscard, self.linebuffer[0]) == ('\r','\n'):
511 self.linebuffer = self.linebuffer[1:]
513 for sep in self.nlSeps:
514 nl = self.linebuffer.find(sep)
515 if nl >= 0:
516 nllen = len(sep)
517 return nl, nllen
519 return nl, nllen
521 def readline(self, size = -1):
522 """Read a line with approx. size. If size is negative,
523 read a whole line.
525 if size < 0:
526 size = sys.maxint
527 elif size == 0:
528 return ''
530 # check for a newline already in buffer
531 nl, nllen = self._checkfornewline()
533 if nl >= 0:
534 # the next line was already in the buffer
535 nl = min(nl, size)
536 else:
537 # no line break in buffer - try to read more
538 size -= len(self.linebuffer)
539 while nl < 0 and size > 0:
540 buf = self.read(min(size, 100))
541 if not buf:
542 break
543 self.linebuffer += buf
544 size -= len(buf)
546 # check for a newline in buffer
547 nl, nllen = self._checkfornewline()
549 # we either ran out of bytes in the file, or
550 # met the specified size limit without finding a newline,
551 # so return current buffer
552 if nl < 0:
553 s = self.linebuffer
554 self.linebuffer = ''
555 return s
557 buf = self.linebuffer[:nl]
558 self.lastdiscard = self.linebuffer[nl:nl + nllen]
559 self.linebuffer = self.linebuffer[nl + nllen:]
561 # line is always returned with \n as newline char (except possibly
562 # for a final incomplete line in the file, which is handled above).
563 return buf + "\n"
565 def readlines(self, sizehint = -1):
566 """Return a list with all (following) lines. The sizehint parameter
567 is ignored in this implementation.
569 result = []
570 while True:
571 line = self.readline()
572 if not line: break
573 result.append(line)
574 return result
576 def read(self, size = None):
577 # act like file() obj and return empty string if size is 0
578 if size == 0:
579 return ''
581 # determine read size
582 bytesToRead = self.compress_size - self.bytes_read
584 # adjust read size for encrypted files since the first 12 bytes
585 # are for the encryption/password information
586 if self.decrypter is not None:
587 bytesToRead -= 12
589 if size is not None and size >= 0:
590 if self.compress_type == ZIP_STORED:
591 lr = len(self.readbuffer)
592 bytesToRead = min(bytesToRead, size - lr)
593 elif self.compress_type == ZIP_DEFLATED:
594 if len(self.readbuffer) > size:
595 # the user has requested fewer bytes than we've already
596 # pulled through the decompressor; don't read any more
597 bytesToRead = 0
598 else:
599 # user will use up the buffer, so read some more
600 lr = len(self.rawbuffer)
601 bytesToRead = min(bytesToRead, self.compreadsize - lr)
603 # avoid reading past end of file contents
604 if bytesToRead + self.bytes_read > self.compress_size:
605 bytesToRead = self.compress_size - self.bytes_read
607 # try to read from file (if necessary)
608 if bytesToRead > 0:
609 bytes = self.fileobj.read(bytesToRead)
610 self.bytes_read += len(bytes)
611 self.rawbuffer += bytes
613 # handle contents of raw buffer
614 if self.rawbuffer:
615 newdata = self.rawbuffer
616 self.rawbuffer = ''
618 # decrypt new data if we were given an object to handle that
619 if newdata and self.decrypter is not None:
620 newdata = ''.join(map(self.decrypter, newdata))
622 # decompress newly read data if necessary
623 if newdata and self.compress_type == ZIP_DEFLATED:
624 newdata = self.dc.decompress(newdata)
625 self.rawbuffer = self.dc.unconsumed_tail
626 if self.eof and len(self.rawbuffer) == 0:
627 # we're out of raw bytes (both from the file and
628 # the local buffer); flush just to make sure the
629 # decompressor is done
630 newdata += self.dc.flush()
631 # prevent decompressor from being used again
632 self.dc = None
634 self.readbuffer += newdata
637 # return what the user asked for
638 if size is None or len(self.readbuffer) <= size:
639 bytes = self.readbuffer
640 self.readbuffer = ''
641 else:
642 bytes = self.readbuffer[:size]
643 self.readbuffer = self.readbuffer[size:]
645 return bytes
648 class ZipFile:
649 """ Class with methods to open, read, write, close, list zip files.
651 z = ZipFile(file, mode="r", compression=ZIP_STORED, allowZip64=False)
653 file: Either the path to the file, or a file-like object.
654 If it is a path, the file will be opened and closed by ZipFile.
655 mode: The mode can be either read "r", write "w" or append "a".
656 compression: ZIP_STORED (no compression) or ZIP_DEFLATED (requires zlib).
657 allowZip64: if True ZipFile will create files with ZIP64 extensions when
658 needed, otherwise it will raise an exception when this would
659 be necessary.
663 fp = None # Set here since __del__ checks it
665 def __init__(self, file, mode="r", compression=ZIP_STORED, allowZip64=False):
666 """Open the ZIP file with mode read "r", write "w" or append "a"."""
667 if mode not in ("r", "w", "a"):
668 raise RuntimeError('ZipFile() requires mode "r", "w", or "a"')
670 if compression == ZIP_STORED:
671 pass
672 elif compression == ZIP_DEFLATED:
673 if not zlib:
674 raise RuntimeError,\
675 "Compression requires the (missing) zlib module"
676 else:
677 raise RuntimeError, "That compression method is not supported"
679 self._allowZip64 = allowZip64
680 self._didModify = False
681 self.debug = 0 # Level of printing: 0 through 3
682 self.NameToInfo = {} # Find file info given name
683 self.filelist = [] # List of ZipInfo instances for archive
684 self.compression = compression # Method of compression
685 self.mode = key = mode.replace('b', '')[0]
686 self.pwd = None
687 self.comment = ''
689 # Check if we were passed a file-like object
690 if isinstance(file, basestring):
691 self._filePassed = 0
692 self.filename = file
693 modeDict = {'r' : 'rb', 'w': 'wb', 'a' : 'r+b'}
694 try:
695 self.fp = open(file, modeDict[mode])
696 except IOError:
697 if mode == 'a':
698 mode = key = 'w'
699 self.fp = open(file, modeDict[mode])
700 else:
701 raise
702 else:
703 self._filePassed = 1
704 self.fp = file
705 self.filename = getattr(file, 'name', None)
707 if key == 'r':
708 self._GetContents()
709 elif key == 'w':
710 pass
711 elif key == 'a':
712 try: # See if file is a zip file
713 self._RealGetContents()
714 # seek to start of directory and overwrite
715 self.fp.seek(self.start_dir, 0)
716 except BadZipfile: # file is not a zip file, just append
717 self.fp.seek(0, 2)
718 else:
719 if not self._filePassed:
720 self.fp.close()
721 self.fp = None
722 raise RuntimeError, 'Mode must be "r", "w" or "a"'
724 def _GetContents(self):
725 """Read the directory, making sure we close the file if the format
726 is bad."""
727 try:
728 self._RealGetContents()
729 except BadZipfile:
730 if not self._filePassed:
731 self.fp.close()
732 self.fp = None
733 raise
735 def _RealGetContents(self):
736 """Read in the table of contents for the ZIP file."""
737 fp = self.fp
738 endrec = _EndRecData(fp)
739 if not endrec:
740 raise BadZipfile, "File is not a zip file"
741 if self.debug > 1:
742 print endrec
743 size_cd = endrec[_ECD_SIZE] # bytes in central directory
744 offset_cd = endrec[_ECD_OFFSET] # offset of central directory
745 self.comment = endrec[_ECD_COMMENT] # archive comment
747 # "concat" is zero, unless zip was concatenated to another file
748 concat = endrec[_ECD_LOCATION] - size_cd - offset_cd
749 if endrec[_ECD_SIGNATURE] == stringEndArchive64:
750 # If Zip64 extension structures are present, account for them
751 concat -= (sizeEndCentDir64 + sizeEndCentDir64Locator)
753 if self.debug > 2:
754 inferred = concat + offset_cd
755 print "given, inferred, offset", offset_cd, inferred, concat
756 # self.start_dir: Position of start of central directory
757 self.start_dir = offset_cd + concat
758 fp.seek(self.start_dir, 0)
759 data = fp.read(size_cd)
760 fp = cStringIO.StringIO(data)
761 total = 0
762 while total < size_cd:
763 centdir = fp.read(sizeCentralDir)
764 if centdir[0:4] != stringCentralDir:
765 raise BadZipfile, "Bad magic number for central directory"
766 centdir = struct.unpack(structCentralDir, centdir)
767 if self.debug > 2:
768 print centdir
769 filename = fp.read(centdir[_CD_FILENAME_LENGTH])
770 # Create ZipInfo instance to store file information
771 x = ZipInfo(filename)
772 x.extra = fp.read(centdir[_CD_EXTRA_FIELD_LENGTH])
773 x.comment = fp.read(centdir[_CD_COMMENT_LENGTH])
774 x.header_offset = centdir[_CD_LOCAL_HEADER_OFFSET]
775 (x.create_version, x.create_system, x.extract_version, x.reserved,
776 x.flag_bits, x.compress_type, t, d,
777 x.CRC, x.compress_size, x.file_size) = centdir[1:12]
778 x.volume, x.internal_attr, x.external_attr = centdir[15:18]
779 # Convert date/time code to (year, month, day, hour, min, sec)
780 x._raw_time = t
781 x.date_time = ( (d>>9)+1980, (d>>5)&0xF, d&0x1F,
782 t>>11, (t>>5)&0x3F, (t&0x1F) * 2 )
784 x._decodeExtra()
785 x.header_offset = x.header_offset + concat
786 x.filename = x._decodeFilename()
787 self.filelist.append(x)
788 self.NameToInfo[x.filename] = x
790 # update total bytes read from central directory
791 total = (total + sizeCentralDir + centdir[_CD_FILENAME_LENGTH]
792 + centdir[_CD_EXTRA_FIELD_LENGTH]
793 + centdir[_CD_COMMENT_LENGTH])
795 if self.debug > 2:
796 print "total", total
799 def namelist(self):
800 """Return a list of file names in the archive."""
801 l = []
802 for data in self.filelist:
803 l.append(data.filename)
804 return l
806 def infolist(self):
807 """Return a list of class ZipInfo instances for files in the
808 archive."""
809 return self.filelist
811 def printdir(self):
812 """Print a table of contents for the zip file."""
813 print "%-46s %19s %12s" % ("File Name", "Modified ", "Size")
814 for zinfo in self.filelist:
815 date = "%d-%02d-%02d %02d:%02d:%02d" % zinfo.date_time[:6]
816 print "%-46s %s %12d" % (zinfo.filename, date, zinfo.file_size)
818 def testzip(self):
819 """Read all the files and check the CRC."""
820 chunk_size = 2 ** 20
821 for zinfo in self.filelist:
822 try:
823 # Read by chunks, to avoid an OverflowError or a
824 # MemoryError with very large embedded files.
825 f = self.open(zinfo.filename, "r")
826 while f.read(chunk_size): # Check CRC-32
827 pass
828 except BadZipfile:
829 return zinfo.filename
831 def getinfo(self, name):
832 """Return the instance of ZipInfo given 'name'."""
833 info = self.NameToInfo.get(name)
834 if info is None:
835 raise KeyError(
836 'There is no item named %r in the archive' % name)
838 return info
840 def setpassword(self, pwd):
841 """Set default password for encrypted files."""
842 self.pwd = pwd
844 def read(self, name, pwd=None):
845 """Return file bytes (as a string) for name."""
846 return self.open(name, "r", pwd).read()
848 def open(self, name, mode="r", pwd=None):
849 """Return file-like object for 'name'."""
850 if mode not in ("r", "U", "rU"):
851 raise RuntimeError, 'open() requires mode "r", "U", or "rU"'
852 if not self.fp:
853 raise RuntimeError, \
854 "Attempt to read ZIP archive that was already closed"
856 # Only open a new file for instances where we were not
857 # given a file object in the constructor
858 if self._filePassed:
859 zef_file = self.fp
860 else:
861 zef_file = open(self.filename, 'rb')
863 # Make sure we have an info object
864 if isinstance(name, ZipInfo):
865 # 'name' is already an info object
866 zinfo = name
867 else:
868 # Get info object for name
869 zinfo = self.getinfo(name)
871 zef_file.seek(zinfo.header_offset, 0)
873 # Skip the file header:
874 fheader = zef_file.read(sizeFileHeader)
875 if fheader[0:4] != stringFileHeader:
876 raise BadZipfile, "Bad magic number for file header"
878 fheader = struct.unpack(structFileHeader, fheader)
879 fname = zef_file.read(fheader[_FH_FILENAME_LENGTH])
880 if fheader[_FH_EXTRA_FIELD_LENGTH]:
881 zef_file.read(fheader[_FH_EXTRA_FIELD_LENGTH])
883 if fname != zinfo.orig_filename:
884 raise BadZipfile, \
885 'File name in directory "%s" and header "%s" differ.' % (
886 zinfo.orig_filename, fname)
888 # check for encrypted flag & handle password
889 is_encrypted = zinfo.flag_bits & 0x1
890 zd = None
891 if is_encrypted:
892 if not pwd:
893 pwd = self.pwd
894 if not pwd:
895 raise RuntimeError, "File %s is encrypted, " \
896 "password required for extraction" % name
898 zd = _ZipDecrypter(pwd)
899 # The first 12 bytes in the cypher stream is an encryption header
900 # used to strengthen the algorithm. The first 11 bytes are
901 # completely random, while the 12th contains the MSB of the CRC,
902 # or the MSB of the file time depending on the header type
903 # and is used to check the correctness of the password.
904 bytes = zef_file.read(12)
905 h = map(zd, bytes[0:12])
906 if zinfo.flag_bits & 0x8:
907 # compare against the file type from extended local headers
908 check_byte = (zinfo._raw_time >> 8) & 0xff
909 else:
910 # compare against the CRC otherwise
911 check_byte = (zinfo.CRC >> 24) & 0xff
912 if ord(h[11]) != check_byte:
913 raise RuntimeError("Bad password for file", name)
915 # build and return a ZipExtFile
916 if zd is None:
917 zef = ZipExtFile(zef_file, zinfo)
918 else:
919 zef = ZipExtFile(zef_file, zinfo, zd)
921 # set universal newlines on ZipExtFile if necessary
922 if "U" in mode:
923 zef.set_univ_newlines(True)
924 return zef
926 def extract(self, member, path=None, pwd=None):
927 """Extract a member from the archive to the current working directory,
928 using its full name. Its file information is extracted as accurately
929 as possible. `member' may be a filename or a ZipInfo object. You can
930 specify a different directory using `path'.
932 if not isinstance(member, ZipInfo):
933 member = self.getinfo(member)
935 if path is None:
936 path = os.getcwd()
938 return self._extract_member(member, path, pwd)
940 def extractall(self, path=None, members=None, pwd=None):
941 """Extract all members from the archive to the current working
942 directory. `path' specifies a different directory to extract to.
943 `members' is optional and must be a subset of the list returned
944 by namelist().
946 if members is None:
947 members = self.namelist()
949 for zipinfo in members:
950 self.extract(zipinfo, path, pwd)
952 def _extract_member(self, member, targetpath, pwd):
953 """Extract the ZipInfo object 'member' to a physical
954 file on the path targetpath.
956 # build the destination pathname, replacing
957 # forward slashes to platform specific separators.
958 # Strip trailing path separator, unless it represents the root.
959 if (targetpath[-1:] in (os.path.sep, os.path.altsep)
960 and len(os.path.splitdrive(targetpath)[1]) > 1):
961 targetpath = targetpath[:-1]
963 # don't include leading "/" from file name if present
964 if member.filename[0] == '/':
965 targetpath = os.path.join(targetpath, member.filename[1:])
966 else:
967 targetpath = os.path.join(targetpath, member.filename)
969 targetpath = os.path.normpath(targetpath)
971 # Create all upper directories if necessary.
972 upperdirs = os.path.dirname(targetpath)
973 if upperdirs and not os.path.exists(upperdirs):
974 os.makedirs(upperdirs)
976 if member.filename[-1] == '/':
977 if not os.path.isdir(targetpath):
978 os.mkdir(targetpath)
979 return targetpath
981 source = self.open(member, pwd=pwd)
982 target = file(targetpath, "wb")
983 shutil.copyfileobj(source, target)
984 source.close()
985 target.close()
987 return targetpath
989 def _writecheck(self, zinfo):
990 """Check for errors before writing a file to the archive."""
991 if zinfo.filename in self.NameToInfo:
992 if self.debug: # Warning for duplicate names
993 print "Duplicate name:", zinfo.filename
994 if self.mode not in ("w", "a"):
995 raise RuntimeError, 'write() requires mode "w" or "a"'
996 if not self.fp:
997 raise RuntimeError, \
998 "Attempt to write ZIP archive that was already closed"
999 if zinfo.compress_type == ZIP_DEFLATED and not zlib:
1000 raise RuntimeError, \
1001 "Compression requires the (missing) zlib module"
1002 if zinfo.compress_type not in (ZIP_STORED, ZIP_DEFLATED):
1003 raise RuntimeError, \
1004 "That compression method is not supported"
1005 if zinfo.file_size > ZIP64_LIMIT:
1006 if not self._allowZip64:
1007 raise LargeZipFile("Filesize would require ZIP64 extensions")
1008 if zinfo.header_offset > ZIP64_LIMIT:
1009 if not self._allowZip64:
1010 raise LargeZipFile("Zipfile size would require ZIP64 extensions")
1012 def write(self, filename, arcname=None, compress_type=None):
1013 """Put the bytes from filename into the archive under the name
1014 arcname."""
1015 if not self.fp:
1016 raise RuntimeError(
1017 "Attempt to write to ZIP archive that was already closed")
1019 st = os.stat(filename)
1020 isdir = stat.S_ISDIR(st.st_mode)
1021 mtime = time.localtime(st.st_mtime)
1022 date_time = mtime[0:6]
1023 # Create ZipInfo instance to store file information
1024 if arcname is None:
1025 arcname = filename
1026 arcname = os.path.normpath(os.path.splitdrive(arcname)[1])
1027 while arcname[0] in (os.sep, os.altsep):
1028 arcname = arcname[1:]
1029 if isdir:
1030 arcname += '/'
1031 zinfo = ZipInfo(arcname, date_time)
1032 zinfo.external_attr = (st[0] & 0xFFFF) << 16L # Unix attributes
1033 if compress_type is None:
1034 zinfo.compress_type = self.compression
1035 else:
1036 zinfo.compress_type = compress_type
1038 zinfo.file_size = st.st_size
1039 zinfo.flag_bits = 0x00
1040 zinfo.header_offset = self.fp.tell() # Start of header bytes
1042 self._writecheck(zinfo)
1043 self._didModify = True
1045 if isdir:
1046 zinfo.file_size = 0
1047 zinfo.compress_size = 0
1048 zinfo.CRC = 0
1049 self.filelist.append(zinfo)
1050 self.NameToInfo[zinfo.filename] = zinfo
1051 self.fp.write(zinfo.FileHeader())
1052 return
1054 with open(filename, "rb") as fp:
1055 # Must overwrite CRC and sizes with correct data later
1056 zinfo.CRC = CRC = 0
1057 zinfo.compress_size = compress_size = 0
1058 zinfo.file_size = file_size = 0
1059 self.fp.write(zinfo.FileHeader())
1060 if zinfo.compress_type == ZIP_DEFLATED:
1061 cmpr = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION,
1062 zlib.DEFLATED, -15)
1063 else:
1064 cmpr = None
1065 while 1:
1066 buf = fp.read(1024 * 8)
1067 if not buf:
1068 break
1069 file_size = file_size + len(buf)
1070 CRC = crc32(buf, CRC) & 0xffffffff
1071 if cmpr:
1072 buf = cmpr.compress(buf)
1073 compress_size = compress_size + len(buf)
1074 self.fp.write(buf)
1075 if cmpr:
1076 buf = cmpr.flush()
1077 compress_size = compress_size + len(buf)
1078 self.fp.write(buf)
1079 zinfo.compress_size = compress_size
1080 else:
1081 zinfo.compress_size = file_size
1082 zinfo.CRC = CRC
1083 zinfo.file_size = file_size
1084 # Seek backwards and write CRC and file sizes
1085 position = self.fp.tell() # Preserve current position in file
1086 self.fp.seek(zinfo.header_offset + 14, 0)
1087 self.fp.write(struct.pack("<LLL", zinfo.CRC, zinfo.compress_size,
1088 zinfo.file_size))
1089 self.fp.seek(position, 0)
1090 self.filelist.append(zinfo)
1091 self.NameToInfo[zinfo.filename] = zinfo
1093 def writestr(self, zinfo_or_arcname, bytes):
1094 """Write a file into the archive. The contents is the string
1095 'bytes'. 'zinfo_or_arcname' is either a ZipInfo instance or
1096 the name of the file in the archive."""
1097 if not isinstance(zinfo_or_arcname, ZipInfo):
1098 zinfo = ZipInfo(filename=zinfo_or_arcname,
1099 date_time=time.localtime(time.time())[:6])
1100 zinfo.compress_type = self.compression
1101 zinfo.external_attr = 0600 << 16
1102 else:
1103 zinfo = zinfo_or_arcname
1105 if not self.fp:
1106 raise RuntimeError(
1107 "Attempt to write to ZIP archive that was already closed")
1109 zinfo.file_size = len(bytes) # Uncompressed size
1110 zinfo.header_offset = self.fp.tell() # Start of header bytes
1111 self._writecheck(zinfo)
1112 self._didModify = True
1113 zinfo.CRC = crc32(bytes) & 0xffffffff # CRC-32 checksum
1114 if zinfo.compress_type == ZIP_DEFLATED:
1115 co = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION,
1116 zlib.DEFLATED, -15)
1117 bytes = co.compress(bytes) + co.flush()
1118 zinfo.compress_size = len(bytes) # Compressed size
1119 else:
1120 zinfo.compress_size = zinfo.file_size
1121 zinfo.header_offset = self.fp.tell() # Start of header bytes
1122 self.fp.write(zinfo.FileHeader())
1123 self.fp.write(bytes)
1124 self.fp.flush()
1125 if zinfo.flag_bits & 0x08:
1126 # Write CRC and file sizes after the file data
1127 self.fp.write(struct.pack("<LLL", zinfo.CRC, zinfo.compress_size,
1128 zinfo.file_size))
1129 self.filelist.append(zinfo)
1130 self.NameToInfo[zinfo.filename] = zinfo
1132 def __del__(self):
1133 """Call the "close()" method in case the user forgot."""
1134 self.close()
1136 def close(self):
1137 """Close the file, and for mode "w" and "a" write the ending
1138 records."""
1139 if self.fp is None:
1140 return
1142 if self.mode in ("w", "a") and self._didModify: # write ending records
1143 count = 0
1144 pos1 = self.fp.tell()
1145 for zinfo in self.filelist: # write central directory
1146 count = count + 1
1147 dt = zinfo.date_time
1148 dosdate = (dt[0] - 1980) << 9 | dt[1] << 5 | dt[2]
1149 dostime = dt[3] << 11 | dt[4] << 5 | (dt[5] // 2)
1150 extra = []
1151 if zinfo.file_size > ZIP64_LIMIT \
1152 or zinfo.compress_size > ZIP64_LIMIT:
1153 extra.append(zinfo.file_size)
1154 extra.append(zinfo.compress_size)
1155 file_size = 0xffffffff
1156 compress_size = 0xffffffff
1157 else:
1158 file_size = zinfo.file_size
1159 compress_size = zinfo.compress_size
1161 if zinfo.header_offset > ZIP64_LIMIT:
1162 extra.append(zinfo.header_offset)
1163 header_offset = 0xffffffffL
1164 else:
1165 header_offset = zinfo.header_offset
1167 extra_data = zinfo.extra
1168 if extra:
1169 # Append a ZIP64 field to the extra's
1170 extra_data = struct.pack(
1171 '<HH' + 'Q'*len(extra),
1172 1, 8*len(extra), *extra) + extra_data
1174 extract_version = max(45, zinfo.extract_version)
1175 create_version = max(45, zinfo.create_version)
1176 else:
1177 extract_version = zinfo.extract_version
1178 create_version = zinfo.create_version
1180 try:
1181 filename, flag_bits = zinfo._encodeFilenameFlags()
1182 centdir = struct.pack(structCentralDir,
1183 stringCentralDir, create_version,
1184 zinfo.create_system, extract_version, zinfo.reserved,
1185 flag_bits, zinfo.compress_type, dostime, dosdate,
1186 zinfo.CRC, compress_size, file_size,
1187 len(filename), len(extra_data), len(zinfo.comment),
1188 0, zinfo.internal_attr, zinfo.external_attr,
1189 header_offset)
1190 except DeprecationWarning:
1191 print >>sys.stderr, (structCentralDir,
1192 stringCentralDir, create_version,
1193 zinfo.create_system, extract_version, zinfo.reserved,
1194 zinfo.flag_bits, zinfo.compress_type, dostime, dosdate,
1195 zinfo.CRC, compress_size, file_size,
1196 len(zinfo.filename), len(extra_data), len(zinfo.comment),
1197 0, zinfo.internal_attr, zinfo.external_attr,
1198 header_offset)
1199 raise
1200 self.fp.write(centdir)
1201 self.fp.write(filename)
1202 self.fp.write(extra_data)
1203 self.fp.write(zinfo.comment)
1205 pos2 = self.fp.tell()
1206 # Write end-of-zip-archive record
1207 centDirCount = count
1208 centDirSize = pos2 - pos1
1209 centDirOffset = pos1
1210 if (centDirCount >= ZIP_FILECOUNT_LIMIT or
1211 centDirOffset > ZIP64_LIMIT or
1212 centDirSize > ZIP64_LIMIT):
1213 # Need to write the ZIP64 end-of-archive records
1214 zip64endrec = struct.pack(
1215 structEndArchive64, stringEndArchive64,
1216 44, 45, 45, 0, 0, centDirCount, centDirCount,
1217 centDirSize, centDirOffset)
1218 self.fp.write(zip64endrec)
1220 zip64locrec = struct.pack(
1221 structEndArchive64Locator,
1222 stringEndArchive64Locator, 0, pos2, 1)
1223 self.fp.write(zip64locrec)
1224 centDirCount = min(centDirCount, 0xFFFF)
1225 centDirSize = min(centDirSize, 0xFFFFFFFF)
1226 centDirOffset = min(centDirOffset, 0xFFFFFFFF)
1228 # check for valid comment length
1229 if len(self.comment) >= ZIP_MAX_COMMENT:
1230 if self.debug > 0:
1231 msg = 'Archive comment is too long; truncating to %d bytes' \
1232 % ZIP_MAX_COMMENT
1233 self.comment = self.comment[:ZIP_MAX_COMMENT]
1235 endrec = struct.pack(structEndArchive, stringEndArchive,
1236 0, 0, centDirCount, centDirCount,
1237 centDirSize, centDirOffset, len(self.comment))
1238 self.fp.write(endrec)
1239 self.fp.write(self.comment)
1240 self.fp.flush()
1242 if not self._filePassed:
1243 self.fp.close()
1244 self.fp = None
1247 class PyZipFile(ZipFile):
1248 """Class to create ZIP archives with Python library files and packages."""
1250 def writepy(self, pathname, basename = ""):
1251 """Add all files from "pathname" to the ZIP archive.
1253 If pathname is a package directory, search the directory and
1254 all package subdirectories recursively for all *.py and enter
1255 the modules into the archive. If pathname is a plain
1256 directory, listdir *.py and enter all modules. Else, pathname
1257 must be a Python *.py file and the module will be put into the
1258 archive. Added modules are always module.pyo or module.pyc.
1259 This method will compile the module.py into module.pyc if
1260 necessary.
1262 dir, name = os.path.split(pathname)
1263 if os.path.isdir(pathname):
1264 initname = os.path.join(pathname, "__init__.py")
1265 if os.path.isfile(initname):
1266 # This is a package directory, add it
1267 if basename:
1268 basename = "%s/%s" % (basename, name)
1269 else:
1270 basename = name
1271 if self.debug:
1272 print "Adding package in", pathname, "as", basename
1273 fname, arcname = self._get_codename(initname[0:-3], basename)
1274 if self.debug:
1275 print "Adding", arcname
1276 self.write(fname, arcname)
1277 dirlist = os.listdir(pathname)
1278 dirlist.remove("__init__.py")
1279 # Add all *.py files and package subdirectories
1280 for filename in dirlist:
1281 path = os.path.join(pathname, filename)
1282 root, ext = os.path.splitext(filename)
1283 if os.path.isdir(path):
1284 if os.path.isfile(os.path.join(path, "__init__.py")):
1285 # This is a package directory, add it
1286 self.writepy(path, basename) # Recursive call
1287 elif ext == ".py":
1288 fname, arcname = self._get_codename(path[0:-3],
1289 basename)
1290 if self.debug:
1291 print "Adding", arcname
1292 self.write(fname, arcname)
1293 else:
1294 # This is NOT a package directory, add its files at top level
1295 if self.debug:
1296 print "Adding files from directory", pathname
1297 for filename in os.listdir(pathname):
1298 path = os.path.join(pathname, filename)
1299 root, ext = os.path.splitext(filename)
1300 if ext == ".py":
1301 fname, arcname = self._get_codename(path[0:-3],
1302 basename)
1303 if self.debug:
1304 print "Adding", arcname
1305 self.write(fname, arcname)
1306 else:
1307 if pathname[-3:] != ".py":
1308 raise RuntimeError, \
1309 'Files added with writepy() must end with ".py"'
1310 fname, arcname = self._get_codename(pathname[0:-3], basename)
1311 if self.debug:
1312 print "Adding file", arcname
1313 self.write(fname, arcname)
1315 def _get_codename(self, pathname, basename):
1316 """Return (filename, archivename) for the path.
1318 Given a module name path, return the correct file path and
1319 archive name, compiling if necessary. For example, given
1320 /python/lib/string, return (/python/lib/string.pyc, string).
1322 file_py = pathname + ".py"
1323 file_pyc = pathname + ".pyc"
1324 file_pyo = pathname + ".pyo"
1325 if os.path.isfile(file_pyo) and \
1326 os.stat(file_pyo).st_mtime >= os.stat(file_py).st_mtime:
1327 fname = file_pyo # Use .pyo file
1328 elif not os.path.isfile(file_pyc) or \
1329 os.stat(file_pyc).st_mtime < os.stat(file_py).st_mtime:
1330 import py_compile
1331 if self.debug:
1332 print "Compiling", file_py
1333 try:
1334 py_compile.compile(file_py, file_pyc, None, True)
1335 except py_compile.PyCompileError,err:
1336 print err.msg
1337 fname = file_pyc
1338 else:
1339 fname = file_pyc
1340 archivename = os.path.split(fname)[1]
1341 if basename:
1342 archivename = "%s/%s" % (basename, archivename)
1343 return (fname, archivename)
1346 def main(args = None):
1347 import textwrap
1348 USAGE=textwrap.dedent("""\
1349 Usage:
1350 zipfile.py -l zipfile.zip # Show listing of a zipfile
1351 zipfile.py -t zipfile.zip # Test if a zipfile is valid
1352 zipfile.py -e zipfile.zip target # Extract zipfile into target dir
1353 zipfile.py -c zipfile.zip src ... # Create zipfile from sources
1354 """)
1355 if args is None:
1356 args = sys.argv[1:]
1358 if not args or args[0] not in ('-l', '-c', '-e', '-t'):
1359 print USAGE
1360 sys.exit(1)
1362 if args[0] == '-l':
1363 if len(args) != 2:
1364 print USAGE
1365 sys.exit(1)
1366 zf = ZipFile(args[1], 'r')
1367 zf.printdir()
1368 zf.close()
1370 elif args[0] == '-t':
1371 if len(args) != 2:
1372 print USAGE
1373 sys.exit(1)
1374 zf = ZipFile(args[1], 'r')
1375 zf.testzip()
1376 print "Done testing"
1378 elif args[0] == '-e':
1379 if len(args) != 3:
1380 print USAGE
1381 sys.exit(1)
1383 zf = ZipFile(args[1], 'r')
1384 out = args[2]
1385 for path in zf.namelist():
1386 if path.startswith('./'):
1387 tgt = os.path.join(out, path[2:])
1388 else:
1389 tgt = os.path.join(out, path)
1391 tgtdir = os.path.dirname(tgt)
1392 if not os.path.exists(tgtdir):
1393 os.makedirs(tgtdir)
1394 with open(tgt, 'wb') as fp:
1395 fp.write(zf.read(path))
1396 zf.close()
1398 elif args[0] == '-c':
1399 if len(args) < 3:
1400 print USAGE
1401 sys.exit(1)
1403 def addToZip(zf, path, zippath):
1404 if os.path.isfile(path):
1405 zf.write(path, zippath, ZIP_DEFLATED)
1406 elif os.path.isdir(path):
1407 for nm in os.listdir(path):
1408 addToZip(zf,
1409 os.path.join(path, nm), os.path.join(zippath, nm))
1410 # else: ignore
1412 zf = ZipFile(args[1], 'w', allowZip64=True)
1413 for src in args[2:]:
1414 addToZip(zf, src, os.path.basename(src))
1416 zf.close()
1418 if __name__ == "__main__":
1419 main()