package Archive::Zip::Archive;

# Represents a generic ZIP archive.

use vars qw( $VERSION @ISA );

# This class inherits from Archive::Zip.
@ISA = qw( Archive::Zip );
27 # Note that this returns undef on read errors, else new zip object.
34 'diskNumberWithStartOfCentralDirectory' => 0,
35 'numberOfCentralDirectoriesOnThisDisk' => 0, # shld be # of members
36 'numberOfCentralDirectories' => 0, # shld be # of members
37 'centralDirectorySize' => 0, # must re-compute on write
38 'centralDirectoryOffsetWRTStartingDiskNumber' =>
40 'writeEOCDOffset' => 0,
41 'writeCentralDirectoryOffset' => 0,
42 'zipfileComment' => '',
48 $self->{'members'} = [];
50 my $status = $self->read(@_);
51 return $status == AZ_OK ?
$self : undef;
# Set the 'storeSymbolicLink' flag on the archive object.
#
#   $flag - value stored in $self->{'storeSymbolicLink'}; when true, the
#           code that adds files and directories stores the target of a
#           symbolic link (readlink) as the member's contents.
#
# Returns the stored value.
sub storeSymbolicLink {
    my ( $self, $flag ) = @_;
    $self->{'storeSymbolicLink'} = $flag;
    return $self->{'storeSymbolicLink'};
}
62 @
{ shift->{'members'} };
66 scalar( shift->members() );
71 return map { $_->fileName() } $self->members();
74 # return ref to member with given name or undef
76 my ( $self, $fileName ) = @_;
77 foreach my $member ( $self->members() ) {
78 return $member if $member->fileName() eq $fileName;
84 my ( $self, $pattern ) = @_;
85 return grep { $_->fileName() =~ /$pattern/ } $self->members();
89 shift->{'diskNumber'};
# Accessor for the 'diskNumberWithStartOfCentralDirectory' field, which is
# filled in from the end-of-central-directory record when an archive is read.
sub diskNumberWithStartOfCentralDirectory {
    my $self = shift;
    return $self->{'diskNumberWithStartOfCentralDirectory'};
}
# Accessor for the 'numberOfCentralDirectoriesOnThisDisk' field, which is
# filled in from the end-of-central-directory record when an archive is read.
sub numberOfCentralDirectoriesOnThisDisk {
    my $self = shift;
    return $self->{'numberOfCentralDirectoriesOnThisDisk'};
}
# Accessor for the 'numberOfCentralDirectories' field, which is filled in
# from the end-of-central-directory record when an archive is read.
sub numberOfCentralDirectories {
    my $self = shift;
    return $self->{'numberOfCentralDirectories'};
}
# Accessor for the 'centralDirectorySize' field, which is filled in from the
# end-of-central-directory record when an archive is read.
sub centralDirectorySize {
    my $self = shift;
    return $self->{'centralDirectorySize'};
}
# Accessor for the 'centralDirectoryOffsetWRTStartingDiskNumber' field, which
# is filled in from the end-of-central-directory record when an archive is
# read.
sub centralDirectoryOffsetWRTStartingDiskNumber {
    my $self = shift;
    return $self->{'centralDirectoryOffsetWRTStartingDiskNumber'};
}
114 my $comment = $self->{'zipfileComment'};
116 $self->{'zipfileComment'} = pack( 'C0a*', shift() ); # avoid unicode
122 shift->{'eocdOffset'};
125 # Return the name of the file last read.
131 my ( $self, $member ) = @_;
132 $member = $self->memberNamed($member) unless ref($member);
133 return undef unless $member;
134 my @newMembers = grep { $_ != $member } $self->members();
135 $self->{'members'} = \
@newMembers;
140 my ( $self, $oldMember, $newMember ) = @_;
141 $oldMember = $self->memberNamed($oldMember) unless ref($oldMember);
142 return undef unless $oldMember;
143 return undef unless $newMember;
145 map { ( $_ == $oldMember ) ?
$newMember : $_ } $self->members();
146 $self->{'members'} = \
@newMembers;
153 $member = $self->memberNamed($member) unless ref($member);
154 return _error
('member not found') unless $member;
155 my $originalSize = $member->compressedSize();
156 my $name = shift; # local FS name if given
157 my ( $volumeName, $dirName, $fileName );
158 if ( defined($name) ) {
159 ( $volumeName, $dirName, $fileName ) = File
::Spec
->splitpath($name);
160 $dirName = File
::Spec
->catpath( $volumeName, $dirName, '' );
163 $name = $member->fileName();
164 ( $dirName = $name ) =~ s{[^/]*$}{};
165 $dirName = Archive
::Zip
::_asLocalName
($dirName);
166 $name = Archive
::Zip
::_asLocalName
($name);
168 if ( $dirName && !-d
$dirName ) {
170 return _ioError
("can't create dir $dirName") if ( !-d
$dirName );
172 my $rc = $member->extractToFileNamed( $name, @_ );
174 # TODO refactor this fix into extractToFileNamed()
175 $member->{'compressedSize'} = $originalSize;
# Extract one member using only the last component of its archive name:
# directories are stripped from fileName() before the local name is built
# with Archive::Zip::_asLocalName(). Directory members are not extracted and
# are reported as AZ_OK.
# NOTE(review): $self, $member and $name are used below without being
# unpacked from @_ or declared in this block, and $rc is never returned
# here -- confirm against the full definition.
179 sub extractMemberWithoutPaths
{
# Accept either a member object or a member name.
182 $member = $self->memberNamed($member) unless ref($member);
183 return _error
('member not found') unless $member;
# Remember the compressed size so it can be put back after extraction.
184 my $originalSize = $member->compressedSize();
185 return AZ_OK
if $member->isDirectory();
188 $name = $member->fileName();
189 $name =~ s{.*/}{}; # strip off directories, if any
190 $name = Archive
::Zip
::_asLocalName
($name);
# Any remaining arguments are passed straight through to extractToFileNamed().
192 my $rc = $member->extractToFileNamed( $name, @_ );
193 $member->{'compressedSize'} = $originalSize;
198 my ( $self, $newMember ) = @_;
199 push( @
{ $self->{'members'} }, $newMember ) if $newMember;
205 my $fileName = shift;
207 my $newMember = $self->ZIPMEMBERCLASS->newFromFile( $fileName, $newName );
208 if ( $self->{'storeSymbolicLink'} && -l
$fileName ) {
209 my $newMember = $self->ZIPMEMBERCLASS->newFromString(readlink $fileName, $newName);
210 # For symbolic links, External File Attribute is set to 0xA1FF0000 by Info-ZIP
211 $newMember->{'externalFileAttributes'} = 0xA1FF0000;
212 $self->addMember($newMember);
214 $self->addMember($newMember);
221 my $newMember = $self->ZIPMEMBERCLASS->newFromString(@_);
222 return $self->addMember($newMember);
226 my ( $self, $name, $newName ) = @_;
227 my $newMember = $self->ZIPMEMBERCLASS->newDirectoryNamed( $name, $newName );
228 if ( $self->{'storeSymbolicLink'} && -l
$name ) {
229 my $link = readlink $name;
230 ( $newName =~ s{/$}{} ) if $newName; # Strip trailing /
231 my $newMember = $self->ZIPMEMBERCLASS->newFromString($link, $newName);
232 # For symbolic links, External File Attribute is set to 0xA1FF0000 by Info-ZIP
233 $newMember->{'externalFileAttributes'} = 0xA1FF0000;
234 $self->addMember($newMember);
236 $self->addMember($newMember);
# Add either a file or a directory, chosen by testing $name on the local
# file system.
#
#   $name    - local path to add
#   $newName - name to pass on to addFile() / addDirectory()
#
# Returns whatever addFile() or addDirectory() returns, or the result of
# _error() when $name is neither a plain file nor a directory.
sub addFileOrDirectory {
    my ( $self, $name, $newName ) = @_;

    return $self->addFile( $name, $newName )      if -f $name;
    return $self->addDirectory( $name, $newName ) if -d $name;

    return _error("$name is neither a file nor a directory");
}
263 my ( $self, $member, $newContents ) = @_;
264 return _error
('No member name given') unless $member;
265 $member = $self->memberNamed($member) unless ref($member);
266 return undef unless $member;
267 return $member->contents($newContents);
# Write the archive to the file $fileName (local file-system format).
# Refuses with _error() if any member reports, via _usesFileNamed(), that it
# needs that file; otherwise the file is opened for writing with
# _newFileHandle() and the work is delegated to writeToFileHandle().
# NOTE(review): $self is used without being unpacked from @_ in this block
# and $retval is not returned here -- confirm against the full definition.
270 sub writeToFileNamed
{
272 my $fileName = shift; # local FS format
# Writing over a file that a member still reads from would destroy its data.
273 foreach my $member ( $self->members() ) {
274 if ( $member->_usesFileNamed($fileName) ) {
275 return _error
( "$fileName is needed by member "
276 . $member->fileName()
277 . "; consider using overwrite() or overwriteAs() instead." );
280 my ( $status, $fh ) = _newFileHandle
( $fileName, 'w' );
281 return _ioError
("Can't open $fileName for write") unless $status;
# The second argument tells writeToFileHandle() that the handle is seekable.
282 my $retval = $self->writeToFileHandle( $fh, 1 );
289 # It is possible to write data to the FH before calling this,
290 # perhaps to make a self-extracting archive.
# Writes every member to $fh, records where the central directory starts and
# then hands over to writeCentralDirectory().
# An optional extra argument states whether the handle is seekable; when it
# is absent, _isSeekable($fh) decides.
# NOTE(review): $self and $fh are used without being unpacked from @_ in
# this block -- confirm against the full definition.
291 sub writeToFileHandle
{
294 return _error
('No filehandle given') unless $fh;
295 return _ioError
('filehandle not open') unless $fh->opened();
297 my $fhIsSeekable = @_ ?
shift: _isSeekable
($fh);
300 # Find out where the current position is.
# A non-seekable handle is treated as starting at offset 0, and so is a
# negative tell() result.
301 my $offset = $fhIsSeekable ?
$fh->tell() : 0;
302 $offset = 0 if $offset < 0;
304 foreach my $member ( $self->members() ) {
305 my $retval = $member->_writeToFileHandle( $fh, $fhIsSeekable, $offset );
# Stop at the first member that fails to write.
307 return $retval if $retval != AZ_OK
;
# Advance by the member's local header size plus its _writeOffset().
308 $offset += $member->_localHeaderSize() + $member->_writeOffset();
# NOTE(review): the expression below has no visible left-hand side or
# alternative branch; presumably it adds the data-descriptor size to
# $offset -- confirm.
310 $member->hasDataDescriptor()
311 ? DATA_DESCRIPTOR_LENGTH
+ SIGNATURE_LENGTH
314 # changed this so it reflects the last successful position
315 $self->{'writeCentralDirectoryOffset'} = $offset;
317 return $self->writeCentralDirectory($fh);
320 # Write zip back to the original file,
321 # as safely as possible.
322 # Returns AZ_OK if successful.
325 return $self->overwriteAs( $self->{'fileName'} );
328 # Write zip to the specified file,
329 # as safely as possible.
330 # Returns AZ_OK if successful.
334 return _error
("no filename in overwriteAs()") unless defined($zipName);
336 my ( $fh, $tempName ) = Archive
::Zip
::tempFile
();
337 return _error
( "Can't open temp file", $! ) unless $fh;
339 ( my $backupName = $zipName ) =~ s{(\.[^.]*)?$}{.zbk};
341 my $status = $self->writeToFileHandle($fh);
345 if ( $status != AZ_OK
) {
347 _printError
("Can't write to $tempName");
354 if ( -f
$zipName && !rename( $zipName, $backupName ) ) {
357 return _error
( "Can't rename $zipName as $backupName", $err );
360 # move the temp to the original name (possibly copying)
361 unless ( File
::Copy
::move
( $tempName, $zipName ) ) {
363 rename( $backupName, $zipName );
365 return _error
( "Can't move $tempName to $zipName", $err );
369 if ( -f
$backupName && !unlink($backupName) ) {
371 return _error
( "Can't unlink $backupName", $err );
# Used only during writing.
# Accessor for 'writeCentralDirectoryOffset', the file offset at which the
# central directory is (or will be) written.
sub _writeCentralDirectoryOffset {
    my $self = shift;
    return $self->{'writeCentralDirectoryOffset'};
}
# Used only during writing.
# Accessor for 'writeEOCDOffset', the offset recorded by
# writeCentralDirectory() after the central directory headers.
sub _writeEOCDOffset {
    my $self = shift;
    return $self->{'writeEOCDOffset'};
}
386 # Expects to have _writeEOCDOffset() set
# Writes the end-of-central-directory (EOCD) record to $fh: the signature
# string, the header and, if it is non-empty, the zipfile comment.
# Each failed _print() returns the result of _ioError().
387 sub _writeEndOfCentralDirectory
{
388 my ( $self, $fh ) = @_;
390 $self->_print($fh, END_OF_CENTRAL_DIRECTORY_SIGNATURE_STRING
)
391 or return _ioError
('writing EOCD Signature');
392 my $zipfileCommentLength = length( $self->zipfileComment() );
# NOTE(review): the values below look like the argument list that builds
# $header (used further down), but the call that consumes them is not
# present in this block -- confirm.
395 END_OF_CENTRAL_DIRECTORY_FORMAT
,
397 0, # {'diskNumberWithStartOfCentralDirectory'},
398 $self->numberOfMembers(), # {'numberOfCentralDirectoriesOnThisDisk'},
399 $self->numberOfMembers(), # {'numberOfCentralDirectories'},
# Central directory size: distance from its start to the EOCD offset.
400 $self->_writeEOCDOffset() - $self->_writeCentralDirectoryOffset(),
401 $self->_writeCentralDirectoryOffset(),
402 $zipfileCommentLength
404 $self->_print($fh, $header)
405 or return _ioError
('writing EOCD header');
# The comment is only written when it is non-empty.
406 if ($zipfileCommentLength) {
407 $self->_print($fh, $self->zipfileComment() )
408 or return _ioError
('writing zipfile comment');
# Write the central directory (one header per member) followed by the
# end-of-central-directory record to $fh.
#
#   $fh     - handle to write to
#   $offset - optional; when given, the handle is first moved there, which
#             can be used to truncate a zip file. Otherwise the offset
#             recorded in 'writeCentralDirectoryOffset' is used.
#
# Returns the first member status that is not AZ_OK, the result of
# _ioError() if the seek fails, or whatever _writeEndOfCentralDirectory()
# returns.
sub writeCentralDirectory {
    my ( $self, $fh, $offset ) = @_;

    if ( defined($offset) ) {
        $self->{'writeCentralDirectoryOffset'} = $offset;
        $fh->seek( $offset, IO::Seekable::SEEK_SET )
          or return _ioError('seeking to write central directory');
    }
    else {
        $offset = $self->_writeCentralDirectoryOffset();
    }

    # Record the EOCD position up front so that an archive without members
    # does not keep a stale value, which would yield a wrong central
    # directory size in the EOCD record.
    $self->{'writeEOCDOffset'} = $offset;

    foreach my $member ( $self->members() ) {
        my $status = $member->_writeCentralDirectoryFileHeader($fh);
        return $status if $status != AZ_OK;
        $offset += $member->_centralDirectoryHeaderSize();
        $self->{'writeEOCDOffset'} = $offset;
    }

    return $self->_writeEndOfCentralDirectory($fh);
}
437 my $fileName = shift;
438 return _error
('No filename given') unless $fileName;
439 my ( $status, $fh ) = _newFileHandle
( $fileName, 'r' );
440 return _ioError
("opening $fileName for read") unless $status;
442 $status = $self->readFromFileHandle( $fh, $fileName );
443 return $status if $status != AZ_OK
;
446 $self->{'fileName'} = $fileName;
# Read an archive's central directory from an open, seekable handle and
# append one member object per directory entry to $self->{'members'}.
# Returns the result of _error() / _ioError() for a missing, unopened or
# non-seekable handle, and passes on any status that is not AZ_OK from the
# helpers it calls.
# NOTE(review): $self and $fh are used without being unpacked from @_ in
# this block, and $newMember / $signature are not declared here -- confirm
# against the full definition.
450 sub readFromFileHandle
{
453 my $fileName = shift;
# Without an explicit name, the handle itself is used for messages.
454 $fileName = $fh unless defined($fileName);
455 return _error
('No filehandle given') unless $fh;
456 return _ioError
('filehandle not open') unless $fh->opened();
# The stringified handle is stored as the archive's file name.
459 $self->{'fileName'} = "$fh";
461 # TODO: how to support non-seekable zips?
462 return _error
('file not seekable')
463 unless _isSeekable
($fh);
465 $fh->seek( 0, 0 ); # rewind the file
467 my $status = $self->_findEndOfCentralDirectory($fh);
468 return $status if $status != AZ_OK
;
# Position of the EOCD record, as left by _findEndOfCentralDirectory().
470 my $eocdPosition = $fh->tell();
472 $status = $self->_readEndOfCentralDirectory($fh);
473 return $status if $status != AZ_OK
;
# Seek to where the central directory starts, assuming it ends where the
# EOCD record begins.
475 $fh->seek( $eocdPosition - $self->centralDirectorySize(),
476 IO
::Seekable
::SEEK_SET
)
477 or return _ioError
("Can't seek $fileName");
479 # Try to detect garbage at beginning of archives
# eocdOffset is the difference between where the central directory was
# found and the offset the EOCD record claims for it.
481 $self->{'eocdOffset'} = $eocdPosition - $self->centralDirectorySize() # here
482 - $self->centralDirectoryOffsetWRTStartingDiskNumber();
486 $self->ZIPMEMBERCLASS->_newFromZipFile( $fh, $fileName,
487 $self->eocdOffset() );
489 ( $status, $signature ) = _readSignature
( $fh, $fileName );
490 return $status if $status != AZ_OK
;
# Reaching the EOCD signature means all directory entries have been read.
491 last if $signature == END_OF_CENTRAL_DIRECTORY_SIGNATURE
;
492 $status = $newMember->_readCentralDirectoryFileHeader();
493 return $status if $status != AZ_OK
;
494 $status = $newMember->endRead();
495 return $status if $status != AZ_OK
;
496 $newMember->_becomeDirectoryIfNecessary();
497 push( @
{ $self->{'members'} }, $newMember );
503 # Read EOCD, starting from position before signature.
504 # Return AZ_OK on success.
# Fills in the archive's disk-number, directory-count, size and offset
# fields from the record and, when the record announces one, the zipfile
# comment. A failed seek or a short read returns the result of _ioError().
# NOTE(review): $self, $fh and $header are used without being declared in
# this block -- confirm against the full definition.
505 sub _readEndOfCentralDirectory
{
509 # Skip past signature
510 $fh->seek( SIGNATURE_LENGTH
, IO
::Seekable
::SEEK_CUR
)
511 or return _ioError
("Can't seek past EOCD signature");
# Read the fixed-length part of the record; a short read is an error.
514 my $bytesRead = $fh->read( $header, END_OF_CENTRAL_DIRECTORY_LENGTH
);
515 if ( $bytesRead != END_OF_CENTRAL_DIRECTORY_LENGTH
) {
516 return _ioError
("reading end of central directory");
519 my $zipfileCommentLength;
# Unpack the record's fields directly into the object.
521 $self->{'diskNumber'},
522 $self->{'diskNumberWithStartOfCentralDirectory'},
523 $self->{'numberOfCentralDirectoriesOnThisDisk'},
524 $self->{'numberOfCentralDirectories'},
525 $self->{'centralDirectorySize'},
526 $self->{'centralDirectoryOffsetWRTStartingDiskNumber'},
527 $zipfileCommentLength
528 ) = unpack( END_OF_CENTRAL_DIRECTORY_FORMAT
, $header );
# The comment follows the fixed part and is only read when its length is
# non-zero.
530 if ($zipfileCommentLength) {
531 my $zipfileComment = '';
532 $bytesRead = $fh->read( $zipfileComment, $zipfileCommentLength );
533 if ( $bytesRead != $zipfileCommentLength ) {
534 return _ioError
("reading zipfile comment");
536 $self->{'zipfileComment'} = $zipfileComment;
542 # Seek in my file to the end, then read backwards until we find the
543 # signature of the end-of-central-directory record. Leave the file positioned
544 # right before the signature. Returns AZ_OK on success.
# Failed seeks and short reads return the result of _ioError(); a file that
# is too short or has no signature returns the result of _formatError().
# NOTE(review): $self, $fh, $data, $pos and $seekOffset are used without
# being declared in this block, and the loop that encloses the chunked read
# is not visible -- confirm against the full definition.
545 sub _findEndOfCentralDirectory
{
549 $fh->seek( 0, IO
::Seekable
::SEEK_END
)
550 or return _ioError
("seeking to end");
552 my $fileLength = $fh->tell();
# Reject files shorter than END_OF_CENTRAL_DIRECTORY_LENGTH + 4 bytes
# (presumably the 4 is the signature length -- confirm).
553 if ( $fileLength < END_OF_CENTRAL_DIRECTORY_LENGTH
+ 4 ) {
554 return _formatError
("file is too short");
# Never look further back than the start of the file.
561 $seekOffset = $fileLength if ( $seekOffset > $fileLength );
562 $fh->seek( -$seekOffset, IO
::Seekable
::SEEK_END
)
563 or return _ioError
("seek failed");
# Read the last $seekOffset bytes of the file into $data.
564 my $bytesRead = $fh->read( $data, $seekOffset );
565 if ( $bytesRead != $seekOffset ) {
566 return _ioError
("read failed");
# Search for the last occurrence of the signature in what was read.
568 $pos = rindex( $data, END_OF_CENTRAL_DIRECTORY_SIGNATURE_STRING
);
571 or $seekOffset == $fileLength
572 or $seekOffset >= $Archive::Zip
::ChunkSize
);
# The read left the handle at end of file; step back to the signature found
# at index $pos of the $seekOffset bytes just read.
576 $fh->seek( $pos - $seekOffset, IO
::Seekable
::SEEK_CUR
)
577 or return _ioError
("seeking to EOCD");
581 return _formatError
("can't find EOCD signature");
585 # Used to avoid taint problems when chdir'ing.
586 # Not intended to increase security in any way; just intended to shut up the -T
587 # complaints. If your Cwd module is giving you unreliable returns from cwd()
588 # you have bigger problems than this.
591 $dir =~ m/\A(.+)\z/s;
597 my $root = shift or return _error
("root arg missing in call to addTree()");
599 $dest = '' unless defined($dest);
600 my $pred = shift || sub { -r
};
601 my $compressionLevel = shift;
603 my $startDir = _untaintDir
( cwd
() );
605 return _error
( 'undef returned by _untaintDir on cwd ', cwd
() )
608 # This avoids chdir'ing in Find, in a way compatible with older
609 # versions of File::Find.
611 local $main::_
= $File::Find
::name
;
612 my $dir = _untaintDir
($File::Find
::dir
);
614 push( @files, $File::Find
::name
) if (&$pred);
618 File
::Find
::find
( $wanted, $root );
620 my $rootZipName = _asZipDirName
( $root, 1 ); # with trailing slash
621 my $pattern = $rootZipName eq './' ?
'^' : "^\Q$rootZipName\E";
623 $dest = _asZipDirName
( $dest, 1 ); # with trailing slash
625 foreach my $fileName (@files) {
626 my $isDir = -d
$fileName;
628 # normalize, remove leading ./
629 my $archiveName = _asZipDirName
( $fileName, $isDir );
630 if ( $archiveName eq $rootZipName ) { $archiveName = $dest }
631 else { $archiveName =~ s{$pattern}{$dest} }
632 next if $archiveName =~ m{^\.?/?$}; # skip current dir
634 ?
$self->addDirectory( $fileName, $archiveName )
635 : $self->addFile( $fileName, $archiveName );
636 $member->desiredCompressionLevel($compressionLevel);
638 return _error
("add $fileName failed in addTree()") if !$member;
# Like addTree(), but only entries whose name (in $_) matches $pattern are
# added. When a predicate $pred is supplied it must also return true;
# without one the entry must be readable (-r).
# Returns the result of _error() if the root or pattern argument is missing,
# otherwise whatever addTree() returns.
# NOTE(review): $self, $root, $dest, $pattern, $pred and $matcher are used
# without being unpacked or declared in this block -- confirm against the
# full definition.
643 sub addTreeMatching
{
646 or return _error
("root arg missing in call to addTreeMatching()");
648 $dest = '' unless defined($dest);
650 or return _error
("pattern missing in call to addTreeMatching()");
# Combine the pattern test with the caller's predicate or a readability test.
653 $pred ?
sub { m{$pattern} && &$pred } : sub { m{$pattern} && -r
};
654 return $self->addTree( $root, $dest, $matcher );
657 # $zip->extractTree( $root, $dest [, $volume] );
659 # $root and $dest are Unix-style.
660 # $volume is in local FS format.
664 my $root = shift; # Zip format
665 $root = '' unless defined($root);
666 my $dest = shift; # Zip format
667 $dest = './' unless defined($dest);
668 my $volume = shift; # optional
669 my $pattern = "^\Q$root";
670 my @members = $self->membersMatching($pattern);
672 foreach my $member (@members) {
673 my $fileName = $member->fileName(); # in Unix format
674 $fileName =~ s{$pattern}{$dest}; # in Unix format
675 # convert to platform format:
676 $fileName = Archive
::Zip
::_asLocalName
( $fileName, $volume );
677 my $status = $member->extractToFileNamed($fileName);
678 return $status if $status != AZ_OK
;
683 # $zip->updateMember( $memberOrName, $fileName );
684 # Returns (possibly updated) member, if any; undef on errors.
688 my $oldMember = shift;
689 my $fileName = shift;
691 if ( !defined($fileName) ) {
692 _error
("updateMember(): missing fileName argument");
696 my @newStat = stat($fileName);
698 _ioError
("Can't stat $fileName");
706 if ( ref($oldMember) ) {
707 $memberName = $oldMember->fileName();
710 $oldMember = $self->memberNamed( $memberName = $oldMember )
711 || $self->memberNamed( $memberName =
712 _asZipDirName
( $oldMember, $isDir ) );
715 unless ( defined($oldMember)
716 && $oldMember->lastModTime() == $newStat[9]
717 && $oldMember->isDirectory() == $isDir
718 && ( $isDir || ( $oldMember->uncompressedSize() == $newStat[7] ) ) )
721 # create the new member
722 my $newMember = $isDir
723 ?
$self->ZIPMEMBERCLASS->newDirectoryNamed( $fileName, $memberName )
724 : $self->ZIPMEMBERCLASS->newFromFile( $fileName, $memberName );
726 unless ( defined($newMember) ) {
727 _error
("creation of member $fileName failed in updateMember()");
731 # replace old member or append new one
732 if ( defined($oldMember) ) {
733 $self->replaceMember( $oldMember, $newMember );
735 else { $self->addMember($newMember); }
743 # $zip->updateTree( $root, [ $dest, [ $pred [, $mirror]]] );
745 # This takes the same arguments as addTree, but first checks to see
746 # whether the file or directory already exists in the zip file.
748 # If the fourth argument $mirror is true, then delete all my members
749 # if corresponding files weren't found.
754 or return _error
("root arg missing in call to updateTree()");
756 $dest = '' unless defined($dest);
757 $dest = _asZipDirName
( $dest, 1 );
758 my $pred = shift || sub { -r
};
761 my $rootZipName = _asZipDirName
( $root, 1 ); # with trailing slash
762 my $pattern = $rootZipName eq './' ?
'^' : "^\Q$rootZipName\E";
765 my $startDir = _untaintDir
( cwd
() );
767 return _error
( 'undef returned by _untaintDir on cwd ', cwd
() )
770 # This avoids chdir'ing in Find, in a way compatible with older
771 # versions of File::Find.
773 local $main::_
= $File::Find
::name
;
774 my $dir = _untaintDir
($File::Find
::dir
);
776 push( @files, $File::Find
::name
) if (&$pred);
780 File
::Find
::find
( $wanted, $root );
782 # Now @files has all the files that I could potentially be adding to
783 # the zip. Only add the ones that are necessary.
784 # For each file (updated or not), add its member name to %done.
786 foreach my $fileName (@files) {
787 my @newStat = stat($fileName);
790 # normalize, remove leading ./
791 my $memberName = _asZipDirName
( $fileName, $isDir );
792 if ( $memberName eq $rootZipName ) { $memberName = $dest }
793 else { $memberName =~ s{$pattern}{$dest} }
794 next if $memberName =~ m{^\.?/?$}; # skip current dir
796 $done{$memberName} = 1;
797 my $changedMember = $self->updateMember( $memberName, $fileName );
798 return _error
("updateTree failed to update $fileName")
799 unless ref($changedMember);
802 # %done now has the archive names corresponding to all the found files.
803 # If we're mirroring, delete all those members that aren't in %done.
805 foreach my $member ( $self->members() ) {
806 $self->removeMember($member)
807 unless $done{ $member->fileName() };