1 package Archive
::Zip
::Archive
;
3 # Represents a generic ZIP archive
13 use vars
qw( $VERSION @ISA );
17 @ISA = qw( Archive::Zip );
27 # Note that this returns undef on read errors, else new zip object.
34 'diskNumberWithStartOfCentralDirectory' => 0,
35 'numberOfCentralDirectoriesOnThisDisk' => 0, # shld be # of members
36 'numberOfCentralDirectories' => 0, # shld be # of members
37 'centralDirectorySize' => 0, # must re-compute on write
38 'centralDirectoryOffsetWRTStartingDiskNumber' =>
40 'writeEOCDOffset' => 0,
41 'writeCentralDirectoryOffset' => 0,
42 'zipfileComment' => '',
48 $self->{'members'} = [];
50 my $status = $self->read(@_);
51 return $status == AZ_OK ?
$self : undef;
# Set the 'storeSymbolicLink' flag on this archive object.
# The flag is consulted elsewhere in this file (together with a -l test)
# before a path is added to the archive.
# Returns the value that was stored (undef when no argument is given).
sub storeSymbolicLink {
    my ( $self, $flag ) = @_;
    return $self->{'storeSymbolicLink'} = $flag;
}
62 @
{ shift->{'members'} };
66 scalar( shift->members() );
71 return map { $_->fileName() } $self->members();
74 # return ref to member with given name or undef
76 my ( $self, $fileName ) = @_;
78 $fileName = Encode
::encode
( 'cp437', $fileName );
79 foreach my $member ( $self->members() ) {
80 return $member if $member->fileName() eq $fileName;
86 my ( $self, $pattern ) = @_;
87 return grep { $_->fileName() =~ /$pattern/ } $self->members();
91 shift->{'diskNumber'};
# Read-only accessor for the 'diskNumberWithStartOfCentralDirectory' field,
# which is filled in from the end-of-central-directory record on read.
sub diskNumberWithStartOfCentralDirectory {
    my ($self) = @_;
    return $self->{'diskNumberWithStartOfCentralDirectory'};
}
# Read-only accessor for the 'numberOfCentralDirectoriesOnThisDisk' field,
# which is filled in from the end-of-central-directory record on read.
sub numberOfCentralDirectoriesOnThisDisk {
    my ($self) = @_;
    return $self->{'numberOfCentralDirectoriesOnThisDisk'};
}
# Read-only accessor for the 'numberOfCentralDirectories' field, which is
# filled in from the end-of-central-directory record on read.
sub numberOfCentralDirectories {
    my ($self) = @_;
    return $self->{'numberOfCentralDirectories'};
}
# Read-only accessor for the 'centralDirectorySize' field, which is filled in
# from the end-of-central-directory record on read.
sub centralDirectorySize {
    my ($self) = @_;
    return $self->{'centralDirectorySize'};
}
# Read-only accessor for the 'centralDirectoryOffsetWRTStartingDiskNumber'
# field, which is filled in from the end-of-central-directory record on read.
sub centralDirectoryOffsetWRTStartingDiskNumber {
    my ($self) = @_;
    return $self->{'centralDirectoryOffsetWRTStartingDiskNumber'};
}
116 my $comment = $self->{'zipfileComment'};
118 $self->{'zipfileComment'} = pack( 'C0a*', shift() ); # avoid unicode
124 shift->{'eocdOffset'};
127 # Return the name of the file last read.
133 my ( $self, $member ) = @_;
134 $member = $self->memberNamed($member) unless ref($member);
135 return undef unless $member;
136 my @newMembers = grep { $_ != $member } $self->members();
137 $self->{'members'} = \
@newMembers;
142 my ( $self, $oldMember, $newMember ) = @_;
143 $oldMember = $self->memberNamed($oldMember) unless ref($oldMember);
144 return undef unless $oldMember;
145 return undef unless $newMember;
147 map { ( $_ == $oldMember ) ?
$newMember : $_ } $self->members();
148 $self->{'members'} = \
@newMembers;
155 $member = $self->memberNamed($member) unless ref($member);
156 return _error
('member not found') unless $member;
157 my $originalSize = $member->compressedSize();
158 my $name = shift; # local FS name if given
159 my ( $volumeName, $dirName, $fileName );
160 if ( defined($name) ) {
162 $name = Encode
::encode
( 'cp437', $name );
163 ( $volumeName, $dirName, $fileName ) = File
::Spec
->splitpath($name);
164 $dirName = File
::Spec
->catpath( $volumeName, $dirName, '' );
167 $name = $member->fileName();
168 ( $dirName = $name ) =~ s{[^/]*$}{};
169 $dirName = Archive
::Zip
::_asLocalName
($dirName);
170 $name = Archive
::Zip
::_asLocalName
($name);
172 # Need to test if this is needed or not:
173 #if ( $dirName && !-d $dirName ) {
175 # return _ioError("can't create dir $dirName") if ( !-d $dirName );
177 my $rc = $member->extractToFileNamed( $name, @_ );
179 # TODO refactor this fix into extractToFileNamed()
180 $member->{'compressedSize'} = $originalSize;
# Extract one member to a single local file, ignoring any directory part of
# the member's stored name.
# The member may be passed as an object or as a name (resolved through
# memberNamed()). Returns the result of _error() when the member cannot be
# found, and AZ_OK without extracting anything for directory members.
# NOTE(review): the argument unpacking, the if/else delimiters and the final
# return are not visible in this excerpt -- confirm against the full file.
184 sub extractMemberWithoutPaths
{
# Accept either a member object or a member name.
187 $member = $self->memberNamed($member) unless ref($member);
188 return _error
('member not found') unless $member;
# Remember the compressed size so it can be put back after extraction.
189 my $originalSize = $member->compressedSize();
190 return AZ_OK
if $member->isDirectory();
# A caller-supplied local name is encoded to cp437.
192 if ( defined($name) ) {
194 $name = Encode
::encode
( 'cp437', $name );
# Fallback (presumably the else branch; its delimiters are not visible here):
# derive the local name from the member's own file name.
197 $name = $member->fileName();
198 $name =~ s{.*/}{}; # strip off directories, if any
199 $name = Archive
::Zip
::_asLocalName
($name);
# Remaining arguments are passed straight through to the member.
201 my $rc = $member->extractToFileNamed( $name, @_ );
# Put back the compressed size saved before extraction.
202 $member->{'compressedSize'} = $originalSize;
207 my ( $self, $newMember ) = @_;
208 push( @
{ $self->{'members'} }, $newMember ) if $newMember;
214 my $fileName = shift;
216 my $newMember = $self->ZIPMEMBERCLASS->newFromFile( $fileName, $newName );
217 if ( $self->{'storeSymbolicLink'} && -l
$fileName ) {
218 my $newMember = $self->ZIPMEMBERCLASS->newFromString(readlink $fileName, $newName);
219 # For symbolic links, External File Attribute is set to 0000FFA1 by Info-ZIP
220 $newMember->{'externalFileAttributes'} = 2717843456;
221 $self->addMember($newMember);
223 $self->addMember($newMember);
230 my $newMember = $self->ZIPMEMBERCLASS->newFromString(@_);
231 return $self->addMember($newMember);
235 my ( $self, $name, $newName ) = @_;
236 my $newMember = $self->ZIPMEMBERCLASS->newDirectoryNamed( $name, $newName );
237 if ( $self->{'storeSymbolicLink'} && -l
$name ) {
238 my $link = readlink $name;
239 ( $newName =~ s{/$}{} ) if $newName; # Strip trailing /
240 my $newMember = $self->ZIPMEMBERCLASS->newFromString($link, $newName);
241 # For symbolic links, External File Attribute is set to 0000FFA1 by Info-ZIP
242 $newMember->{'externalFileAttributes'} = 2717843456;
243 $self->addMember($newMember);
245 $self->addMember($newMember);
250 # add either a file or a directory.
# Add $name to the archive as either a file member or a directory member,
# passing $newName through to the method that does the work.
# Returns whatever addFile() or addDirectory() returns, or the result of
# _error() when $name is neither a file nor a directory.
# NOTE(review): the tests that select between the three returns are not
# visible in this excerpt.
252 sub addFileOrDirectory
{
253 my ( $self, $name, $newName ) = @_;
261 return $self->addFile( $name, $newName );
264 return $self->addDirectory( $name, $newName );
267 return _error
("$name is neither a file nor a directory");
272 my ( $self, $member, $newContents ) = @_;
273 return _error
('No member name given') unless $member;
274 $member = $self->memberNamed($member) unless ref($member);
275 return undef unless $member;
276 return $member->contents($newContents);
# Write the archive to the local file $fileName.
# Refuses (via _error()) to write to a file that one of the members reports
# it still uses through _usesFileNamed(); the error text points callers at
# overwrite()/overwriteAs() for that case.
# Returns the result of _ioError() if the file cannot be opened for writing.
# NOTE(review): the lines that follow the writeToFileHandle() call (handle
# clean-up and the final return) are not visible in this excerpt.
279 sub writeToFileNamed
{
281 my $fileName = shift; # local FS format
# Guard against clobbering a file that a member depends on.
282 foreach my $member ( $self->members() ) {
283 if ( $member->_usesFileNamed($fileName) ) {
284 return _error
( "$fileName is needed by member "
285 . $member->fileName()
286 . "; consider using overwrite() or overwriteAs() instead." );
289 my ( $status, $fh ) = _newFileHandle
( $fileName, 'w' );
290 return _ioError
("Can't open $fileName for write") unless $status;
# The second argument is taken by writeToFileHandle() as its "seekable" flag.
291 my $retval = $self->writeToFileHandle( $fh, 1 );
298 # It is possible to write data to the FH before calling this,
299 # perhaps to make a self-extracting archive.
# Write every member, then the central directory, to an already-open handle.
# An optional argument after the handle states whether the handle is
# seekable; when it is omitted, _isSeekable() is asked instead.
# Returns the result of _error()/_ioError() for a missing or closed handle,
# the first non-AZ_OK status reported by a member, or otherwise whatever
# writeCentralDirectory() returns.
# NOTE(review): the argument unpacking and parts of the per-member offset
# arithmetic are not visible in this excerpt.
300 sub writeToFileHandle
{
303 return _error
('No filehandle given') unless $fh;
304 return _ioError
('filehandle not open') unless $fh->opened();
306 my $fhIsSeekable = @_ ?
shift: _isSeekable
($fh);
309 # Find out where the current position is.
# Non-seekable handles are treated as starting at offset 0.
310 my $offset = $fhIsSeekable ?
$fh->tell() : 0;
# A negative tell() result is also treated as offset 0.
311 $offset = 0 if $offset < 0;
313 foreach my $member ( $self->members() ) {
314 my $retval = $member->_writeToFileHandle( $fh, $fhIsSeekable, $offset );
316 return $retval if $retval != AZ_OK
;
# Advance the running offset past what this member wrote.
317 $offset += $member->_localHeaderSize() + $member->_writeOffset();
# Data-descriptor adjustment; the enclosing statement is only partly visible.
319 $member->hasDataDescriptor()
320 ? DATA_DESCRIPTOR_LENGTH
+ SIGNATURE_LENGTH
323 # changed this so it reflects the last successful position
324 $self->{'writeCentralDirectoryOffset'} = $offset;
326 return $self->writeCentralDirectory($fh);
329 # Write zip back to the original file,
330 # as safely as possible.
331 # Returns AZ_OK if successful.
334 return $self->overwriteAs( $self->{'fileName'} );
337 # Write zip to the specified file,
338 # as safely as possible.
339 # Returns AZ_OK if successful.
343 return _error
("no filename in overwriteAs()") unless defined($zipName);
345 my ( $fh, $tempName ) = Archive
::Zip
::tempFile
();
346 return _error
( "Can't open temp file", $! ) unless $fh;
348 ( my $backupName = $zipName ) =~ s{(\.[^.]*)?$}{.zbk};
350 my $status = $self->writeToFileHandle($fh);
354 if ( $status != AZ_OK
) {
356 _printError
("Can't write to $tempName");
363 if ( -f
$zipName && !rename( $zipName, $backupName ) ) {
366 return _error
( "Can't rename $zipName as $backupName", $err );
369 # move the temp to the original name (possibly copying)
370 unless ( File
::Copy
::move
( $tempName, $zipName ) ) {
372 rename( $backupName, $zipName );
374 return _error
( "Can't move $tempName to $zipName", $err );
378 if ( -f
$backupName && !unlink($backupName) ) {
380 return _error
( "Can't unlink $backupName", $err );
386 # Used only during writing
# Private accessor for the 'writeCentralDirectoryOffset' field, i.e. the
# offset recorded for the start of the central directory while writing.
sub _writeCentralDirectoryOffset {
    my ($self) = @_;
    return $self->{'writeCentralDirectoryOffset'};
}
# Private accessor for the 'writeEOCDOffset' field, which
# writeCentralDirectory() updates as it emits central directory headers.
sub _writeEOCDOffset {
    my ($self) = @_;
    return $self->{'writeEOCDOffset'};
}
395 # Expects to have _writeEOCDOffset() set
# Write the end-of-central-directory (EOCD) record to $fh: the signature,
# a header packed with END_OF_CENTRAL_DIRECTORY_FORMAT, and the zipfile
# comment when it is non-empty.
# Each write that fails returns the result of _ioError() immediately.
# NOTE(review): the start and end of the pack() call and the final return
# are not visible in this excerpt.
396 sub _writeEndOfCentralDirectory
{
397 my ( $self, $fh ) = @_;
399 $self->_print($fh, END_OF_CENTRAL_DIRECTORY_SIGNATURE_STRING
)
400 or return _ioError
('writing EOCD Signature');
401 my $zipfileCommentLength = length( $self->zipfileComment() );
404 END_OF_CENTRAL_DIRECTORY_FORMAT
,
406 0, # {'diskNumberWithStartOfCentralDirectory'},
407 $self->numberOfMembers(), # {'numberOfCentralDirectoriesOnThisDisk'},
408 $self->numberOfMembers(), # {'numberOfCentralDirectories'},
# Central directory size: distance from its start to the EOCD position.
409 $self->_writeEOCDOffset() - $self->_writeCentralDirectoryOffset(),
# Offset at which the central directory starts.
410 $self->_writeCentralDirectoryOffset(),
411 $zipfileCommentLength
413 $self->_print($fh, $header)
414 or return _ioError
('writing EOCD header');
# The comment is only written when it has non-zero length.
415 if ($zipfileCommentLength) {
416 $self->_print($fh, $self->zipfileComment() )
417 or return _ioError
('writing zipfile comment');
422 # $offset can be specified to truncate a zip file.
# Write the central directory (one header per member) to $fh, followed by
# the end-of-central-directory record.
#
#   $fh     - handle to write to; must support seek() when $offset is given.
#   $offset - optional position at which the central directory starts. When
#             given, it is recorded and the handle is repositioned there
#             first. When omitted, the offset already stored in
#             'writeCentralDirectoryOffset' is used.
#
# Returns the result of _ioError() if the seek fails, the first non-AZ_OK
# status reported by a member, or otherwise whatever
# _writeEndOfCentralDirectory() returns.
sub writeCentralDirectory {
    my ( $self, $fh, $offset ) = @_;

    if ( defined($offset) ) {
        $self->{'writeCentralDirectoryOffset'} = $offset;
        $fh->seek( $offset, IO::Seekable::SEEK_SET )
          or return _ioError('seeking to write central directory');
    }
    else {
        $offset = $self->_writeCentralDirectoryOffset();
    }

    # The EOCD record stores writeEOCDOffset - writeCentralDirectoryOffset as
    # the central directory size. Seed the end offset here so that an archive
    # with no members gets a size of 0 instead of reusing a stale value left
    # over from construction or from an earlier write.
    $self->{'writeEOCDOffset'} = $offset;

    foreach my $member ( $self->members() ) {
        my $status = $member->_writeCentralDirectoryFileHeader($fh);
        return $status if $status != AZ_OK;
        $offset += $member->_centralDirectoryHeaderSize();

        # Kept inside the loop so the recorded end offset always reflects the
        # last header written successfully, even on an early return.
        $self->{'writeEOCDOffset'} = $offset;
    }

    return $self->_writeEndOfCentralDirectory($fh);
}
446 my $fileName = shift;
447 return _error
('No filename given') unless $fileName;
448 my ( $status, $fh ) = _newFileHandle
( $fileName, 'r' );
449 return _ioError
("opening $fileName for read") unless $status;
451 $status = $self->readFromFileHandle( $fh, $fileName );
452 return $status if $status != AZ_OK
;
455 $self->{'fileName'} = $fileName;
# Populate this archive from an already-open, seekable file handle.
# The optional file name is used in error messages and handed to each new
# member; it defaults to the handle itself.
# Steps visible here: locate and read the end-of-central-directory record,
# seek to the start of the central directory, then read one member per
# central directory header until the EOCD signature is seen again.
# Any step that fails returns its non-AZ_OK status (or the result of
# _error()/_ioError()) immediately.
# NOTE(review): the argument unpacking, the loop header, some declarations
# and the final return are not visible in this excerpt.
459 sub readFromFileHandle
{
462 my $fileName = shift;
463 $fileName = $fh unless defined($fileName);
464 return _error
('No filehandle given') unless $fh;
465 return _ioError
('filehandle not open') unless $fh->opened();
# Stores the stringified handle as the file name.
# NOTE(review): any condition guarding this assignment is not visible here.
468 $self->{'fileName'} = "$fh";
470 # TODO: how to support non-seekable zips?
471 return _error
('file not seekable')
472 unless _isSeekable
($fh);
474 $fh->seek( 0, 0 ); # rewind the file
476 my $status = $self->_findEndOfCentralDirectory($fh);
477 return $status if $status != AZ_OK
;
# Position of the EOCD signature, as left by _findEndOfCentralDirectory().
479 my $eocdPosition = $fh->tell();
481 $status = $self->_readEndOfCentralDirectory($fh);
482 return $status if $status != AZ_OK
;
# The central directory ends where the EOCD record begins, so step back by
# its recorded size to reach its first header.
484 $fh->seek( $eocdPosition - $self->centralDirectorySize(),
485 IO
::Seekable
::SEEK_SET
)
486 or return _ioError
("Can't seek $fileName");
488 # Try to detect garbage at beginning of archives
# Difference between where the central directory actually starts in the file
# and where the EOCD record says it starts.
490 $self->{'eocdOffset'} = $eocdPosition - $self->centralDirectorySize() # here
491 - $self->centralDirectoryOffsetWRTStartingDiskNumber();
# Each new member is given the handle, the name and the offset found above.
495 $self->ZIPMEMBERCLASS->_newFromZipFile( $fh, $fileName,
496 $self->eocdOffset() );
498 ( $status, $signature ) = _readSignature
( $fh, $fileName );
499 return $status if $status != AZ_OK
;
# Reaching the EOCD signature means there are no more headers to read.
500 last if $signature == END_OF_CENTRAL_DIRECTORY_SIGNATURE
;
501 $status = $newMember->_readCentralDirectoryFileHeader();
502 return $status if $status != AZ_OK
;
503 $status = $newMember->endRead();
504 return $status if $status != AZ_OK
;
505 $newMember->_becomeDirectoryIfNecessary();
506 push( @
{ $self->{'members'} }, $newMember );
512 # Read EOCD, starting from position before signature.
513 # Return AZ_OK on success.
# Read the end-of-central-directory record from $fh, which must be positioned
# at the record's signature, and store its fields on $self.
# Returns the result of _ioError() if the seek fails or if either read
# returns fewer bytes than requested.
# NOTE(review): the argument unpacking, the declaration of $header, the
# opening of the unpack() target list and the final return are not visible in
# this excerpt.
514 sub _readEndOfCentralDirectory
{
518 # Skip past signature
519 $fh->seek( SIGNATURE_LENGTH
, IO
::Seekable
::SEEK_CUR
)
520 or return _ioError
("Can't seek past EOCD signature");
# Read the fixed-length part of the record in one go.
523 my $bytesRead = $fh->read( $header, END_OF_CENTRAL_DIRECTORY_LENGTH
);
524 if ( $bytesRead != END_OF_CENTRAL_DIRECTORY_LENGTH
) {
525 return _ioError
("reading end of central directory");
528 my $zipfileCommentLength;
# Fields are unpacked straight into the object, in record order.
530 $self->{'diskNumber'},
531 $self->{'diskNumberWithStartOfCentralDirectory'},
532 $self->{'numberOfCentralDirectoriesOnThisDisk'},
533 $self->{'numberOfCentralDirectories'},
534 $self->{'centralDirectorySize'},
535 $self->{'centralDirectoryOffsetWRTStartingDiskNumber'},
536 $zipfileCommentLength
537 ) = unpack( END_OF_CENTRAL_DIRECTORY_FORMAT
, $header );
# The comment follows the fixed header and is read only when it has length.
539 if ($zipfileCommentLength) {
540 my $zipfileComment = '';
541 $bytesRead = $fh->read( $zipfileComment, $zipfileCommentLength );
542 if ( $bytesRead != $zipfileCommentLength ) {
543 return _ioError
("reading zipfile comment");
545 $self->{'zipfileComment'} = $zipfileComment;
551 # Seek in my file to the end, then read backwards until we find the
552 # signature of the central directory record. Leave the file positioned right
553 # before the signature. Returns AZ_OK if success.
# Locate the end-of-central-directory signature by reading a block from the
# tail of the file and searching it backwards with rindex().
# Returns the result of _ioError() on a failed seek or short read, and the
# result of _formatError() when the file is too short or no signature is
# found.
# NOTE(review): the argument unpacking, the declarations of $data, $pos and
# $seekOffset, the enclosing loop and the success return are not visible in
# this excerpt.
554 sub _findEndOfCentralDirectory
{
558 $fh->seek( 0, IO
::Seekable
::SEEK_END
)
559 or return _ioError
("seeking to end");
# After seeking to the end, tell() gives the file length.
561 my $fileLength = $fh->tell();
562 if ( $fileLength < END_OF_CENTRAL_DIRECTORY_LENGTH
+ 4 ) {
563 return _formatError
("file is too short");
# Never try to read back further than the start of the file.
570 $seekOffset = $fileLength if ( $seekOffset > $fileLength );
571 $fh->seek( -$seekOffset, IO
::Seekable
::SEEK_END
)
572 or return _ioError
("seek failed");
573 my $bytesRead = $fh->read( $data, $seekOffset );
574 if ( $bytesRead != $seekOffset ) {
575 return _ioError
("read failed");
# rindex() finds the last occurrence, i.e. the one closest to end of file.
577 $pos = rindex( $data, END_OF_CENTRAL_DIRECTORY_SIGNATURE_STRING
);
# Stop conditions: the whole file has been read, or the chunk size limit
# has been reached (the first condition of this test is not visible here).
580 or $seekOffset == $fileLength
581 or $seekOffset >= $Archive::Zip
::ChunkSize
);
# The handle sits at the end of the block just read; move back to the
# signature's position within that block.
585 $fh->seek( $pos - $seekOffset, IO
::Seekable
::SEEK_CUR
)
586 or return _ioError
("seeking to EOCD");
590 return _formatError
("can't find EOCD signature");
594 # Used to avoid taint problems when chdir'ing.
595 # Not intended to increase security in any way; just intended to shut up the -T
596 # complaints. If your Cwd module is giving you unreliable returns from cwd()
597 # you have bigger problems than this.
600 $dir =~ m/\A(.+)\z/s;
606 my $root = shift or return _error
("root arg missing in call to addTree()");
608 $dest = '' unless defined($dest);
609 my $pred = shift || sub { -r
};
610 my $compressionLevel = shift;
612 my $startDir = _untaintDir
( cwd
() );
614 return _error
( 'undef returned by _untaintDir on cwd ', cwd
() )
617 # This avoids chdir'ing in Find, in a way compatible with older
618 # versions of File::Find.
620 local $main::_
= $File::Find
::name
;
621 my $dir = _untaintDir
($File::Find
::dir
);
623 push( @files, $File::Find
::name
) if (&$pred);
627 File
::Find
::find
( $wanted, $root );
629 my $rootZipName = _asZipDirName
( $root, 1 ); # with trailing slash
630 my $pattern = $rootZipName eq './' ?
'^' : "^\Q$rootZipName\E";
632 $dest = _asZipDirName
( $dest, 1 ); # with trailing slash
634 foreach my $fileName (@files) {
635 my $isDir = -d
$fileName;
637 # normalize, remove leading ./
638 my $archiveName = _asZipDirName
( $fileName, $isDir );
639 if ( $archiveName eq $rootZipName ) { $archiveName = $dest }
640 else { $archiveName =~ s{$pattern}{$dest} }
641 next if $archiveName =~ m{^\.?/?$}; # skip current dir
643 ?
$self->addDirectory( $fileName, $archiveName )
644 : $self->addFile( $fileName, $archiveName );
645 $member->desiredCompressionLevel($compressionLevel);
647 return _error
("add $fileName failed in addTree()") if !$member;
# Add a directory tree to the archive, keeping only paths that match
# $pattern. The work is done by addTree(), which is handed a predicate built
# here.
# Returns the result of _error() when the root or pattern argument is
# missing, otherwise whatever addTree() returns.
# NOTE(review): the lines that shift $self, $root, $dest, $pattern and $pred
# off the argument list are not visible in this excerpt.
652 sub addTreeMatching
{
655 or return _error
("root arg missing in call to addTreeMatching()");
657 $dest = '' unless defined($dest);
659 or return _error
("pattern missing in call to addTreeMatching()");
# With a caller predicate, a path must match the pattern and satisfy the
# predicate; without one, it must match the pattern and pass the -r test.
662 $pred ?
sub { m{$pattern} && &$pred } : sub { m{$pattern} && -r
};
663 return $self->addTree( $root, $dest, $matcher );
666 # $zip->extractTree( $root, $dest [, $volume] );
668 # $root and $dest are Unix-style.
669 # $volume is in local FS format.
673 my $root = shift; # Zip format
674 $root = '' unless defined($root);
675 my $dest = shift; # Zip format
676 $dest = './' unless defined($dest);
678 $dest = Encode
::encode
( 'cp437', $dest );
679 my $volume = shift; # optional
680 my $pattern = "^\Q$root";
681 my @members = $self->membersMatching($pattern);
683 foreach my $member (@members) {
684 my $fileName = $member->fileName(); # in Unix format
685 $fileName =~ s{$pattern}{$dest}; # in Unix format
686 # convert to platform format:
687 $fileName = Archive
::Zip
::_asLocalName
( $fileName, $volume );
688 my $status = $member->extractToFileNamed($fileName);
689 return $status if $status != AZ_OK
;
694 # $zip->updateMember( $memberOrName, $fileName );
695 # Returns (possibly updated) member, if any; undef on errors.
699 my $oldMember = shift;
700 my $fileName = shift;
702 if ( !defined($fileName) ) {
703 _error
("updateMember(): missing fileName argument");
707 my @newStat = stat($fileName);
709 _ioError
("Can't stat $fileName");
717 if ( ref($oldMember) ) {
718 $memberName = $oldMember->fileName();
721 $oldMember = $self->memberNamed( $memberName = $oldMember )
722 || $self->memberNamed( $memberName =
723 _asZipDirName
( $oldMember, $isDir ) );
726 unless ( defined($oldMember)
727 && $oldMember->lastModTime() == $newStat[9]
728 && $oldMember->isDirectory() == $isDir
729 && ( $isDir || ( $oldMember->uncompressedSize() == $newStat[7] ) ) )
732 # create the new member
733 my $newMember = $isDir
734 ?
$self->ZIPMEMBERCLASS->newDirectoryNamed( $fileName, $memberName )
735 : $self->ZIPMEMBERCLASS->newFromFile( $fileName, $memberName );
737 unless ( defined($newMember) ) {
738 _error
("creation of member $fileName failed in updateMember()");
742 # replace old member or append new one
743 if ( defined($oldMember) ) {
744 $self->replaceMember( $oldMember, $newMember );
746 else { $self->addMember($newMember); }
754 # $zip->updateTree( $root, [ $dest, [ $pred [, $mirror]]] );
756 # This takes the same arguments as addTree, but first checks to see
757 # whether the file or directory already exists in the zip file.
759 # If the fourth argument $mirror is true, then delete all my members
760 # if corresponding files weren't found.
765 or return _error
("root arg missing in call to updateTree()");
767 $dest = '' unless defined($dest);
768 $dest = _asZipDirName
( $dest, 1 );
769 my $pred = shift || sub { -r
};
772 my $rootZipName = _asZipDirName
( $root, 1 ); # with trailing slash
773 my $pattern = $rootZipName eq './' ?
'^' : "^\Q$rootZipName\E";
776 my $startDir = _untaintDir
( cwd
() );
778 return _error
( 'undef returned by _untaintDir on cwd ', cwd
() )
781 # This avoids chdir'ing in Find, in a way compatible with older
782 # versions of File::Find.
784 local $main::_
= $File::Find
::name
;
785 my $dir = _untaintDir
($File::Find
::dir
);
787 push( @files, $File::Find
::name
) if (&$pred);
791 File
::Find
::find
( $wanted, $root );
793 # Now @files has all the files that I could potentially be adding to
794 # the zip. Only add the ones that are necessary.
795 # For each file (updated or not), add its member name to @done.
797 foreach my $fileName (@files) {
798 my @newStat = stat($fileName);
801 # normalize, remove leading ./
802 my $memberName = _asZipDirName
( $fileName, $isDir );
803 if ( $memberName eq $rootZipName ) { $memberName = $dest }
804 else { $memberName =~ s{$pattern}{$dest} }
805 next if $memberName =~ m{^\.?/?$}; # skip current dir
807 $done{$memberName} = 1;
808 my $changedMember = $self->updateMember( $memberName, $fileName );
809 return _error
("updateTree failed to update $fileName")
810 unless ref($changedMember);
813 # @done now has the archive names corresponding to all the found files.
814 # If we're mirroring, delete all those members that aren't in @done.
816 foreach my $member ( $self->members() ) {
817 $self->removeMember($member)
818 unless $done{ $member->fileName() };