2 /* vim: set expandtab tabstop=4 shiftwidth=4: */
3 // +----------------------------------------------------------------------+
5 // +----------------------------------------------------------------------+
6 // | Copyright (c) 1997-2002 The PHP Group |
7 // +----------------------------------------------------------------------+
8 // | This source file is subject to version 2.02 of the PHP license, |
9 // | that is bundled with this package in the file LICENSE, and is |
10 // | available at through the world-wide-web at |
11 // | http://www.php.net/license/2_02.txt. |
12 // | If you did not receive a copy of the PHP license and are unable to |
13 // | obtain it through the world-wide-web, please send a note to |
14 // | license@php.net so we can mail you a copy immediately. |
15 // +----------------------------------------------------------------------+
16 // | Author: Xavier Noguer <xnoguer@php.net> |
17 // | Based on OLE::Storage_Lite by Kawai, Takanori |
18 // +----------------------------------------------------------------------+
20 // $Id: OLE.php,v 1.13 2007/03/07 14:38:25 schmidt Exp $
/**
 * Array for storing OLE instances that are accessed from
 * OLE_ChainedBlockStream::stream_open().
 *
 * PHPExcel_Shared_OLE::getStream() appends the current instance to this
 * array and embeds the resulting array key in the stream path it opens.
 */
$GLOBALS['_OLE_INSTANCES'] = array();
31 * OLE package base class.
33 * @author Xavier Noguer <xnoguer@php.net>
34 * @author Christian Schmidt <schmidt@php.net>
36 * @package PHPExcel_Shared_OLE
38 class PHPExcel_Shared_OLE
// Directory entry type: root entry. _readPpsWks() creates a
// PHPExcel_Shared_OLE_PPS_Root for entries of this type.
const OLE_PPS_TYPE_ROOT
= 5;
// Directory entry type: directory. _readPpsWks() creates a plain
// PHPExcel_Shared_OLE_PPS for entries of this type.
const OLE_PPS_TYPE_DIR
= 1;
// Directory entry type: file. _readPpsWks() creates a
// PHPExcel_Shared_OLE_PPS_File for entries of this type.
const OLE_PPS_TYPE_FILE
= 2;
// Not referenced in this part of the file; presumably the size limit
// (0x1000 = 4096 bytes) below which data is stored in small blocks.
// TODO confirm against the writer code.
const OLE_DATA_SIZE_SMALL
= 0x1000;
// Not referenced in this part of the file; presumably the byte width of a
// 32-bit integer field. TODO confirm.
const OLE_LONG_INT_SIZE
= 4;
// 0x80 = 128, the same value _readPpsWks() uses (as a literal) as the
// stride between consecutive directory entries.
const OLE_PPS_SIZE
= 0x80;
48 * The file handle for reading an OLE container
54 * Array of PPS's found on the OLE container
57 public $_list = array();
60 * Root directory of OLE container
66 * Big Block Allocation Table
67 * @var array (blockId => nextBlockId)
72 * Short Block Allocation Table
73 * @var array (blockId => nextBlockId)
78 * Size of big blocks. This is usually 512.
79 * @var int number of octets per block.
84 * Size of small blocks. This is usually 64.
85 * @var int number of octets per block
87 public $smallBlockSize;
/**
 * Reads an OLE container from the contents of the file given.
 *
 * Validates the signature and byte order, reads the block sizes and the
 * locations of the allocation tables from the header, fills $this->bbat
 * and $this->sbat, and finally loads the directory entries through
 * _readPpsWks(). On success the opened handle is stored in
 * $this->_file_handle and left open.
 *
 * @param string $file Path of the file to read
 * @return bool true on success
 * @throws PHPExcel_Reader_Exception if the file cannot be opened, does not
 *         start with the OLE signature, or is not little-endian
 */
public function read($file)
{
    $fh = fopen($file, "rb");
    if (!$fh) {
        throw new PHPExcel_Reader_Exception("Can't open file $file");
    }

    $signature = fread($fh, 8);
    if ("\xD0\xCF\x11\xE0\xA1\xB1\x1A\xE1" != $signature) {
        // Do not leak the handle when the file is rejected
        fclose($fh);
        throw new PHPExcel_Reader_Exception("File doesn't seem to be an OLE container.");
    }

    // The byte-order mark is stored at offset 28 of the header
    fseek($fh, 28);
    if (fread($fh, 2) != "\xFE\xFF") {
        // This shouldn't be a problem in practice
        fclose($fh);
        throw new PHPExcel_Reader_Exception("Only Little-Endian encoding is supported.");
    }
    $this->_file_handle = $fh;

    // Size of blocks and short blocks in bytes (stored as powers of two)
    $this->bigBlockSize = pow(2, self::_readInt2($fh));
    $this->smallBlockSize = pow(2, self::_readInt2($fh));

    // Skip ahead to offset 44: number of blocks in Big Block Allocation Table
    fseek($fh, 44);
    $bbatBlockCount = self::_readInt4($fh);

    // Root chain 1st block
    $directoryFirstBlockId = self::_readInt4($fh);

    // Skip the four unused bytes that follow (next field is at offset 56)
    fseek($fh, 56);
    // Streams shorter than this are stored using small blocks
    $this->bigBlockThreshold = self::_readInt4($fh);
    // Block id of first sector in Short Block Allocation Table
    $sbatFirstBlockId = self::_readInt4($fh);
    // Number of blocks in Short Block Allocation Table
    $sbbatBlockCount = self::_readInt4($fh);
    // Block id of first sector in Master Block Allocation Table
    $mbatFirstBlockId = self::_readInt4($fh);
    // Number of blocks in Master Block Allocation Table
    $mbbatBlockCount = self::_readInt4($fh);
    $this->bbat = array();

    // Remaining 4 * 109 bytes of current block is beginning of Master
    // Block Allocation Table
    $mbatBlocks = array();
    for ($i = 0; $i < 109; ++$i) {
        $mbatBlocks[] = self::_readInt4($fh);
    }

    // Number of 4-byte block ids that fit into one big block
    $idsPerBlock = $this->bigBlockSize / 4;

    // Read rest of Master Block Allocation Table (if any is left)
    $pos = $this->_getBlockOffset($mbatFirstBlockId);
    for ($i = 0; $i < $mbbatBlockCount; ++$i) {
        fseek($fh, $pos);
        for ($j = 0; $j < $idsPerBlock - 1; ++$j) {
            $mbatBlocks[] = self::_readInt4($fh);
        }
        // Last block id in each block points to next block
        $pos = $this->_getBlockOffset(self::_readInt4($fh));
    }

    // Read Big Block Allocation Table according to chain specified by
    // $mbatBlocks
    for ($i = 0; $i < $bbatBlockCount; ++$i) {
        $pos = $this->_getBlockOffset($mbatBlocks[$i]);
        fseek($fh, $pos);
        for ($j = 0; $j < $idsPerBlock; ++$j) {
            $this->bbat[] = self::_readInt4($fh);
        }
    }

    // Read short block allocation table (SBAT)
    $this->sbat = array();
    $shortBlockCount = $sbbatBlockCount * $idsPerBlock;
    if ($shortBlockCount > 0) {
        // Only open the chain when the container actually has an SBAT
        $sbatFh = $this->getStream($sbatFirstBlockId);
        for ($blockId = 0; $blockId < $shortBlockCount; ++$blockId) {
            $this->sbat[$blockId] = self::_readInt4($sbatFh);
        }
        fclose($sbatFh);
    }

    $this->_readPpsWks($directoryFirstBlockId);

    return true;
}
/**
 * Returns the byte offset of a big block within the file.
 *
 * Blocks are stored after the header. The header itself is 512 bytes, but
 * when the block size is larger than that (4096-byte sectors) the header
 * is padded to one whole block, so the first block starts at the block
 * size rather than at 512.
 *
 * @param int $blockId block id
 * @return int byte offset from beginning of file
 */
public function _getBlockOffset($blockId)
{
    $headerSize = max(512, $this->bigBlockSize);

    return $headerSize + $blockId * $this->bigBlockSize;
}
/**
 * Returns a stream for use with fread() etc. External callers should
 * use PHPExcel_Shared_OLE_PPS_File::getStream().
 *
 * The stream is opened through the 'ole-chainedblockstream' wrapper, which
 * is registered on first use. The current instance is appended to
 * $GLOBALS['_OLE_INSTANCES'] and its key is passed in the stream path so
 * that the wrapper class can look the instance up again.
 *
 * @param int|PHPExcel_Shared_OLE_PPS $blockIdOrPps block id or PPS
 * @return resource read-only stream
 */
public function getStream($blockIdOrPps)
{
    static $isRegistered = false;
    if (!$isRegistered) {
        stream_wrapper_register(
            'ole-chainedblockstream',
            'PHPExcel_Shared_OLE_ChainedBlockStream'
        );
        $isRegistered = true;
    }

    // Store current instance in global array, so that it can be accessed
    // in OLE_ChainedBlockStream::stream_open().
    // NOTE(review): the original comment says the entry is removed again
    // when the stream is closed; that code is not in this file.
    $GLOBALS['_OLE_INSTANCES'][] = $this;
    // end() takes its argument by reference, so the key list must live in
    // a variable rather than being passed straight from array_keys().
    $instanceIds = array_keys($GLOBALS['_OLE_INSTANCES']);
    $instanceId = end($instanceIds);

    $path = 'ole-chainedblockstream://oleInstanceId=' . $instanceId;
    if ($blockIdOrPps instanceof PHPExcel_Shared_OLE_PPS) {
        $path .= '&blockId=' . $blockIdOrPps->_StartBlock;
        $path .= '&size=' . $blockIdOrPps->Size;
    } else {
        $path .= '&blockId=' . $blockIdOrPps;
    }

    return fopen($path, 'r');
}
/**
 * Reads a signed char (1 octet) from the current position of a stream.
 *
 * @param resource $fh file handle
 * @return int
 */
private static function _readInt1($fh)
{
    $octet = fread($fh, 1);
    list(, $value) = unpack("c", $octet);

    return $value;
}
/**
 * Reads an unsigned little-endian short (2 octets) from the current
 * position of a stream.
 *
 * @param resource $fh file handle
 * @return int
 */
private static function _readInt2($fh)
{
    $octets = fread($fh, 2);
    list(, $value) = unpack("v", $octets);

    return $value;
}
/**
 * Reads a little-endian long (4 octets), interpreted as a signed 32-bit
 * value.
 *
 * unpack('V') yields 0..2^32-1 on 64-bit PHP but wraps to negative numbers
 * on 32-bit PHP. Other code in this class compares the values read here
 * with -1, so values with the high bit set are folded into the negative
 * range to give the same result on every platform.
 *
 * @param resource $fh file handle
 * @return int
 */
private static function _readInt4($fh)
{
    list(, $tmp) = unpack("V", fread($fh, 4));
    if ($tmp >= 0x80000000) {
        $tmp -= 0x100000000;
    }

    return $tmp;
}
/**
 * Gets information about all PPS's on the OLE container from the PPS WK's
 * and creates an OLE_PPS object for each one.
 *
 * Directory entries are read 128 bytes apart until either the tree that
 * starts at the root entry is complete or the directory stream ends.
 * Afterwards the children arrays of root and directory entries are filled
 * by walking the PrevPps/NextPps links that start at each DirPps.
 *
 * @param int $blockId the block id of the first block
 * @return bool true on success
 */
public function _readPpsWks($blockId)
{
    $fh = $this->getStream($blockId);
    for ($pos = 0; ; $pos += 128) {
        fseek($fh, $pos, SEEK_SET);
        $nameUtf16 = fread($fh, 64);
        if ($nameUtf16 === false || strlen($nameUtf16) < 64) {
            // End of the directory stream: stop instead of looping forever
            // on a truncated or inconsistent directory.
            break;
        }
        $nameLength = self::_readInt2($fh);
        $nameUtf16 = substr($nameUtf16, 0, $nameLength - 2);
        // Simple conversion from UTF-16LE to ISO-8859-1
        $name = str_replace("\x00", "", $nameUtf16);
        $type = self::_readInt1($fh);
        switch ($type) {
            case self::OLE_PPS_TYPE_ROOT:
                $pps = new PHPExcel_Shared_OLE_PPS_Root(null, null, array());
                $this->root = $pps;
                break;
            case self::OLE_PPS_TYPE_DIR:
                $pps = new PHPExcel_Shared_OLE_PPS(
                    null,
                    null,
                    null,
                    null,
                    null,
                    null,
                    null,
                    null,
                    null,
                    array()
                );
                break;
            case self::OLE_PPS_TYPE_FILE:
                $pps = new PHPExcel_Shared_OLE_PPS_File($name);
                break;
            default:
                // Unsupported entry type: go on with the next entry. A bare
                // "continue" would only leave the switch.
                // NOTE(review): skipped entries get no slot in $_list, so
                // later list indexes no longer equal directory indexes.
                continue 2;
        }
        fseek($fh, 1, SEEK_CUR);
        $pps->Type = $type;
        $pps->Name = $name;
        $pps->PrevPps = self::_readInt4($fh);
        $pps->NextPps = self::_readInt4($fh);
        $pps->DirPps = self::_readInt4($fh);
        fseek($fh, 20, SEEK_CUR);
        $pps->Time1st = self::OLE2LocalDate(fread($fh, 8));
        $pps->Time2nd = self::OLE2LocalDate(fread($fh, 8));
        $pps->_StartBlock = self::_readInt4($fh);
        $pps->Size = self::_readInt4($fh);
        $pps->No = count($this->_list);
        $this->_list[] = $pps;

        // check if the PPS tree (starting from root) is complete
        if (isset($this->root) &&
            $this->_ppsTreeComplete($this->root->No)) {
            break;
        }
    }
    fclose($fh);

    // Initialize $pps->children on directories
    foreach ($this->_list as $pps) {
        if ($pps->Type == self::OLE_PPS_TYPE_DIR || $pps->Type == self::OLE_PPS_TYPE_ROOT) {
            $nos = array($pps->DirPps);
            $pps->children = array();
            $visited = array();
            while ($nos) {
                $no = array_pop($nos);
                // Skip "no entry" markers, ids that were never read, and
                // entries already collected (guards against cyclic links).
                if ($no == -1 || !isset($this->_list[$no]) || isset($visited[$no])) {
                    continue;
                }
                $visited[$no] = true;
                $childPps = $this->_list[$no];
                $nos[] = $childPps->PrevPps;
                $nos[] = $childPps->NextPps;
                $pps->children[] = $childPps;
            }
        }
    }

    return true;
}
/**
 * Tells whether every PPS reachable from the given one has been read.
 *
 * The entry itself must be present in $this->_list, and each of its
 * PrevPps, NextPps and DirPps links must either be -1 or point to an entry
 * whose own tree is complete.
 *
 * @param int $index The index of the PPS from which we are checking
 * @return bool Whether the PPS tree for the given PPS is complete
 */
public function _ppsTreeComplete($index)
{
    if (!isset($this->_list[$index])) {
        return false;
    }

    $node = $this->_list[$index];
    if (!$node) {
        return false;
    }

    // Checked in the same order as before: previous, next, then directory
    foreach (array('PrevPps', 'NextPps', 'DirPps') as $link) {
        $target = $node->$link;
        if ($target != -1 && !$this->_ppsTreeComplete($target)) {
            return false;
        }
    }

    return true;
}
/**
 * Checks whether a PPS is a File PPS or not.
 * If there is no PPS for the index given, it will return false.
 *
 * @param int $index The index for the PPS
 * @return bool true if it's a File PPS, false otherwise
 */
public function isFile($index)
{
    if (!isset($this->_list[$index])) {
        return false;
    }
    $entry = $this->_list[$index];

    return ($entry->Type == self::OLE_PPS_TYPE_FILE);
}
/**
 * Checks whether a PPS is a Root PPS or not.
 * If there is no PPS for the index given, it will return false.
 *
 * @param int $index The index for the PPS.
 * @return bool true if it's a Root PPS, false otherwise
 */
public function isRoot($index)
{
    if (!isset($this->_list[$index])) {
        return false;
    }
    $entry = $this->_list[$index];

    return ($entry->Type == self::OLE_PPS_TYPE_ROOT);
}
/**
 * Gives the total number of PPS's found in the OLE container.
 *
 * @return int The number of entries currently held in $this->_list
 */
public function ppsTotal()
{
    $entries = $this->_list;

    return count($entries);
}
/**
 * Gets data from a PPS.
 * If there is no PPS for the index given, or the position lies outside the
 * PPS data, it will return an empty string.
 *
 * @param int $index    The index for the PPS
 * @param int $position The position from which to start reading
 *                      (relative to the PPS)
 * @param int $length   The amount of bytes to read (at most)
 * @return string The binary string containing the data requested
 * @see OLE_PPS_File::getStream()
 */
public function getData($index, $position, $length)
{
    // Unknown entry: nothing to read
    if (!isset($this->_list[$index])) {
        return '';
    }

    $entry = $this->_list[$index];
    // if position is not valid return empty string
    if ($position < 0 || $position >= $entry->Size) {
        return '';
    }

    $stream = $this->getStream($entry);
    $contents = stream_get_contents($stream, $length, $position);
    fclose($stream);

    return $contents;
}
/**
 * Gets the data length from a PPS.
 * If there is no PPS for the index given, it will return 0.
 *
 * @param int $index The index for the PPS
 * @return int The amount of bytes in data the PPS has
 */
public function getDataLength($index)
{
    if (!isset($this->_list[$index])) {
        return 0;
    }
    $entry = $this->_list[$index];

    return $entry->Size;
}
/**
 * Utility function to transform ASCII text to Unicode.
 *
 * Every input byte is followed by a NUL byte, which gives the UTF-16LE
 * form of a pure ASCII string.
 *
 * @param string $ascii The ASCII string to transform
 * @return string The string in Unicode
 */
public static function Asc2Ucs($ascii)
{
    $rawname = '';
    $length = strlen($ascii);
    for ($i = 0; $i < $length; ++$i) {
        // Square brackets: the {} offset syntax no longer parses on PHP 8
        $rawname .= $ascii[$i] . "\x00";
    }

    return $rawname;
}
/**
 * Returns a string for the OLE container with the date given.
 *
 * The result is 8 bytes: the number of 100-nanosecond intervals since
 * 1601-01-01, low 4 bytes first, each part in little-endian order. The
 * local date/time components of the timestamp are what get encoded.
 *
 * @param int|null $date A timestamp
 * @return string The string for the OLE container; 8 NUL bytes when no
 *                date is given
 */
public static function LocalDate2OLE($date = null)
{
    if (!isset($date)) {
        return "\x00\x00\x00\x00\x00\x00\x00\x00";
    }

    // factor used for separating numbers into 4 bytes parts
    $factor = pow(2, 32);

    // days from 1-1-1601 until the beginning of UNIX era
    $days = 134774;
    // calculate seconds
    $big_date = $days * 24 * 3600 + gmmktime(
        (int) date("H", $date),
        (int) date("i", $date),
        (int) date("s", $date),
        (int) date("m", $date),
        (int) date("d", $date),
        (int) date("Y", $date)
    );
    // multiply just to make MS happy
    $big_date *= 10000000;

    $high_part = floor($big_date / $factor);
    // lower 4 bytes
    $low_part = floor((($big_date / $factor) - $high_part) * $factor);

    // Emit both parts byte by byte, least significant byte first. The
    // running value is floored after every division so that "%" never sees
    // a fractional float (deprecated implicit conversion on PHP 8.1+).
    $res = '';
    for ($i = 0; $i < 4; ++$i) {
        $hex = $low_part % 0x100;
        $res .= pack('c', $hex);
        $low_part = floor($low_part / 0x100);
    }
    for ($i = 0; $i < 4; ++$i) {
        $hex = $high_part % 0x100;
        $res .= pack('c', $hex);
        $high_part = floor($high_part / 0x100);
    }

    return $res;
}
/**
 * Returns a timestamp from an OLE container's date.
 *
 * The input is read as two little-endian 32-bit halves (low half first)
 * of a count of 100-nanosecond intervals since 1601-01-01.
 *
 * @param string $string A binary string with the encoded date (8 bytes)
 * @return float The timestamp corresponding to the string, in whole seconds
 * @throws PHPExcel_Reader_Exception if the string is not 8 bytes long
 */
public static function OLE2LocalDate($string)
{
    if (strlen($string) != 8) {
        // Throw like the rest of this class instead of returning an error
        // object of a class this file never loads.
        throw new PHPExcel_Reader_Exception("Expecting 8 byte string");
    }

    // factor used for separating numbers into 4 bytes parts
    $factor = pow(2, 32);
    list(, $high_part) = unpack('V', substr($string, 4, 4));
    list(, $low_part) = unpack('V', substr($string, 0, 4));

    $big_date = ($high_part * $factor) + $low_part;
    // translate to seconds
    $big_date /= 10000000;

    // days from 1-1-1601 until the beginning of UNIX era
    $days = 134774;

    // translate to seconds from beginning of UNIX era
    $big_date -= $days * 24 * 3600;

    return floor($big_date);
}