12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097 |
- <?php
- /* vim: set expandtab tabstop=4 shiftwidth=4 softtabstop=4: */
-
- /**
- * A class for reading Microsoft Excel Spreadsheets.
- *
- * Originally developed by Vadim Tkachenko under the name PHPExcelReader.
- * (http://sourceforge.net/projects/phpexcelreader)
- * Based on the Java version by Andy Khan (http://www.andykhan.com). Now
- * maintained by David Sanders. Reads only Biff 7 and Biff 8 formats.
- *
- * PHP versions 4 and 5
- *
- * LICENSE: This source file is subject to version 3.0 of the PHP license
- * that is available through the world-wide-web at the following URI:
- * http://www.php.net/license/3_0.txt. If you did not receive a copy of
- * the PHP License and are unable to obtain it through the web, please
- * send a note to license@php.net so we can mail you a copy immediately.
- *
- * @category Spreadsheet
- * @package Spreadsheet_Excel_Reader
- * @author Vadim Tkachenko <vt@apachephp.com>
- * @license http://www.php.net/license/3_0.txt PHP License 3.0
- * @version CVS: $Id: excelreader.php 124 2017-03-10 05:40:03Z admin $
- * @link http://pear.php.net/package/Spreadsheet_Excel_Reader
- * @see OLE, Spreadsheet_Excel_Writer
- *
- */
- namespace core\extend\excel;
-
- // require_once 'PEAR.php';
- require_once 'oleread.php';
- // require_once 'OLE.php';
-
// BIFF versions and substream types, both read from a BOF record.
\define('SPREADSHEET_EXCEL_READER_BIFF8', 0x600);
\define('SPREADSHEET_EXCEL_READER_BIFF7', 0x500);
\define('SPREADSHEET_EXCEL_READER_WORKBOOKGLOBALS', 0x5);
\define('SPREADSHEET_EXCEL_READER_WORKSHEET', 0x10);

// Record type codes: the 16-bit identifier that starts every record.
\define('SPREADSHEET_EXCEL_READER_TYPE_BOF', 0x809);
\define('SPREADSHEET_EXCEL_READER_TYPE_EOF', 0x0a);
\define('SPREADSHEET_EXCEL_READER_TYPE_BOUNDSHEET', 0x85);
\define('SPREADSHEET_EXCEL_READER_TYPE_DIMENSION', 0x200);
\define('SPREADSHEET_EXCEL_READER_TYPE_ROW', 0x208);
\define('SPREADSHEET_EXCEL_READER_TYPE_DBCELL', 0xd7);
\define('SPREADSHEET_EXCEL_READER_TYPE_FILEPASS', 0x2f);
\define('SPREADSHEET_EXCEL_READER_TYPE_NOTE', 0x1c);
\define('SPREADSHEET_EXCEL_READER_TYPE_TXO', 0x1b6);
\define('SPREADSHEET_EXCEL_READER_TYPE_RK', 0x7e);
\define('SPREADSHEET_EXCEL_READER_TYPE_RK2', 0x27e);
\define('SPREADSHEET_EXCEL_READER_TYPE_MULRK', 0xbd);
\define('SPREADSHEET_EXCEL_READER_TYPE_MULBLANK', 0xbe);
\define('SPREADSHEET_EXCEL_READER_TYPE_INDEX', 0x20b);
\define('SPREADSHEET_EXCEL_READER_TYPE_SST', 0xfc);
\define('SPREADSHEET_EXCEL_READER_TYPE_EXTSST', 0xff);
\define('SPREADSHEET_EXCEL_READER_TYPE_CONTINUE', 0x3c);
\define('SPREADSHEET_EXCEL_READER_TYPE_LABEL', 0x204);
\define('SPREADSHEET_EXCEL_READER_TYPE_LABELSST', 0xfd);
\define('SPREADSHEET_EXCEL_READER_TYPE_NUMBER', 0x203);
\define('SPREADSHEET_EXCEL_READER_TYPE_NAME', 0x18);
\define('SPREADSHEET_EXCEL_READER_TYPE_ARRAY', 0x221);
\define('SPREADSHEET_EXCEL_READER_TYPE_STRING', 0x207);
\define('SPREADSHEET_EXCEL_READER_TYPE_FORMULA', 0x406);
\define('SPREADSHEET_EXCEL_READER_TYPE_FORMULA2', 0x6);
\define('SPREADSHEET_EXCEL_READER_TYPE_FORMAT', 0x41e);
\define('SPREADSHEET_EXCEL_READER_TYPE_XF', 0xe0);
\define('SPREADSHEET_EXCEL_READER_TYPE_BOOLERR', 0x205);
\define('SPREADSHEET_EXCEL_READER_TYPE_UNKNOWN', 0xffff);
\define('SPREADSHEET_EXCEL_READER_TYPE_NINETEENFOUR', 0x22);
\define('SPREADSHEET_EXCEL_READER_TYPE_MERGEDCELLS', 0xE5);

// Date conversion: day offsets subtracted from an Excel serial date for the
// default and the 1904 date systems.
\define('SPREADSHEET_EXCEL_READER_UTCOFFSETDAYS', 25569);
\define('SPREADSHEET_EXCEL_READER_UTCOFFSETDAYS1904', 24107);
// Despite the "MS" in the name this is 24 * 60 * 60, i.e. seconds per day.
\define('SPREADSHEET_EXCEL_READER_MSINADAY', 86400);

// sprintf() format applied to numbers whose cell format is not recognised.
\define('SPREADSHEET_EXCEL_READER_DEF_NUM_FORMAT', "%s");
-
- /*
- * Place includes, constant defines and $_GLOBAL settings here.
- * Make sure they have appropriate docblocks to avoid phpDocumentor
- * construing they are documented by the page-level docblock.
- */
-
- /**
- * A class for reading Microsoft Excel Spreadsheets.
- *
- * Originally developed by Vadim Tkachenko under the name PHPExcelReader.
- * (http://sourceforge.net/projects/phpexcelreader)
- * Based on the Java version by Andy Khan (http://www.andykhan.com). Now
- * maintained by David Sanders. Reads only Biff 7 and Biff 8 formats.
- *
- * @category Spreadsheet
- * @package Spreadsheet_Excel_Reader
- * @author Vadim Tkachenko <vt@phpapache.com>
- * @copyright 1997-2005 The PHP Group
- * @license http://www.php.net/license/3_0.txt PHP License 3.0
- * @version Release: @package_version@
- * @link http://pear.php.net/package/PackageName
- * @see OLE, Spreadsheet_Excel_Writer
- *
- */
- class Spreadsheet_Excel_Reader
- {
-
/**
 * Worksheets announced by the workbook's BOUNDSHEET records.
 *
 * Each entry is array('name' => sheet name, 'offset' => position of the
 * sheet's BOF record inside $data).
 *
 * @var array
 * @access public
 */
public $boundsheets = array();

/**
 * Format information collected from the workbook globals.
 *
 * Integer keys map a format index to the format string of a FORMAT record.
 * The 'xfrecords' key holds one array per XF record, in file order, with
 * 'type' ('date', 'number' or 'other'), 'format' and, for 'other', 'code'.
 *
 * @var array
 * @access public
 */
public $formatRecords = array();

/**
 * Shared string table: the strings of the SST record, in file order.
 * LABELSST cells refer to entries by index.
 *
 * @var array
 * @access public
 */
public $sst = array();

/**
 * Array of worksheets
 *
 * The data is stored in 'cells' and the meta-data is stored in an array
 * called 'cellsInfo'
 *
 * Example:
 *
 * $sheets --> 'cells' --> row --> column --> Interpreted value
 *         --> 'cellsInfo' --> row --> column --> 'type' - Can be 'date', 'number', or 'unknown'
 *                                            --> 'raw' - The raw data that Excel stores for that data cell
 *                                            --> 'rowspan' / 'colspan' - set on the first cell of a merged range
 *         --> 'numRows', 'numCols', 'maxrow', 'maxcol' - sheet dimensions
 *
 * @var array
 * @access public
 */
public $sheets = array();

/**
 * The workbook stream as returned by the OLE reader
 *
 * @var string
 * @access public
 */
public $data;

/**
 * OLE reader used to extract the workbook stream from the file
 *
 * @var OLERead
 * @access private
 */
public $_ole;

/**
 * Output encoding chosen with setOutputEncoding()
 *
 * @var string
 * @access private
 */
public $_defaultEncoding;

/**
 * Name of the function used to convert UTF-16LE text ('iconv',
 * 'mb_convert_encoding', or '' when none is available); see setUTFEncoder()
 *
 * @var string
 * @access private
 */
public $_encoderFunction = '';

/**
 * Default number format: a sprintf() format string
 *
 * @var string
 * @access private
 */
public $_defaultFormat = SPREADSHEET_EXCEL_READER_DEF_NUM_FORMAT;

/**
 * sprintf() formats forced per column, keyed by 1-based column number
 *
 * @var array
 * @access private
 */
public $_columnsFormat = array();

/**
 * Row offset; 'maxrow' of each sheet is seeded with this value minus one.
 * NOTE(review): presumably the index given to the first row - confirm
 * against addcell().
 *
 * @var integer
 * @access private
 */
public $_rowoffset = 1;

/**
 * Column offset; 'maxcol' of each sheet is seeded with this value minus one.
 * NOTE(review): presumably the index given to the first column - confirm
 * against addcell().
 *
 * @var integer
 * @access private
 */
public $_coloffset = 1;

/**
 * True when the workbook's NINETEENFOUR record says it uses the 1904 date
 * system. Declared with a default so that workbooks lacking the record do
 * not trigger an undefined-property read.
 *
 * @var boolean
 * @access public
 */
public $nineteenFour = false;

/**
 * Index (key into $boundsheets / $sheets) of the sheet being parsed
 *
 * @var integer
 * @access private
 */
public $sn;

/**
 * Format selected by isDate() for the cell being parsed
 *
 * @var string
 * @access private
 */
public $curformat;

/**
 * Type selected by isDate() for the cell being parsed
 * ('date', 'number' or 'unknown'); unset before each record
 *
 * @var string
 * @access private
 */
public $rectype;

/**
 * Factor applied to a numeric value before formatting (100 for percent
 * formats); reset to 1 before each record
 *
 * @var integer
 * @access private
 */
public $multiplier = 1;

/**
 * List of default date formats used by Excel, keyed by built-in format
 * index; the values are date() format strings
 *
 * @var array
 * @access public
 */
public $dateFormats = array(
    0xe => "d/m/Y",
    0xf => "d-M-Y",
    0x10 => "d-M",
    0x11 => "M-Y",
    0x12 => "h:i a",
    0x13 => "h:i:s a",
    0x14 => "H:i",
    0x15 => "H:i:s",
    0x16 => "d/m/Y H:i",
    0x2d => "i:s",
    0x2e => "H:i:s",
    0x2f => "i:s.S"
);

/**
 * Default number formats used by Excel, keyed by built-in format index;
 * the values are sprintf() format strings (the Excel format each one
 * approximates is given in the trailing comment)
 *
 * @var array
 * @access public
 */
public $numberFormats = array(
    0x1 => "%1.0f", // "0"
    0x2 => "%1.2f", // "0.00",
    0x3 => "%1.0f", // "#,##0",
    0x4 => "%1.2f", // "#,##0.00",
    0x5 => "%1.0f", /*"$#,##0;($#,##0)",*/
    0x6 => '$%1.0f', /*"$#,##0;($#,##0)",*/
    0x7 => '$%1.2f', // "$#,##0.00;($#,##0.00)",
    0x8 => '$%1.2f', // "$#,##0.00;($#,##0.00)",
    0x9 => '%1.0f%%', // "0%"
    0xa => '%1.2f%%', // "0.00%"
    0xb => '%1.2f', // 0.00E00",
    0x25 => '%1.0f', // "#,##0;(#,##0)",
    0x26 => '%1.0f', // "#,##0;(#,##0)",
    0x27 => '%1.2f', // "#,##0.00;(#,##0.00)",
    0x28 => '%1.2f', // "#,##0.00;(#,##0.00)",
    0x29 => '%1.0f', // "#,##0;(#,##0)",
    0x2a => '$%1.0f', // "$#,##0;($#,##0)",
    0x2b => '%1.2f', // "#,##0.00;(#,##0.00)",
    0x2c => '$%1.2f', // "$#,##0.00;($#,##0.00)",
    0x30 => '%1.0f'
);
-
- // "##0.0E0";
-
- // }}}
- // {{{ Spreadsheet_Excel_Reader()
-
/**
 * Constructor
 *
 * Creates the OLE reader and selects iconv as the UTF-16 converter.
 *
 * This class lives in a namespace, where a method named after the class is
 * NOT treated as a constructor, so the initialisation has to be done in
 * __construct() or $_ole would still be null when read() is called.
 */
function __construct()
{
    $this->_ole = new OLERead();
    $this->setUTFEncoder('iconv');
}

/**
 * Legacy PHP 4 style initialiser
 *
 * Kept so that existing code calling this method explicitly keeps working;
 * it simply repeats the initialisation done by __construct().
 */
function Spreadsheet_Excel_Reader()
{
    $this->__construct();
}
-
- // }}}
- // {{{ setOutputEncoding()
-
/**
 * Choose the character encoding for decoded text
 *
 * The name is only stored here, in $_defaultEncoding.
 * NOTE(review): presumably consumed by _encodeUTF16() - confirm.
 *
 * @access public
 * @param string $encoding Name of the target encoding
 */
function setOutputEncoding($encoding)
{
    $this->_defaultEncoding = $encoding;
}
-
- // }}}
- // {{{ setUTFEncoder()
-
/**
 * Select the function used to convert UTF-16LE text
 *
 * 'iconv' selects iconv() and 'mb' selects mb_convert_encoding(). When the
 * requested function does not exist, or the name is neither of the two,
 * $_encoderFunction is left as an empty string.
 *
 * @access public
 * @param string $encoder Either 'iconv' or 'mb'
 */
function setUTFEncoder($encoder = 'iconv')
{
    // switch compares loosely, exactly like the == tests it replaces
    switch ($encoder) {
        case 'iconv':
            $converter = 'iconv';
            break;
        case 'mb':
            $converter = 'mb_convert_encoding';
            break;
        default:
            $converter = '';
            break;
    }

    if ($converter !== '' && ! function_exists($converter)) {
        $converter = '';
    }

    $this->_encoderFunction = $converter;
}
-
- // }}}
- // {{{ setRowColOffset()
-
/**
 * Set the row offset and the column offset to the same value
 *
 * @access public
 * @param integer $iOffset Value stored in both $_rowoffset and $_coloffset
 */
function setRowColOffset($iOffset)
{
    $this->_rowoffset = $this->_coloffset = $iOffset;
}
-
- // }}}
- // {{{ setDefaultFormat()
-
/**
 * Replace the default number format
 *
 * The value is used as the sprintf() format for numeric cells whose cell
 * format is neither a known date format nor a known number format.
 *
 * @access public
 * @param string $sFormat sprintf() format string
 */
function setDefaultFormat($sFormat)
{
    $this->_defaultFormat = $sFormat;
}
-
- // }}}
- // {{{ setColumnFormat()
-
/**
 * Force one column to be formatted with a given format
 *
 * The parser looks the format up with the record's zero-based column plus
 * one, so $column is a 1-based column number.
 *
 * @access public
 * @param integer $column  Column number (1-based)
 * @param string  $sFormat sprintf() format applied to non-date numbers in that column
 */
function setColumnFormat($column, $sFormat)
{
    $this->_columnsFormat[$column] = $sFormat;
}
-
- // }}}
- // {{{ read()
-
/**
 * Read the spreadsheet file using OLE, then parse
 *
 * On success the parsed content is available in $sheets, $boundsheets,
 * $sst and $formatRecords.
 *
 * @access public
 * @param string $sFileName Path of the file to read
 * @return bool True when the workbook was parsed, false when the OLE
 *              container could not be read or holds no parsable workbook
 * @throws \RuntimeException When the OLE reader reports error code 1
 *                           (file not readable). This replaces the former
 *                           die(), which ended the script at the same point.
 */
function read($sFileName)
{
    $res = $this->_ole->read($sFileName);

    if ($res === false) {
        if ($this->_ole->error == 1) {
            // bad file
            throw new \RuntimeException('The filename ' . $sFileName . ' is not readable');
        }
        // Any other failure: there is no trustworthy workbook stream to
        // parse, so report it instead of parsing stale or empty data.
        return false;
    }

    $this->data = $this->_ole->getWorkBook();
    if (! is_string($this->data) || $this->data === '') {
        return false;
    }

    // _parse() may report failure with values other than false, so only an
    // explicit true counts as success.
    return $this->_parse() === true;
}
-
- // }}}
- // {{{ _parse()
-
/**
 * Parse a workbook
 *
 * Walks the workbook globals substream at the start of $data record by
 * record (2-byte type, 2-byte length, body) and collects:
 *  - the shared string table into $sst,
 *  - FORMAT and XF records into $formatRecords,
 *  - the 1904 date-system flag into $nineteenFour,
 *  - sheet names and offsets into $boundsheets.
 * It then calls _parsesheet() for every entry in $boundsheets.
 *
 * @access private
 * @return bool False when the stream is not a BIFF7/BIFF8 workbook, is
 *              password protected (FILEPASS record), is truncated, or has a
 *              malformed shared string table; true otherwise
 */
function _parse()
{
    if (! is_string($this->data)) {
        return false;
    }
    $dataLength = strlen($this->data);
    // The leading BOF record must provide a 4-byte header plus the version
    // and substream type fields.
    if ($dataLength < 8) {
        return false;
    }

    $pos = 0;
    $length = ord($this->data[$pos + 2]) | (ord($this->data[$pos + 3]) << 8);
    $version = ord($this->data[$pos + 4]) | (ord($this->data[$pos + 5]) << 8);
    $substreamType = ord($this->data[$pos + 6]) | (ord($this->data[$pos + 7]) << 8);

    if (($version != SPREADSHEET_EXCEL_READER_BIFF8) && ($version != SPREADSHEET_EXCEL_READER_BIFF7)) {
        return false;
    }

    if ($substreamType != SPREADSHEET_EXCEL_READER_WORKBOOKGLOBALS) {
        return false;
    }

    $pos += $length + 4;

    while (true) {
        // Without this check a stream that lacks its EOF record would be
        // read past its end forever.
        if ($pos + 4 > $dataLength) {
            return false;
        }
        $code = ord($this->data[$pos]) | (ord($this->data[$pos + 1]) << 8);
        $length = ord($this->data[$pos + 2]) | (ord($this->data[$pos + 3]) << 8);
        if ($code == SPREADSHEET_EXCEL_READER_TYPE_EOF) {
            break;
        }

        switch ($code) {
            case SPREADSHEET_EXCEL_READER_TYPE_SST:
                $spos = $pos + 4;
                $limitpos = $spos + $length;
                // The string count is read from offset 4 of the record body;
                // the strings themselves start at offset 8.
                $uniqueStrings = $this->_GetInt4d($this->data, $spos + 4);
                $spos += 8;
                for ($i = 0; $i < $uniqueStrings; $i ++) {
                    if ($spos == $limitpos) {
                        // The next string starts exactly where this record
                        // ends, so it lives in the following CONTINUE record.
                        $opcode = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                        $conlength = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                        if ($opcode != SPREADSHEET_EXCEL_READER_TYPE_CONTINUE) {
                            return false;
                        }
                        $spos += 4;
                        $limitpos = $spos + $conlength;
                    }
                    // Read in the number of characters
                    $numChars = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                    $spos += 2;
                    $optionFlags = ord($this->data[$spos]);
                    $spos ++;
                    // bit 0 clear: one byte per character; set: UTF-16LE
                    $asciiEncoding = (($optionFlags & 0x01) == 0);
                    $extendedString = (($optionFlags & 0x04) != 0);

                    // See if string contains formatting information
                    $richString = (($optionFlags & 0x08) != 0);

                    if ($richString) {
                        // Read in the crun
                        $formattingRuns = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                        $spos += 2;
                    }

                    if ($extendedString) {
                        // Read in cchExtRst
                        $extendedRunLength = $this->_GetInt4d($this->data, $spos);
                        $spos += 4;
                    }

                    $len = ($asciiEncoding) ? $numChars : $numChars * 2;
                    if ($spos + $len < $limitpos) {
                        $retstr = substr($this->data, $spos, $len);
                        $spos += $len;
                    } else {
                        // The string reaches the end of the record: take what
                        // is here and collect the rest from CONTINUE records.
                        $retstr = substr($this->data, $spos, $limitpos - $spos);
                        $bytesRead = $limitpos - $spos;
                        $charsLeft = $numChars - (($asciiEncoding) ? $bytesRead : ($bytesRead / 2));
                        $spos = $limitpos;

                        while ($charsLeft > 0) {
                            $opcode = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                            $conlength = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                            if ($opcode != SPREADSHEET_EXCEL_READER_TYPE_CONTINUE) {
                                return false;
                            }
                            $spos += 4;
                            $limitpos = $spos + $conlength;
                            // Each continued piece carries its own encoding
                            // flag: 0 = one byte per character, else UTF-16LE.
                            $option = ord($this->data[$spos]);
                            $spos += 1;
                            if ($asciiEncoding && ($option == 0)) {
                                $len = min($charsLeft, $limitpos - $spos);
                                $retstr .= substr($this->data, $spos, $len);
                                $charsLeft -= $len;
                                $asciiEncoding = true;
                            } elseif (! $asciiEncoding && ($option != 0)) {
                                $len = min($charsLeft * 2, $limitpos - $spos);
                                $retstr .= substr($this->data, $spos, $len);
                                $charsLeft -= $len / 2;
                                $asciiEncoding = false;
                            } elseif (! $asciiEncoding && ($option == 0)) {
                                // Bummer - the string starts off as Unicode, but after the
                                // continuation it is in straightforward ASCII encoding
                                $len = min($charsLeft, $limitpos - $spos);
                                for ($j = 0; $j < $len; $j ++) {
                                    $retstr .= $this->data[$spos + $j] . chr(0);
                                }
                                $charsLeft -= $len;
                                $asciiEncoding = false;
                            } else {
                                // The string started as single bytes but goes
                                // on as UTF-16LE: widen what was read so far.
                                // (Appending with .= is essential here; plain
                                // assignment kept only the last character.)
                                $newstr = '';
                                $readSoFar = strlen($retstr);
                                for ($j = 0; $j < $readSoFar; $j ++) {
                                    $newstr .= $retstr[$j] . chr(0);
                                }
                                $retstr = $newstr;
                                $len = min($charsLeft * 2, $limitpos - $spos);
                                $retstr .= substr($this->data, $spos, $len);
                                $charsLeft -= $len / 2;
                                $asciiEncoding = false;
                            }
                            $spos += $len;
                        }
                    }
                    $retstr = ($asciiEncoding) ? $retstr : $this->_encodeUTF16($retstr);

                    // Skip the formatting runs (4 bytes each) of rich strings
                    if ($richString) {
                        $spos += 4 * $formattingRuns;
                    }

                    // For extended strings, skip over the extended string data
                    if ($extendedString) {
                        $spos += $extendedRunLength;
                    }

                    $this->sst[] = $retstr;
                }
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_FILEPASS:
                // A FILEPASS record marks the workbook as protected; give up.
                return false;

            case SPREADSHEET_EXCEL_READER_TYPE_NAME:
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_FORMAT:
                $indexCode = ord($this->data[$pos + 4]) | (ord($this->data[$pos + 5]) << 8);

                if ($version == SPREADSHEET_EXCEL_READER_BIFF8) {
                    $numchars = ord($this->data[$pos + 6]) | (ord($this->data[$pos + 7]) << 8);
                    if (ord($this->data[$pos + 8]) == 0) {
                        $formatString = substr($this->data, $pos + 9, $numchars);
                    } else {
                        // NOTE(review): stored as raw two-byte characters,
                        // not converted - confirm this is intended.
                        $formatString = substr($this->data, $pos + 9, $numchars * 2);
                    }
                } else {
                    $numchars = ord($this->data[$pos + 6]);
                    // NOTE(review): takes $numchars * 2 bytes for BIFF7 as
                    // well - confirm against the record layout.
                    $formatString = substr($this->data, $pos + 7, $numchars * 2);
                }

                $this->formatRecords[$indexCode] = $formatString;
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_XF:
                $indexCode = ord($this->data[$pos + 6]) | (ord($this->data[$pos + 7]) << 8);
                if (array_key_exists($indexCode, $this->dateFormats)) {
                    $this->formatRecords['xfrecords'][] = array(
                        'type' => 'date',
                        'format' => $this->dateFormats[$indexCode]
                    );
                } elseif (array_key_exists($indexCode, $this->numberFormats)) {
                    $this->formatRecords['xfrecords'][] = array(
                        'type' => 'number',
                        'format' => $this->numberFormats[$indexCode]
                    );
                } else {
                    // Start from a clean slate for every XF record so that a
                    // format string found for an earlier record cannot be
                    // mistaken for this one's.
                    $isdate = false;
                    $formatstr = '';
                    if (($indexCode > 0) && isset($this->formatRecords[$indexCode])) {
                        $formatstr = $this->formatRecords[$indexCode];
                        // A custom format made up only of the characters in
                        // the class below is treated as a date/time format.
                        if (preg_match("/[^hmsday\/-:\s]/i", $formatstr) == 0) {
                            $isdate = true;
                            $formatstr = str_replace('mm', 'i', $formatstr);
                            $formatstr = str_replace('h', 'H', $formatstr);
                        }
                    }

                    if ($isdate) {
                        $this->formatRecords['xfrecords'][] = array(
                            'type' => 'date',
                            'format' => $formatstr
                        );
                    } else {
                        $this->formatRecords['xfrecords'][] = array(
                            'type' => 'other',
                            'format' => '',
                            'code' => $indexCode
                        );
                    }
                }
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_NINETEENFOUR:
                $this->nineteenFour = (ord($this->data[$pos + 4]) == 1);
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_BOUNDSHEET:
                $rec_offset = $this->_GetInt4d($this->data, $pos + 4);
                $rec_length = ord($this->data[$pos + 10]);
                $rec_name = '';

                if ($version == SPREADSHEET_EXCEL_READER_BIFF8) {
                    $chartype = ord($this->data[$pos + 11]);
                    if ($chartype == 0) {
                        $rec_name = substr($this->data, $pos + 12, $rec_length);
                    } else {
                        $rec_name = $this->_encodeUTF16(substr($this->data, $pos + 12, $rec_length * 2));
                    }
                } elseif ($version == SPREADSHEET_EXCEL_READER_BIFF7) {
                    $rec_name = substr($this->data, $pos + 11, $rec_length);
                }
                $this->boundsheets[] = array(
                    'name' => $rec_name,
                    'offset' => $rec_offset
                );
                break;
        }

        $pos += $length + 4;
    }

    foreach ($this->boundsheets as $key => $val) {
        $this->sn = $key;
        $this->_parsesheet($val['offset']);
    }
    return true;
}
-
/**
 * Parse a worksheet
 *
 * Reads the worksheet substream that starts at $spos in $data and stores
 * its cells, dimensions and merged-cell spans in $sheets[$this->sn].
 * Records are read one after another (2-byte type, 2-byte length, body)
 * until an EOF record or the end of the data is reached.
 *
 * @access private
 * @param integer $spos Offset of the sheet's BOF record inside $data
 * @return integer|null -1 when the BOF record is missing or not BIFF7/BIFF8,
 *                      -2 when the substream is not a worksheet,
 *                      nothing (null) after a completed parse
 * @todo fix return codes
 */
function _parsesheet($spos)
{
    $dataLength = strlen($this->data);
    // A BOF record needs its 4-byte header plus version and substream type.
    if (($spos < 0) || ($spos + 8 > $dataLength)) {
        return - 1;
    }

    // read BOF
    $length = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
    $version = ord($this->data[$spos + 4]) | (ord($this->data[$spos + 5]) << 8);
    $substreamType = ord($this->data[$spos + 6]) | (ord($this->data[$spos + 7]) << 8);

    if (($version != SPREADSHEET_EXCEL_READER_BIFF8) && ($version != SPREADSHEET_EXCEL_READER_BIFF7)) {
        return - 1;
    }

    if ($substreamType != SPREADSHEET_EXCEL_READER_WORKSHEET) {
        return - 2;
    }

    $spos += $length + 4;

    // Seed the extent once per sheet. Doing this for every record, as
    // before, would wipe whatever has been accumulated so far.
    // NOTE(review): addcell() is outside this block; presumably it raises
    // maxrow/maxcol as cells are added - confirm.
    $this->sheets[$this->sn]['maxrow'] = $this->_rowoffset - 1;
    $this->sheets[$this->sn]['maxcol'] = $this->_coloffset - 1;

    // The length check stops the loop on truncated data instead of reading
    // past the end forever.
    while ($spos + 4 <= $dataLength) {
        // Compare the full 16-bit type: other record types share EOF's low byte.
        $code = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
        if ($code == SPREADSHEET_EXCEL_READER_TYPE_EOF) {
            break;
        }
        $length = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
        $spos += 4;

        unset($this->rectype);
        $this->multiplier = 1; // need for format with %

        switch ($code) {
            case SPREADSHEET_EXCEL_READER_TYPE_DIMENSION:
                if (! isset($this->numRows)) {
                    if (($length == 10) || ($version == SPREADSHEET_EXCEL_READER_BIFF7)) {
                        // short layout: 2-byte row fields
                        $this->sheets[$this->sn]['numRows'] = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                        $this->sheets[$this->sn]['numCols'] = ord($this->data[$spos + 6]) | (ord($this->data[$spos + 7]) << 8);
                    } else {
                        // long layout: 4-byte row fields, only the low 16 bits are used
                        $this->sheets[$this->sn]['numRows'] = ord($this->data[$spos + 4]) | (ord($this->data[$spos + 5]) << 8);
                        $this->sheets[$this->sn]['numCols'] = ord($this->data[$spos + 10]) | (ord($this->data[$spos + 11]) << 8);
                    }
                }
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_MERGEDCELLS:
                $cellRanges = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                for ($i = 0; $i < $cellRanges; $i ++) {
                    // Each range is 8 bytes: first row, last row, first column, last column.
                    $base = $spos + 8 * $i + 2;
                    $fr = ord($this->data[$base]) | (ord($this->data[$base + 1]) << 8);
                    $lr = ord($this->data[$base + 2]) | (ord($this->data[$base + 3]) << 8);
                    $fc = ord($this->data[$base + 4]) | (ord($this->data[$base + 5]) << 8);
                    $lc = ord($this->data[$base + 6]) | (ord($this->data[$base + 7]) << 8);
                    if ($lr - $fr > 0) {
                        $this->sheets[$this->sn]['cellsInfo'][$fr + 1][$fc + 1]['rowspan'] = $lr - $fr + 1;
                    }
                    if ($lc - $fc > 0) {
                        $this->sheets[$this->sn]['cellsInfo'][$fr + 1][$fc + 1]['colspan'] = $lc - $fc + 1;
                    }
                }
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_RK:
            case SPREADSHEET_EXCEL_READER_TYPE_RK2:
                $row = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                $column = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                $rknum = $this->_GetInt4d($this->data, $spos + 6);
                $numValue = $this->_GetIEEE754($rknum);
                if ($this->isDate($spos)) {
                    list ($string, $raw) = $this->createDate($numValue);
                } else {
                    $raw = $numValue;
                    if (isset($this->_columnsFormat[$column + 1])) {
                        $this->curformat = $this->_columnsFormat[$column + 1];
                    }
                    $string = sprintf($this->curformat, $numValue * $this->multiplier);
                }
                $this->addcell($row, $column, $string, $raw);
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_LABELSST:
                $row = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                $column = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                $index = $this->_GetInt4d($this->data, $spos + 6);
                // A cell may point past the strings that were actually read
                // (damaged table); store an empty string rather than reading
                // an undefined index.
                $this->addcell($row, $column, isset($this->sst[$index]) ? $this->sst[$index] : '');
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_MULRK:
                $row = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                $colFirst = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                // the last column index sits in the final two bytes of the record
                $colLast = ord($this->data[$spos + $length - 2]) | (ord($this->data[$spos + $length - 1]) << 8);
                $columns = $colLast - $colFirst + 1;
                $tmppos = $spos + 4;
                for ($i = 0; $i < $columns; $i ++) {
                    // every cell takes 6 bytes: 2-byte XF index, 4-byte RK value
                    $numValue = $this->_GetIEEE754($this->_GetInt4d($this->data, $tmppos + 2));
                    // isDate() reads the XF index 4 bytes after the offset it is given
                    if ($this->isDate($tmppos - 4)) {
                        list ($string, $raw) = $this->createDate($numValue);
                    } else {
                        $raw = $numValue;
                        if (isset($this->_columnsFormat[$colFirst + $i + 1])) {
                            $this->curformat = $this->_columnsFormat[$colFirst + $i + 1];
                        }
                        $string = sprintf($this->curformat, $numValue * $this->multiplier);
                    }
                    $tmppos += 6;
                    $this->addcell($row, $colFirst + $i, $string, $raw);
                }
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_NUMBER:
                $row = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                $column = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                $this->_addNumericCell($spos, $row, $column);
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_FORMULA:
            case SPREADSHEET_EXCEL_READER_TYPE_FORMULA2:
                $row = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                $column = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                // 0xFFFF in bytes 12-13 marks a non-numeric result, with
                // byte 6 giving its kind: 0 string (the value follows in a
                // STRING record), 1 boolean, 2 error, 3 empty string.
                // None of these produces a cell here.
                $isSpecialResult = (ord($this->data[$spos + 12]) == 255)
                    && (ord($this->data[$spos + 13]) == 255)
                    && (ord($this->data[$spos + 6]) <= 3);
                if (! $isSpecialResult) {
                    // result is a number, so first 14 bytes are just like a _NUMBER record
                    $this->_addNumericCell($spos, $row, $column);
                }
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_BOOLERR:
                $row = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                $column = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                $string = ord($this->data[$spos + 6]);
                $this->addcell($row, $column, $string);
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_ROW:
            case SPREADSHEET_EXCEL_READER_TYPE_DBCELL:
            case SPREADSHEET_EXCEL_READER_TYPE_MULBLANK:
                break;

            case SPREADSHEET_EXCEL_READER_TYPE_LABEL:
                $row = ord($this->data[$spos]) | (ord($this->data[$spos + 1]) << 8);
                $column = ord($this->data[$spos + 2]) | (ord($this->data[$spos + 3]) << 8);
                $labelLength = ord($this->data[$spos + 6]) | (ord($this->data[$spos + 7]) << 8);
                $this->addcell($row, $column, substr($this->data, $spos + 8, $labelLength));
                break;

            default:
                // record type not handled: skipped
                break;
        }
        $spos += $length;
    }

    // Without a DIMENSION record fall back to the recorded extent
    if (! isset($this->sheets[$this->sn]['numRows'])) {
        $this->sheets[$this->sn]['numRows'] = $this->sheets[$this->sn]['maxrow'];
    }
    if (! isset($this->sheets[$this->sn]['numCols'])) {
        $this->sheets[$this->sn]['numCols'] = $this->sheets[$this->sn]['maxcol'];
    }
}

/**
 * Add the cell for a record that stores an 8-byte double at offset 6
 * (NUMBER records and FORMULA records with a numeric result)
 *
 * @access private
 * @param integer $spos   Offset of the record body inside $data
 * @param integer $row    Zero-based row read from the record
 * @param integer $column Zero-based column read from the record
 */
function _addNumericCell($spos, $row, $column)
{
    if ($this->isDate($spos)) {
        // unpack('d') uses the machine's byte order
        $tmp = unpack("ddouble", substr($this->data, $spos + 6, 8));
        list ($string, $raw) = $this->createDate($tmp['double']);
    } else {
        if (isset($this->_columnsFormat[$column + 1])) {
            $this->curformat = $this->_columnsFormat[$column + 1];
        }
        $raw = $this->createNumber($spos);
        $string = sprintf($this->curformat, $raw * $this->multiplier);
    }
    $this->addcell($row, $column, $string, $raw);
}
-
/**
 * Check whether the record currently being read is formatted as a date.
 *
 * The 16-bit little-endian XF index stored at bytes 4-5 of the record is
 * looked up in $this->formatRecords['xfrecords']. As a side effect this
 * sets $this->curformat and $this->rectype ('date', 'number' or 'unknown')
 * for the cell that is about to be added, and sets $this->multiplier to
 * 100 when the XF index is 0x9 or 0xa.
 *
 * An XF index that has no entry in the table is handled like an unknown
 * format instead of raising undefined-index warnings.
 *
 * @param integer $spos Offset in $this->data at which the record's data starts
 * @return boolean True if date, false otherwise
 */
function isDate($spos)
{
    $xfindex = ord($this->data[$spos + 4]) | ord($this->data[$spos + 5]) << 8;

    // Fetch the XF record defensively: a damaged or truncated workbook can
    // reference an index that was never registered.
    $xfrecord = null;
    if (isset($this->formatRecords['xfrecords'][$xfindex])) {
        $xfrecord = $this->formatRecords['xfrecords'][$xfindex];
    }
    $type = isset($xfrecord['type']) ? $xfrecord['type'] : null;
    $format = isset($xfrecord['format']) ? $xfrecord['format'] : null;

    if ($type == 'date') {
        $this->curformat = $format;
        $this->rectype = 'date';
        return true;
    }

    if ($type == 'number') {
        $this->curformat = $format;
        $this->rectype = 'number';
        // NOTE(review): 0x9 / 0xa look like the built-in percentage formats,
        // but the value compared here is the XF index - confirm intent.
        if (($xfindex == 0x9) || ($xfindex == 0xa)) {
            $this->multiplier = 100;
        }
    } else {
        $this->curformat = $this->_defaultFormat;
        $this->rectype = 'unknown';
    }

    return false;
}
-
- // }}}
- // {{{ createDate()
-
/**
 * Convert a raw Excel date/time value into a formatted string.
 *
 * The raw value is handled as a count of days (with the time of day in
 * the fractional part) relative to an epoch. On Windows, the epoch is
 * 30/12/1899 and on Mac it's 01/01/1904; $this->nineteenFour selects
 * which of the two offset constants is applied.
 *
 * Values greater than 1 are converted to a Unix timestamp and formatted
 * with $this->curformat. Any other value is treated as a bare time of day
 * and formatted via mktime() on the current date.
 *
 * @access private
 * @param float $numValue The raw Excel value to convert
 * @return array First element is the formatted string; the second is the
 *               Unix timestamp for values greater than 1, otherwise the
 *               unchanged raw value
 */
function createDate($numValue)
{
    // Written as a negated "> 1" so that every value the date branch would
    // reject (including NaN) lands in the time-of-day branch.
    if (!($numValue > 1)) {
        // NOTE(review): the arithmetic below only works if
        // SPREADSHEET_EXCEL_READER_MSINADAY is seconds per day - confirm.
        $wholeHours = floor($numValue * 24);
        $wholeMinutes = floor($numValue * 24 * 60) - $wholeHours * 60;
        $wholeSeconds = floor($numValue * SPREADSHEET_EXCEL_READER_MSINADAY) - $wholeHours * 60 * 60 - $wholeMinutes * 60;
        $formatted = date($this->curformat, mktime($wholeHours, $wholeMinutes, $wholeSeconds));

        return array(
            $formatted,
            $numValue
        );
    }

    if ($this->nineteenFour) {
        $epochOffsetDays = SPREADSHEET_EXCEL_READER_UTCOFFSETDAYS1904;
    } else {
        $epochOffsetDays = SPREADSHEET_EXCEL_READER_UTCOFFSETDAYS;
    }

    $daysSinceUnixEpoch = $numValue - $epochOffsetDays;
    $timestamp = round(($daysSinceUnixEpoch + 1) * SPREADSHEET_EXCEL_READER_MSINADAY);

    return array(
        date($this->curformat, $timestamp),
        $timestamp
    );
}
-
/**
 * Decode the 8-byte floating point value of the record at $spos.
 *
 * The value is rebuilt by hand from two 32-bit words read with
 * _GetInt4d(): the word at $spos + 10 supplies the sign, the 11-bit
 * exponent and the top 20 mantissa bits, and the word at $spos + 6
 * supplies the remaining 32 mantissa bits.
 *
 * @param integer $spos Offset in $this->data at which the record's data starts
 * @return integer|float The decoded number
 */
function createNumber($spos)
{
    $highWord = $this->_GetInt4d($this->data, $spos + 10);
    $lowWord = $this->_GetInt4d($this->data, $spos + 6);

    $isNegative = ($highWord & 0x80000000) >> 31;
    $biasedExponent = ($highWord & 0x7ff00000) >> 20;
    $power = $biasedExponent - 1023;

    // Top 20 mantissa bits with the implicit leading 1 restored.
    $highMantissa = 0x100000 | ($highWord & 0x000fffff);
    $result = $highMantissa / pow(2, (20 - $power));

    // The top bit of the low word is added separately from its other 31 bits.
    $lowTopBit = ($lowWord & 0x80000000) >> 31;
    if ($lowTopBit != 0) {
        $result += 1 / pow(2, (21 - $power));
    }

    $lowRest = $lowWord & 0x7fffffff;
    $result += $lowRest / pow(2, (52 - $power));

    return $isNegative ? -1 * $result : $result;
}
-
/**
 * Store a cell value in the current sheet and grow the sheet bounds.
 *
 * The row and column are shifted by $this->_rowoffset and
 * $this->_coloffset before being used as keys. The display string goes
 * into ['cells']; the raw value and the record type (when
 * $this->rectype is set) go into ['cellsInfo'].
 *
 * @param integer $row    Row index as read from the record
 * @param integer $col    Column index as read from the record
 * @param mixed   $string Display value of the cell
 * @param mixed   $raw    Unformatted value; '' (the default) means none
 */
function addcell($row, $col, $string, $raw = '')
{
    $rowKey = $row + $this->_rowoffset;
    $colKey = $col + $this->_coloffset;

    $this->sheets[$this->sn]['maxrow'] = max($this->sheets[$this->sn]['maxrow'], $rowKey);
    $this->sheets[$this->sn]['maxcol'] = max($this->sheets[$this->sn]['maxcol'], $colKey);
    $this->sheets[$this->sn]['cells'][$rowKey][$colKey] = $string;

    // Compare against the "not supplied" sentinels rather than testing
    // truthiness: a raw value of 0 (numeric zero, midnight) is real data
    // and must not be dropped.
    if ($raw !== '' && $raw !== null && $raw !== false) {
        $this->sheets[$this->sn]['cellsInfo'][$rowKey][$colKey]['raw'] = $raw;
    }

    if (isset($this->rectype)) {
        $this->sheets[$this->sn]['cellsInfo'][$rowKey][$colKey]['type'] = $this->rectype;
    }
}
-
/**
 * Decode a 32-bit RK value into a PHP number.
 *
 * Bit 1 selects the encoding: when set, the upper 30 bits are a signed
 * integer; otherwise they are the most significant 30 bits of a 64-bit
 * IEEE 754 floating point value whose other 34 bits are assumed to be 0.
 * Bit 0, when set, means the decoded value is divided by 100.
 *
 * @param integer $rknum Raw RK value, either signed or as an unsigned
 *                       32-bit quantity
 * @return integer|float The decoded number
 */
function _GetIEEE754($rknum)
{
    // Where PHP integers are wider than 32 bits the value may arrive
    // unsigned; fold it back into the signed 32-bit range so the arithmetic
    // shift below keeps the sign of negative integers. On 32-bit builds the
    // comparison can never be true, so nothing changes there.
    if ($rknum >= 0x80000000) {
        $rknum -= 0x100000000;
    }

    if (($rknum & 0x02) != 0) {
        // Integer encoding: drop the two flag bits.
        $value = $rknum >> 2;
    } else {
        // Floating point encoding: sign (1 bit), exponent (11 bits) and the
        // top 18 mantissa bits, with the implicit leading 1 restored.
        $sign = ($rknum & 0x80000000) >> 31;
        $exp = ($rknum & 0x7ff00000) >> 20;
        $mantissa = (0x100000 | ($rknum & 0x000ffffc));
        $value = $mantissa / pow(2, (20 - ($exp - 1023)));
        if ($sign) {
            $value = - 1 * $value;
        }
    }

    if (($rknum & 0x01) != 0) {
        $value /= 100;
    }
    return $value;
}
-
/**
 * Convert a UTF-16LE string to the configured output encoding.
 *
 * The string is returned unchanged when $this->_defaultEncoding is empty
 * or when $this->_encoderFunction names neither 'iconv' nor
 * 'mb_convert_encoding'.
 *
 * @param string $string UTF-16LE encoded bytes
 * @return mixed Whatever the selected conversion function returns, or the
 *               input string when no conversion is performed
 */
function _encodeUTF16($string)
{
    // No target encoding configured: hand the bytes back untouched.
    if (!$this->_defaultEncoding) {
        return $string;
    }

    $encoder = $this->_encoderFunction;

    // Loose comparisons on purpose, mirroring switch/case matching.
    if ($encoder == 'iconv') {
        return iconv('UTF-16LE', $this->_defaultEncoding, $string);
    }
    if ($encoder == 'mb_convert_encoding') {
        return mb_convert_encoding($string, $this->_defaultEncoding, 'UTF-16LE');
    }

    return $string;
}
-
/**
 * Read a signed 32-bit little-endian integer from a binary string.
 *
 * The result is the same on 32-bit and 64-bit builds of PHP: any value
 * with the top bit set comes back negative (0xFFFFFFFF is -1,
 * 0xFFFFFFFE is -2, and so on).
 *
 * @param string  $data Binary data to read from
 * @param integer $pos  Offset of the least significant byte
 * @return integer Value in the range -2147483648 .. 2147483647
 */
function _GetInt4d($data, $pos)
{
    $value = ord($data[$pos]) | (ord($data[$pos + 1]) << 8) | (ord($data[$pos + 2]) << 16) | (ord($data[$pos + 3]) << 24);

    // With integers wider than 32 bits the shifts above yield an unsigned
    // result, so sign-extend it by hand. On 32-bit builds the shift into
    // the sign bit already produced a negative value and this comparison
    // is never true.
    if ($value >= 0x80000000) {
        $value -= 0x100000000;
    }
    return $value;
}
- }
-
- /*
- * Local variables:
- * tab-width: 4
- * c-basic-offset: 4
- * c-hanging-comment-ender-p: nil
- * End:
- */
-
- ?>
|