php编程实现获取excel文档内容的代码实例
前端之家收集整理的这篇文章主要介绍了
php编程实现获取excel文档内容的代码实例,
前端之家小编觉得挺不错的,现在分享给大家,也给大家做个参考。
1、readexcel.system.PHP
<div class="codetitle"><a style="CURSOR: pointer" data="53716" class="copybut" id="copybut53716" onclick="doCopy('code53716')"> 代码如下:
<div class="codebody" id="code53716">
<?
PHP /
vim: set expandtab tabstop=4 shiftwidth=4 softtabstop=4: /
/
A class for reading Microsoft Excel Spreadsheets.
Originally developed by Vadim Tkachenko under the name PHPExcelReader.
(http://sourceforge.net/projects/PHPexcelreader)
Based on the Java version by Andy Khan (http://www.3ppt.com). Now
maintained by David Sanders. Reads only Biff 7 and Biff 8 formats.
PHP versions 4 and 5
LICENSE: This source file is subject to version 3.0 of the PHP license
that is available through the world-wide-web at the following URI:
http://www.PHP.net/license/3_0.txt. If you did not receive a copy of
the PHP License and are unable to obtain it through the web,please
send a note to license@PHP.net so we can mail you a copy immediately.
@category Spreadsheet
@package Spreadsheet_Excel_Reader
@author Vadim Tkachenko vt@apachephp.com
@license http://www.PHP.net/license/3_0.txt PHP License 3.0
@version CVS: $Id: reader.PHP 19 2007-03-13 12:42:41Z shangxiao $
@link http://pear.PHP.net/package/Spreadsheet_Excel_Reader
@see OLE,Spreadsheet_Excel_Writer
/
//require_once 'PEAR.PHP';
//require_once 'oleread.PHP';
//oleread.PHP的内容start=======================================================================================================
define('NUM_BIG_BLOCK_DEPOT_BLOCKS_POS',0x2c);
define('SMALL_BLOCK_DEPOT_BLOCK_POS',0x3c);
define('ROOT_START_BLOCK_POS',0x30);
define('BIG_BLOCK_SIZE',0x200);
define('SMALL_BLOCK_SIZE',0x40);
define('EXTENSION_BLOCK_POS',0x44);
define('NUM_EXTENSION_BLOCK_POS',0x48);
define('PROPERTY_STORAGE_BLOCK_SIZE',0x80);
define('BIG_BLOCK_DEPOT_BLOCKS_POS',0x4c);
define('SMALL_BLOCK_THRESHOLD',0x1000);
// property storage offsets
define('SIZE_OF_NAME_POS',0x40);
define('TYPE_POS',0x42);
define('START_BLOCK_POS',0x74);
define('SIZE_POS',0x78);
define('IDENTIFIER_OLE',pack("CCCCCCCC",0xd0,0xcf,0x11,0xe0,0xa1,0xb1,0x1a,0xe1));
//echo 'ROOT_START_BLOCK_POS = '.ROOT_START_BLOCK_POS."n";
//echo bin2hex($data[ROOT_START_BLOCK_POS])."n";
//echo "a=";
//echo $data[ROOT_START_BLOCK_POS];
//function log
function GetInt4d($data,$pos)
{
$value = ord($data[$pos]) | (ord($data[$pos+1]) << 8) | (ord($data[$pos+2]) << 16) | (ord($data[$pos+3]) << 24);
if ($value>=4294967294)
{
$value=-2;
}
return $value;
}
class OLERead {
var $data = '';
function OLERead(){
}
function read($sFileName){
// check if file exist and is readable (Darko Miljanovic)
if(!is_readable($sFileName)) {
$this->error = 1;
return false;
}
$this->data = @file_get_contents($sFileName);
if (!$this->data) {
$this->error = 1;
return false;
}
//echo IDENTIFIER_OLE;
//echo 'start';
if (substr($this->data,8) != IDENTIFIER_OLE) {
$this->error = 1;
return false;
}
$this->numBigBlockDepotBlocks = GetInt4d($this->data,NUM_BIG_BLOCK_DEPOT_BLOCKS_POS);
$this->sbdStartBlock = GetInt4d($this->data,SMALL_BLOCK_DEPOT_BLOCK_POS);
$this->rootStartBlock = GetInt4d($this->data,ROOT_START_BLOCK_POS);
$this->extensionBlock = GetInt4d($this->data,EXTENSION_BLOCK_POS);
$this->numExtensionBlocks = GetInt4d($this->data,NUM_EXTENSION_BLOCK_POS);
/
echo $this->numBigBlockDepotBlocks." ";
echo $this->sbdStartBlock." ";
echo $this->rootStartBlock." ";
echo $this->extensionBlock." ";
echo $this->numExtensionBlocks." ";
/
//echo "sbdStartBlock = $this->sbdStartBlockn";
$bigBlockDepotBlocks = array();
$pos = BIG_BLOCK_DEPOT_BLOCKS_POS;
// echo "pos = $pos";
$bbdBlocks = $this->numBigBlockDepotBlocks;
if ($this->numExtensionBlocks != 0) {
$bbdBlocks = (BIG_BLOCK_SIZE - BIG_BLOCK_DEPOT_BLOCKS_POS)/4;
}
for ($i = 0; $i < $bbdBlocks; $i++) {
$bigBlockDepotBlocks[$i] = GetInt4d($this->data,$pos);
$pos += 4;
}
for ($j = 0; $j < $this->numExtensionBlocks; $j++) {
$pos = ($this->extensionBlock + 1) BIG_BLOCK_SIZE;
$blocksToRead = min($this->numBigBlockDepotBlocks - $bbdBlocks,BIG_BLOCK_SIZE / 4 - 1);
for ($i = $bbdBlocks; $i < $bbdBlocks + $blocksToRead; $i++) {
$bigBlockDepotBlocks[$i] = GetInt4d($this->data,$pos);
$pos += 4;
}
$bbdBlocks += $blocksToRead;
if ($bbdBlocks < $this->numBigBlockDepotBlocks) {
$this->extensionBlock = GetInt4d($this->data,$pos);
}
}
// var_dump($bigBlockDepotBlocks);
// readBigBlockDepot
$pos = 0;
$index = 0;
$this->bigBlockChain = array();
for ($i = 0; $i < $this->numBigBlockDepotBlocks; $i++) {
$pos = ($bigBlockDepotBlocks[$i] + 1) BIG_BLOCK_SIZE;
//echo "pos = $pos";
for ($j = 0 ; $j < BIG_BLOCK_SIZE / 4; $j++) {
$this->bigBlockChain[$index] = GetInt4d($this->data,$pos);
$pos += 4 ;
$index++;
}
}
//var_dump($this->bigBlockChain);
//echo '=====2';
// readSmallBlockDepot();
$pos = 0;
$index = 0;
$sbdBlock = $this->sbdStartBlock;
$this->smallBlockChain = array();
while ($sbdBlock != -2) {
$pos = ($sbdBlock + 1) BIG_BLOCK_SIZE;
for ($j = 0; $j < BIG_BLOCK_SIZE / 4; $j++) {
$this->smallBlockChain[$index] = GetInt4d($this->data,$pos);
$pos += 4;
$index++;
}
$sbdBlock = $this->bigBlockChain[$sbdBlock];
}
// readData(rootStartBlock)
$block = $this->rootStartBlock;
$pos = 0;
$this->entry = $this->readData($block);
/
while ($block != -2) {
$pos = ($block + 1) BIG_BLOCK_SIZE;
$this->entry = $this->entry.substr($this->data,$pos,BIG_BLOCK_SIZE);
$block = $this->bigBlockChain[$block];
}
*/
//echo '==='.$this->entry."===";
$this->readPropertySets();
}
function __readData($bl) {
$block = $bl;
$pos = 0;
$data = '';
while ($block != -2) {
$pos = ($block + 1) BIG_BLOCK_SIZE;
$data = $data.substr($this->data,BIG_BLOCK_SIZE);
//echo "pos = $pos data=$datan";
$block = $this->bigBlockChain[$block];
}
return $data;
}
function readPropertySets(){
$offset = 0;
//var_dump($this->entry);
while ($offset < strlen($this->entry)) {
$d = substr($this->entry,$offset,PROPERTY_STORAGE_BLOCK_SIZE);
$nameSize = ord($d[SIZE_OF_NAME_POS]) | (ord($d[SIZE_OF_NAME_POS+1]) << 8);
$type = ord($d[TYPE_POS]);
//$maxBlock = strlen($d) / BIG_BLOCK_SIZE - 1;
$startBlock = GetInt4d($d,START_BLOCK_POS);
$size = GetInt4d($d,SIZE_POS);
$name = '';
for ($i = 0; $i < $nameSize ; $i++) {
$name .= $d[$i];
}
$name = str_replace("x00","",$name);
$this->props[] = array (
'name' => $name,
'type' => $type,
'startBlock' => $startBlock,
'size' => $size);
if (($name == "Workbook") || ($name == "Book")) {
$this->wrkbook = count($this->props) - 1;
}
if ($name == "Root Entry") {
$this->rootentry = count($this->props) - 1;
}
//echo "name ==$name=n";
$offset += PROPERTY_STORAGE_BLOCK_SIZE;
}
}
function getWorkBook(){
if ($this->props[$this->wrkbook]['size'] < SMALL_BLOCK_THRESHOLD){
// getSmallBlockStream(PropertyStorage ps)
$rootdata = $this->readData($this->props[$this->rootentry]['startBlock']);
$streamData = '';
$block = $this->props[$this->wrkbook]['startBlock'];
//$count = 0;
$pos = 0;
while ($block != -2) {
$pos = $block SMALL_BLOCK_SIZE;
$streamData .= substr($rootdata,SMALL_BLOCK_SIZE);
$block = $this->smallBlockChain[$block];
}
return $streamData;
}else{
$numBlocks = $this->props[$this->wrkbook]['size'] / BIG_BLOCK_SIZE;
if ($this->props[$this->wrkbook]['size'] % BIG_BLOCK_SIZE != 0) {
$numBlocks++;
}
if ($numBlocks == 0) return '';
//echo "numBlocks = $numBlocksn";
//byte[] streamData = new byte[numBlocks BIG_BLOCK_SIZE];
//print_r($this->wrkbook);
$streamData = '';
$block = $this->props[$this->wrkbook]['startBlock'];
//$count = 0;
$pos = 0;
//echo "block = $block";
while ($block != -2) {
$pos = ($block + 1) BIG_BLOCK_SIZE;
$streamData .= substr($this->data,BIG_BLOCK_SIZE);
$block = $this->bigBlockChain[$block];
}
//echo 'stream'.$streamData;
return $streamData;
}
}
}
//oleread.PHP的内容end=======================================================================================================
//require_once 'OLE.PHP';
define('SPREADSHEET_EXCEL_READER_BIFF8',0x600);
define('SPREADSHEET_EXCEL_READER_BIFF7',0x500);
define('SPREADSHEET_EXCEL_READER_WORKBOOKGLOBALS',0x5);
define('SPREADSHEET_EXCEL_READER_WORKSHEET',0x10);
define('SPREADSHEET_EXCEL_READER_TYPE_BOF',0x809);
define('SPREADSHEET_EXCEL_READER_TYPE_EOF',0x0a);
define('SPREADSHEET_EXCEL_READER_TYPE_BOUNDSHEET',0x85);
define('SPREADSHEET_EXCEL_READER_TYPE_DIMENSION',0x200);
define('SPREADSHEET_EXCEL_READER_TYPE_ROW',0x208);
define('SPREADSHEET_EXCEL_READER_TYPE_DBCELL',0xd7);
define('SPREADSHEET_EXCEL_READER_TYPE_FILEPASS',0x2f);
define('SPREADSHEET_EXCEL_READER_TYPE_NOTE',0x1c);
define('SPREADSHEET_EXCEL_READER_TYPE_TXO',0x1b6);
define('SPREADSHEET_EXCEL_READER_TYPE_RK',0x7e);
define('SPREADSHEET_EXCEL_READER_TYPE_RK2',0x27e);
define('SPREADSHEET_EXCEL_READER_TYPE_MULRK',0xbd);
define('SPREADSHEET_EXCEL_READER_TYPE_MULBLANK',0xbe);
define('SPREADSHEET_EXCEL_READER_TYPE_INDEX',0x20b);
define('SPREADSHEET_EXCEL_READER_TYPE_SST',0xfc);
define('SPREADSHEET_EXCEL_READER_TYPE_EXTSST',0xff);
define('SPREADSHEET_EXCEL_READER_TYPE_CONTINUE',0x3c);
define('SPREADSHEET_EXCEL_READER_TYPE_LABEL',0x204);
define('SPREADSHEET_EXCEL_READER_TYPE_LABELSST',0xfd);
define('SPREADSHEET_EXCEL_READER_TYPE_NUMBER',0x203);
define('SPREADSHEET_EXCEL_READER_TYPE_NAME',0x18);
define('SPREADSHEET_EXCEL_READER_TYPE_ARRAY',0x221);
define('SPREADSHEET_EXCEL_READER_TYPE_STRING',0x207);
define('SPREADSHEET_EXCEL_READER_TYPE_FORMULA',0x406);
define('SPREADSHEET_EXCEL_READER_TYPE_FORMULA2',0x6);
define('SPREADSHEET_EXCEL_READER_TYPE_FORMAT',0x41e);
define('SPREADSHEET_EXCEL_READER_TYPE_XF',0xe0);
define('SPREADSHEET_EXCEL_READER_TYPE_BOOLERR',0x205);
define('SPREADSHEET_EXCEL_READER_TYPE_UNKNOWN',0xffff);
define('SPREADSHEET_EXCEL_READER_TYPE_NINETEENFOUR',0x22);
define('SPREADSHEET_EXCEL_READER_TYPE_MERGEDCELLS',0xE5);
define('SPREADSHEET_EXCEL_READER_UTCOFFSETDAYS',25569);
define('SPREADSHEET_EXCEL_READER_UTCOFFSETDAYS1904',24107);
define('SPREADSHEET_EXCEL_READER_MSINADAY',86400);
//define('SPREADSHEET_EXCEL_READER_MSINADAY',24 60 60);
//define('SPREADSHEET_EXCEL_READER_DEF_NUM_FORMAT',"%.2f");
define('SPREADSHEET_EXCEL_READER_DEF_NUM_FORMAT',"%s");
/
Place includes,constant defines and $_GLOBAL settings here.
Make sure they have appropriate docblocks to avoid PHPDocumentor
construing they are documented by the page-level docblock.
*/
/ A class for reading Microsoft Excel Spreadsheets.
Originally developed by Vadim Tkachenko under the name PHPExcelReader.
(
http://sourceforge.net/projects/PHPexcelreader)
Based on the Java version by Andy Khan (http://www.3ppt.com). Now
maintained by David Sanders. Reads only Biff 7 and Biff 8 formats.
@category Spreadsheet
@package Spreadsheet_Excel_Reader
@author Vadim Tkachenko
vt@shoujidy.com @copyright 2010-2011 The PHP Group
@license
http://www.
PHP.net/license/3_0.txt
PHP License 3.0
@version Release: @package_version@
@link
http://pear.
PHP.net/package/PackageName
@see OLE,Spreadsheet_Excel_Writer
/
class ReadexcelSystem{
/
Array of worksheets found
@var array
@access public
*/
var $boundsheets = array();
/*
Array of format records found
@var array
@access public
/
var $formatRecords = array();
/ todo
@var array
@access public
*/
var $sst = array();
/
Array of worksheets
The data is stored in 'cells' and the Meta-data is stored in an array
called 'cellsInfo'
Example:
$sheets --> 'cells' --> row --> column --> Interpreted value
--> 'cellsInfo' --> row --> column --> 'type' - Can be 'date','number',or 'unknown'
--> 'raw' - The raw data that Excel stores for that data cell
@var array
@access public
/
var $sheets = array();
/ The data returned by OLE
@var string
@access public
*/
var $data;
/
OLE object for reading the file
@var OLE object
@access private
*/
var $_ole;
/*
Default encoding
@var string
@access private
/
var $_defaultEncoding;
/ Default number format
@var integer
@access private
*/
var $_defaultFormat = SPREADSHEET_EXCEL_READER_DEF_NUM_FORMAT;
/
todo
List of formats to use for each column
@var array
@access private
/
var $_columnsFormat = array();
/ todo
@var integer
@access private
*/
var $_rowoffset = 1;
/
todo
@var integer
@access private
*/
var $_coloffset = 1;
/*
List of default date formats used by Excel
@var array
@access public
/
var $dateFormats = array (
0xe => "d/m/Y",
0xf => "d-M-Y",
0x10 => "d-M",
0x11 => "M-Y",
0x12 => "h:i a",
0x13 => "h:i:s a",
0x14 => "H:i",
0x15 => "H:i:s",
0x16 => "d/m/Y H:i",
0x2d => "i:s",
0x2e => "H:i:s",
0x2f => "i:s.S");
/ Default number formats used by Excel
@var array
@access public
/
var $numberFormats = array(
0x1 => "%1.0f",// "0"
0x2 => "%1.2f",// "0.00",
0x3 => "%1.0f",//"#,##0",
0x4 => "%1.2f",##0.00",
0x5 => "%1.0f",/"$#,##0;($#,##0)",
/
0x6 => '$%1.0f',/
0x7 => '$%1.2f',//"$#,##0.00;($#,##0.00)",
0x8 => '$%1.2f',
0x9 => '%1.0f%%',// "0%"
0xa => '%1.2f%%',// "0.00%"
0xb => '%1.2f',// 0.00E00",
0x25 => '%1.0f',// "#,##0;(#,
0x26 => '%1.0f',
0x27 => '%1.2f',##0.00;(#,
0x28 => '%1.2f',
0x29 => '%1.0f',
0x2a => '$%1.0f',
0x2b => '%1.2f',
0x2c => '$%1.2f',
0x30 => '%1.0f'); //"##0.0E0";
// }}}
// {{{ Spreadsheet_Excel_Reader()
/
Constructor
Some basic initialisation
/
function __construct()
{
$this->_ole =& new OLERead();
$this->setUTFEncoder('iconv');
}
// }}}
// {{{ setOutputEncoding()
/ Set the encoding method
@param string Encoding to use
@access public
*/
function setOutputEncoding($encoding)
{
$this->_defaultEncoding = $encoding;
}
// }}}
// {{{ setUTFEncoder()
/
$encoder = 'iconv' or 'mb'
set iconv if you would like use 'iconv' for encode UTF-16LE to your encoding
set mb if you would like use 'mb_convert_encoding' for encode UTF-16LE to your encoding
@access public
@param string Encoding type to use. Either 'iconv' or 'mb'
*/
function setUTFEncoder($encoder = 'iconv')
{
$this->_encoderFunction = '';
if ($encoder == 'iconv') {
$this->_encoderFunction = function_exists('iconv') ? 'iconv' : '';
} elseif ($encoder == 'mb') {
$this->_encoderFunction = function_exists('mb_convert_encoding') ?
'mb_convert_encoding' :
'';
}
}
// }}}
// {{{ setRowColOffset()
/*
todo
@access public
@param offset
/
function setRowColOffset($iOffset)
{
$this->_rowoffset = $iOffset;
$this->_coloffset = $iOffset;
}
// }}}
// {{{ setDefaultFormat()
/ Set the default number format
@access public
@param Default format
*/
function setDefaultFormat($sFormat)
{
$this->_defaultFormat = $sFormat;
}
// }}}
// {{{ setColumnFormat()
/
Force a column to use a certain format
@access public
@param integer Column number
@param string Format
/
function setColumnFormat($column,$sFormat)
{
$this->_columnsFormat[$column] = $sFormat;
}
// }}}
// {{{ read()
/ Read the spreadsheet file using OLE,then parse
@access public
@param filename
@todo return a valid value
/
function read($sFileName)
{
/
require_once 'OLE.PHP';
$ole = new OLE();
$ole->read($sFileName);
foreach ($ole->_list as $i => $pps) {
if (($pps->Name == 'Workbook' || $pps->Name == 'Book') &&
$pps->Size >= SMALL_BLOCK_THRESHOLD) {
$this->data = $ole->getData($i,$ole->getDataLength($i));
} elseif ($pps->Name == 'Root Entry') {
$this->data = $ole->getData($i,$ole->getDataLength($i));
}
//var_dump(strlen($ole->getData($i,$ole->getDataLength($i))),$pps->Name,md5($this->data),$ole->getDataLength($i));
}
//exit;
$this->_parse();
return sizeof($this->sheets) > 0;
/
$res = $this->_ole->read($sFileName);
// oops,something goes wrong (Darko Miljanovic)
if($res === false) {
// check error code
if($this->_ole->error == 1) {
// bad file
die('The filename ' . $sFileName . ' is not readable');
}
// check other error codes here (eg bad fileformat,etc...)
}
$this->data = $this->_ole->getWorkBook();
/
$res = $this->_ole->read($sFileName);
if ($this->isError($res)) {
// var_dump($res);
return $this->raiseError($res);
}
$total = $this->_ole->ppsTotal();
for ($i = 0; $i < $total; $i++) {
if ($this->_ole->isFile($i)) {
$type = unpack("v",$this->_ole->getData($i,2));
if ($type[''] == 0x0809) { // check if it's a BIFF stream
$this->_index = $i;
$this->data = $this->_ole->getData($i,$this->_ole->getDataLength($i));
break;
}
}
}
if ($this->_index === null) {
return $this->raiseError("$file doesn't seem to be an Excel file");
}
/
//echo "data =".$this->data;
//$this->readRecords();
$this->_parse();
}
// }}}
// {{{ _parse()
/
Parse a workbook
@access private
@return bool
/
function _parse()
{
$pos = 0;
$code = ord($this->data[$pos]) | ord($this->data[$pos+1])<<8;
$length = ord($this->data[$pos+2]) | ord($this->data[$pos+3])<<8;
$version = ord($this->data[$pos + 4]) | ord($this->data[$pos + 5])<<8;
$substreamType = ord($this->data[$pos + 6]) | ord($this->data[$pos + 7])<<8;
//echo "Start parse code=".base_convert($code,10,16)." version=".base_convert($version,16)." substreamType=".base_convert($substreamType,16).""."n";
if (($version != SPREADSHEET_EXCEL_READER_BIFF8) &&
($version != SPREADSHEET_EXCEL_READER_BIFF7)) {
return false;
}
if ($substreamType != SPREADSHEET_EXCEL_READER_WORKBOOKGLOBALS){
return false;
}
//print_r($rec);
$pos += $length + 4;
$code = ord($this->data[$pos]) | ord($this->data[$pos+1])<<8;
$length = ord($this->data[$pos+2]) | ord($this->data[$pos+3])<<8;
while ($code != SPREADSHEET_EXCEL_READER_TYPE_EOF) {
switch ($code) {
case SPREADSHEET_EXCEL_READER_TYPE_SST:
//echo "Type_SSTn";
$spos = $pos + 4;
$limitpos = $spos + $length;
$uniqueStrings = $this->_GetInt4d($this->data,$spos+4);
$spos += 8;
for ($i = 0; $i < $uniqueStrings; $i++) {
// Read in the number of characters
if ($spos == $limitpos) {
$opcode = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$conlength = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
if ($opcode != 0x3c) {
return -1;
}
$spos += 4;
$limitpos = $spos + $conlength;
}
$numChars = ord($this->data[$spos]) | (ord($this->data[$spos+1]) << 8);
//echo "i = $i pos = $pos numChars = $numChars ";
$spos += 2;
$optionFlags = ord($this->data[$spos]);
$spos++;
$asciiEncoding = (($optionFlags & 0x01) == 0) ;
$extendedString = ( ($optionFlags & 0x04) != 0);
// See if string contains formatting information
$richString = ( ($optionFlags & 0x08) != 0);
if ($richString) {
// Read in the crun
$formattingRuns = ord($this->data[$spos]) | (ord($this->data[$spos+1]) << 8);
$spos += 2;
}
if ($extendedString) {
// Read in cchExtRst
$extendedRunLength = $this->_GetInt4d($this->data,$spos);
$spos += 4;
}
$len = ($asciiEncoding)? $numChars : $numChars2;
if ($spos + $len < $limitpos) {
$retstr = substr($this->data,$spos,$len);
$spos += $len;
}else{
// found countinue
$retstr = substr($this->data,$limitpos - $spos);
$bytesRead = $limitpos - $spos;
$charsLeft = $numChars - (($asciiEncoding) ? $bytesRead : ($bytesRead / 2));
$spos = $limitpos;
while ($charsLeft > 0){
$opcode = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$conlength = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
if ($opcode != 0x3c) {
return -1;
}
$spos += 4;
$limitpos = $spos + $conlength;
$option = ord($this->data[$spos]);
$spos += 1;
if ($asciiEncoding && ($option == 0)) {
$len = min($charsLeft,$limitpos - $spos); // min($charsLeft,$conlength);
$retstr .= substr($this->data,$len);
$charsLeft -= $len;
$asciiEncoding = true;
}elseif (!$asciiEncoding && ($option != 0)){
$len = min($charsLeft 2,$len);
$charsLeft -= $len/2;
$asciiEncoding = false;
}elseif (!$asciiEncoding && ($option == 0)) {
// Bummer - the string starts off as Unicode,but after the
// continuation it is in straightforward ASCII encoding
$len = min($charsLeft,$conlength);
for ($j = 0; $j < $len; $j++) {
$retstr .= $this->data[$spos + $j].chr(0);
}
$charsLeft -= $len;
$asciiEncoding = false;
}else{
$newstr = '';
for ($j = 0; $j < strlen($retstr); $j++) {
$newstr = $retstr[$j].chr(0);
}
$retstr = $newstr;
$len = min($charsLeft 2,$len);
$charsLeft -= $len/2;
$asciiEncoding = false;
//echo "Izavratn";
}
$spos += $len;
}
}
$retstr = ($asciiEncoding) ? $retstr : $this->_encodeUTF16($retstr);
// echo "Str $i = $retstrn";
if ($richString){
$spos += 4 $formattingRuns;
}
// For extended strings,skip over the extended string data
if ($extendedString) {
$spos += $extendedRunLength;
}
//if ($retstr == 'Derby'){
// echo "bbn";
//}
$this->sst[]=$retstr;
}
/$continueRecords = array();
while ($this->getNextCode() == Type_CONTINUE) {
$continueRecords[] = &$this->nextRecord();
}
//echo " 1 Type_SSTn";
$this->shareStrings = new SSTRecord($r,$continueRecords);
//print_r($this->shareStrings->strings);
/
// echo 'SST read: '.($time_end-$time_start)."n";
break;
case SPREADSHEET_EXCEL_READER_TYPE_FILEPASS:
return false;
break;
case SPREADSHEET_EXCEL_READER_TYPE_NAME:
//echo "Type_NAMEn";
break;
case SPREADSHEET_EXCEL_READER_TYPE_FORMAT:
$indexCode = ord($this->data[$pos+4]) | ord($this->data[$pos+5]) << 8;
if ($version == SPREADSHEET_EXCEL_READER_BIFF8) {
$numchars = ord($this->data[$pos+6]) | ord($this->data[$pos+7]) << 8;
if (ord($this->data[$pos+8]) == 0){
$formatString = substr($this->data,$pos+9,$numchars);
} else {
$formatString = substr($this->data,$numchars2);
}
} else {
$numchars = ord($this->data[$pos+6]);
$formatString = substr($this->data,$pos+7,$numchars2);
}
$this->formatRecords[$indexCode] = $formatString;
// echo "Type.FORMATn";
break;
case SPREADSHEET_EXCEL_READER_TYPE_XF:
//global $dateFormats,$numberFormats;
$indexCode = ord($this->data[$pos+6]) | ord($this->data[$pos+7]) << 8;
//echo "nType.XF ".count($this->formatRecords['xfrecords'])." $indexCode ";
if (array_key_exists($indexCode,$this->dateFormats)) {
//echo "isdate ".$dateFormats[$indexCode];
$this->formatRecords['xfrecords'][] = array(
'type' => 'date',
'format' => $this->dateFormats[$indexCode]
);
}elseif (array_key_exists($indexCode,$this->numberFormats)) {
//echo "isnumber ".$this->numberFormats[$indexCode];
$this->formatRecords['xfrecords'][] = array(
'type' => 'number',
'format' => $this->numberFormats[$indexCode]
);
}else{
$isdate = FALSE;
if ($indexCode > 0){
if (isset($this->formatRecords[$indexCode]))
$formatstr = $this->formatRecords[$indexCode];
//echo '.other.';
//echo "ndate-time=$formatstr=n";
if ($formatstr)
if (preg_match("/[^hmsday/-:s]/i",$formatstr) == 0) { // found day and time format
$isdate = TRUE;
$formatstr = str_replace('mm','i',$formatstr);
$formatstr = str_replace('h','H',$formatstr);
//echo "ndate-time $formatstr n";
}
}
if ($isdate){
$this->formatRecords['xfrecords'][] = array(
'type' => 'date',
'format' => $formatstr,
);
}else{
$this->formatRecords['xfrecords'][] = array(
'type' => 'other',
'format' => '',
'code' => $indexCode
);
}
}
//echo "n";
break;
case SPREADSHEET_EXCEL_READER_TYPE_NINETEENFOUR:
//echo "Type.NINETEENFOURn";
$this->nineteenFour = (ord($this->data[$pos+4]) == 1);
break;
case SPREADSHEET_EXCEL_READER_TYPE_BOUNDSHEET:
//echo "Type.BOUNDSHEETn";
$rec_offset = $this->_GetInt4d($this->data,$pos+4);
$rec_typeFlag = ord($this->data[$pos+8]);
$rec_visibilityFlag = ord($this->data[$pos+9]);
$rec_length = ord($this->data[$pos+10]);
if ($version == SPREADSHEET_EXCEL_READER_BIFF8){
$chartype = ord($this->data[$pos+11]);
if ($chartype == 0){
$rec_name = substr($this->data,$pos+12,$rec_length);
} else {
$rec_name = $this->_encodeUTF16(substr($this->data,$rec_length2));
}
}elseif ($version == SPREADSHEET_EXCEL_READER_BIFF7){
$rec_name = substr($this->data,$pos+11,$rec_length);
}
$this->boundsheets[] = array('name'=>$rec_name,
'offset'=>$rec_offset);
break;
}
//echo "Code = ".base_convert($r['code'],16)."n";
$pos += $length + 4;
$code = ord($this->data[$pos]) | ord($this->data[$pos+1])<<8;
$length = ord($this->data[$pos+2]) | ord($this->data[$pos+3])<<8;
//$r = &$this->nextRecord();
//echo "1 Code = ".base_convert($r['code'],16)."n";
}
foreach ($this->boundsheets as $key=>$val){
$this->sn = $key;
$this->_parsesheet($val['offset']);
}
return true;
}
/ Parse a worksheet
@access private
@param todo
@todo fix return codes
/
function _parsesheet($spos)
{
$cont = true;
// read BOF
$code = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$length = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
$version = ord($this->data[$spos + 4]) | ord($this->data[$spos + 5])<<8;
$substreamType = ord($this->data[$spos + 6]) | ord($this->data[$spos + 7])<<8;
if (($version != SPREADSHEET_EXCEL_READER_BIFF8) && ($version != SPREADSHEET_EXCEL_READER_BIFF7)) {
return -1;
}
if ($substreamType != SPREADSHEET_EXCEL_READER_WORKSHEET){
return -2;
}
//echo "Start parse code=".base_convert($code,16).""."n";
$spos += $length + 4;
//var_dump($this->formatRecords);
//echo "code $code $length";
while($cont) {
//echo "mem= ".memory_get_usage()."n";
// $r = &$this->file->nextRecord();
$lowcode = ord($this->data[$spos]);
if ($lowcode == SPREADSHEET_EXCEL_READER_TYPE_EOF) break;
$code = $lowcode | ord($this->data[$spos+1])<<8;
$length = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
$spos += 4;
$this->sheets[$this->sn]['maxrow'] = $this->_rowoffset - 1;
$this->sheets[$this->sn]['maxcol'] = $this->_coloffset - 1;
//echo "Code=".base_convert($code,16)." $coden";
unset($this->rectype);
$this->multiplier = 1; // need for format with %
switch ($code) {
case SPREADSHEET_EXCEL_READER_TYPE_DIMENSION:
//echo 'Type_DIMENSION ';
if (!isset($this->numRows)) {
if (($length == 10) || ($version == SPREADSHEET_EXCEL_READER_BIFF7)){
$this->sheets[$this->sn]['numRows'] = ord($this->data[$spos+2]) | ord($this->data[$spos+3]) << 8;
$this->sheets[$this->sn]['numCols'] = ord($this->data[$spos+6]) | ord($this->data[$spos+7]) << 8;
} else {
$this->sheets[$this->sn]['numRows'] = ord($this->data[$spos+4]) | ord($this->data[$spos+5]) << 8;
$this->sheets[$this->sn]['numCols'] = ord($this->data[$spos+10]) | ord($this->data[$spos+11]) << 8;
}
}
//echo 'numRows '.$this->numRows.' '.$this->numCols."n";
break;
case SPREADSHEET_EXCEL_READER_TYPE_MERGEDCELLS:
$cellRanges = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
for ($i = 0; $i < $cellRanges; $i++) {
$fr = ord($this->data[$spos + 8
$i + 2]) | ord($this->data[$spos + 8$i + 3])<<8;
$lr = ord($this->data[$spos + 8
$i + 4]) | ord($this->data[$spos + 8$i + 5])<<8;
$fc = ord($this->data[$spos + 8
$i + 6]) | ord($this->data[$spos + 8$i + 7])<<8;
$lc = ord($this->data[$spos + 8
$i + 8]) | ord($this->data[$spos + 8$i + 9])<<8;
//$this->sheets[$this->sn]['mergedCells'][] = array($fr + 1,$fc + 1,$lr + 1,$lc + 1);
if ($lr - $fr > 0) {
$this->sheets[$this->sn]['cellsInfo'][$fr+1][$fc+1]['rowspan'] = $lr - $fr + 1;
}
if ($lc - $fc > 0) {
$this->sheets[$this->sn]['cellsInfo'][$fr+1][$fc+1]['colspan'] = $lc - $fc + 1;
}
}
//echo "Merged Cells $cellRanges $lr $fr $lc $fcn";
break;
case SPREADSHEET_EXCEL_READER_TYPE_RK:
case SPREADSHEET_EXCEL_READER_TYPE_RK2:
//echo 'SPREADSHEET_EXCEL_READER_TYPE_RK'."n";
$row = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$column = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
$rknum = $this->_GetInt4d($this->data,$spos + 6);
$numValue = $this->_GetIEEE754($rknum);
//echo $numValue." ";
if ($this->isDate($spos)) {
list($string,$raw) = $this->createDate($numValue);
}else{
$raw = $numValue;
if (isset($this->_columnsFormat[$column + 1])){
$this->curformat = $this->_columnsFormat[$column + 1];
}
$string = sprintf($this->curformat,$numValue
$this->multiplier);
//$this->addcell(RKRecord($r));
}
$this->addcell($row,$column,$string,$raw);
//echo "Type_RK $row $column $string $raw {$this->curformat}n";
break;
case SPREADSHEET_EXCEL_READER_TYPE_LABELSST:
$row = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$column = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
$xfindex = ord($this->data[$spos+4]) | ord($this->data[$spos+5])<<8;
$index = $this->_GetInt4d($this->data,$spos + 6);
//var_dump($this->sst);
$this->addcell($row,$this->sst[$index]);
//echo "LabelSST $row $column $stringn";
break;
case SPREADSHEET_EXCEL_READER_TYPE_MULRK:
$row = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$colFirst = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
$colLast = ord($this->data[$spos + $length - 2]) | ord($this->data[$spos + $length - 1])<<8;
$columns = $colLast - $colFirst + 1;
$tmppos = $spos+4;
for ($i = 0; $i < $columns; $i++) {
$numValue = $this->_GetIEEE754($this->_GetInt4d($this->data,$tmppos + 2));
if ($this->isDate($tmppos-4)) {
list($string,$raw) = $this->createDate($numValue);
}else{
$raw = $numValue;
if (isset($this->_columnsFormat[$colFirst + $i + 1])){
$this->curformat = $this->_columnsFormat[$colFirst + $i + 1];
}
$string = sprintf($this->curformat,$numValue $this->multiplier);
}
//$rec['rknumbers'][$i]['xfindex'] = ord($rec['data'][$pos]) | ord($rec['data'][$pos+1]) << 8;
$tmppos += 6;
$this->addcell($row,$colFirst + $i,$raw);
//echo "MULRK $row ".($colFirst + $i)." $stringn";
}
//MulRKRecord($r);
// Get the individual cell records from the multiple record
//$num = ;
break;
case SPREADSHEET_EXCEL_READER_TYPE_NUMBER:
$row = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$column = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
$tmp = unpack("ddouble",substr($this->data,$spos + 6,8)); // It machine machine dependent
if ($this->isDate($spos)) {
list($string,$raw) = $this->createDate($tmp['double']);
// $this->addcell(DateRecord($r,1));
}else{
//$raw = $tmp[''];
if (isset($this->_columnsFormat[$column + 1])){
$this->curformat = $this->_columnsFormat[$column + 1];
}
$raw = $this->createNumber($spos);
$string = sprintf($this->curformat,$raw * $this->multiplier);
// $this->addcell(NumberRecord($r));
}
$this->addcell($row,$raw);
//echo "Number $row $column $stringn";
break;
case SPREADSHEET_EXCEL_READER_TYPE_FORMULA:
case SPREADSHEET_EXCEL_READER_TYPE_FORMULA2:
$row = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$column = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
if ((ord($this->data[$spos+6])==0) && (ord($this->data[$spos+12])==255) && (ord($this->data[$spos+13])==255)) {
//String formula. Result follows in a STRING record
//echo "FORMULA $row $column Formula with a string
n";
} elseif ((ord($this->data[$spos+6])==1) && (ord($this->data[$spos+12])==255) && (ord($this->data[$spos+13])==255)) {
//Boolean formula. Result is in +2; 0=false,1=true
} elseif ((ord($this->data[$spos+6])==2) && (ord($this->data[$spos+12])==255) && (ord($this->data[$spos+13])==255)) {
//Error formula. Error code is in +2;
} elseif ((ord($this->data[$spos+6])==3) && (ord($this->data[$spos+12])==255) && (ord($this->data[$spos+13])==255)) {
//Formula result is a null string.
} else {
// result is a number,so first 14 bytes are just like a _NUMBER record
$tmp = unpack("ddouble",$raw);
//echo "Number $row $column $stringn";
}
break;
case SPREADSHEET_EXCEL_READER_TYPE_BOOLERR:
$row = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$column = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
$string = ord($this->data[$spos+6]);
$this->addcell($row,$string);
//echo 'Type_BOOLERR '."n";
break;
case SPREADSHEET_EXCEL_READER_TYPE_ROW:
case SPREADSHEET_EXCEL_READER_TYPE_DBCELL:
case SPREADSHEET_EXCEL_READER_TYPE_MULBLANK:
break;
case SPREADSHEET_EXCEL_READER_TYPE_LABEL:
$row = ord($this->data[$spos]) | ord($this->data[$spos+1])<<8;
$column = ord($this->data[$spos+2]) | ord($this->data[$spos+3])<<8;
$this->addcell($row,$spos + 8,ord($this->data[$spos + 6]) | ord($this->data[$spos + 7])<<8));
// $this->addcell(LabelRecord($r));
break;
case SPREADSHEET_EXCEL_READER_TYPE_EOF:
$cont = false;
break;
default:
//echo ' unknown :'.base_convert($r['code'],16)."n";
break;
}
$spos += $length;
}
if (!isset($this->sheets[$this->sn]['numRows']))
$this->sheets[$this->sn]['numRows'] = $this->sheets[$this->sn]['maxrow'];
if (!isset($this->sheets[$this->sn]['numCols']))
$this->sheets[$this->sn]['numCols'] = $this->sheets[$this->sn]['maxcol'];
}
/*
Check whether the current record read is a date
@param todo
@return boolean True if date,false otherwise
/
function isDate($spos)
{
//$xfindex = GetInt2d(,4);
$xfindex = ord($this->data[$spos+4]) | ord($this->data[$spos+5]) << 8;
//echo 'check is date '.$xfindex.' '.$this->formatRecords['xfrecords'][$xfindex]['type']."n";
//var_dump($this->formatRecords['xfrecords'][$xfindex]);
if ($this->formatRecords['xfrecords'][$xfindex]['type'] == 'date') {
$this->curformat = $this->formatRecords['xfrecords'][$xfindex]['format'];
$this->rectype = 'date';
return true;
} else {
if ($this->formatRecords['xfrecords'][$xfindex]['type'] == 'number') {
$this->curformat = $this->formatRecords['xfrecords'][$xfindex]['format'];
$this->rectype = 'number';
if (($xfindex == 0x9) || ($xfindex == 0xa)){
$this->multiplier = 100;
}
}else{
$this->curformat = $this->_defaultFormat;
$this->rectype = 'unknown';
}
return false;
}
}
//}}}
//{{{ createDate()
/*
Convert the raw Excel date into a human readable format
Dates in Excel are stored as number of seconds from an epoch. On
Windows,the epoch is 30/12/1899 and on Mac it's 01/01/1904
@access private
@param integer The raw Excel value to convert
@return array First element is the converted date,the second element is number a unix timestamp
/
function createDate($numValue)
{
if ($numValue > 1) {
$utcDays = $numValue - ($this->nineteenFour ? SPREADSHEET_EXCEL_READER_UTCOFFSETDAYS1904 : SPREADSHEET_EXCEL_READER_UTCOFFSETDAYS);
$utcValue = round(($utcDays+1)
SPREADSHEET_EXCEL_READER_MSINADAY);
$string = date ($this->curformat,$utcValue);
$raw = $utcValue;
} else {
$raw = $numValue;
$hours = floor($numValue 24);
$mins = floor($numValue
24 60) - $hours
60;
$secs = floor($numValue SPREADSHEET_EXCEL_READER_MSINADAY) - $hours
60 60 - $mins
60;
$string = date ($this->curformat,mktime($hours,$mins,$secs));
}
return array($string,$raw);
}
function createNumber($spos)
{
$rknumhigh = $this->_GetInt4d($this->data,$spos + 10);
$rknumlow = $this->_GetInt4d($this->data,$spos + 6);
//for ($i=0; $i<8; $i++) { echo ord($this->data[$i+$spos+6]) . " "; } echo "
";
$sign = ($rknumhigh & 0x80000000) >> 31;
$exp = ($rknumhigh & 0x7ff00000) >> 20;
$mantissa = (0x100000 | ($rknumhigh & 0x000fffff));
$mantissalow1 = ($rknumlow & 0x80000000) >> 31;
$mantissalow2 = ($rknumlow & 0x7fffffff);
$value = $mantissa / pow( 2,(20- ($exp - 1023)));
if ($mantissalow1 != 0) $value += 1 / pow (2,(21 - ($exp - 1023)));
$value += $mantissalow2 / pow (2,(52 - ($exp - 1023)));
//echo "Sign = $sign,Exp = $exp,mantissahighx = $mantissa,mantissalow1 = $mantissalow1,mantissalow2 = $mantissalow2
n";
if ($sign) {$value = -1 $value;}
return $value;
}
function addcell($row,$col,$raw = '')
{
//echo "ADD cel $row-$col $stringn";
$this->sheets[$this->sn]['maxrow'] = max($this->sheets[$this->sn]['maxrow'],$row + $this->_rowoffset);
$this->sheets[$this->sn]['maxcol'] = max($this->sheets[$this->sn]['maxcol'],$col + $this->_coloffset);
$this->sheets[$this->sn]['cells'][$row + $this->_rowoffset][$col + $this->_coloffset] = $string;
if ($raw)
$this->sheets[$this->sn]['cellsInfo'][$row + $this->_rowoffset][$col + $this->_coloffset]['raw'] = $raw;
if (isset($this->rectype))
$this->sheets[$this->sn]['cellsInfo'][$row + $this->_rowoffset][$col + $this->_coloffset]['type'] = $this->rectype;
}
function _GetIEEE754($rknum)
{
if (($rknum & 0x02) != 0) {
$value = $rknum >> 2;
} else {
//mmp
// first comment out the prev
IoUsly existing 7 lines of code here
// $tmp = unpack("d",pack("VV",($rknum & 0xfffffffc)));
// //$value = $tmp[''];
// if (array_key_exists(1,$tmp)) {
// $value = $tmp[1];
// } else {
// $value = $tmp[''];
// }
// I got my info on IEEE754 encoding from
//
http://research.microsoft.com/~hollasch/cgindex/coding/ieeefloat.html // The RK format calls for using only the most significant 30 bits of the
// 64 bit floating point value. The other 34 bits are assumed to be 0
// So,we use the upper 30 bits of $rknum as follows...
$sign = ($rknum & 0x80000000) >> 31;
$exp = ($rknum & 0x7ff00000) >> 20;
$mantissa = (0x100000 | ($rknum & 0x000ffffc));
$value = $mantissa / pow( 2,(20- ($exp - 1023)));
if ($sign) {$value = -1
$value;}
//end of changes by mmp
}
if (($rknum & 0x01) != 0) {
$value /= 100;
}
return $value;
}
function _encodeUTF16($string)
{
$result = $string;
if ($this->_defaultEncoding){
switch ($this->_encoderFunction){
case 'iconv' : $result = iconv('UTF-16LE',$this->_defaultEncoding,$string);
break;
case 'mb_convert_encoding' : $result = mb_convert_encoding($string,'UTF-16LE' );
break;
}
}
return $result;
}
function _GetInt4d($data,$pos)
{
$value = ord($data[$pos]) | (ord($data[$pos+1]) << 8) | (ord($data[$pos+2]) << 16) | (ord($data[$pos+3]) << 24);
if ($value>=4294967294)
{
$value=-2;
}
return $value;
}
}
/ Local variables:
tab-width: 4
c-basic-offset: 4
c-hanging-comment-ender-p: nil
End:
/
?>