Source for file Excel2003XML.php
Documentation is available at Excel2003XML.php
* Copyright (c) 2006 - 2011 PHPExcel
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
* You should have received a copy of the GNU Lesser General Public
* License along with this library; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
* @package PHPExcel_Reader
* @copyright Copyright (c) 2006 - 2011 PHPExcel (http://www.codeplex.com/PHPExcel)
* @license http://www.gnu.org/licenses/old-licenses/lgpl-2.1.txt LGPL
* @version 1.7.6, 2011-02-27
/** PHPExcel root directory */
define('PHPEXCEL_ROOT', dirname(__FILE__ ) . '/../../');
require (PHPEXCEL_ROOT . 'PHPExcel/Autoloader.php');
* PHPExcel_Reader_Excel2003XML
* @package PHPExcel_Reader
* @copyright Copyright (c) 2006 - 2011 PHPExcel (http://www.codeplex.com/PHPExcel)
private $_readDataOnly = false;
* Restrict which sheets should be loaded?
private $_loadSheetsOnly = null;
private $_styles = array();
* PHPExcel_Reader_IReadFilter instance
* @var PHPExcel_Reader_IReadFilter
private $_readFilter = null;
return $this->_readDataOnly;
* @return PHPExcel_Reader_Excel2003XML
$this->_readDataOnly = $pValue;
* Get which sheets to load
return $this->_loadSheetsOnly;
* Set which sheets to load
* @return PHPExcel_Reader_Excel2003XML
$this->_loadSheetsOnly = is_array($value) ?
* @return PHPExcel_Reader_Excel2003XML
$this->_loadSheetsOnly = null;
* @return PHPExcel_Reader_IReadFilter
return $this->_readFilter;
* @param PHPExcel_Reader_IReadFilter $pValue
* @return PHPExcel_Reader_Excel2003XML
public function setReadFilter(PHPExcel_Reader_IReadFilter $pValue) {
$this->_readFilter = $pValue;
* Create a new PHPExcel_Reader_Excel2003XML
* Can the current PHPExcel_Reader_IReader read the file?
* @param string $pFilename
public function canRead($pFilename)
// Office xmlns:o="urn:schemas-microsoft-com:office:office"
// Excel xmlns:x="urn:schemas-microsoft-com:office:excel"
// XML Spreadsheet xmlns:ss="urn:schemas-microsoft-com:office:spreadsheet"
// Spreadsheet component xmlns:c="urn:schemas-microsoft-com:office:component:spreadsheet"
// XML schema xmlns:s="uuid:BDC6E3F0-6DA3-11d1-A2A3-00AA00C14882"
// XML data type xmlns:dt="uuid:C2F41010-65B3-11d1-A29F-00AA00C14882"
// MS-persist recordset xmlns:rs="urn:schemas-microsoft-com:rowset"
// Rowset xmlns:z="#RowsetSchema"
'<?mso-application progid="Excel.Sheet"?>'
throw new Exception("Could not open " . $pFilename . " for reading! File does not exist.");
// Read sample data (first 2 KB will do)
$fh = fopen($pFilename, 'r');
$data = fread($fh, 2048);
foreach($signature as $match) {
// every part of the signature must be present
if (strpos($data, $match) === false) {
* Reads names of the worksheets from a file, without parsing the whole file to a PHPExcel object
* @param string $pFilename
throw new Exception("Could not open " . $pFilename . " for reading! File does not exist.");
$worksheetNames = array();
$namespaces = $xml->getNamespaces(true);
$xml_ss = $xml->children($namespaces['ss']);
foreach($xml_ss->Worksheet as $worksheet) {
$worksheet_ss = $worksheet->attributes($namespaces['ss']);
$worksheetNames[] = $worksheet_ss['Name'];
* Loads PHPExcel from file
* @param string $pFilename
public function load($pFilename)
// Load into this instance
private static function identifyFixedStyleValue($styleList,&$styleAttributeValue) {
$styleAttributeValue = strtolower($styleAttributeValue);
foreach($styleList as $style) {
$styleAttributeValue = $style;
* Convert pixel units to Excel width units (units of 1/256th of a character width)
private static function _pixel2WidthUnits($pxs) {
$UNIT_OFFSET_MAP = array(0, 36, 73, 109, 146, 182, 219);
$widthUnits = 256 * ($pxs / 7);
$widthUnits += $UNIT_OFFSET_MAP[($pxs % 7)];
* Convert Excel width units (units of 1/256th of a character width) to pixel units
private static function _widthUnits2Pixel($widthUnits) {
$pixels = ($widthUnits / 256) * 7;
$offsetWidthUnits = $widthUnits % 256;
$pixels += round($offsetWidthUnits / (256 / 7));
private static function _hex2str($hex) {
* Loads PHPExcel from file into PHPExcel instance
* @param string $pFilename
* @param PHPExcel $objPHPExcel
$fromFormats = array('\-', '\ ');
$toFormats = array('-', ' ');
$underlineStyles = array (
$verticalAlignmentStyles = array (
$horizontalAlignmentStyles = array (
$timezoneObj = new DateTimeZone('Europe/London');
$GMT = new DateTimeZone('UTC');
throw new Exception("Could not open " . $pFilename . " for reading! File does not exist.");
$namespaces = $xml->getNamespaces(true);
$docProps = $objPHPExcel->getProperties();
if (isset ($xml->DocumentProperties[0])) {
foreach($xml->DocumentProperties[0] as $propertyName => $propertyValue) {
$docProps->setTitle($propertyValue);
$docProps->setSubject($propertyValue);
$docProps->setCreator($propertyValue);
$docProps->setCreated($creationDate);
$docProps->setLastModifiedBy($propertyValue);
$docProps->setModified($lastSaveDate);
$docProps->setCompany($propertyValue);
$docProps->setCategory($propertyValue);
$docProps->setManager($propertyValue);
$docProps->setKeywords($propertyValue);
$docProps->setDescription($propertyValue);
if (isset ($xml->CustomDocumentProperties)) {
foreach($xml->CustomDocumentProperties[0] as $propertyName => $propertyValue) {
$propertyAttributes = $propertyValue->attributes($namespaces['dt']);
$propertyName = preg_replace_callback('/_x([0-9a-z]{4})_/','PHPExcel_Reader_Excel2003XML::_hex2str',$propertyName);
switch((string) $propertyAttributes) {
$propertyValue = trim($propertyValue);
$propertyValue = (bool) $propertyValue;
$propertyValue = intval($propertyValue);
$propertyValue = floatval($propertyValue);
$docProps->setCustomProperty($propertyName,$propertyValue,$propertyType);
foreach($xml->Styles[0] as $style) {
$style_ss = $style->attributes($namespaces['ss']);
$styleID = (string) $style_ss['ID'];
// echo 'Style ID = '.$styleID.'<br />';
if ($styleID == 'Default') {
$this->_styles['Default'] = array();
$this->_styles[$styleID] = $this->_styles['Default'];
foreach ($style as $styleType => $styleData) {
$styleAttributes = $styleData->attributes($namespaces['ss']);
// echo $styleType.'<br />';
foreach($styleAttributes as $styleAttributeKey => $styleAttributeValue) {
// echo $styleAttributeKey.' = '.$styleAttributeValue.'<br />';
$styleAttributeValue = (string) $styleAttributeValue;
switch ($styleAttributeKey) {
if (self::identifyFixedStyleValue($verticalAlignmentStyles,$styleAttributeValue)) {
$this->_styles[$styleID]['alignment']['vertical'] = $styleAttributeValue;
if (self::identifyFixedStyleValue($horizontalAlignmentStyles,$styleAttributeValue)) {
$this->_styles[$styleID]['alignment']['horizontal'] = $styleAttributeValue;
$this->_styles[$styleID]['alignment']['wrap'] = true;
foreach($styleData->Border as $borderStyle) {
$borderAttributes = $borderStyle->attributes($namespaces['ss']);
foreach($borderAttributes as $borderStyleKey => $borderStyleValue) {
// echo $borderStyleKey.' = '.$borderStyleValue.'<br />';
switch ($borderStyleKey) {
// $thisBorder['style'] = $borderStyleValue;
// $thisBorder['style'] = $borderStyleValue;
$borderColour = substr($borderStyleValue,1);
$thisBorder['color']['rgb'] = $borderColour;
if (count($thisBorder) > 0) {
if (($borderPosition == 'left') || ($borderPosition == 'right') || ($borderPosition == 'top') || ($borderPosition == 'bottom')) {
$this->_styles[$styleID]['borders'][$borderPosition] = $thisBorder;
foreach($styleAttributes as $styleAttributeKey => $styleAttributeValue) {
// echo $styleAttributeKey.' = '.$styleAttributeValue.'<br />';
$styleAttributeValue = (string) $styleAttributeValue;
switch ($styleAttributeKey) {
$this->_styles[$styleID]['font']['name'] = $styleAttributeValue;
$this->_styles[$styleID]['font']['size'] = $styleAttributeValue;
$this->_styles[$styleID]['font']['color']['rgb'] = substr($styleAttributeValue,1);
$this->_styles[$styleID]['font']['bold'] = true;
$this->_styles[$styleID]['font']['italic'] = true;
if (self::identifyFixedStyleValue($underlineStyles,$styleAttributeValue)) {
$this->_styles[$styleID]['font']['underline'] = $styleAttributeValue;
foreach($styleAttributes as $styleAttributeKey => $styleAttributeValue) {
// echo $styleAttributeKey.' = '.$styleAttributeValue.'<br />';
switch ($styleAttributeKey) {
$this->_styles[$styleID]['fill']['color']['rgb'] = substr($styleAttributeValue,1);
foreach($styleAttributes as $styleAttributeKey => $styleAttributeValue) {
// echo $styleAttributeKey.' = '.$styleAttributeValue.'<br />';
$styleAttributeValue = str_replace($fromFormats,$toFormats,$styleAttributeValue);
switch ($styleAttributeValue) {
$styleAttributeValue = 'dd/mm/yyyy';
if ($styleAttributeValue > '') {
$this->_styles[$styleID]['numberformat']['code'] = $styleAttributeValue;
foreach($styleAttributes as $styleAttributeKey => $styleAttributeValue) {
// echo $styleAttributeKey.' = '.$styleAttributeValue.'<br />';
// print_r($this->_styles[$styleID]);
$xml_ss = $xml->children($namespaces['ss']);
foreach($xml_ss->Worksheet as $worksheet) {
$worksheet_ss = $worksheet->attributes($namespaces['ss']);
if ((isset ($this->_loadSheetsOnly)) && (isset ($worksheet_ss['Name'])) &&
(!in_array($worksheet_ss['Name'], $this->_loadSheetsOnly))) {
// echo '<h3>Worksheet: ',$worksheet_ss['Name'],'<h3>';
$objPHPExcel->createSheet();
$objPHPExcel->setActiveSheetIndex($worksheetID);
if (isset ($worksheet_ss['Name'])) {
$worksheetName = (string) $worksheet_ss['Name'];
$objPHPExcel->getActiveSheet()->setTitle($worksheetName);
if (isset ($worksheet->Table->Column)) {
foreach($worksheet->Table->Column as $columnData) {
$columnData_ss = $columnData->attributes($namespaces['ss']);
if (isset ($columnData_ss['Index'])) {
if (isset ($columnData_ss['Width'])) {
$columnWidth = $columnData_ss['Width'];
// echo '<b>Setting column width for '.$columnID.' to '.$columnWidth.'</b><br />';
$objPHPExcel->getActiveSheet()->getColumnDimension($columnID)->setWidth($columnWidth / 5.4);
if (isset ($worksheet->Table->Row)) {
foreach($worksheet->Table->Row as $rowData) {
$row_ss = $rowData->attributes($namespaces['ss']);
if (isset ($row_ss['Index'])) {
$rowID = (integer) $row_ss['Index'];
// echo '<b>Row '.$rowID.'</b><br />';
foreach($rowData->Cell as $cell) {
$cell_ss = $cell->attributes($namespaces['ss']);
if (isset ($cell_ss['Index'])) {
$cellRange = $columnID. $rowID;
if (!$this->getReadFilter()->readCell($columnID, $rowID, $worksheetName)) {
if ((isset ($cell_ss['MergeAcross'])) || (isset ($cell_ss['MergeDown']))) {
if (isset ($cell_ss['MergeAcross'])) {
if (isset ($cell_ss['MergeDown'])) {
$rowTo = $rowTo + $cell_ss['MergeDown'];
$cellRange .= ':'. $columnTo. $rowTo;
$objPHPExcel->getActiveSheet()->mergeCells($cellRange);
$cellIsSet = $hasCalculatedValue = false;
if (isset ($cell_ss['Formula'])) {
$cellDataFormula = $cell_ss['Formula'];
// added this as a check for array formulas
if (isset ($cell_ss['ArrayRange'])) {
$cellDataCSEFormula = $cell_ss['ArrayRange'];
// echo "found an array formula at ".$columnID.$rowID."<br />";
$hasCalculatedValue = true;
if (isset ($cell->Data)) {
$cellValue = $cellData = $cell->Data;
$cellData_ss = $cellData->attributes($namespaces['ss']);
if (isset ($cellData_ss['Type'])) {
$cellDataType = $cellData_ss['Type'];
const TYPE_FORMULA = 'f';
const TYPE_NUMERIC = 'n';
const TYPE_INLINE = 'inlineStr';
$cellValue = (float) $cellValue;
if (floor($cellValue) == $cellValue) {
$cellValue = (integer) $cellValue;
$cellValue = ($cellValue != 0);
if ($hasCalculatedValue) {
if (substr($cellDataFormula,0,3) == 'of:') {
$cellDataFormula = substr($cellDataFormula,3);
// echo 'Before: ',$cellDataFormula,'<br />';
$temp = explode('"',$cellDataFormula);
foreach($temp as &$value) {
// Only replace in alternate array entries (i.e. non-quoted blocks)
// Convert R1C1 style references to A1 style references (but only when not quoted)
// echo 'Before: ',$cellDataFormula,'<br />';
$temp = explode('"',$cellDataFormula);
foreach($temp as &$value) {
// Only replace in alternate array entries (i.e. non-quoted blocks)
preg_match_all('/(R(\[?-?\d*\]?))(C(\[?-?\d*\]?))/',$value, $cellReferences,PREG_SET_ORDER+ PREG_OFFSET_CAPTURE);
// Reverse the matches array, otherwise all our offsets will become incorrect if we modify our way
// through the formula from left to right. Reversing means that we work right to left through the formula.
// Loop through each R1C1 style reference in turn, converting it to its A1 style equivalent,
// then modify the formula to use that new reference
foreach($cellReferences as $cellReference) {
$rowReference = $cellReference[2][0];
// Empty R reference is the current row
if ($rowReference == '') $rowReference = $rowID;
// Bracketed R references are relative to the current row
if ($rowReference{0} == '[') $rowReference = $rowID + trim($rowReference,'[]');
$columnReference = $cellReference[4][0];
// Empty C reference is the current column
if ($columnReference == '') $columnReference = $columnNumber;
// Bracketed C references are relative to the current column
if ($columnReference{0} == '[') $columnReference = $columnNumber + trim($columnReference,'[]');
// Then rebuild the formula string
$cellDataFormula = implode('"',$temp);
// echo 'After: ',$cellDataFormula,'<br />';
// echo 'Cell '.$columnID.$rowID.' is a '.$type.' with a value of '.(($hasCalculatedValue) ? $cellDataFormula : $cellValue).'<br />';
$objPHPExcel->getActiveSheet()->getCell($columnID. $rowID)->setValueExplicit((($hasCalculatedValue) ? $cellDataFormula : $cellValue),$type);
if ($hasCalculatedValue) {
// echo 'Formula result is '.$cellValue.'<br />';
$objPHPExcel->getActiveSheet()->getCell($columnID. $rowID)->setCalculatedValue($cellValue);
$cellIsSet = $rowHasData = true;
if (isset ($cell->Comment)) {
// echo '<b>comment found</b><br />';
$commentAttributes = $cell->Comment->attributes($namespaces['ss']);
if (isset ($commentAttributes->Author)) {
$author = (string) $commentAttributes->Author;
// echo 'Author: ',$author,'<br />';
$node = $cell->Comment->Data->asXML();
// $annotation = str_replace('html:','',substr($node,49,-10));
// echo $annotation,'<br />';
// echo 'Annotation: ',$annotation,'<br />';
$objPHPExcel->getActiveSheet()->getComment( $columnID. $rowID )
->setText($this->_parseRichText($annotation) );
if (($cellIsSet) && (isset ($cell_ss['StyleID']))) {
$style = (string) $cell_ss['StyleID'];
// echo 'Cell style for '.$columnID.$rowID.' is '.$style.'<br />';
if ((isset ($this->_styles[$style])) && (count($this->_styles[$style]) > 0)) {
// echo 'Cell '.$columnID.$rowID.'<br />';
// print_r($this->_styles[$style]);
if (!$objPHPExcel->getActiveSheet()->cellExists($columnID. $rowID)) {
$objPHPExcel->getActiveSheet()->getCell($columnID. $rowID)->setValue(NULL);
$objPHPExcel->getActiveSheet()->getStyle($cellRange)->applyFromArray($this->_styles[$style]);
if (isset ($row_ss['StyleID'])) {
$rowStyle = $row_ss['StyleID'];
if (isset ($row_ss['Height'])) {
$rowHeight = $row_ss['Height'];
// echo '<b>Setting row height to '.$rowHeight.'</b><br />';
$objPHPExcel->getActiveSheet()->getRowDimension($rowID)->setRowHeight($rowHeight);
private function _parseRichText($is = '') {
|