<?php
|
|
namespace PhpOffice\PhpSpreadsheet\Reader;
|
|
use PhpOffice\PhpSpreadsheet\Calculation\Calculation;
|
use PhpOffice\PhpSpreadsheet\Cell\Coordinate;
|
use PhpOffice\PhpSpreadsheet\Shared\StringHelper;
|
use PhpOffice\PhpSpreadsheet\Spreadsheet;
|
use PhpOffice\PhpSpreadsheet\Style\Border;
|
|
class Slk extends BaseReader
|
{
|
/**
|
* Input encoding.
|
*
|
* @var string
|
*/
|
private $inputEncoding = 'ANSI';
|
|
/**
|
* Sheet index to read.
|
*
|
* @var int
|
*/
|
private $sheetIndex = 0;
|
|
/**
|
* Formats.
|
*
|
* @var array
|
*/
|
private $formats = [];
|
|
/**
|
* Format Count.
|
*
|
* @var int
|
*/
|
private $format = 0;
|
|
/**
|
* Create a new SYLK Reader instance.
|
*/
|
public function __construct()
|
{
|
parent::__construct();
|
}
|
|
/**
|
* Validate that the current file is a SYLK file.
|
*
|
* @param string $pFilename
|
*
|
* @return bool
|
*/
|
public function canRead($pFilename)
|
{
|
// Check if file exists
|
try {
|
$this->openFile($pFilename);
|
} catch (Exception $e) {
|
return false;
|
}
|
|
// Read sample data (first 2 KB will do)
|
$data = fread($this->fileHandle, 2048);
|
|
// Count delimiters in file
|
$delimiterCount = substr_count($data, ';');
|
$hasDelimiter = $delimiterCount > 0;
|
|
// Analyze first line looking for ID; signature
|
$lines = explode("\n", $data);
|
$hasId = substr($lines[0], 0, 4) === 'ID;P';
|
|
fclose($this->fileHandle);
|
|
return $hasDelimiter && $hasId;
|
}
|
|
/**
|
* Set input encoding.
|
*
|
* @param string $pValue Input encoding, eg: 'ANSI'
|
*
|
* @return $this
|
*/
|
public function setInputEncoding($pValue)
|
{
|
$this->inputEncoding = $pValue;
|
|
return $this;
|
}
|
|
/**
|
* Get input encoding.
|
*
|
* @return string
|
*/
|
public function getInputEncoding()
|
{
|
return $this->inputEncoding;
|
}
|
|
/**
|
* Return worksheet info (Name, Last Column Letter, Last Column Index, Total Rows, Total Columns).
|
*
|
* @param string $pFilename
|
*
|
* @throws Exception
|
*
|
* @return array
|
*/
|
public function listWorksheetInfo($pFilename)
|
{
|
// Open file
|
if (!$this->canRead($pFilename)) {
|
throw new Exception($pFilename . ' is an Invalid Spreadsheet file.');
|
}
|
$this->openFile($pFilename);
|
$fileHandle = $this->fileHandle;
|
rewind($fileHandle);
|
|
$worksheetInfo = [];
|
$worksheetInfo[0]['worksheetName'] = 'Worksheet';
|
$worksheetInfo[0]['lastColumnLetter'] = 'A';
|
$worksheetInfo[0]['lastColumnIndex'] = 0;
|
$worksheetInfo[0]['totalRows'] = 0;
|
$worksheetInfo[0]['totalColumns'] = 0;
|
|
// loop through one row (line) at a time in the file
|
$rowIndex = 0;
|
while (($rowData = fgets($fileHandle)) !== false) {
|
$columnIndex = 0;
|
|
// convert SYLK encoded $rowData to UTF-8
|
$rowData = StringHelper::SYLKtoUTF8($rowData);
|
|
// explode each row at semicolons while taking into account that literal semicolon (;)
|
// is escaped like this (;;)
|
$rowData = explode("\t", str_replace('¤', ';', str_replace(';', "\t", str_replace(';;', '¤', rtrim($rowData)))));
|
|
$dataType = array_shift($rowData);
|
if ($dataType == 'C') {
|
// Read cell value data
|
foreach ($rowData as $rowDatum) {
|
switch ($rowDatum[0]) {
|
case 'C':
|
case 'X':
|
$columnIndex = substr($rowDatum, 1) - 1;
|
|
break;
|
case 'R':
|
case 'Y':
|
$rowIndex = substr($rowDatum, 1);
|
|
break;
|
}
|
|
$worksheetInfo[0]['totalRows'] = max($worksheetInfo[0]['totalRows'], $rowIndex);
|
$worksheetInfo[0]['lastColumnIndex'] = max($worksheetInfo[0]['lastColumnIndex'], $columnIndex);
|
}
|
}
|
}
|
|
$worksheetInfo[0]['lastColumnLetter'] = Coordinate::stringFromColumnIndex($worksheetInfo[0]['lastColumnIndex'] + 1);
|
$worksheetInfo[0]['totalColumns'] = $worksheetInfo[0]['lastColumnIndex'] + 1;
|
|
// Close file
|
fclose($fileHandle);
|
|
return $worksheetInfo;
|
}
|
|
/**
|
* Loads PhpSpreadsheet from file.
|
*
|
* @param string $pFilename
|
*
|
* @throws Exception
|
*
|
* @return Spreadsheet
|
*/
|
public function load($pFilename)
|
{
|
// Create new Spreadsheet
|
$spreadsheet = new Spreadsheet();
|
|
// Load into this instance
|
return $this->loadIntoExisting($pFilename, $spreadsheet);
|
}
|
|
/**
|
* Loads PhpSpreadsheet from file into PhpSpreadsheet instance.
|
*
|
* @param string $pFilename
|
* @param Spreadsheet $spreadsheet
|
*
|
* @throws Exception
|
*
|
* @return Spreadsheet
|
*/
|
public function loadIntoExisting($pFilename, Spreadsheet $spreadsheet)
|
{
|
// Open file
|
if (!$this->canRead($pFilename)) {
|
throw new Exception($pFilename . ' is an Invalid Spreadsheet file.');
|
}
|
$this->openFile($pFilename);
|
$fileHandle = $this->fileHandle;
|
rewind($fileHandle);
|
|
// Create new Worksheets
|
while ($spreadsheet->getSheetCount() <= $this->sheetIndex) {
|
$spreadsheet->createSheet();
|
}
|
$spreadsheet->setActiveSheetIndex($this->sheetIndex);
|
|
$fromFormats = ['\-', '\ '];
|
$toFormats = ['-', ' '];
|
|
// Loop through file
|
$column = $row = '';
|
|
// loop through one row (line) at a time in the file
|
while (($rowData = fgets($fileHandle)) !== false) {
|
// convert SYLK encoded $rowData to UTF-8
|
$rowData = StringHelper::SYLKtoUTF8($rowData);
|
|
// explode each row at semicolons while taking into account that literal semicolon (;)
|
// is escaped like this (;;)
|
$rowData = explode("\t", str_replace('¤', ';', str_replace(';', "\t", str_replace(';;', '¤', rtrim($rowData)))));
|
|
$dataType = array_shift($rowData);
|
// Read shared styles
|
if ($dataType == 'P') {
|
$formatArray = [];
|
foreach ($rowData as $rowDatum) {
|
switch ($rowDatum[0]) {
|
case 'P':
|
$formatArray['numberFormat']['formatCode'] = str_replace($fromFormats, $toFormats, substr($rowDatum, 1));
|
|
break;
|
case 'E':
|
case 'F':
|
$formatArray['font']['name'] = substr($rowDatum, 1);
|
|
break;
|
case 'L':
|
$formatArray['font']['size'] = substr($rowDatum, 1);
|
|
break;
|
case 'S':
|
$styleSettings = substr($rowDatum, 1);
|
$iMax = strlen($styleSettings);
|
for ($i = 0; $i < $iMax; ++$i) {
|
switch ($styleSettings[$i]) {
|
case 'I':
|
$formatArray['font']['italic'] = true;
|
|
break;
|
case 'D':
|
$formatArray['font']['bold'] = true;
|
|
break;
|
case 'T':
|
$formatArray['borders']['top']['borderStyle'] = Border::BORDER_THIN;
|
|
break;
|
case 'B':
|
$formatArray['borders']['bottom']['borderStyle'] = Border::BORDER_THIN;
|
|
break;
|
case 'L':
|
$formatArray['borders']['left']['borderStyle'] = Border::BORDER_THIN;
|
|
break;
|
case 'R':
|
$formatArray['borders']['right']['borderStyle'] = Border::BORDER_THIN;
|
|
break;
|
}
|
}
|
|
break;
|
}
|
}
|
$this->formats['P' . $this->format++] = $formatArray;
|
// Read cell value data
|
} elseif ($dataType == 'C') {
|
$hasCalculatedValue = false;
|
$cellData = $cellDataFormula = '';
|
foreach ($rowData as $rowDatum) {
|
switch ($rowDatum[0]) {
|
case 'C':
|
case 'X':
|
$column = substr($rowDatum, 1);
|
|
break;
|
case 'R':
|
case 'Y':
|
$row = substr($rowDatum, 1);
|
|
break;
|
case 'K':
|
$cellData = substr($rowDatum, 1);
|
|
break;
|
case 'E':
|
$cellDataFormula = '=' . substr($rowDatum, 1);
|
// Convert R1C1 style references to A1 style references (but only when not quoted)
|
$temp = explode('"', $cellDataFormula);
|
$key = false;
|
foreach ($temp as &$value) {
|
// Only count/replace in alternate array entries
|
if ($key = !$key) {
|
preg_match_all('/(R(\[?-?\d*\]?))(C(\[?-?\d*\]?))/', $value, $cellReferences, PREG_SET_ORDER + PREG_OFFSET_CAPTURE);
|
// Reverse the matches array, otherwise all our offsets will become incorrect if we modify our way
|
// through the formula from left to right. Reversing means that we work right to left.through
|
// the formula
|
$cellReferences = array_reverse($cellReferences);
|
// Loop through each R1C1 style reference in turn, converting it to its A1 style equivalent,
|
// then modify the formula to use that new reference
|
foreach ($cellReferences as $cellReference) {
|
$rowReference = $cellReference[2][0];
|
// Empty R reference is the current row
|
if ($rowReference == '') {
|
$rowReference = $row;
|
}
|
// Bracketed R references are relative to the current row
|
if ($rowReference[0] == '[') {
|
$rowReference = $row + trim($rowReference, '[]');
|
}
|
$columnReference = $cellReference[4][0];
|
// Empty C reference is the current column
|
if ($columnReference == '') {
|
$columnReference = $column;
|
}
|
// Bracketed C references are relative to the current column
|
if ($columnReference[0] == '[') {
|
$columnReference = $column + trim($columnReference, '[]');
|
}
|
$A1CellReference = Coordinate::stringFromColumnIndex($columnReference) . $rowReference;
|
|
$value = substr_replace($value, $A1CellReference, $cellReference[0][1], strlen($cellReference[0][0]));
|
}
|
}
|
}
|
unset($value);
|
// Then rebuild the formula string
|
$cellDataFormula = implode('"', $temp);
|
$hasCalculatedValue = true;
|
|
break;
|
}
|
}
|
$columnLetter = Coordinate::stringFromColumnIndex($column);
|
$cellData = Calculation::unwrapResult($cellData);
|
|
// Set cell value
|
$spreadsheet->getActiveSheet()->getCell($columnLetter . $row)->setValue(($hasCalculatedValue) ? $cellDataFormula : $cellData);
|
if ($hasCalculatedValue) {
|
$cellData = Calculation::unwrapResult($cellData);
|
$spreadsheet->getActiveSheet()->getCell($columnLetter . $row)->setCalculatedValue($cellData);
|
}
|
// Read cell formatting
|
} elseif ($dataType == 'F') {
|
$formatStyle = $columnWidth = $styleSettings = '';
|
$styleData = [];
|
foreach ($rowData as $rowDatum) {
|
switch ($rowDatum[0]) {
|
case 'C':
|
case 'X':
|
$column = substr($rowDatum, 1);
|
|
break;
|
case 'R':
|
case 'Y':
|
$row = substr($rowDatum, 1);
|
|
break;
|
case 'P':
|
$formatStyle = $rowDatum;
|
|
break;
|
case 'W':
|
[$startCol, $endCol, $columnWidth] = explode(' ', substr($rowDatum, 1));
|
|
break;
|
case 'S':
|
$styleSettings = substr($rowDatum, 1);
|
$iMax = strlen($styleSettings);
|
for ($i = 0; $i < $iMax; ++$i) {
|
switch ($styleSettings[$i]) {
|
case 'I':
|
$styleData['font']['italic'] = true;
|
|
break;
|
case 'D':
|
$styleData['font']['bold'] = true;
|
|
break;
|
case 'T':
|
$styleData['borders']['top']['borderStyle'] = Border::BORDER_THIN;
|
|
break;
|
case 'B':
|
$styleData['borders']['bottom']['borderStyle'] = Border::BORDER_THIN;
|
|
break;
|
case 'L':
|
$styleData['borders']['left']['borderStyle'] = Border::BORDER_THIN;
|
|
break;
|
case 'R':
|
$styleData['borders']['right']['borderStyle'] = Border::BORDER_THIN;
|
|
break;
|
}
|
}
|
|
break;
|
}
|
}
|
if (($formatStyle > '') && ($column > '') && ($row > '')) {
|
$columnLetter = Coordinate::stringFromColumnIndex($column);
|
if (isset($this->formats[$formatStyle])) {
|
$spreadsheet->getActiveSheet()->getStyle($columnLetter . $row)->applyFromArray($this->formats[$formatStyle]);
|
}
|
}
|
if ((!empty($styleData)) && ($column > '') && ($row > '')) {
|
$columnLetter = Coordinate::stringFromColumnIndex($column);
|
$spreadsheet->getActiveSheet()->getStyle($columnLetter . $row)->applyFromArray($styleData);
|
}
|
if ($columnWidth > '') {
|
if ($startCol == $endCol) {
|
$startCol = Coordinate::stringFromColumnIndex($startCol);
|
$spreadsheet->getActiveSheet()->getColumnDimension($startCol)->setWidth($columnWidth);
|
} else {
|
$startCol = Coordinate::stringFromColumnIndex($startCol);
|
$endCol = Coordinate::stringFromColumnIndex($endCol);
|
$spreadsheet->getActiveSheet()->getColumnDimension($startCol)->setWidth($columnWidth);
|
do {
|
$spreadsheet->getActiveSheet()->getColumnDimension(++$startCol)->setWidth($columnWidth);
|
} while ($startCol != $endCol);
|
}
|
}
|
} else {
|
foreach ($rowData as $rowDatum) {
|
switch ($rowDatum[0]) {
|
case 'C':
|
case 'X':
|
$column = substr($rowDatum, 1);
|
|
break;
|
case 'R':
|
case 'Y':
|
$row = substr($rowDatum, 1);
|
|
break;
|
}
|
}
|
}
|
}
|
|
// Close file
|
fclose($fileHandle);
|
|
// Return
|
return $spreadsheet;
|
}
|
|
/**
|
* Get sheet index.
|
*
|
* @return int
|
*/
|
public function getSheetIndex()
|
{
|
return $this->sheetIndex;
|
}
|
|
/**
|
* Set sheet index.
|
*
|
* @param int $pValue Sheet index
|
*
|
* @return $this
|
*/
|
public function setSheetIndex($pValue)
|
{
|
$this->sheetIndex = $pValue;
|
|
return $this;
|
}
|
}
|