| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515 |
- <?php
- /**
- * This file is part of PHPWord - A pure PHP library for reading and writing
- * word processing documents.
- *
- * PHPWord is free software distributed under the terms of the GNU Lesser
- * General Public License version 3 as published by the Free Software Foundation.
- *
- * For the full copyright and license information, please read the LICENSE
- * file that was distributed with this source code. For the full list of
- * contributors, visit https://github.com/PHPOffice/PHPWord/contributors.
- *
- * @link https://github.com/PHPOffice/PHPWord
- * @copyright 2010-2014 PHPWord contributors
- * @license http://www.gnu.org/licenses/lgpl.txt LGPL version 3
- */
- namespace PhpOffice\PhpWord\Reader\Word2007;
- use PhpOffice\PhpWord\PhpWord;
- use PhpOffice\PhpWord\Shared\XMLReader;
- /**
- * Abstract part reader
- *
- * This class is inherited by ODText reader
- *
- * @since 0.10.0
- */
- abstract class AbstractPart
- {
- /**
- * Conversion method
- *
- * @const int
- */
- const READ_VALUE = 'attributeValue'; // Read attribute value
- const READ_EQUAL = 'attributeEquals'; // Read `true` when attribute value equals specified value
- const READ_TRUE = 'attributeTrue'; // Read `true` when element exists
- const READ_FALSE = 'attributeFalse'; // Read `false` when element exists
- const READ_SIZE = 'attributeMultiplyByTwo'; // Read special attribute value for Font::$size
- /**
- * Document file
- *
- * @var string
- */
- protected $docFile;
- /**
- * XML file
- *
- * @var string
- */
- protected $xmlFile;
- /**
- * Part relationships
- *
- * @var array
- */
- protected $rels = array();
- /**
- * Read part.
- */
- abstract public function read(PhpWord $phpWord);
- /**
- * Create new instance
- *
- * @param string $docFile
- * @param string $xmlFile
- */
- public function __construct($docFile, $xmlFile)
- {
- $this->docFile = $docFile;
- $this->xmlFile = $xmlFile;
- }
- /**
- * Set relationships.
- *
- * @param array $value
- * @return void
- */
- public function setRels($value)
- {
- $this->rels = $value;
- }
- /**
- * Read w:p.
- *
- * @param \PhpOffice\PhpWord\Shared\XMLReader $xmlReader
- * @param \DOMElement $domNode
- * @param mixed $parent
- * @param string $docPart
- * @return void
- *
- * @todo Get font style for preserve text
- */
- protected function readParagraph(XMLReader $xmlReader, \DOMElement $domNode, $parent, $docPart = 'document')
- {
- // Paragraph style
- $paragraphStyle = null;
- $headingMatches = array();
- if ($xmlReader->elementExists('w:pPr', $domNode)) {
- $paragraphStyle = $this->readParagraphStyle($xmlReader, $domNode);
- if (is_array($paragraphStyle) && isset($paragraphStyle['styleName'])) {
- preg_match('/Heading(\d)/', $paragraphStyle['styleName'], $headingMatches);
- }
- }
- // PreserveText
- if ($xmlReader->elementExists('w:r/w:instrText', $domNode)) {
- $ignoreText = false;
- $textContent = '';
- $fontStyle = $this->readFontStyle($xmlReader, $domNode);
- $nodes = $xmlReader->getElements('w:r', $domNode);
- foreach ($nodes as $node) {
- $instrText = $xmlReader->getValue('w:instrText', $node);
- if ($xmlReader->elementExists('w:fldChar', $node)) {
- $fldCharType = $xmlReader->getAttribute('w:fldCharType', $node, 'w:fldChar');
- if ($fldCharType == 'begin') {
- $ignoreText = true;
- } elseif ($fldCharType == 'end') {
- $ignoreText = false;
- }
- }
- if (!is_null($instrText)) {
- $textContent .= '{' . $instrText . '}';
- } else {
- if ($ignoreText === false) {
- $textContent .= $xmlReader->getValue('w:t', $node);
- }
- }
- }
- $parent->addPreserveText($textContent, $fontStyle, $paragraphStyle);
- // List item
- } elseif ($xmlReader->elementExists('w:pPr/w:numPr', $domNode)) {
- $textContent = '';
- $numID = $xmlReader->getAttribute('w:val', $domNode, 'w:pPr/w:numPr/w:numID');
- $levelID = $xmlReader->getAttribute('w:val', $domNode, 'w:pPr/w:numPr/w:ilvl');
- $nodes = $xmlReader->getElements('w:r', $domNode);
- foreach ($nodes as $node) {
- $textContent .= $xmlReader->getValue('w:t', $node);
- }
- $parent->addListItem($textContent, $levelID, null, "PHPWordList{$numID}", $paragraphStyle);
- // Heading
- } elseif (!empty($headingMatches)) {
- $textContent = '';
- $nodes = $xmlReader->getElements('w:r', $domNode);
- foreach ($nodes as $node) {
- $textContent .= $xmlReader->getValue('w:t', $node);
- }
- $parent->addTitle($textContent, $headingMatches[1]);
- // Text and TextRun
- } else {
- $runCount = $xmlReader->countElements('w:r', $domNode);
- $linkCount = $xmlReader->countElements('w:hyperlink', $domNode);
- $runLinkCount = $runCount + $linkCount;
- if ($runLinkCount == 0) {
- $parent->addTextBreak(null, $paragraphStyle);
- } else {
- $nodes = $xmlReader->getElements('*', $domNode);
- foreach ($nodes as $node) {
- $this->readRun(
- $xmlReader,
- $node,
- ($runLinkCount > 1) ? $parent->addTextRun($paragraphStyle) : $parent,
- $docPart,
- $paragraphStyle
- );
- }
- }
- }
- }
- /**
- * Read w:r.
- *
- * @param \PhpOffice\PhpWord\Shared\XMLReader $xmlReader
- * @param \DOMElement $domNode
- * @param mixed $parent
- * @param string $docPart
- * @param mixed $paragraphStyle
- * @return void
- *
- * @todo Footnote paragraph style
- */
- protected function readRun(XMLReader $xmlReader, \DOMElement $domNode, $parent, $docPart, $paragraphStyle = null)
- {
- if (!in_array($domNode->nodeName, array('w:r', 'w:hyperlink'))) {
- return;
- }
- $fontStyle = $this->readFontStyle($xmlReader, $domNode);
- // Link
- if ($domNode->nodeName == 'w:hyperlink') {
- $rID = $xmlReader->getAttribute('r:id', $domNode);
- $textContent = $xmlReader->getValue('w:r/w:t', $domNode);
- $target = $this->getMediaTarget($docPart, $rID);
- if (!is_null($target)) {
- $parent->addLink($target, $textContent, $fontStyle, $paragraphStyle);
- }
- } else {
- // Footnote
- if ($xmlReader->elementExists('w:footnoteReference', $domNode)) {
- $parent->addFootnote();
- // Endnote
- } elseif ($xmlReader->elementExists('w:endnoteReference', $domNode)) {
- $parent->addEndnote();
- // Image
- } elseif ($xmlReader->elementExists('w:pict', $domNode)) {
- $rID = $xmlReader->getAttribute('r:id', $domNode, 'w:pict/v:shape/v:imagedata');
- $target = $this->getMediaTarget($docPart, $rID);
- if (!is_null($target)) {
- $imageSource = "zip://{$this->docFile}#{$target}";
- $parent->addImage($imageSource);
- }
- // Object
- } elseif ($xmlReader->elementExists('w:object', $domNode)) {
- $rID = $xmlReader->getAttribute('r:id', $domNode, 'w:object/o:OLEObject');
- // $rIDIcon = $xmlReader->getAttribute('r:id', $domNode, 'w:object/v:shape/v:imagedata');
- $target = $this->getMediaTarget($docPart, $rID);
- if (!is_null($target)) {
- $textContent = "<Object: {$target}>";
- $parent->addText($textContent, $fontStyle, $paragraphStyle);
- }
- // TextRun
- } else {
- $textContent = $xmlReader->getValue('w:t', $domNode);
- $parent->addText($textContent, $fontStyle, $paragraphStyle);
- }
- }
- }
- /**
- * Read w:tbl.
- *
- * @param \PhpOffice\PhpWord\Shared\XMLReader $xmlReader
- * @param \DOMElement $domNode
- * @param mixed $parent
- * @param string $docPart
- * @return void
- */
- protected function readTable(XMLReader $xmlReader, \DOMElement $domNode, $parent, $docPart = 'document')
- {
- // Table style
- $tblStyle = null;
- if ($xmlReader->elementExists('w:tblPr', $domNode)) {
- $tblStyle = $this->readTableStyle($xmlReader, $domNode);
- }
- /** @var \PhpOffice\PhpWord\Element\Table $table Type hint */
- $table = $parent->addTable($tblStyle);
- $tblNodes = $xmlReader->getElements('*', $domNode);
- foreach ($tblNodes as $tblNode) {
- if ($tblNode->nodeName == 'w:tblGrid') { // Column
- // @todo Do something with table columns
- } elseif ($tblNode->nodeName == 'w:tr') { // Row
- $rowHeight = $xmlReader->getAttribute('w:val', $tblNode, 'w:trPr/w:trHeight');
- $rowHRule = $xmlReader->getAttribute('w:hRule', $tblNode, 'w:trPr/w:trHeight');
- $rowHRule = $rowHRule == 'exact' ? true : false;
- $rowStyle = array(
- 'tblHeader' => $xmlReader->elementExists('w:trPr/w:tblHeader', $tblNode),
- 'cantSplit' => $xmlReader->elementExists('w:trPr/w:cantSplit', $tblNode),
- 'exactHeight' => $rowHRule,
- );
- $row = $table->addRow($rowHeight, $rowStyle);
- $rowNodes = $xmlReader->getElements('*', $tblNode);
- foreach ($rowNodes as $rowNode) {
- if ($rowNode->nodeName == 'w:trPr') { // Row style
- // @todo Do something with row style
- } elseif ($rowNode->nodeName == 'w:tc') { // Cell
- $cellWidth = $xmlReader->getAttribute('w:w', $rowNode, 'w:tcPr/w:tcW');
- $cellStyle = null;
- $cellStyleNode = $xmlReader->getElement('w:tcPr', $rowNode);
- if (!is_null($cellStyleNode)) {
- $cellStyle = $this->readCellStyle($xmlReader, $cellStyleNode);
- }
- $cell = $row->addCell($cellWidth, $cellStyle);
- $cellNodes = $xmlReader->getElements('*', $rowNode);
- foreach ($cellNodes as $cellNode) {
- if ($cellNode->nodeName == 'w:p') { // Paragraph
- $this->readParagraph($xmlReader, $cellNode, $cell, $docPart);
- }
- }
- }
- }
- }
- }
- }
- /**
- * Read w:pPr.
- *
- * @param \PhpOffice\PhpWord\Shared\XMLReader $xmlReader
- * @param \DOMElement $domNode
- * @return array|null
- */
- protected function readParagraphStyle(XMLReader $xmlReader, \DOMElement $domNode)
- {
- if (!$xmlReader->elementExists('w:pPr', $domNode)) {
- return null;
- }
- $styleNode = $xmlReader->getElement('w:pPr', $domNode);
- $styleDefs = array(
- 'styleName' => array(self::READ_VALUE, 'w:pStyle'),
- 'align' => array(self::READ_VALUE, 'w:jc'),
- 'basedOn' => array(self::READ_VALUE, 'w:basedOn'),
- 'next' => array(self::READ_VALUE, 'w:next'),
- 'indent' => array(self::READ_VALUE, 'w:ind', 'w:left'),
- 'hanging' => array(self::READ_VALUE, 'w:ind', 'w:hanging'),
- 'spaceAfter' => array(self::READ_VALUE, 'w:spacing', 'w:after'),
- 'spaceBefore' => array(self::READ_VALUE, 'w:spacing', 'w:before'),
- 'widowControl' => array(self::READ_FALSE, 'w:widowControl'),
- 'keepNext' => array(self::READ_TRUE, 'w:keepNext'),
- 'keepLines' => array(self::READ_TRUE, 'w:keepLines'),
- 'pageBreakBefore' => array(self::READ_TRUE, 'w:pageBreakBefore'),
- );
- return $this->readStyleDefs($xmlReader, $styleNode, $styleDefs);
- }
- /**
- * Read w:rPr
- *
- * @param \PhpOffice\PhpWord\Shared\XMLReader $xmlReader
- * @param \DOMElement $domNode
- * @return array|null
- */
- protected function readFontStyle(XMLReader $xmlReader, \DOMElement $domNode)
- {
- if (is_null($domNode)) {
- return null;
- }
- // Hyperlink has an extra w:r child
- if ($domNode->nodeName == 'w:hyperlink') {
- $domNode = $xmlReader->getElement('w:r', $domNode);
- }
- if (!$xmlReader->elementExists('w:rPr', $domNode)) {
- return null;
- }
- $styleNode = $xmlReader->getElement('w:rPr', $domNode);
- $styleDefs = array(
- 'styleName' => array(self::READ_VALUE, 'w:rStyle'),
- 'name' => array(self::READ_VALUE, 'w:rFonts', 'w:ascii'),
- 'hint' => array(self::READ_VALUE, 'w:rFonts', 'w:hint'),
- 'size' => array(self::READ_SIZE, 'w:sz'),
- 'color' => array(self::READ_VALUE, 'w:color'),
- 'underline' => array(self::READ_VALUE, 'w:u'),
- 'bold' => array(self::READ_TRUE, 'w:b'),
- 'italic' => array(self::READ_TRUE, 'w:i'),
- 'strikethrough' => array(self::READ_TRUE, 'w:strike'),
- 'doubleStrikethrough' => array(self::READ_TRUE, 'w:dstrike'),
- 'smallCaps' => array(self::READ_TRUE, 'w:smallCaps'),
- 'allCaps' => array(self::READ_TRUE, 'w:caps'),
- 'superScript' => array(self::READ_EQUAL, 'w:vertAlign', 'w:val', 'superscript'),
- 'subScript' => array(self::READ_EQUAL, 'w:vertAlign', 'w:val', 'subscript'),
- 'fgColor' => array(self::READ_VALUE, 'w:highlight'),
- 'rtl' => array(self::READ_TRUE, 'w:rtl'),
- );
- return $this->readStyleDefs($xmlReader, $styleNode, $styleDefs);
- }
- /**
- * Read w:tblPr
- *
- * @param \PhpOffice\PhpWord\Shared\XMLReader $xmlReader
- * @param \DOMElement $domNode
- * @return string|array|null
- * @todo Capture w:tblStylePr w:type="firstRow"
- */
- protected function readTableStyle(XMLReader $xmlReader, \DOMElement $domNode)
- {
- $style = null;
- $margins = array('top', 'left', 'bottom', 'right');
- $borders = $margins + array('insideH', 'insideV');
- if ($xmlReader->elementExists('w:tblPr', $domNode)) {
- if ($xmlReader->elementExists('w:tblPr/w:tblStyle', $domNode)) {
- $style = $xmlReader->getAttribute('w:val', $domNode, 'w:tblPr/w:tblStyle');
- } else {
- $styleNode = $xmlReader->getElement('w:tblPr', $domNode);
- $styleDefs = array();
- // $styleDefs['styleName'] = array(self::READ_VALUE, 'w:tblStyle');
- foreach ($margins as $side) {
- $ucfSide = ucfirst($side);
- $styleDefs["cellMargin$ucfSide"] = array(self::READ_VALUE, "w:tblCellMar/w:$side", 'w:w');
- }
- foreach ($borders as $side) {
- $ucfSide = ucfirst($side);
- $styleDefs["border{$ucfSide}Size"] = array(self::READ_VALUE, "w:tblBorders/w:$side", 'w:sz');
- $styleDefs["border{$ucfSide}Color"] = array(self::READ_VALUE, "w:tblBorders/w:$side", 'w:color');
- }
- $style = $this->readStyleDefs($xmlReader, $styleNode, $styleDefs);
- }
- }
- return $style;
- }
- /**
- * Read w:tcPr
- *
- * @param \PhpOffice\PhpWord\Shared\XMLReader $xmlReader
- * @param \DOMElement $domNode
- * @return array
- */
- private function readCellStyle(XMLReader $xmlReader, \DOMElement $domNode)
- {
- $styleDefs = array(
- 'valign' => array(self::READ_VALUE, 'w:vAlign'),
- 'textDirection' => array(self::READ_VALUE, 'w:textDirection'),
- 'gridSpan' => array(self::READ_VALUE, 'w:gridSpan'),
- 'vMerge' => array(self::READ_VALUE, 'w:vMerge'),
- 'bgColor' => array(self::READ_VALUE, 'w:shd/w:fill'),
- );
- return $this->readStyleDefs($xmlReader, $domNode, $styleDefs);
- }
- /**
- * Read style definition
- *
- * @param \PhpOffice\PhpWord\Shared\XMLReader $xmlReader
- * @param \DOMElement $parentNode
- * @param array $styleDefs
- * @ignoreScrutinizerPatch
- * @return array
- */
- protected function readStyleDefs(XMLReader $xmlReader, \DOMElement $parentNode = null, $styleDefs = array())
- {
- $styles = array();
- foreach ($styleDefs as $styleProp => $styleVal) {
- @list($method, $element, $attribute, $expected) = $styleVal;
- if ($xmlReader->elementExists($element, $parentNode)) {
- $node = $xmlReader->getElement($element, $parentNode);
- // Use w:val as default if no attribute assigned
- $attribute = ($attribute === null) ? 'w:val' : $attribute;
- $attributeValue = $xmlReader->getAttribute($attribute, $node);
- $styleValue = $this->readStyleDef($method, $attributeValue, $expected);
- if ($styleValue !== null) {
- $styles[$styleProp] = $styleValue;
- }
- }
- }
- return $styles;
- }
- /**
- * Return style definition based on conversion method
- *
- * @param string $method
- * @ignoreScrutinizerPatch
- * @param mixed $attributeValue
- * @param mixed $expected
- * @return mixed
- */
- private function readStyleDef($method, $attributeValue, $expected)
- {
- $style = $attributeValue;
- if ($method == self::READ_SIZE) {
- $style = $attributeValue / 2;
- } elseif ($method == self::READ_TRUE) {
- $style = true;
- } elseif ($method == self::READ_FALSE) {
- $style = false;
- } elseif ($method == self::READ_EQUAL) {
- $style = $attributeValue == $expected;
- }
- return $style;
- }
- /**
- * Returns the target of image, object, or link as stored in ::readMainRels
- *
- * @param string $docPart
- * @param string $rID
- * @return string|null
- */
- private function getMediaTarget($docPart, $rID)
- {
- $target = null;
- if (isset($this->rels[$docPart]) && isset($this->rels[$docPart][$rID])) {
- $target = $this->rels[$docPart][$rID]['target'];
- }
- return $target;
- }
- }
|