From bf402949989293efa8f86d382b247528b001f414 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Stefan=20B=C3=BCrk?= Date: Mon, 31 Jul 2023 11:49:06 +0200 Subject: [PATCH] [BUGFIX] Ensure nested `w:sdt -> w:sdtContent` node parsing for Document Nodes can be nested or directly provided for the document structure. Until now, the `sdt->sdtContent` wrapping have not been respected. This change moves the node parsing for a document to a dedicated method and make it recursivly callable to unnest the wrapped node. --- src/PhpWord/Reader/Word2007/Document.php | 29 ++++++++++++++++++++---- 1 file changed, 24 insertions(+), 5 deletions(-) diff --git a/src/PhpWord/Reader/Word2007/Document.php b/src/PhpWord/Reader/Word2007/Document.php index da42bddc9e..8571a477c6 100644 --- a/src/PhpWord/Reader/Word2007/Document.php +++ b/src/PhpWord/Reader/Word2007/Document.php @@ -18,6 +18,7 @@ namespace PhpOffice\PhpWord\Reader\Word2007; use DOMElement; +use DOMNode; use PhpOffice\PhpWord\Element\Section; use PhpOffice\PhpWord\PhpWord; use PhpOffice\PhpWord\Shared\XMLReader; @@ -46,15 +47,33 @@ public function read(PhpWord $phpWord): void $this->phpWord = $phpWord; $xmlReader = new XMLReader(); $xmlReader->getDomFromZip($this->docFile, $this->xmlFile); - $readMethods = ['w:p' => 'readWPNode', 'w:tbl' => 'readTable', 'w:sectPr' => 'readWSectPrNode']; - $nodes = $xmlReader->getElements('w:body/*'); if ($nodes->length > 0) { $section = $this->phpWord->addSection(); foreach ($nodes as $node) { - if (isset($readMethods[$node->nodeName])) { - $readMethod = $readMethods[$node->nodeName]; - $this->$readMethod($xmlReader, $node, $section); + $this->readNode($phpWord, $xmlReader, $node, $section); + } + } + } + + private function readNode(PhpWord $phpWord, XMLReader $xmlReader, DOMNode $node, Section $section): void + { + $readMethods = ['w:p' => 'readWPNode', 'w:tbl' => 'readTable', 'w:sectPr' => 'readWSectPrNode']; + if (isset($readMethods[$node->nodeName])) { + $readMethod = $readMethods[$node->nodeName]; + $this->$readMethod($xmlReader, $node, $section); + } elseif ($node->nodeName === 'w:sdt' && $node instanceof DOMElement) { + $nodes = $xmlReader->getElements('w:sdtContent/*', $node); + if ($nodes->length > 0) { + foreach ($nodes as $subNode) { + $this->readNode($phpWord, $xmlReader, $subNode, $section); + } + } + } elseif ($node->nodeName === 'w:sdtContent' && $node instanceof DOMElement) { + $nodes = $xmlReader->getElements('*', $node); + if ($nodes->length > 0) { + foreach ($nodes as $subNode) { + $this->readNode($phpWord, $xmlReader, $subNode, $section); } } }