' ', self::XML_NODE_TEXT_TAB => "\t", self::XML_NODE_TEXT_LINE_BREAK => "\n", ]; /** * @param bool $shouldFormatDates Whether date/time values should be returned as PHP objects or be formatted as strings * @param \OpenSpout\Common\Helper\Escaper\ODS $escaper Used to unescape XML data */ public function __construct($shouldFormatDates, $escaper) { $this->shouldFormatDates = $shouldFormatDates; $this->escaper = $escaper; } /** * Returns the (unescaped) correctly marshalled, cell value associated to the given XML node. * * @see http://docs.oasis-open.org/office/v1.2/os/OpenDocument-v1.2-os-part1.html#refTable13 * * @param \DOMElement $node * * @throws InvalidValueException If the node value is not valid * * @return bool|\DateInterval|\DateTime|float|int|string The value associated with the cell, empty string if cell's type is void/undefined */ public function extractAndFormatNodeValue($node) { $cellType = $node->getAttribute(self::XML_ATTRIBUTE_TYPE); switch ($cellType) { case self::CELL_TYPE_STRING: return $this->formatStringCellValue($node); case self::CELL_TYPE_FLOAT: return $this->formatFloatCellValue($node); case self::CELL_TYPE_BOOLEAN: return $this->formatBooleanCellValue($node); case self::CELL_TYPE_DATE: return $this->formatDateCellValue($node); case self::CELL_TYPE_TIME: return $this->formatTimeCellValue($node); case self::CELL_TYPE_CURRENCY: return $this->formatCurrencyCellValue($node); case self::CELL_TYPE_PERCENTAGE: return $this->formatPercentageCellValue($node); case self::CELL_TYPE_VOID: default: return ''; } } /** * Returns the cell String value. * * @param \DOMElement $node * * @return string The value associated with the cell */ protected function formatStringCellValue($node) { $pNodeValues = []; $pNodes = $node->getElementsByTagName(self::XML_NODE_P); foreach ($pNodes as $pNode) { $pNodeValues[] = $this->extractTextValueFromNode($pNode); } $escapedCellValue = implode("\n", $pNodeValues); return $this->escaper->unescape($escapedCellValue); } /** * Returns the cell Numeric value from the given node. * * @param \DOMElement $node * * @return float|int The value associated with the cell */ protected function formatFloatCellValue($node) { $nodeValue = $node->getAttribute(self::XML_ATTRIBUTE_VALUE); $nodeIntValue = (int) $nodeValue; $nodeFloatValue = (float) $nodeValue; return ((float) $nodeIntValue === $nodeFloatValue) ? $nodeIntValue : $nodeFloatValue; } /** * Returns the cell Boolean value from the given node. * * @param \DOMElement $node * * @return bool The value associated with the cell */ protected function formatBooleanCellValue($node) { $nodeValue = $node->getAttribute(self::XML_ATTRIBUTE_BOOLEAN_VALUE); return (bool) $nodeValue; } /** * Returns the cell Date value from the given node. * * @param \DOMElement $node * * @throws InvalidValueException If the value is not a valid date * * @return \DateTime|string The value associated with the cell */ protected function formatDateCellValue($node) { // The XML node looks like this: // // 05/19/16 04:39 PM // if ($this->shouldFormatDates) { // The date is already formatted in the "p" tag $nodeWithValueAlreadyFormatted = $node->getElementsByTagName(self::XML_NODE_P)->item(0); $cellValue = $nodeWithValueAlreadyFormatted->nodeValue; } else { // otherwise, get it from the "date-value" attribute $nodeValue = $node->getAttribute(self::XML_ATTRIBUTE_DATE_VALUE); try { $cellValue = new \DateTime($nodeValue); } catch (\Exception $e) { throw new InvalidValueException($nodeValue); } } return $cellValue; } /** * Returns the cell Time value from the given node. * * @param \DOMElement $node * * @throws InvalidValueException If the value is not a valid time * * @return \DateInterval|string The value associated with the cell */ protected function formatTimeCellValue($node) { // The XML node looks like this: // // 01:24:00 PM // if ($this->shouldFormatDates) { // The date is already formatted in the "p" tag $nodeWithValueAlreadyFormatted = $node->getElementsByTagName(self::XML_NODE_P)->item(0); $cellValue = $nodeWithValueAlreadyFormatted->nodeValue; } else { // otherwise, get it from the "time-value" attribute $nodeValue = $node->getAttribute(self::XML_ATTRIBUTE_TIME_VALUE); try { $cellValue = new \DateInterval($nodeValue); } catch (\Exception $e) { throw new InvalidValueException($nodeValue); } } return $cellValue; } /** * Returns the cell Currency value from the given node. * * @param \DOMElement $node * * @return string The value associated with the cell (e.g. "100 USD" or "9.99 EUR") */ protected function formatCurrencyCellValue($node) { $value = $node->getAttribute(self::XML_ATTRIBUTE_VALUE); $currency = $node->getAttribute(self::XML_ATTRIBUTE_CURRENCY); return "{$value} {$currency}"; } /** * Returns the cell Percentage value from the given node. * * @param \DOMElement $node * * @return float|int The value associated with the cell */ protected function formatPercentageCellValue($node) { // percentages are formatted like floats return $this->formatFloatCellValue($node); } /** * @param \DOMNode $pNode * * @return string */ private function extractTextValueFromNode($pNode) { $textValue = ''; foreach ($pNode->childNodes as $childNode) { if ($childNode instanceof \DOMText) { $textValue .= $childNode->nodeValue; } elseif ($this->isWhitespaceNode($childNode->nodeName)) { $textValue .= $this->transformWhitespaceNode($childNode); } elseif (self::XML_NODE_TEXT_A === $childNode->nodeName || self::XML_NODE_TEXT_SPAN === $childNode->nodeName) { $textValue .= $this->extractTextValueFromNode($childNode); } } return $textValue; } /** * Returns whether the given node is a whitespace node. It must be one of these: * - * - * - . * * @param string $nodeName * * @return bool */ private function isWhitespaceNode($nodeName) { return isset(self::$WHITESPACE_XML_NODES[$nodeName]); } /** * The "" node can contain the string value directly * or contain child elements. In this case, whitespaces contain in * the child elements should be replaced by their XML equivalent: * - space => * - tab => * - line break => . * * @see https://docs.oasis-open.org/office/v1.2/os/OpenDocument-v1.2-os-part1.html#__RefHeading__1415200_253892949 * * @param \DOMElement $node The XML node representing a whitespace * * @return string The corresponding whitespace value */ private function transformWhitespaceNode($node) { $countAttribute = $node->getAttribute(self::XML_ATTRIBUTE_C); // only defined for "" $numWhitespaces = (!empty($countAttribute)) ? (int) $countAttribute : 1; return str_repeat(self::$WHITESPACE_XML_NODES[$node->nodeName], $numWhitespaces); } }