init
This commit is contained in:
+534
@@ -0,0 +1,534 @@
|
||||
<?php
|
||||
declare(strict_types=1);
|
||||
|
||||
/**
|
||||
* CakePHP(tm) : Rapid Development Framework (https://cakephp.org)
|
||||
* Copyright (c) Cake Software Foundation, Inc. (https://cakefoundation.org)
|
||||
*
|
||||
* Licensed under The MIT License
|
||||
* For full copyright and license information, please see the LICENSE.txt
|
||||
* Redistributions of files must retain the above copyright notice.
|
||||
*
|
||||
* @copyright Copyright (c) Cake Software Foundation, Inc. (https://cakefoundation.org)
|
||||
* @link https://cakephp.org CakePHP(tm) Project
|
||||
* @since 0.10.3
|
||||
* @license https://opensource.org/licenses/mit-license.php MIT License
|
||||
*/
|
||||
namespace Cake\Utility;
|
||||
|
||||
use BackedEnum;
|
||||
use Cake\Core\Exception\CakeException;
|
||||
use Cake\Utility\Exception\XmlException;
|
||||
use Closure;
|
||||
use DOMDocument;
|
||||
use DOMElement;
|
||||
use DOMNode;
|
||||
use DOMText;
|
||||
use Exception;
|
||||
use SimpleXMLElement;
|
||||
use UnitEnum;
|
||||
|
||||
/**
|
||||
* XML handling for CakePHP.
|
||||
*
|
||||
* The methods in these classes enable the datasources that use XML to work.
|
||||
*/
|
||||
class Xml
|
||||
{
|
||||
/**
|
||||
* Initialize SimpleXMLElement or DOMDocument from a given XML string, file path, URL or array.
|
||||
*
|
||||
* ### Usage:
|
||||
*
|
||||
* Building XML from a string:
|
||||
*
|
||||
* ```
|
||||
* $xml = Xml::build('<example>text</example>');
|
||||
* ```
|
||||
*
|
||||
* Building XML from string (output DOMDocument):
|
||||
*
|
||||
* ```
|
||||
* $xml = Xml::build('<example>text</example>', ['return' => 'domdocument']);
|
||||
* ```
|
||||
*
|
||||
* Building XML from a file path:
|
||||
*
|
||||
* ```
|
||||
* $xml = Xml::build('/path/to/an/xml/file.xml', ['readFile' => true]);
|
||||
* ```
|
||||
*
|
||||
* Building XML from a remote URL:
|
||||
*
|
||||
* ```
|
||||
* use Cake\Http\Client;
|
||||
*
|
||||
* $http = new Client();
|
||||
* $response = $http->get('http://example.com/example.xml');
|
||||
* $xml = Xml::build($response->body());
|
||||
* ```
|
||||
*
|
||||
* Building from an array:
|
||||
*
|
||||
* ```
|
||||
* $value = [
|
||||
* 'tags' => [
|
||||
* 'tag' => [
|
||||
* [
|
||||
* 'id' => '1',
|
||||
* 'name' => 'defect'
|
||||
* ],
|
||||
* [
|
||||
* 'id' => '2',
|
||||
* 'name' => 'enhancement'
|
||||
* ]
|
||||
* ]
|
||||
* ]
|
||||
* ];
|
||||
* $xml = Xml::build($value);
|
||||
* ```
|
||||
*
|
||||
* When building XML from an array ensure that there is only one top level element.
|
||||
*
|
||||
* ### Options
|
||||
*
|
||||
* - `return` Can be 'simplexml' to return object of SimpleXMLElement or 'domdocument' to return DOMDocument.
|
||||
* - `loadEntities` Defaults to false. Set to true to enable loading of `<!ENTITY` definitions. This
|
||||
* is disabled by default for security reasons.
|
||||
* - `readFile` Set to true to enable file reading. This is disabled by default to prevent
|
||||
* local filesystem access. Only enable this setting when the input is safe.
|
||||
* - `parseHuge` Enable the `LIBXML_PARSEHUGE` flag.
|
||||
*
|
||||
* If using array as input, you can pass `options` from Xml::fromArray.
|
||||
*
|
||||
* @param object|array|string $input XML string, a path to a file, a URL or an array
|
||||
* @param array<string, mixed> $options The options to use
|
||||
* @return \SimpleXMLElement|\DOMDocument SimpleXMLElement or DOMDocument
|
||||
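* @throws \Cake\Utility\Exception\XmlException When the input cannot be read as XML.
* @throws \Cake\Core\Exception\CakeException When `readFile` is enabled and the file content cannot be read.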
|
||||
*/
|
||||
public static function build(object|array|string $input, array $options = []): SimpleXMLElement|DOMDocument
{
    // Caller-supplied options win; anything missing falls back to the safe defaults.
    $options += [
        'return' => 'simplexml',
        'loadEntities' => false,
        'readFile' => false,
        'parseHuge' => false,
    ];

    // Arrays and objects are converted instead of parsed.
    if (!is_string($input)) {
        return static::fromArray($input, $options);
    }

    // A string is only treated as a path when file reading was explicitly enabled.
    $isExistingFile = $options['readFile'] && file_exists($input);
    if ($isExistingFile) {
        $contents = file_get_contents($input);
        if ($contents === false) {
            throw new CakeException(sprintf('Cannot read file content of `%s`', $input));
        }

        return static::_loadXml($contents, $options);
    }

    // Without a `<` the string cannot contain markup, so it is rejected outright.
    if (!str_contains($input, '<')) {
        throw new XmlException('XML cannot be read.');
    }

    return static::_loadXml($input, $options);
}
|
||||
|
||||
/**
 * Parse an XML string and create either a SimpleXMLElement object or a DOMDocument.
 *
 * Parsing runs through Xml::load(), which prepares the libxml flags and wraps
 * exceptions raised while parsing in an XmlException.
 *
 * @param string $input The XML string to load.
 * @param array<string, mixed> $options The options to use. See Xml::build()
 * @return \SimpleXMLElement|\DOMDocument
 * @throws \Cake\Utility\Exception\XmlException When the input is empty or is not well-formed XML.
 */
protected static function _loadXml(string $input, array $options): SimpleXMLElement|DOMDocument
{
    return static::load(
        $input,
        $options,
        static function ($input, $options, $flags) {
            if ($options['return'] === 'simplexml' || $options['return'] === 'simplexmlelement') {
                $flags |= LIBXML_NOCDATA;

                return new SimpleXMLElement($input, $flags);
            }

            // DOMDocument::loadXML() reports malformed markup by returning false rather than
            // throwing, so the result has to be checked or callers receive an empty document.
            // Empty input is rejected first because loadXML() raises a ValueError for it,
            // which is not an Exception and would not be converted to an XmlException.
            $xml = new DOMDocument();
            if ($input === '' || $xml->loadXML($input, $flags) === false) {
                throw new XmlException('The input is not a well-formed XML document.');
            }

            return $xml;
        },
    );
}
|
||||
|
||||
/**
 * Parse the input html string and create either a SimpleXmlElement object or a DOMDocument.
 *
 * The markup is always parsed with DOMDocument::loadHTML(); when a SimpleXMLElement
 * is requested the parsed document is converted afterwards.
 *
 * @param string $input The input html string to load.
 * @param array<string, mixed> $options The options to use. See Xml::build()
 * @return \SimpleXMLElement|\DOMDocument
 * @throws \Cake\Utility\Exception\XmlException When the input is empty, cannot be parsed,
 *   or produces a document without a root element.
 */
public static function loadHtml(string $input, array $options = []): SimpleXMLElement|DOMDocument
{
    $options += [
        'return' => 'simplexml',
        'loadEntities' => false,
    ];

    return static::load(
        $input,
        $options,
        static function ($input, $options, $flags) {
            // loadHTML() raises a ValueError for an empty string and returns false on
            // failure; both are turned into an XmlException here.
            $xml = new DOMDocument();
            if ($input === '' || $xml->loadHTML($input, $flags) === false) {
                throw new XmlException('The input is not a parsable HTML document.');
            }

            if ($options['return'] !== 'simplexml' && $options['return'] !== 'simplexmlelement') {
                return $xml;
            }

            // simplexml_import_dom() returns null when there is no root element to import.
            // Returning that null would violate the declared return type with a TypeError.
            $element = $xml->documentElement === null ? null : simplexml_import_dom($xml);
            if ($element === null) {
                throw new XmlException('Failed converting DOMDocument to SimpleXMLElement');
            }

            return $element;
        },
    );
}
|
||||
|
||||
/**
 * Run a parsing closure with libxml configured from the given options.
 *
 * Builds the libxml flag mask (`parseHuge` => LIBXML_PARSEHUGE, `loadEntities` => LIBXML_NOENT),
 * switches libxml to internal error handling for the duration of the call, and restores
 * the previous setting afterwards. Any Exception thrown by the closure is wrapped in
 * an XmlException.
 *
 * @param string $input The input to load.
 * @param array<string, mixed> $options The options to use. See Xml::build()
 * @param \Closure $callable Closure that should return SimpleXMLElement or DOMDocument instance.
 *   It is called with the input, the options and the computed libxml flags.
 * @return \SimpleXMLElement|\DOMDocument
 * @throws \Cake\Utility\Exception\XmlException
 */
protected static function load(string $input, array $options, Closure $callable): SimpleXMLElement|DOMDocument
{
    // Xml::fromArray() matches the `return` option case-insensitively. Normalise it here
    // too so string input treats e.g. 'SimpleXML' the same way array input does.
    if (isset($options['return']) && is_string($options['return'])) {
        $options['return'] = strtolower($options['return']);
    }

    $flags = 0;
    if (!empty($options['parseHuge'])) {
        $flags |= LIBXML_PARSEHUGE;
    }
    // empty() keeps a missing `loadEntities` key from raising an undefined-index warning.
    if (!empty($options['loadEntities'])) {
        $flags |= LIBXML_NOENT;
    }

    $internalErrors = libxml_use_internal_errors(true);
    try {
        return $callable($input, $options, $flags);
    } catch (Exception $e) {
        throw new XmlException('Xml cannot be read. ' . $e->getMessage(), null, $e);
    } finally {
        // Always hand the libxml error mode back in the state it was found.
        libxml_use_internal_errors($internalErrors);
    }
}
|
||||
|
||||
/**
 * Transform an array into a SimpleXMLElement or DOMDocument.
 *
 * ### Options
 *
 * - `format` Whether non-array values become child elements ('tags') or attributes ('attributes').
 * - `pretty` Returns formatted Xml when set to `true`. Defaults to `false`
 * - `version` Version of XML document. Default is 1.0.
 * - `encoding` Encoding of XML document. If null, the encoding is left out of the XML header.
 *    Defaults to `mb_internal_encoding()`.
 * - `return` Whether to return a SimpleXMLElement ('simplexml')
 *    or a DOMDocument ('domdocument'). Matched case-insensitively. Default is SimpleXMLElement.
 *
 * Using the following data:
 *
 * ```
 * $value = [
 *    'root' => [
 *        'tag' => [
 *            'id' => 1,
 *            'value' => 'defect',
 *            '@' => 'description'
 *         ]
 *     ]
 * ];
 * ```
 *
 * Calling `Xml::fromArray($value, ['format' => 'tags']);` Will generate:
 *
 * `<root><tag>description<id>1</id><value>defect</value></tag></root>`
 *
 * And calling `Xml::fromArray($value, ['format' => 'attributes']);` Will generate:
 *
 * `<root><tag id="1" value="defect">description</tag></root>`
 *
 * @param object|array $input Array with data, or an object exposing a callable `toArray()` method.
 * @param array<string, mixed> $options The options to use.
 * @return \SimpleXMLElement|\DOMDocument SimpleXMLElement or DOMDocument
 * @throws \Cake\Utility\Exception\XmlException When the input is not a single-root array,
 *   the root key is an integer, or the generated document is not valid XML.
 */
public static function fromArray(object|array $input, array $options = []): SimpleXMLElement|DOMDocument
{
    // @phpstan-ignore function.alreadyNarrowedType (is_callable check for visibility)
    if (is_object($input) && method_exists($input, 'toArray') && is_callable([$input, 'toArray'])) {
        $input = $input->toArray();
    }
    if (!is_array($input) || count($input) !== 1) {
        throw new XmlException(
            'Invalid input of type `' . gettype($input) . '`'
            . (is_array($input) ? ' (Count of ' . count($input) . ')' : '') . '.',
        );
    }
    $key = key($input);
    if (is_int($key)) {
        throw new XmlException('The key of input must be alphanumeric');
    }

    $defaults = [
        'format' => 'tags',
        'version' => '1.0',
        'encoding' => mb_internal_encoding(),
        'return' => 'simplexml',
        'pretty' => false,
    ];
    $options += $defaults;

    // A null encoding is documented as "leave it out of the header". DOMDocument only
    // accepts a string, and an empty string has exactly that effect.
    $dom = new DOMDocument($options['version'], $options['encoding'] ?? '');
    if ($options['pretty']) {
        $dom->formatOutput = true;
    }
    self::_fromArray($dom, $dom, $input, $options['format']);

    $options['return'] = strtolower($options['return']);
    if ($options['return'] !== 'simplexml' && $options['return'] !== 'simplexmlelement') {
        return $dom;
    }

    $xmlString = (string)$dom->saveXML();

    // Validate the generated markup with libxml errors collected internally, then restore
    // the previous error mode so this call does not change global libxml state.
    $previousErrorMode = libxml_use_internal_errors(true);
    try {
        $check = new DOMDocument();
        if (!$check->loadXML($xmlString, LIBXML_NOWARNING | LIBXML_NOERROR)) {
            $messages = [];
            foreach (libxml_get_errors() as $error) {
                $messages[] = trim(sprintf(
                    'File: %s, Line %d, Column %d: %s',
                    $error->file ?: '[string input]',
                    $error->line,
                    $error->column,
                    $error->message,
                ));
            }
            libxml_clear_errors();

            throw new XmlException("Invalid XML string:\n" . implode("\n", $messages));
        }
    } finally {
        libxml_use_internal_errors($previousErrorMode);
    }

    return new SimpleXMLElement($xmlString);
}
|
||||
|
||||
/**
 * Recursive method to create children from array
 *
 * String keys with array values become child elements (one per item when the array
 * has only numeric keys). String keys with non-array values become either a child element
 * or an attribute, depending on `$format` and on whether the key starts with `@`.
 * Keys containing `xmlns:` are written as namespace declarations.
 *
 * @param \DOMDocument $dom Handler to DOMDocument
 * @param \DOMDocument|\DOMElement $node Handler to DOMElement (child)
 * @param mixed $data Array of data to append to the $node. Anything else is ignored.
 * @param string $format Either 'attributes' or 'tags'. This determines where nested keys go.
 * @return void
 * @throws \Cake\Utility\Exception\XmlException When a key is not a string, or an `@` key holds an array.
 */
protected static function _fromArray(
    DOMDocument $dom,
    DOMDocument|DOMElement $node,
    mixed $data,
    string $format,
): void {
    if (!$data || !is_array($data)) {
        return;
    }
    foreach ($data as $key => $value) {
        if (!is_string($key)) {
            throw new XmlException('Invalid array');
        }
        // @phpstan-ignore function.alreadyNarrowedType (is_callable check for visibility)
        if (is_object($value) && method_exists($value, 'toArray') && is_callable([$value, 'toArray'])) {
            $value = $value->toArray();
        }

        if (is_array($value)) {
            if (str_starts_with($key, '@')) {
                throw new XmlException('Invalid array');
            }
            if (is_numeric(implode('', array_keys($value)))) {
                // List: one child element named $key per item.
                foreach ($value as $item) {
                    static::_createChild([
                        'dom' => $dom,
                        'node' => $node,
                        'key' => $key,
                        'format' => $format,
                        'value' => $item,
                    ]);
                }
            } else {
                // Struct: a single child element holding the nested data.
                static::_createChild(compact('dom', 'node', 'key', 'value', 'format'));
            }
            continue;
        }

        // Reduce the value to something castable to string before choosing where it goes.
        // Enums are unwrapped here, not only in the 'tags' branch, because casting an enum
        // case to string is an Error and would break attributes and namespace declarations.
        if (is_bool($value)) {
            $value = (int)$value;
        } elseif ($value === null) {
            $value = '';
        } elseif ($value instanceof BackedEnum) {
            $value = (string)$value->value;
        } elseif ($value instanceof UnitEnum) {
            $value = $value->name;
        }

        if (str_contains($key, 'xmlns:')) {
            assert($node instanceof DOMElement);
            $node->setAttributeNS('http://www.w3.org/2000/xmlns/', $key, (string)$value);
            continue;
        }

        if (!str_starts_with($key, '@') && $format === 'tags') {
            if (!is_numeric($value)) {
                // Escape special characters
                // https://www.w3.org/TR/REC-xml/#syntax
                // https://bugs.php.net/bug.php?id=36795
                $child = $dom->createElement($key, '');
                $child->appendChild(new DOMText((string)$value));
            } else {
                $child = $dom->createElement($key, (string)$value);
            }
            $node->appendChild($child);
            continue;
        }

        // Attribute: strip the leading `@` marker, if any, from the name.
        if (str_starts_with($key, '@')) {
            $key = substr($key, 1);
        }
        $attribute = $dom->createAttribute($key);
        $attribute->appendChild($dom->createTextNode((string)$value));
        $node->appendChild($attribute);
    }
}
|
||||
|
||||
/**
 * Helper to _fromArray(). It will create children of arrays
 *
 * Creates one element named `key`, fills it from `value` and appends it to `node`.
 * For array values the `@` entry becomes the element text and the `xmlns:` entry becomes
 * its `xmlns` attribute; the remaining entries are handed back to _fromArray().
 *
 * @param array<string, mixed> $data Array with information to create children
 * @return void
 * @phpstan-param array{dom: \DOMDocument, node: \DOMNode, key: string, format: string, value?: mixed} $data
 */
protected static function _createChild(array $data): void
{
    $data += [
        'value' => null,
    ];

    $key = $data['key'];
    $format = $data['format'];
    $value = $data['value'];
    $dom = $data['dom'];
    $node = $data['node'];
    $childNS = null;
    $childValue = null;

    // Enum cases cannot be cast to string, so they are unwrapped to their backing value
    // (or case name for pure enums), matching how _fromArray() treats enum values.
    $unwrapEnum = static function (mixed $item): mixed {
        if ($item instanceof BackedEnum) {
            return $item->value;
        }
        if ($item instanceof UnitEnum) {
            return $item->name;
        }

        return $item;
    };

    // @phpstan-ignore function.alreadyNarrowedType (is_callable check for visibility)
    if (is_object($value) && method_exists($value, 'toArray') && is_callable([$value, 'toArray'])) {
        $value = $value->toArray();
    }
    $value = $unwrapEnum($value);

    if (is_array($value)) {
        if (isset($value['@'])) {
            $childValue = (string)$unwrapEnum($value['@']);
            unset($value['@']);
        }
        if (isset($value['xmlns:'])) {
            $childNS = $value['xmlns:'];
            unset($value['xmlns:']);
        }
    } elseif ($value || $value === 0 || $value === '0') {
        // Zero is falsy but is still meaningful content.
        $childValue = (string)$value;
    }

    $child = $dom->createElement($key);
    if ($childValue !== null) {
        $child->appendChild($dom->createTextNode($childValue));
    }
    if ($childNS) {
        $child->setAttribute('xmlns', $childNS);
    }

    static::_fromArray($dom, $child, $value, $format);
    $node->appendChild($child);
}
|
||||
|
||||
/**
 * Returns this XML structure as an array.
 *
 * DOM nodes are converted to SimpleXMLElement first; the conversion of the tree itself
 * is delegated to Xml::_toArray().
 *
 * @param \SimpleXMLElement|\DOMNode $obj SimpleXMLElement, DOMNode instance
 * @return array Array representation of the XML structure.
 * @throws \Cake\Utility\Exception\XmlException When a DOMNode cannot be converted to SimpleXMLElement.
 */
public static function toArray(SimpleXMLElement|DOMNode $obj): array
{
    $element = $obj instanceof DOMNode ? simplexml_import_dom($obj) : $obj;
    if ($element === null) {
        throw new XmlException('Failed converting DOMNode to SimpleXMLElement');
    }

    // The empty prefix is always included so un-prefixed attributes and children are visited.
    $prefixes = array_keys(array_merge(['' => ''], $element->getNamespaces(true)));

    $result = [];
    static::_toArray($element, $result, '', $prefixes);

    return $result;
}
|
||||
|
||||
/**
 * Recursive method to toArray
 *
 * Collects the attributes (as `@name` keys) and child elements of `$xml` for every given
 * namespace prefix, then stores the result in `$parentData` under the element's
 * (prefixed) name. Repeated element names are gathered into a list.
 *
 * @param \SimpleXMLElement $xml SimpleXMLElement object
 * @param array<string, mixed> $parentData Parent array with data
 * @param string $ns Namespace of current child
 * @param array<string> $namespaces List of namespaces in XML
 * @return void
 */
protected static function _toArray(SimpleXMLElement $xml, array &$parentData, string $ns, array $namespaces): void
{
    $data = [];

    foreach ($namespaces as $namespace) {
        $attributePrefix = $namespace ? $namespace . ':' : '';
        foreach ($xml->attributes($namespace, true) as $attributeName => $attributeValue) {
            $data['@' . $attributePrefix . $attributeName] = (string)$attributeValue;
        }

        foreach ($xml->children($namespace, true) as $child) {
            static::_toArray($child, $data, $namespace, $namespaces);
        }
    }

    // An element without attributes or children collapses to its text;
    // otherwise non-empty text is kept under the `@` key.
    $text = trim((string)$xml);
    if (!$data) {
        $data = $text;
    } elseif ($text !== '') {
        $data['@'] = $text;
    }

    $name = ($ns ? $ns . ':' : '') . $xml->getName();
    if (!isset($parentData[$name])) {
        $parentData[$name] = $data;

        return;
    }

    // Second occurrence of the name: turn the existing single entry into a list first.
    if (!is_array($parentData[$name]) || !isset($parentData[$name][0])) {
        $parentData[$name] = [$parentData[$name]];
    }
    $parentData[$name][] = $data;
}
|
||||
}
|
||||
Reference in New Issue
Block a user