PortableInfobox/services/Parser/XmlParser.php
2015-06-10 14:51:07 +02:00

158 lines
3.9 KiB
PHP

<?php
namespace Wikia\PortableInfobox\Parser;
class XmlParser {
protected $infoboxData;
protected $externalParser;
protected $xmlParseErrors;
public function __construct( $infoboxData ) {
$this->infoboxData = $infoboxData;
}
/**
* @return mixed
*/
public function getXmlParseErrors() {
return $this->xmlParseErrors;
}
/**
* @param mixed $xmlParseErrors
*/
public function setXmlParseErrors( $xmlParseErrors ) {
$this->xmlParseErrors = $xmlParseErrors;
}
/**
* @return mixed
*/
public function getExternalParser() {
return $this->externalParser;
}
/**
* @param mixed $externalParser
*/
public function setExternalParser( ExternalParser $externalParser ) {
$this->externalParser = $externalParser;
}
/**
* @param \SimpleXMLElement $xmlIterable
* @return array
*/
public function getDataFromNodes( \SimpleXMLElement $xmlIterable, $parentNode = null ) {
wfProfileIn(__METHOD__);
$data = [ ];
foreach ( $xmlIterable as $node ) {
$nodeHandler = $this->getNode( $node, $parentNode );
$nodeData = $nodeHandler->getData();
// add data if node is not empty or - when node can not be ignored when empty
if ( !$nodeHandler->isEmpty( $nodeData ) || !$nodeHandler->ignoreNodeWhenEmpty() ) {
$data[ ] = [
'type' => $nodeHandler->getType(),
'data' => $nodeData,
'isEmpty' => $nodeHandler->isEmpty( $nodeData )
];
}
}
wfProfileOut(__METHOD__);
return $data;
}
/**
* @param $xmlString
* @return array
* @throws XmlMarkupParseErrorException
*/
public function getDataFromXmlString( $xmlString ) {
wfProfileIn( __METHOD__ );
$xml = $this->parseXmlString( $xmlString );
$data = $this->getDataFromNodes( $xml );
wfProfileOut( __METHOD__ );
return $data;
}
public function getInfoboxParams( $xmlString ) {
$xml = $this->parseXmlString( $xmlString );
$result = [];
foreach ( $xml->attributes() as $k => $v ) {
$result[$k] = (string) $v;
}
return $result;
}
protected function logXmlParseError( $level, $code, $message ) {
\Wikia\Logger\WikiaLogger::instance()->info( "PortableInfobox XML Parser problem", [
"level" => $level,
"code" => $code,
"message" => $message ] );
}
/**
* @param \SimpleXMLElement $xmlNode
* @param Node $parent
* @return \Wikia\PortableInfobox\Parser\Nodes\Node
*/
public function getNode( \SimpleXMLElement $xmlNode, $parent = null ) {
wfProfileIn(__METHOD__);
$tagType = $xmlNode->getName();
$className = 'Wikia\\PortableInfobox\\Parser\\Nodes\\' . 'Node' . ucfirst( strtolower( $tagType ) );
if ( class_exists( $className ) ) {
/* @var $instance \Wikia\PortableInfobox\Parser\Nodes\Node */
$instance = new $className( $xmlNode, $this->infoboxData );
if ( !empty( $this->externalParser ) ) {
$instance->setExternalParser( $this->externalParser );
}
if ( $parent ) {
$instance->setParent( $parent );
}
wfProfileOut( __METHOD__ );
return $instance;
}
wfProfileOut( __METHOD__ );
return new Nodes\NodeUnimplemented( $xmlNode, $this->infoboxData );
}
/**
* @param $xmlString
* @return \SimpleXMLElement
* @throws XmlMarkupParseErrorException
*/
protected function parseXmlString( $xmlString ) {
$global_libxml_setting = libxml_use_internal_errors();
libxml_use_internal_errors( true );
$xml = simplexml_load_string( $xmlString );
$errors = libxml_get_errors();
libxml_use_internal_errors( $global_libxml_setting );
if ( $xml === false ) {
foreach ( $errors as $xmlerror ) {
$this->logXmlParseError( $xmlerror->level, $xmlerror->code, trim( $xmlerror->message ) );
}
libxml_clear_errors();
$this->setXmlParseErrors( $errors );
throw new XmlMarkupParseErrorException( $this->getXmlParseErrors() );
}
return $xml;
}
}
class XmlMarkupParseErrorException extends \Exception {
private $errors;
public function __construct( $errors ) {
$this->errors = $errors;
return parent::__construct();
}
public function getErrors() {
return $this->errors;
}
}