PortableInfobox/services/Parser/Nodes/Node.php

285 lines
7.5 KiB
PHP
Raw Normal View History

<?php
namespace Wikia\PortableInfobox\Parser\Nodes;
use Wikia\PortableInfobox\Parser\ExternalParser;
use Wikia\PortableInfobox\Parser\SimpleParser;
/**
 * Base node of a portable infobox XML tree.
 *
 * Wraps a single SimpleXMLElement together with the infobox parameters
 * supplied by the caller and exposes:
 *  - the template parameters ("sources") the node reads,
 *  - the data extracted for rendering,
 *  - helpers shared by the more specific node types.
 */
class Node {
	/** Name of the XML attribute that holds the primary source parameter. */
	const DATA_SRC_ATTR_NAME = 'source';
	/** Name of the child tag holding the fallback value. */
	const DEFAULT_TAG_NAME = 'default';
	/** Name of the child tag holding the formatting template. */
	const FORMAT_TAG_NAME = 'format';
	/** Name of the child tag holding the label. */
	const LABEL_TAG_NAME = 'label';
	/** Captures the parameter name out of a `{{{name|fallback}}}` variable. */
	const EXTRACT_SOURCE_REGEX = '/{{{([^\|}]*?)\|?.*}}}/sU';

	/**
	 * @var \SimpleXMLElement XML element wrapped by this node
	 */
	protected $xmlNode;

	/**
	 * @var Node[]|null lazily built list of child nodes
	 */
	protected $children;

	/**
	 * @var array|null memoized result of getSources()
	 */
	protected $cachedSources = null;

	/**
	 * @var array|null memoized result of getData()
	 */
	protected $data = null;

	/**
	 * Infobox parameters, looked up by source name.
	 *
	 * Declared explicitly because creating it on the fly in the constructor
	 * is a dynamic property (deprecated since PHP 8.2). It stays public since
	 * that is the visibility the dynamically created property always had.
	 *
	 * @var mixed
	 */
	public $infoboxData;

	/**
	 * @var $externalParser ExternalParser
	 */
	protected $externalParser;

	/**
	 * @param \SimpleXMLElement $xmlNode XML element to wrap
	 * @param mixed $infoboxData infobox parameters, read via array access by source name
	 */
	public function __construct( \SimpleXMLElement $xmlNode, $infoboxData ) {
		$this->xmlNode = $xmlNode;
		$this->infoboxData = $infoboxData;
	}

	/**
	 * Get the names of all parameters this node reads. The result is computed
	 * once and memoized.
	 *
	 * @return array
	 */
	public function getSources() {
		if ( $this->cachedSources === null ) {
			$this->cachedSources = $this->extractSourcesFromNode( $this->xmlNode );
		}

		return $this->cachedSources;
	}

	/**
	 * Describe every source of this node.
	 *
	 * Each source gets a 'label' entry: the tag-stripped label when the node
	 * has a single source, "<label> (<source>)" when it has several (or an
	 * empty string when there is no label to disambiguate). The source taken
	 * from the `source` attribute is additionally flagged as 'primary'.
	 *
	 * @return array map of source name => metadata
	 */
	public function getSourcesMetadata() {
		$sources = $this->getSources();
		$sourcesCount = count( $sources );
		$baseLabel = \Sanitizer::stripAllTags(
			$this->getInnerValue( $this->xmlNode->{self::LABEL_TAG_NAME} )
		);

		$metadata = [ ];
		foreach ( $sources as $source ) {
			if ( $sourcesCount > 1 ) {
				$label = !empty( $baseLabel ) ? "{$baseLabel} ({$source})" : '';
			} else {
				$label = $baseLabel;
			}
			$metadata[ $source ] = [ 'label' => $label ];
		}

		if ( $sourcesCount > 0 && $this->hasPrimarySource( $this->xmlNode ) ) {
			// self::extractSourcesFromNode() puts the value of the `source` attribute
			// as the first element of $sources
			$primarySource = reset( $sources );
			$metadata[ $primarySource ][ 'primary' ] = true;
		}

		return $metadata;
	}

	/**
	 * Collect metadata for all child nodes. Groups are described recursively,
	 * every other node type by its sources metadata.
	 *
	 * @return array
	 */
	public function getMetadata() {
		$result = [ ];

		/** @var Node $item */
		foreach ( $this->getChildNodes() as $item ) {
			$type = $item->getType();
			$entry = [ 'type' => $type ];

			if ( $type === 'group' ) {
				$entry[ 'metadata' ] = $item->getMetadata();
			} else {
				$entry[ 'sources' ] = $item->getSourcesMetadata();
			}

			$result[] = $entry;
		}

		return $result;
	}

	/**
	 * Get the parser used for wikitext values; a SimpleParser is created
	 * on first use when none was injected.
	 *
	 * @return ExternalParser
	 */
	public function getExternalParser() {
		if ( !isset( $this->externalParser ) ) {
			$this->setExternalParser( new SimpleParser() );
		}

		return $this->externalParser;
	}

	/**
	 * @param ExternalParser|null $externalParser
	 *
	 * @return $this
	 */
	public function setExternalParser( $externalParser ) {
		// we can pass anything, and ignore it if not ExternalParser instance
		// we use builder pattern here, for fluently passing external parser to children nodes,
		// type hinting was removed to prevent catchable fatal error appearing
		if ( $externalParser instanceof ExternalParser ) {
			$this->externalParser = $externalParser;
		}

		return $this;
	}

	/**
	 * Node type generation is based on XML tag name.
	 * It's worth remembering that SimpleXMLElement::getName is case-sensitive
	 * ( "<Data>" != "<data>" ), so the type is normalized with mb_strtolower.
	 *
	 * @return string
	 */
	public function getType() {
		return mb_strtolower( $this->xmlNode->getName() );
	}

	/**
	 * Case-insensitive check of the node type.
	 *
	 * @param string $type
	 *
	 * @return bool
	 */
	public function isType( $type ) {
		return $this->getType() === mb_strtolower( $type );
	}

	/**
	 * Get node data; for the base node this is the text content of the XML
	 * element. The result is memoized.
	 *
	 * @return array
	 */
	public function getData() {
		if ( !isset( $this->data ) ) {
			$this->data = [ 'value' => (string)$this->xmlNode ];
		}

		return $this->data;
	}

	/**
	 * @return array node type together with its data
	 */
	public function getRenderData() {
		return [
			'type' => $this->getType(),
			'data' => $this->getData(),
		];
	}

	/**
	 * @desc Check if node is empty.
	 * Note that a '0' value cannot be treated like a null
	 *
	 * @return bool
	 */
	public function isEmpty() {
		$data = $this->getData()[ 'value' ];

		// loose comparison kept on purpose: both '0' and integer 0 count as content
		return ( empty( $data ) && $data != '0' );
	}

	/**
	 * Build (once) and return nodes for all direct XML children. The parser
	 * currently set on this node, if any, is handed over to every child.
	 *
	 * @return Node[]
	 */
	protected function getChildNodes() {
		if ( !isset( $this->children ) ) {
			$this->children = [ ];
			foreach ( $this->xmlNode as $child ) {
				$this->children[] = NodeFactory::newFromSimpleXml( $child, $this->infoboxData )
					->setExternalParser( $this->externalParser );
			}
		}

		return $this->children;
	}

	/**
	 * @return array type, data, emptiness flag and sources of every child node
	 */
	protected function getDataForChildren() {
		return array_map(
			function ( Node $item ) {
				return [
					'type' => $item->getType(),
					'data' => $item->getData(),
					'isEmpty' => $item->isEmpty(),
					'source' => $item->getSources()
				];
			},
			$this->getChildNodes()
		);
	}

	/**
	 * @return array render data of all non-empty child nodes, as a list
	 */
	protected function getRenderDataForChildren() {
		$nonEmptyChildren = array_filter( $this->getChildNodes(), function ( Node $item ) {
			return !$item->isEmpty();
		} );

		$renderData = array_map( function ( Node $item ) {
			return $item->getRenderData();
		}, $nonEmptyChildren );

		// rebase keys
		return array_values( $renderData );
	}

	/**
	 * @return array unique sources of all child nodes, as a list
	 */
	protected function getSourcesForChildren() {
		$result = [ ];

		/** @var Node $item */
		foreach ( $this->getChildNodes() as $item ) {
			$result = array_merge( $result, $item->getSources() );
		}

		return array_values( array_unique( $result ) );
	}

	/**
	 * Resolve the node value: the parsed source value, the parsed <default>
	 * content when no value was supplied, or the parsed <format> content when
	 * a value was supplied and a format is defined.
	 *
	 * @param \SimpleXMLElement $xmlNode
	 *
	 * @return mixed
	 */
	protected function getValueWithDefault( \SimpleXMLElement $xmlNode ) {
		$value = $this->extractDataFromSource( $xmlNode );
		// '0' is a legitimate value and must not be replaced by the default
		$hasValue = self::isPresentValue( $value );

		if ( !$hasValue && $xmlNode->{self::DEFAULT_TAG_NAME} ) {
			return $this->getInnerValue( $xmlNode->{self::DEFAULT_TAG_NAME} );
		}
		if ( $hasValue && $xmlNode->{self::FORMAT_TAG_NAME} ) {
			return $this->getInnerValue( $xmlNode->{self::FORMAT_TAG_NAME} );
		}

		return $value;
	}

	/**
	 * Like getValueWithDefault(), but without parsing the source value: the
	 * raw infobox parameter is returned, falling back to the <default> content
	 * with only its variables replaced.
	 *
	 * @param \SimpleXMLElement $xmlNode
	 *
	 * @return mixed
	 */
	protected function getRawValueWithDefault( \SimpleXMLElement $xmlNode ) {
		$source = $this->getXmlAttribute( $xmlNode, self::DATA_SRC_ATTR_NAME );
		$value = $this->getRawInfoboxData( $source );

		if ( !self::isPresentValue( $value ) && $xmlNode->{self::DEFAULT_TAG_NAME} ) {
			$value = $this->getExternalParser()->replaceVariables(
				(string)$xmlNode->{self::DEFAULT_TAG_NAME}
			);
		}

		return $value;
	}

	/**
	 * Resolve the node value from its source, falling back to the parsed
	 * text content of the node itself.
	 *
	 * @param \SimpleXMLElement $xmlNode
	 *
	 * @return mixed
	 */
	protected function getValueWithData( \SimpleXMLElement $xmlNode ) {
		$value = $this->extractDataFromSource( $xmlNode );

		if ( self::isPresentValue( $value ) ) {
			return $value;
		}

		return $this->getInnerValue( $xmlNode );
	}

	/**
	 * @param \SimpleXMLElement $xmlNode
	 *
	 * @return mixed text content of the element run through the external parser
	 */
	protected function getInnerValue( \SimpleXMLElement $xmlNode ) {
		return $this->getExternalParser()->parseRecursive( (string)$xmlNode );
	}

	/**
	 * @param \SimpleXMLElement $xmlNode
	 * @param string $attribute
	 *
	 * @return string|null attribute value, or null when the attribute is not set
	 */
	protected function getXmlAttribute( \SimpleXMLElement $xmlNode, $attribute ) {
		if ( isset( $xmlNode[ $attribute ] ) ) {
			return (string)$xmlNode[ $attribute ];
		}

		return null;
	}

	/**
	 * @param string|null $key
	 *
	 * @return mixed unparsed infobox parameter, or null when it is not set
	 */
	protected function getRawInfoboxData( $key ) {
		if ( isset( $this->infoboxData[ $key ] ) ) {
			return $this->infoboxData[ $key ];
		}

		return null;
	}

	/**
	 * @param string|null $key
	 *
	 * @return mixed infobox parameter run through the external parser
	 */
	protected function getInfoboxData( $key ) {
		return $this->getExternalParser()->parseRecursive( $this->getRawInfoboxData( $key ) );
	}

	/**
	 * Read the parsed infobox parameter named by the `source` attribute.
	 *
	 * @param \SimpleXMLElement $xmlNode
	 *
	 * @return mixed null when the node has no usable `source` attribute
	 */
	protected function extractDataFromSource( \SimpleXMLElement $xmlNode ) {
		$source = $this->getXmlAttribute( $xmlNode, self::DATA_SRC_ATTR_NAME );

		// "0" is a valid parameter name, even though PHP considers it empty
		if ( !empty( $source ) || $source == '0' ) {
			return $this->getInfoboxData( $source );
		}

		return null;
	}

	/**
	 * Collect all parameter names used by the node: the `source` attribute
	 * first, then variables referenced in <format> and <default>.
	 *
	 * @param \SimpleXMLElement $xmlNode
	 *
	 * @return array
	 */
	protected function extractSourcesFromNode( \SimpleXMLElement $xmlNode ) {
		$sources = [ ];
		if ( $this->hasPrimarySource( $xmlNode ) ) {
			$sources[] = $this->getXmlAttribute( $xmlNode, self::DATA_SRC_ATTR_NAME );
		}

		foreach ( [ self::FORMAT_TAG_NAME, self::DEFAULT_TAG_NAME ] as $tagName ) {
			if ( $xmlNode->{$tagName} ) {
				$sources = $this->matchVariables( $xmlNode->{$tagName}, $sources );
			}
		}

		return $sources;
	}

	/**
	 * Check whether the node names a parameter in its `source` attribute.
	 * A plain boolean cast is not enough here: it would reject source="0",
	 * which extractDataFromSource() accepts.
	 *
	 * @param \SimpleXMLElement $xmlNode
	 *
	 * @return bool
	 */
	protected function hasPrimarySource( \SimpleXMLElement $xmlNode ) {
		$source = $this->getXmlAttribute( $xmlNode, self::DATA_SRC_ATTR_NAME );

		return $source !== null && $source !== '';
	}

	/**
	 * Append the parameter names referenced as `{{{name}}}` in the node text
	 * to the given list, dropping duplicates.
	 *
	 * @param \SimpleXMLElement $node
	 * @param array $source already known sources
	 *
	 * @return array list of unique sources, in order of first appearance
	 */
	protected function matchVariables( \SimpleXMLElement $node, array $source ) {
		preg_match_all( self::EXTRACT_SOURCE_REGEX, (string)$node, $sources );

		// array_unique() preserves keys; re-index so callers always get a list
		return array_values( array_unique( array_merge( $source, $sources[ 1 ] ) ) );
	}

	/**
	 * Tell whether a resolved value counts as "supplied". Zero ('0' or 0) is
	 * a real value even though PHP treats it as falsy.
	 *
	 * @param mixed $value
	 *
	 * @return bool
	 */
	private static function isPresentValue( $value ) {
		return !empty( $value ) || $value === '0' || $value === 0;
	}
}