mediawiki-extensions-Cite/src/Parsoid/ReferencesData.php

130 lines
3.5 KiB
PHP
Raw Normal View History

<?php
declare( strict_types = 1 );
namespace Wikimedia\Parsoid\Ext\Cite;
use stdClass;
use Wikimedia\Parsoid\Ext\ParsoidExtensionAPI;
class ReferencesData {
/**
* @var int
*/
private $index;
/**
* @var RefGroup[]
*/
private $refGroups;
/**
* ReferencesData constructor.
*/
public function __construct() {
$this->index = 0;
$this->refGroups = [];
}
/**
* @param string $groupName
* @param bool $allocIfMissing
* @return RefGroup|null
*/
public function getRefGroup( string $groupName = '', bool $allocIfMissing = false ): ?RefGroup {
if ( !isset( $this->refGroups[$groupName] ) && $allocIfMissing ) {
$this->refGroups[$groupName] = new RefGroup( $groupName );
}
return $this->refGroups[$groupName] ?? null;
}
/**
* @param string|null $groupName
*/
public function removeRefGroup( ?string $groupName = null ): void {
if ( $groupName !== null ) {
// '' is a valid group (the default group)
unset( $this->refGroups[$groupName] );
}
}
/**
* @param ParsoidExtensionAPI $extApi
* @param string $groupName
* @param string $refName
* @param string $about
* @param bool $skipLinkback
* @return stdClass
*/
public function add(
ParsoidExtensionAPI $extApi, string $groupName, string $refName, string $about, bool $skipLinkback
): stdClass {
$group = $this->getRefGroup( $groupName, true );
// Looks like Cite.php doesn't try to fix ids that already have
// a "_" in them. Ex: name="a b" and name="a_b" are considered
// identical. Not sure if this is a feature or a bug.
// It also considers entities equal to their encoding
// (i.e. '&' === '&amp;'), which is done:
// in PHP: Sanitizer#decodeTagAttributes and
// in Parsoid: ExtensionHandler#normalizeExtOptions
$refName = $extApi->sanitizeHTMLId( $refName );
$hasRefName = strlen( $refName ) > 0;
if ( $hasRefName && isset( $group->indexByName[$refName] ) ) {
$ref = $group->indexByName[$refName];
if ( $ref->contentId && !$ref->hasMultiples ) {
$ref->hasMultiples = true;
// Use the non-pp version here since we've already stored attribs
// before putting them in the map.
$ref->cachedHtml = $extApi->getContentHTML( $ref->contentId );
}
} else {
// The ids produced Cite.php have some particulars:
// Simple refs get 'cite_ref-' + index
// Refs with names get 'cite_ref-' + name + '_' + index + (backlink num || 0)
// Notes (references) whose ref doesn't have a name are 'cite_note-' + index
// Notes whose ref has a name are 'cite_note-' + name + '-' + index
$n = $this->index;
$refKey = strval( 1 + $n );
$refIdBase = 'cite_ref-' . ( $hasRefName ? $refName . '_' . $refKey : $refKey );
$noteId = 'cite_note-' . ( $hasRefName ? $refName . '-' . $refKey : $refKey );
// bump index
$this->index += 1;
$ref = (object)[
'about' => $about,
'contentId' => null,
'dir' => '',
'group' => $group->name,
'groupIndex' => count( $group->refs ) + 1,
'index' => $n,
'key' => $refIdBase,
'id' => $hasRefName ? $refIdBase . '-0' : $refIdBase,
'linkbacks' => [],
'name' => $refName,
'target' => $noteId,
'hasMultiples' => false,
// Just used for comparison when we have multiples
'cachedHtml' => ''
];
$group->refs[] = $ref;
if ( $refName ) {
$group->indexByName[$refName] = $ref;
}
}
if ( !$skipLinkback ) {
$ref->linkbacks[] = $ref->key . '-' . count( $ref->linkbacks );
}
return $ref;
}
/**
* @return RefGroup[]
*/
public function getRefGroups(): array {
return $this->refGroups;
}
}