2024-01-12 22:30:44 +00:00
|
|
|
/**
 * @module gateway/reference
 */
|
|
|
|
|
2024-12-16 12:36:38 +00:00
|
|
|
// Value stored in the `type` field of every preview model built by this gateway.
const TYPE_REFERENCE = 'reference';
|
2024-01-12 22:30:44 +00:00
|
|
|
|
|
|
|
/**
 * @return {Gateway}
 */
|
|
|
|
module.exports = function createReferenceGateway() {
|
|
|
|
|
|
|
|
/**
 * Looks up the element that holds the text of the footnote with the given element ID.
 *
 * @param {string} id Element ID of the footnote; it is CSS-escaped before being placed
 *  into the selector, so it may contain characters that are special in selectors
 * @return {HTMLElement|null} The first matching text element below `#id`, or null when
 *  nothing matches
 */
function findReferenceTextElement( id ) {
	const idSelector = `#${ CSS.escape( id ) }`;

	/**
	 * Same alternative selectors with and without mw-… as in the REST-based endpoint.
	 *
	 * @see https://phabricator.wikimedia.org/diffusion/GMOA/browse/master/lib/transformations/references/structureReferenceListContent.js$138
	 */
	return document.querySelector( `${ idSelector } .mw-reference-text, ${ idSelector } .reference-text` );
}
|
|
|
|
|
2024-06-26 15:05:56 +00:00
|
|
|
/**
 * Finds the text element of the parent reference for a reference that is listed inside
 * a nested `<ol class="mw-extended-references">`.
 *
 * @param {HTMLElement} el Element inside a reference list
 * @return {HTMLElement|null} The first reference text element found below the element
 *  that contains the nested list, or null when `el` is not inside such a nested list
 */
function findParentReferenceTextElement( el ) {
	// This finds either the inner <ol class="mw-extended-references">, or the outer
	// <ol class="references">
	const list = el.closest( 'ol' );

	// Only the inner list marks a sub-reference; anything else has no parent reference.
	if ( !list || !list.classList.contains( 'mw-extended-references' ) ) {
		return null;
	}

	return list.parentElement.querySelector( '.mw-reference-text, .reference-text' );
}
|
|
|
|
|
|
|
|
/**
 * Produces the HTML shown as the preview's extract.
 *
 * Without a parent reference this is just the reference's own inner HTML. With a parent,
 * the parent's inner HTML is wrapped in a `<div class="mw-reference-previews-parent">`
 * and followed by the reference's inner HTML in a plain `<div>`.
 *
 * @param {HTMLElement} referenceElement Text element of the reference itself
 * @param {(HTMLElement|null)} parentElement Text element of the parent reference, if any
 * @return {string} HTML markup
 */
function scrapeReferenceText( referenceElement, parentElement ) {
	if ( !parentElement ) {
		return referenceElement.innerHTML;
	}

	return `
	<div class="mw-reference-previews-parent">${ parentElement.innerHTML }</div>
	<div>${ referenceElement.innerHTML }</div>
	`;
}
|
|
|
|
|
2024-01-12 22:30:44 +00:00
|
|
|
/**
 * Attempts to find a single reference type identifier, limited to a list of known types.
 * - When a `class="…"` attribute mentions multiple known types, the last one is used, following
 *   CSS semantics.
 * - When there are multiple <cite> tags, the first with a known type is used.
 *
 * @param {HTMLElement} referenceElement Element whose `<cite class="…">` descendants are
 *  inspected
 * @return {string|null} One of the known type names, or null when no `<cite>` mentions one
 */
function scrapeReferenceType( referenceElement ) {
	const KNOWN_TYPES = [ 'book', 'journal', 'news', 'note', 'web' ];
	// Array.from() lets the loop below work with any array-like query result.
	const citeTags = Array.from( referenceElement.querySelectorAll( 'cite[class]' ) );

	for ( const cite of citeTags ) {
		const classNames = cite.className.split( /\s+/ );

		// Walk backwards so that the last known type mentioned in the attribute wins.
		for ( let i = classNames.length - 1; i >= 0; i-- ) {
			if ( KNOWN_TYPES.indexOf( classNames[ i ] ) !== -1 ) {
				// The first <cite> with a known type decides; no need to keep scanning.
				return classNames[ i ];
			}
		}
	}

	return null;
}
|
|
|
|
|
|
|
|
/**
 * Builds the preview model for the footnote that a link points at, using only content
 * that is already present in the current document.
 *
 * The returned promise is rejected with an "abort"-style object when the title has no
 * usable fragment, when no footnote text element is found for it, or when that element
 * contains neither visible text nor child elements.
 *
 * @param {mw.Title} title Title whose fragment identifies the footnote element
 * @param {HTMLAnchorElement} el Link that triggered the preview; the ID of its parent
 *  node is recorded as `sourceElementId`
 * @return {Promise<ext.popups.PreviewModel>} Promise with a no-op `abort()` method
 */
function fetchPreviewForTitle( title, el ) {
	// getFragment() may yield no fragment at all; treat that like a missing footnote
	// instead of failing synchronously or querying with the invalid selector "#".
	const fragment = title.getFragment();
	// Need to encode the fragment again as mw.Title returns it as decoded text
	const id = typeof fragment === 'string' ? fragment.replace( / /g, '_' ) : '';
	const referenceTextElement = id ? findReferenceTextElement( id ) : null;

	if ( !referenceTextElement ||
		// Skip references that don't contain anything but whitespace, e.g. a single
		// non-breaking space
		( !referenceTextElement.textContent.trim() && !referenceTextElement.children.length )
	) {
		return Promise.reject(
			// Required to set showNullPreview to false and not open an error popup
			{ textStatus: 'abort', textContext: 'Footnote not found or empty', xhr: { readyState: 0 } }
		);
	}

	const referenceParentTextElement = findParentReferenceTextElement( referenceTextElement );

	const model = {
		url: `#${ id }`,
		extract: scrapeReferenceText( referenceTextElement, referenceParentTextElement ),
		type: TYPE_REFERENCE,
		// When there is a parent reference, the type is read from the parent's text element.
		referenceType: scrapeReferenceType( referenceParentTextElement || referenceTextElement ),
		// Note: Even the top-most HTMLHtmlElement is guaranteed to have a parent.
		sourceElementId: el.parentNode.id
	};

	// Make promise abortable.
	const promise = Promise.resolve( model );
	promise.abort = () => {};
	return promise;
}
|
|
|
|
|
|
|
|
return {
|
|
|
|
fetchPreviewForTitle
|
|
|
|
};
|
|
|
|
};
|