mediawiki-extensions-Visual.../modules/parser/mediawiki.DOMPostProcessor.js
Gabriel Wicke 2bb512a4de A bit of tokenizer grammar clean-up and additional expected-html
normalization. 99 parser tests now passing.
2011-11-30 13:40:17 +00:00

80 lines
1.9 KiB
JavaScript

/* Perform post-processing steps on an already-built HTML DOM. */
var isBlock = function isBlock (name) {
switch (name.toLowerCase()) {
case 'div':
case 'table':
case 'td':
case 'tr':
case 'tbody':
case 'p':
case 'ul':
case 'ol':
case 'li':
case 'dl':
case 'dt':
case 'dd':
case 'img': // hmm!
case 'pre':
case 'center':
case 'blockquote':
return true;
default:
return false;
}
};
// Wrap all top-level inline elements in paragraphs. This should also be
// applied inside block-level elements, but in that case the first paragraph
// usually remains plain inline.
var process_inlines_in_p = function ( document ) {
// document.body does not always work in jsdom, so work around it.
var body = document.getElementsByTagName('body')[0],
newP = document.createElement('p'),
cnodes = body.childNodes,
haveInlines = false,
deleted = 0;
function isElementContentWhitespace ( e ) {
return (e.data.match(/^[ \r\n\t]*$/) !== null);
}
for(var i = 0, length = cnodes.length; i < length; i++) {
var child = cnodes[i - deleted],
ctype = child.nodeType;
//console.log(child + ctype);
if ((ctype === 3 && (haveInlines || !isElementContentWhitespace(child))) ||
(ctype !== 3 && // text
ctype !== 8 && // comment
!isBlock(child.nodeName))) {
// text node
newP.appendChild(child);
haveInlines = true;
deleted++;
} else if (haveInlines) {
body.insertBefore(newP, child);
newP = document.createElement('p');
haveInlines = false;
}
}
if (haveInlines) {
body.appendChild(newP);
}
};
function DOMPostProcessor () {
this.processors = [process_inlines_in_p];
}
DOMPostProcessor.prototype.doPostProcess = function ( document ) {
for(var i = 0; i < this.processors.length; i++) {
this.processors[i](document);
}
};
if (typeof module == "object") {
module.exports.DOMPostProcessor = DOMPostProcessor;
}