mediawiki-extensions-Math/tests/phpunit/unit/TexVC/MMLFullCoverageTest.php

142 lines
4.8 KiB
PHP
Raw Normal View History

<?php
namespace MediaWiki\Extension\Math\TexVC;
use InvalidArgumentException;
use MediaWiki\Extension\Math\TexVC\MMLmappings\Util\MMLComparator;
use MediaWiki\Extension\Math\TexVC\MMLmappings\Util\MMLTestUtil;
use MediaWiki\Extension\Math\TexVC\MMLmappings\Util\MMLTestUtilHTML;
use MediaWikiUnitTestCase;
/**
* This is a test which checks the TexVC (LaTeX to MathML) converter capabilities
* It uses the Full-Coverage definition of tests from:
* https://www.mediawiki.org/wiki/Extension:Math/CoverageTest
*
* The json test-files for this can be updated with:
* 'MathSearch-Extension/maintenance/UpdateMath.php --mode mathml --exportmml /var/www/html/extensions/MathSearch'
*
* WIP:
* Currently this is just checking that texVC can generate MathML
* for the specified tests, not how the MathML looks like.
*
* @covers \MediaWiki\Extension\Math\TexVC\TexVC
* @group stub
*/
final class MMLFullCoverageTest extends MediaWikiUnitTestCase {
private static $SIMILARITYTRESH = 0.7;
private static $SKIPXMLVALIDATION = true;
private static $FILENAMELATEXML = __DIR__ . "/mmlRes-latexml-FullCoverage.json";
private static $FILENAMEMATHOID = __DIR__ . "/mmlRes-mathml-FullCoverage.json";
private static $APPLYFILTER = false;
private static $FILTERSTART = 0;
private static $FILTERLENGTH = 60;
private static $GENERATEHTML = false;
private static $GENERATEDHTMLFILE = __DIR__ . "/MMLFullCoverageTest-Output.html";
private static $SKIPPEDINDICES = [ 0,58, 380, 388 ];
private static $FILTERMML = true;
public static function setUpBeforeClass(): void {
MMLTestUtilHTML::generateHTMLstart( self::$GENERATEDHTMLFILE, [ "name","TeX-Input","MathML(LaTeXML)",
"MathML(Mathoid)", "MathML(TexVC)", "F-Similarity" ], self::$GENERATEHTML );
}
public static function tearDownAfterClass(): void {
MMLTestUtilHTML::generateHTMLEnd( self::$GENERATEDHTMLFILE, self::$GENERATEHTML );
}
/**
* @dataProvider provideTestCases
*/
public function testTexVC( $title, $tc ) {
$texVC = new TexVC();
if ( in_array( $tc->ctr, self::$SKIPPEDINDICES ) ) {
MMLTestUtilHTML::generateHTMLtableRow( self::$GENERATEDHTMLFILE, [ $tc->ctr, $tc->tex,
"skipped", "skipped", "skipped" ], false, self::$GENERATEHTML );
$this->assertTrue( true );
return;
}
# Fetch result from TexVC(PHP)
$resultT = $texVC->check( $tc->tex, [
'debug' => false,
'usemathrm' => $tc->usemathrm ?? false,
'oldtexvc' => $tc->oldtexvc ?? false
] );
$mml_latexml = self::$FILTERMML ? self::loadXMLandDeleteAttrs( $tc->mml_latexml ) : $tc->mml_latexml;
$mathMLtexVC = MMLTestUtil::getMMLwrapped( $resultT["input"] );
$mmlComparator = new MMLComparator();
$compRes = $mmlComparator->compareMathML( $tc->mml_mathoid, $mathMLtexVC );
MMLTestUtilHTML::generateHTMLtableRow( self::$GENERATEDHTMLFILE, [ $tc->ctr, $tc->tex, $mml_latexml,
$tc->mml_mathoid, $mathMLtexVC, $compRes['similarityF'] ], false, self::$GENERATEHTML );
if ( !self::$SKIPXMLVALIDATION ) {
if ( !$tc->mml_mathoid ) {
$this->fail( "No Mathoid reference found for: " . $tc->tex );
}
if ( $compRes['similarityF'] >= self::$SIMILARITYTRESH ) {
$this->assertTrue( true );
} else {
$this->assertXmlStringEqualsXmlString( $tc->mml_mathoid, $mathMLtexVC );
}
} else {
$this->assertTrue( true );
}
}
/**
* Deletes some attributes from the mathml which are not necessary for comparisons.
* @param string $mml mathml as string
* @return bool|string false if problem, mathml as xml string without the specified attributes if ok
*/
public static function loadXMLandDeleteAttrs( $mml ) {
$xml = simplexml_load_string( $mml );
self::unsetAttrs( $xml );
// Recursive call deleting attributes
self::deleteAttributes( $xml );
return $xml->asXML();
}
public static function deleteAttributes( &$xml ) {
foreach ( $xml as $node ) {
self::unsetAttrs( $node );
self::deleteAttributes( $node );
}
}
public static function unsetAttrs( $node ): void {
$attrs = $node->attributes();
unset( $attrs['id'] );
unset( $attrs['xref'] );
}
public static function provideTestCases() {
$resMathoid = MMLTestUtil::getJSON( self::$FILENAMEMATHOID );
$resLaTeXML = MMLTestUtil::getJSON( self::$FILENAMELATEXML );
if ( count( $resMathoid ) != count( $resLaTeXML ) ) {
throw new InvalidArgumentException( "Test files dont have the same number of entries." );
}
$f = [];
// Adding running indices for location of tests.
foreach ( $resMathoid as $index => $tcMathoid ) {
$tcLaTeXML = $resLaTeXML[$index];
$tc = [
"ctr" => $index,
"tex" => $tcMathoid->tex,
"type" => $tcMathoid->type,
"mml_mathoid" => $tcMathoid->mml,
"mml_latexml" => $tcLaTeXML->mml,
];
array_push( $f, [ "title N/A", (object)$tc ] );
}
// Filtering results by index if necessary
if ( self::$APPLYFILTER ) {
$f = array_slice( $f, self::$FILTERSTART, self::$FILTERLENGTH );
}
return $f;
}
}