2022-12-23 13:33:57 +00:00
|
|
|
<?php
|
|
|
|
|
|
|
|
namespace MediaWiki\Extension\Math\Tests\TexVC;
|
|
|
|
|
2023-02-03 09:25:09 +00:00
|
|
|
use MediaWiki\Extension\Math\TexVC\MMLmappings\Util\MMLComparator;
|
2022-12-23 13:33:57 +00:00
|
|
|
use MediaWiki\Extension\Math\TexVC\MMLmappings\Util\MMLTestUtil;
|
|
|
|
use MediaWiki\Extension\Math\TexVC\MMLmappings\Util\MMLTestUtilHTML;
|
|
|
|
use MediaWiki\Extension\Math\TexVC\TexUtil;
|
|
|
|
use MediaWiki\Extension\Math\TexVC\TexVC;
|
|
|
|
use MediaWikiUnitTestCase;
|
|
|
|
|
|
|
|
/**
|
2023-01-26 15:34:27 +00:00
|
|
|
* This test is checking the MathML generation from LaTeX by TexVC.
|
2022-12-23 13:33:57 +00:00
|
|
|
* It creates a list of basic LaTeX statements from the supported functions
|
2023-01-26 15:34:27 +00:00
|
|
|
* of TexVC from TexUtil.php. Also it loads Reference MathML (mathoid,latexml) from a file
|
|
|
|
* usually defined as "TexUtil-Ref.json"
|
|
|
|
*
|
|
|
|
* This reference file can be generated by reading texutil.json with
|
|
|
|
* the maintenance script: "JsonToMathML.php".
|
|
|
|
*
|
|
|
|
* WIP: This generates MathML with TexVC and computes a similarity score against the
* reference MathML, but while $SKIPXMLVALIDATION is true the score is not asserted on.
|
|
|
|
*
|
2022-12-23 13:33:57 +00:00
|
|
|
* @covers \MediaWiki\Extension\Math\TexVC\TexVC
|
|
|
|
*/
|
2023-01-26 15:34:27 +00:00
|
|
|
class MMLGenerationTexUtilTest extends MediaWikiUnitTestCase {
	/**
	 * @var float lowest value of the comparator's 'similarityF' result that is accepted
	 *  without falling back to a strict XML equality assertion. Only consulted when
	 *  $SKIPXMLVALIDATION is false.
	 */
	private static $SIMILARITYTHRESH = 0.7;

	/** @var bool when true, testTexVC() makes no assertion about the generated MathML */
	private static $SKIPXMLVALIDATION = true;

	/** @var bool when true, only the slice [$FILTERSTART, $FILTERSTART + $FILTERLENGTH) of all cases is provided */
	private static $APPLYFILTER = false;

	/**
	 * @var bool when true, only the sets listed in $FILTEREDCATEGORIES are provided.
	 *  Note that skipped sets do not advance the overall case counter, so the meaning of
	 *  $SKIPPEDINDICES shifts while this filter is active.
	 */
	private static $APPLYCATEGORYFILTER = false;

	/** @var string[] set names kept by the category filter */
	private static $FILTEREDCATEGORIES = [ "fun_ar1" ];

	/** @var int offset of the first provided case when $APPLYFILTER is true */
	private static $FILTERSTART = 15;

	/** @var int number of provided cases when $APPLYFILTER is true */
	private static $FILTERLENGTH = 1;

	/** @var bool flag handed to every MMLTestUtilHTML call; presumably enables writing the HTML report */
	private static $GENERATEHTML = false;

	/** @var string path handed to MMLTestUtilHTML as the report file */
	private static $GENERATEDHTMLFILE = __DIR__ . "/MMLGenerationTexUtilTest-Output.html";

	/** @var string path of the JSON file holding the reference MathML per TeX input */
	private static $MMLREFFILE = __DIR__ . "/TexUtil-Ref.json";

	/** @var bool export the updated TexUtil-Tex to "./ExportedTexUtilKeys.json" */
	private static $EXPORT_KEYS = false;

	/** @var int[] overall case counters ("ctr") that are reported as "skipped" and not run through TexVC */
	private static $SKIPPEDINDICES = [ 15, 33, 383, 554 ];

	/**
	 * Render one generated TeX case with TexVC and compare it with the reference MathML.
	 *
	 * @dataProvider provideTestCases
	 * @param string $title unique name of the case as built by provideTestCases()
	 * @param \stdClass $input case object; this method reads its tex, mmlMathoid,
	 *  mmlLaTeXML and ctr properties (and the optional refMissing marker)
	 */
	public function testTexVC( $title, $input ) {
		if ( in_array( $input->ctr, self::$SKIPPEDINDICES, true ) ) {
			self::writeHtmlRow( $title, $input, "skipped", "skipped" );
			$this->assertTrue( true );
			return;
		}

		if ( $input->refMissing ?? false ) {
			// The provider found no entry for this TeX input in the reference file, so there
			// is nothing to compare against. Report that visibly instead of passing or crashing.
			self::writeHtmlRow( $title, $input, "skipped", "skipped" );
			$this->markTestSkipped(
				"No reference MathML for '" . $input->tex . "' in " . basename( self::$MMLREFFILE )
			);
		}

		// Fetching the result from TexVC
		$texVC = new TexVC();
		$resultT = $texVC->check( $input->tex, [
			'debug' => false,
			'usemathrm' => false,
			'oldtexvc' => false,
			'usemhchem' => self::getMHChem( $title ),
		] );
		$mathMLtexVC = MMLTestUtil::getMMLwrapped( $resultT["input"] ) ?? "<math> error texvc </math>";

		// The Mathoid rendering is the preferred reference; LaTeXML is used when it is empty.
		$usedMMLRef = $input->mmlMathoid ?: $input->mmlLaTeXML;

		$mmlComparator = new MMLComparator();
		$compRes = $mmlComparator->compareMathML( $usedMMLRef, $mathMLtexVC );
		self::writeHtmlRow( $title, $input, $mathMLtexVC, $compRes['similarityF'] );

		if ( self::$SKIPXMLVALIDATION || $compRes['similarityF'] >= self::$SIMILARITYTHRESH ) {
			// Validation is switched off or the output is similar enough: count as passed.
			$this->assertTrue( true );
			return;
		}

		// Below the threshold: fail with PHPUnit's XML diff of reference and generated MathML.
		$this->assertXmlStringEqualsXmlString( $usedMMLRef, $mathMLtexVC );
	}

	/** Names of the TexUtil base-element sets for which test cases are generated. */
	private const SETS = [
		'big_literals',
		'box_functions',
		'color_function',
		'declh_function',
		'definecolor_function',
		'fun_ar1',
		'fun_ar1nb',
		'fun_ar1opt',
		'fun_ar2',
		'fun_ar2nb',
		'fun_infix',
		'fun_mhchem',
		'hline_function',
		'latex_function_names',
		'left_function',
		'mediawiki_function_names',
		'mhchem_bond',
		'mhchem_macro_1p',
		'mhchem_macro_2p',
		'mhchem_macro_2pc',
		'mhchem_macro_2pu',
		'mhchem_single_macro',
		'nullary_macro',
		'nullary_macro_in_mbox',
		'other_delimiters1',
		'other_delimiters2',
		'right_function'
	];

	/**
	 * Number of generated "{a}", "{b}", ... arguments appended per set. Only used for
	 * sets without an entry in SAMPLE_ARGS_RIGHT; sets missing here get no arguments.
	 */
	private const ARG_CNTS = [
		"big_literals" => 1,
		"box_functions" => 1,
		"color_function" => 1,
		"definecolor_function" => 1,
		"fun_ar1" => 1,
		"fun_ar1nb" => 1,
		"fun_ar1opt" => 1,
		"fun_ar2" => 2,
		"fun_infix" => 1,
		"fun_ar2nb" => 5,
		"fun_mhchem" => 1,
		"left_function" => 1,
		"right_function" => 1,
		"mhchem_bond" => 1,
		"mhchem_macro_1p" => 1,
		"mhchem_macro_2p" => 2,
		"mhchem_macro_2pu" => 1
	];

	/** Sets whose entries are rendered as "{<entry> a }" when they have no right-hand arguments. */
	private const OTHER_ARGS = [
		"declh_function" => true,
	];

	/** Fixed text appended after an entry of the given set (takes precedence over ARG_CNTS). */
	private const SAMPLE_ARGS_RIGHT = [
		"big_literals" => '(',
		"color_function" => '{red}{red}',
		"mhchem_macro_2pc" => '{red}{red}',
		"definecolor_function" => '{ultramarine}{RGB}{0,32,96}',
		"fun_ar2nb" => '{_1^2}{_3^4}\\sum',
		"left_function" => '( \\right.',
		"mhchem_bond" => '{-}',
		"right_function" => ')',
	];

	/** Fixed text prepended before an entry of the given set. */
	private const SAMPLE_ARGS_LEFT = [
		"right_function" => '\\left(',
	];

	/** Complete TeX snippets for individual entries; these bypass all set-based argument rules. */
	private const ENTRY_ARGS = [
		"\\atop" => "{ a \\atop b }",
		"\\choose" => "{ a \\choose b }",
		"\\over" => "{a \\over b }",
		"\\hline" => "\n\\begin{array}{|c||c|} a & b \\\\\n\\hline\n1&2 \n\\end{array}\n",
		"\\nolimits" => " \\mathop{\\rm cos}\\nolimits^2",
		// "\\limits" =>" \\mathop{\\rm cos}\\limits^2",
		"\\limits" => "\\lim\\limits_{x \\to 2}",
		"\\displaystyle" => "\\frac{\\displaystyle \\sum_{k=1}^N k^2}{a}",
		"\\scriptscriptstyle" => "\\frac ab + \\scriptscriptstyle{\\frac cd + \\frac ef} + \\frac gh",
		"\\scriptstyle" => "{\\scriptstyle \\partial \\Omega}",
		"\\textstyle" => "\\textstyle \\sum_{k=1}^N k^2",
		// Failing examples: ="\\vbox{{a}{b}}""\\vbox{\\vhb{eight}\\vhb{gnat}}"
		// "\\vbox{\\hbox{eight}\\hbox{gnat}}";
		"\\vbox" => "\\vbox{ab}",
		"\\emph" => "\\mathit{\\emph{a}} \\emph{b}",
		// it seems not supported for math, not in any other en_wiki test etc. probably make sense
		// to drop or substitute with \\vert
		"\\vline" => "\n\\begin{array}{|c||c|} a & b \\vline c \\\\\n\\hline\n1&2 \n\\end{array}\n",
	];

	/**
	 * Check from the test title if it is a mhchem-test.
	 *
	 * @param string $title test title
	 * @return bool true if the title contains the substring "chem"
	 */
	public static function getMHChem( string $title ): bool {
		return str_contains( $title, "chem" );
	}

	/**
	 * Hand the report file, the column headings and the $GENERATEHTML flag to
	 * MMLTestUtilHTML::generateHTMLstart() before the first test runs.
	 */
	public static function setUpBeforeClass(): void {
		MMLTestUtilHTML::generateHTMLstart(
			self::$GENERATEDHTMLFILE,
			[ "name", "TeX-Input", "MathML(LaTeXML)", "MathML(Mathoid)", "MathML(TexVC)", "F-Similarity" ],
			self::$GENERATEHTML
		);
	}

	/**
	 * Hand the report file and the $GENERATEHTML flag to MMLTestUtilHTML::generateHTMLEnd()
	 * after the last test ran.
	 */
	public static function tearDownAfterClass(): void {
		MMLTestUtilHTML::generateHTMLEnd( self::$GENERATEDHTMLFILE, self::$GENERATEHTML );
	}

	/**
	 * Generate testcases with texutil, filter them and provide them to the testrunner.
	 * Fetch the corresponding reference MathML from the file defined as $MMLREFFILE
	 *
	 * Every provided case is [ title, object ]. The object is a private copy of the matching
	 * reference entry with the running counter stored in "ctr". TeX inputs without a
	 * reference entry get a placeholder object flagged with "refMissing".
	 *
	 * @return array
	 */
	public static function provideTestCases() {
		// Index the reference entries by their TeX input for direct lookup.
		$refFileContent = (array)MMLTestUtil::getJSON( self::$MMLREFFILE );
		$refAssociative = [];
		foreach ( $refFileContent as $entry ) {
			$refAssociative[$entry->tex] = $entry;
		}

		$groups = self::createGroups();
		$overAllCtr = 0;
		$finalCases = [];
		foreach ( $groups as $category => $group ) {
			if ( self::$APPLYCATEGORYFILTER && !in_array( $category, self::$FILTEREDCATEGORIES, true ) ) {
				continue;
			}
			foreach ( $group as $indexCtr => $case ) {
				$title = "set#" . $overAllCtr . ": " . $category . $indexCtr;

				if ( isset( $refAssociative[$case] ) ) {
					// Clone: the same TeX string can be generated for several cases, and a
					// shared object would have its "ctr" overwritten by the later case.
					$finalCase = clone $refAssociative[$case];
				} else {
					// No reference available. Build a placeholder carrying the properties that
					// are read later on, so that assigning "ctr" does not fail on a plain string.
					// NOTE(review): "type" is assumed to be the TexUtil set name - confirm
					// against the reference entries produced by JsonToMathML.php.
					$finalCase = (object)[
						'tex' => $case,
						'type' => $category,
						'mmlLaTeXML' => null,
						'mmlMathoid' => null,
						'refMissing' => true,
					];
				}
				$finalCase->ctr = $overAllCtr;

				$finalCases[$title] = [ $title, $finalCase ];
				$overAllCtr++;
			}
		}

		if ( self::$APPLYFILTER ) {
			$finalCases = array_slice( $finalCases, self::$FILTERSTART, self::$FILTERLENGTH );
		}

		if ( self::$EXPORT_KEYS ) {
			// Creating a reference file for lookup in JsonToMathML maintenance script.
			$dataToExport = [];
			foreach ( $finalCases as $case ) {
				$dataToExport[$case[1]->tex] = $case[1]->type;
			}
			self::writeToFile( __DIR__ . "/ExportedTexUtilKeys.json", $dataToExport );
		}

		return $finalCases;
	}

	/**
	 * Serialize the given entries as pretty-printed JSON and write them to a file.
	 *
	 * @param string $fullPath path of the file to (over)write
	 * @param array $allEntries data to serialize
	 * @throws \JsonException if the entries cannot be encoded
	 * @throws \RuntimeException if the file cannot be written
	 */
	public static function writeToFile( string $fullPath, array $allEntries ): void {
		$jsonData = json_encode( $allEntries, JSON_PRETTY_PRINT | JSON_THROW_ON_ERROR );
		if ( file_put_contents( $fullPath, $jsonData ) === false ) {
			throw new \RuntimeException( "Could not write JSON export to '" . $fullPath . "'" );
		}
	}

	/**
	 * Build a TeX snippet for one entry of a TexUtil set by surrounding it with sample arguments.
	 *
	 * @param string $set name of the TexUtil set the entry belongs to
	 * @param string|int $entry key of the set; array_keys() yields integers for numeric keys
	 * @return string TeX snippet used as test input
	 */
	private static function addArgs( $set, $entry ): string {
		if ( isset( self::ENTRY_ARGS[$entry] ) ) {
			// Some entries have specific mappings for non-group related arguments
			return self::ENTRY_ARGS[$entry];
		}

		if ( isset( self::SAMPLE_ARGS_RIGHT[$set] ) ) {
			$argsR = self::SAMPLE_ARGS_RIGHT[$set];
		} else {
			// Generate "{a}{b}..." with as many groups as the set is configured for.
			$argsR = '';
			$count = self::ARG_CNTS[$set] ?? 0;
			for ( $i = 0; $i < $count; $i++ ) {
				$argsR .= '{' . chr( 97 + $i ) . '}';
			}
		}
		$argsL = self::SAMPLE_ARGS_LEFT[$set] ?? '';

		if ( $argsR === '' && ( self::OTHER_ARGS[$set] ?? false ) ) {
			return "{" . $entry . " a }";
		}

		$rendering = $argsL . $entry . $argsR;
		// Sets whose name starts with "mhchem" are wrapped into a \ce{...} environment.
		return str_starts_with( $set, "mhchem" ) ? '\\ce{' . $rendering . '}' : $rendering;
	}

	/**
	 * Create the TeX snippets for all entries of all sets listed in SETS.
	 *
	 * @return array<string,string[]> list of TeX snippets per set name
	 */
	private static function createGroups(): array {
		$groups = [];
		foreach ( self::SETS as $set ) {
			$entries = array_keys( TexUtil::getInstance()->getBaseElements()[$set] );
			// array_map instead of a by-reference foreach: no reference-bound element is
			// left behind in the stored group.
			$groups[$set] = array_map(
				static fn ( $entry ) => self::addArgs( $set, $entry ),
				$entries
			);
		}
		return $groups;
	}

	/**
	 * Hand one row of the HTML report to MMLTestUtilHTML::generateHTMLtableRow().
	 *
	 * @param string $title name of the test case
	 * @param \stdClass $input case object providing tex, mmlLaTeXML and mmlMathoid
	 * @param string $texvcCell content of the "MathML(TexVC)" column
	 * @param string|float $similarityCell content of the "F-Similarity" column
	 */
	private static function writeHtmlRow( $title, $input, $texvcCell, $similarityCell ): void {
		MMLTestUtilHTML::generateHTMLtableRow(
			self::$GENERATEDHTMLFILE,
			[ $title, $input->tex, $input->mmlLaTeXML, $input->mmlMathoid, $texvcCell, $similarityCell ],
			false,
			self::$GENERATEHTML
		);
	}
}
|