Recentchanges optimization: avoid a lot of senseless parsing of link text coming...
[lhc/web/wiklou.git] / maintenance / parserTests.php
1 <?php
2 # Copyright (C) 2004 Brion Vibber <brion@pobox.com>
3 # http://www.mediawiki.org/
4 #
5 # This program is free software; you can redistribute it and/or modify
6 # it under the terms of the GNU General Public License as published by
7 # the Free Software Foundation; either version 2 of the License, or
8 # (at your option) any later version.
9 #
10 # This program is distributed in the hope that it will be useful,
11 # but WITHOUT ANY WARRANTY; without even the implied warranty of
12 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 # GNU General Public License for more details.
14 #
15 # You should have received a copy of the GNU General Public License along
16 # with this program; if not, write to the Free Software Foundation, Inc.,
17 # 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
18 # http://www.gnu.org/copyleft/gpl.html
19
20 /**
21 * @todo Make this more independent of the configuration (and if possible the database)
22 * @todo document
23 * @package MediaWiki
24 * @subpackage Maintenance
25 */
26
27 /** */
# Switches this script understands; each one is looked up in $options
# further down in this file.
# NOTE(review): presumably commandLine.inc reads both lists while parsing
# the command line - confirm against that file.
$options = array(
    'quick',
    'color',
    'quiet',
    'help',
);
# Switches that are followed by a value (--regex <expression>).
$optionsWithArgs = array(
    'regex',
);
30
31 require_once( 'commandLine.inc' );
32 require_once( "$IP/includes/ObjectCache.php" );
33 require_once( "$IP/languages/LanguageUtf8.php" );
34
35 /** */
36 class ParserTest {
/**
 * boolean $color whether output should be colorized
 * @access private
 */
41 var $color;
42
/**
 * boolean $lightcolor whether output should use light colors
 * @access private
 */
47 var $lightcolor;
48
49 /**
50 * Sets terminal colorization and diff/quick modes depending on OS and
51 * command-line options (--color and --quick).
52 *
53 * @access public
54 */
function ParserTest() {
    global $options;

    # By default only colorize when stdout is a terminal. posix_isatty()
    # comes from the optional posix extension, so make sure it exists
    # before calling it; when it is missing fall back to plain output
    # instead of dying on an undefined function.
    $this->lightcolor = false;
    $this->color = !wfIsWindows()
        && function_exists( 'posix_isatty' )
        && posix_isatty( 1 );

    # An explicit --color option overrides the detection above.
    if( isset( $options['color'] ) ) {
        switch( $options['color'] ) {
        case 'no':
            $this->color = false;
            break;
        case 'light':
            $this->lightcolor = true;
            # Fall through
        case 'yes':
        default:
            $this->color = true;
            break;
        }
    }

    # --quick: do not print a diff for failed tests.
    $this->showDiffs = !isset( $options['quick'] );

    # --quiet: do not print anything for passing tests.
    $this->quiet = isset( $options['quiet'] );

    # --regex: only run tests whose description matches; the empty
    # pattern matches anything.
    if( isset( $options['regex'] ) ) {
        $this->regex = $options['regex'];
    } else {
        $this->regex = '';
    }
}
88
89 /**
90 * Remove last character if it is a newline
91 * @access private
92 */
function chomp($s) {
    # Strip exactly one trailing "\n"; any other input is returned as is.
    $endsWithNewline = ( substr($s, -1) === "\n" );
    return $endsWithNewline ? substr($s, 0, -1) : $s;
}
101
102 /**
103 * Run a series of tests listed in the given text file.
104 * Each test consists of a brief description, wikitext input,
105 * and the expected HTML output.
106 *
107 * Prints status updates on stdout and counts up the total
108 * number and percentage of passed tests.
109 *
110 * @param string $filename
111 * @return bool True if passed all tests, false if any tests failed.
112 * @access public
113 */
function runTestsFromFile( $filename ) {
    $infile = fopen( $filename, 'rt' );
    if( !$infile ) {
        # Report the file that was actually requested.
        die( "Couldn't open $filename\n" );
    }

    # $data collects the text of each "!! section" of the entry currently
    # being read, keyed by lower-cased section name; $section is the
    # section that ordinary lines are appended to (null = outside any).
    $data = array();
    $section = null;
    $success = 0;
    $total = 0;
    $n = 0;
    while( false !== ($line = fgets( $infile ) ) ) {
        $n++;
        if( preg_match( '/^!!\s*(\w+)/', $line, $matches ) ) {
            $section = strtolower( $matches[1] );
            if( $section == 'endarticle') {
                # End of an article fixture: needs both 'text' and 'article'.
                if( !isset( $data['text'] ) ) {
                    die( "'endarticle' without 'text' at line $n\n" );
                }
                if( !isset( $data['article'] ) ) {
                    die( "'endarticle' without 'article' at line $n\n" );
                }
                $this->addArticle($this->chomp($data['article']), $this->chomp($data['text']), $n);
                $data = array();
                $section = null;
                continue;
            }
            if( $section == 'end' ) {
                # End of a test case: 'test', 'input' and 'result' are
                # mandatory, 'options' defaults to the empty string.
                if( !isset( $data['test'] ) ) {
                    die( "'end' without 'test' at line $n\n" );
                }
                if( !isset( $data['input'] ) ) {
                    die( "'end' without 'input' at line $n\n" );
                }
                if( !isset( $data['result'] ) ) {
                    die( "'end' without 'result' at line $n\n" );
                }
                if( !isset( $data['options'] ) ) {
                    $data['options'] = '';
                }
                else {
                    $data['options'] = $this->chomp( $data['options'] );
                }
                # Skip tests marked 'disabled' and tests whose description
                # does not match --regex.
                # NOTE(review): the user-supplied regex is placed between
                # '/' delimiters unescaped, so a pattern containing a bare
                # '/' will not compile.
                if (preg_match('/\\bdisabled\\b/i', $data['options'])
                    || !preg_match("/{$this->regex}/i", $data['test'])) {
                    # disabled test
                    $data = array();
                    $section = null;
                    continue;
                }
                if( $this->runTest(
                    $this->chomp( $data['test'] ),
                    $this->chomp( $data['input'] ),
                    $this->chomp( $data['result'] ),
                    $this->chomp( $data['options'] ) ) ) {
                    $success++;
                }
                $total++;
                $data = array();
                $section = null;
                continue;
            }
            # Any other marker opens a new section of the current entry.
            if ( isset ($data[$section] ) ) {
                die ( "duplicate section '$section' at line $n\n" );
            }
            $data[$section] = '';
            continue;
        }
        if( $section ) {
            $data[$section] .= $line;
        }
    }
    # Everything has been read; release the handle before reporting.
    fclose( $infile );

    if( $total > 0 ) {
        $ratio = intval( 100.0 * $success / $total );
        print $this->termColor( 1 ) . "\nPassed $success of $total tests ($ratio%) ";
        if( $success == $total ) {
            print $this->termColor( 32 ) . "PASSED!";
        } else {
            print $this->termColor( 31 ) . "FAILED!";
        }
        print $this->termReset() . "\n";
        return ($success == $total);
    } else {
        die( "No tests found.\n" );
    }
}
200
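/**
 * Run a given wikitext input through a freshly-constructed wiki parser,
 * and compare the output against the expected results.
 * Prints status and explanatory messages to stdout.
 *
 * @param string $desc Test description, shown in the status messages
 * @param string $input Wikitext to try rendering
 * @param string $result Expected output to compare against
 * @param string $opts Option keywords from the test's 'options' section
 * @return bool True if the output matched the expected result
 */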
function runTest( $desc, $input, $result, $opts ) {
    if( !$this->quiet ) {
        $this->showTesting( $desc );
    }

    # Everything below runs inside the per-test global environment.
    $this->setupGlobals($opts);

    $user =& new User();
    $options =& ParserOptions::newFromUser( $user );

    $wantsMath = preg_match('/\\bmath\\b/i', $opts);
    if ($wantsMath) {
        # XXX this should probably be done by the ParserOptions
        require_once('Math.php');

        $options->setUseTex(true);
    }

    # "title=[[...]]" in the options overrides the default page title.
    $titleText = preg_match('/title=\[\[(.*)\]\]/', $opts, $m)
        ? $m[1]
        : 'Parser test';

    $parser =& new Parser();
    $title =& Title::makeTitle( NS_MAIN, $titleText );

    if (preg_match('/\\bpst\\b/i', $opts)) {
        # 'pst': compare the pre-save transform of the input.
        $out = $parser->preSaveTransform( $input, $title, $user, $options );
    } elseif (preg_match('/\\bmsg\\b/i', $opts)) {
        # 'msg': compare the message transform of the input.
        $out = $parser->transformMsg( $input, $options );
    } else {
        # Default: full parse. 'ill' and 'cat' compare the collected
        # language or category links instead of the rendered text.
        $output =& $parser->parse( $input, $title, $options );
        $out = $output->getText();

        if (preg_match('/\\bill\\b/i', $opts)) {
            $links = implode( ' ', $output->getLanguageLinks() );
            $out = $this->tidy( $links );
        } else if (preg_match('/\\bcat\\b/i', $opts)) {
            $links = implode( ' ', $output->getCategoryLinks() );
            $out = $this->tidy( $links );
        }

        $result = $this->tidy($result);
    }

    $this->teardownGlobals();

    $passed = ( $result === $out );
    return $passed
        ? $this->showSuccess( $desc )
        : $this->showFailure( $desc, $result, $out );
}
262
263 /**
264 * Set up the global variables for a consistent environment for each test.
265 * Ideally this should replace the global configuration entirely.
266 *
267 * @access private
268 */
function setupGlobals($opts = '') {
    # Remember the prefixed / quoted names of the real tables before the
    # table prefix is switched below; setupDatabase() builds the temporary
    # tables from these names.
    $dbr =& wfGetDB( DB_READ );
    $this->oldTableNames = array();
    foreach( $this->listTables() as $name ) {
        $this->oldTableNames[$name] = $dbr->tableName( $name );
    }

    # The dummy upload directory is created lazily and reused until
    # teardownGlobals() removes it.
    if( !isset( $this->uploadDir ) ) {
        $this->uploadDir = $this->setupUploadDir();
    }

    # Subpages in the main namespace are only on for 'subpage' tests.
    $subpagesInMain = preg_match('/\\bsubpage\\b/i', $opts);

    $settings = array(
        'wgServer' => 'http://localhost',
        'wgScript' => '/index.php',
        'wgScriptPath' => '/',
        'wgArticlePath' => '/wiki/$1',
        'wgUploadPath' => '/images',
        'wgUploadDirectory' => $this->uploadDir,
        'wgStyleSheetPath' => '/skins',
        'wgSitename' => 'MediaWiki',
        'wgLanguageCode' => 'en',
        'wgContLanguageCode' => 'en',
        'wgUseLatin1' => false,
        'wgDBprefix' => 'parsertest',
        'wgDefaultUserOptions' => array(),

        'wgLoadBalancer' => LoadBalancer::newFromParams( $GLOBALS['wgDBservers'] ),
        'wgLang' => new LanguageUtf8(),
        'wgContLang' => new LanguageUtf8(),
        'wgNamespacesWithSubpages' => array( 0 => $subpagesInMain ),
        'wgMaxTocLevel' => 999,
    );

    # Swap the test values in, keeping the previous ones so that
    # teardownGlobals() can restore them.
    $this->savedGlobals = array();
    foreach( array_keys( $settings ) as $name ) {
        $this->savedGlobals[$name] = $GLOBALS[$name];
        $GLOBALS[$name] = $settings[$name];
    }

    $GLOBALS['wgLoadBalancer']->loadMasterPos();
    $GLOBALS['wgMessageCache']->initialise( new BagOStuff(), false, 0, $GLOBALS['wgDBname'] );
    $this->setupDatabase();
}
310
311 # List of temporary tables to create, without prefix
312 # Some of these probably aren't necessary
function listTables() {
    # Unprefixed names of the tables that get a temporary copy, in the
    # order in which they are created.
    $tables = array(
        'user',
        'cur',
        'old',
        'links',
        'brokenlinks',
        'imagelinks',
        'categorylinks',
        'linkscc',
        'site_stats',
        'hitcounter',
        'ipblocks',
        'image',
        'oldimage',
        'recentchanges',
        'watchlist',
        'math',
        'searchindex',
        'interwiki',
        'querycache',
        'objectcache',
    );
    return $tables;
}
324
325 /**
326 * Set up a temporary set of wiki tables to work with for the tests.
327 * Currently this will only be done once per run, and any changes to
328 * the db will be visible to later tests in the run.
329 *
330 * @access private
331 */
function setupDatabase() {
    # The temporary tables are only created once per run.
    static $setupDB = false;
    global $wgDBprefix;

    # Make sure we don't mess with the live DB
    if (!$setupDB && $wgDBprefix === 'parsertest') {
        $db =& wfGetDB( DB_MASTER );

        $tables = $this->listTables();

        # Compare version numbers component by component. A plain string
        # comparison sorts "10.0" before "4.1" and would send newer
        # servers down the legacy branch.
        $isOldMysql = version_compare( $db->getServerVersion(), '4.1', '<' )
            && stristr( $db->getSoftwareLink(), 'MySQL' );

        if (!$isOldMysql) {
            # Database that supports CREATE TABLE ... LIKE
            global $wgDBtype;
            if( $wgDBtype == 'PostgreSQL' ) {
                $def = 'INCLUDING DEFAULTS';
            } else {
                $def = '';
            }
            foreach ($tables as $tbl) {
                # New name under the test prefix; old name as recorded by
                # setupGlobals() before the prefix was switched.
                $newTableName = $db->tableName( $tbl );
                $tableName = $this->oldTableNames[$tbl];
                $db->query("CREATE TEMPORARY TABLE $newTableName (LIKE $tableName $def)");
            }
        } else {
            # Hack for MySQL versions < 4.1, which don't support
            # "CREATE TABLE ... LIKE". Note that
            # "CREATE TEMPORARY TABLE ... SELECT * FROM ... LIMIT 0"
            # would not create the indexes we need....
            foreach ($tables as $tbl) {
                $res = $db->query("SHOW CREATE TABLE {$this->oldTableNames[$tbl]}");
                $row = $db->fetchRow($res);
                $create = $row[1];
                # Rewrite the statement so it creates a temporary table
                # under the test prefix instead.
                $create_tmp = preg_replace('/CREATE TABLE `(.*?)`/', 'CREATE TEMPORARY TABLE `'
                    . $wgDBprefix . $tbl .'`', $create);
                if ($create === $create_tmp) {
                    # Couldn't do replacement
                    die("could not create temporary table $tbl");
                }
                $db->query($create_tmp);
            }

        }

        # Hack: insert a few Wikipedia in-project interwiki prefixes,
        # for testing inter-language links
        $db->insert( 'interwiki', array(
            array( 'iw_prefix' => 'Wikipedia',
                   'iw_url' => 'http://en.wikipedia.org/wiki/$1',
                   'iw_local' => 0 ),
            array( 'iw_prefix' => 'MeatBall',
                   'iw_url' => 'http://www.usemod.com/cgi-bin/mb.pl?$1',
                   'iw_local' => 0 ),
            array( 'iw_prefix' => 'zh',
                   'iw_url' => 'http://zh.wikipedia.org/wiki/$1',
                   'iw_local' => 1 ),
            array( 'iw_prefix' => 'es',
                   'iw_url' => 'http://es.wikipedia.org/wiki/$1',
                   'iw_local' => 1 ),
            array( 'iw_prefix' => 'fr',
                   'iw_url' => 'http://fr.wikipedia.org/wiki/$1',
                   'iw_local' => 1 ),
            array( 'iw_prefix' => 'ru',
                   'iw_url' => 'http://ru.wikipedia.org/wiki/$1',
                   'iw_local' => 1 ),
            ) );


        $setupDB = true;
    }
}
402
403 /**
404 * Create a dummy uploads directory which will contain a couple
405 * of files in order to pass existence tests.
406 * @return string The directory
407 * @access private
408 */
function setupUploadDir() {
    $dir = "/tmp/mwParser-" . mt_rand() . "-images";

    # Create the nested directories one level at a time and stop with a
    # clear message on failure, rather than carrying on and writing to a
    # path that does not exist.
    foreach( array( $dir, $dir . '/3', $dir . '/3/3a' ) as $subdir ) {
        if( !mkdir( $subdir ) ) {
            die( "Couldn't create directory $subdir\n" );
        }
    }

    # A small placeholder so that Foobar.jpg exists on disk.
    $f = fopen( $dir . '/3/3a/Foobar.jpg', 'wb' );
    if( !$f ) {
        die( "Couldn't create $dir/3/3a/Foobar.jpg\n" );
    }
    fwrite( $f, 'Dummy file' );
    fclose( $f );
    return $dir;
}
419
420 /**
421 * Restore default values and perform any necessary clean-up
422 * after each test runs.
423 *
424 * @access private
425 */
function teardownGlobals() {
    # Put back every global that setupGlobals() replaced.
    foreach( array_keys( $this->savedGlobals ) as $name ) {
        $GLOBALS[$name] = $this->savedGlobals[$name];
    }

    # Nothing more to do unless a dummy upload directory exists.
    if( !isset( $this->uploadDir ) ) {
        return;
    }
    $this->teardownUploadDir( $this->uploadDir );
    unset( $this->uploadDir );
}
435
436 /**
437 * Remove the dummy uploads directory
438 * @access private
439 */
function teardownUploadDir( $dir ) {
    # The dummy image and its two directory levels are always present.
    unlink( $dir . '/3/3a/Foobar.jpg' );
    foreach( array( '/3/3a', '/3' ) as $sub ) {
        rmdir( $dir . $sub );
    }

    # The thumb directories may not exist, so failures here are silenced.
    foreach( array( '/thumb/3/39', '/thumb/3', '/thumb' ) as $sub ) {
        @rmdir( $dir . $sub );
    }

    rmdir( "$dir" );
}
449
450 /**
451 * "Running test $desc..."
452 * @access private
453 */
function showTesting( $desc ) {
    # No newline: the PASSED / FAILED! verdict is printed on the same line.
    echo 'Running test ' . $desc . '... ';
}
457
458 /**
459 * Print a happy success message.
460 *
461 * @param string $desc The test name
462 * @return bool
463 * @access private
464 */
function showSuccess( $desc ) {
    # Quiet mode prints nothing at all for a passing test.
    if( $this->quiet ) {
        return true;
    }
    echo $this->termColor( '1;32' ), 'PASSED', $this->termReset(), "\n";
    return true;
}
471
472 /**
473 * Print a failure message and provide some explanatory output
474 * about what went wrong if so configured.
475 *
476 * @param string $desc The test name
477 * @param string $result Expected HTML output
478 * @param string $html Actual HTML output
479 * @return bool
480 * @access private
481 */
function showFailure( $desc, $result, $html ) {
    # Quiet mode skipped the "Running test" line before the test ran, in
    # case it passed; print it now so the failure is labelled.
    if( $this->quiet ) {
        $this->showTesting( $desc );
    }

    $verdict = $this->termColor( '1;31' ) . 'FAILED!' . $this->termReset() . "\n";
    echo $verdict;

    # Show expected vs. actual unless diffs were switched off.
    if( $this->showDiffs ) {
        echo $this->quickDiff( $result, $html );
    }
    return false;
}
494
495 /**
496 * Run given strings through a diff and return the (colorized) output.
497 * Requires writable /tmp directory and a 'diff' command in the PATH.
498 *
499 * @param string $input
500 * @param string $output
501 * @return string
502 * @access private
503 */
function quickDiff( $input, $output ) {
    # Both texts go into scratch files sharing one random prefix.
    $prefix = "/tmp/mwParser-" . mt_rand();
    $infile = "$prefix-expected";
    $outfile = "$prefix-actual";

    $this->dumpToFile( $input, $infile );
    $this->dumpToFile( $output, $outfile );

    # Same as the backtick operator: run diff and capture its output.
    $diff = shell_exec( "diff -au $infile $outfile" );

    # The scratch files are no longer needed once diff has run.
    unlink( $infile );
    unlink( $outfile );

    return $this->colorDiff( $diff );
}
519
520 /**
521 * Write the given string to a file, adding a final newline.
522 *
523 * @param string $data
524 * @param string $filename
525 * @access private
526 */
function dumpToFile( $data, $filename ) {
    $file = fopen( $filename, "wt" );
    if( !$file ) {
        # Stop with a clear message instead of handing a failed handle
        # to fwrite() and fclose().
        die( "Couldn't write to $filename\n" );
    }
    # A final newline is always appended to the data.
    fwrite( $file, $data . "\n" );
    fclose( $file );
}
532
533 /**
534 * Return ANSI terminal escape code for changing text attribs/color,
535 * or empty string if color output is disabled.
536 *
537 * @param string $color Semicolon-separated list of attribute/color codes
538 * @return string
539 * @access private
540 */
function termColor( $color ) {
    # No escape codes at all when color output is off.
    if( !$this->color ) {
        return '';
    }
    # Light mode prepends the "1;" attribute to the requested codes.
    $attribs = $this->lightcolor ? "1;{$color}" : "{$color}";
    return "\x1b[" . $attribs . "m";
}
548
549 /**
550 * Return ANSI terminal escape code for restoring default text attributes,
551 * or empty string if color output is disabled.
552 *
553 * @return string
554 * @access private
555 */
function termReset() {
    # Only emit the reset sequence when color output is on.
    if( $this->color ) {
        return "\x1b[0m";
    }
    return '';
}
559
560 /**
561 * Colorize unified diff output if set for ANSI color output.
562 * Subtractions are colored blue, additions red.
563 *
564 * @param string $text
565 * @return string
566 * @access private
567 */
function colorDiff( $text ) {
    $reset = $this->termReset();

    # Whole lines starting with "-" (removed) or "+" (added).
    $patterns = array(
        '/^(-.*)$/m',
        '/^(\+.*)$/m',
    );
    # Wrap each matched line in its color code (34 / 31) and a reset.
    $replacements = array(
        $this->termColor( 34 ) . '$1' . $reset,
        $this->termColor( 31 ) . '$1' . $reset,
    );

    return preg_replace( $patterns, $replacements, $text );
}
575
576 /**
577 * Insert a temporary test article
578 * @param string $name the title, including any prefix
579 * @param string $text the article text
580 * @param int $line the input line number, for reporting errors
581 * @static
582 * @access private
583 */
function addArticle($name, $text, $line) {
    # The article is inserted inside the same global environment that the
    # tests themselves run in.
    $this->setupGlobals();

    $title = Title::newFromText( $name );
    if ( $title === null ) {
        die( "invalid title at line $line\n" );
    }

    # A non-zero article ID means the title is already taken.
    if ( $title->getArticleID( GAID_FOR_UPDATE ) != 0 ) {
        die( "duplicate article at line $line\n" );
    }

    $article = new Article($title);
    $article->insertNewArticle($text, '', false, false );

    $this->teardownGlobals();
}
600
/**
 * Run the "tidy" command on text if the $wgUseTidy
 * global is true
 *
 * @param string $text the text to tidy
 * @return string
 * @static
 * @access private
 */
function tidy( $text ) {
    global $wgUseTidy;
    # Pass the text through unchanged unless tidying is switched on.
    return $wgUseTidy ? Parser::tidy($text) : $text;
}
617 }
618
# --help: print the usage summary and stop before any test is run.
if( isset( $options['help'] ) ) {
    $usage = <<<END
MediaWiki $wgVersion parser test suite
Usage: php parserTests.php [--quick] [--quiet] [--color[=(yes|no|light)]]
[--regex <expression>] [--help]
Options:
--quick Suppress diff output of failed tests
--quiet Suppress notification of passed tests (shows only failed tests)
--color Override terminal detection and force color output on or off
'light' option is similar to 'yes' but with color for dark backgrounds
--regex Only run tests whose descriptions which match given regex
--help Show this help message


END;
    print $usage;
    exit( 0 );
}
636
# By convention the parser never refers to $wgTitle directly and uses the
# title passed to it instead; the global is set to a title whose name
# says so.
$wgTitle = Title::newFromText( 'Parser test script do not use' );
$tester =& new ParserTest();

# Note: the command line setup changes the current working directory
# to the parent, hence the "maintenance/" prefix on the file name.
$ok = $tester->runTestsFromFile( 'maintenance/parserTests.txt' );

# Exit status 0 when every test passed, -1 otherwise.
if( $ok ) {
    exit( 0 );
}
exit( -1 );
648
649 ?>