From: Brion Vibber Date: Thu, 7 Oct 2004 03:40:06 +0000 (+0000) Subject: Fetch test data for the benchmark X-Git-Tag: 1.5.0alpha1~1639 X-Git-Url: http://git.cyclocoop.org/%7B%24www_url%7Dadmin/membres/fiche.php?a=commitdiff_plain;h=bcd1e9e844f55a4ffa13f9068edc539818bbcc4b;p=lhc%2Fweb%2Fwiklou.git Fetch test data for the benchmark --- diff --git a/includes/normal/Makefile b/includes/normal/Makefile index 04435604b7..0cb5da814d 100644 --- a/includes/normal/Makefile +++ b/includes/normal/Makefile @@ -15,7 +15,7 @@ test : testutf8 UtfNormalTest.php UtfNormalData.inc NormalizationTest.txt testutf8 : Utf8Test.php UTF-8-test.txt $(PHP) Utf8Test.php -bench : UtfNormalData.inc +bench : UtfNormalData.inc testdata/washington.txt testdata/berlin.txt testdata/tokyo.txt testdata/sociology.txt $(PHP) UtfNormalBench.php clean : @@ -42,3 +42,15 @@ UnicodeData.txt : UTF-8-test.txt : $(FETCH) http://www.cl.cam.ac.uk/~mgk25/ucs/examples/UTF-8-test.txt + +testdata/berlin.txt : + mkdir -p testdata && wget -U MediaWiki/test -O testdata/berlin.txt "http://de.wikipedia.org/w/wiki.phtml?title=Berlin&oldid=2775712&action=raw" + +testdata/washington.txt : + mkdir -p testdata && wget -U MediaWiki/test -O testdata/washington.txt "http://en.wikipedia.org/w/wiki.phtml?title=Washington%2C_DC&oldid=6370218&action=raw" + +testdata/tokyo.txt : + mkdir -p testdata && wget -U MediaWiki/test -O testdata/tokyo.txt "http://ja.wikipedia.org/w/wiki.phtml?title=%E6%9D%B1%E4%BA%AC&oldid=823926&action=raw" + +testdata/sociology.txt : + mkdir -p testdata && wget -U MediaWiki/test -O testdata/sociology.txt "http://ko.wikipedia.org/w/wiki.phtml?title=%EC%82%AC%ED%9A%8C%ED%95%99&oldid=16409&action=raw" diff --git a/includes/normal/UtfNormalBench.php b/includes/normal/UtfNormalBench.php index c37fb46928..2e1740c22b 100644 --- a/includes/normal/UtfNormalBench.php +++ b/includes/normal/UtfNormalBench.php @@ -36,7 +36,7 @@ $testfiles = array( 'testdata/washington.txt' => 'English text', 'testdata/berlin.txt' => 'German text', 'testdata/tokyo.txt' => 'Japanese text', - 'testdata/byzantium.txt' => 'Korean text' + 'testdata/sociology.txt' => 'Korean text' ); $normalizer = new UtfNormal; foreach( $testfiles as $file => $desc ) {