Workaround for bug 28146: running out of memory during Unicode validation/normalization...

author Brion Vibber <brion@users.mediawiki.org>

Mon, 4 Apr 2011 20:59:04 +0000 (20:59 +0000)

committer Brion Vibber <brion@users.mediawiki.org>

Mon, 4 Apr 2011 20:59:04 +0000 (20:59 +0000)
author Brion Vibber <brion@users.mediawiki.org>
Mon, 4 Apr 2011 20:59:04 +0000 (20:59 +0000)
committer Brion Vibber <brion@users.mediawiki.org>
Mon, 4 Apr 2011 20:59:04 +0000 (20:59 +0000)
diff --git a/includes/DjVuImage.php b/includes/DjVuImage.php

index 7a8b5e4..f2effcb 100644 (file)
--- a/includes/DjVuImage.php
+++ b/includes/DjVuImage.php
@@ -254,8 +254,7 @@ class DjVuImage {
                         $txt = wfShellExec( $cmd, $retval );
                         wfProfileOut( 'djvutxt' );
                         if( $retval == 0) {
-                               # Get rid of invalid UTF-8, strip control characters
-                               $txt = UtfNormal::cleanUp( $txt );
+                               # Strip some control characters
                                 $txt = preg_replace( "/[\013\035\037]/", "", $txt );
                                 $reg = <<<EOR
                                         /\(page\s[\d-]*\s[\d-]*\s[\d-]*\s[\d-]*\s*"
@@ -279,7 +278,8 @@ EOR;
         }
  
         function pageTextCallback( $matches ) {
-               return '<PAGE value="' . htmlspecialchars( $matches[1] ) . '" />';
+               # Get rid of invalid UTF-8, strip control characters
+               return '<PAGE value="' . htmlspecialchars( UtfNormal::cleanUp( $matches[1] ) ) . '" />';
         }
  
         /**
author	Brion Vibber <brion@users.mediawiki.org>
	Mon, 4 Apr 2011 20:59:04 +0000 (20:59 +0000)
committer	Brion Vibber <brion@users.mediawiki.org>
	Mon, 4 Apr 2011 20:59:04 +0000 (20:59 +0000)