Revert r85288 (magic accessors for RequestContext); much more trouble than they're...

[lhc/web/wiklou.git] / includes / parser / Parser.php
diff --git a/includes/parser/Parser.php b/includes/parser/Parser.php

index 99df3d4..76974c9 100644 (file)
--- a/includes/parser/Parser.php
+++ b/includes/parser/Parser.php
@@ -34,10 +34,10 @@
   * Globals used:
   *    objects:   $wgLang, $wgContLang
   *
- * NOT $wgArticle, $wgUser or $wgTitle. Keep them away!
+ * NOT $wgUser or $wgTitle. Keep them away!
   *
   * settings:
- *  $wgUseTex*, $wgUseDynamicDates*, $wgInterwikiMagic*,
+ *  $wgUseDynamicDates*, $wgInterwikiMagic*,
   *  $wgNamespacesWithSubpages, $wgAllowExternalImages*,
   *  $wgLocaltimezone, $wgAllowSpecialInclusion*,
   *  $wgMaxArticleSize*
@@ -53,7 +53,13 @@ class Parser {
          * changes in an incompatible way, so the parser cache
          * can automatically discard old data.
          */
-       const VERSION = '1.6.4';
+       const VERSION = '1.6.5';
+
+       /**
+        * Update this version number when the output of serialiseHalfParsedText()
+        * changes in an incompatible way
+        */
+       const HALF_PARSED_VERSION = 2;
  
         # Flags for Parser::setFunctionHook
         # Also available as global constants from Defines.php
@@ -103,44 +109,87 @@ class Parser {
         var $mImageParamsMagicArray = array();
         var $mMarkerIndex = 0;
         var $mFirstCall = true;
-       var $mVariables, $mSubstWords; # Initialised by initialiseVariables()
-       var $mConf, $mPreprocessor, $mExtLinkBracketedRegex, $mUrlProtocols; # Initialised in constructor
  
+       # Initialised by initialiseVariables()
+
+       /**
+        * @var MagicWordArray
+        */
+       var $mVariables;
+
+       /**
+        * @var MagicWordArray
+        */
+       var $mSubstWords;
+       var $mConf, $mPreprocessor, $mExtLinkBracketedRegex, $mUrlProtocols; # Initialised in constructor
  
         # Cleared with clearState():
-       var $mOutput, $mAutonumber, $mDTopen, $mStripState;
+       /**
+        * @var ParserOutput
+        */
+       var $mOutput;
+       var $mAutonumber, $mDTopen;
+
+       /**
+        * @var StripState
+        */
+       var $mStripState;
+
         var $mIncludeCount, $mArgStack, $mLastSection, $mInPre;
-       var $mLinkHolders, $mLinkID;
+       /**
+        * @var LinkHolderArray
+        */
+       var $mLinkHolders;
+
+       var $mLinkID;
         var $mIncludeSizes, $mPPNodeCount, $mDefaultSort;
         var $mTplExpandCache; # empty-frame expansion cache
         var $mTplRedirCache, $mTplDomCache, $mHeadings, $mDoubleUnderscores;
         var $mExpensiveFunctionCount; # number of expensive parser function calls
+
+       /**
+        * @var User
+        */
         var $mUser; # User object; only used when doing pre-save transform
  
         # Temporary
         # These are variables reset at least once per parse regardless of $clearState
-       var $mOptions;      # ParserOptions object
+
+       /**
+        * @var ParserOptions
+        */
+       var $mOptions;
+
+       /**
+        * @var Title
+        */
         var $mTitle;        # Title context, used for self-link rendering and similar things
         var $mOutputType;   # Output type, one of the OT_xxx constants
         var $ot;            # Shortcut alias, see setOutputType()
         var $mRevisionObject; # The revision object of the specified revision ID
         var $mRevisionId;   # ID to display in {{REVISIONID}} tags
         var $mRevisionTimestamp; # The timestamp of the specified revision ID
-       var $mRevisionUser; # Userto display in {{REVISIONUSER}} tag
+       var $mRevisionUser; # User to display in {{REVISIONUSER}} tag
         var $mRevIdForTs;   # The revision ID which was used to fetch the timestamp
  
+       /**
+        * @var string
+        */
+       var $mUniqPrefix;
+
         /**
          * Constructor
-        *
-        * @public
          */
-       function __construct( $conf = array() ) {
+       public function __construct( $conf = array() ) {
                 $this->mConf = $conf;
                 $this->mUrlProtocols = wfUrlProtocols();
                 $this->mExtLinkBracketedRegex = '/\[(\b(' . wfUrlProtocols() . ')'.
                         '[^][<>"\\x00-\\x20\\x7F]+) *([^\]\\x00-\\x08\\x0a-\\x1F]*?)\]/S';
                 if ( isset( $conf['preprocessorClass'] ) ) {
                         $this->mPreprocessorClass = $conf['preprocessorClass'];
+               } elseif ( defined( 'MW_COMPILED' ) ) {
+                       # Preprocessor_Hash is much faster than Preprocessor_DOM in compiled mode
+                       $this->mPreprocessorClass = 'Preprocessor_Hash';
                 } elseif ( extension_loaded( 'domxml' ) ) {
                         # PECL extension that conflicts with the core DOM extension (bug 13770)
                         wfDebug( "Warning: you have the obsolete domxml extension for PHP. Please remove it!\n" );
@@ -150,6 +199,7 @@ class Parser {
                 } else {
                         $this->mPreprocessorClass = 'Preprocessor_Hash';
                 }
+               wfDebug( __CLASS__ . ": using preprocessor: {$this->mPreprocessorClass}\n" );
         }
  
         /**
@@ -157,7 +207,7 @@ class Parser {
          */
         function __destruct() {
                 if ( isset( $this->mLinkHolders ) ) {
-                       $this->mLinkHolders->__destruct();
+                       unset( $this->mLinkHolders );
                 }
                 foreach ( $this as $name => $value ) {
                         unset( $this->$name );
@@ -199,7 +249,6 @@ class Parser {
                 $this->mLastSection = '';
                 $this->mDTopen = false;
                 $this->mIncludeCount = array();
-               $this->mStripState = new StripState;
                 $this->mArgStack = false;
                 $this->mInPre = false;
                 $this->mLinkHolders = new LinkHolderArray( $this );
@@ -222,6 +271,7 @@ class Parser {
                 # $this->mUniqPrefix = "\x07UNIQ" . Parser::getRandomString();
                 # Changed to \x7f to allow XML double-parsing -- TS
                 $this->mUniqPrefix = "\x7fUNIQ" . self::getRandomString();
+               $this->mStripState = new StripState( $this->mUniqPrefix );
  
  
                 # Clear these on every parse, bug 4549
@@ -253,7 +303,7 @@ class Parser {
          * Do not call this function recursively.
          *
          * @param $text String: text we want to parse
-        * @param $title A title object
+        * @param $title Title object
          * @param $options ParserOptions
          * @param $linestart boolean
          * @param $clearState boolean
@@ -271,12 +321,7 @@ class Parser {
                 wfProfileIn( __METHOD__ );
                 wfProfileIn( $fname );
  
-               $this->mOptions = $options;
-               if ( $clearState ) {
-                       $this->clearState();
-               }
-
-               $this->setTitle( $title ); # Page title has to be set for the pre-processor
+               $this->startParse( $title, $options, self::OT_HTML, $clearState );
  
                 $oldRevisionId = $this->mRevisionId;
                 $oldRevisionObject = $this->mRevisionObject;
@@ -288,7 +333,7 @@ class Parser {
                         $this->mRevisionTimestamp = null;
                         $this->mRevisionUser = null;
                 }
-               $this->setOutputType( self::OT_HTML );
+
                 wfRunHooks( 'ParserBeforeStrip', array( &$this, &$text, &$this->mStripState ) );
                 # No more strip!
                 wfRunHooks( 'ParserAfterStrip', array( &$this, &$text, &$this->mStripState ) );
@@ -330,8 +375,8 @@ class Parser {
  
                 /**
                  * A converted title will be provided in the output object if title and
-                * content conversion are enabled, the article text does not contain 
-                * a conversion-suppressing double-underscore tag, and no 
+                * content conversion are enabled, the article text does not contain
+                * a conversion-suppressing double-underscore tag, and no
                  * {{DISPLAYTITLE:...}} is present. DISPLAYTITLE takes precedence over
                  * automatic link conversion.
                  */
@@ -354,23 +399,7 @@ class Parser {
  
                 wfRunHooks( 'ParserBeforeTidy', array( &$this, &$text ) );
  
-//!JF Move to its own function
-
-               $uniq_prefix = $this->mUniqPrefix;
-               $matches = array();
-               $elements = array_keys( $this->mTransparentTagHooks );
-               $text = $this->extractTagsAndParams( $elements, $text, $matches, $uniq_prefix );
-
-               foreach ( $matches as $marker => $data ) {
-                       list( $element, $content, $params, $tag ) = $data;
-                       $tagName = strtolower( $element );
-                       if ( isset( $this->mTransparentTagHooks[$tagName] ) ) {
-                               $output = call_user_func_array( $this->mTransparentTagHooks[$tagName], array( $content, $params, $this ) );
-                       } else {
-                               $output = $tag;
-                       }
-                       $this->mStripState->general->setPair( $marker, $output );
-               }
+               $text = $this->replaceTransparentTags( $text );
                 $text = $this->mStripState->unstripGeneral( $text );
  
                 $text = Sanitizer::normalizeCharReferences( $text );
@@ -444,6 +473,8 @@ class Parser {
          *
          * @param $text String: text extension wants to have parsed
          * @param $frame PPFrame: The frame to use for expanding any template variables
+        *
+        * @return string
          */
         function recursiveTagParse( $text, $frame=false ) {
                 wfProfileIn( __METHOD__ );
@@ -458,12 +489,9 @@ class Parser {
          * Expand templates and variables in the text, producing valid, static wikitext.
          * Also removes comments.
          */
-       function preprocess( $text, $title, $options, $revid = null ) {
+       function preprocess( $text, Title $title, ParserOptions $options, $revid = null ) {
                 wfProfileIn( __METHOD__ );
-               $this->mOptions = $options;
-               $this->clearState();
-               $this->setOutputType( self::OT_PREPROCESS );
-               $this->setTitle( $title );
+               $this->startParse( $title, $options, self::OT_PREPROCESS, true );
                 if ( $revid !== null ) {
                         $this->mRevisionId = $revid;
                 }
@@ -481,25 +509,23 @@ class Parser {
          * <noinclude>, <includeonly> etc. are parsed as for template transclusion,
          * comments, templates, arguments, tags hooks and parser functions are untouched.
          */
-       public function getPreloadText( $text, $title, $options ) {
+       public function getPreloadText( $text, Title $title, ParserOptions $options ) {
                 # Parser (re)initialisation
-               $this->mOptions = $options;
-               $this->clearState();
-               $this->setOutputType( self::OT_PLAIN );
-               $this->setTitle( $title );
+               $this->startParse( $title, $options, self::OT_PLAIN, true );
  
                 $flags = PPFrame::NO_ARGS | PPFrame::NO_TEMPLATES;
                 $dom = $this->preprocessToDom( $text, self::PTD_FOR_INCLUSION );
-               return $this->getPreprocessor()->newFrame()->expand( $dom, $flags );
+               $text = $this->getPreprocessor()->newFrame()->expand( $dom, $flags );
+               $text = $this->mStripState->unstripBoth( $text );
+               return $text;
         }
  
         /**
          * Get a random string
          *
-        * @private
-        * @static
+        * @return string
          */
-       static private function getRandomString() {
+       static public function getRandomString() {
                 return dechex( mt_rand( 0, 0x7fffffff ) ) . dechex( mt_rand( 0, 0x7fffffff ) );
         }
  
@@ -520,7 +546,7 @@ class Parser {
          */
         public function uniqPrefix() {
                 if ( !isset( $this->mUniqPrefix ) ) {
-                       # @todo Fixme: this is probably *horribly wrong*
+                       # @todo FIXME: This is probably *horribly wrong*
                         # LanguageConverter seems to want $wgParser's uniqPrefix, however
                         # if this is called for a parser cache hit, the parser may not
                         # have ever been initialized in the first place.
@@ -533,6 +559,8 @@ class Parser {
  
         /**
          * Set the context title
+        *
+        * @param $t Title
          */
         function setTitle( $t ) {
                 if ( !$t || $t instanceof FakeTitle ) {
@@ -621,10 +649,23 @@ class Parser {
                 return wfSetVar( $this->mOptions, $x );
         }
  
+       /**
+        * @return int
+        */
         function nextLinkID() {
                 return $this->mLinkID++;
         }
  
+       /**
+        * @param $id int
+        */
+       function setLinkID( $id ) {
+               $this->mLinkID = $id;
+       }
+
+       /**
+        * @return Language
+        */
         function getFunctionLang() {
                 global $wgLang, $wgContLang;
  
@@ -632,7 +673,7 @@ class Parser {
                 if ( $target !== null ) {
                         return $target;
                 } else {
-                       return $this->mOptions->getInterfaceMessage() ? $wgLang : $wgContLang;
+                       return $this->mOptions->getInterfaceMessage() ? $wgLang : $this->mTitle->getPageLanguage();
                 }
         }
  
@@ -673,15 +714,13 @@ class Parser {
          *     array( 'param' => 'x' ),
          *     '<element param="x">tag content</element>' ) )
          *
-        * @param $elements list of element names. Comments are always extracted.
-        * @param $text Source text string.
-        * @param $matches Out parameter, Array: extracted tags
-        * @param $uniq_prefix
+        * @param $elements array list of element names. Comments are always extracted.
+        * @param $text string Source text string.
+        * @param $matches array Out parameter, Array: extracted tags
+        * @param $uniq_prefix string
          * @return String: stripped text
-        *
-        * @static
          */
-       public function extractTagsAndParams( $elements, $text, &$matches, $uniq_prefix = '' ) {
+       public static function extractTagsAndParams( $elements, $text, &$matches, $uniq_prefix = '' ) {
                 static $n = 1;
                 $stripped = '';
                 $matches = array();
@@ -745,69 +784,25 @@ class Parser {
  
         /**
          * Get a list of strippable XML-like elements
+        *
+        * @return array
          */
         function getStripList() {
                 return $this->mStripList;
         }
  
-       /**
-        * @deprecated use replaceVariables
-        */
-       function strip( $text, $state, $stripcomments = false , $dontstrip = array() ) {
-               return $text;
-       }
-
-       /**
-        * Restores pre, math, and other extensions removed by strip()
-        *
-        * always call unstripNoWiki() after this one
-        * @private
-        * @deprecated use $this->mStripState->unstrip()
-        */
-       function unstrip( $text, $state ) {
-               return $state->unstripGeneral( $text );
-       }
-
-       /**
-        * Always call this after unstrip() to preserve the order
-        *
-        * @private
-        * @deprecated use $this->mStripState->unstrip()
-        */
-       function unstripNoWiki( $text, $state ) {
-               return $state->unstripNoWiki( $text );
-       }
-
-       /**
-        * @deprecated use $this->mStripState->unstripBoth()
-        */
-       function unstripForHTML( $text ) {
-               return $this->mStripState->unstripBoth( $text );
-       }
-
         /**
          * Add an item to the strip state
          * Returns the unique tag which must be inserted into the stripped text
          * The tag will be replaced with the original text in unstrip()
-        *
-        * @private
          */
         function insertStripItem( $text ) {
                 $rnd = "{$this->mUniqPrefix}-item-{$this->mMarkerIndex}-" . self::MARKER_SUFFIX;
                 $this->mMarkerIndex++;
-               $this->mStripState->general->setPair( $rnd, $text );
+               $this->mStripState->addGeneral( $rnd, $text );
                 return $rnd;
         }
  
-       /**
-        * Interface with html tidy
-        * @deprecated Use MWTidy::tidy()
-        */
-       public static function tidy( $text ) {
-               wfDeprecated( __METHOD__ );
-               return MWTidy::tidy( $text );
-       }
-
         /**
          * parse the wiki syntax used to render tables
          *
@@ -818,225 +813,300 @@ class Parser {
  
                 $lines = StringUtils::explode( "\n", $text );
                 $out = '';
-               $td_history = array(); # Is currently a td tag open?
-               $last_tag_history = array(); # Save history of last lag activated (td, th or caption)
-               $tr_history = array(); # Is currently a tr tag open?
-               $tr_attributes = array(); # history of tr attributes
-               $has_opened_tr = array(); # Did this table open a <tr> element?
-               $indent_level = 0; # indent level of the table
-
-               # Keep pulling lines off the front of the array until they're all gone.
-               # we want to be able to push lines back on to the front of the stream,
-               # but StringUtils::explode() returns funky optimised Iterators which don't
-               # support insertion.  So maintain a separate buffer and draw on that first if
-               # there's anything in it
-               $extraLines = array();
-               $lines->rewind();
-               do {
-                       if( $extraLines ){
-                               $outLine = array_shift( $extraLines );
-                       } elseif( $lines->valid() ) {
-                               $outLine = $lines->current();
-                               $lines->next();
-                       } else {
-                               break;
-                       }
+               $output =& $out;
+
+               foreach ( $lines as $outLine ) {
                         $line = trim( $outLine );
  
-                       if ( $line === '' ) { # empty line, go to next line
-                               $out .= $outLine."\n";
+                       # empty line, go to next line,
+                       # but only append \n if outside of table
+                       if ( $line === '') {
+                               $output .= $outLine . "\n";
                                 continue;
                         }
-
-                       $first_character = $line[0];
+                       $firstChars = $line[0];
+                       if ( strlen( $line ) > 1 ) {
+                               $firstChars .= in_array( $line[1], array( '}', '+', '-' ) ) ? $line[1] : '';
+                       }
                         $matches = array();
  
-                       if ( preg_match( '/^(:*)\{\|(.*)$/', $line , $matches ) ) {
-                               # First check if we are starting a new table
-                               $indent_level = strlen( $matches[1] );
+                       if ( preg_match( '/^(:*)\s*\{\|(.*)$/', $line , $matches ) ) {
+                               $tables[] = array();
+                               $table =& $this->last( $tables );
+                               $table[0] = array(); // first row
+                               $currentRow =& $table[0];
+                               $table['indent'] = strlen( $matches[1] );
  
                                 $attributes = $this->mStripState->unstripBoth( $matches[2] );
                                 $attributes = Sanitizer::fixTagAttributes( $attributes , 'table' );
  
-                               $outLine = str_repeat( '<dl><dd>' , $indent_level ) . "<table{$attributes}>";
-                               array_push( $td_history , false );
-                               array_push( $last_tag_history , '' );
-                               array_push( $tr_history , false );
-                               array_push( $tr_attributes , '' );
-                               array_push( $has_opened_tr , false );
-                       } elseif ( count( $td_history ) == 0 ) {
-                               # Don't do any of the following
-                               $out .= $outLine."\n";
-                               continue;
-                       } elseif ( substr( $line , 0 , 2 ) === '|}' ) {
-                               # We are ending a table
-                               $line = '</table>' . substr( $line , 2 );
-                               $last_tag = array_pop( $last_tag_history );
+                               if ( $attributes !== '' ) {
+                                       $table['attributes'] = $attributes;
+                               }
+                       } elseif ( !isset( $tables[0] ) ) {
+                               // we're outside the table
+
+                               $out .= $outLine . "\n";
+                       } elseif ( $firstChars === '|}' ) {
+                               // trim the |} code from the line
+                               $line = substr ( $line , 2 );
+
+                               // Shorthand for last row
+                               $lastRow =& $this->last( $table );
+
+                               // a thead at the end becomes a tfoot, unless there is only one row
+                               // Do this before deleting empty last lines to allow headers at the bottom of tables
+                               if ( isset( $lastRow['type'] ) && $lastRow['type'] == 'thead' && isset( $table[1] ) ) {
+                                       $lastRow['type'] = 'tfoot';
+                                       for ( $i = 0; isset( $lastRow[$i] ); $i++ ) {
+                                               $lastRow[$i]['type'] = 'th';
+                                       }
+                               }
  
-                               if ( !array_pop( $has_opened_tr ) ) {
-                                       $line = "<tr><td></td></tr>{$line}";
+                               // Delete empty last lines
+                               if ( empty( $lastRow ) ) {
+                                       $lastRow = NULL;
                                 }
+                               $o = '';
+                               $curtable = array_pop( $tables );
  
-                               if ( array_pop( $tr_history ) ) {
-                                       $line = "</tr>{$line}";
+                               #Add a line-ending before the table, but only if there isn't one already
+                               if ( substr( $out, -1 ) !== "\n" ) {
+                                       $o .= "\n";
                                 }
+                               $o .= $this->generateTableHTML( $curtable ) . $line . "\n";
+
+                               if ( count( $tables ) > 0 ) {
+                                       $table =& $this->last( $tables );
+                                       $currentRow =& $this->last( $table );
+                                       $currentElement =& $this->last( $currentRow );
  
-                               if ( array_pop( $td_history ) ) {
-                                       $line = "</{$last_tag}>{$line}";
+                                       $output =& $currentElement['content'];
+                               } else {
+                                       $output =& $out;
                                 }
-                               array_pop( $tr_attributes );
-                               $outLine = $line . str_repeat( '</dd></dl>' , $indent_level );
-                       } elseif ( substr( $line , 0 , 2 ) === '|-' ) {
-                               # Now we have a table row
-                               $line = preg_replace( '#^\|-+#', '', $line );
  
-                               # Whats after the tag is now only attributes
+                               $output .= $o;
+
+                       } elseif ( $firstChars === '|-' ) {
+                               // start a new row element
+                               // but only when we haven't started one already
+                               if ( count( $currentRow ) != 0 ) {
+                                       $table[] = array();
+                                       $currentRow =& $this->last( $table );
+                               }
+                               // Get the attributes, there's nothing else useful in $line now
+                               $line = substr ( $line , 2 );
                                 $attributes = $this->mStripState->unstripBoth( $line );
                                 $attributes = Sanitizer::fixTagAttributes( $attributes, 'tr' );
-                               array_pop( $tr_attributes );
-                               array_push( $tr_attributes, $attributes );
-
-                               $line = '';
-                               $last_tag = array_pop( $last_tag_history );
-                               array_pop( $has_opened_tr );
-                               array_push( $has_opened_tr , true );
-
-                               if ( array_pop( $tr_history ) ) {
-                                       $line = '</tr>';
+                               if ( $attributes !== '' ) {
+                                       $currentRow['attributes'] = $attributes;
                                 }
  
-                               if ( array_pop( $td_history ) ) {
-                                       $line = "</{$last_tag}>{$line}";
+                       } elseif ( $firstChars  === '|+' ) {
+                               // a table caption, but only proceed if there isn't one already
+                               if ( !isset ( $table['caption'] ) ) {
+                                       $line = substr ( $line , 2 );
+
+                                       $c = $this->getCellAttr( $line , 'caption' );
+                                       $table['caption'] = array();
+                                       $table['caption']['content'] = $c[0];
+                                       if ( isset( $c[1] ) ) $table['caption']['attributes'] = $c[1];
+                                       unset( $c );
+                                       $output =& $table['caption']['content'];
                                 }
-
-                               $outLine = $line;
-                               array_push( $tr_history , false );
-                               array_push( $td_history , false );
-                               array_push( $last_tag_history , '' );
-                       } elseif ( $first_character === '|' || $first_character === '!' || substr( $line , 0 , 2 )  === '|+' ) {
-                               # This might be cell elements, td, th or captions
-                               if ( substr( $line , 0 , 2 ) === '|+' ) {
-                                       $first_character = '|+';
+                       } elseif ( $firstChars === '|' || $firstChars === '!' || $firstChars === '!+' ) {
+                               // Which kind of cells are we dealing with
+                               $currentTag = 'td';
+                               $line = substr ( $line , 1 );
+
+                               if ( $firstChars === '!'  || $firstChars === '!+' ) {
+                                       $line = str_replace ( '!!' , '||' , $line );
+                                       $currentTag = 'th';
                                 }
  
-                               $line = substr( $line , strlen( $first_character ) );
+                               // Split up multiple cells on the same line.
+                               $cells = StringUtils::explodeMarkup( '||' , $line );
+                               $line = ''; // save memory
  
-                               if ( $first_character === '!' ) {
-                                       $line = str_replace( '!!' , '||' , $line );
+                               // decide whether thead to tbody
+                               if ( !array_key_exists( 'type', $currentRow ) ) {
+                                       $currentRow['type'] = ( $firstChars === '!' ) ? 'thead' : 'tbody' ;
+                               } elseif ( $firstChars === '|' ) {
+                                       $currentRow['type'] = 'tbody';
                                 }
  
-                               # Split up multiple cells on the same line.
-                               # FIXME : This can result in improper nesting of tags processed
-                               # by earlier parser steps, but should avoid splitting up eg
-                               # attribute values containing literal "||".
-                               $cells = StringUtils::explodeMarkup( '||' , $line );
-                               $cell = array_shift( $cells );
-
-                               # Inject cells back into the stream to be dealt with later
-                               # TODO: really we should do the whole thing as a stream...
-                               # but that would be too much like a sensible implementation :P
-                               if( count( $cells ) ){
-                                       foreach( array_reverse( $cells ) as $extraCell ){
-                                               array_unshift( $extraLines, $first_character . $extraCell );
-                                       }
-                               }
+                               // Loop through each table cell
+                               foreach ( $cells as $cell ) {
+                                       // a new cell
+                                       $currentRow[] = array();
+                                       $currentElement =& $this->last( $currentRow );
  
-                               $outLine = '';
+                                       $currentElement['type'] = $currentTag;
  
-                               $previous = '';
-                               if ( $first_character !== '|+' ) {
-                                       $tr_after = array_pop( $tr_attributes );
-                                       if ( !array_pop( $tr_history ) ) {
-                                               $previous = "<tr{$tr_after}>\n";
-                                       }
-                                       array_push( $tr_history , true );
-                                       array_push( $tr_attributes , '' );
-                                       array_pop( $has_opened_tr );
-                                       array_push( $has_opened_tr , true );
+                                       $c = $this->getCellAttr( $cell , $currentTag );
+                                       $currentElement['content'] = $c[0];
+                                       if ( isset( $c[1] ) ) $currentElement['attributes'] = $c[1];
+                                       unset( $c );
                                 }
+                               $output =& $currentElement['content'];
  
-                               $last_tag = array_pop( $last_tag_history );
+                       } else {
+                               $output .= "\n$outLine";
+                       }
+               }
  
-                               if ( array_pop( $td_history ) ) {
-                                       $previous = "</{$last_tag}>\n{$previous}";
-                               }
+               # Remove trailing line-ending (b/c)
+               if ( substr( $out, -1 ) === "\n" ) {
+                       $out = substr( $out, 0, -1 );
+               }
  
-                               if ( $first_character === '|' ) {
-                                       $last_tag = 'td';
-                               } elseif ( $first_character === '!' ) {
-                                       $last_tag = 'th';
-                               } elseif ( $first_character === '|+' ) {
-                                       $last_tag = 'caption';
-                               } else {
-                                       $last_tag = '';
+               # Close any unclosed tables
+               if ( isset( $tables ) && count( $tables ) > 0 ) {
+                       for ( $i = 0; $i < count( $tables ); $i++ ) {
+                               $curtable = array_pop( $tables );
+                               $curtable = $this->generateTableHTML( $curtable );
+                               #Add a line-ending before the table, but only if there isn't one already
+                               if ( substr( $out, -1 ) !== "\n"  && $curtable !== "" ) {
+                                       $out .= "\n";
                                 }
+                               $out .= $curtable;
+                       }
+               }
  
-                               array_push( $last_tag_history , $last_tag );
-
-                               # A cell could contain both parameters and data... but the pipe could
-                               # also be the start of a nested table, or a raw pipe inside an invalid
-                               # link (bug 553).  
-                               $cell_data = preg_split( '/(?<!\{)\|/', $cell, 2 );
-
-                               # Bug 553: a '|' inside an invalid link should not
-                               # be mistaken as delimiting cell parameters
-                               if ( strpos( $cell_data[0], '[[' ) !== false ) {
-                                       $data = $cell;
-                                       $cell = "{$previous}<{$last_tag}>";
-                               } elseif ( count( $cell_data ) == 1 ) {
-                                       $cell = "{$previous}<{$last_tag}>";
-                                       $data = $cell_data[0];
-                               } else {
-                                       $attributes = $this->mStripState->unstripBoth( $cell_data[0] );
-                                       $attributes = Sanitizer::fixTagAttributes( $attributes , $last_tag );
-                                       $cell = "{$previous}<{$last_tag}{$attributes}>";
-                                       $data = $cell_data[1];
-                               }
+               wfProfileOut( __METHOD__ );
  
-                               # Bug 529: the start of a table cell should be a linestart context for
-                               # processing other block markup, including nested tables.  The original
-                               # implementation of this was to add a newline before every brace construct,
-                               # which broke all manner of other things.  Instead, push the contents
-                               # of the cell back into the stream and come back to it later.  But don't
-                               # do that if the first line is empty, or you may get extra whitespace
-                               if( $data ){
-                                       array_unshift( $extraLines, trim( $data ) );
-                               }
+               return $out;
+       }
  
-                               $outLine .= $cell;
-                               array_push( $td_history , true );
-                       }
-                       $out .= $outLine . "\n";
-               } while( $lines->valid() || count( $extraLines ) );
+       /**
+        * Helper function for doTableStuff() separating the contents of cells from
+        * attributes. Particularly useful as there's a possible bug and this action
+        * is repeated twice.
+        *
+        * @private
+        * @param $cell
+        * @param $tagName
+        * @return array
+        */
+       function getCellAttr ( $cell, $tagName ) {
+               $attributes = null;
  
-               # Closing open td, tr && table
-               while ( count( $td_history ) > 0 ) {
-                       if ( array_pop( $td_history ) ) {
-                               $out .= "</td>\n";
+               $cell = trim ( $cell );
+
+               // A cell could contain both parameters and data
+               $cellData = explode ( '|' , $cell , 2 );
+
+               // Bug 553: Note that a '|' inside an invalid link should not
+               // be mistaken as delimiting cell parameters
+               if ( strpos( $cellData[0], '[[' ) !== false ) {
+                       $content = trim ( $cell );
+               }
+               elseif ( count ( $cellData ) == 1 ) {
+                       $content = trim ( $cellData[0] );
+               } else {
+                       $attributes = $this->mStripState->unstripBoth( $cellData[0] );
+                       $attributes = Sanitizer::fixTagAttributes( $attributes , $tagName );
+
+                       $content = trim ( $cellData[1] );
+               }
+               return array( $content, $attributes );
+       }
+
+
+       /**
+        * Helper function for doTableStuff(). This converts the structured array into html.
+        *
+        * @private
+        */
+       function generateTableHTML( &$table ) {
+               $return = "";
+               $return .= str_repeat( '<dl><dd>' , $table['indent'] );
+               $return .= '<table';
+               $return .= isset( $table['attributes'] ) ? $table['attributes'] : '';
+               $return .= '>';
+               unset( $table['attributes'] );
+
+               if ( isset( $table['caption'] ) ) {
+                       $return .= "\n<caption";
+                       $return .= isset( $table['caption']['attributes'] ) ? $table['caption']['attributes'] : '';
+                       $return .= '>';
+                       $return .= $table['caption']['content'];
+                       $return .= "\n</caption>";
+               }
+               $lastSection = '';
+               $empty = true;
+               $simple = true;
+
+               // If we only have tbodies, mark table as simple
+               for ( $i = 0; isset( $table[$i] ); $i++ ) {
+                       if ( !count( $table[$i] ) ) continue;
+                       if ( !isset( $table[$i]['type'] ) ) {
+                               $table[$i]['type'] = 'tbody';
                         }
-                       if ( array_pop( $tr_history ) ) {
-                               $out .= "</tr>\n";
+                       if ( !$lastSection ) {
+                               $lastSection = $table[$i]['type'];
+                       } elseif ( $lastSection != $table[$i]['type'] ) {
+                               $simple = false;
                         }
-                       if ( !array_pop( $has_opened_tr ) ) {
-                               $out .= "<tr><td></td></tr>\n" ;
+               }
+               $lastSection = '';
+               for ( $i = 0; isset( $table[$i] ); $i++ ) {
+                       if ( !count( $table[$i] ) ) continue;
+                       $empty = false; // check for empty tables
+
+                       if ( $table[$i]['type'] != $lastSection && !$simple ) {
+                               $return .= "\n<" . $table[$i]['type'] . '>';
                         }
  
-                       $out .= "</table>\n";
-               }
+                       $return .= "\n<tr";
+                       $return .= isset( $table[$i]['attributes'] ) ? $table[$i]['attributes'] : '';
+                       $return .= '>';
+                       for ( $j = 0; isset( $table[$i][$j] ); $j++ ) {
+                               if ( !isset( $table[$i][$j]['type'] ) ) $table[$i][$j]['type'] = 'td';
+                               $return .= "\n<" . $table[$i][$j]['type'];
+                               $return .= isset( $table[$i][$j]['attributes'] ) ? $table[$i][$j]['attributes'] : '';
+                               $return .= '>';
+
+                               $return .= $table[$i][$j]['content'];
+                               if ( $table[$i][$j]['content'] != '' )
+                                       $return .= "\n";
+
+                               $return .= '</' . $table[$i][$j]['type'] . '>';
+                               unset( $table[$i][$j] );
+                       }
+                       $return .= "\n</tr>";
  
-               # Remove trailing line-ending (b/c)
-               if ( substr( $out, -1 ) === "\n" ) {
-                       $out = substr( $out, 0, -1 );
+                       if ( ( !isset( $table[$i + 1] ) && !$simple ) || ( isset( $table[$i + 1] ) && isset( $table[$i + 1]['type'] ) && $table[$i]['type'] != $table[$i + 1]['type'] ) ) {
+                               $return .= '</' . $table[$i]['type'] . '>';
+                       }
+                       $lastSection = $table[$i]['type'];
+                       unset( $table[$i] );
                 }
-
-               # special case: don't return empty table
-               if ( $out === "<table>\n<tr><td></td></tr>\n</table>" ) {
-                       $out = '';
+               if ( $empty ) {
+                       if ( isset( $table['caption'] ) ) {
+                               $return .= "\n<tr><td></td></tr>";
+                       } else {
+                               return '';
+                       }
                 }
+               $return .= "\n</table>";
+               $return .= str_repeat( '</dd></dl>' , $table['indent'] );
  
-               wfProfileOut( __METHOD__ );
+               return $return;
+       }
  
-               return $out;
+       /**
+        * like end() but only works on the numeric array index and php's internal pointers
+        * returns a reference to the last element of an array much like "\$arr[-1]" in perl
+        * ignores associative elements and will create a 0 key will a NULL value if there were
+        * no numric elements and an array itself if not previously defined.
+        *
+        * @private
+        */
+       function &last ( &$arr ) {
+               for ( $i = count( $arr ); ( !isset( $arr[$i] ) && $i > 0 ); $i-- ) {  }
+               return $arr[$i];
         }
  
         /**
@@ -1132,6 +1202,11 @@ class Parser {
                 return $text;
         }
  
+       /**
+        * @throws MWException
+        * @param $m array
+        * @return HTML|string
+        */
         function magicLinkCallback( $m ) {
                 if ( isset( $m[1] ) && $m[1] !== '' ) {
                         # Skip anchor
@@ -1158,10 +1233,8 @@ class Parser {
                                 throw new MWException( __METHOD__.': unrecognised match type "' .
                                         substr( $m[0], 0, 20 ) . '"' );
                         }
-                       $url = wfMsgForContent( $urlmsg, $id);
-                       $sk = $this->mOptions->getSkin( $this->mTitle );
-                       $la = $sk->getExternalLinkAttributes( "external $CssClass" );
-                       return "<a href=\"{$url}\"{$la}>{$keyword} {$id}</a>";
+                       $url = wfMsgForContent( $urlmsg, $id );
+                       return Linker::makeExternalLink( $url, "{$keyword} {$id}", true, $CssClass );
                 } elseif ( isset( $m[5] ) && $m[5] !== '' ) {
                         # ISBN
                         $isbn = $m[5];
@@ -1188,7 +1261,6 @@ class Parser {
                 global $wgContLang;
                 wfProfileIn( __METHOD__ );
  
-               $sk = $this->mOptions->getSkin( $this->mTitle );
                 $trail = '';
  
                 # The characters '<' and '>' (which were escaped by
@@ -1219,7 +1291,7 @@ class Parser {
                 $text = $this->maybeMakeExternalImage( $url );
                 if ( $text === false ) {
                         # Not an image, make a link
-                       $text = $sk->makeExternalLink( $url, $wgContLang->markNoConversion($url), true, 'free',
+                       $text = Linker::makeExternalLink( $url, $wgContLang->markNoConversion($url), true, 'free',
                                 $this->getExternalLinkAttribs( $url ) );
                         # Register it in the output object...
                         # Replace unnecessary URL escape codes with their equivalent characters
@@ -1435,8 +1507,6 @@ class Parser {
                 global $wgContLang;
                 wfProfileIn( __METHOD__ );
  
-               $sk = $this->mOptions->getSkin( $this->mTitle );
-
                 $bits = preg_split( $this->mExtLinkBracketedRegex, $text, -1, PREG_SPLIT_DELIM_CAPTURE );
                 $s = array_shift( $bits );
  
@@ -1494,7 +1564,7 @@ class Parser {
                         # This means that users can paste URLs directly into the text
                         # Funny characters like ö aren't valid in URLs anyway
                         # This was changed in August 2004
-                       $s .= $sk->makeExternalLink( $url, $text, false, $linktype,
+                       $s .= Linker::makeExternalLink( $url, $text, false, $linktype,
                                 $this->getExternalLinkAttribs( $url ) ) . $dtrail . $trail;
  
                         # Register link in the output object.
@@ -1544,7 +1614,6 @@ class Parser {
                 return $attribs;
         }
  
-
         /**
          * Replace unusual URL escape codes with their equivalent characters
          *
@@ -1584,7 +1653,6 @@ class Parser {
          * @private
          */
         function maybeMakeExternalImage( $url ) {
-               $sk = $this->mOptions->getSkin( $this->mTitle );
                 $imagesfrom = $this->mOptions->getAllowExternalImagesFrom();
                 $imagesexception = !empty( $imagesfrom );
                 $text = false;
@@ -1606,7 +1674,7 @@ class Parser {
                          || ( $imagesexception && $imagematch ) ) {
                         if ( preg_match( self::EXT_IMAGE_REGEX, $url ) ) {
                                 # Image found
-                               $text = $sk->makeExternalImage( $url );
+                               $text = Linker::makeExternalImage( $url );
                         }
                 }
                 if ( !$text && $this->mOptions->getEnableImageWhitelist()
@@ -1619,7 +1687,7 @@ class Parser {
                                 }
                                 if ( preg_match( '/' . str_replace( '/', '\\/', $entry ) . '/i', $url ) ) {
                                         # Image matches a whitelist entry
-                                       $text = $sk->makeExternalImage( $url );
+                                       $text = Linker::makeExternalImage( $url );
                                         break;
                                 }
                         }
@@ -1660,7 +1728,6 @@ class Parser {
                         $e1_img = "/^([{$tc}]+)\\|(.*)\$/sD";
                 }
  
-               $sk = $this->mOptions->getSkin( $this->mTitle );
                 $holders = new LinkHolderArray( $this );
  
                 # split the entire text string on occurences of [[
@@ -1895,14 +1962,13 @@ class Parser {
                                                         $holders->merge( $this->replaceInternalLinks2( $text ) );
                                                 }
                                                 # cloak any absolute URLs inside the image markup, so replaceExternalLinks() won't touch them
-                                               $s .= $prefix . $this->armorLinks( $this->makeImage( $nt, $text, $holders ) ) . $trail;
+                                               $s .= $prefix . $this->armorLinks(
+                                                       $this->makeImage( $nt, $text, $holders ) ) . $trail;
                                         } else {
                                                 $s .= $prefix . $trail;
                                         }
-                                       $this->mOutput->addImage( $nt->getDBkey() );
                                         wfProfileOut( __METHOD__."-image" );
                                         continue;
-
                                 }
  
                                 if ( $ns == NS_CATEGORY ) {
@@ -1933,26 +1999,24 @@ class Parser {
                         # Self-link checking
                         if ( $nt->getFragment() === '' && $ns != NS_SPECIAL ) {
                                 if ( in_array( $nt->getPrefixedText(), $selflink, true ) ) {
-                                       $s .= $prefix . $sk->makeSelfLinkObj( $nt, $text, '', $trail );
+                                       $s .= $prefix . Linker::makeSelfLinkObj( $nt, $text, '', $trail );
                                         continue;
                                 }
                         }
  
                         # NS_MEDIA is a pseudo-namespace for linking directly to a file
-                       # FIXME: Should do batch file existence checks, see comment below
+                       # @todo FIXME: Should do batch file existence checks, see comment below
                         if ( $ns == NS_MEDIA ) {
                                 wfProfileIn( __METHOD__."-media" );
                                 # Give extensions a chance to select the file revision for us
-                               $skip = $time = false;
-                               wfRunHooks( 'BeforeParserMakeImageLinkObj', array( &$this, &$nt, &$skip, &$time ) );
-                               if ( $skip ) {
-                                       $link = $sk->link( $nt );
-                               } else {
-                                       $link = $sk->makeMediaLinkObj( $nt, $text, $time );
-                               }
+                               $time = $sha1 = $descQuery = false;
+                               wfRunHooks( 'BeforeParserFetchFileAndTitle',
+                                       array( $this, $nt, &$time, &$sha1, &$descQuery ) );
+                               # Fetch and register the file (file title may be different via hooks)
+                               list( $file, $nt ) = $this->fetchFileAndTitle( $nt, $time, $sha1 );
                                 # Cloak with NOPARSE to avoid replacement in replaceExternalLinks
-                               $s .= $prefix . $this->armorLinks( $link ) . $trail;
-                               $this->mOutput->addImage( $nt->getDBkey() );
+                               $s .= $prefix . $this->armorLinks(
+                                       Linker::makeMediaLinkFile( $nt, $file, $text ) ) . $trail;
                                 wfProfileOut( __METHOD__."-media" );
                                 continue;
                         }
@@ -1961,14 +2025,14 @@ class Parser {
                         # Some titles, such as valid special pages or files in foreign repos, should
                         # be shown as bluelinks even though they're not included in the page table
                         #
-                       # FIXME: isAlwaysKnown() can be expensive for file links; we should really do
+                       # @todo FIXME: isAlwaysKnown() can be expensive for file links; we should really do
                         # batch file existence checks for NS_FILE and NS_MEDIA
                         if ( $iw == '' && $nt->isAlwaysKnown() ) {
                                 $this->mOutput->addLink( $nt );
-                               $s .= $this->makeKnownLinkHolder( $nt, $text, '', $trail, $prefix );
+                               $s .= $this->makeKnownLinkHolder( $nt, $text, array(), $trail, $prefix );
                         } else {
                                 # Links will be added to the output link list after checking
-                               $s .= $holders->makeHolder( $nt, $text, '', $trail, $prefix );
+                               $s .= $holders->makeHolder( $nt, $text, array(), $trail, $prefix );
                         }
                         wfProfileOut( __METHOD__."-always_known" );
                 }
@@ -1976,18 +2040,6 @@ class Parser {
                 return $holders;
         }
  
-       /**
-        * Make a link placeholder. The text returned can be later resolved to a real link with
-        * replaceLinkHolders(). This is done for two reasons: firstly to avoid further
-        * parsing of interwiki links, and secondly to allow all existence checks and
-        * article length checks (for stub links) to be bundled into a single query.
-        *
-        * @deprecated
-        */
-       function makeLinkHolder( &$nt, $text = '', $query = '', $trail = '', $prefix = '' ) {
-               return $this->mLinkHolders->makeHolder( $nt, $text, $query, $trail, $prefix );
-       }
-
         /**
          * Render a forced-blue link inline; protect against double expansion of
          * URLs if we're in a mode that prepends full URL prefixes to internal links.
@@ -1997,16 +2049,23 @@ class Parser {
          *
          * @param $nt Title
          * @param $text String
-        * @param $query String
+        * @param $query Array or String
          * @param $trail String
          * @param $prefix String
          * @return String: HTML-wikitext mix oh yuck
          */
-       function makeKnownLinkHolder( $nt, $text = '', $query = '', $trail = '', $prefix = '' ) {
+       function makeKnownLinkHolder( $nt, $text = '', $query = array(), $trail = '', $prefix = '' ) {
                 list( $inside, $trail ) = Linker::splitTrail( $trail );
-               $sk = $this->mOptions->getSkin( $this->mTitle );
-               # FIXME: use link() instead of deprecated makeKnownLinkObj()
-               $link = $sk->makeKnownLinkObj( $nt, $text, $query, $inside, $prefix );
+
+               if ( is_string( $query ) ) {
+                       $query = wfCgiToArray( $query );
+               }
+               if ( $text == '' ) {
+                       $text = htmlspecialchars( $nt->getPrefixedText() );
+               }
+
+               $link = Linker::linkKnown( $nt, "$prefix$text$inside", array(), $query );
+
                 return $this->armorLinks( $link ) . $trail;
         }
  
@@ -2049,6 +2108,8 @@ class Parser {
         /**#@+
          * Used by doBlockLevels()
          * @private
+        *
+        * @return string
          */
         function closeParagraph() {
                 $result = '';
@@ -2073,7 +2134,7 @@ class Parser {
                 }
  
                 for ( $i = 0; $i < $shorter; ++$i ) {
-                       if ( $st1{$i} != $st2{$i} ) {
+                       if ( $st1[$i] != $st2[$i] ) {
                                 break;
                         }
                 }
@@ -2084,6 +2145,8 @@ class Parser {
          * These next three functions open, continue, and close the list
          * element appropriate to the prefix character passed into them.
          * @private
+        *
+        * @return string
          */
         function openList( $char ) {
                 $result = $this->closeParagraph();
@@ -2108,6 +2171,8 @@ class Parser {
          * TODO: document
          * @param $char String
          * @private
+        *
+        * @return string
          */
         function nextItem( $char ) {
                 if ( '*' === $char || '#' === $char ) {
@@ -2132,6 +2197,8 @@ class Parser {
          * TODO: document
          * @param $char String
          * @private
+        *
+        * @return string
          */
         function closeList( $char ) {
                 if ( '*' === $char ) {
@@ -2250,7 +2317,7 @@ class Parser {
                                         $output .= $this->openList( $char );
  
                                         if ( ';' === $char ) {
-                                               # FIXME: This is dupe of code above
+                                               # @todo FIXME: This is dupe of code above
                                                 if ( $this->findColonNoLinks( $t, $term, $t2 ) !== false ) {
                                                         $t = $t2;
                                                         $output .= $term . $this->nextItem( ':' );
@@ -2271,9 +2338,8 @@ class Parser {
                                         '/(?:<\\/table|<\\/blockquote|<\\/h1|<\\/h2|<\\/h3|<\\/h4|<\\/h5|<\\/h6|'.
                                         '<td|<th|<\\/?div|<hr|<\\/pre|<\\/p|'.$this->mUniqPrefix.'-pre|<\\/li|<\\/ul|<\\/ol|<\\/?center)/iS', $t );
                                 if ( $openmatch or $closematch ) {
-
                                         $paragraphStack = false;
-                                       # TODO bug 5718: paragraph closed
+                                       # TODO bug 5718: paragraph closed
                                         $output .= $this->closeParagraph();
                                         if ( $preOpenMatch and !$preCloseMatch ) {
                                                 $this->mInPre = true;
@@ -2372,7 +2438,7 @@ class Parser {
                 $stack = 0;
                 $len = strlen( $str );
                 for( $i = 0; $i < $len; $i++ ) {
-                       $c = $str{$i};
+                       $c = $str[$i];
  
                         switch( $state ) {
                         # (Using the number is a performance hack for common cases)
@@ -2497,6 +2563,7 @@ class Parser {
                 }
                 if ( $stack > 0 ) {
                         wfDebug( __METHOD__.": Invalid input; not enough close tags (stack $stack, state $state)\n" );
+                       wfProfileOut( __METHOD__ );
                         return false;
                 }
                 wfProfileOut( __METHOD__ );
@@ -2507,6 +2574,9 @@ class Parser {
          * Return value of a magic variable (like PAGENAME)
          *
          * @private
+        *
+        * @param $index integer
+        * @param $frame PPFrame
          */
         function getVariableValue( $index, $frame=false ) {
                 global $wgContLang, $wgSitename, $wgServer;
@@ -2855,6 +2925,8 @@ class Parser {
          * dependency requirements.
          *
          * @private
+        *
+        * @return PPNode
          */
         function preprocessToDom( $text, $flags = 0 ) {
                 $dom = $this->getPreprocessor()->preprocessToObj( $text, $flags );
@@ -2863,6 +2935,8 @@ class Parser {
  
         /**
          * Return a three-element array: leading whitespace, string contents, trailing whitespace
+        *
+        * @return array
          */
         public static function splitWhitespace( $s ) {
                 $ltrimmed = ltrim( $s );
@@ -2893,6 +2967,8 @@ class Parser {
          *        Providing arguments this way may be useful for extensions wishing to perform variable replacement explicitly.
          * @param $argsOnly Boolean: only do argument (triple-brace) expansion, not double-brace expansion
          * @private
+        *
+        * @return string
          */
         function replaceVariables( $text, $frame = false, $argsOnly = false ) {
                 # Is there any text? Also, Prevent too big inclusions!
@@ -2916,7 +2992,11 @@ class Parser {
                 return $text;
         }
  
-       # Clean up argument array - refactored in 1.9 so parserfunctions can use it, too.
+       /**
+        * Clean up argument array - refactored in 1.9 so parserfunctions can use it, too.
+        *
+        * @return array
+        */
         static function createAssocArgs( $args ) {
                 $assocArgs = array();
                 $index = 1;
@@ -3002,9 +3082,10 @@ class Parser {
                 $originalTitle = $part1;
  
                 # $args is a list of argument nodes, starting from index 0, not including $part1
-               # *** FIXME if piece['parts'] is null then the call to getLength() below won't work b/c this $args isn't an object
+               # @todo FIXME: If piece['parts'] is null then the call to getLength() below won't work b/c this $args isn't an object
                 $args = ( null == $piece['parts'] ) ? array() : $piece['parts'];
                 wfProfileOut( __METHOD__.'-setup' );
+               wfProfileIn( __METHOD__."-title-$originalTitle" );
  
                 # SUBST
                 wfProfileIn( __METHOD__.'-modifiers' );
@@ -3173,7 +3254,7 @@ class Parser {
                                         && $this->mOptions->getAllowSpecialInclusion()
                                         && $this->ot['html'] )
                                 {
-                                       $text = SpecialPage::capturePath( $title );
+                                       $text = SpecialPageFactory::capturePath( $title );
                                         if ( is_string( $text ) ) {
                                                 $found = true;
                                                 $isHTML = true;
@@ -3223,6 +3304,7 @@ class Parser {
                 # Recover the source wikitext and return it
                 if ( !$found ) {
                         $text = $frame->virtualBracketedImplode( '{{', '|', '}}', $titleWithSpaces, $args );
+                       wfProfileOut( __METHOD__."-title-$originalTitle" );
                         wfProfileOut( __METHOD__ );
                         return array( 'object' => $text );
                 }
@@ -3262,11 +3344,11 @@ class Parser {
                         $text = wfEscapeWikiText( $text );
                 } elseif ( is_string( $text )
                         && !$piece['lineStart']
-                       && preg_match( '/^{\\|/', $text ) )
+                       && preg_match( '/^(?:{\\||:|;|#|\*)/', $text ) )
                 {
-                       # Bug 529: if the template begins with a table, it should be treated as
-                       # beginning a new line.  This previously handled other block-level elements
-                       # such as #, :, etc, but these have many false-positives (bug 12974).
+                       # Bug 529: if the template begins with a table or block-level
+                       # element, it should be treated as beginning a new line.
+                       # This behaviour is somewhat controversial.
                         $text = "\n" . $text;
                 }
  
@@ -3291,6 +3373,7 @@ class Parser {
                         $ret = array( 'text' => $text );
                 }
  
+               wfProfileOut( __METHOD__."-title-$originalTitle" );
                 wfProfileOut( __METHOD__ );
                 return $ret;
         }
@@ -3298,6 +3381,8 @@ class Parser {
         /**
          * Get the semi-parsed DOM representation of a template with a given title,
          * and its redirect destination title. Cached.
+        *
+        * @return array
          */
         function getTemplateDom( $title ) {
                 $cacheTitle = $title;
@@ -3325,7 +3410,7 @@ class Parser {
  
                 if ( !$title->equals( $cacheTitle ) ) {
                         $this->mTplRedirCache[$cacheTitle->getPrefixedDBkey()] =
-                               array( $title->getNamespace(), $title->getDBkey() );
+                               array( $title->getNamespace(), $cdb = $title->getDBkey() );
                 }
  
                 return array( $dom, $title );
@@ -3333,6 +3418,8 @@ class Parser {
  
         /**
          * Fetch the unparsed text of a template and register a reference to it.
+        * @param Title $title
+        * @return Array ( string or false, Title )
          */
         function fetchTemplateAndTitle( $title ) {
                 $templateCb = $this->mOptions->getTemplateCallback(); # Defaults to Parser::statelessFetchTemplate()
@@ -3347,6 +3434,11 @@ class Parser {
                 return array( $text, $finalTitle );
         }
  
+       /**
+        * Fetch the unparsed text of a template and register a reference to it.
+        * @param Title $title
+        * @return mixed string or false
+        */
         function fetchTemplate( $title ) {
                 $rv = $this->fetchTemplateAndTitle( $title );
                 return $rv[0];
@@ -3355,8 +3447,10 @@ class Parser {
         /**
          * Static function to get a template
          * Can be overridden via ParserOptions::setTemplateCallback().
+        *
+        * @return array
          */
-       static function statelessFetchTemplate( $title, $parser=false ) {
+       static function statelessFetchTemplate( $title, $parser = false ) {
                 $text = $skip = false;
                 $finalTitle = $title;
                 $deps = array();
@@ -3365,17 +3459,22 @@ class Parser {
                 for ( $i = 0; $i < 2 && is_object( $title ); $i++ ) {
                         # Give extensions a chance to select the revision instead
                         $id = false; # Assume current
-                       wfRunHooks( 'BeforeParserFetchTemplateAndtitle', array( $parser, &$title, &$skip, &$id ) );
+                       wfRunHooks( 'BeforeParserFetchTemplateAndtitle',
+                               array( $parser, $title, &$skip, &$id ) );
  
                         if ( $skip ) {
                                 $text = false;
                                 $deps[] = array(
-                                       'title' => $title,
-                                       'page_id' => $title->getArticleID(),
-                                       'rev_id' => null );
+                                       'title'         => $title,
+                                       'page_id'       => $title->getArticleID(),
+                                       'rev_id'        => null
+                               );
                                 break;
                         }
-                       $rev = $id ? Revision::newFromId( $id ) : Revision::newFromTitle( $title );
+                       # Get the revision
+                       $rev = $id
+                               ? Revision::newFromId( $id )
+                               : Revision::newFromTitle( $title );
                         $rev_id = $rev ? $rev->getId() : 0;
                         # If there is no current revision, there is no page
                         if ( $id === false && !$rev ) {
@@ -3384,9 +3483,16 @@ class Parser {
                         }
  
                         $deps[] = array(
-                               'title' => $title,
-                               'page_id' => $title->getArticleID(),
-                               'rev_id' => $rev_id );
+                               'title'         => $title,
+                               'page_id'       => $title->getArticleID(),
+                               'rev_id'        => $rev_id );
+                       if ( $rev && !$title->equals( $rev->getTitle() ) ) {
+                               # We fetched a rev from a different title; register it too...
+                               $deps[] = array(
+                                       'title'         => $rev->getTitle(),
+                                       'page_id'       => $rev->getPage(),
+                                       'rev_id'        => $rev_id );
+                       }
  
                         if ( $rev ) {
                                 $text = $rev->getText();
@@ -3414,8 +3520,51 @@ class Parser {
                         'deps' => $deps );
         }
  
+       /**
+        * Fetch a file and its title and register a reference to it.
+        * @param Title $title
+        * @param string $time MW timestamp
+        * @param string $sha1 base 36 SHA-1
+        * @return mixed File or false
+        */
+       function fetchFile( $title, $time = false, $sha1 = false ) {
+               $res = $this->fetchFileAndTitle( $title, $time, $sha1 );
+               return $res[0];
+       }
+
+       /**
+        * Fetch a file and its title and register a reference to it.
+        * @param Title $title
+        * @param string $time MW timestamp
+        * @param string $sha1 base 36 SHA-1
+        * @return Array ( File or false, Title of file )
+        */
+       function fetchFileAndTitle( $title, $time = false, $sha1 = false ) {
+               if ( $time === '0' ) {
+                       $file = false; // broken thumbnail forced by hook
+               } elseif ( $sha1 ) { // get by (sha1,timestamp)
+                       $file = RepoGroup::singleton()->findFileFromKey( $sha1, array( 'time' => $time ) );
+               } else { // get by (name,timestamp)
+                       $file = wfFindFile( $title, array( 'time' => $time ) );
+               }
+               $time = $file ? $file->getTimestamp() : false;
+               $sha1 = $file ? $file->getSha1() : false;
+               # Register the file as a dependency...
+               $this->mOutput->addImage( $title->getDBkey(), $time, $sha1 );
+               if ( $file && !$title->equals( $file->getTitle() ) ) {
+                       # Update fetched file title
+                       $title = $file->getTitle();
+               }
+               return array( $file, $title );
+       }
+
         /**
          * Transclude an interwiki link.
+        *
+        * @param $title Title
+        * @param $action
+        *
+        * @return string
          */
         function interwikiTransclude( $title, $action ) {
                 global $wgEnableScaryTranscluding;
@@ -3432,6 +3581,10 @@ class Parser {
                 return $this->fetchScaryTemplateMaybeFromCache( $url );
         }
  
+       /**
+        * @param $url string
+        * @return Mixed|String
+        */
         function fetchScaryTemplateMaybeFromCache( $url ) {
                 global $wgTranscludeCacheExpiry;
                 $dbr = wfGetDB( DB_SLAVE );
@@ -3456,10 +3609,14 @@ class Parser {
                 return $text;
         }
  
-
         /**
          * Triple brace replacement -- used for template arguments
          * @private
+        *
+        * @param $peice array
+        * @param $frame PPFrame
+        *
+        * @return array
          */
         function argSubstitution( $piece, $frame ) {
                 wfProfileIn( __METHOD__ );
@@ -3513,6 +3670,8 @@ class Parser {
          *     inner      Contents of extension element
          *     noClose    Original text did not have a close tag
          * @param $frame PPFrame
+        *
+        * @return string
          */
         function extensionSubstitution( $params, $frame ) {
                 $name = $frame->expand( $params['name'] );
@@ -3581,9 +3740,9 @@ class Parser {
                 if ( $markerType === 'none' ) {
                         return $output;
                 } elseif ( $markerType === 'nowiki' ) {
-                       $this->mStripState->nowiki->setPair( $marker, $output );
+                       $this->mStripState->addNoWiki( $marker, $output );
                 } elseif ( $markerType === 'general' ) {
-                       $this->mStripState->general->setPair( $marker, $output );
+                       $this->mStripState->addGeneral( $marker, $output );
                 } else {
                         throw new MWException( __METHOD__.': invalid marker type' );
                 }
@@ -3655,7 +3814,7 @@ class Parser {
                 }
                 # (bug 8068) Allow control over whether robots index a page.
                 #
-               # FIXME (bug 14899): __INDEX__ always overrides __NOINDEX__ here!  This
+               # @todo FIXME: Bug 14899: __INDEX__ always overrides __NOINDEX__ here!  This
                 # is not desirable, the last one on the page should win.
                 if ( isset( $this->mDoubleUnderscores['noindex'] ) && $this->mTitle->canUseNoindex() ) {
                         $this->mOutput->setIndexPolicy( 'noindex' );
@@ -3718,8 +3877,6 @@ class Parser {
         function formatHeadings( $text, $origText, $isMain=true ) {
                 global $wgMaxTocLevel, $wgContLang, $wgHtml5, $wgExperimentalHtmlIds;
  
-               $doNumberHeadings = $this->mOptions->getNumberHeadings();
-
                 # Inhibit editsection links if requested in the page
                 if ( isset( $this->mDoubleUnderscores['noeditsection'] ) ) {
                         $showEditLink = 0;
@@ -3759,9 +3916,6 @@ class Parser {
                         $enoughToc = true;
                 }
  
-               # We need this to perform operations on the HTML
-               $sk = $this->mOptions->getSkin( $this->mTitle );
-
                 # headline counter
                 $headlineCount = 0;
                 $numVisible = 0;
@@ -3812,7 +3966,7 @@ class Parser {
                                 $sublevelCount[$toclevel] = 0;
                                 if ( $toclevel<$wgMaxTocLevel ) {
                                         $prevtoclevel = $toclevel;
-                                       $toc .= $sk->tocIndent();
+                                       $toc .= Linker::tocIndent();
                                         $numVisible++;
                                 }
                         } elseif ( $level < $prevlevel && $toclevel > 1 ) {
@@ -3835,16 +3989,16 @@ class Parser {
                                 if ( $toclevel<$wgMaxTocLevel ) {
                                         if ( $prevtoclevel < $wgMaxTocLevel ) {
                                                 # Unindent only if the previous toc level was shown :p
-                                               $toc .= $sk->tocUnindent( $prevtoclevel - $toclevel );
+                                               $toc .= Linker::tocUnindent( $prevtoclevel - $toclevel );
                                                 $prevtoclevel = $toclevel;
                                         } else {
-                                               $toc .= $sk->tocLineEnd();
+                                               $toc .= Linker::tocLineEnd();
                                         }
                                 }
                         } else {
                                 # No change in level, end TOC line
                                 if ( $toclevel<$wgMaxTocLevel ) {
-                                       $toc .= $sk->tocLineEnd();
+                                       $toc .= Linker::tocLineEnd();
                                 }
                         }
  
@@ -3858,7 +4012,10 @@ class Parser {
                                         if ( $dot ) {
                                                 $numbering .= '.';
                                         }
-                                       $numbering .= $wgContLang->formatNum( $sublevelCount[$i] );
+                                       global $wgBetterDirectionality;
+                                       $pagelang = $this->mTitle->getPageLanguage();
+                                       $toclang = ( $wgBetterDirectionality ? $pagelang : $wgContLang );
+                                       $numbering .= $toclang->formatNum( $sublevelCount[$i] );
                                         $dot = 1;
                                 }
                         }
@@ -3916,7 +4073,7 @@ class Parser {
                         # HTML names must be case-insensitively unique (bug 10721).
                         # This does not apply to Unicode characters per
                         # http://dev.w3.org/html5/spec/infrastructure.html#case-sensitivity-and-string-comparison
-                       # FIXME: We may be changing them depending on the current locale.
+                       # @todo FIXME: We may be changing them depending on the current locale.
                         $arrayKey = strtolower( $safeHeadline );
                         if ( $legacyHeadline === false ) {
                                 $legacyArrayKey = false;
@@ -3937,7 +4094,7 @@ class Parser {
                         }
  
                         # Don't number the heading if it is the only one (looks silly)
-                       if ( $doNumberHeadings && count( $matches[3] ) > 1) {
+                       if ( count( $matches[3] ) > 1 && $this->mOptions->getNumberHeadings() ) {
                                 # the two are different if the line contains a link
                                 $headline = $numbering . ' ' . $headline;
                         }
@@ -3952,7 +4109,7 @@ class Parser {
                                 $legacyAnchor .= '_' . $refers[$legacyArrayKey];
                         }
                         if ( $enoughToc && ( !isset( $wgMaxTocLevel ) || $toclevel < $wgMaxTocLevel ) ) {
-                               $toc .= $sk->tocLine( $anchor, $tocline,
+                               $toc .= Linker::tocLine( $anchor, $tocline,
                                         $numbering, $toclevel, ( $isTemplate ? false : $sectionIndex ) );
                         }
  
@@ -3997,17 +4154,17 @@ class Parser {
                                 // We use a page and section attribute to stop the language converter from converting these important bits
                                 // of data, but put the headline hint inside a content block because the language converter is supposed to
                                 // be able to convert that piece of data.
-                               $editlink = '<editsection page="' . htmlspecialchars($editlinkArgs[0]);
+                               $editlink = '<mw:editsection page="' . htmlspecialchars($editlinkArgs[0]);
                                 $editlink .= '" section="' . htmlspecialchars($editlinkArgs[1]) .'"';
                                 if ( isset($editlinkArgs[2]) ) {
-                                       $editlink .= '>' . $editlinkArgs[2] . '</editsection>';
+                                       $editlink .= '>' . $editlinkArgs[2] . '</mw:editsection>';
                                 } else {
                                         $editlink .= '/>';
                                 }
                         } else {
                                 $editlink = '';
                         }
-                       $head[$headlineCount] = $sk->makeHeadline( $level,
+                       $head[$headlineCount] = Linker::makeHeadline( $level,
                                 $matches['attrib'][$headlineCount], $anchor, $headline,
                                 $editlink, $legacyAnchor );
  
@@ -4023,9 +4180,9 @@ class Parser {
  
                 if ( $enoughToc ) {
                         if ( $prevtoclevel > 0 && $prevtoclevel < $wgMaxTocLevel ) {
-                               $toc .= $sk->tocUnindent( $prevtoclevel - 1 );
+                               $toc .= Linker::tocUnindent( $prevtoclevel - 1 );
                         }
-                       $toc = $sk->tocList( $toc );
+                       $toc = Linker::tocList( $toc, $this->mOptions->getUserLang() );
                         $this->mOutput->setTOCHTML( $toc );
                 }
  
@@ -4077,14 +4234,8 @@ class Parser {
          * @return String: the altered wiki markup
          */
         public function preSaveTransform( $text, Title $title, User $user, ParserOptions $options, $clearState = true ) {
-               $this->mOptions = $options;
-               $this->setTitle( $title );
+               $this->startParse( $title, $options, self::OT_WIKI, $clearState );
                 $this->setUser( $user );
-               $this->setOutputType( self::OT_WIKI );
-
-               if ( $clearState ) {
-                       $this->clearState();
-               }
  
                 $pairs = array(
                         "\r\n" => "\n",
@@ -4142,6 +4293,9 @@ class Parser {
                 # Because mOutputType is OT_WIKI, this will only process {{subst:xxx}} type tags
                 $text = $this->replaceVariables( $text );
  
+               # This works almost by chance, as the replaceVariables are done before the getUserSig(),
+               # which may corrupt this parser instance via its wfMsgExt( parsemag ) call-
+
                 # Signatures
                 $sigText = $this->getUserSig( $user );
                 $text = strtr( $text, array(
@@ -4187,6 +4341,8 @@ class Parser {
          * validated, ready-to-insert wikitext.
          * If you have pre-fetched the nickname or the fancySig option, you can
          * specify them here to save a database query.
+        * Do not reuse this parser instance after calling getUserSig(),
+        * as it may have changed if it's the $wgParser.
          *
          * @param $user User
          * @param $nickname String: nickname to use or false to use user's default nickname
@@ -4230,11 +4386,9 @@ class Parser {
                 # If we're still here, make it a link to the user page
                 $userText = wfEscapeWikiText( $username );
                 $nickText = wfEscapeWikiText( $nickname );
-               if ( $user->isAnon() )  {
-                       return wfMsgExt( 'signature-anon', array( 'content', 'parsemag' ), $userText, $nickText );
-               } else {
-                       return wfMsgExt( 'signature', array( 'content', 'parsemag' ), $userText, $nickText );
-               }
+               $msgName = $user->isAnon() ? 'signature-anon' : 'signature';
+
+               return wfMessage( $msgName, $userText, $nickText )->inContentLanguage()->title( $this->getTitle() )->text();
         }
  
         /**
@@ -4271,7 +4425,7 @@ class Parser {
                         return $text;
                 }
  
-               # FIXME: regex doesn't respect extension tags or nowiki
+               # @todo FIXME: Regex doesn't respect extension tags or nowiki
                 #  => Move this logic to braceSubstitution()
                 $substWord = MagicWord::get( 'subst' );
                 $substRegex = '/\{\{(?!(?:' . $substWord->getBaseRegex() . '))/x' . $substWord->getRegexCase();
@@ -4305,7 +4459,11 @@ class Parser {
          * Set up some variables which are usually set up in parse()
          * so that an external function can call some class members with confidence
          */
-       public function startExternalParse( &$title, $options, $outputType, $clearState = true ) {
+       public function startExternalParse( Title $title = null, ParserOptions $options, $outputType, $clearState = true ) {
+               $this->startParse( $title, $options, $outputType, $clearState );
+       }
+
+       private function startParse( Title $title = null, ParserOptions $options, $outputType, $clearState = true ) {
                 $this->setTitle( $title );
                 $this->mOptions = $options;
                 $this->setOutputType( $outputType );
@@ -4319,10 +4477,10 @@ class Parser {
          *
          * @param $text String: the text to preprocess
          * @param $options ParserOptions: options
+        * @param $title Title object or null to use $wgTitle
          * @return String
          */
-       public function transformMsg( $text, $options ) {
-               global $wgTitle;
+       public function transformMsg( $text, $options, $title = null ) {
                 static $executing = false;
  
                 # Guard against infinite recursion
@@ -4332,7 +4490,16 @@ class Parser {
                 $executing = true;
  
                 wfProfileIn( __METHOD__ );
-               $text = $this->preprocess( $text, $wgTitle, $options );
+               if ( !$title ) {
+                       global $wgTitle;
+                       $title = $wgTitle;
+               }
+               if ( !$title ) {
+                       # It's not uncommon having a null $wgTitle in scripts. See r80898
+                       # Create a ghost title in such case
+                       $title = Title::newFromText( 'Dwimmerlaik' );
+               }
+               $text = $this->preprocess( $text, $title, $options );
  
                 $executing = false;
                 wfProfileOut( __METHOD__ );
@@ -4342,11 +4509,22 @@ class Parser {
         /**
          * Create an HTML-style tag, e.g. <yourtag>special text</yourtag>
          * The callback should have the following form:
-        *    function myParserHook( $text, $params, $parser ) { ... }
+        *    function myParserHook( $text, $params, $parser, $frame ) { ... }
          *
          * Transform and return $text. Use $parser for any required context, e.g. use
          * $parser->getTitle() and $parser->getOptions() not $wgTitle or $wgOut->mParserOptions
          *
+        * Hooks may return extended information by returning an array, of which the
+        * first numbered element (index 0) must be the return string, and all other
+        * entries are extracted into local variables within an internal function
+        * in the Parser class.
+        *
+        * This interface (introduced r61913) appears to be undocumented, but
+        * 'markerName' is used by some core tag hooks to override which strip
+        * array their results are placed in. **Use great caution if attempting
+        * this interface, as it is not documented and injudicious use could smash
+        * private variables.**
+        *
          * @param $tag Mixed: the tag to use, e.g. 'hook' for <hook>
          * @param $callback Mixed: the callback function (and object) to use for the tag
          * @return The old value of the mTagHooks array associated with the hook
@@ -4363,6 +4541,22 @@ class Parser {
                 return $oldVal;
         }
  
+       /**
+        * As setHook(), but letting the contents be parsed.
+        *
+        * Transparent tag hooks are like regular XML-style tag hooks, except they
+        * operate late in the transformation sequence, on HTML instead of wikitext.
+        *
+        * This is probably obsoleted by things dealing with parser frames?
+        * The only extension currently using it is geoserver.
+        *
+        * @since 1.10
+        * @todo better document or deprecate this
+        *
+        * @param $tag Mixed: the tag to use, e.g. 'hook' for <hook>
+        * @param $callback Mixed: the callback function (and object) to use for the tag
+        * @return The old value of the mTagHooks array associated with the hook
+        */
         function setTransparentTagHook( $tag, $callback ) {
                 $tag = strtolower( $tag );
                 if ( preg_match( '/[<>\r\n]/', $tag, $m ) ) throw new MWException( "Invalid character {$m[0]} in setTransparentHook('$tag', ...) call" );
@@ -4380,6 +4574,19 @@ class Parser {
                 $this->mStripList = $this->mDefaultStripList;
         }
  
+       /**
+        * Remove a specific tag hook. Should not be called on $wgParser.
+        * Does not change the strip list.
+        *
+        * @param string $tag
+        * @return void
+        */
+       function clearTagHook( $tag ) {
+               if ( isset( $this->mTagHooks[$tag] ) ) {
+                       unset( $this->mTagHooks[$tag] );
+               }
+       }
+
         /**
          * Create a function, e.g. {{sum:1|2|3}}
          * The callback function should have the form:
@@ -4483,7 +4690,7 @@ class Parser {
         }
  
         /**
-        * FIXME: update documentation. makeLinkObj() is deprecated.
+        * @todo FIXME: Update documentation. makeLinkObj() is deprecated.
          * Replace <!--LINK--> link placeholders with actual links, in the buffer
          * Placeholders created in Skin::makeLinkObj()
          * Returns an array of link CSS classes, indexed by PDBK.
@@ -4511,6 +4718,10 @@ class Parser {
          * given as text will return the HTML of a gallery with two images,
          * labeled 'The number "1"' and
          * 'A tree'.
+        *
+        * @param string $text
+        * @param array $param
+        * @return string HTML
          */
         function renderImageGallery( $text, $params ) {
                 $ig = new ImageGallery();
@@ -4520,8 +4731,6 @@ class Parser {
                 $ig->setParser( $this );
                 $ig->setHideBadImages();
                 $ig->setAttributes( Sanitizer::validateTagAttributes( $params, 'table' ) );
-               $ig->useSkin( $this->mOptions->getSkin( $this->mTitle ) );
-               $ig->mRevisionId = $this->mRevisionId;
  
                 if ( isset( $params['showfilename'] ) ) {
                         $ig->setShowFilename( true );
@@ -4560,26 +4769,38 @@ class Parser {
                         if ( strpos( $matches[0], '%' ) !== false ) {
                                 $matches[1] = rawurldecode( $matches[1] );
                         }
-                       $tp = Title::newFromText( $matches[1], NS_FILE );
-                       $nt =& $tp;
-                       if ( is_null( $nt ) ) {
+                       $title = Title::newFromText( $matches[1], NS_FILE );
+                       if ( is_null( $title ) ) {
                                 # Bogus title. Ignore these so we don't bomb out later.
                                 continue;
                         }
+
+                       $label = '';
+                       $alt = '';
                         if ( isset( $matches[3] ) ) {
-                               $label = $matches[3];
-                       } else {
-                               $label = '';
+                               // look for an |alt= definition while trying not to break existing
+                               // captions with multiple pipes (|) in it, until a more sensible grammar
+                               // is defined for images in galleries
+
+                               $matches[3] = $this->recursiveTagParse( trim( $matches[3] ) );
+                               $altmatches = StringUtils::explode('|', $matches[3]);
+                               $magicWordAlt = MagicWord::get( 'img_alt' );
+
+                               foreach ( $altmatches as $altmatch ) {
+                                       $match = $magicWordAlt->matchVariableStartToEnd( $altmatch );
+                                       if ( $match ) {
+                                               $alt = $this->stripAltText( $match, false );
+                                       }
+                                       else {
+                                               // concatenate all other pipes
+                                               $label .= '|' . $altmatch;
+                                       }
+                               }
+                               // remove the first pipe
+                               $label = substr( $label, 1 );
                         }
  
-                       $html = $this->recursiveTagParse( trim( $label ) );
-
-                       $ig->add( $nt, $html );
-
-                       # Only add real images (bug #5586)
-                       if ( $nt->getNamespace() == NS_FILE ) {
-                               $this->mOutput->addImage( $nt->getDBkey() );
-                       }
+                       $ig->add( $title, $label, $alt );
                 }
                 return $ig->toHTML();
         }
@@ -4630,6 +4851,7 @@ class Parser {
          * @param $title Title
          * @param $options String
          * @param $holders LinkHolderArray
+        * @return string HTML
          */
         function makeImage( $title, $options, $holders = false ) {
                 # Check if the options text is of the form "options|alt text"
@@ -4658,23 +4880,23 @@ class Parser {
                 #  * text-bottom
  
                 $parts = StringUtils::explode( "|", $options );
-               $sk = $this->mOptions->getSkin( $this->mTitle );
  
                 # Give extensions a chance to select the file revision for us
-               $skip = $time = $descQuery = false;
-               wfRunHooks( 'BeforeParserMakeImageLinkObj', array( &$this, &$title, &$skip, &$time, &$descQuery ) );
+               $time = $sha1 = $descQuery = false;
+               wfRunHooks( 'BeforeParserFetchFileAndTitle',
+                       array( $this, $title, &$time, &$sha1, &$descQuery ) );
+               # Fetch and register the file (file title may be different via hooks)
+               list( $file, $title ) = $this->fetchFileAndTitle( $title, $time, $sha1 );
  
-               if ( $skip ) {
-                       return $sk->link( $title );
-               }
-
-               # Get the file
-               $file = wfFindFile( $title, array( 'time' => $time ) );
                 # Get parameter map
                 $handler = $file ? $file->getHandler() : false;
  
                 list( $paramMap, $mwArray ) = $this->getImageParams( $handler );
  
+               if ( !$file ) {
+                       $this->addTrackingCategory( 'broken-file-category' );
+               }
+
                 # Process the input parameters
                 $caption = '';
                 $params = array( 'frame' => array(), 'handler' => array(),
@@ -4718,7 +4940,7 @@ class Parser {
                                                 switch( $paramName ) {
                                                 case 'manualthumb':
                                                 case 'alt':
-                                                       # @todo Fixme: possibly check validity here for
+                                                       # @todo FIXME: Possibly check validity here for
                                                         # manualthumb? downstream behavior seems odd with
                                                         # missing manual thumbs.
                                                         $validated = true;
@@ -4824,7 +5046,8 @@ class Parser {
                 wfRunHooks( 'ParserMakeImageParams', array( $title, $file, &$params ) );
  
                 # Linker does the rest
-               $ret = $sk->makeImageLink2( $title, $file, $params['frame'], $params['handler'], $time, $descQuery, $this->mOptions->getThumbSize() );
+               $ret = Linker::makeImageLink2( $title, $file, $params['frame'], $params['handler'],
+                       $time, $descQuery, $this->mOptions->getThumbSize() );
  
                 # Give the handler a chance to modify the parser object
                 if ( $handler ) {
@@ -4834,6 +5057,11 @@ class Parser {
                 return $ret;
         }
  
+       /**
+        * @param $caption
+        * @param $holders LinkHolderArray
+        * @return mixed|String
+        */
         protected function stripAltText( $caption, $holders ) {
                 # Strip bad stuff out of the title (tooltip).  We can't just use
                 # replaceLinkHoldersText() here, because if this function is called
@@ -4870,7 +5098,6 @@ class Parser {
          * @param $text String
          * @param $frame PPFrame
          * @return String
-        * @private
          */
         function attributeStripCallback( &$text, $frame = false ) {
                 $text = $this->replaceVariables( $text, $frame );
@@ -4880,11 +5107,38 @@ class Parser {
  
         /**
          * Accessor
+        *
+        * @return array
          */
         function getTags() {
                 return array_merge( array_keys( $this->mTransparentTagHooks ), array_keys( $this->mTagHooks ) );
         }
  
+       /**
+        * Replace transparent tags in $text with the values given by the callbacks.
+        *
+        * Transparent tag hooks are like regular XML-style tag hooks, except they
+        * operate late in the transformation sequence, on HTML instead of wikitext.
+        */
+       function replaceTransparentTags( $text ) {
+               $matches = array();
+               $elements = array_keys( $this->mTransparentTagHooks );
+               $text = self::extractTagsAndParams( $elements, $text, $matches, $this->mUniqPrefix );
+               $replacements = array();
+
+               foreach ( $matches as $marker => $data ) {
+                       list( $element, $content, $params, $tag ) = $data;
+                       $tagName = strtolower( $element );
+                       if ( isset( $this->mTransparentTagHooks[$tagName] ) ) {
+                               $output = call_user_func_array( $this->mTransparentTagHooks[$tagName], array( $content, $params, $this ) );
+                       } else {
+                               $output = $tag;
+                       }
+                       $replacements[$marker] = $output;
+               }
+               return strtr( $text, $replacements );
+       }
+
         /**
          * Break wikitext input into sections, and either pull or replace
          * some particular section's text.
@@ -4909,13 +5163,12 @@ class Parser {
          * @param $newText String: replacement text for section data.
          * @return String: for "get", the extracted section text.
          *                 for "replace", the whole page with the section replaced.
+        *                 If the page is empty and section 0 is requested, $text (as '')
+        *                  is returned
          */
         private function extractSections( $text, $section, $mode, $newText='' ) {
-               global $wgTitle;
-               $this->mOptions = new ParserOptions;
-               $this->clearState();
-               $this->setTitle( $wgTitle ); # not generally used but removes an ugly failure mode
-               $this->setOutputType( self::OT_PLAIN );
+               global $wgTitle; # not generally used but removes an ugly failure mode
+               $this->startParse( $wgTitle, new ParserOptions, self::OT_PLAIN, true );
                 $outText = '';
                 $frame = $this->getPreprocessor()->newFrame();
  
@@ -4939,6 +5192,10 @@ class Parser {
                 if ( $sectionIndex == 0 ) {
                         # Section zero doesn't nest, level=big
                         $targetLevel = 1000;
+                       if ( !$node ) {
+                               # The page definitely exists - we checked that earlier - so it must be blank: see bug #14005
+                               return $text;
+                       }
                 } else {
                         while ( $node ) {
                                 if ( $node->getName() === 'h' ) {
@@ -5020,13 +5277,13 @@ class Parser {
         }
  
         /**
-        * This function returns $oldtext after the content of the section 
+        * This function returns $oldtext after the content of the section
          * specified by $section has been replaced with $text.
-        * 
-        * @param $text String: former text of the article
+        *
+        * @param $oldtext String: former text of the article
          * @param $section Numeric: section identifier
          * @param $text String: replacing text
-        * #return String: modified text
+        * @return String: modified text
          */
         public function replaceSection( $oldtext, $section, $text ) {
                 return $this->extractSections( $oldtext, $section, "replace", $text );
@@ -5044,7 +5301,7 @@ class Parser {
         /**
          * Get the revision object for $this->mRevisionId
          *
-        * @return either a Revision object or null
+        * @return Revision|null either a Revision object or null
          */
         protected function getRevisionObject() {
                 if ( !is_null( $this->mRevisionObject ) ) {
@@ -5118,7 +5375,11 @@ class Parser {
  
         /**
          * Accessor for $mDefaultSort
-        * Will use the title/prefixed title if none is set
+        * Will use the empty string if none is set.
+        *
+        * This value is treated as a prefix, so the
+        * empty string is equivalent to sorting by
+        * page name.
          *
          * @return string
          */
@@ -5126,7 +5387,7 @@ class Parser {
                 if ( $this->mDefaultSort !== false ) {
                         return $this->mDefaultSort;
                 } else {
-                       return $this->mTitle->getCategorySortkey();
+                       return '';
                 }
         }
  
@@ -5186,7 +5447,8 @@ class Parser {
                 $text = preg_replace( '/\[\[:?([^[|]+)\|([^[]+)\]\]/', '$2', $text );
                 $text = preg_replace( '/\[\[:?([^[]+)\|?\]\]/', '$1', $text );
  
-               # Strip external link markup (FIXME: Not Tolerant to blank link text
+               # Strip external link markup
+               # @todo FIXME: Not tolerant to blank link text
                 # I.E. [http://www.mediawiki.org] will render as [1] or something depending
                 # on how many empty links there are on the page - need to figure that out.
                 $text = preg_replace( '/\[(?:' . wfUrlProtocols() . ')([^ ]+?) ([^[]+)\]/', '$2', $text );
@@ -5201,36 +5463,39 @@ class Parser {
  
         /**
          * strip/replaceVariables/unstrip for preprocessor regression testing
+        *
+        * @return string
          */
-       function testSrvus( $text, $title, $options, $outputType = self::OT_HTML ) {
-               $this->mOptions = $options;
-               $this->clearState();
-               if ( !$title instanceof Title ) {
-                       $title = Title::newFromText( $title );
-               }
-               $this->mTitle = $title;
-               $this->setOutputType( $outputType );
+       function testSrvus( $text, Title $title, ParserOptions $options, $outputType = self::OT_HTML ) {
+               $this->startParse( $title, $options, $outputType, true );
+
                 $text = $this->replaceVariables( $text );
                 $text = $this->mStripState->unstripBoth( $text );
                 $text = Sanitizer::removeHTMLtags( $text );
                 return $text;
         }
  
-       function testPst( $text, $title, $options ) {
-               global $wgUser;
-               if ( !$title instanceof Title ) {
-                       $title = Title::newFromText( $title );
-               }
-               return $this->preSaveTransform( $text, $title, $wgUser, $options );
+       function testPst( $text, Title $title, ParserOptions $options ) {
+               return $this->preSaveTransform( $text, $title, $options->getUser(), $options );
         }
  
-       function testPreprocess( $text, $title, $options ) {
-               if ( !$title instanceof Title ) {
-                       $title = Title::newFromText( $title );
-               }
+       function testPreprocess( $text, Title $title, ParserOptions $options ) {
                 return $this->testSrvus( $text, $title, $options, self::OT_PREPROCESS );
         }
  
+       /**
+        * Call a callback function on all regions of the given text that are not
+        * inside strip markers, and replace those regions with the return value
+        * of the callback. For example, with input:
+        *
+        *  aaa<MARKER>bbb
+        *
+        * This will call the callback function twice, with 'aaa' and 'bbb'. Those
+        * two strings will be replaced with the value returned by the callback in
+        * each case.
+        *
+        * @return string
+        */
         function markerSkipCallback( $s, $callback ) {
                 $i = 0;
                 $out = '';
@@ -5255,168 +5520,72 @@ class Parser {
                 return $out;
         }
  
-       function serialiseHalfParsedText( $text ) {
-               $data = array();
-               $data['text'] = $text;
-
-               # First, find all strip markers, and store their
-               #  data in an array.
-               $stripState = new StripState;
-               $pos = 0;
-               while ( ( $start_pos = strpos( $text, $this->mUniqPrefix, $pos ) )
-                       && ( $end_pos = strpos( $text, self::MARKER_SUFFIX, $pos ) ) )
-               {
-                       $end_pos += strlen( self::MARKER_SUFFIX );
-                       $marker = substr( $text, $start_pos, $end_pos-$start_pos );
-
-                       if ( !empty( $this->mStripState->general->data[$marker] ) ) {
-                               $replaceArray = $stripState->general;
-                               $stripText = $this->mStripState->general->data[$marker];
-                       } elseif ( !empty( $this->mStripState->nowiki->data[$marker] ) ) {
-                               $replaceArray = $stripState->nowiki;
-                               $stripText = $this->mStripState->nowiki->data[$marker];
-                       } else {
-                               throw new MWException( "Hanging strip marker: '$marker'." );
-                       }
-
-                       $replaceArray->setPair( $marker, $stripText );
-                       $pos = $end_pos;
-               }
-               $data['stripstate'] = $stripState;
-
-               # Now, find all of our links, and store THEIR
-               #  data in an array! :)
-               $links = array( 'internal' => array(), 'interwiki' => array() );
-               $pos = 0;
-
-               # Internal links
-               while ( ( $start_pos = strpos( $text, '<!--LINK ', $pos ) ) ) {
-                       list( $ns, $trail ) = explode( ':', substr( $text, $start_pos + strlen( '<!--LINK ' ) ), 2 );
-
-                       $ns = trim( $ns );
-                       if ( empty( $links['internal'][$ns] ) ) {
-                               $links['internal'][$ns] = array();
-                       }
-
-                       $key = trim( substr( $trail, 0, strpos( $trail, '-->' ) ) );
-                       $links['internal'][$ns][] = $this->mLinkHolders->internals[$ns][$key];
-                       $pos = $start_pos + strlen( "<!--LINK $ns:$key-->" );
-               }
-
-               $pos = 0;
-
-               # Interwiki links
-               while ( ( $start_pos = strpos( $text, '<!--IWLINK ', $pos ) ) ) {
-                       $data = substr( $text, $start_pos );
-                       $key = trim( substr( $data, 0, strpos( $data, '-->' ) ) );
-                       $links['interwiki'][] = $this->mLinkHolders->interwiki[$key];
-                       $pos = $start_pos + strlen( "<!--IWLINK $key-->" );
-               }
-
-               $data['linkholder'] = $links;
-
+       /**
+        * Save the parser state required to convert the given half-parsed text to
+        * HTML. "Half-parsed" in this context means the output of
+        * recursiveTagParse() or internalParse(). This output has strip markers
+        * from replaceVariables (extensionSubstitution() etc.), and link
+        * placeholders from replaceLinkHolders().
+        *
+        * Returns an array which can be serialized and stored persistently. This
+        * array can later be loaded into another parser instance with
+        * unserializeHalfParsedText(). The text can then be safely incorporated into
+        * the return value of a parser hook.
+        *
+        * @return array
+        */
+       function serializeHalfParsedText( $text ) {
+               wfProfileIn( __METHOD__ );
+               $data = array(
+                       'text' => $text,
+                       'version' => self::HALF_PARSED_VERSION,
+                       'stripState' => $this->mStripState->getSubState( $text ),
+                       'linkHolders' => $this->mLinkHolders->getSubArray( $text )
+               );
+               wfProfileOut( __METHOD__ );
                 return $data;
         }
  
         /**
-        * TODO: document
-        * @param $data Array
-        * @param $intPrefix String unique identifying prefix
+        * Load the parser state given in the $data array, which is assumed to
+        * have been generated by serializeHalfParsedText(). The text contents is
+        * extracted from the array, and its markers are transformed into markers
+        * appropriate for the current Parser instance. This transformed text is
+        * returned, and can be safely included in the return value of a parser
+        * hook.
+        *
+        * If the $data array has been stored persistently, the caller should first
+        * check whether it is still valid, by calling isValidHalfParsedText().
+        *
+        * @param $data Serialized data
          * @return String
          */
-       function unserialiseHalfParsedText( $data, $intPrefix = null ) {
-               if ( !$intPrefix ) {
-                       $intPrefix = self::getRandomString();
+       function unserializeHalfParsedText( $data ) {
+               if ( !isset( $data['version'] ) || $data['version'] != self::HALF_PARSED_VERSION ) {
+                       throw new MWException( __METHOD__.': invalid version' );
                 }
  
                 # First, extract the strip state.
-               $stripState = $data['stripstate'];
-               $this->mStripState->general->merge( $stripState->general );
-               $this->mStripState->nowiki->merge( $stripState->nowiki );
-
-               # Now, extract the text, and renumber links
-               $text = $data['text'];
-               $links = $data['linkholder'];
+               $texts = array( $data['text'] );
+               $texts = $this->mStripState->merge( $data['stripState'], $texts );
  
-               # Internal...
-               foreach ( $links['internal'] as $ns => $nsLinks ) {
-                       foreach ( $nsLinks as $key => $entry ) {
-                               $newKey = $intPrefix . '-' . $key;
-                               $this->mLinkHolders->internals[$ns][$newKey] = $entry;
-
-                               $text = str_replace( "<!--LINK $ns:$key-->", "<!--LINK $ns:$newKey-->", $text );
-                       }
-               }
-
-               # Interwiki...
-               foreach ( $links['interwiki'] as $key => $entry ) {
-                       $newKey = "$intPrefix-$key";
-                       $this->mLinkHolders->interwikis[$newKey] = $entry;
-
-                       $text = str_replace( "<!--IWLINK $key-->", "<!--IWLINK $newKey-->", $text );
-               }
+               # Now renumber links
+               $texts = $this->mLinkHolders->mergeForeign( $data['linkHolders'], $texts );
  
                 # Should be good to go.
-               return $text;
-       }
-}
-
-/**
- * @todo document, briefly.
- * @ingroup Parser
- */
-class StripState {
-       var $general, $nowiki;
-
-       function __construct() {
-               $this->general = new ReplacementArray;
-               $this->nowiki = new ReplacementArray;
-       }
-
-       function unstripGeneral( $text ) {
-               wfProfileIn( __METHOD__ );
-               do {
-                       $oldText = $text;
-                       $text = $this->general->replace( $text );
-               } while ( $text !== $oldText );
-               wfProfileOut( __METHOD__ );
-               return $text;
-       }
-
-       function unstripNoWiki( $text ) {
-               wfProfileIn( __METHOD__ );
-               do {
-                       $oldText = $text;
-                       $text = $this->nowiki->replace( $text );
-               } while ( $text !== $oldText );
-               wfProfileOut( __METHOD__ );
-               return $text;
+               return $texts[0];
         }
  
-       function unstripBoth( $text ) {
-               wfProfileIn( __METHOD__ );
-               do {
-                       $oldText = $text;
-                       $text = $this->general->replace( $text );
-                       $text = $this->nowiki->replace( $text );
-               } while ( $text !== $oldText );
-               wfProfileOut( __METHOD__ );
-               return $text;
-       }
-}
-
-/**
- * @todo document, briefly.
- * @ingroup Parser
- */
-class OnlyIncludeReplacer {
-       var $output = '';
-
-       function replace( $matches ) {
-               if ( substr( $matches[1], -1 ) === "\n" ) {
-                       $this->output .= substr( $matches[1], 0, -1 );
-               } else {
-                       $this->output .= $matches[1];
-               }
+       /**
+        * Returns true if the given array, presumed to be generated by
+        * serializeHalfParsedText(), is compatible with the current version of the
+        * parser.
+        *
+        * @param $data Array
+        *
+        * @return bool
+        */
+       function isValidHalfParsedText( $data ) {
+               return isset( $data['version'] ) && $data['version'] == self::HALF_PARSED_VERSION;
         }
  }