Replace TYPE= with ENGINE= (supported since 4.0; TYPE deprecated since 4.1)
[lhc/web/wiklou.git] / includes / Export.php
index 7f34a80..88ef6e3 100644 (file)
@@ -1,17 +1,17 @@
 <?php
 # Copyright (C) 2003, 2005 Brion Vibber <brion@pobox.com>
 # http://www.mediawiki.org/
-# 
+#
 # This program is free software; you can redistribute it and/or modify
 # it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or 
+# the Free Software Foundation; either version 2 of the License, or
 # (at your option) any later version.
-# 
+#
 # This program is distributed in the hope that it will be useful,
 # but WITHOUT ANY WARRANTY; without even the implied warranty of
 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 # GNU General Public License for more details.
-# 
+#
 # You should have received a copy of the GNU General Public License along
 # with this program; if not, write to the Free Software Foundation, Inc.,
 # 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
@@ -31,6 +31,9 @@ define( 'MW_EXPORT_CURRENT',  1 );
 define( 'MW_EXPORT_BUFFER',   0 );
 define( 'MW_EXPORT_STREAM',   1 );
 
+define( 'MW_EXPORT_TEXT',     0 );
+define( 'MW_EXPORT_STUB',     1 );
+
 
 /**
  * @package MediaWiki
@@ -49,14 +52,15 @@ class WikiExporter {
         * @param int $buffer one of MW_EXPORT_BUFFER or MW_EXPORT_STREAM
         */
        function WikiExporter( &$db, $history = MW_EXPORT_CURRENT,
-                       $buffer = MW_EXPORT_BUFFER ) {
+                       $buffer = MW_EXPORT_BUFFER, $text = MW_EXPORT_TEXT ) {
                $this->db =& $db;
                $this->history = $history;
                $this->buffer  = $buffer;
                $this->writer  = new XmlDumpWriter();
                $this->sink    = new DumpOutput();
+               $this->text    = $text;
        }
-       
+
        /**
         * Set the DumpOutput or DumpFilter object which will receive
         * various row objects and XML output for filtering. Filters
@@ -67,7 +71,7 @@ class WikiExporter {
        function setOutputSink( &$sink ) {
                $this->sink =& $sink;
        }
-       
+
        function openStream() {
                $output = $this->writer->openStream();
                $this->sink->writeOpenStream( $output );
@@ -86,7 +90,7 @@ class WikiExporter {
        function allPages() {
                return $this->dumpFrom( '' );
        }
-       
+
        /**
         * Dumps a series of page and revision records for those pages
         * in the database falling within the page_id range given.
@@ -101,7 +105,7 @@ class WikiExporter {
                }
                return $this->dumpFrom( $condition );
        }
-       
+
        /**
         * @param Title $title
         */
@@ -110,7 +114,7 @@ class WikiExporter {
                        'page_namespace=' . $title->getNamespace() .
                        ' AND page_title=' . $this->db->addQuotes( $title->getDbKey() ) );
        }
-       
+
        function pageByName( $name ) {
                $title = Title::newFromText( $name );
                if( is_null( $title ) ) {
@@ -119,24 +123,24 @@ class WikiExporter {
                        return $this->pageByTitle( $title );
                }
        }
-       
+
        function pagesByName( $names ) {
                foreach( $names as $name ) {
                        $this->pageByName( $name );
                }
        }
 
-       
+
        // -------------------- private implementation below --------------------
-       
+
        function dumpFrom( $cond = '' ) {
                $fname = 'WikiExporter::dumpFrom';
                wfProfileIn( $fname );
-               
+
                $page     = $this->db->tableName( 'page' );
                $revision = $this->db->tableName( 'revision' );
                $text     = $this->db->tableName( 'text' );
-               
+
                if( $this->history == MW_EXPORT_FULL ) {
                        $join = 'page_id=rev_page';
                } elseif( $this->history == MW_EXPORT_CURRENT ) {
@@ -146,7 +150,7 @@ class WikiExporter {
                        return new WikiError( "$fname given invalid history dump type." );
                }
                $where = ( $cond == '' ) ? '' : "$cond AND";
-               
+
                if( $this->buffer == MW_EXPORT_STREAM ) {
                        $prev = $this->db->bufferResults( false );
                }
@@ -158,23 +162,31 @@ class WikiExporter {
                        $pageindex = '';
                        $revindex = '';
                }
-               $result = $this->db->query(
-                       "SELECT * FROM
-                               $page $pageindex,
-                               $revision $revindex,
-                               $text
-                               WHERE $where $join AND rev_text_id=old_id
-                               ORDER BY page_id", $fname );
+               if( $this->text == MW_EXPORT_STUB ) {
+                       $sql = "SELECT * FROM
+                                       $page $pageindex,
+                                       $revision $revindex
+                                       WHERE $where $join
+                                       ORDER BY page_id";
+               } else {
+                       $sql = "SELECT * FROM
+                                       $page $pageindex,
+                                       $revision $revindex,
+                                       $text
+                                       WHERE $where $join AND rev_text_id=old_id
+                                       ORDER BY page_id";
+               }
+               $result = $this->db->query( $sql, $fname );
                $wrapper = $this->db->resultObject( $result );
                $this->outputStream( $wrapper );
-               
+
                if( $this->buffer == MW_EXPORT_STREAM ) {
                        $this->db->bufferResults( $prev );
                }
-               
+
                wfProfileOut( $fname );
        }
-       
+
        /**
         * Runs through a query result set dumping page and revision records.
         * The result set should be sorted/grouped by page to avoid duplicate
@@ -214,7 +226,7 @@ class WikiExporter {
 }
 
 class XmlDumpWriter {
-       
+
        /**
         * Returns the export schema version.
         * @return string
@@ -222,7 +234,7 @@ class XmlDumpWriter {
        function schemaVersion() {
                return "0.3";
        }
-       
+
        /**
         * Opens the XML output stream's root <mediawiki> element.
         * This does not include an xml directive, so is safe to include
@@ -247,7 +259,7 @@ class XmlDumpWriter {
                        "\n" .
                        $this->siteInfo();
        }
-       
+
        function siteInfo() {
                $info = array(
                        $this->sitename(),
@@ -259,29 +271,29 @@ class XmlDumpWriter {
                        implode( "\n    ", $info ) .
                        "\n  </siteinfo>\n";
        }
-       
+
        function sitename() {
                global $wgSitename;
                return wfElement( 'sitename', array(), $wgSitename );
        }
-       
+
        function generator() {
                global $wgVersion;
                return wfElement( 'generator', array(), "MediaWiki $wgVersion" );
        }
-       
+
        function homelink() {
                $page = Title::newFromText( wfMsgForContent( 'mainpage' ) );
                return wfElement( 'base', array(), $page->getFullUrl() );
        }
-       
+
        function caseSetting() {
                global $wgCapitalLinks;
                // "case-insensitive" option is reserved for future
                $sensitivity = $wgCapitalLinks ? 'first-letter' : 'case-sensitive';
                return wfElement( 'case', array(), $sensitivity );
        }
-       
+
        function namespaces() {
                global $wgContLang;
                $spaces = "  <namespaces>\n";
@@ -291,7 +303,7 @@ class XmlDumpWriter {
                $spaces .= "    </namespaces>";
                return $spaces;
        }
-       
+
        /**
         * Closes the output stream with the closing root element.
         * Call when finished dumping things.
@@ -300,7 +312,7 @@ class XmlDumpWriter {
                return "</mediawiki>\n";
        }
 
-       
+
        /**
         * Opens a <page> section on the output stream, with data
         * from the given database row.
@@ -320,7 +332,7 @@ class XmlDumpWriter {
                }
                return $out;
        }
-       
+
        /**
         * Closes a <page> section on the output stream.
         *
@@ -329,7 +341,7 @@ class XmlDumpWriter {
        function closePage() {
                return "  </page>\n";
        }
-       
+
        /**
         * Dumps a <revision> section on the output stream, with
         * data filled in from the given database row.
@@ -341,13 +353,13 @@ class XmlDumpWriter {
        function writeRevision( $row ) {
                $fname = 'WikiExporter::dumpRev';
                wfProfileIn( $fname );
-               
+
                $out  = "    <revision>\n";
                $out .= "      " . wfElement( 'id', null, strval( $row->rev_id ) ) . "\n";
-               
-               $ts = wfTimestamp2ISO8601( strval( $row->rev_timestamp ) );
+
+               $ts = wfTimestamp( TS_ISO_8601, $row->rev_timestamp );
                $out .= "      " . wfElement( 'timestamp', null, $ts ) . "\n";
-               
+
                $out .= "      <contributor>\n";
                if( $row->rev_user ) {
                        $out .= "        " . wfElementClean( 'username', null, strval( $row->rev_user_text ) ) . "\n";
@@ -356,21 +368,29 @@ class XmlDumpWriter {
                        $out .= "        " . wfElementClean( 'ip', null, strval( $row->rev_user_text ) ) . "\n";
                }
                $out .= "      </contributor>\n";
-               
+
                if( $row->rev_minor_edit ) {
                        $out .=  "      <minor/>\n";
                }
                if( $row->rev_comment != '' ) {
                        $out .= "      " . wfElementClean( 'comment', null, strval( $row->rev_comment ) ) . "\n";
                }
-       
-               $text = strval( Revision::getRevisionText( $row ) );
-               $out .= "      " . wfElementClean( 'text',
-                       array( 'xml:space' => 'preserve' ),
-                       strval( $text ) ) . "\n";
-               
+
+               if( isset( $row->old_text ) ) {
+                       // Raw text from the database may have invalid chars
+                       $text = strval( Revision::getRevisionText( $row ) );
+                       $out .= "      " . wfElementClean( 'text',
+                               array( 'xml:space' => 'preserve' ),
+                               strval( $text ) ) . "\n";
+               } else {
+                       // Stub output: no text was fetched, so emit an empty <text> element carrying only the rev_text_id
+                       $out .= "      " . wfElement( 'text',
+                               array( 'id' => $row->rev_text_id ),
+                               "" ) . "\n";
+               }
+
                $out .= "    </revision>\n";
-               
+
                wfProfileOut( $fname );
                return $out;
        }
@@ -385,23 +405,23 @@ class DumpOutput {
        function writeOpenStream( $string ) {
                $this->write( $string );
        }
-       
+
        function writeCloseStream( $string ) {
                $this->write( $string );
        }
-       
+
        function writeOpenPage( $page, $string ) {
                $this->write( $string );
        }
-       
+
        function writeClosePage( $string ) {
                $this->write( $string );
        }
-       
+
        function writeRevision( $rev, $string ) {
                $this->write( $string );
        }
-       
+
        /**
         * Override to write to a different stream type.
         * @return bool
@@ -416,11 +436,11 @@ class DumpOutput {
  */
 class DumpFileOutput extends DumpOutput {
        var $handle;
-       
+
        function DumpFileOutput( $file ) {
                $this->handle = fopen( $file, "wt" );
        }
-       
+
        function write( $string ) {
                fputs( $this->handle, $string );
        }
@@ -463,7 +483,7 @@ class DumpBZip2Output extends DumpPipeOutput {
  */
 class Dump7ZipOutput extends DumpPipeOutput {
        function Dump7ZipOutput( $file ) {
-               $command = "7za a -si " . wfEscapeShellArg( $file );
+               $command = "7za a -bd -si " . wfEscapeShellArg( $file );
                parent::DumpPipeOutput( $command );
        }
 }
@@ -479,35 +499,35 @@ class DumpFilter {
        function DumpFilter( &$sink ) {
                $this->sink =& $sink;
        }
-       
+
        function writeOpenStream( $string ) {
                $this->sink->writeOpenStream( $string );
        }
-       
+
        function writeCloseStream( $string ) {
                $this->sink->writeCloseStream( $string );
        }
-       
+
        function writeOpenPage( $page, $string ) {
                $this->sendingThisPage = $this->pass( $page, $string );
                if( $this->sendingThisPage ) {
                        $this->sink->writeOpenPage( $page, $string );
                }
        }
-       
+
        function writeClosePage( $string ) {
                if( $this->sendingThisPage ) {
                        $this->sink->writeClosePage( $string );
                        $this->sendingThisPage = false;
                }
        }
-       
+
        function writeRevision( $rev, $string ) {
                if( $this->sendingThisPage ) {
                        $this->sink->writeRevision( $rev, $string );
                }
        }
-       
+
        /**
         * Override for page-based filter types.
         * @return bool
@@ -522,7 +542,7 @@ class DumpFilter {
  */
 class DumpNotalkFilter extends DumpFilter {
        function pass( $page ) {
-               return Namespace::isTalk( $page->page_namespace );
+               return !Namespace::isTalk( $page->page_namespace );
        }
 }
 
@@ -531,11 +551,11 @@ class DumpNotalkFilter extends DumpFilter {
  */
 class DumpNamespaceFilter extends DumpFilter {
        var $invert = false;
-       var $match = array();
-       
+       var $namespaces = array();
+
        function DumpNamespaceFilter( &$sink, $param ) {
                parent::DumpFilter( $sink );
-               
+
                $constants = array(
                        "NS_MAIN"           => NS_MAIN,
                        "NS_TALK"           => NS_TALK,
@@ -553,24 +573,26 @@ class DumpNamespaceFilter extends DumpFilter {
                        "NS_HELP_TALK"      => NS_HELP_TALK,
                        "NS_CATEGORY"       => NS_CATEGORY,
                        "NS_CATEGORY_TALK"  => NS_CATEGORY_TALK );
-               
+
                if( $param{0} == '!' ) {
                        $this->invert = true;
                        $param = substr( $param, 1 );
                }
-               
+
                foreach( explode( ',', $param ) as $key ) {
                        $key = trim( $key );
-                       if( isset( $contants[$key] ) ) {
+                       if( isset( $constants[$key] ) ) {
                                $ns = $constants[$key];
                                $this->namespaces[$ns] = true;
                        } elseif( is_numeric( $key ) ) {
                                $ns = intval( $key );
                                $this->namespaces[$ns] = true;
+                       } else {
+                               wfDie( "Unrecognized namespace key '$key'\n" );
                        }
                }
        }
-       
+
        function pass( $page ) {
                $match = isset( $this->namespaces[$page->page_namespace] );
                return $this->invert xor $match;
@@ -583,12 +605,12 @@ class DumpNamespaceFilter extends DumpFilter {
  */
 class DumpLatestFilter extends DumpFilter {
        var $page, $pageString, $rev, $revString;
-       
+
        function writeOpenPage( $page, $string ) {
                $this->page = $page;
                $this->pageString = $string;
        }
-       
+
        function writeClosePage( $string ) {
                if( $this->rev ) {
                        $this->sink->writeOpenPage( $this->page, $this->pageString );
@@ -600,7 +622,7 @@ class DumpLatestFilter extends DumpFilter {
                $this->page = null;
                $this->pageString = null;
        }
-       
+
        function writeRevision( $rev, $string ) {
                if( $rev->rev_id == $this->page->page_latest ) {
                        $this->rev = $rev;
@@ -617,31 +639,31 @@ class DumpMultiWriter {
                $this->sinks = $sinks;
                $this->count = count( $sinks );
        }
-       
+
        function writeOpenStream( $string ) {
                for( $i = 0; $i < $this->count; $i++ ) {
                        $this->sinks[$i]->writeOpenStream( $string );
                }
        }
-       
+
        function writeCloseStream( $string ) {
                for( $i = 0; $i < $this->count; $i++ ) {
                        $this->sinks[$i]->writeCloseStream( $string );
                }
        }
-       
+
        function writeOpenPage( $page, $string ) {
                for( $i = 0; $i < $this->count; $i++ ) {
                        $this->sinks[$i]->writeOpenPage( $page, $string );
                }
        }
-       
+
        function writeClosePage( $string ) {
                for( $i = 0; $i < $this->count; $i++ ) {
                        $this->sinks[$i]->writeClosePage( $string );
                }
        }
-       
+
        function writeRevision( $rev, $string ) {
                for( $i = 0; $i < $this->count; $i++ ) {
                        $this->sinks[$i]->writeRevision( $rev, $string );
@@ -649,24 +671,17 @@ class DumpMultiWriter {
        }
 }
 
-
-
-function wfTimestamp2ISO8601( $ts ) {
-       #2003-08-05T18:30:02Z
-       return preg_replace( '/^(....)(..)(..)(..)(..)(..)$/', '$1-$2-$3T$4:$5:$6Z', wfTimestamp( TS_MW, $ts ) );
-}
-
 function xmlsafe( $string ) {
        $fname = 'xmlsafe';
        wfProfileIn( $fname );
-       
+
        /**
         * The page may contain old data which has not been properly normalized.
         * Invalid UTF-8 sequences or forbidden control characters will make our
         * XML output invalid, so be sure to strip them out.
         */
        $string = UtfNormal::cleanUp( $string );
-       
+
        $string = htmlspecialchars( $string );
        wfProfileOut( $fname );
        return $string;