X-Git-Url: https://git.cyclocoop.org/%27.WWW_URL.%27admin/?a=blobdiff_plain;f=maintenance%2FrefreshLinks.php;h=420f5553a413d63b44f4854bf3f521a092b284b7;hb=3112302c73dc1e30a114ee4ead4a6a4caab8b76a;hp=018e3d78c58e7dba21b4792461c24cc3c2e070ee;hpb=659778619cc12d156d3547834c0f90f407584104;p=lhc%2Fweb%2Fwiklou.git diff --git a/maintenance/refreshLinks.php b/maintenance/refreshLinks.php index 018e3d78c5..420f5553a4 100644 --- a/maintenance/refreshLinks.php +++ b/maintenance/refreshLinks.php @@ -1,5 +1,7 @@ getOption( 'm', 0 ); if ( !$this->hasOption( 'dfn-only' ) ) { $start = $this->getArg( 0, 1 ); $new = $this->getOption( 'new-only', false ); - $max = $this->getOption( 'm', false ); $end = $this->getOption( 'e', 0 ); $redir = $this->getOption( 'redirects-only', false ); $oldRedir = $this->getOption( 'old-redirects-only', false ); @@ -58,19 +60,17 @@ class RefreshLinks extends Maintenance { */ private function doRefreshLinks( $start, $newOnly = false, $maxLag = false, $end = 0, $redirectsOnly = false, $oldRedirectsOnly = false ) { - global $wgUser, $wgParser, $wgUseTidy; + global $wgParser, $wgUseTidy; $reportingInterval = 100; $dbr = wfGetDB( DB_SLAVE ); $start = intval( $start ); - # Don't generate TeX PNGs (lack of a sensible current directory causes errors anyway) - $wgUser->setOption( 'math', MW_MATH_SOURCE ); + // Give extensions a chance to optimize settings + wfRunHooks( 'MaintenanceRefreshLinksInit', array( $this ) ); # Don't generate extension images (e.g. Timeline) - if ( method_exists( $wgParser, "clearTagHooks" ) ) { - $wgParser->clearTagHooks(); - } + $wgParser->clearTagHooks(); # Don't use HTML tidy $wgUseTidy = false; @@ -79,18 +79,31 @@ class RefreshLinks extends Maintenance { if ( $oldRedirectsOnly ) { # This entire code path is cut-and-pasted from below. Hurrah. - $res = $dbr->query( - "SELECT page_id " . - "FROM page " . - "LEFT JOIN redirect ON page_id=rd_from " . - "WHERE page_is_redirect=1 AND rd_from IS NULL AND " . - ( $end == 0 ? "page_id >= $start" - : "page_id BETWEEN $start AND $end" ), - __METHOD__ + + $conds = array( + "page_is_redirect=1", + "rd_from IS NULL" + ); + + if ( $end == 0 ) { + $conds[] = "page_id >= $start"; + } else { + $conds[] = "page_id BETWEEN $start AND $end"; + } + + $res = $dbr->select( + array( 'page', 'redirect' ), + 'page_id', + $conds, + __METHOD__, + array(), + array( 'redirect' => array( "LEFT JOIN", "page_id=rd_from" ) ) ); $num = $dbr->numRows( $res ); $this->output( "Refreshing $num old redirects from $start...\n" ); + $i = 0; + foreach ( $res as $row ) { if ( !( ++$i % $reportingInterval ) ) { $this->output( "$i\n" ); @@ -109,17 +122,18 @@ class RefreshLinks extends Maintenance { ); $num = $dbr->numRows( $res ); $this->output( "$num new articles...\n" ); - + $i = 0; foreach ( $res as $row ) { if ( !( ++$i % $reportingInterval ) ) { $this->output( "$i\n" ); wfWaitForSlaves( $maxLag ); } - if ( $redirectsOnly ) + if ( $redirectsOnly ) { $this->fixRedirect( $row->page_id ); - else - $this->fixLinksFromArticle( $row->page_id ); + } else { + self::fixLinksFromArticle( $row->page_id ); + } } } else { if ( !$end ) { @@ -129,9 +143,9 @@ class RefreshLinks extends Maintenance { } $this->output( "Refreshing redirects table.\n" ); $this->output( "Starting from page_id $start of $end.\n" ); - + for ( $id = $start; $id <= $end; $id++ ) { - + if ( !( $id % $reportingInterval ) ) { $this->output( "$id\n" ); wfWaitForSlaves( $maxLag ); @@ -144,12 +158,12 @@ class RefreshLinks extends Maintenance { $this->output( "Starting from page_id $start of $end.\n" ); for ( $id = $start; $id <= $end; $id++ ) { - + if ( !( $id % $reportingInterval ) ) { $this->output( "$id\n" ); wfWaitForSlaves( $maxLag ); } - $this->fixLinksFromArticle( $id ); + self::fixLinksFromArticle( $id ); } } } @@ -160,29 +174,27 @@ class RefreshLinks extends Maintenance { * @param $id int The page_id of the redirect */ private function fixRedirect( $id ) { - global $wgTitle, $wgArticle; - - $wgTitle = Title::newFromID( $id ); + $title = Title::newFromID( $id ); $dbw = wfGetDB( DB_MASTER ); - - if ( is_null( $wgTitle ) ) { + + if ( is_null( $title ) ) { // This page doesn't exist (any more) // Delete any redirect table entry for it $dbw->delete( 'redirect', array( 'rd_from' => $id ), __METHOD__ ); return; } - $wgArticle = new Article( $wgTitle ); - - $rt = $wgArticle->followRedirect(); - - if ( $rt == false || !is_object( $rt ) ) { - // $wgTitle is not a redirect + $article = new Article( $title ); + + $rt = $article->followRedirect(); + + if ( !$rt || !is_object( $rt ) ) { + // $title is not a redirect // Delete any redirect table entry for it $dbw->delete( 'redirect', array( 'rd_from' => $id ), __METHOD__ ); } else { - $wgArticle->updateRedirectOn( $dbw, $rt ); + $article->updateRedirectOn( $dbw, $rt ); } } @@ -190,28 +202,27 @@ class RefreshLinks extends Maintenance { * Run LinksUpdate for all links on a given page_id * @param $id int The page_id */ - private function fixLinksFromArticle( $id ) { - global $wgTitle, $wgParser; + public static function fixLinksFromArticle( $id ) { + global $wgParser; - $wgTitle = Title::newFromID( $id ); + $title = Title::newFromID( $id ); $dbw = wfGetDB( DB_MASTER ); - $linkCache =& LinkCache::singleton(); - $linkCache->clear(); + LinkCache::singleton()->clear(); - if ( is_null( $wgTitle ) ) { + if ( is_null( $title ) ) { return; } $dbw->begin(); - $revision = Revision::newFromTitle( $wgTitle ); + $revision = Revision::newFromTitle( $title ); if ( !$revision ) { return; } $options = new ParserOptions; - $parserOutput = $wgParser->parse( $revision->getText(), $wgTitle, $options, true, true, $revision->getId() ); - $update = new LinksUpdate( $wgTitle, $parserOutput, false ); + $parserOutput = $wgParser->parse( $revision->getText(), $title, $options, true, true, $revision->getId() ); + $update = new LinksUpdate( $title, $parserOutput, false ); $update->doUpdate(); $dbw->commit(); } @@ -280,4 +291,4 @@ class RefreshLinks extends Maintenance { } $maintClass = 'RefreshLinks'; -require_once( DO_MAINTENANCE ); +require_once( RUN_MAINTENANCE_IF_MAIN );