3 * Updater for link tracking tables after a page deletion.
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
22 use MediaWiki\MediaWikiServices
;
23 use Wikimedia\ScopedCallback
;
24 use Wikimedia\Rdbms\IDatabase
;
27 * Update object handling the cleanup of links tables after a page was deleted.
29 class LinksDeletionUpdate
extends DataUpdate
implements EnqueueableDataUpdate
{
41 * @param WikiPage $page Page we are updating
42 * @param int|null $pageId ID of the page we are updating [optional]
43 * @param string|null $timestamp TS_MW timestamp of deletion
46 function __construct( WikiPage
$page, $pageId = null, $timestamp = null ) {
// Determines which page ID this update cleans up after and records the
// deletion timestamp.
47 parent
::__construct();
// Preferred source: the page ID handed in by the caller.
// NOTE(review): the condition guarding this branch is on a line that is not
// visible in this excerpt.
51 $this->pageId
= $pageId; // page ID at time of deletion
52 } elseif ( $page->exists() ) {
// Fallback: the page still exists, so its current ID can be read directly.
53 $this->pageId
= $page->getId();
// Reached when no page ID could be determined (see the exception message).
55 throw new InvalidArgumentException( "Page ID not known. Page doesn't exist?" );
// A falsy $timestamp (including the null default) is replaced by the current time.
58 $this->timestamp
= $timestamp ?
: wfTimestampNow();
/**
 * Clean up the database rows that refer to the deleted page.
 *
 * Steps visible in this method, in order: delete the page's
 * page_restrictions rows, update category counts in batches, schedule a
 * deferred count refresh when the deleted page is itself a category,
 * batch-delete rows keyed by pl_from, il_from, cl_from, tl_from, el_from,
 * ll_from and iwl_from, delete the redirect and page_props rows, and delete
 * the matching recentchanges rows by rc_id.
 *
 * Where work is split into more than one batch, each batch is followed by
 * commitAndWaitForReplication() using $this->ticket.
 */
61 public function doUpdate() {
62 $services = MediaWikiServices
::getInstance();
63 $config = $services->getMainConfig();
64 $lbFactory = $services->getDBLoadBalancerFactory();
// Chunk size used below for the category and recentchanges batches.
65 $batchSize = $config->get( 'UpdateRowsPerQuery' );
67 // Page may already be deleted, so don't just getId()
// NOTE(review): the assignment of $id is on a line that is not visible in
// this excerpt; presumably it is the page ID stored by the constructor.
// The page lock below is only acquired when $this->ticket is set.
70 if ( $this->ticket
) {
71 // Make sure all links update threads see the changes of each other.
72 // This handles the case when updates have to be batched into several COMMITs.
73 $scopedLock = LinksUpdate
::acquirePageLock( $this->getDB(), $id );
76 $title = $this->page
->getTitle();
77 $dbw = $this->getDB(); // convenience
79 // Delete restrictions for it
80 $dbw->delete( 'page_restrictions', [ 'pr_page' => $id ], __METHOD__
);
82 // Fix category table counts
83 $cats = $dbw->selectFieldValues(
// NOTE(review): the arguments of the selectFieldValues() call above are on
// lines that are not visible in this excerpt.
89 $catBatches = array_chunk( $cats, $batchSize );
90 foreach ( $catBatches as $catBatch ) {
91 $this->page
->updateCategoryCounts( [], $catBatch, $id );
// Only commit between batches when the work was actually split up.
92 if ( count( $catBatches ) > 1 ) {
93 $lbFactory->commitAndWaitForReplication(
94 __METHOD__
, $this->ticket
, [ 'wiki' => $dbw->getWikiID() ]
99 // Refresh the category table entry if it seems to have no pages. Check
100 // master for the most up-to-date cat_pages count.
101 if ( $title->getNamespace() === NS_CATEGORY
) {
102 $row = $dbw->selectRow(
104 [ 'cat_id', 'cat_title', 'cat_pages', 'cat_subcats', 'cat_files' ],
105 [ 'cat_title' => $title->getDBkey(), 'cat_pages <= 0' ],
109 $cat = Category
::newFromRow( $row, $title );
110 // T166757: do the update after the main job DB commit
111 DeferredUpdates
::addCallableUpdate( function () use ( $cat ) {
112 $cat->refreshCounts();
// Remove this page's rows from each link table, selected by its *_from
// column. The table-name argument of each call (and the batch-size
// argument) is on a line that is not visible in this excerpt.
117 $this->batchDeleteByPK(
119 [ 'pl_from' => $id ],
120 [ 'pl_from', 'pl_namespace', 'pl_title' ],
123 $this->batchDeleteByPK(
125 [ 'il_from' => $id ],
126 [ 'il_from', 'il_to' ],
129 $this->batchDeleteByPK(
131 [ 'cl_from' => $id ],
132 [ 'cl_from', 'cl_to' ],
135 $this->batchDeleteByPK(
137 [ 'tl_from' => $id ],
138 [ 'tl_from', 'tl_namespace', 'tl_title' ],
141 $this->batchDeleteByPK(
143 [ 'el_from' => $id ],
147 $this->batchDeleteByPK(
149 [ 'll_from' => $id ],
150 [ 'll_from', 'll_lang' ],
153 $this->batchDeleteByPK(
155 [ 'iwl_from' => $id ],
156 [ 'iwl_from', 'iwl_prefix', 'iwl_title' ],
160 // Delete any redirect entry or page props entries
161 $dbw->delete( 'redirect', [ 'rd_from' => $id ], __METHOD__
);
162 $dbw->delete( 'page_props', [ 'pp_page' => $id ], __METHOD__
);
164 // Find recentchanges entries to clean up...
// First lookup: non-log entries matching the page's namespace and title,
// with a condition involving the deletion timestamp (the comparison itself
// is on a line that is not visible in this excerpt).
165 $rcIdsForTitle = $dbw->selectFieldValues(
169 'rc_type != ' . RC_LOG
,
170 'rc_namespace' => $title->getNamespace(),
171 'rc_title' => $title->getDBkey(),
173 $dbw->addQuotes( $dbw->timestamp( $this->timestamp
) )
// Second lookup: non-log entries tied to the page ID via rc_cur_id.
177 $rcIdsForPage = $dbw->selectFieldValues(
180 [ 'rc_type != ' . RC_LOG
, 'rc_cur_id' => $id ],
184 // T98706: delete by PK to avoid lock contention with RC delete log insertions
185 $rcIdBatches = array_chunk( array_merge( $rcIdsForTitle, $rcIdsForPage ), $batchSize );
186 foreach ( $rcIdBatches as $rcIdBatch ) {
187 $dbw->delete( 'recentchanges', [ 'rc_id' => $rcIdBatch ], __METHOD__
);
// As with the category batches, commit only when there are several batches.
188 if ( count( $rcIdBatches ) > 1 ) {
189 $lbFactory->commitAndWaitForReplication(
190 __METHOD__
, $this->ticket
, [ 'wiki' => $dbw->getWikiID() ]
195 // Commit and release the lock (if set)
196 ScopedCallback
::consume( $scopedLock );
/**
 * Delete the rows of $table that match $conds, addressing each row by its
 * key fields rather than by $conds directly.
 *
 * The $pk fields of every matching row are selected first. Each row is turned
 * into one AND-ed condition, and the collected conditions are OR-ed together
 * for the DELETE. Once $bSize conditions have accumulated, a DELETE is issued
 * and followed by commitAndWaitForReplication(); conditions still pending
 * after the loop are deleted in a final statement.
 *
 * @param string $table Table to select from and delete from (type assumed;
 *   the call-site arguments are not visible here - TODO confirm)
 * @param array $conds Conditions selecting the rows to delete
 * @param array $pk Fields identifying a single row (the primary key, going
 *   by the method name)
 * @param int $bSize Number of row conditions that triggers a DELETE
 */
199 private function batchDeleteByPK( $table, array $conds, array $pk, $bSize ) {
200 $services = MediaWikiServices
::getInstance();
201 $lbFactory = $services->getDBLoadBalancerFactory();
202 $dbw = $this->getDB(); // convenience
204 $res = $dbw->select( $table, $pk, $conds, __METHOD__
);
// NOTE(review): the initialisation of $pkDeleteConds is on a line that is
// not visible in this excerpt.
207 foreach ( $res as $row ) {
// One AND-ed condition per row, built from the selected key fields.
208 $pkDeleteConds[] = $dbw->makeList( (array)$row, LIST_AND
);
// A full batch has accumulated: delete it and wait for replication.
209 if ( count( $pkDeleteConds ) >= $bSize ) {
210 $dbw->delete( $table, $dbw->makeList( $pkDeleteConds, LIST_OR
), __METHOD__
);
211 $lbFactory->commitAndWaitForReplication(
212 __METHOD__
, $this->ticket
, [ 'wiki' => $dbw->getWikiID() ]
// Delete whatever conditions are still pending after the loop.
218 if ( $pkDeleteConds ) {
219 $dbw->delete( $table, $dbw->makeList( $pkDeleteConds, LIST_OR
), __METHOD__
);
/**
 * Database handle accessor used by the other methods of this class.
 *
 * The visible statement stores a DB_MASTER connection obtained from wfGetDB()
 * in $this->db.
 * NOTE(review): the guard around that assignment and the return statement
 * are on lines that are not visible in this excerpt.
 */
223 protected function getDB() {
225 $this->db
= wfGetDB( DB_MASTER
);
231 public function getAsJobSpecification() {
233 'wiki' => $this->getDB()->getWikiID(),
234 'job' => new JobSpecification(
236 [ 'pageId' => $this->pageId
, 'timestamp' => $this->timestamp
],
237 [ 'removeDuplicates' => true ],
238 $this->page
->getTitle()