Prefix searches for users, not pages
[lhc/web/wiklou.git] / maintenance / fixSlaveDesync.php
1 <?php
2 /**
3 * This program is free software; you can redistribute it and/or modify
4 * it under the terms of the GNU General Public License as published by
5 * the Free Software Foundation; either version 2 of the License, or
6 * (at your option) any later version.
7 *
8 * This program is distributed in the hope that it will be useful,
9 * but WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 * GNU General Public License for more details.
12 *
13 * You should have received a copy of the GNU General Public License along
14 * with this program; if not, write to the Free Software Foundation, Inc.,
15 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
16 * http://www.gnu.org/copyleft/gpl.html
17 *
18 * @ingroup Maintenance
19 */
20
21 require_once( dirname( __FILE__ ) . '/Maintenance.php' );
22
/**
 * Maintenance script that looks for pages whose page_latest value differs
 * between the master database and a slave, and copies the missing revision
 * and text rows from whichever side has them to the side that lacks them.
 *
 * The list of slave server indexes to inspect is kept in the global
 * $slaveIndexes, which execute() fills in before any other method runs.
 */
class FixSlaveDesync extends Maintenance {
	/**
	 * Set up the script and its help text.
	 */
	public function __construct() {
		parent::__construct();
		$this->mDescription = "Find pages whose page_latest differs between the master and a slave, " .
			"and copy the missing revision and text rows across";
	}

	/**
	 * Entry point.
	 *
	 * Collects the indexes of all configured servers (starting at index 1)
	 * for which the load balancer reports a non-zero load, then either fixes
	 * the single page whose ID was given as the first command line argument,
	 * or scans for desynchronised pages and fixes each one found.
	 */
	public function execute() {
		global $slaveIndexes, $wgDBservers;

		$slaveIndexes = array();
		$lb = wfGetLB();
		$serverCount = count( $wgDBservers );
		# Index 0 is skipped on purpose; presumably it is the master -- confirm
		# against the $wgDBservers layout in use.
		for ( $i = 1; $i < $serverCount; $i++ ) {
			if ( $lb->isNonZeroLoad( $i ) ) {
				$slaveIndexes[] = $i;
			}
		}

		if ( $this->hasArg() ) {
			$this->desyncFixPage( $this->getArg() );
			return;
		}

		$corrupt = $this->findPageLatestCorruption();
		foreach ( $corrupt as $id => $dummy ) {
			$this->desyncFixPage( $id );
		}
	}

	/**
	 * Find all pages that have a corrupted page_latest
	 *
	 * Reads (page_id, page_latest) for every page below the ID bound from the
	 * master, then runs the same query on each slave listed in $slaveIndexes
	 * and reports every page whose page_latest differs from the master's.
	 * Pages that exist on a slave but were not returned by the master are
	 * ignored.
	 *
	 * @param $maxPageId int Exclusive upper bound on page_id to examine.
	 *   NOTE(review): the default 6054123 is the value that used to be
	 *   hard-coded in both queries; its origin is not visible here -- confirm
	 *   whether a bound is still wanted at all.
	 * @return array Map of page_id => true for each desynchronised page
	 */
	private function findPageLatestCorruption( $maxPageId = 6054123 ) {
		global $slaveIndexes;

		$fields = array( 'page_id', 'page_latest' );
		$conds = array( 'page_id<' . intval( $maxPageId ) );

		# Load the reference values from the master
		$dbw = wfGetDB( DB_MASTER );
		$res = $dbw->select( 'page', $fields, $conds, __METHOD__ );
		$this->output( "Number of pages: " . $dbw->numRows( $res ) . "\n" );
		$masterIDs = array();
		$n = 0;
		foreach ( $res as $row ) {
			$masterIDs[$row->page_id] = $row->page_latest;
			# Progress indicator, rewritten in place every 10000 rows
			if ( !( ++$n % 10000 ) ) {
				$this->output( "$n\r" );
			}
		}
		$this->output( "\n" );

		# Compare every slave against the master values
		$desync = array();
		foreach ( $slaveIndexes as $i ) {
			$db = wfGetDB( $i );
			$res = $db->select( 'page', $fields, $conds, __METHOD__ );
			foreach ( $res as $row ) {
				if ( isset( $masterIDs[$row->page_id] ) && $masterIDs[$row->page_id] != $row->page_latest ) {
					$desync[$row->page_id] = true;
					$this->output( $row->page_id . "\t" );
				}
			}
		}
		$this->output( "\n" );
		return $desync;
	}

	/**
	 * Fix a broken page entry
	 *
	 * Runs inside a master transaction that is committed on every return
	 * path. The steps are:
	 *  1. Compare the master's page_latest with each slave's; stop at the
	 *     first slave that disagrees while the master value is below that
	 *     slave's highest rev_id.
	 *  2. Compare the page's revision IDs on the master and on that slave.
	 *     If the slave has more revisions, the rows are copied slave to
	 *     master; otherwise they are copied from the master to every slave
	 *     in $slaveIndexes.
	 *  3. Copy each missing revision row and its text row. A row that cannot
	 *     be read from the source server is reported and skipped.
	 *  4. When copying to the slaves, set page_latest on every slave to the
	 *     master's value.
	 *
	 * @param $pageID int The page_id to fix
	 */
	private function desyncFixPage( $pageID ) {
		global $slaveIndexes;

		# Check for a corrupted page_latest
		$dbw = wfGetDB( DB_MASTER );
		$dbw->begin();
		$realLatest = $dbw->selectField( 'page', 'page_latest', array( 'page_id' => $pageID ),
			__METHOD__, 'FOR UPDATE' );
		# list( $masterFile, $masterPos ) = $dbw->getMasterPos();
		$found = false;
		foreach ( $slaveIndexes as $i ) {
			$db = wfGetDB( $i );
			/*
			if ( !$db->masterPosWait( $masterFile, $masterPos, 10 ) ) {
				$this->output( "Slave is too lagged, aborting\n" );
				$dbw->commit();
				sleep(10);
				return;
			}*/
			$latest = $db->selectField( 'page', 'page_latest', array( 'page_id' => $pageID ), __METHOD__ );
			$max = $db->selectField( 'revision', 'MAX(rev_id)', false, __METHOD__ );
			if ( $latest != $realLatest && $realLatest < $max ) {
				$this->output( "page_latest corrupted in page $pageID, server $i\n" );
				$found = true;
				# $db keeps pointing at the slave that disagreed; it is used below
				break;
			}
		}
		if ( !$found ) {
			$this->output( "page_id $pageID seems fine\n" );
			$dbw->commit();
			return;
		}

		# Find the missing revisions
		$res = $dbw->select( 'revision', array( 'rev_id' ), array( 'rev_page' => $pageID ),
			__METHOD__, 'FOR UPDATE' );
		$masterIDs = array();
		foreach ( $res as $row ) {
			$masterIDs[] = $row->rev_id;
		}

		$res = $db->select( 'revision', array( 'rev_id' ), array( 'rev_page' => $pageID ), __METHOD__ );
		$slaveIDs = array();
		foreach ( $res as $row ) {
			$slaveIDs[] = $row->rev_id;
		}

		# The side holding fewer revisions of the page is the one to be filled in
		$toMaster = count( $masterIDs ) < count( $slaveIDs );
		if ( $toMaster ) {
			$missingIDs = array_diff( $slaveIDs, $masterIDs );
			$dbFrom = $db;
			$message = "Found " . count( $missingIDs ) . " lost in master, copying from slave... ";
		} else {
			$missingIDs = array_diff( $masterIDs, $slaveIDs );
			$dbFrom = $dbw;
			$message = "Found " . count( $missingIDs ) . " missing revision(s), copying from master... ";
		}
		$found = count( $missingIDs ) > 0;

		if ( $found ) {
			$this->output( $message );
			foreach ( $missingIDs as $rid ) {
				$this->output( "$rid " );

				# Revision
				$revRow = $dbFrom->selectRow( 'revision', '*', array( 'rev_id' => $rid ), __METHOD__ );
				if ( !$revRow ) {
					# Nothing to copy; do not hand a non-object to get_object_vars()
					$this->output( "revision row not found on the source server, skipping\n" );
					continue;
				}
				if ( $toMaster ) {
					$id = $dbw->selectField( 'revision', 'rev_id', array( 'rev_id' => $rid ),
						__METHOD__, 'FOR UPDATE' );
					if ( $id ) {
						# The ID is already taken on the master: give up on this page
						$this->output( "Revision already exists\n" );
						$found = false;
						break;
					}
					$dbw->insert( 'revision', get_object_vars( $revRow ), __METHOD__, 'IGNORE' );
				} else {
					foreach ( $slaveIndexes as $i ) {
						$slave = wfGetDB( $i );
						$slave->insert( 'revision', get_object_vars( $revRow ), __METHOD__, 'IGNORE' );
					}
				}

				# Text
				$textRow = $dbFrom->selectRow( 'text', '*', array( 'old_id' => $revRow->rev_text_id ), __METHOD__ );
				if ( !$textRow ) {
					$this->output( "text row not found on the source server, skipping\n" );
					continue;
				}
				if ( $toMaster ) {
					$dbw->insert( 'text', get_object_vars( $textRow ), __METHOD__, 'IGNORE' );
				} else {
					foreach ( $slaveIndexes as $i ) {
						$slave = wfGetDB( $i );
						$slave->insert( 'text', get_object_vars( $textRow ), __METHOD__, 'IGNORE' );
					}
				}
			}
			$this->output( "done\n" );
		}

		if ( $found ) {
			$this->output( "Fixing page_latest... " );
			if ( !$toMaster ) {
				foreach ( $slaveIndexes as $i ) {
					$slave = wfGetDB( $i );
					$slave->update( 'page', array( 'page_latest' => $realLatest ), array( 'page_id' => $pageID ), __METHOD__ );
				}
			}
			# The master-side update is currently disabled:
			# $dbw->update( 'page', array( 'page_latest' => $realLatest ), array( 'page_id' => $pageID ), __METHOD__ );
			$this->output( "done\n" );
		}
		$dbw->commit();
	}
}
208
// Name the class the maintenance bootstrap should instantiate, then hand
// control over to the bootstrap file.
$maintClass = 'FixSlaveDesync';
require_once DO_MAINTENANCE;