Quick solution for problems with limit=max when using slow queries: allowing modules...
[lhc/web/wiklou.git] / includes / api / ApiQueryRevisions.php
1 <?php
2
3 /*
4 * Created on Sep 7, 2006
5 *
6 * API for MediaWiki 1.8+
7 *
8 * Copyright (C) 2006 Yuri Astrakhan <Firstname><Lastname>@gmail.com
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License along
21 * with this program; if not, write to the Free Software Foundation, Inc.,
22 * 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
23 * http://www.gnu.org/copyleft/gpl.html
24 */
25
// Stand-alone loading aid: when the MEDIAWIKI constant has not been defined,
// pull in the base class directly. The original author describes this as an
// Eclipse helper that is ignored in production.
if (defined('MEDIAWIKI') === false) {
	require_once 'ApiQueryBase.php';
}
30
/**
 * A query action to enumerate revisions of a given page, or show top revisions of multiple pages.
 * Various pieces of information may be shown - flags, comments, and the actual wiki markup of the rev.
 * In the enumeration mode, ranges of revisions may be requested and filtered.
 *
 * @addtogroup API
 */
class ApiQueryRevisions extends ApiQueryBase {

	// Which optional revision properties the client requested; set by execute()
	// and read by extractRowInfo().
	private $fld_ids = false, $fld_flags = false, $fld_timestamp = false, $fld_size = false,
		$fld_comment = false, $fld_user = false, $fld_content = false;

	// True when a rollback token must be attached to every returned revision.
	// Declared explicitly so it is never created as a dynamic property.
	private $tok_rollback = false;

	// True when revision text must be passed through the parser's preprocessor.
	// Only consulted when $fld_content is set.
	private $expandTemplates = false;

	/**
	 * Registers the module with the 'rv' parameter prefix.
	 *
	 * @param $query      Parent query object, handed to the base class unchanged
	 * @param $moduleName Name under which this module is registered
	 */
	public function __construct($query, $moduleName) {
		parent::__construct($query, $moduleName, 'rv');
	}

	/**
	 * Builds and runs the revision query for the current page set and stores one
	 * entry per revision under query / pages / <page id> / revisions in the result.
	 *
	 * Three modes are supported:
	 *  - enumeration mode: a range of revisions of exactly one page,
	 *  - revision-ID mode: the revisions named by the page set's revision IDs,
	 *  - latest-revision mode: the current revision of every good title.
	 *
	 * Invalid parameter combinations are reported through dieUsage().
	 */
	public function execute() {
		$limit = $startid = $endid = $start = $end = $dir = $prop = $user = $excludeuser = $token = null;
		$expandtemplates = false;
		extract($this->extractRequestParams(false));

		// If any of those parameters are used, work in 'enumeration' mode.
		// Enum mode can only be used when exactly one page is provided.
		// Enumerating revisions on multiple pages makes it extremely
		// difficult to manage continuations and requires additional SQL indexes.
		$enumRevMode = (
			!is_null($user) || !is_null($excludeuser) || !is_null($limit)
			|| !is_null($startid) || !is_null($endid) || $dir === 'newer'
			|| !is_null($start) || !is_null($end)
		);

		$pageSet = $this->getPageSet();
		$pageCount = $pageSet->getGoodTitleCount();
		$revCount = $pageSet->getRevisionCount();

		// Optimization -- nothing to do
		if ($revCount === 0 && $pageCount === 0)
			return;

		if ($revCount > 0 && $enumRevMode)
			$this->dieUsage('The revids= parameter may not be used with the list options (limit, startid, endid, dirNewer, user, excludeuser, start, end).', 'revids');

		if ($pageCount > 1 && $enumRevMode)
			$this->dieUsage('titles, pageids or a generator was used to supply multiple pages, but the limit, startid, endid, dirNewer, user, excludeuser, start and end parameters may only be used on a single page.', 'multpages');

		$this->addTables('revision');
		$this->addWhere('rev_deleted=0');

		// Turn the list of requested properties into a lookup table.
		$prop = array_flip($prop);

		// These fields are needed regardless of the client requesting them
		$this->addFields('rev_id');
		$this->addFields('rev_page');

		// Optional fields
		$this->fld_ids = isset($prop['ids']);
		// $this->addFieldsIf('rev_text_id', $this->fld_ids); // should this be exposed?
		$this->fld_flags = $this->addFieldsIf('rev_minor_edit', isset($prop['flags']));
		$this->fld_timestamp = $this->addFieldsIf('rev_timestamp', isset($prop['timestamp']));
		$this->fld_comment = $this->addFieldsIf('rev_comment', isset($prop['comment']));
		$this->fld_size = $this->addFieldsIf('rev_len', isset($prop['size']));

		// Reset on every run so a previous request's token flag cannot leak through.
		$this->tok_rollback = false;
		if (!is_null($token)) {
			$this->tok_rollback = $this->getTokenFlag($token, 'rollback');
		}

		if (isset($prop['user'])) {
			$this->addFields('rev_user');
			$this->addFields('rev_user_text');
			$this->fld_user = true;
		} else if ($this->tok_rollback) {
			// The rollback token is derived from the user name, so fetch it even
			// when the client did not ask for the user property.
			$this->addFields('rev_user_text');
		}

		if (isset($prop['content'])) {

			// For each page we will request, the user must have read rights for that page
			foreach ($pageSet->getGoodTitles() as $title) {
				if (!$title->userCanRead())
					$this->dieUsage(
						'The current user is not allowed to read ' . $title->getPrefixedText(),
						'accessdenied');
			}

			$this->addTables('text');
			$this->addWhere('rev_text_id=old_id');
			$this->addFields('old_id');
			$this->addFields('old_text');
			$this->addFields('old_flags');

			$this->fld_content = true;

			$this->expandTemplates = $expandtemplates;
		}

		// Requests that include content use the smaller pair of limits.
		$userMax = ($this->fld_content ? ApiBase::LIMIT_SML1 : ApiBase::LIMIT_BIG1);
		$botMax = ($this->fld_content ? ApiBase::LIMIT_SML2 : ApiBase::LIMIT_BIG2);

		// Strict comparison: only the literal string 'max' selects the maximum,
		// never an integer limit that happens to compare loosely equal to it.
		if ($limit === 'max') {
			$limit = $this->getMain()->canApiHighLimits() ? $botMax : $userMax;
			$this->getResult()->addValue('limits', 'limit', $limit);
		}

		if ($enumRevMode) {

			// This is mostly to prevent parameter errors (and optimize SQL?)
			if (!is_null($startid) && !is_null($start))
				$this->dieUsage('start and startid cannot be used together', 'badparams');

			if (!is_null($endid) && !is_null($end))
				$this->dieUsage('end and endid cannot be used together', 'badparams');

			if (!is_null($user) && !is_null($excludeuser))
				$this->dieUsage('user and excludeuser cannot be used together', 'badparams');

			// This code makes an assumption that sorting by rev_id and rev_timestamp produces
			// the same result. This way users may request revisions starting at a given time,
			// but to page through results use the rev_id returned after each page.
			// Switching to rev_id removes the potential problem of having more than
			// one row with the same timestamp for the same page.
			// The order needs to be the same as start parameter to avoid SQL filesort.
			if (is_null($startid) && is_null($endid))
				$this->addWhereRange('rev_timestamp', $dir, $start, $end);
			else
				$this->addWhereRange('rev_id', $dir, $startid, $endid);

			// must manually initialize unset limit
			if (is_null($limit))
				$limit = 10;
			$this->validateLimit('limit', $limit, 1, $userMax, $botMax);

			// There is only one ID, use it
			$this->addWhereFld('rev_page', current(array_keys($pageSet->getGoodTitles())));

			if (!is_null($user)) {
				$this->addWhereFld('rev_user_text', $user);
			} elseif (!is_null($excludeuser)) {
				$this->addWhere('rev_user_text != ' . $this->getDB()->addQuotes($excludeuser));
			}
		} elseif ($revCount > 0) {
			$this->validateLimit('rev_count', $revCount, 1, $userMax, $botMax);

			// Get all revision IDs
			$this->addWhereFld('rev_id', array_keys($pageSet->getRevisionIDs()));

			// assumption testing -- we should never get more than $revCount rows.
			$limit = $revCount;
		} elseif ($pageCount > 0) {
			// When working in multi-page non-enumeration mode,
			// limit to the latest revision only
			$this->addTables('page');
			$this->addWhere('page_id=rev_page');
			$this->addWhere('page_latest=rev_id');
			$this->validateLimit('page_count', $pageCount, 1, $userMax, $botMax);

			// Get all page IDs
			$this->addWhereFld('page_id', array_keys($pageSet->getGoodTitles()));

			// assumption testing -- we should never get more than $pageCount rows.
			$limit = $pageCount;
		} else
			ApiBase::dieDebug(__METHOD__, 'param validation?');

		// Ask for one row more than needed; its presence signals that a
		// continuation is required.
		$this->addOption('LIMIT', $limit + 1);

		$count = 0;
		$res = $this->select(__METHOD__);

		$db = $this->getDB();
		$result = $this->getResult();
		while ($row = $db->fetchObject($res)) {

			if (++$count > $limit) {
				// We've reached the one extra which shows that there are additional pages to be had. Stop here...
				if (!$enumRevMode)
					ApiBase::dieDebug(__METHOD__, 'Got more rows then expected'); // bug report
				$this->setContinueEnumParameter('startid', intval($row->rev_id));
				break;
			}

			$result->addValue(
				array(
					'query',
					'pages',
					intval($row->rev_page),
					'revisions'),
				null,
				$this->extractRowInfo($row));
		}
		$db->freeResult($res);

		// Ensure that all revisions are shown as '<rev>' elements
		if ($result->getIsRawMode()) {
			$data =& $result->getData();
			// Guard the lookup: iterating a missing key by reference would
			// create it inside the result data.
			if (isset($data['query']['pages']) && is_array($data['query']['pages'])) {
				foreach ($data['query']['pages'] as &$page) {
					if (is_array($page) && array_key_exists('revisions', $page)) {
						$result->setIndexedTagName($page['revisions'], 'rev');
					}
				}
				// Break the reference so later writes to $page cannot alter the last entry.
				unset($page);
			}
		}
	}

	/**
	 * Converts one database row into the array of values reported for a revision.
	 * Only the properties enabled by execute() are included.
	 *
	 * @param $row Row object from the revision query; the optional columns are
	 *             present only when execute() added them to the field list
	 * @return array Values for this revision (content, if requested, is attached
	 *               through ApiResult::setContent)
	 */
	private function extractRowInfo($row) {

		$vals = array();

		if ($this->fld_ids) {
			$vals['revid'] = intval($row->rev_id);
			// $vals['oldid'] = intval($row->rev_text_id); // todo: should this be exposed?
		}

		if ($this->fld_flags && $row->rev_minor_edit)
			$vals['minor'] = '';

		if ($this->fld_user) {
			$vals['user'] = $row->rev_user_text;
			if (!$row->rev_user)
				$vals['anon'] = '';
		}

		if ($this->fld_timestamp) {
			$vals['timestamp'] = wfTimestamp(TS_ISO_8601, $row->rev_timestamp);
		}

		if ($this->fld_size && !is_null($row->rev_len)) {
			$vals['size'] = intval($row->rev_len);
		}

		if ($this->fld_comment && !empty($row->rev_comment)) {
			$vals['comment'] = $row->rev_comment;
		}

		// The page title is needed both for the rollback token and for
		// template expansion; look it up only when one of them is requested.
		$title = null;
		if ($this->tok_rollback || ($this->fld_content && $this->expandTemplates)) {
			$title = Title::newFromID($row->rev_page);
			// NOTE(review): Title::newFromID is documented to return null for an
			// unknown page id; report that explicitly instead of failing on a
			// method call on null below. Assumes dieDebug() does not return - confirm.
			if (is_null($title))
				ApiBase::dieDebug(__METHOD__, 'No title found for page id ' . intval($row->rev_page));
		}

		if ($this->tok_rollback) {
			global $wgUser;
			$vals['rollbacktoken'] = $wgUser->editToken(array($title->getPrefixedText(), $row->rev_user_text));
		}

		if ($this->fld_content) {
			$text = Revision::getRevisionText($row);
			if ($this->expandTemplates) {
				global $wgParser;
				$text = $wgParser->preprocess($text, $title, new ParserOptions());
			}
			ApiResult::setContent($vals, $text);
		}
		return $vals;
	}

	/**
	 * Declares the parameters accepted by this module together with their
	 * types, defaults and limits.
	 *
	 * @return array Parameter name => settings
	 */
	protected function getAllowedParams() {
		return array(
			'prop' => array(
				ApiBase::PARAM_ISMULTI => true,
				ApiBase::PARAM_DFLT => 'ids|timestamp|flags|comment|user',
				ApiBase::PARAM_TYPE => array(
					'ids',
					'flags',
					'timestamp',
					'user',
					'size',
					'comment',
					'content',
				)
			),
			'limit' => array(
				ApiBase::PARAM_TYPE => 'limit',
				ApiBase::PARAM_MIN => 1,
				ApiBase::PARAM_MAX => ApiBase::LIMIT_BIG1,
				ApiBase::PARAM_MAX2 => ApiBase::LIMIT_BIG2
			),
			'startid' => array(
				ApiBase::PARAM_TYPE => 'integer'
			),
			'endid' => array(
				ApiBase::PARAM_TYPE => 'integer'
			),
			'start' => array(
				ApiBase::PARAM_TYPE => 'timestamp'
			),
			'end' => array(
				ApiBase::PARAM_TYPE => 'timestamp'
			),
			'dir' => array(
				ApiBase::PARAM_DFLT => 'older',
				ApiBase::PARAM_TYPE => array(
					'newer',
					'older'
				)
			),
			'user' => array(
				ApiBase::PARAM_TYPE => 'user'
			),
			'excludeuser' => array(
				ApiBase::PARAM_TYPE => 'user'
			),

			'expandtemplates' => false,
			'token' => array(
				ApiBase::PARAM_TYPE => array(
					'rollback'
				),
				ApiBase::PARAM_ISMULTI => true
			),
		);
	}

	/**
	 * Supplies the help text for each parameter. Parameters marked "(enum)"
	 * switch the module into single-page enumeration mode.
	 *
	 * @return array Parameter name => description
	 */
	protected function getParamDescription() {
		return array(
			'prop' => 'Which properties to get for each revision.',
			'limit' => 'limit how many revisions will be returned (enum)',
			'startid' => 'from which revision id to start enumeration (enum)',
			'endid' => 'stop revision enumeration on this revid (enum)',
			'start' => 'from which revision timestamp to start enumeration (enum)',
			'end' => 'enumerate up to this timestamp (enum)',
			'dir' => 'direction of enumeration - towards "newer" or "older" revisions (enum)',
			'user' => 'only include revisions made by user',
			'excludeuser' => 'exclude revisions made by user',
			'expandtemplates' => 'expand templates in revision content',
			'token' => 'Which tokens to obtain for each revision',
		);
	}

	/**
	 * Supplies the module-level help text.
	 *
	 * @return array Lines of the description
	 */
	protected function getDescription() {
		return array(
			'Get revision information.',
			'This module may be used in several ways:',
			' 1) Get data about a set of pages (last revision), by setting titles or pageids parameter.',
			' 2) Get revisions for one given page, by using titles/pageids with start/end/limit params.',
			' 3) Get data about a set of revisions by setting their IDs with revids parameter.',
			'All parameters marked as (enum) may only be used with a single page (#2).'
		);
	}

	/**
	 * Supplies example requests, each preceded by a line describing it.
	 * Requests without rvdir=newer use the default direction 'older' and
	 * therefore return the most recent revisions.
	 *
	 * @return array Alternating description and URL lines
	 */
	protected function getExamples() {
		return array(
			'Get data with content for the last revision of titles "API" and "Main Page":',
			' api.php?action=query&prop=revisions&titles=API|Main%20Page&rvprop=timestamp|user|comment|content',
			'Get last 5 revisions of the "Main Page":',
			' api.php?action=query&prop=revisions&titles=Main%20Page&rvlimit=5&rvprop=timestamp|user|comment',
			'Get first 5 revisions of the "Main Page":',
			' api.php?action=query&prop=revisions&titles=Main%20Page&rvlimit=5&rvprop=timestamp|user|comment&rvdir=newer',
			'Get first 5 revisions of the "Main Page" made after 2006-05-01:',
			' api.php?action=query&prop=revisions&titles=Main%20Page&rvlimit=5&rvprop=timestamp|user|comment&rvdir=newer&rvstart=20060501000000',
			'Get last 5 revisions of the "Main Page" that were not made by anonymous user "127.0.0.1"',
			' api.php?action=query&prop=revisions&titles=Main%20Page&rvlimit=5&rvprop=timestamp|user|comment&rvexcludeuser=127.0.0.1',
			'Get last 5 revisions of the "Main Page" that were made by the user "MediaWiki default"',
			' api.php?action=query&prop=revisions&titles=Main%20Page&rvlimit=5&rvprop=timestamp|user|comment&rvuser=MediaWiki%20default',
		);
	}

	/**
	 * Identifies this module's version: the class name followed by the
	 * version-control Id keyword.
	 *
	 * @return string
	 */
	public function getVersion() {
		return __CLASS__ . ': $Id$';
	}
}
388