2008-09-27 11:42:28 +00:00
|
|
|
<?php
|
2010-02-24 14:00:23 +00:00
|
|
|
/**
|
2010-12-22 20:52:06 +00:00
|
|
|
*
|
2008-09-27 11:42:28 +00:00
|
|
|
*
|
2010-08-07 19:59:42 +00:00
|
|
|
* Created on Sep 27, 2008
|
|
|
|
|
*
|
2012-07-15 20:13:02 +00:00
|
|
|
* Copyright © 2008 Roan Kattouw "<Firstname>.<Lastname>@gmail.com"
|
2008-09-27 11:42:28 +00:00
|
|
|
*
|
|
|
|
|
* This program is free software; you can redistribute it and/or modify
|
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
|
|
|
* (at your option) any later version.
|
|
|
|
|
*
|
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
|
*
|
|
|
|
|
* You should have received a copy of the GNU General Public License along
|
|
|
|
|
* with this program; if not, write to the Free Software Foundation, Inc.,
|
2010-06-21 13:13:32 +00:00
|
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
2008-09-27 11:42:28 +00:00
|
|
|
* http://www.gnu.org/copyleft/gpl.html
|
2010-08-07 19:59:42 +00:00
|
|
|
*
|
|
|
|
|
* @file
|
2008-09-27 11:42:28 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
/**
 * A query module to list duplicates of the given file(s)
 *
 * Two files are reported as duplicates of each other when their rows in the
 * image table carry the same img_sha1 value but different names.
 *
 * @ingroup API
 */
class ApiQueryDuplicateFiles extends ApiQueryGeneratorBase {

	/**
	 * Passes 'df' to the parent constructor as this module's prefix.
	 *
	 * @param $query
	 * @param $moduleName string
	 */
	public function __construct( $query, $moduleName ) {
		parent::__construct( $query, $moduleName, 'df' );
	}

	/**
	 * Run the module as a property module: results are attached to the
	 * pages of the current page set.
	 */
	public function execute() {
		$this->run();
	}

	/**
	 * @param $params array
	 * @return string Always 'public'
	 */
	public function getCacheMode( $params ) {
		return 'public';
	}

	/**
	 * Run the module as a generator: the duplicates found are fed into
	 * $resultPageSet instead of being added to the result.
	 *
	 * @param $resultPageSet ApiPageSet
	 */
	public function executeGenerator( $resultPageSet ) {
		$this->run( $resultPageSet );
	}

	/**
	 * Shared implementation of execute() and executeGenerator().
	 *
	 * Self-joins the image table (i1 = requested file, i2 = duplicate) on
	 * img_sha1 and walks the rows in ( i1.img_name, i2.img_name ) order.
	 *
	 * @param $resultPageSet ApiPageSet If not null, duplicate titles are
	 *   collected and passed to populateFromTitles() on this object;
	 *   otherwise each duplicate is added as a sub item of its original.
	 * @return void
	 */
	private function run( $resultPageSet = null ) {
		$params = $this->extractRequestParams();
		$namespaces = $this->getPageSet()->getAllTitlesByNamespace();
		if ( empty( $namespaces[NS_FILE] ) ) {
			// No file titles were requested, so there is nothing to look up
			return;
		}
		// Keyed by file name; the mapped value is what addPageSubItem()
		// receives as the page to attach a duplicate to.
		$images = $namespaces[NS_FILE];
		$descending = ( $params['dir'] == 'descending' );

		$this->addTables( 'image', 'i1' );
		$this->addTables( 'image', 'i2' );
		$this->addFields( array(
			'i1.img_name AS orig_name',
			'i2.img_name AS dup_name',
			'i2.img_user_text AS dup_user_text',
			'i2.img_timestamp AS dup_timestamp'
		) );

		$this->addWhere( array(
			'i1.img_name' => array_keys( $images ),
			'i1.img_sha1 = i2.img_sha1',
			'i1.img_name != i2.img_name',
		) );

		if ( isset( $params['continue'] ) ) {
			// The continue value is "<original name>|<duplicate name>"
			$cont = explode( '|', $params['continue'] );
			if ( count( $cont ) != 2 ) {
				$this->dieUsage( 'Invalid continue param. You should pass the ' .
					'original value returned by the previous query', '_badcontinue' );
			}
			$op = $descending ? '<' : '>';
			$db = $this->getDB();
			$orig = $db->addQuotes( $cont[0] );
			$dup = $db->addQuotes( $cont[1] );
			// Resume at the ( original, duplicate ) pair named by the
			// continue value, that pair included.
			$this->addWhere(
				"i1.img_name $op $orig OR " .
				"(i1.img_name = $orig AND " .
				"i2.img_name $op= $dup)"
			);
		}

		$sort = ( $descending ? ' DESC' : '' );
		// Don't order by i1.img_name if it's constant in the WHERE clause.
		// This has to be decided from the names that actually go into the
		// WHERE clause ( $images ), not from the number of good titles in
		// the page set: the two can differ, and sorting by i2.img_name
		// alone while several i1.img_name values match would contradict
		// the ( i1, i2 ) ordering the continue condition relies on.
		if ( count( $images ) == 1 ) {
			$this->addOption( 'ORDER BY', 'i2.img_name' . $sort );
		} else {
			$this->addOption( 'ORDER BY', array(
				'i1.img_name' . $sort,
				'i2.img_name' . $sort
			) );
		}
		// Ask for one row more than the limit to detect whether more exist
		$this->addOption( 'LIMIT', $params['limit'] + 1 );

		$res = $this->select( __METHOD__ );
		$count = 0;
		$titles = array();
		foreach ( $res as $row ) {
			$continueValue = $row->orig_name . '|' . $row->dup_name;
			if ( ++$count > $params['limit'] ) {
				// We've reached the one extra which shows that
				// there are additional pages to be had. Stop here...
				$this->setContinueEnumParameter( 'continue', $continueValue );
				break;
			}
			if ( !is_null( $resultPageSet ) ) {
				$titles[] = Title::makeTitle( NS_FILE, $row->dup_name );
			} else {
				$r = array(
					'name' => $row->dup_name,
					'user' => $row->dup_user_text,
					'timestamp' => wfTimestamp( TS_ISO_8601, $row->dup_timestamp )
				);
				$fit = $this->addPageSubItem( $images[$row->orig_name], $r );
				if ( !$fit ) {
					// The item was not added; continue from this same row
					$this->setContinueEnumParameter( 'continue', $continueValue );
					break;
				}
			}
		}
		if ( !is_null( $resultPageSet ) ) {
			$resultPageSet->populateFromTitles( $titles );
		}
	}

	/**
	 * @return array Definitions of the limit, continue and dir parameters
	 */
	public function getAllowedParams() {
		return array(
			'limit' => array(
				ApiBase::PARAM_DFLT => 10,
				ApiBase::PARAM_TYPE => 'limit',
				ApiBase::PARAM_MIN => 1,
				ApiBase::PARAM_MAX => ApiBase::LIMIT_BIG1,
				ApiBase::PARAM_MAX2 => ApiBase::LIMIT_BIG2
			),
			'continue' => null,
			'dir' => array(
				ApiBase::PARAM_DFLT => 'ascending',
				ApiBase::PARAM_TYPE => array(
					'ascending',
					'descending'
				)
			),
		);
	}

	/**
	 * @return array Help text for each parameter, keyed by parameter name
	 */
	public function getParamDescription() {
		return array(
			'limit' => 'How many files to return',
			'continue' => 'When more results are available, use this to continue',
			'dir' => 'The direction in which to list',
		);
	}

	/**
	 * @return array Types of the properties of each result item; these are
	 *   the keys run() puts into every sub item
	 */
	public function getResultProperties() {
		return array(
			'' => array(
				'name' => 'string',
				'user' => 'string',
				'timestamp' => 'timestamp'
			)
		);
	}

	/**
	 * @return string
	 */
	public function getDescription() {
		return 'List all files that are duplicates of the given file(s)';
	}

	/**
	 * @return array The parent's errors plus the '_badcontinue' error
	 *   raised by run() for a malformed continue value
	 */
	public function getPossibleErrors() {
		return array_merge( parent::getPossibleErrors(), array(
			array( 'code' => '_badcontinue', 'info' => 'Invalid continue param. You should pass the original value returned by the previous query' ),
		) );
	}

	/**
	 * @return array Example request URLs
	 */
	public function getExamples() {
		return array(
			'api.php?action=query&titles=File:Albert_Einstein_Head.jpg&prop=duplicatefiles',
			'api.php?action=query&generator=allimages&prop=duplicatefiles',
		);
	}

	/**
	 * @return string
	 */
	public function getHelpUrls() {
		return 'https://www.mediawiki.org/wiki/API:Properties#duplicatefiles_.2F_df';
	}

	/**
	 * @return string
	 */
	public function getVersion() {
		return __CLASS__ . ': $Id$';
	}
}
|