Merge "DatabaseMssql: Don't duplicate body of makeList()"
[mediawiki.git] / includes / api / ApiQueryDuplicateFiles.php
blob010f8d59a758658ef4e4149296dd8fcdfbb85ded
1 <?php
/**
 *
 *
 * Created on Sep 27, 2008
 *
 * Copyright © 2008 Roan Kattouw "<Firstname>.<Lastname>@gmail.com"
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 */
/**
 * A query module to list duplicates of the given file(s)
 *
 * @ingroup API
 */
class ApiQueryDuplicateFiles extends ApiQueryGeneratorBase {

	/**
	 * @param ApiQuery $query
	 * @param string $moduleName
	 */
	public function __construct( ApiQuery $query, $moduleName ) {
		// 'df' is handed to the parent constructor as its third argument
		// (presumably the parameter prefix -- confirm against the parent class).
		parent::__construct( $query, $moduleName, 'df' );
	}

	/**
	 * Run the module as a plain property query: results are added to the
	 * API result rather than to a page set.
	 */
	public function execute() {
		$this->run();
	}

	/**
	 * @param array $params Not consulted; the same mode is returned for every request
	 * @return string Always 'public'
	 */
	public function getCacheMode( $params ) {
		return 'public';
	}

	/**
	 * Run the module as a generator: the titles of the duplicates found are
	 * fed into $resultPageSet instead of the API result.
	 *
	 * @param ApiPageSet $resultPageSet
	 */
	public function executeGenerator( $resultPageSet ) {
		$this->run( $resultPageSet );
	}

	/**
	 * Shared implementation of execute() and executeGenerator().
	 *
	 * For every NS_FILE title in the page set, looks up the file's SHA-1 and
	 * then every file sharing that hash. Each duplicate is either appended as
	 * a sub-item of the originating page (plain mode) or collected as a title
	 * for $resultPageSet (generator mode). The 'continue' parameter has the
	 * form "<image>|<duplicate name>".
	 *
	 * @param ApiPageSet $resultPageSet Page set to populate in generator mode,
	 *   or null to write into the API result
	 */
	private function run( $resultPageSet = null ) {
		$params = $this->extractRequestParams();
		$namespaces = $this->getPageSet()->getGoodAndMissingTitlesByNamespace();
		if ( empty( $namespaces[NS_FILE] ) ) {
			return;
		}
		$images = $namespaces[NS_FILE];
		$descending = ( $params['dir'] == 'descending' );

		if ( $descending ) {
			// $images is keyed by file name; preserve the keys so that names
			// PHP stores as integer keys are not renumbered by the reversal.
			$images = array_reverse( $images, true );
		}

		$skipUntilThisDup = false;
		if ( isset( $params['continue'] ) ) {
			$cont = explode( '|', $params['continue'] );
			$this->dieContinueUsageIf( count( $cont ) != 2 );
			$fromImage = $cont[0];
			$skipUntilThisDup = $cont[1];
			// Filter out any images before $fromImage
			// NOTE(review): this '<' test (and the one on $dupName below) looks
			// like it assumes ascending name order; with dir=descending the
			// list has been reversed, so it may not skip the intended
			// entries -- confirm.
			foreach ( $images as $image => $pageId ) {
				if ( $image < $fromImage ) {
					unset( $images[$image] );
				} else {
					break;
				}
			}
		}

		// Both lookups below go either to the local repo only or to the whole
		// repo group, depending on 'localonly'.
		$repo = $params['localonly']
			? RepoGroup::singleton()->getLocalRepo()
			: RepoGroup::singleton();

		$filesToFind = array_keys( $images );
		$files = $repo->findFiles( $filesToFind );

		$fit = true;
		$count = 0;
		$titles = array();

		// Map of file name => SHA-1 for every requested file that was found
		$sha1s = array();
		foreach ( $files as $file ) {
			/** @var $file File */
			$sha1s[$file->getName()] = $file->getSha1();
		}

		// find all files with the hashes, result format is:
		// array( hash => array( dup1, dup2 ), hash1 => ... )
		$filesToFindBySha1s = array_unique( array_values( $sha1s ) );
		$filesBySha1s = $repo->findBySha1s( $filesToFindBySha1s );

		// iterate over $images to handle continue param correct
		foreach ( $images as $image => $pageId ) {
			if ( !isset( $sha1s[$image] ) ) {
				continue; //file does not exist
			}
			$sha1 = $sha1s[$image];
			if ( !isset( $filesBySha1s[$sha1] ) ) {
				// The hash lookup returned nothing for this file; skip it
				// instead of reading an undefined index.
				continue;
			}
			$dupFiles = $filesBySha1s[$sha1];
			if ( $descending ) {
				$dupFiles = array_reverse( $dupFiles );
			}
			/** @var $dupFile File */
			foreach ( $dupFiles as $dupFile ) {
				$dupName = $dupFile->getName();
				if ( $image == $dupName && $dupFile->isLocal() ) {
					continue; //ignore the local file itself
				}
				if ( $skipUntilThisDup !== false && $dupName < $skipUntilThisDup ) {
					continue; //skip to pos after the image from continue param
				}
				// The continuation point has been reached; stop skipping
				$skipUntilThisDup = false;
				if ( ++$count > $params['limit'] ) {
					$fit = false; //break outer loop
					// We're one over limit which shows that
					// there are additional images to be had. Stop here...
					$this->setContinueEnumParameter( 'continue', $image . '|' . $dupName );
					break;
				}
				if ( $resultPageSet !== null ) {
					$titles[] = $dupFile->getTitle();
				} else {
					$r = array(
						'name' => $dupName,
						'user' => $dupFile->getUser( 'text' ),
						'timestamp' => wfTimestamp( TS_ISO_8601, $dupFile->getTimestamp() )
					);
					if ( !$dupFile->isLocal() ) {
						$r['shared'] = '';
					}
					$fit = $this->addPageSubItem( $pageId, $r );
					if ( !$fit ) {
						// The item was not added; resume from this duplicate next time
						$this->setContinueEnumParameter( 'continue', $image . '|' . $dupName );
						break;
					}
				}
			}
			if ( !$fit ) {
				break;
			}
		}
		if ( $resultPageSet !== null ) {
			$resultPageSet->populateFromTitles( $titles );
		}
	}

	/**
	 * @return array Parameter definitions for 'limit', 'continue', 'dir' and 'localonly'
	 */
	public function getAllowedParams() {
		return array(
			'limit' => array(
				ApiBase::PARAM_DFLT => 10,
				ApiBase::PARAM_TYPE => 'limit',
				ApiBase::PARAM_MIN => 1,
				ApiBase::PARAM_MAX => ApiBase::LIMIT_BIG1,
				ApiBase::PARAM_MAX2 => ApiBase::LIMIT_BIG2
			),
			'continue' => array(
				ApiBase::PARAM_HELP_MSG => 'api-help-param-continue',
			),
			'dir' => array(
				ApiBase::PARAM_DFLT => 'ascending',
				ApiBase::PARAM_TYPE => array(
					'ascending',
					'descending'
				)
			),
			'localonly' => false,
		);
	}

	/**
	 * @return array Map of example query string => help message key
	 */
	protected function getExamplesMessages() {
		return array(
			'action=query&titles=File:Albert_Einstein_Head.jpg&prop=duplicatefiles'
				=> 'apihelp-query+duplicatefiles-example-simple',
			'action=query&generator=allimages&prop=duplicatefiles'
				=> 'apihelp-query+duplicatefiles-example-generated',
		);
	}

	/**
	 * @return string URL of the on-wiki documentation for this module
	 */
	public function getHelpUrls() {
		return 'https://www.mediawiki.org/wiki/API:Properties#duplicatefiles_.2F_df';
	}
}