]> scripts.mit.edu Git - autoinstalls/mediawiki.git/blob - includes/api/ApiQueryDuplicateFiles.php
MediaWiki 1.30.2-scripts2
[autoinstalls/mediawiki.git] / includes / api / ApiQueryDuplicateFiles.php
1 <?php
2 /**
3  *
4  *
5  * Created on Sep 27, 2008
6  *
7  * Copyright © 2008 Roan Kattouw "<Firstname>.<Lastname>@gmail.com"
8  *
9  * This program is free software; you can redistribute it and/or modify
10  * it under the terms of the GNU General Public License as published by
11  * the Free Software Foundation; either version 2 of the License, or
12  * (at your option) any later version.
13  *
14  * This program is distributed in the hope that it will be useful,
15  * but WITHOUT ANY WARRANTY; without even the implied warranty of
16  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17  * GNU General Public License for more details.
18  *
19  * You should have received a copy of the GNU General Public License along
20  * with this program; if not, write to the Free Software Foundation, Inc.,
21  * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
22  * http://www.gnu.org/copyleft/gpl.html
23  *
24  * @file
25  */
26
27 /**
28  * A query module to list duplicates of the given file(s)
29  *
30  * @ingroup API
31  */
class ApiQueryDuplicateFiles extends ApiQueryGeneratorBase {

	/**
	 * @param ApiQuery $query Query module this submodule belongs to
	 * @param string $moduleName Name this module is registered under
	 */
	public function __construct( ApiQuery $query, $moduleName ) {
		// 'df' is handed to the parent constructor as its third argument
		// (the parameter prefix in ApiQueryBase — see the MediaWiki API docs).
		parent::__construct( $query, $moduleName, 'df' );
	}

	/**
	 * Run without a result page set: duplicates are attached to the
	 * result as sub-items of the page they belong to.
	 */
	public function execute() {
		$this->run();
	}

	/**
	 * @param array $params Request parameters (unused here)
	 * @return string Always 'public'
	 */
	public function getCacheMode( $params ) {
		return 'public';
	}

	/**
	 * Run as a generator: the titles of the duplicates found are put into
	 * the given page set instead of being added to the result directly.
	 *
	 * @param ApiPageSet $resultPageSet Page set to populate
	 */
	public function executeGenerator( $resultPageSet ) {
		$this->run( $resultPageSet );
	}

	/**
	 * Shared implementation behind execute() and executeGenerator().
	 *
	 * For every title of the page set in the file namespace, looks up the
	 * file, collects all files having the same SHA-1 hash and reports them
	 * (excluding the local file itself). At most 'limit' duplicates are
	 * reported; when more are available, or when an item does not fit into
	 * the result, a continue value of the form "<image>|<duplicate>" is set.
	 *
	 * @param ApiPageSet|null $resultPageSet Page set to populate when used
	 *  as a generator, null when results go straight into the API result
	 */
	private function run( $resultPageSet = null ) {
		$params = $this->extractRequestParams();
		$namespaces = $this->getPageSet()->getGoodAndMissingTitlesByNamespace();
		if ( empty( $namespaces[NS_FILE] ) ) {
			return;
		}
		// Used below as a map of file name => page ID.
		$images = $namespaces[NS_FILE];

		$descending = $params['dir'] === 'descending';
		if ( $descending ) {
			// Preserve keys: a purely numeric file name is stored as an integer
			// key, which a plain array_reverse() would renumber from zero.
			$images = array_reverse( $images, true );
		}
		// Multiplying strcmp( $a, $b ) by this factor gives a negative number
		// exactly when $a comes before $b in the requested iteration order.
		$order = $descending ? -1 : 1;

		$skipUntilThisDup = false;
		if ( isset( $params['continue'] ) ) {
			$cont = explode( '|', $params['continue'] );
			$this->dieContinueUsageIf( count( $cont ) !== 2 );
			$fromImage = $cont[0];
			$skipUntilThisDup = $cont[1];
			// Drop the leading images that precede $fromImage in iteration
			// order. The comparison has to follow the direction, otherwise a
			// descending continuation re-processes images already returned.
			foreach ( $images as $image => $pageId ) {
				if ( $order * strcmp( (string)$image, $fromImage ) < 0 ) {
					unset( $images[$image] );
				} else {
					break;
				}
			}
		}

		// Both lookups below go either to the local repo only or to the whole
		// repo group, depending on the 'localonly' parameter.
		$repoGroup = RepoGroup::singleton();
		$finder = $params['localonly'] ? $repoGroup->getLocalRepo() : $repoGroup;

		$files = $finder->findFiles( array_keys( $images ) );

		// file name => SHA-1 hash, for every requested file that was found
		$sha1s = [];
		foreach ( $files as $file ) {
			/** @var File $file */
			$sha1s[$file->getName()] = $file->getSha1();
		}

		// find all files with the hashes, result format is:
		// [ hash => [ dup1, dup2 ], hash1 => ... ]
		$filesBySha1s = $finder->findBySha1s( array_unique( array_values( $sha1s ) ) );

		$fit = true;
		$count = 0;
		$titles = [];

		// Iterate over $images (not $files) so that the order matches the one
		// the continue parameter was generated from.
		foreach ( $images as $image => $pageId ) {
			if ( !isset( $sha1s[$image] ) ) {
				continue; // file does not exist
			}
			$sha1 = $sha1s[$image];
			if ( !isset( $filesBySha1s[$sha1] ) ) {
				// The hash lookup returned nothing for this file (e.g. an empty
				// hash); there is nothing to report, and indexing the missing
				// bucket would only raise notices.
				continue;
			}
			$dupFiles = $filesBySha1s[$sha1];
			if ( $descending ) {
				$dupFiles = array_reverse( $dupFiles );
			}
			/** @var File $dupFile */
			foreach ( $dupFiles as $dupFile ) {
				$dupName = $dupFile->getName();
				if ( (string)$image === (string)$dupName && $dupFile->isLocal() ) {
					continue; // ignore the local file itself
				}
				// Skip up to the duplicate named in the continue parameter.
				// NOTE(review): this relies on each hash bucket being ordered
				// by name before the optional reversal above — confirm against
				// findBySha1s().
				if ( $skipUntilThisDup !== false
					&& $order * strcmp( $dupName, $skipUntilThisDup ) < 0
				) {
					continue;
				}
				// The continue position only applies to the first image handled.
				$skipUntilThisDup = false;
				if ( ++$count > $params['limit'] ) {
					$fit = false; // break outer loop
					// We're one over limit which shows that
					// there are additional images to be had. Stop here...
					$this->setContinueEnumParameter( 'continue', $image . '|' . $dupName );
					break;
				}
				if ( $resultPageSet !== null ) {
					$titles[] = $dupFile->getTitle();
				} else {
					$r = [
						'name' => $dupName,
						'user' => $dupFile->getUser( 'text' ),
						'timestamp' => wfTimestamp( TS_ISO_8601, $dupFile->getTimestamp() ),
						'shared' => !$dupFile->isLocal(),
					];
					$fit = $this->addPageSubItem( $pageId, $r );
					if ( !$fit ) {
						// The item was not added; resume from it next time.
						$this->setContinueEnumParameter( 'continue', $image . '|' . $dupName );
						break;
					}
				}
			}
			if ( !$fit ) {
				break;
			}
		}
		if ( $resultPageSet !== null ) {
			$resultPageSet->populateFromTitles( $titles );
		}
	}

	/**
	 * @return array Parameter definitions: 'limit', 'continue', 'dir'
	 *  (ascending/descending) and the boolean 'localonly'
	 */
	public function getAllowedParams() {
		return [
			'limit' => [
				ApiBase::PARAM_DFLT => 10,
				ApiBase::PARAM_TYPE => 'limit',
				ApiBase::PARAM_MIN => 1,
				ApiBase::PARAM_MAX => ApiBase::LIMIT_BIG1,
				ApiBase::PARAM_MAX2 => ApiBase::LIMIT_BIG2
			],
			'continue' => [
				ApiBase::PARAM_HELP_MSG => 'api-help-param-continue',
			],
			'dir' => [
				ApiBase::PARAM_DFLT => 'ascending',
				ApiBase::PARAM_TYPE => [
					'ascending',
					'descending'
				]
			],
			'localonly' => false,
		];
	}

	/**
	 * @return array Example query string => help message key
	 */
	protected function getExamplesMessages() {
		return [
			'action=query&titles=File:Albert_Einstein_Head.jpg&prop=duplicatefiles'
				=> 'apihelp-query+duplicatefiles-example-simple',
			'action=query&generator=allimages&prop=duplicatefiles'
				=> 'apihelp-query+duplicatefiles-example-generated',
		];
	}

	/**
	 * @return string URL of the on-wiki documentation for this module
	 */
	public function getHelpUrls() {
		return 'https://www.mediawiki.org/wiki/Special:MyLanguage/API:Duplicatefiles';
	}
}