]> scripts.mit.edu Git - autoinstalls/mediawiki.git/blob - includes/api/ApiOpenSearch.php
MediaWiki 1.30.2-scripts2
[autoinstalls/mediawiki.git] / includes / api / ApiOpenSearch.php
1 <?php
2 /**
3  * Created on Oct 13, 2006
4  *
5  * Copyright © 2006 Yuri Astrakhan "<Firstname><Lastname>@gmail.com"
6  * Copyright © 2008 Brion Vibber <brion@wikimedia.org>
7  * Copyright © 2014 Wikimedia Foundation and contributors
8  *
9  * This program is free software; you can redistribute it and/or modify
10  * it under the terms of the GNU General Public License as published by
11  * the Free Software Foundation; either version 2 of the License, or
12  * (at your option) any later version.
13  *
14  * This program is distributed in the hope that it will be useful,
15  * but WITHOUT ANY WARRANTY; without even the implied warranty of
16  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17  * GNU General Public License for more details.
18  *
19  * You should have received a copy of the GNU General Public License along
20  * with this program; if not, write to the Free Software Foundation, Inc.,
21  * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
22  * http://www.gnu.org/copyleft/gpl.html
23  *
24  * @file
25  */
26
27 use MediaWiki\MediaWikiServices;
28
29 /**
30  * @ingroup API
31  */
32 class ApiOpenSearch extends ApiBase {
33         use SearchApi;
34
35         private $format = null;
36         private $fm = null;
37
38         /** @var array list of api allowed params */
39         private $allowedParams = null;
40
41         /**
42          * Get the output format
43          *
44          * @return string
45          */
46         protected function getFormat() {
47                 if ( $this->format === null ) {
48                         $params = $this->extractRequestParams();
49                         $format = $params['format'];
50
51                         $allowedParams = $this->getAllowedParams();
52                         if ( !in_array( $format, $allowedParams['format'][ApiBase::PARAM_TYPE] ) ) {
53                                 $format = $allowedParams['format'][ApiBase::PARAM_DFLT];
54                         }
55
56                         if ( substr( $format, -2 ) === 'fm' ) {
57                                 $this->format = substr( $format, 0, -2 );
58                                 $this->fm = 'fm';
59                         } else {
60                                 $this->format = $format;
61                                 $this->fm = '';
62                         }
63                 }
64                 return $this->format;
65         }
66
67         public function getCustomPrinter() {
68                 switch ( $this->getFormat() ) {
69                         case 'json':
70                                 return new ApiOpenSearchFormatJson(
71                                         $this->getMain(), $this->fm, $this->getParameter( 'warningsaserror' )
72                                 );
73
74                         case 'xml':
75                                 $printer = $this->getMain()->createPrinterByName( 'xml' . $this->fm );
76                                 $printer->setRootElement( 'SearchSuggestion' );
77                                 return $printer;
78
79                         default:
80                                 ApiBase::dieDebug( __METHOD__, "Unsupported format '{$this->getFormat()}'" );
81                 }
82         }
83
84         public function execute() {
85                 $params = $this->extractRequestParams();
86                 $search = $params['search'];
87                 $suggest = $params['suggest'];
88                 $results = [];
89                 if ( !$suggest || $this->getConfig()->get( 'EnableOpenSearchSuggest' ) ) {
90                         // Open search results may be stored for a very long time
91                         $this->getMain()->setCacheMaxAge( $this->getConfig()->get( 'SearchSuggestCacheExpiry' ) );
92                         $this->getMain()->setCacheMode( 'public' );
93                         $results = $this->search( $search, $params );
94
95                         // Allow hooks to populate extracts and images
96                         Hooks::run( 'ApiOpenSearchSuggest', [ &$results ] );
97
98                         // Trim extracts, if necessary
99                         $length = $this->getConfig()->get( 'OpenSearchDescriptionLength' );
100                         foreach ( $results as &$r ) {
101                                 if ( is_string( $r['extract'] ) && !$r['extract trimmed'] ) {
102                                         $r['extract'] = self::trimExtract( $r['extract'], $length );
103                                 }
104                         }
105                 }
106
107                 // Populate result object
108                 $this->populateResult( $search, $results );
109         }
110
111         /**
112          * Perform the search
113          * @param string $search the search query
114          * @param array $params api request params
115          * @return array search results. Keys are integers.
116          */
117         private function search( $search, array $params ) {
118                 $searchEngine = $this->buildSearchEngine( $params );
119                 $titles = $searchEngine->extractTitles( $searchEngine->completionSearchWithVariants( $search ) );
120                 $results = [];
121
122                 if ( !$titles ) {
123                         return $results;
124                 }
125
126                 // Special pages need unique integer ids in the return list, so we just
127                 // assign them negative numbers because those won't clash with the
128                 // always positive articleIds that non-special pages get.
129                 $nextSpecialPageId = -1;
130
131                 if ( $params['redirects'] === null ) {
132                         // Backwards compatibility, don't resolve for JSON.
133                         $resolveRedir = $this->getFormat() !== 'json';
134                 } else {
135                         $resolveRedir = $params['redirects'] === 'resolve';
136                 }
137
138                 if ( $resolveRedir ) {
139                         // Query for redirects
140                         $redirects = [];
141                         $lb = new LinkBatch( $titles );
142                         if ( !$lb->isEmpty() ) {
143                                 $db = $this->getDB();
144                                 $res = $db->select(
145                                         [ 'page', 'redirect' ],
146                                         [ 'page_namespace', 'page_title', 'rd_namespace', 'rd_title' ],
147                                         [
148                                                 'rd_from = page_id',
149                                                 'rd_interwiki IS NULL OR rd_interwiki = ' . $db->addQuotes( '' ),
150                                                 $lb->constructSet( 'page', $db ),
151                                         ],
152                                         __METHOD__
153                                 );
154                                 foreach ( $res as $row ) {
155                                         $redirects[$row->page_namespace][$row->page_title] =
156                                                 [ $row->rd_namespace, $row->rd_title ];
157                                 }
158                         }
159
160                         // Bypass any redirects
161                         $seen = [];
162                         foreach ( $titles as $title ) {
163                                 $ns = $title->getNamespace();
164                                 $dbkey = $title->getDBkey();
165                                 $from = null;
166                                 if ( isset( $redirects[$ns][$dbkey] ) ) {
167                                         list( $ns, $dbkey ) = $redirects[$ns][$dbkey];
168                                         $from = $title;
169                                         $title = Title::makeTitle( $ns, $dbkey );
170                                 }
171                                 if ( !isset( $seen[$ns][$dbkey] ) ) {
172                                         $seen[$ns][$dbkey] = true;
173                                         $resultId = $title->getArticleID();
174                                         if ( $resultId === 0 ) {
175                                                 $resultId = $nextSpecialPageId;
176                                                 $nextSpecialPageId -= 1;
177                                         }
178                                         $results[$resultId] = [
179                                                 'title' => $title,
180                                                 'redirect from' => $from,
181                                                 'extract' => false,
182                                                 'extract trimmed' => false,
183                                                 'image' => false,
184                                                 'url' => wfExpandUrl( $title->getFullURL(), PROTO_CURRENT ),
185                                         ];
186                                 }
187                         }
188                 } else {
189                         foreach ( $titles as $title ) {
190                                 $resultId = $title->getArticleID();
191                                 if ( $resultId === 0 ) {
192                                         $resultId = $nextSpecialPageId;
193                                         $nextSpecialPageId -= 1;
194                                 }
195                                 $results[$resultId] = [
196                                         'title' => $title,
197                                         'redirect from' => null,
198                                         'extract' => false,
199                                         'extract trimmed' => false,
200                                         'image' => false,
201                                         'url' => wfExpandUrl( $title->getFullURL(), PROTO_CURRENT ),
202                                 ];
203                         }
204                 }
205
206                 return $results;
207         }
208
209         /**
210          * @param string $search
211          * @param array &$results
212          */
213         protected function populateResult( $search, &$results ) {
214                 $result = $this->getResult();
215
216                 switch ( $this->getFormat() ) {
217                         case 'json':
218                                 // http://www.opensearch.org/Specifications/OpenSearch/Extensions/Suggestions/1.1
219                                 $result->addArrayType( null, 'array' );
220                                 $result->addValue( null, 0, strval( $search ) );
221                                 $terms = [];
222                                 $descriptions = [];
223                                 $urls = [];
224                                 foreach ( $results as $r ) {
225                                         $terms[] = $r['title']->getPrefixedText();
226                                         $descriptions[] = strval( $r['extract'] );
227                                         $urls[] = $r['url'];
228                                 }
229                                 $result->addValue( null, 1, $terms );
230                                 $result->addValue( null, 2, $descriptions );
231                                 $result->addValue( null, 3, $urls );
232                                 break;
233
234                         case 'xml':
235                                 // https://msdn.microsoft.com/en-us/library/cc891508(v=vs.85).aspx
236                                 $imageKeys = [
237                                         'source' => true,
238                                         'alt' => true,
239                                         'width' => true,
240                                         'height' => true,
241                                         'align' => true,
242                                 ];
243                                 $items = [];
244                                 foreach ( $results as $r ) {
245                                         $item = [
246                                                 'Text' => $r['title']->getPrefixedText(),
247                                                 'Url' => $r['url'],
248                                         ];
249                                         if ( is_string( $r['extract'] ) && $r['extract'] !== '' ) {
250                                                 $item['Description'] = $r['extract'];
251                                         }
252                                         if ( is_array( $r['image'] ) && isset( $r['image']['source'] ) ) {
253                                                 $item['Image'] = array_intersect_key( $r['image'], $imageKeys );
254                                         }
255                                         ApiResult::setSubelementsList( $item, array_keys( $item ) );
256                                         $items[] = $item;
257                                 }
258                                 ApiResult::setIndexedTagName( $items, 'Item' );
259                                 $result->addValue( null, 'version', '2.0' );
260                                 $result->addValue( null, 'xmlns', 'http://opensearch.org/searchsuggest2' );
261                                 $result->addValue( null, 'Query', strval( $search ) );
262                                 $result->addSubelementsList( null, 'Query' );
263                                 $result->addValue( null, 'Section', $items );
264                                 break;
265
266                         default:
267                                 ApiBase::dieDebug( __METHOD__, "Unsupported format '{$this->getFormat()}'" );
268                 }
269         }
270
271         public function getAllowedParams() {
272                 if ( $this->allowedParams !== null ) {
273                         return $this->allowedParams;
274                 }
275                 $this->allowedParams = $this->buildCommonApiParams( false ) + [
276                         'suggest' => false,
277                         'redirects' => [
278                                 ApiBase::PARAM_TYPE => [ 'return', 'resolve' ],
279                         ],
280                         'format' => [
281                                 ApiBase::PARAM_DFLT => 'json',
282                                 ApiBase::PARAM_TYPE => [ 'json', 'jsonfm', 'xml', 'xmlfm' ],
283                         ],
284                         'warningsaserror' => false,
285                 ];
286
287                 // Use open search specific default limit
288                 $this->allowedParams['limit'][ApiBase::PARAM_DFLT] = $this->getConfig()->get(
289                         'OpenSearchDefaultLimit'
290                 );
291
292                 return $this->allowedParams;
293         }
294
295         public function getSearchProfileParams() {
296                 return [
297                         'profile' => [
298                                 'profile-type' => SearchEngine::COMPLETION_PROFILE_TYPE,
299                                 'help-message' => 'apihelp-query+prefixsearch-param-profile'
300                         ],
301                 ];
302         }
303
304         protected function getExamplesMessages() {
305                 return [
306                         'action=opensearch&search=Te'
307                                 => 'apihelp-opensearch-example-te',
308                 ];
309         }
310
311         public function getHelpUrls() {
312                 return 'https://www.mediawiki.org/wiki/Special:MyLanguage/API:Opensearch';
313         }
314
315         /**
316          * Trim an extract to a sensible length.
317          *
318          * Adapted from Extension:OpenSearchXml, which adapted it from
319          * Extension:ActiveAbstract.
320          *
321          * @param string $text
322          * @param int $length Target length; actual result will continue to the end of a sentence.
323          * @return string
324          */
325         public static function trimExtract( $text, $length ) {
326                 static $regex = null;
327
328                 if ( $regex === null ) {
329                         $endchars = [
330                                 '([^\d])\.\s', '\!\s', '\?\s', // regular ASCII
331                                 '。', // full-width ideographic full-stop
332                                 '.', '!', '?', // double-width roman forms
333                                 '。', // half-width ideographic full stop
334                         ];
335                         $endgroup = implode( '|', $endchars );
336                         $end = "(?:$endgroup)";
337                         $sentence = ".{{$length},}?$end+";
338                         $regex = "/^($sentence)/u";
339                 }
340
341                 $matches = [];
342                 if ( preg_match( $regex, $text, $matches ) ) {
343                         return trim( $matches[1] );
344                 } else {
345                         // Just return the first line
346                         return trim( explode( "\n", $text )[0] );
347                 }
348         }
349
350         /**
351          * Fetch the template for a type.
352          *
353          * @param string $type MIME type
354          * @return string
355          * @throws MWException
356          */
357         public static function getOpenSearchTemplate( $type ) {
358                 $config = MediaWikiServices::getInstance()->getSearchEngineConfig();
359                 $template = $config->getConfig()->get( 'OpenSearchTemplate' );
360
361                 if ( $template && $type === 'application/x-suggestions+json' ) {
362                         return $template;
363                 }
364
365                 $ns = implode( '|', $config->defaultNamespaces() );
366                 if ( !$ns ) {
367                         $ns = '0';
368                 }
369
370                 switch ( $type ) {
371                         case 'application/x-suggestions+json':
372                                 return $config->getConfig()->get( 'CanonicalServer' ) . wfScript( 'api' )
373                                         . '?action=opensearch&search={searchTerms}&namespace=' . $ns;
374
375                         case 'application/x-suggestions+xml':
376                                 return $config->getConfig()->get( 'CanonicalServer' ) . wfScript( 'api' )
377                                         . '?action=opensearch&format=xml&search={searchTerms}&namespace=' . $ns;
378
379                         default:
380                                 throw new MWException( __METHOD__ . ": Unknown type '$type'" );
381                 }
382         }
383 }
384
385 class ApiOpenSearchFormatJson extends ApiFormatJson {
386         private $warningsAsError = false;
387
388         public function __construct( ApiMain $main, $fm, $warningsAsError ) {
389                 parent::__construct( $main, "json$fm" );
390                 $this->warningsAsError = $warningsAsError;
391         }
392
393         public function execute() {
394                 $result = $this->getResult();
395                 if ( !$result->getResultData( 'error' ) && !$result->getResultData( 'errors' ) ) {
396                         // Ignore warnings or treat as errors, as requested
397                         $warnings = $result->removeValue( 'warnings', null );
398                         if ( $this->warningsAsError && $warnings ) {
399                                 $this->dieWithError(
400                                         'apierror-opensearch-json-warnings',
401                                         'warnings',
402                                         [ 'warnings' => $warnings ]
403                                 );
404                         }
405
406                         // Ignore any other unexpected keys (e.g. from $wgDebugToolbar)
407                         $remove = array_keys( array_diff_key(
408                                 $result->getResultData(),
409                                 [ 0 => 'search', 1 => 'terms', 2 => 'descriptions', 3 => 'urls' ]
410                         ) );
411                         foreach ( $remove as $key ) {
412                                 $result->removeValue( $key, null );
413                         }
414                 }
415
416                 parent::execute();
417         }
418 }