Merge "Special:Upload should not crash on failing previews"
[mediawiki.git] / thumb.php
blobc38b89c251a657607a21425dc73323de7aa03c87
1 <?php
2 /**
3 * PHP script to stream out an image thumbnail.
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
20 * @file
21 * @ingroup Media
24 use MediaWiki\Logger\LoggerFactory;
// Declared ahead of the WebStart.php include so the flag already exists during setup.
define( 'MW_NO_OUTPUT_COMPRESSION', 1 );
require __DIR__ . '/includes/WebStart.php';

// Only look at the file extension (jpg/gif/png); skip the fancy MIME detection.
$wgTrivialMimeDetection = true;

if ( !defined( 'THUMB_HANDLER' ) ) {
	// Direct invocation: the thumbnail parameters are the $_GET params.
	wfStreamThumb( $_GET );
} else {
	// Reached from thumb_handler.php via 404: the parameters come from the URI.
	wfThumbHandle404();
}

// The response has been produced; run the post-output shutdown in 'fast' mode.
$mediawiki = new MediaWiki();
$mediawiki->doPostOutputShutdown( 'fast' );
43 // --------------------------------------------------------------------------
/**
 * Handle a thumbnail request via thumbnail file URL
 *
 * Derives the thumbnail parameters from the request path and passes them to
 * wfStreamThumb(). A path that yields no title is answered with a 404, a
 * title that cannot be turned into parameters with a 400.
 *
 * @return void
 */
function wfThumbHandle404() {
	global $wgArticlePath;

	$thumbZoneUrl = RepoGroup::singleton()->getLocalRepo()->getZoneUrl( 'thumb' );

	# Point the article path at the thumb zone for the duration of the lookup so
	# that WebRequest::getPathInfo() recognizes the "X" as the 'title' in
	# ../thumb_handler.php/X urls, then put the configured value back.
	# Note: If Custom per-extension repo paths are set, this may break.
	$savedArticlePath = $wgArticlePath;
	$wgArticlePath = $thumbZoneUrl . '/$1';
	$pathInfo = WebRequest::getPathInfo();
	$wgArticlePath = $savedArticlePath;

	if ( !isset( $pathInfo['title'] ) ) {
		wfThumbError( 404, 'Could not determine the name of the requested thumbnail.' );
		return;
	}

	// Basic wiki URL param extracting; transform parameters are resolved later
	$params = wfExtractThumbRequestInfo( $pathInfo['title'] );
	if ( $params == null ) {
		wfThumbError( 400, 'The specified thumbnail parameters are not recognized.' );
	} else {
		wfStreamThumb( $params );
	}
}
/**
 * Stream a thumbnail specified by parameters
 *
 * Resolves the source file, checks read access and the request's
 * If-Modified-Since header, validates the requested thumbnail name, and then
 * either streams an already stored thumbnail or renders a new one through
 * wfGenerateThumbnail(). Failures are reported through wfThumbError() or
 * wfThumbErrorText().
 *
 * @param array $params List of thumbnailing parameters. In addition to parameters
 *  passed to the MediaHandler, this may also includes the keys:
 *  f (for filename), archived (if archived file), temp (if temp file),
 *  w (alias for width), p (alias for page), r (ignored; historical),
 *  rel404 (path for render on 404 to verify hash path correct),
 *  thumbName (thumbnail name to potentially extract more parameters from
 *  e.g. 'lossy-page1-120px-Foo.tiff' would add page, lossy and width
 *  to the parameters)
 * @return void
 */
function wfStreamThumb( array $params ) {
	global $wgVaryOnXFP;

	$headers = []; // HTTP headers to send

	$fileName = isset( $params['f'] ) ? $params['f'] : '';

	// Backwards compatibility parameters
	if ( isset( $params['w'] ) ) {
		$params['width'] = $params['w'];
		unset( $params['w'] );
	}
	if ( isset( $params['width'] ) && substr( $params['width'], -2 ) == 'px' ) {
		// strip the px (pixel) suffix, if found
		$params['width'] = substr( $params['width'], 0, -2 );
	}
	if ( isset( $params['p'] ) ) {
		$params['page'] = $params['p'];
	}

	// Is this a thumb of an archived file?
	$isOld = ( isset( $params['archived'] ) && $params['archived'] );
	unset( $params['archived'] ); // handlers don't care

	// Is this a thumb of a temp file?
	$isTemp = ( isset( $params['temp'] ) && $params['temp'] );
	unset( $params['temp'] ); // handlers don't care

	// Some basic input validation: no path separators in the file name
	$fileName = strtr( $fileName, '\\/', '__' );

	// Actually fetch the image. Method depends on whether it is archived or not.
	if ( $isTemp ) {
		$repo = RepoGroup::singleton()->getLocalRepo()->getTempRepo();
		$img = new UnregisteredLocalFile( null, $repo,
			# Temp files are hashed based on the name without the timestamp.
			# The thumbnails will be hashed based on the entire name however.
			# @todo fix this convention to actually be reasonable.
			$repo->getZonePath( 'public' ) . '/' . $repo->getTempHashPath( $fileName ) . $fileName
		);
	} elseif ( $isOld ) {
		// Format is <timestamp>!<name>
		$bits = explode( '!', $fileName, 2 );
		if ( count( $bits ) != 2 ) {
			wfThumbError( 404, wfMessage( 'badtitletext' )->parse() );
			return;
		}
		$title = Title::makeTitleSafe( NS_FILE, $bits[1] );
		if ( !$title ) {
			wfThumbError( 404, wfMessage( 'badtitletext' )->parse() );
			return;
		}
		$img = RepoGroup::singleton()->getLocalRepo()->newFromArchiveName( $title, $fileName );
	} else {
		$img = wfLocalFile( $fileName );
	}

	// Check the source file title
	if ( !$img ) {
		wfThumbError( 404, wfMessage( 'badtitletext' )->parse() );
		return;
	}

	// Check permissions if there are read restrictions
	$varyHeader = [];
	if ( !in_array( 'read', User::getGroupPermissions( [ '*' ] ), true ) ) {
		if ( !$img->getTitle() || !$img->getTitle()->userCan( 'read' ) ) {
			wfThumbError( 403, 'Access denied. You do not have permission to access ' .
				'the source file.' );
			return;
		}
		$headers[] = 'Cache-Control: private';
		$varyHeader[] = 'Cookie';
	}

	// Check if the file is hidden
	if ( $img->isDeleted( File::DELETED_FILE ) ) {
		wfThumbErrorText( 404, "The source file '$fileName' does not exist." );
		return;
	}

	// Do rendering parameters extraction from thumbnail name.
	if ( isset( $params['thumbName'] ) ) {
		$params = wfExtractThumbParams( $img, $params );
	}
	if ( $params == null ) {
		wfThumbError( 400, 'The specified thumbnail parameters are not recognized.' );
		return;
	}

	// Check the source file storage path
	if ( !$img->exists() ) {
		$redirectedLocation = false;
		if ( !$isTemp ) {
			// Check for file redirect
			// Since redirects are associated with pages, not versions of files,
			// we look for the most current version to see if its a redirect.
			$possRedirFile = RepoGroup::singleton()->getLocalRepo()->findFile( $img->getName() );
			if ( $possRedirFile && !is_null( $possRedirFile->getRedirected() ) ) {
				$redirTarget = $possRedirFile->getName();
				$targetFile = wfLocalFile( Title::makeTitleSafe( NS_FILE, $redirTarget ) );
				// Same guard as for $img above: do not dereference a missing file object
				if ( $targetFile && $targetFile->exists() ) {
					$newThumbName = $targetFile->thumbName( $params );
					if ( $isOld ) {
						/** @var array $bits */
						$newThumbUrl = $targetFile->getArchiveThumbUrl(
							$bits[0] . '!' . $targetFile->getName(), $newThumbName );
					} else {
						$newThumbUrl = $targetFile->getThumbUrl( $newThumbName );
					}
					$redirectedLocation = wfExpandUrl( $newThumbUrl, PROTO_CURRENT );
				}
			}
		}

		if ( $redirectedLocation ) {
			// File has been moved. Give redirect.
			$response = RequestContext::getMain()->getRequest()->response();
			$response->statusHeader( 302 );
			$response->header( 'Location: ' . $redirectedLocation );
			$response->header( 'Expires: ' .
				gmdate( 'D, d M Y H:i:s', time() + 12 * 3600 ) . ' GMT' );
			if ( $wgVaryOnXFP ) {
				$varyHeader[] = 'X-Forwarded-Proto';
			}
			if ( count( $varyHeader ) ) {
				$response->header( 'Vary: ' . implode( ', ', $varyHeader ) );
			}
			$response->header( 'Content-Length: 0' );
			return;
		}

		// If its not a redirect that has a target as a local file, give 404.
		wfThumbErrorText( 404, "The source file '$fileName' does not exist." );
		return;
	} elseif ( $img->getPath() === false ) {
		wfThumbErrorText( 400, "The source file '$fileName' is not locally accessible." );
		return;
	}

	// Check IMS against the source file
	// This means that clients can keep a cached copy even after it has been deleted on the server
	if ( !empty( $_SERVER['HTTP_IF_MODIFIED_SINCE'] ) ) {
		// Fix IE brokenness: drop everything from the first ';' onwards
		$imsString = preg_replace( '/;.*$/', '', $_SERVER["HTTP_IF_MODIFIED_SINCE"] );
		// Calculate time
		MediaWiki\suppressWarnings();
		$imsUnix = strtotime( $imsString );
		MediaWiki\restoreWarnings();
		if ( wfTimestamp( TS_UNIX, $img->getTimestamp() ) <= $imsUnix ) {
			HttpStatus::header( 304 );
			return;
		}
	}

	$rel404 = isset( $params['rel404'] ) ? $params['rel404'] : null;
	unset( $params['r'] ); // ignore 'r' because we unconditionally pass File::RENDER
	unset( $params['f'] ); // We're done with 'f' parameter.
	unset( $params['rel404'] ); // moved to $rel404

	// Get the normalized thumbnail name from the parameters...
	try {
		$thumbName = $img->thumbName( $params );
		if ( !strlen( $thumbName ) ) { // invalid params?
			throw new MediaTransformInvalidParametersException(
				'Empty return from File::thumbName'
			);
		}
		$thumbName2 = $img->thumbName( $params, File::THUMB_FULL_NAME ); // b/c; "long" style
	} catch ( MediaTransformInvalidParametersException $e ) {
		wfThumbError(
			400,
			'The specified thumbnail parameters are not valid: ' . $e->getMessage()
		);
		return;
	} catch ( MWException $e ) {
		wfThumbError( 500, $e->getHTML(), 'Exception caught while extracting thumb name',
			[ 'exception' => $e ] );
		return;
	}

	// For 404 handled thumbnails, we only use the base name of the URI
	// for the thumb params and the parent directory for the source file name.
	// Check that the zone relative path matches up so squid caches won't pick
	// up thumbs that would not be purged on source file deletion (bug 34231).
	if ( $rel404 !== null ) { // thumbnail was handled via 404
		if ( rawurldecode( $rel404 ) === $img->getThumbRel( $thumbName ) ) {
			// Request for the canonical thumbnail name
		} elseif ( rawurldecode( $rel404 ) === $img->getThumbRel( $thumbName2 ) ) {
			// Request for the "long" thumbnail name; redirect to canonical name
			$response = RequestContext::getMain()->getRequest()->response();
			$response->statusHeader( 301 );
			$response->header( 'Location: ' .
				wfExpandUrl( $img->getThumbUrl( $thumbName ), PROTO_CURRENT ) );
			$response->header( 'Expires: ' .
				gmdate( 'D, d M Y H:i:s', time() + 7 * 86400 ) . ' GMT' );
			if ( $wgVaryOnXFP ) {
				$varyHeader[] = 'X-Forwarded-Proto';
			}
			if ( count( $varyHeader ) ) {
				$response->header( 'Vary: ' . implode( ', ', $varyHeader ) );
			}
			return;
		} else {
			// Built by concatenation so no source line break or indentation
			// ends up inside the message text.
			wfThumbErrorText( 404, "The given path of the specified thumbnail is incorrect; " .
				"expected '" . $img->getThumbRel( $thumbName ) . "' but got '" .
				rawurldecode( $rel404 ) . "'." );
			return;
		}
	}

	$dispositionType = isset( $params['download'] ) ? 'attachment' : 'inline';

	// Suggest a good name for users downloading this thumbnail
	$headers[] =
		"Content-Disposition: {$img->getThumbDisposition( $thumbName, $dispositionType )}";

	if ( count( $varyHeader ) ) {
		$headers[] = 'Vary: ' . implode( ', ', $varyHeader );
	}

	// Stream the file if it exists already...
	$thumbPath = $img->getThumbPath( $thumbName );
	if ( $img->getRepo()->fileExists( $thumbPath ) ) {
		$starttime = microtime( true );
		$status = $img->getRepo()->streamFileWithStatus( $thumbPath, $headers );
		$streamtime = microtime( true ) - $starttime;

		if ( $status->isOK() ) {
			RequestContext::getMain()->getStats()->timing( 'media.thumbnail.stream', $streamtime );
		} else {
			wfThumbError( 500, 'Could not stream the file', null, [ 'file' => $thumbName,
				'path' => $thumbPath, 'error' => $status->getWikiText( false, false, 'en' ) ] );
		}
		return;
	}

	// Rendering is needed: apply the rate limits before doing the work
	$user = RequestContext::getMain()->getUser();
	if ( !wfThumbIsStandard( $img, $params ) && $user->pingLimiter( 'renderfile-nonstandard' ) ) {
		wfThumbError( 429, wfMessage( 'actionthrottledtext' )->parse() );
		return;
	} elseif ( $user->pingLimiter( 'renderfile' ) ) {
		wfThumbError( 429, wfMessage( 'actionthrottledtext' )->parse() );
		return;
	}

	list( $thumb, $errorMsg ) = wfGenerateThumbnail( $img, $params, $thumbName, $thumbPath );

	/** @var MediaTransformOutput|MediaTransformError|bool $thumb */

	// Check for thumbnail generation errors...
	$msg = wfMessage( 'thumbnail_error' );
	$errorCode = 500;

	if ( !$thumb ) {
		$errorMsg = $errorMsg ?: $msg->rawParams( 'File::transform() returned false' )->escaped();
		if ( $errorMsg instanceof MessageSpecifier &&
			$errorMsg->getKey() === 'thumbnail_image-failure-limit'
		) {
			$errorCode = 429;
		}
	} elseif ( $thumb->isError() ) {
		$errorMsg = $thumb->getHtmlMsg();
		$errorCode = $thumb->getHttpStatusCode();
	} elseif ( !$thumb->hasFile() ) {
		$errorMsg = $msg->rawParams( 'No path supplied in thumbnail object' )->escaped();
	} elseif ( $thumb->fileIsSource() ) {
		$errorMsg = $msg
			->rawParams( 'Image was not scaled, is the requested width bigger than the source?' )
			->escaped();
		$errorCode = 400;
	}

	if ( $errorMsg !== false ) {
		wfThumbError( $errorCode, $errorMsg, null, [ 'file' => $thumbName, 'path' => $thumbPath ] );
	} else {
		// Stream the file if there were no errors
		$status = $thumb->streamFileWithStatus( $headers );
		if ( !$status->isOK() ) {
			wfThumbError( 500, 'Could not stream the file', null, [
				'file' => $thumbName, 'path' => $thumbPath,
				'error' => $status->getWikiText( false, false, 'en' ) ] );
		}
	}
}
/**
 * Actually try to generate a new thumbnail
 *
 * The transform runs inside a PoolCounter job. Failed attempts are counted in
 * the local cluster cache under a key built from the repo name, the file's
 * SHA-1 and the thumbnail name; once that counter has reached 4, rendering is
 * not attempted any more.
 *
 * @param File $file
 * @param array $params
 * @param string $thumbName
 * @param string $thumbPath
 * @return array Two elements: the MediaTransformOutput (false if none was produced),
 *  then the error (HTML string from the pool error callback, the
 *  'thumbnail_image-failure-limit' message object, or false)
 */
function wfGenerateThumbnail( File $file, array $params, $thumbName, $thumbPath ) {
	global $wgAttemptFailureEpoch;

	$cache = ObjectCache::getLocalClusterInstance();
	$failureKey = $cache->makeKey(
		'attempt-failures',
		$wgAttemptFailureEpoch,
		$file->getRepo()->getName(),
		$file->getSha1(),
		md5( $thumbName )
	);

	// Check if this file keeps failing to render
	if ( $cache->get( $failureKey ) >= 4 ) {
		return [ false, wfMessage( 'thumbnail_image-failure-limit', 4 ) ];
	}

	// Bumps the failure counter; the TTL is randomized to reduce stampedes
	$recordFailure = function () use ( $cache, $failureKey ) {
		$cache->incrWithInit( $failureKey, $cache::TTL_HOUR + mt_rand( 0, 300 ) );
	};

	// Record failures on PHP fatals in addition to caching exceptions:
	// if the flag is still unset at shutdown, transform() gave a fatal.
	$finished = false;
	register_shutdown_function( function () use ( &$finished, $recordFailure ) {
		if ( !$finished ) {
			$recordFailure();
		}
	} );

	// guard thumbnail rendering with PoolCounter to avoid stampedes
	// expensive files use a separate PoolCounter config so it is possible
	// to set up a global limit on them
	$poolCounterType = $file->isExpensiveToThumbnail() ? 'FileRenderExpensive' : 'FileRender';

	$callbacks = [
		'doWork' => function () use ( $file, $params ) {
			return $file->transform( $params, File::RENDER_NOW );
		},
		'doCachedWork' => function () use ( $file, $params, $thumbPath ) {
			// If the worker that finished made this thumbnail then use it.
			// Otherwise, it probably made a different thumbnail for this file.
			if ( $file->getRepo()->fileExists( $thumbPath ) ) {
				return $file->transform( $params, File::RENDER_NOW );
			}
			return false; // retry once more in exclusive mode
		},
		'error' => function ( Status $status ) {
			return wfMessage( 'generic-pool-error' )->parse() . '<hr>' . $status->getHTML();
		}
	];

	$thumb = false;
	$errorHtml = false;

	// Thumbnail isn't already there, so create the new thumbnail...
	try {
		$work = new PoolCounterWorkViaCallback(
			$poolCounterType,
			sha1( $file->getName() ),
			$callbacks
		);
		$outcome = $work->execute();
		if ( $outcome instanceof MediaTransformOutput ) {
			$thumb = $outcome;
		} elseif ( is_string( $outcome ) ) {
			// A string result is the HTML produced by the 'error' callback
			$errorHtml = $outcome;
		}
	} catch ( Exception $e ) {
		// Tried to select a page on a non-paged file?
	}

	/** @noinspection PhpUnusedLocalVariableInspection */
	$finished = true; // no PHP fatal occurred

	if ( !$thumb || $thumb->isError() ) {
		$recordFailure();
	}

	return [ $thumb, $errorHtml ];
}
/**
 * Convert pathinfo type parameter, into normal request parameters
 *
 * So for example, if the request was redirected from
 * /w/images/thumb/a/ab/Foo.png/120px-Foo.png. The $thumbRel parameter
 * of this function would be set to "a/ab/Foo.png/120px-Foo.png".
 * This method is responsible for turning that into an array
 * with the following keys:
 *  * f => the filename (Foo.png)
 *  * rel404 => the whole thing (a/ab/Foo.png/120px-Foo.png)
 *  * archived => 1 (If the request is for an archived thumb)
 *  * temp => 1 (If the file is in the "temporary" zone)
 *  * thumbName => the thumbnail name, including parameters (120px-Foo.png)
 *
 * Transform specific parameters are set later via wfExtractThumbParams().
 *
 * @param string $thumbRel Thumbnail path relative to the thumb zone
 * @return array|null Associative params array or null
 */
function wfExtractThumbRequestInfo( $thumbRel ) {
	$hashLevels = RepoGroup::singleton()->getLocalRepo()->getHashLevels();

	// One directory per hash level, each one hex digit longer than the previous:
	// "[0-9a-f]/", then "[0-9a-f][0-9a-f]/", and so on.
	$hashDirReg = '';
	for ( $level = 0; $level < $hashLevels; $level++ ) {
		$hashDirReg .= str_repeat( '[0-9a-f]', $level + 1 ) . '/';
	}

	$localPattern = "!^((archive/)?$hashDirReg([^/]*)/([^/]*))$!";
	$tempPattern = "!^(temp/)($hashDirReg([^/]*)/([^/]*))$!";

	if ( preg_match( $localPattern, $thumbRel, $m ) ) {
		// Thumbnail of an original in the local file repo; the optional
		// "archive/" prefix is part of the relative path here
		$rel = $m[1];
		$archOrTemp = $m[2];
	} elseif ( preg_match( $tempPattern, $thumbRel, $m ) ) {
		// Thumbnail of a temp file in the local file repo; the "temp/"
		// prefix is not part of the relative path
		$archOrTemp = $m[1];
		$rel = $m[2];
	} else {
		return null; // not a valid looking thumbnail request
	}

	// Groups 3 and 4 are the file name and the thumbnail name in both patterns
	$params = [ 'f' => $m[3], 'rel404' => $rel ];
	if ( $archOrTemp === 'archive/' ) {
		$params['archived'] = 1;
	} elseif ( $archOrTemp === 'temp/' ) {
		$params['temp'] = 1;
	}
	$params['thumbName'] = $m[4];

	return $params;
}
/**
 * Convert a thumbnail name (122px-foo.png) to parameters, using
 * file handler.
 *
 * Three sources are tried in order: the deprecated 'ExtractThumbParameters'
 * hook, the file handler's parseParamString() on the part of the thumbnail
 * name in front of the file name, and finally the traditional
 * "page<N>-<width>px-" pattern.
 *
 * @param File $file File object for file in question
 * @param array $params Array of parameters so far
 * @return array|null Parameters array with more parameters, or null if the
 *  thumbnail name could not be interpreted
 * @throws InvalidArgumentException If $params has no 'thumbName' entry
 */
function wfExtractThumbParams( $file, $params ) {
	if ( !isset( $params['thumbName'] ) ) {
		throw new InvalidArgumentException( "No thumbnail name passed to wfExtractThumbParams" );
	}

	$thumbname = $params['thumbName'];
	unset( $params['thumbName'] );

	// Do the hook first for older extensions that rely on it.
	if ( !Hooks::run( 'ExtractThumbParameters', [ $thumbname, &$params ] ) ) {
		// Check hooks if parameters can be extracted
		// Hooks return false if they manage to *resolve* the parameters
		// This hook should be considered deprecated
		wfDeprecated( 'ExtractThumbParameters', '1.22' );
		return $params; // valid thumbnail URL (via extension or config)
	}

	// FIXME: Files in the temp zone don't set a MIME type, which means
	// they don't have a handler. Which means we can't parse the param
	// string. However, not a big issue as what good is a param string
	// if you have no handler to make use of the param string and
	// actually generate the thumbnail.
	$handler = $file->getHandler();

	// Based on UploadStash::parseKey
	$fileNamePos = strrpos( $thumbname, $params['f'] );
	if ( $fileNamePos === false ) {
		// Maybe using a short filename? (see FileRepo::nameForThumb)
		$fileNamePos = strrpos( $thumbname, 'thumbnail' );
	}

	// The parameter string is everything before the separator that precedes
	// the file name. At offset 0 there is nothing in front of the name, and
	// a length of $fileNamePos - 1 = -1 would make substr() return the thumb
	// name minus its last character, so skip the handler in that case.
	if ( $handler && $fileNamePos !== false && $fileNamePos > 0 ) {
		$paramString = substr( $thumbname, 0, $fileNamePos - 1 );
		$extraParams = $handler->parseParamString( $paramString );
		if ( $extraParams !== false ) {
			// Array union: parameters already present in $params win
			return $params + $extraParams;
		}
	}

	// As a last ditch fallback, use the traditional common parameters
	if ( preg_match( '!^(page(\d*)-)*(\d*)px-[^/]*$!', $thumbname, $matches ) ) {
		list( /* all */, /* pagefull */, $pagenum, $size ) = $matches;
		$params['width'] = $size;
		if ( $pagenum ) {
			$params['page'] = $pagenum;
		}
		return $params; // valid thumbnail URL
	}
	return null;
}
/**
 * Output a thumbnail generation error message
 *
 * Plain-text front end for wfThumbError(): the text is HTML-escaped and then
 * reported with the given status.
 *
 * @param int $status
 * @param string $msgText Plain text (will be html escaped)
 * @return void
 */
function wfThumbErrorText( $status, $msgText ) {
	$msgHtml = htmlspecialchars( $msgText );
	wfThumbError( $status, $msgHtml );
}
/**
 * Output a thumbnail generation error message
 *
 * Sends the status line and headers, logs the error to the 'thumb' channel
 * when it is reported as a 500, and prints a minimal HTML error page.
 *
 * @param int $status HTTP status. 400, 403, 404 and 429 are sent as given
 *  (403 additionally varies on Cookie); any other value is logged and sent as 500.
 * @param string $msgHtml HTML
 * @param string $msgText Short error description, for internal logging. Defaults to $msgHtml.
 *   Only used for HTTP 500 errors.
 * @param array $context Error context, for internal logging. Only used for HTTP 500 errors.
 * @return void
 */
function wfThumbError( $status, $msgHtml, $msgText = null, $context = [] ) {
	global $wgShowHostnames;

	header( 'Cache-Control: no-cache' );
	header( 'Content-Type: text/html; charset=utf-8' );
	if ( $status == 400 || $status == 404 || $status == 429 ) {
		HttpStatus::header( $status );
	} elseif ( $status == 403 ) {
		HttpStatus::header( 403 );
		header( 'Vary: Cookie' );
	} else {
		LoggerFactory::getInstance( 'thumb' )->error( $msgText ?: $msgHtml, $context );
		HttpStatus::header( 500 );
	}
	if ( $wgShowHostnames ) {
		// Expose the rendering host in a header and, escaped, in HTML comments
		header( 'X-MW-Thumbnail-Renderer: ' . wfHostname() );
		$url = htmlspecialchars(
			isset( $_SERVER['REQUEST_URI'] ) ? $_SERVER['REQUEST_URI'] : ''
		);
		$hostname = htmlspecialchars( wfHostname() );
		$debug = "<!-- $url -->\n<!-- $hostname -->\n";
	} else {
		$debug = '';
	}
	// The message paragraph needs its opening <p> to match the closing tag.
	$content = <<<EOT
<!DOCTYPE html>
<html><head>
<meta charset="UTF-8" />
<title>Error generating thumbnail</title>
</head>
<body>
<h1>Error generating thumbnail</h1>
<p>
$msgHtml
</p>
$debug
</body>
</html>

EOT;
	// strlen() counts bytes, which is what Content-Length expects
	header( 'Content-Length: ' . strlen( $content ) );
	echo $content;
}