TextContent: Normalize newlines in preSaveTransform()
[mediawiki.git] / includes / StreamFile.php
blob0fc79802f3de82d4ec49ffcda0f4df252627f950
<?php
/**
 * Functions related to the output of file content.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 */

/**
 * Functions related to the output of file content
 */
class StreamFile {
	// Do not send any HTTP headers unless requested by caller (e.g. body only)
	const STREAM_HEADLESS = 1;
	// Do not try to tear down any PHP output buffers
	const STREAM_ALLOW_OB = 2;

	/**
	 * Stream a local file to the client.
	 *
	 * Unless STREAM_HEADLESS is set, this emits Last-Modified, Content-type and
	 * Content-Length (plus a 206 status and Content-Range for a satisfiable
	 * single-range request). Any entries in $headers are always emitted via
	 * header(), even in headless mode; headers such as Content-Disposition are
	 * only sent if the caller supplies them there.
	 *
	 * @param string $fname Full name and path of the file to stream
	 * @param array $headers Any additional headers to send if the file exists
	 * @param bool $sendErrors Send error messages if errors occur (like 404)
	 * @param array $optHeaders HTTP request header map (e.g. "range") (use lowercase keys)
	 * @param int $flags Bitfield of STREAM_* constants
	 * @throws MWException If $fname is a storage path rather than a file system path
	 * @return bool True if the file was sent (or a 304 was issued); false if headers
	 *  were already sent, the file could not be stat'ed/opened/read, or the
	 *  requested range was unsatisfiable
	 */
	public static function stream(
		$fname, $headers = [], $sendErrors = true, $optHeaders = [], $flags = 0
	) {
		// Not read again below; kept alive for the duration of the call
		// (presumably profiles this method until it goes out of scope).
		$section = new ProfileSection( __METHOD__ );

		if ( FileBackend::isStoragePath( $fname ) ) { // sanity
			throw new MWException( __FUNCTION__ . " given storage path '$fname'." );
		}

		// Don't stream it out as text/html if there was a PHP error
		if ( ( ( $flags & self::STREAM_HEADLESS ) == 0 || $headers ) && headers_sent() ) {
			echo "Headers already sent, terminating.\n";
			return false;
		}

		// In headless mode, header emission becomes a no-op; otherwise integers
		// are treated as HTTP status codes and strings as raw header lines.
		$headerFunc = ( $flags & self::STREAM_HEADLESS )
			? function ( $header ) {
				// no-op
			}
			: function ( $header ) {
				is_int( $header ) ? HttpStatus::header( $header ) : header( $header );
			};

		MediaWiki\suppressWarnings();
		$info = stat( $fname );
		MediaWiki\restoreWarnings();

		if ( !is_array( $info ) ) {
			if ( $sendErrors ) {
				self::send404Message( $fname, $flags );
			}
			return false;
		}

		// Send Last-Modified HTTP header for client-side caching
		$headerFunc( 'Last-Modified: ' . wfTimestamp( TS_RFC2822, $info['mtime'] ) );

		if ( ( $flags & self::STREAM_ALLOW_OB ) == 0 ) {
			// Cancel output buffering and gzipping if set
			wfResetOutputBuffers();
		}

		$type = self::contentTypeFromPath( $fname );
		if ( $type && $type != 'unknown/unknown' ) {
			$headerFunc( "Content-type: $type" );
		} else {
			// Send a content type which is not known to Internet Explorer, to
			// avoid triggering IE's content type detection. Sending a standard
			// unknown content type here essentially gives IE license to apply
			// whatever content type it likes.
			$headerFunc( 'Content-type: application/x-wiki' );
		}

		// Don't send if client has up to date cache
		if ( isset( $optHeaders['if-modified-since'] ) ) {
			// Strip anything after a ";" before parsing the date
			$modsince = preg_replace( '/;.*$/', '', $optHeaders['if-modified-since'] );
			if ( wfTimestamp( TS_UNIX, $info['mtime'] ) <= strtotime( $modsince ) ) {
				ini_set( 'zlib.output_compression', 0 );
				$headerFunc( 304 );
				return true; // ok
			}
		}

		// Send additional headers
		foreach ( $headers as $header ) {
			header( $header ); // always use header(); specifically requested
		}

		$range = null;
		if ( isset( $optHeaders['range'] ) ) {
			$range = self::parseRange( $optHeaders['range'], $info['size'] );
			if ( $range === 'invalid' ) {
				if ( $sendErrors ) {
					$headerFunc( 416 );
					$headerFunc( 'Cache-Control: no-cache' );
					$headerFunc( 'Content-Type: text/html; charset=utf-8' );
					$headerFunc( 'Content-Range: bytes */' . $info['size'] );
				}
				return false;
			}
			if ( !is_array( $range ) ) {
				// unsupported Range request (e.g. multiple ranges): send everything
				$range = null;
			}
		}

		if ( $range === null ) {
			$headerFunc( 'Content-Length: ' . $info['size'] );

			return readfile( $fname ) !== false; // faster
		}

		$headerFunc( 206 );
		$headerFunc( 'Content-Length: ' . $range[2] );
		$headerFunc( "Content-Range: bytes {$range[0]}-{$range[1]}/{$info['size']}" );

		$handle = fopen( $fname, 'rb' );
		if ( !$handle ) {
			return false;
		}

		// Copy the requested window out in chunks of at most 8 KiB
		$ok = ( fseek( $handle, $range[0] ) === 0 );
		$remaining = $range[2];
		while ( $ok && $remaining > 0 ) {
			$bytes = min( $remaining, 8 * 1024 );
			$data = fread( $handle, $bytes );
			$remaining -= $bytes;
			$ok = ( $data !== false );
			if ( $ok ) {
				print $data;
			}
		}
		// Release the handle on every path and report read failures to the caller
		fclose( $handle );

		return $ok;
	}

	/**
	 * Send out a standard 404 message for a file
	 *
	 * The 404 status and headers are skipped when STREAM_HEADLESS is set; the
	 * HTML body is echoed in either case.
	 *
	 * @param string $fname Full name and path of the file to stream
	 * @param int $flags Bitfield of STREAM_* constants
	 * @since 1.24
	 */
	public static function send404Message( $fname, $flags = 0 ) {
		if ( ( $flags & self::STREAM_HEADLESS ) == 0 ) {
			HttpStatus::header( 404 );
			header( 'Cache-Control: no-cache' );
			header( 'Content-Type: text/html; charset=utf-8' );
		}
		// Both values end up in HTML output, so escape them first
		$encFile = htmlspecialchars( $fname );
		$encScript = htmlspecialchars( $_SERVER['SCRIPT_NAME'] );
		echo "<!DOCTYPE html><html><body>
			<h1>File not found</h1>
			<p>Although this PHP script ($encScript) exists, the file requested for output
			($encFile) does not.</p>
			</body></html>
			";
	}

	/**
	 * Convert a Range header value to an absolute (start, end, length) range tuple
	 *
	 * Only a single "bytes=START-END" range is understood; either bound may be
	 * omitted. A suffix range ("bytes=-N") longer than the file selects the
	 * whole file, as RFC 7233 section 2.1 requires.
	 *
	 * @param string $range Range header value
	 * @param int $size File size
	 * @return array|string Integer tuple (start, end, length) on success, or an
	 *  error string: 'invalid' for an unsatisfiable range, 'unrecognized' when
	 *  the header is not a single byte range (or the file is empty and the
	 *  range starts at 0), in which case the whole file should just be sent
	 * @since 1.24
	 */
	public static function parseRange( $range, $size ) {
		$m = [];
		if ( !preg_match( '#^bytes=(\d*)-(\d*)$#', $range, $m ) ) {
			return 'unrecognized';
		}

		list( , $start, $end ) = $m;
		if ( $start === '' && $end === '' ) {
			$absRange = [ 0, $size - 1 ];
		} elseif ( $start === '' ) {
			// Suffix range: the last $end bytes, clamped to the start of the file
			$absRange = [ max( 0, $size - $end ), $size - 1 ];
		} elseif ( $end === '' ) {
			$absRange = [ $start, $size - 1 ];
		} else {
			$absRange = [ $start, $end ];
		}

		if ( $absRange[0] >= 0 && $absRange[1] >= $absRange[0] ) {
			if ( $absRange[0] < $size ) {
				// Both bounds are now known to be below $size, so the casts
				// cannot overflow; they normalise regex strings to integers.
				$absRange[0] = (int)$absRange[0];
				$absRange[1] = (int)min( $absRange[1], $size - 1 ); // stop at EOF
				$absRange[2] = $absRange[1] - $absRange[0] + 1;
				return $absRange;
			} elseif ( $absRange[0] == 0 && $size == 0 ) {
				return 'unrecognized'; // the whole file should just be sent
			}
		}

		return 'invalid';
	}

	/**
	 * Determine the file type of a file based on the path
	 *
	 * Only the file extension is consulted; the file content is never opened.
	 *
	 * @param string $filename Storage path or file system path
	 * @param bool $safe Whether to do retroactive upload blacklist checks
	 * @return null|string
	 */
	public static function contentTypeFromPath( $filename, $safe = true ) {
		global $wgTrivialMimeDetection;

		// Lower-cased text after the last dot, or '' when there is no dot
		$ext = strrchr( $filename, '.' );
		$ext = $ext === false ? '' : strtolower( substr( $ext, 1 ) );

		# trivial detection by file extension,
		# used for thumbnails (thumb.php)
		if ( $wgTrivialMimeDetection ) {
			switch ( $ext ) {
				case 'gif':
					return 'image/gif';
				case 'png':
					return 'image/png';
				case 'jpg':
				case 'jpeg':
					return 'image/jpeg';
			}

			return 'unknown/unknown';
		}

		$magic = MimeMagic::singleton();
		// Use the extension only, rather than magic numbers, to avoid opening
		// up vulnerabilities due to uploads of files with allowed extensions
		// but disallowed types.
		$type = $magic->guessTypesForExtension( $ext );

		/**
		 * Double-check some security settings that were done on upload but might
		 * have changed since.
		 */
		if ( $safe ) {
			global $wgFileBlacklist, $wgCheckFileExtensions, $wgStrictFileExtensions,
				$wgFileExtensions, $wgVerifyMimeType, $wgMimeTypeBlacklist;
			list( , $extList ) = UploadBase::splitExtensions( $filename );
			if ( UploadBase::checkFileExtensionList( $extList, $wgFileBlacklist ) ) {
				return 'unknown/unknown';
			}
			if ( $wgCheckFileExtensions && $wgStrictFileExtensions
				&& !UploadBase::checkFileExtensionList( $extList, $wgFileExtensions )
			) {
				return 'unknown/unknown';
			}
			if ( $wgVerifyMimeType && in_array( strtolower( $type ), $wgMimeTypeBlacklist ) ) {
				return 'unknown/unknown';
			}
		}

		return $type;
	}
}