3 * Script to update image metadata records
5 * Usage: php rebuildImages.php [--missing] [--dry-run]
7 * --missing Crawl the uploads dir for images without records, and add them.
10 * Copyright (C) 2005 Brion Vibber <brion@pobox.com>
11 * http://www.mediawiki.org/
13 * This program is free software; you can redistribute it and/or modify
14 * it under the terms of the GNU General Public License as published by
15 * the Free Software Foundation; either version 2 of the License, or
16 * (at your option) any later version.
18 * This program is distributed in the hope that it will be useful,
19 * but WITHOUT ANY WARRANTY; without even the implied warranty of
20 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
21 * GNU General Public License for more details.
23 * You should have received a copy of the GNU General Public License along
24 * with this program; if not, write to the Free Software Foundation, Inc.,
25 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
26 * http://www.gnu.org/copyleft/gpl.html
28 * @author Brion Vibber <brion at pobox.com>
30 * @subpackage maintenance
// Option names recognised by this script.
// NOTE(review): this list is assigned before commandLine.inc is included, yet
// the code at the end of the file tests $options['missing'] and
// $options['dry-run'] by key; presumably the include rewrites $options into
// a keyed array. Confirm against commandLine.inc.
33 $options = array( 'missing', 'dry-run' );
35 require_once( 'commandLine.inc' );
36 require_once( 'FiveUpgrade.inc' );
/**
 * Rebuilds image metadata in the 'image' and 'oldimage' tables and can
 * insert 'image' rows for files discovered while crawling the upload
 * directory. Extends FiveUpgrade, whose constructor is invoked from this
 * class's constructor.
 */
38 class ImageBuilder
extends FiveUpgrade
{
/**
 * Constructor.
 *
 * @param bool $dryrun Stored in $this->dryrun; when true the update and
 *                     insert calls in this class are skipped.
 */
39 function ImageBuilder( $dryrun = false ) {
// Run the parent (FiveUpgrade) constructor before setting local state.
40 parent
::FiveUpgrade();
42 $this->maxLag
= 10; # if slaves are lagged more than 10 secs, wait
43 $this->dryrun
= $dryrun;
48 $this->buildOldImage();
/**
 * Store the bookkeeping values that progress() reads.
 *
 * @param mixed  $count Total number of rows; progress() divides by it.
 * @param string $table Table name, kept in $this->table.
 */
51 function init( $count, $table ) {
54 $this->count
= $count;
// Reference time used by progress() for elapsed-time and ETA calculations.
55 $this->startTime
= wfTime();
56 $this->table
= $table;
/**
 * Add to the updated-row tally and print a progress line with an ETA.
 *
 * @param int $updated Amount added to $this->updated; buildTable() passes
 *                     1 or 0.
 */
59 function progress( $updated ) {
60 $this->updated +
= $updated;
// True whenever the processed counter is not a multiple of 100.
62 if( $this->processed %
100 != 0 ) {
// Fraction of the expected rows handled so far.
65 $portion = $this->processed
/ $this->count
;
// Fraction of handled rows that were updated.
66 $updateRate = $this->updated
/ $this->processed
;
// Time elapsed since init() recorded $this->startTime.
69 $delta = $now - $this->startTime
;
// Linear extrapolation: total time = elapsed time / fraction done.
70 $estimatedTotalTime = $delta / $portion;
71 $eta = $this->startTime +
$estimatedTotalTime;
// $now and $eta are truncated with intval() and formatted through
// wfTimestamp( TS_DB, ... ); the update rate is printed as a percentage.
73 printf( "%s: %6.2f%% done on %s; ETA %s [%d/%d] %.2f/sec <%.2f%% updated>\n",
74 wfTimestamp( TS_DB
, intval( $now ) ),
77 wfTimestamp( TS_DB
, intval( $eta ) ),
81 $updateRate * 100.0 );
/**
 * Walk every row of a table, obtain replacement values from a callback and
 * write them back.
 *
 * @param string   $table    Table to process.
 * @param string   $key      Column whose value from the current row is passed
 *                           to update() as array( $key => $row->$key ).
 * @param callable $callback Invoked with each row object; an array result
 *                           enters the update branch.
 */
85 function buildTable( $table, $key, $callback ) {
86 $fname = 'ImageBuilder::buildTable';
// The row total is read through $this->dbw, while the rows themselves are
// fetched through $this->dbr below.
88 $count = $this->dbw
->selectField( $table, 'count(*)', '', $fname );
89 $this->init( $count, $table );
90 $this->log( "Processing $table..." );
92 $tableName = $this->dbr
->tableName( $table );
93 $sql = "SELECT * FROM $tableName";
94 $result = $this->dbr
->query( $sql, $fname );
// Assignment inside the condition: the loop ends once fetchObject()
// returns a falsy value.
96 while( $row = $this->dbr
->fetchObject( $result ) ) {
97 $update = call_user_func( $callback, $row );
98 if( is_array( $update ) ) {
// Dry-run mode skips the database write.
99 if( !$this->dryrun
) {
100 $this->dbw
->update( $table,
102 array( $key => $row->$key ),
// Report one updated row to the progress tracker.
105 $this->progress( 1 );
// Report a row for which nothing was updated.
107 $this->progress( 0 );
// Summary line; $this->updated and $this->processed are interpolated.
110 $this->log( "Finished $table... $this->updated of $this->processed rows updated" );
// Release the result set obtained from query().
111 $this->dbr
->freeResult( $result );
/**
 * Process the 'image' table, identifying rows by img_name and using
 * imageCallback() to compute the new values.
 */
114 function buildImage() {
// Callback in array( object, method name ) form, invoked by buildTable()
// through call_user_func().
115 $callback = array( &$this, 'imageCallback' );
116 $this->buildTable( 'image', 'img_name', $callback );
/**
 * Row callback used for the 'image' table.
 *
 * @param object $row Row from the image table; img_width and img_name are
 *                    read from it.
 */
119 function imageCallback( $row ) {
// Branch on whether the row already carries a truthy img_width.
120 if( $row->img_width
) {
125 // Fill in the new image info fields
126 $info = $this->imageInfo( $row->img_name
);
// Delete the cache entry keyed DBNAME:Image:MD5(image name).
128 global $wgMemc, $wgDBname;
129 $key = $wgDBname . ":Image:" . md5( $row->img_name
);
130 $wgMemc->delete( $key );
// Column => value pairs taken from the imageInfo() result.
133 'img_width' => $info['width'],
134 'img_height' => $info['height'],
135 'img_bits' => $info['bits'],
136 'img_media_type' => $info['media'],
137 'img_major_mime' => $info['major'],
138 'img_minor_mime' => $info['minor'] );
/**
 * Process the 'oldimage' table, identifying rows by oi_archive_name and
 * using oldimageCallback() to compute the new values.
 */
142 function buildOldImage() {
143 $this->buildTable( 'oldimage', 'oi_archive_name',
144 array( &$this, 'oldimageCallback' ) );
/**
 * Row callback used for the 'oldimage' table.
 *
 * @param object $row Row from the oldimage table; oi_width, oi_archive_name
 *                    and oi_name are read from it.
 */
147 function oldimageCallback( $row ) {
// Branch on whether the row already carries a truthy oi_width.
148 if( $row->oi_width
) {
152 // Fill in the new image info fields
// imageInfo() receives the archive name, the string 'wfImageArchiveDir' and
// the value of oi_name.
153 $info = $this->imageInfo( $row->oi_archive_name
, 'wfImageArchiveDir', $row->oi_name
);
// Column => value pairs taken from the imageInfo() result.
155 'oi_width' => $info['width' ],
156 'oi_height' => $info['height'],
157 'oi_bits' => $info['bits' ] );
/**
 * Crawl the upload directory tree via crawlDirectory().
 *
 * Reads the globals $wgUploadDirectory and $wgHashedUploadDirectory.
 */
160 function crawlMissing() {
161 global $wgUploadDirectory, $wgHashedUploadDirectory;
162 if( $wgHashedUploadDirectory ) {
// Two nested loops over 0..15: 256 directory candidates in total.
163 for( $i = 0; $i < 16; $i++
) {
164 for( $j = 0; $j < 16; $j++
) {
// Format: two strings, one hex digit, a string, then a zero-padded
// two-digit hex value.
165 $dir = sprintf( '%s%s%01x%s%02x',
171 $this->crawlDirectory( $dir );
// Crawl the upload directory root itself.
175 $this->crawlDirectory( $wgUploadDirectory );
/**
 * Read the entries of one directory and pass them to checkMissingImage().
 *
 * Each guard below logs a message and returns the result of $this->log()
 * when $dir is missing, is not a directory, is unreadable or cannot be
 * opened.
 *
 * @param string $dir Directory path to scan.
 */
179 function crawlDirectory( $dir ) {
180 if( !file_exists( $dir ) ) {
181 return $this->log( "no directory, skipping $dir" );
183 if( !is_dir( $dir ) ) {
184 return $this->log( "not a directory?! skipping $dir" );
186 if( !is_readable( $dir ) ) {
187 return $this->log( "dir not readable, skipping $dir" );
189 $source = opendir( $dir );
190 if( $source === false ) {
191 return $this->log( "couldn't open dir, skipping $dir" );
194 $this->log( "crawling $dir" );
// Strict comparison against false so that an entry name such as "0" does
// not end the loop early.
195 while( false !== ( $filename = readdir( $source ) ) ) {
// Entry name joined to the directory with the platform separator.
196 $fullpath = $dir . DIRECTORY_SEPARATOR
. $filename;
197 if( is_dir( $fullpath ) ) {
200 if( is_link( $fullpath ) ) {
201 $this->log( "skipping symlink at $fullpath" );
204 $this->checkMissingImage( $filename, $fullpath );
/**
 * Query the image table for a row whose img_name equals the file name and
 * hand the file to addMissingImage().
 * NOTE(review): presumably addMissingImage() runs only when no row was
 * found; confirm against the branch condition.
 *
 * @param string $filename Bare file name, compared against img_name.
 * @param string $fullpath Path of the file, forwarded to addMissingImage().
 */
209 function checkMissingImage( $filename, $fullpath ) {
210 $fname = 'ImageBuilder::checkMissingImage';
// The lookup is issued on $this->dbw.
211 $row = $this->dbw
->selectRow( 'image',
213 array( 'img_name' => $filename ),
217 // already known, move on
220 $this->addMissingImage( $filename, $fullpath );
/**
 * Build an image-table row for a file found on disk and insert it unless
 * running in dry-run mode.
 *
 * @param string $filename File name; becomes img_name after any transcoding.
 * @param string $fullpath Path used for filesize(), filemtime() and logging.
 */
224 function addMissingImage( $filename, $fullpath ) {
225 $fname = 'ImageBuilder::addMissingImage';
227 $size = filesize( $fullpath );
228 $info = $this->imageInfo( $filename );
// File modification time, converted by the database object's timestamp().
229 $timestamp = $this->dbw
->timestamp( filemtime( $fullpath ) );
// checkTitleEncoding() may hand back a name that differs from its input.
232 $altname = $wgContLang->checkTitleEncoding( $filename );
233 if( $altname != $filename ) {
// Dry run: adopt the alternative name and only log it.
234 if( $this->dryrun
) {
235 $filename = $altname;
236 $this->log( "Estimating transcoding... $altname" );
// Name returned by renameFile() (presumably the non-dry-run path; confirm).
238 $filename = $this->renameFile( $filename );
// Log files whose resulting name is empty.
242 if( $filename == '' ) {
243 $this->log( "Empty filename for $fullpath" );
// Column values for the new row.
248 'img_name' => $filename,
250 'img_width' => $info['width'],
251 'img_height' => $info['height'],
252 'img_metadata' => '', // filled in on-demand
253 'img_bits' => $info['bits'],
254 'img_media_type' => $info['media'],
255 'img_major_mime' => $info['major'],
256 'img_minor_mime' => $info['minor'],
257 'img_description' => '(recovered file, missing upload log entry)',
259 'img_user_text' => 'Conversion script',
260 'img_timestamp' => $timestamp );
// Skip the insert in dry-run mode.
261 if( !$this->dryrun
) {
262 $this->dbw
->insert( 'image', $fields, $fname );
// Log the path of the handled file.
264 $this->log( $fullpath );
// Dry-run mode is on when $options has a 'dry-run' key.
268 $builder = new ImageBuilder( isset( $options['dry-run'] ) );
// With the 'missing' option set, crawl the upload directory.
269 if( isset( $options['missing'] ) ) {
270 $builder->crawlMissing();