Merge "(bug 49840) Moving a page with subpages may lead in the page being moved twice"
[lhc/web/wiklou.git] / includes / media / MediaHandler.php
1 <?php
2 /**
3 * Media-handling base classes and generic functionality.
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
19 *
20 * @file
21 * @ingroup Media
22 */
23
/**
 * Base media handler class.
 *
 * Handler classes are registered per MIME type in $wgMediaHandlers and are
 * obtained through MediaHandler::getHandler(). Subclasses must implement the
 * abstract parameter, image-size and transform methods; every other method
 * has a generic default that may be overridden.
 *
 * @ingroup Media
 */
abstract class MediaHandler {
	/** Flag for doTransform(): describe the output but do not render it yet. */
	const TRANSFORM_LATER = 1;
	/** isMetadataValid() result: the stored metadata is fine. */
	const METADATA_GOOD = true;
	/** isMetadataValid() result: the stored metadata must be regenerated. */
	const METADATA_BAD = false;
	/** isMetadataValid() result: old but backwards compatible metadata. */
	const METADATA_COMPATIBLE = 2;

	/**
	 * Instance cache, keyed by handler class name.
	 * A value of false marks a handler class that reported itself disabled.
	 */
	public static $handlers = array();

	/**
	 * Get a MediaHandler for a given MIME type from the instance cache
	 *
	 * @param $type string MIME type, used as key into $wgMediaHandlers
	 *
	 * @return MediaHandler|bool The handler, or false if no handler is
	 *   registered for the type or the registered handler is disabled
	 */
	public static function getHandler( $type ) {
		global $wgMediaHandlers;
		if ( !isset( $wgMediaHandlers[$type] ) ) {
			wfDebug( __METHOD__ . ": no handler found for $type.\n" );
			return false;
		}
		$class = $wgMediaHandlers[$type];
		// isset() is also true for a cached false, so a disabled handler is
		// only instantiated (and asked isEnabled()) once.
		if ( !isset( self::$handlers[$class] ) ) {
			self::$handlers[$class] = new $class;
			if ( !self::$handlers[$class]->isEnabled() ) {
				self::$handlers[$class] = false;
			}
		}
		return self::$handlers[$class];
	}

	/**
	 * Get an associative array mapping magic word IDs to parameter names.
	 * Will be used by the parser to identify parameters.
	 */
	abstract public function getParamMap();

	/**
	 * Validate a thumbnail parameter at parse time.
	 * Return true to accept the parameter, and false to reject it.
	 * If you return false, the parser will do something quiet and forgiving.
	 *
	 * @param $name
	 * @param $value
	 */
	abstract public function validateParam( $name, $value );

	/**
	 * Merge a parameter array into a string appropriate for inclusion in filenames
	 *
	 * @param $params array Array of parameters that have been through normaliseParams.
	 */
	abstract public function makeParamString( $params );

	/**
	 * Parse a param string made with makeParamString back into an array
	 *
	 * @param $str string
	 */
	abstract public function parseParamString( $str );

	/**
	 * Changes the parameter array as necessary, ready for transformation.
	 * Should be idempotent.
	 * Returns false if the parameters are unacceptable and the transform should fail
	 *
	 * @param $image
	 * @param $params array Parameter array, modified in place
	 */
	abstract public function normaliseParams( $image, &$params );

	/**
	 * Get an image size array like that returned by getimagesize(), or false if it
	 * can't be determined.
	 *
	 * @param $image File: the image object, or false if there isn't one
	 * @param string $path the filename
	 * @return Array|bool Follow the format of PHP getimagesize() internal function.
	 *   See http://www.php.net/getimagesize
	 */
	abstract public function getImageSize( $image, $path );

	/**
	 * Get handler-specific metadata which will be saved in the img_metadata field.
	 *
	 * The base implementation stores nothing and returns an empty string.
	 *
	 * @param $image File: the image object, or false if there isn't one.
	 *   Warning, FSFile::getPropsFromPath might pass an (object)array() instead (!)
	 * @param string $path the filename
	 * @return String
	 */
	public function getMetadata( $image, $path ) {
		return '';
	}

	/**
	 * Get metadata version.
	 *
	 * This is not used for validating metadata, this is used for the api when returning
	 * metadata, since api content formats should stay the same over time, and so things
	 * using ForeignAPIRepo can keep backwards compatibility
	 *
	 * All core media handlers share a common version number, and extensions can
	 * use the GetMetadataVersion hook to append to the array (they should append a unique
	 * string so not to get confusing). If there was a media handler named 'foo' with metadata
	 * version 3 it might add to the end of the array the element 'foo=3'. if the core metadata
	 * version is 2, the end version string would look like '2;foo=3'.
	 *
	 * @return string version string
	 */
	public static function getMetadataVersion() {
		$version = array( '2' ); // core metadata version
		wfRunHooks( 'GetMetadataVersion', array( &$version ) );
		return implode( ';', $version );
	}

	/**
	 * Convert metadata version.
	 *
	 * By default just returns $metadata (unserialized first when it is not
	 * already an array), but can be used to allow media handlers to convert
	 * between metadata versions. The base implementation ignores $version.
	 *
	 * @param $metadata Mixed String or Array metadata array (serialized if string)
	 * @param $version Integer target version
	 * @return Array|bool Metadata array; the result of unserialize() when a
	 *   string was given, which is false if the string cannot be unserialized.
	 */
	public function convertMetadataVersion( $metadata, $version = 1 ) {
		if ( is_array( $metadata ) ) {
			return $metadata;
		}

		// Unserialize to keep the return type consistent; warnings caused by
		// malformed input are suppressed.
		wfSuppressWarnings();
		$ret = unserialize( $metadata );
		wfRestoreWarnings();
		return $ret;
	}

	/**
	 * Get a string describing the type of metadata, for display purposes.
	 *
	 * @param $image File
	 * @return string|bool The base implementation returns false
	 */
	public function getMetadataType( $image ) {
		return false;
	}

	/**
	 * Check if the metadata string is valid for this handler.
	 * If it returns MediaHandler::METADATA_BAD (or false), Image
	 * will reload the metadata from the file and update the database.
	 * MediaHandler::METADATA_GOOD for if the metadata is a-ok,
	 * MediaHandler::METADATA_COMPATIBLE if metadata is old but backwards
	 * compatible (which may or may not trigger a metadata reload).
	 *
	 * @param $image File
	 * @param $metadata string
	 * @return bool|int One of the METADATA_* constants; the base
	 *   implementation always returns METADATA_GOOD
	 */
	public function isMetadataValid( $image, $metadata ) {
		return self::METADATA_GOOD;
	}

	/**
	 * Get a MediaTransformOutput object representing an alternate of the transformed
	 * output which will call an intermediary thumbnail assist script.
	 *
	 * Used when the repository has a thumbnailScriptUrl option configured.
	 *
	 * Return false to fall back to the regular getTransform().
	 *
	 * @param $image File
	 * @param $script
	 * @param $params array
	 * @return MediaTransformOutput|bool The base implementation returns false
	 */
	public function getScriptedTransform( $image, $script, $params ) {
		return false;
	}

	/**
	 * Get a MediaTransformOutput object representing the transformed output. Does not
	 * actually do the transform.
	 *
	 * This is doTransform() called with the self::TRANSFORM_LATER flag.
	 *
	 * @param $image File: the image object
	 * @param string $dstPath filesystem destination path
	 * @param string $dstUrl Destination URL to use in output HTML
	 * @param array $params Arbitrary set of parameters validated by $this->validateParam()
	 * @return MediaTransformOutput
	 */
	final public function getTransform( $image, $dstPath, $dstUrl, $params ) {
		return $this->doTransform( $image, $dstPath, $dstUrl, $params, self::TRANSFORM_LATER );
	}

	/**
	 * Get a MediaTransformOutput object representing the transformed output. Does the
	 * transform unless $flags contains self::TRANSFORM_LATER.
	 *
	 * @param $image File: the image object
	 * @param string $dstPath filesystem destination path
	 * @param string $dstUrl destination URL to use in output HTML
	 * @param array $params arbitrary set of parameters validated by $this->validateParam()
	 *   Note: These parameters have *not* gone through $this->normaliseParams()
	 * @param $flags Integer: a bitfield, may contain self::TRANSFORM_LATER
	 *
	 * @return MediaTransformOutput
	 */
	abstract public function doTransform( $image, $dstPath, $dstUrl, $params, $flags = 0 );

	/**
	 * Get the thumbnail extension and MIME type for a given source MIME type
	 *
	 * @param String $ext Extension of original file
	 * @param String $mime Mime type of original file
	 * @param Array $params Handler specific rendering parameters (unused by
	 *   the base implementation)
	 * @return array thumbnail extension and MIME type
	 */
	public function getThumbType( $ext, $mime, $params = null ) {
		$magic = MimeMagic::singleton();
		if ( !$ext || $magic->isMatchingExtension( $ext, $mime ) === false ) {
			// The extension is not valid for this mime type and we do
			// recognize the mime type
			$extensions = $magic->getExtensionsForType( $mime );
			if ( $extensions ) {
				// The list is space separated; use its first entry.
				return array( strtok( $extensions, ' ' ), $mime );
			}
		}

		// The extension is correct (true) or the mime type is unknown to
		// MediaWiki (null)
		return array( $ext, $mime );
	}

	/**
	 * Get useful response headers for GET/HEAD requests for a file with the given metadata
	 *
	 * @param $metadata mixed Result of the getMetadata() function of this handler for a file
	 * @return Array The base implementation returns an empty array
	 */
	public function getStreamHeaders( $metadata ) {
		return array();
	}

	/**
	 * True if the handled types can be transformed
	 *
	 * @param $file File
	 * @return bool
	 */
	public function canRender( $file ) {
		return true;
	}

	/**
	 * True if handled types cannot be displayed directly in a browser
	 * but can be rendered
	 *
	 * @param $file File
	 * @return bool
	 */
	public function mustRender( $file ) {
		return false;
	}

	/**
	 * True if the type has multi-page capabilities
	 *
	 * @param $file File
	 * @return bool
	 */
	public function isMultiPage( $file ) {
		return false;
	}

	/**
	 * Page count for a multi-page document, false if unsupported or unknown
	 *
	 * @param $file File
	 * @return int|bool The base implementation returns false
	 */
	public function pageCount( $file ) {
		return false;
	}

	/**
	 * The material is vectorized and thus scaling is lossless
	 *
	 * @param $file File
	 * @return bool
	 */
	public function isVectorized( $file ) {
		return false;
	}

	/**
	 * The material is an image, and is animated.
	 * In particular, video material need not return true.
	 * @note Before 1.20, this was a method of ImageHandler only
	 *
	 * @param $file File
	 * @return bool
	 */
	public function isAnimatedImage( $file ) {
		return false;
	}

	/**
	 * If the material is animated, we can animate the thumbnail
	 * @since 1.20
	 *
	 * @param $file File
	 * @return bool If material is not animated, handler may return any value.
	 */
	public function canAnimateThumbnail( $file ) {
		return true;
	}

	/**
	 * False if the handler is disabled for all files
	 *
	 * @return bool
	 */
	public function isEnabled() {
		return true;
	}

	/**
	 * Get an associative array of page dimensions
	 * Currently "width" and "height" are understood, but this might be
	 * expanded in the future.
	 * Returns false if unknown or if the document is not multi-page.
	 *
	 * @param $image File
	 * @param $page Unused, left for backcompatibility?
	 * @return array|bool
	 */
	public function getPageDimensions( $image, $page ) {
		$gis = $this->getImageSize( $image, $image->getLocalRefPath() );
		if ( !$gis ) {
			// getImageSize() signals "can't be determined" with false; pass
			// that on instead of building an array of nulls.
			return false;
		}
		return array(
			'width' => $gis[0],
			'height' => $gis[1]
		);
	}

	/**
	 * Generic getter for text layer.
	 * Currently overloaded by PDF and DjVu handlers
	 *
	 * @param $image File
	 * @param $page
	 * @return bool The base implementation returns false
	 */
	public function getPageText( $image, $page ) {
		return false;
	}

	/**
	 * Get an array structure that looks like this:
	 *
	 * array(
	 *    'visible' => array(
	 *       'Human-readable name' => 'Human readable value',
	 *       ...
	 *    ),
	 *    'collapsed' => array(
	 *       'Human-readable name' => 'Human readable value',
	 *       ...
	 *    )
	 * )
	 * The UI will format this into a table where the visible fields are always
	 * visible, and the collapsed fields are optionally visible.
	 *
	 * The function should return false if there is no metadata to display.
	 *
	 * @todo FIXME: I don't really like this interface, it's not very flexible
	 * I think the media handler should generate HTML instead. It can do
	 * all the formatting according to some standard. That makes it possible
	 * to do things like visual indication of grouped and chained streams
	 * in ogg container files.
	 *
	 * @param $image File
	 * @return array|bool The base implementation returns false
	 */
	public function formatMetadata( $image ) {
		return false;
	}

	/**
	 * Sorts the visible/invisible field.
	 * Split off from ImageHandler::formatMetadata, as used by more than
	 * one type of handler.
	 *
	 * This is used by the media handlers that use the FormatMetadata class
	 *
	 * @param array $metadataArray metadata array
	 * @return array for use displaying metadata.
	 */
	public function formatMetadataHelper( $metadataArray ) {
		$result = array(
			'visible' => array(),
			'collapsed' => array()
		);

		$formatted = FormatMetadata::getFormattedData( $metadataArray );
		// Sort fields into visible and collapsed. Both the tag and the list
		// returned by visibleMetadataFields() are lower-cased strings, so a
		// strict comparison is safe.
		$visibleFields = $this->visibleMetadataFields();
		foreach ( $formatted as $name => $value ) {
			$tag = strtolower( $name );
			self::addMeta( $result,
				in_array( $tag, $visibleFields, true ) ? 'visible' : 'collapsed',
				'exif',
				$tag,
				$value
			);
		}
		return $result;
	}

	/**
	 * Get a list of metadata items which should be displayed when
	 * the metadata table is collapsed.
	 *
	 * The list is read from the 'metadata-fields' message in the content
	 * language: every line of the form "* name" contributes one lower-cased
	 * field name.
	 *
	 * @return array of strings
	 * @access protected
	 */
	public function visibleMetadataFields() {
		$fields = array();
		$lines = explode( "\n", wfMessage( 'metadata-fields' )->inContentLanguage()->text() );
		foreach ( $lines as $line ) {
			$matches = array();
			if ( preg_match( '/^\\*\s*(.*?)\s*$/', $line, $matches ) ) {
				$fields[] = $matches[1];
			}
		}
		$fields = array_map( 'strtolower', $fields );
		return $fields;
	}

	/**
	 * This is used to generate an array element for each metadata value
	 * That array is then used to generate the table of metadata values
	 * on the image page
	 *
	 * @param &$array Array An array containing elements for each type of visibility
	 *   and each of those elements being an array of metadata items. This function adds
	 *   a value to that array.
	 * @param string $visibility ('visible' or 'collapsed') if this value is hidden
	 *   by default.
	 * @param string $type type of metadata tag (currently always 'exif')
	 * @param string $id the name of the metadata tag (like 'artist' for example).
	 *   its name in the table displayed is the message "$type-$id" (Ex exif-artist ).
	 * @param string $value thingy goes into a wikitext table; it used to be escaped but
	 *   that was incompatible with previous practise of customized display
	 *   with wikitext formatting via messages such as 'exif-model-value'.
	 *   So the escaping is taken back out, but generally this seems a confusing
	 *   interface.
	 * @param string $param value to pass to the message for the name of the field
	 *   as $1. Currently this parameter doesn't seem to ever be used.
	 *
	 * Note, everything here is passed through the parser later on (!)
	 */
	protected static function addMeta( &$array, $visibility, $type, $id, $value, $param = false ) {
		$msg = wfMessage( "$type-$id", $param );
		if ( $msg->exists() ) {
			$name = $msg->text();
		} else {
			// This is for future compatibility when using instant commons.
			// So as to not display as ugly a name if a new metadata
			// property is defined that we don't know about
			// (not a major issue since such a property would be collapsed
			// by default).
			wfDebug( __METHOD__ . ' Unknown metadata name: ' . $id . "\n" );
			$name = wfEscapeWikiText( $id );
		}
		$array[$visibility][] = array(
			'id' => "$type-$id",
			'name' => $name,
			'value' => $value
		);
	}

	/**
	 * Short description. Shown on Special:Search results.
	 *
	 * @param $file File
	 * @return string HTML-escaped formatted file size
	 */
	public function getShortDesc( $file ) {
		global $wgLang;
		return htmlspecialchars( $wgLang->formatSize( $file->getSize() ) );
	}

	/**
	 * Long description. Shown under image on image description page surrounded by ().
	 *
	 * @param $file File
	 * @return string Parsed 'file-info' message
	 */
	public function getLongDesc( $file ) {
		global $wgLang;
		return wfMessage( 'file-info', htmlspecialchars( $wgLang->formatSize( $file->getSize() ) ),
			$file->getMimeType() )->parse();
	}

	/**
	 * Used instead of getShortDesc if there is no handler registered for file.
	 *
	 * @param $file File
	 * @return string HTML-escaped formatted file size
	 */
	public static function getGeneralShortDesc( $file ) {
		global $wgLang;
		// Escaped the same way as getShortDesc() so both variants can be
		// used interchangeably by callers.
		return htmlspecialchars( $wgLang->formatSize( $file->getSize() ) );
	}

	/**
	 * Used instead of getLongDesc if there is no handler registered for file.
	 *
	 * @param $file File
	 * @return string Parsed 'file-info' message
	 */
	public static function getGeneralLongDesc( $file ) {
		global $wgLang;
		// Size is escaped the same way as in getLongDesc().
		return wfMessage( 'file-info', htmlspecialchars( $wgLang->formatSize( $file->getSize() ) ),
			$file->getMimeType() )->parse();
	}

	/**
	 * Calculate the largest thumbnail width for a given original file size
	 * such that the thumbnail's height is at most $maxHeight.
	 *
	 * $boxWidth and $boxHeight are both used as divisors and must therefore
	 * be non-zero.
	 *
	 * @param $boxWidth Integer Width of the thumbnail box.
	 * @param $boxHeight Integer Height of the thumbnail box.
	 * @param $maxHeight Integer Maximum height expected for the thumbnail.
	 * @return Integer.
	 */
	public static function fitBoxWidth( $boxWidth, $boxHeight, $maxHeight ) {
		$idealWidth = $boxWidth * $maxHeight / $boxHeight;
		$roundedUp = ceil( $idealWidth );
		// Rounding the width up may push the resulting (rounded) height over
		// the limit; in that case fall back to rounding the width down.
		if ( round( $roundedUp * $boxHeight / $boxWidth ) > $maxHeight ) {
			$width = floor( $idealWidth );
		} else {
			$width = $roundedUp;
		}
		// ceil()/floor() yield floats; hand back the documented integer.
		return (int)$width;
	}

	/**
	 * Shown in file history box on image description page.
	 *
	 * @param File $file
	 * @return String Dimensions; the base implementation returns an empty string
	 */
	public function getDimensionsString( $file ) {
		return '';
	}

	/**
	 * Modify the parser object post-transform.
	 *
	 * This is often used to do $parser->addOutputHook(),
	 * in order to add some javascript to render a viewer.
	 * See TimedMediaHandler or OggHandler for an example.
	 *
	 * @param Parser $parser
	 * @param File $file
	 */
	public function parserTransformHook( $parser, $file ) {
	}

	/**
	 * File validation hook called on upload.
	 *
	 * If the file at the given local path is not valid, or its MIME type does not
	 * match the handler class, a Status object should be returned containing
	 * relevant errors.
	 *
	 * @param string $fileName The local path to the file.
	 * @return Status object; the base implementation always returns a good status
	 */
	public function verifyUpload( $fileName ) {
		return Status::newGood();
	}

	/**
	 * Check for zero-sized thumbnails. These can be generated when
	 * no disk space is available or some other error occurs
	 *
	 * @param string $dstPath The location of the suspect file
	 * @param int $retval Return value of some shell process, file will be deleted if this is non-zero
	 * @return bool True if the file existed and was judged bad, in which case
	 *   its removal was attempted (the outcome of unlink() is only logged);
	 *   false otherwise
	 */
	public function removeBadFile( $dstPath, $retval = 0 ) {
		if ( file_exists( $dstPath ) ) {
			$thumbstat = stat( $dstPath );
			if ( $thumbstat['size'] == 0 || $retval != 0 ) {
				$result = unlink( $dstPath );

				wfDebugLog( 'thumbnail',
					sprintf( 'Removing bad %d-byte thumbnail "%s". unlink() %s',
						$thumbstat['size'], $dstPath, $result ? 'succeeded' : 'failed' ) );
				return true;
			}
		}
		return false;
	}

	/**
	 * Remove files from the purge list.
	 *
	 * This is used by some video handlers to prevent ?action=purge
	 * from removing a transcoded video, which is expensive to
	 * regenerate.
	 *
	 * @see LocalFile::purgeThumbnails
	 *
	 * @param array $files List of files, passed by reference so that
	 *   handlers can remove entries
	 * @param array $options Purge options. Currently will always be
	 *   an array with a single key 'forThumbRefresh' set to true.
	 */
	public function filterThumbnailPurgeList( &$files, $options ) {
		// Do nothing
	}

	/**
	 * True if the handler can rotate the media
	 * @since 1.21
	 *
	 * @return bool
	 */
	public static function canRotate() {
		return false;
	}
}