Merge "Put callback function within class in SiteConfigurationTest"
[lhc/web/wiklou.git] / includes / GlobalFunctions.php
1 <?php
2 /**
3 * Global functions used everywhere.
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
19 *
20 * @file
21 */
22
// Abort unless the MEDIAWIKI constant is defined: this file is not a valid
// entry point on its own.
if ( defined( 'MEDIAWIKI' ) === false ) {
	die( "This file is part of MediaWiki, it is not a valid entry point" );
}
26
27 // Hide compatibility functions from Doxygen
28 /// @cond
29
30 /**
31 * Compatibility functions
32 *
33 * We support PHP 5.3.2 and up.
34 * Re-implementations of newer functions or functions in non-standard
35 * PHP extensions may be included here.
36 */
37
if ( function_exists( 'iconv' ) === false ) {
	/**
	 * Stand-in used only when no iconv() function is defined yet.
	 * Forwards all three arguments, unchanged, to Fallback::iconv().
	 *
	 * @codeCoverageIgnore
	 * @param $from Mixed: passed through as first argument
	 * @param $to Mixed: passed through as second argument
	 * @param $string Mixed: passed through as third argument
	 * @return string
	 */
	function iconv( $from, $to, $string ) {
		$converted = Fallback::iconv( $from, $to, $string );
		return $converted;
	}
}
47
if ( function_exists( 'mb_substr' ) === false ) {
	/**
	 * Stand-in used only when no mb_substr() function is defined yet.
	 * Forwards its arguments to Fallback::mb_substr().
	 *
	 * @codeCoverageIgnore
	 * @param $str Mixed: passed through as first argument
	 * @param $start Mixed: passed through as second argument
	 * @param $count Mixed: passed through as third argument (default 'end')
	 * @return string
	 */
	function mb_substr( $str, $start, $count = 'end' ) {
		$piece = Fallback::mb_substr( $str, $start, $count );
		return $piece;
	}

	/**
	 * Companion helper declared together with the mb_substr() stand-in.
	 * Forwards its arguments to Fallback::mb_substr_split_unicode().
	 *
	 * @codeCoverageIgnore
	 * @param $str Mixed: passed through as first argument
	 * @param $splitPos Mixed: passed through as second argument
	 * @return int
	 */
	function mb_substr_split_unicode( $str, $splitPos ) {
		$position = Fallback::mb_substr_split_unicode( $str, $splitPos );
		return $position;
	}
}
65
if ( function_exists( 'mb_strlen' ) === false ) {
	/**
	 * Stand-in used only when no mb_strlen() function is defined yet.
	 * Forwards its arguments to Fallback::mb_strlen().
	 *
	 * @codeCoverageIgnore
	 * @param $str Mixed: passed through as first argument
	 * @param $enc Mixed: passed through as second argument (default '')
	 * @return int
	 */
	function mb_strlen( $str, $enc = '' ) {
		$length = Fallback::mb_strlen( $str, $enc );
		return $length;
	}
}
75
if ( function_exists( 'mb_strpos' ) === false ) {
	/**
	 * Stand-in used only when no mb_strpos() function is defined yet.
	 * Forwards its arguments to Fallback::mb_strpos().
	 *
	 * @codeCoverageIgnore
	 * @param $haystack Mixed: passed through as first argument
	 * @param $needle Mixed: passed through as second argument
	 * @param $offset Mixed: passed through as third argument (default 0)
	 * @param $encoding Mixed: passed through as fourth argument (default '')
	 * @return int
	 */
	function mb_strpos( $haystack, $needle, $offset = 0, $encoding = '' ) {
		$position = Fallback::mb_strpos( $haystack, $needle, $offset, $encoding );
		return $position;
	}
}
85
if ( function_exists( 'mb_strrpos' ) === false ) {
	/**
	 * Stand-in used only when no mb_strrpos() function is defined yet.
	 * Forwards its arguments to Fallback::mb_strrpos().
	 *
	 * @codeCoverageIgnore
	 * @param $haystack Mixed: passed through as first argument
	 * @param $needle Mixed: passed through as second argument
	 * @param $offset Mixed: passed through as third argument (default 0)
	 * @param $encoding Mixed: passed through as fourth argument (default '')
	 * @return int
	 */
	function mb_strrpos( $haystack, $needle, $offset = 0, $encoding = '' ) {
		$position = Fallback::mb_strrpos( $haystack, $needle, $offset, $encoding );
		return $position;
	}
}
95
// gzdecode function only exists in PHP >= 5.4.0
// http://php.net/gzdecode
if ( !function_exists( 'gzdecode' ) ) {
	/**
	 * Fallback gzdecode(): strip the gzip wrapper from $data and inflate
	 * the raw deflate payload with gzinflate().
	 *
	 * A gzip member (RFC 1952) starts with a fixed 10-byte header whose
	 * fourth byte is a flag field announcing optional header parts, and
	 * ends with an 8-byte trailer. The optional parts are skipped here so
	 * that streams carrying e.g. an original file name decode correctly
	 * instead of feeding header bytes to gzinflate().
	 *
	 * @codeCoverageIgnore
	 * @param string $data gzip-encoded data
	 * @return string|bool Decoded data, or false if the data is too short,
	 *   the header is truncated, or gzinflate() fails
	 */
	function gzdecode( $data ) {
		$length = strlen( $data );
		// Fixed header (10 bytes) plus trailer (8 bytes) is the bare minimum
		if ( $length < 18 ) {
			return false;
		}

		$flags = ord( $data[3] );
		$offset = 10;

		// FEXTRA (0x04): two-byte little-endian length, then that many bytes
		if ( $flags & 0x04 ) {
			$extra = unpack( 'v', substr( $data, $offset, 2 ) );
			$offset += 2 + $extra[1];
		}

		// FNAME (0x08) and FCOMMENT (0x10): zero-terminated strings, in that order
		foreach ( array( 0x08, 0x10 ) as $flag ) {
			if ( $flags & $flag ) {
				$terminator = ( $offset < $length ) ? strpos( $data, "\0", $offset ) : false;
				if ( $terminator === false ) {
					return false;
				}
				$offset = $terminator + 1;
			}
		}

		// FHCRC (0x02): two-byte header checksum
		if ( $flags & 0x02 ) {
			$offset += 2;
		}

		// The payload must end before the 8-byte trailer begins
		if ( $offset > $length - 8 ) {
			return false;
		}

		return gzinflate( substr( $data, $offset, -8 ) );
	}
}
107 /// @endcond
108
/**
 * array_diff() variant for two-dimensional arrays: elements are compared
 * with wfArrayDiff2_cmp() through array_udiff().
 *
 * @param array $a Array to take elements from
 * @param array $b Array of elements to exclude
 * @return array Result of array_udiff( $a, $b, 'wfArrayDiff2_cmp' )
 */
function wfArrayDiff2( $a, $b ) {
	$comparator = 'wfArrayDiff2_cmp';
	$difference = array_udiff( $a, $b, $comparator );
	return $difference;
}
118
/**
 * Comparison callback for wfArrayDiff2().
 *
 * Two strings are compared with strcmp(). Otherwise both operands are
 * treated as rows: the shorter row sorts first, and rows of equal length
 * are compared value by value (in iteration order, keys ignored) with
 * strcmp() until a difference is found.
 *
 * Implemented without each(), which was removed in PHP 8.0, and without
 * calling count() on a non-array operand.
 *
 * @param array|string $a
 * @param array|string $b
 * @return int Negative, zero or positive, as for strcmp()
 */
function wfArrayDiff2_cmp( $a, $b ) {
	if ( is_string( $a ) && is_string( $b ) ) {
		return strcmp( $a, $b );
	}

	// A lone scalar is handled as a one-element row, which matches what
	// count() used to report for it.
	$rowA = array_values( (array)$a );
	$rowB = array_values( (array)$b );

	$lengthA = count( $rowA );
	$lengthB = count( $rowB );
	if ( $lengthA !== $lengthB ) {
		return $lengthA < $lengthB ? -1 : 1;
	}

	foreach ( $rowA as $index => $valueA ) {
		$cmp = strcmp( $valueA, $rowB[$index] );
		if ( $cmp !== 0 ) {
			return $cmp;
		}
	}
	return 0;
}
141
/**
 * Array lookup
 *
 * Flips $a (value => key), keeps the entries whose original key appears
 * among the keys of $b, and flips the result back. Because of the double
 * array_flip(), the values of $a must be usable as array keys.
 *
 * @deprecated since 1.22; use array_intersect_key()
 * @param array $a Array to pick entries from
 * @param array $b Array whose keys select the entries
 * @return array
 */
function wfArrayLookup( $a, $b ) {
	wfDeprecated( __FUNCTION__, '1.22' );
	$keysByValue = array_flip( $a );
	$wantedKeys = array_keys( $b );
	$selected = array_intersect( $keysByValue, $wantedKeys );
	return array_flip( $selected );
}
156
/**
 * Record $value under $key in $changed when it is not identical (!==)
 * to $default[$key].
 *
 * @param string|int $key Key to look up in $default and to set in $changed
 * @param mixed $value Value to compare and possibly store
 * @param array $default Array holding the default values
 * @param array $changed Array to alter (passed by reference)
 * @throws MWException if $changed is null
 */
function wfAppendToArrayIfNotDefault( $key, $value, $default, &$changed ) {
	if ( $changed === null ) {
		throw new MWException( 'GlobalFunctions::wfAppendToArrayIfNotDefault got null' );
	}

	$differsFromDefault = ( $default[$key] !== $value );
	if ( $differsFromDefault ) {
		$changed[$key] = $value;
	}
}
174
/**
 * "Backwards" array plus: the arguments are combined with the + operator
 * starting from the last one, so for a key present in several arguments
 * the value from the later argument is kept.
 *
 * @deprecated since 1.22; use array_replace()
 * @param array $array1 First array
 * @param array [$array2, [...]] Further arrays
 * @return array
 */
function wfArrayMerge( $array1/* ... */ ) {
	wfDeprecated( __FUNCTION__, '1.22' );
	$arrays = func_get_args();
	$merged = array();
	// Walk the arguments from last to first
	for ( $i = count( $arrays ) - 1; $i >= 0; $i-- ) {
		$merged += $arrays[$i];
	}
	return $merged;
}
194
/**
 * Merge arrays in the style of getUserPermissionsErrors, with duplicate removal.
 *
 * Every error (itself an array of parameters) is keyed by its parameters
 * joined with a tab; an error seen again replaces the earlier copy but
 * keeps the position of its first occurrence.
 *
 * e.g.
 *     wfMergeErrorArrays(
 *         array( array( 'x' ) ),
 *         array( array( 'x', '2' ) ),
 *         array( array( 'x' ) ),
 *         array( array( 'y' ) )
 *     );
 * returns:
 *     array(
 *         array( 'x' ),
 *         array( 'x', '2' ),
 *         array( 'y' )
 *     )
 *
 * @param varargs Any number of arrays of errors
 * @return array List of unique errors
 */
function wfMergeErrorArrays( /*...*/ ) {
	$errorLists = func_get_args();
	$unique = array();
	foreach ( $errorLists as $errorList ) {
		foreach ( $errorList as $errorParams ) {
			# @todo FIXME: Sometimes get nested arrays for $params,
			# which leads to E_NOTICEs
			$unique[implode( "\t", $errorParams )] = $errorParams;
		}
	}
	return array_values( $unique );
}
226
/**
 * Insert an array into another array right after the element with the
 * given *KEY*. Keys are preserved; the pieces are joined with the +
 * operator, so a key already present earlier in the result wins.
 *
 * @param array $array The array.
 * @param array $insert The array to insert.
 * @param mixed $after The key to insert after
 * @return array
 */
function wfArrayInsertAfter( array $array, array $insert, $after ) {
	// Map every key to its numeric position, then split just behind $after
	$positionByKey = array_flip( array_keys( $array ) );
	$splitAt = $positionByKey[$after] + 1;

	$head = array_slice( $array, 0, $splitAt, true );
	$tail = array_slice( $array, $splitAt, count( $array ) - $splitAt + 1, true );

	return $head + $insert + $tail;
}
250
/**
 * Convert an object (via get_object_vars()) or an array into an array
 * with the same data, optionally descending into nested objects and arrays.
 *
 * @param object|array $objOrArray Value to convert
 * @param bool $recursive Whether nested objects/arrays are converted too
 * @return array
 */
function wfObjectToArray( $objOrArray, $recursive = true ) {
	$members = is_object( $objOrArray ) ? get_object_vars( $objOrArray ) : $objOrArray;

	$converted = array();
	foreach ( $members as $name => $member ) {
		$isNested = is_object( $member ) || is_array( $member );
		$converted[$name] = ( $recursive && $isNested )
			? wfObjectToArray( $member )
			: $member;
	}

	return $converted;
}
273
/**
 * Get a random decimal value between 0 and 1, formatted with twelve
 * decimal places, in a way not likely to give duplicate values for any
 * realistic number of articles.
 *
 * @return string
 */
function wfRandom() {
	# A single mt_rand() value is limited to mt_getrandmax(), so two draws
	# are combined to reduce the chance of dupes
	$range = mt_getrandmax() + 1;
	$high = mt_rand();
	$low = mt_rand();
	$fraction = ( $high * $range + $low ) / $range / $range;

	return number_format( $fraction, 12, '.', '' );
}
289
/**
 * Get a random string containing a number of pseudo-random hex
 * characters, generated seven characters at a time from mt_rand().
 * @note This is not secure, if you are trying to generate some sort
 *   of token please use MWCryptRand instead.
 *
 * @param int $length The length of the string to generate
 * @return string
 * @since 1.20
 */
function wfRandomString( $length = 32 ) {
	$hex = '';
	// Each round appends exactly seven hex digits (28 random bits)
	while ( strlen( $hex ) < $length ) {
		$hex .= sprintf( '%07x', mt_rand() & 0xfffffff );
	}
	return substr( $hex, 0, $length );
}
307
/**
 * urlencode() a string, then turn a few escapes back into literal
 * characters so that title URLs look prettier.
 *
 * According to RFC 1738, all of the following should be safe:
 *
 *     ;:@&=$-_.+!*'(),
 *
 * But + is not safe because it's used to indicate a space; &= are only safe in
 * paths and not in queries (and we don't distinguish here); ' seems kind of
 * scary; and urlencode() doesn't touch -_. to begin with. Plus, although /
 * is reserved, we don't care. So the list we unescape is:
 *
 *     ;:@$!*(),/
 *
 * However, IIS7 redirects fail when the url contains a colon (Bug 22709),
 * so the colon stays escaped when $_SERVER['SERVER_SOFTWARE'] contains
 * 'Microsoft-IIS/7'.
 *
 * The list of escapes is computed once and kept in a static variable;
 * passing null resets that cached list and returns an empty string.
 *
 * @param string|null $s String to encode, or null to reset the cache
 * @return string
 */
function wfUrlencode( $s ) {
	static $needle;

	if ( $s === null ) {
		$needle = null;
		return '';
	}

	if ( $needle === null ) {
		$needle = array( '%3B', '%40', '%24', '%21', '%2A', '%28', '%29', '%2C', '%2F' );
		$software = isset( $_SERVER['SERVER_SOFTWARE'] ) ? $_SERVER['SERVER_SOFTWARE'] : null;
		if ( $software === null || strpos( $software, 'Microsoft-IIS/7' ) === false ) {
			$needle[] = '%3A';
		}
	}

	// The literal list is one longer than the IIS7 needle list; the
	// surplus ':' entry is then simply unused.
	$literals = array( ';', '@', '$', '!', '*', '(', ')', ',', '/', ':' );

	return str_ireplace( $needle, $literals, urlencode( $s ) );
}
356
/**
 * Build a CGI-style string such as "days=7&limit=100" from one or two
 * arrays. Options in the first array override options in the second.
 * Options set to null or false are not output. Array values are written
 * with bracketed keys ("key[sub]=value"), nested arrays recursively.
 *
 * @param array $array1 Options ( String|Array values )
 * @param array|null $array2 Fallback options ( String|Array values )
 * @param string $prefix Key prefix; when non-empty each key is written
 *   as "$prefix[$key]" (used by the recursion)
 * @return string
 */
function wfArrayToCgi( $array1, $array2 = null, $prefix = '' ) {
	if ( $array2 !== null ) {
		$array1 = $array1 + $array2;
	}

	$cgi = '';
	foreach ( $array1 as $key => $value ) {
		if ( $value === null || $value === false ) {
			continue;
		}

		if ( $cgi != '' ) {
			$cgi .= '&';
		}
		if ( $prefix !== '' ) {
			$key = $prefix . "[$key]";
		}

		if ( !is_array( $value ) ) {
			if ( is_object( $value ) ) {
				$value = $value->__toString();
			}
			$cgi .= urlencode( $key ) . '=' . urlencode( $value );
			continue;
		}

		// One "key[k]=v" piece per element, nested arrays via recursion
		$pieces = array();
		foreach ( $value as $k => $v ) {
			$pieces[] = is_array( $v )
				? wfArrayToCgi( $v, null, $key . "[$k]" )
				: urlencode( $key . "[$k]" ) . '=' . urlencode( $v );
		}
		$cgi .= implode( '&', $pieces );
	}
	return $cgi;
}
402
/**
 * This is the logical opposite of wfArrayToCgi(): it accepts a query string as
 * its argument and returns the same string in array form. This allows compatibility
 * with legacy functions that accept raw query strings instead of nice
 * arrays. Of course, keys and values are urldecode()d.
 *
 * A leading '?' is dropped and empty pieces are skipped. A piece is split
 * at its first '=' only, so values may themselves contain '='. Keys with
 * bracket syntax ("a[b][c]=1") become nested arrays; several pieces for
 * the same top-level key are combined with array_merge().
 *
 * @param string $query query string
 * @return array Array version of input
 */
function wfCgiToArray( $query ) {
	if ( isset( $query[0] ) && $query[0] == '?' ) {
		$query = substr( $query, 1 );
	}
	$bits = explode( '&', $query );
	$ret = array();
	foreach ( $bits as $bit ) {
		if ( $bit === '' ) {
			continue;
		}
		if ( strpos( $bit, '=' ) === false ) {
			// Pieces like &qwerty become 'qwerty' => '' (at least this is what php does)
			$key = $bit;
			$value = '';
		} else {
			// Limit of 2: everything after the first '=' belongs to the value
			list( $key, $value ) = explode( '=', $bit, 2 );
		}
		$key = urldecode( $key );
		$value = urldecode( $value );
		if ( strpos( $key, '[' ) !== false ) {
			// Wrap the value from the innermost bracket outwards
			$keys = array_reverse( explode( '[', $key ) );
			$key = array_pop( $keys );
			$temp = $value;
			foreach ( $keys as $k ) {
				// Drop the closing ']'
				$k = substr( $k, 0, -1 );
				$temp = array( $k => $temp );
			}
			// Only merge into an existing array; an earlier scalar under the
			// same key is replaced, as array_merge() cannot take a scalar
			if ( isset( $ret[$key] ) && is_array( $ret[$key] ) ) {
				$ret[$key] = array_merge( $ret[$key], $temp );
			} else {
				$ret[$key] = $temp;
			}
		} else {
			$ret[$key] = $value;
		}
	}
	return $ret;
}
450
/**
 * Append a query string to an existing URL, which may or may not already
 * have query string parameters. The query is attached with '?' when the
 * URL contains no '?' yet and with '&' otherwise; an empty query leaves
 * the URL untouched.
 *
 * @param string $url
 * @param string|array $query String, or associative array that is
 *   converted with wfArrayToCgi()
 * @return string
 */
function wfAppendQuery( $url, $query ) {
	if ( is_array( $query ) ) {
		$query = wfArrayToCgi( $query );
	}
	if ( $query == '' ) {
		return $url;
	}

	$separator = ( strpos( $url, '?' ) === false ) ? '?' : '&';
	return $url . $separator . $query;
}
473
/**
 * Expand a potentially local URL to a fully-qualified URL. Assumes $wgServer
 * is correct.
 *
 * The meaning of the PROTO_* constants is as follows:
 * PROTO_HTTP: Output a URL starting with http://
 * PROTO_HTTPS: Output a URL starting with https://
 * PROTO_RELATIVE: Output a URL starting with // (protocol-relative URL)
 * PROTO_CURRENT: Output a URL starting with either http:// or https:// , depending
 *    on which protocol was used for the current incoming request
 * PROTO_CANONICAL: For URLs without a domain, like /w/index.php , use $wgCanonicalServer.
 *    For protocol-relative URLs, use the protocol of $wgCanonicalServer
 * PROTO_INTERNAL: Like PROTO_CANONICAL, but uses $wgInternalServer instead of
 *    $wgCanonicalServer ($wgServer when $wgInternalServer is false)
 *
 * Dot-segments in the path of the result are removed with wfRemoveDotSegments().
 *
 * @todo this won't work with current-path-relative URLs
 * like "subdir/foo.html", etc.
 *
 * @param string $url either fully-qualified or a local path + query
 * @param mixed $defaultProto one of the PROTO_* constants. Determines the
 *    protocol to use if $url or $wgServer is protocol-relative
 * @return string|bool Fully-qualified URL, current-path-relative URL or false if
 *    no valid URL can be constructed
 */
function wfExpandUrl( $url, $defaultProto = PROTO_CURRENT ) {
	global $wgServer, $wgCanonicalServer, $wgInternalServer, $wgRequest;

	// Choose the server that local paths are resolved against
	$baseServer = $wgServer;
	if ( $defaultProto === PROTO_CANONICAL ) {
		$baseServer = $wgCanonicalServer;
	} elseif ( $defaultProto === PROTO_INTERNAL && $wgInternalServer !== false ) {
		$baseServer = $wgInternalServer;
	} elseif ( $defaultProto === PROTO_CURRENT ) {
		$defaultProto = $wgRequest->getProtocol() . '://';
	}

	// Find out whether the chosen server carries its own protocol
	$serverBits = wfParseUrl( $baseServer );
	$serverHasProto = $serverBits && $serverBits['scheme'] != '';

	if ( $defaultProto === PROTO_CANONICAL || $defaultProto === PROTO_INTERNAL ) {
		// A canonical/internal server without a protocol really isn't
		// supposed to happen; fall back to HTTP in that case.
		$defaultProto = $serverHasProto ? $serverBits['scheme'] . '://' : PROTO_HTTP;
	}

	// Same protocol string minus its trailing two characters
	$protoPrefix = substr( $defaultProto, 0, -2 );

	if ( substr( $url, 0, 2 ) == '//' ) {
		$url = $protoPrefix . $url;
	} elseif ( substr( $url, 0, 1 ) == '/' ) {
		// Only a protocol-relative server needs the protocol prepended
		$serverPrefix = $serverHasProto ? '' : $protoPrefix;
		$url = $serverPrefix . $baseServer . $url;
	}

	$urlBits = wfParseUrl( $url );
	if ( !$urlBits ) {
		if ( substr( $url, 0, 1 ) != '/' ) {
			# URL is a relative path
			return wfRemoveDotSegments( $url );
		}
		# Expanded URL is not valid.
		return false;
	}

	if ( !isset( $urlBits['path'] ) ) {
		# No path to expand
		return $url;
	}

	$urlBits['path'] = wfRemoveDotSegments( $urlBits['path'] );
	return wfAssembleUrl( $urlBits );
}
551
/**
 * This function will reassemble a URL parsed with wfParseURL. This is useful
 * if you need to edit part of a URL and put it back together.
 *
 * This is the basic structure used (brackets contain keys for $urlParts):
 * [scheme][delimiter][user]:[pass]@[host]:[port][path]?[query]#[fragment]
 *
 * The scheme is only output together with a delimiter, and user, pass and
 * port are only output together with a host.
 *
 * @todo Need to integrate this into wfExpandUrl (bug 32168)
 *
 * @since 1.19
 * @param array $urlParts URL parts, as output from wfParseUrl
 * @return string URL assembled from its component parts
 */
function wfAssembleUrl( $urlParts ) {
	$pieces = array();

	if ( isset( $urlParts['delimiter'] ) ) {
		if ( isset( $urlParts['scheme'] ) ) {
			$pieces[] = $urlParts['scheme'];
		}
		$pieces[] = $urlParts['delimiter'];
	}

	if ( isset( $urlParts['host'] ) ) {
		if ( isset( $urlParts['user'] ) ) {
			$credentials = $urlParts['user'];
			if ( isset( $urlParts['pass'] ) ) {
				$credentials .= ':' . $urlParts['pass'];
			}
			$pieces[] = $credentials . '@';
		}

		$pieces[] = $urlParts['host'];

		if ( isset( $urlParts['port'] ) ) {
			$pieces[] = ':' . $urlParts['port'];
		}
	}

	if ( isset( $urlParts['path'] ) ) {
		$pieces[] = $urlParts['path'];
	}
	if ( isset( $urlParts['query'] ) ) {
		$pieces[] = '?' . $urlParts['query'];
	}
	if ( isset( $urlParts['fragment'] ) ) {
		$pieces[] = '#' . $urlParts['fragment'];
	}

	return implode( '', $pieces );
}
606
/**
 * Remove all dot-segments in the provided URL path. For example,
 * '/a/./b/../c/' becomes '/a/c/'. For details on the algorithm, please see
 * RFC3986 section 5.2.4.
 *
 * The path is consumed from left to right: on every round the text at the
 * current position is matched against the dot-segment patterns below, and
 * anything else is copied to the output one path segment at a time.
 *
 * @todo Need to integrate this into wfExpandUrl (bug 32168)
 *
 * @param string $urlPath URL path, potentially containing dot-segments
 * @return string URL path with all dot-segments removed
 */
function wfRemoveDotSegments( $urlPath ) {
	$output = '';
	$pos = 0;
	$length = strlen( $urlPath );

	while ( $pos < $length ) {
		$one = substr( $urlPath, $pos, 1 );
		$two = substr( $urlPath, $pos, 2 );
		$three = substr( $urlPath, $pos, 3 );
		$four = substr( $urlPath, $pos, 4 );
		// Number of input characters still unread
		$remaining = $length - $pos;
		$dropLastSegment = false;

		if ( $two === './' ) {
			# Step A, remove leading "./"
			$pos += 2;
		} elseif ( $three === '../' ) {
			# Step A, remove leading "../"
			$pos += 3;
		} elseif ( $two === '/.' && $remaining === 2 ) {
			# Step B, replace leading "/.$" with "/"
			$pos += 1;
			$urlPath[$pos] = '/';
		} elseif ( $three === '/./' ) {
			# Step B, replace leading "/./" with "/"
			$pos += 2;
		} elseif ( $three === '/..' && $remaining === 3 ) {
			# Step C, replace leading "/..$" with "/" and
			# remove last path component in output
			$pos += 2;
			$urlPath[$pos] = '/';
			$dropLastSegment = true;
		} elseif ( $four === '/../' ) {
			# Step C, replace leading "/../" with "/" and
			# remove last path component in output
			$pos += 3;
			$dropLastSegment = true;
		} elseif ( $one === '.' && $remaining === 1 ) {
			# Step D, remove "^.$"
			$pos += 1;
		} elseif ( $two === '..' && $remaining === 2 ) {
			# Step D, remove "^..$"
			$pos += 2;
		} else {
			# Step E, move leading path segment to output; a leading
			# slash belongs to the segment, so search behind it
			$searchFrom = ( $one === '/' ) ? $pos + 1 : $pos;
			$nextSlash = strpos( $urlPath, '/', $searchFrom );
			if ( $nextSlash === false ) {
				$output .= substr( $urlPath, $pos );
				$pos = $length;
			} else {
				$output .= substr( $urlPath, $pos, $nextSlash - $pos );
				$pos = $nextSlash;
			}
		}

		if ( $dropLastSegment ) {
			$lastSlash = strrpos( $output, '/' );
			$output = ( $lastSlash === false ) ? '' : substr( $output, 0, $lastSlash );
		}
	}

	return $output;
}
687
/**
 * Returns a regular expression of url protocols: the entries of
 * $wgUrlProtocols, each escaped with preg_quote() for the '/' delimiter
 * and joined with '|'. The result is cached in static variables,
 * separately for each value of $includeProtocolRelative.
 *
 * @param bool $includeProtocolRelative If false, remove '//' from the returned protocol list.
 *        DO NOT USE this directly, use wfUrlProtocolsWithoutProtRel() instead
 * @return string
 */
function wfUrlProtocols( $includeProtocolRelative = true ) {
	global $wgUrlProtocols;

	static $withProtRel = null, $withoutProtRel = null;

	$cached = $includeProtocolRelative ? $withProtRel : $withoutProtRel;
	if ( $cached !== null ) {
		return $cached;
	}

	if ( !is_array( $wgUrlProtocols ) ) {
		// Old-style $wgUrlProtocols string, supported for backwards
		// compatibility with LocalSettings files from 1.5. It is returned
		// as is, ignoring $includeProtocolRelative: '//' cannot appear in a
		// pre-1.6 config because protocol-relative URLs weren't supported
		// until 1.18
		$regex = $wgUrlProtocols;
	} else {
		$quoted = array();
		foreach ( $wgUrlProtocols as $protocol ) {
			// Leave out '//' unless protocol-relative URLs are wanted
			if ( !$includeProtocolRelative && $protocol === '//' ) {
				continue;
			}
			$quoted[] = preg_quote( $protocol, '/' );
		}
		$regex = implode( '|', $quoted );
	}

	// Remember the result for the next call
	if ( $includeProtocolRelative ) {
		$withProtRel = $regex;
	} else {
		$withoutProtRel = $regex;
	}
	return $regex;
}
733
/**
 * Like wfUrlProtocols(), but excludes '//' from the protocol list. Use this if
 * you need a regex that matches all URL protocols but does not match protocol-
 * relative URLs
 *
 * @return string Result of wfUrlProtocols( false )
 */
function wfUrlProtocolsWithoutProtRel() {
	$includeProtocolRelative = false;
	return wfUrlProtocols( $includeProtocolRelative );
}
743
/**
 * parse_url() work-alike, but non-broken. Differences:
 *
 * 1) Does not raise warnings on bad URLs (just returns false).
 * 2) Handles protocols that don't use :// (e.g., mailto: and news:, as well as
 *    protocol-relative URLs) correctly.
 * 3) Adds a "delimiter" element to the array, either '://', ':' or '//' (see (2)).
 *
 * Further differences visible below: the scheme is lower-cased, only
 * schemes listed in $wgUrlProtocols are accepted, a 'host' element is
 * always present (possibly empty), and protocol-relative URLs come back
 * with an empty scheme.
 *
 * @param string $url a URL to parse
 * @return array|bool Bits of the URL in an associative array, per PHP docs,
 *   or false if the URL cannot be parsed or its scheme is not allowed
 */
function wfParseUrl( $url ) {
	global $wgUrlProtocols; // Allow all protocols defined in DefaultSettings/LocalSettings.php

	// Protocol-relative URLs are handled really badly by parse_url(). It's so
	// bad that the easiest way to handle them is to just prepend 'http:' and
	// strip the protocol out later.
	$wasRelative = substr( $url, 0, 2 ) == '//';
	if ( $wasRelative ) {
		$url = "http:$url";
	}

	wfSuppressWarnings();
	$parts = parse_url( $url );
	wfRestoreWarnings();

	// parse_url() returns an array without scheme for some invalid URLs, e.g.
	// parse_url("%0Ahttp://example.com") == array( 'host' => '%0Ahttp', 'path' => 'example.com' )
	if ( !$parts || !isset( $parts['scheme'] ) ) {
		return false;
	}

	// parse_url() incorrectly handles schemes case-sensitively. Convert it to lowercase.
	$scheme = strtolower( $parts['scheme'] );
	$parts['scheme'] = $scheme;

	// most of the protocols are followed by ://, but mailto: and sometimes news: not, check for it
	if ( in_array( $scheme . '://', $wgUrlProtocols ) ) {
		$parts['delimiter'] = '://';
	} elseif ( in_array( $scheme . ':', $wgUrlProtocols ) ) {
		$parts['delimiter'] = ':';
		// parse_url detects for news: and mailto: the host part of an url as path
		// We have to correct this wrong detection
		if ( isset( $parts['path'] ) ) {
			$parts['host'] = $parts['path'];
			$parts['path'] = '';
		}
	} else {
		return false;
	}

	/* Provide an empty host for eg. file:/// urls (see bug 28627) */
	if ( !isset( $parts['host'] ) ) {
		$parts['host'] = '';

		// bug 45069
		if ( !isset( $parts['path'] ) ) {
			$parts['path'] = '';
		} elseif ( substr( $parts['path'], 0, 1 ) !== '/' ) {
			/* parse_url loses the third / for file:///c:/ urls (but not on variants) */
			$parts['path'] = '/' . $parts['path'];
		}
	}

	// If the URL was protocol-relative, fix scheme and delimiter
	if ( $wasRelative ) {
		$parts['scheme'] = '';
		$parts['delimiter'] = '//';
	}

	return $parts;
}
814
/**
 * Take a URL, make sure it's expanded to fully qualified, and replace any
 * encoded non-ASCII Unicode characters with their UTF-8 original forms
 * for more compact display and legibility for local audiences.
 *
 * Only runs of percent-escapes whose first hex digit is 8 or higher are
 * decoded; other escapes are left alone.
 *
 * @todo handle punycode domains too
 *
 * @param string $url
 * @return string
 */
function wfExpandIRI( $url ) {
	$expanded = wfExpandUrl( $url );
	$escapedRuns = '/((?:%[89A-F][0-9A-F])+)/i';

	return preg_replace_callback( $escapedRuns, 'wfExpandIRI_callback', $expanded );
}
832
/**
 * Private callback for wfExpandIRI: urldecode() the first capture group.
 *
 * @param array $matches Match array as passed by preg_replace_callback()
 * @return string
 */
function wfExpandIRI_callback( $matches ) {
	$escapedRun = $matches[1];
	return urldecode( $escapedRun );
}
841
/**
 * Make URL indexes, appropriate for the el_index field of externallinks.
 *
 * The index is the URL with the labels of its host name reversed and
 * lower-cased (for mailto: only the domain part is reversed), without
 * user and password. A protocol-relative URL yields two indexes, one for
 * http: and one for https:.
 *
 * @param string $url
 * @return array List of index strings; empty if wfParseUrl() cannot parse $url
 */
function wfMakeUrlIndexes( $url ) {
	$bits = wfParseUrl( $url );
	if ( !$bits ) {
		// wfParseUrl() returns false for URLs it rejects; indexing false
		// would only produce meaningless entries
		return array();
	}

	// Reverse the labels in the hostname, convert to lower case
	// For emails reverse domainpart only
	if ( $bits['scheme'] == 'mailto' ) {
		$mailparts = explode( '@', $bits['host'], 2 );
		if ( count( $mailparts ) === 2 ) {
			$domainpart = strtolower( implode( '.', array_reverse( explode( '.', $mailparts[1] ) ) ) );
		} else {
			// No domain specified, don't mangle it
			$domainpart = '';
		}
		$reversedHost = $domainpart . '@' . $mailparts[0];
	} else {
		$reversedHost = strtolower( implode( '.', array_reverse( explode( '.', $bits['host'] ) ) ) );
	}
	// Add an extra dot to the end
	// Why? Is it in wrong place in mailto links?
	if ( substr( $reversedHost, -1, 1 ) !== '.' ) {
		$reversedHost .= '.';
	}
	// Reconstruct the pseudo-URL
	$prot = $bits['scheme'];
	$index = $prot . $bits['delimiter'] . $reversedHost;
	// Leave out user and password. Add the port, path, query and fragment
	if ( isset( $bits['port'] ) ) {
		$index .= ':' . $bits['port'];
	}
	if ( isset( $bits['path'] ) ) {
		$index .= $bits['path'];
	} else {
		$index .= '/';
	}
	if ( isset( $bits['query'] ) ) {
		$index .= '?' . $bits['query'];
	}
	if ( isset( $bits['fragment'] ) ) {
		$index .= '#' . $bits['fragment'];
	}

	// An empty scheme means the URL was protocol-relative
	if ( $prot == '' ) {
		return array( "http:$index", "https:$index" );
	} else {
		return array( $index );
	}
}
895
/**
 * Check whether a given URL has a domain that occurs in a given set of domains.
 * Both host and domain are prefixed with a dot before the suffix
 * comparison, so a domain only matches on a label boundary.
 *
 * @param string $url URL
 * @param array $domains Array of domains (strings)
 * @return bool True if the host part of $url ends in one of the strings in $domains
 */
function wfMatchesDomainList( $url, $domains ) {
	$bits = wfParseUrl( $url );
	if ( !is_array( $bits ) || !isset( $bits['host'] ) ) {
		return false;
	}

	$dottedHost = '.' . $bits['host'];
	foreach ( (array)$domains as $domain ) {
		$suffix = '.' . $domain;
		if ( substr( $dottedHost, -strlen( $suffix ) ) === $suffix ) {
			return true;
		}
	}
	return false;
}
915
/**
 * Sends a line to the debug log if enabled and, optionally, to MWDebug.
 *
 * Globals read here:
 *   $wgDebugLogFile   - the log file; nothing is written when it is empty
 *   $wgProfileOnly    - if set, the message is not written to the log file
 *   $wgDebugRawPage   - if false, nothing is done for requests for which
 *                       wfIsDebugRawPage() returns true
 *   $wgDebugLogPrefix - prepended to every line written to the log file
 *
 * @param string $text
 * @param string|bool $dest Destination of the message:
 *     - 'all': both to the log and to MWDebug::debugMsg()
 *     - 'log': only to the log
 *   For backward compatibility, it can also take a boolean:
 *     - true: same as 'all'
 *     - false: same as 'log'
 */
function wfDebug( $text, $dest = 'all' ) {
	global $wgDebugLogFile, $wgProfileOnly, $wgDebugRawPage, $wgDebugLogPrefix;

	if ( !$wgDebugRawPage && wfIsDebugRawPage() ) {
		return;
	}

	// Turn $dest into a string if it's a boolean (for b/c)
	if ( is_bool( $dest ) ) {
		$dest = $dest ? 'all' : 'log';
	}

	// Put the timer prefix in front of the first non-newline character
	$timer = wfDebugTimer();
	if ( $timer !== '' ) {
		$text = preg_replace( '/[^\n]/', $timer . '\0', $text, 1 );
	}

	if ( $dest === 'all' ) {
		MWDebug::debugMsg( $text );
	}

	if ( $wgDebugLogFile == '' || $wgProfileOnly ) {
		return;
	}

	# Strip unprintables; they can switch terminal modes when binary data
	# gets dumped, which is pretty annoying.
	$printable = preg_replace( '![\x00-\x08\x0b\x0c\x0e-\x1f]!', ' ', $text );
	wfErrorLog( $wgDebugLogPrefix . $printable, $wgDebugLogFile );
}
965
/**
 * Returns true if debug logging should be suppressed if $wgDebugRawPage = false.
 * That is the case for 'action=raw' requests and when the script name
 * ends in 'load.php'. The answer is computed once and then cached.
 *
 * @return bool
 */
function wfIsDebugRawPage() {
	static $cache;

	if ( $cache === null ) {
		# Check for raw action using $_GET not $wgRequest, since the latter might not be initialised yet
		$isRawAction = isset( $_GET['action'] ) && $_GET['action'] == 'raw';
		$isLoadScript = isset( $_SERVER['SCRIPT_NAME'] )
			&& substr( $_SERVER['SCRIPT_NAME'], -8 ) == 'load.php';
		$cache = $isRawAction || $isLoadScript;
	}

	return $cache;
}
988
/**
 * Get the prefix for debug log lines: the seconds elapsed since
 * $wgRequestTime and the memory usage in megabytes, each followed by a
 * space. Empty when $wgDebugTimestamps is off.
 *
 * @return string
 */
function wfDebugTimer() {
	global $wgDebugTimestamps, $wgRequestTime;

	if ( !$wgDebugTimestamps ) {
		return '';
	}

	$elapsed = microtime( true ) - $wgRequestTime;
	$megabytes = memory_get_usage( true ) / ( 1024 * 1024 );

	return sprintf( "%6.4f", $elapsed ) . ' ' . sprintf( "%5.1fM", $megabytes ) . ' ';
}
1005
/**
 * Send a line giving PHP memory usage to wfDebug().
 *
 * @param bool $exact Print the exact number of bytes instead of whole
 *   kilobytes (default: false)
 */
function wfDebugMem( $exact = false ) {
	$bytes = memory_get_usage();
	$mem = $exact
		? $bytes . ' bytes'
		: floor( $bytes / 1024 ) . ' kilobytes';

	wfDebug( "Memory usage: $mem\n" );
}
1020
/**
 * Send a line to a supplementary debug log file, if configured, or main debug log if not.
 * To configure a supplementary log file, set $wgDebugLogGroups[$logGroup] to a string
 * filename or an associative array mapping 'destination' to the desired filename. The
 * associative array may also contain a 'sample' key with an integer value, specifying
 * a sampling factor: the line is then only written when mt_rand( 1, sample ) yields 1.
 *
 * Lines written to a supplementary log are prefixed with the timestamp,
 * host name and wiki ID.
 *
 * @since 1.23 support for sampling log messages via $wgDebugLogGroups.
 *
 * @param string $logGroup
 * @param string $text
 * @param string|bool $dest Destination of the message:
 *     - 'all': both to the log and to MWDebug::debugMsg()
 *     - 'log': only to the log
 *     - 'private': only to the specific log if set in $wgDebugLogGroups and
 *       discarded otherwise
 *   For backward compatibility, it can also take a boolean:
 *     - true: same as 'all'
 *     - false: same as 'private'
 */
function wfDebugLog( $logGroup, $text, $dest = 'all' ) {
	global $wgDebugLogGroups;

	$text = trim( $text ) . "\n";

	// Turn $dest into a string if it's a boolean (for b/c)
	if ( is_bool( $dest ) ) {
		$dest = $dest ? 'all' : 'private';
	}

	// No supplementary log for this group: use the main debug log,
	// unless the message is private
	if ( !isset( $wgDebugLogGroups[$logGroup] ) ) {
		if ( $dest !== 'private' ) {
			wfDebug( "[$logGroup] $text", $dest );
		}
		return;
	}

	if ( $dest === 'all' ) {
		MWDebug::debugMsg( "[$logGroup] $text" );
	}

	$logConfig = $wgDebugLogGroups[$logGroup];
	if ( !is_array( $logConfig ) ) {
		$destination = strval( $logConfig );
	} else {
		// Sampling: drop the line unless the draw comes up as 1
		if ( isset( $logConfig['sample'] ) && mt_rand( 1, $logConfig['sample'] ) !== 1 ) {
			return;
		}
		$destination = $logConfig['destination'];
	}

	$time = wfTimestamp( TS_DB );
	$wiki = wfWikiID();
	$host = wfHostname();
	wfErrorLog( "$time $host $wiki: $text", $destination );
}
1081
/**
 * Log a database error to the file named by $wgDBerrorLog.
 *
 * Nothing happens when $wgDBerrorLog is falsy. Otherwise the message is
 * prefixed with a date, the host name and the wiki ID (tab separated) and
 * handed to wfErrorLog(). If $wgDBerrorLogTZ is set, the date is expressed
 * in that time zone; the DateTimeZone object is created once and kept in a
 * static variable.
 *
 * @param string $text database error message.
 */
function wfLogDBError( $text ) {
	global $wgDBerrorLog, $wgDBerrorLogTZ;
	static $timeZone = null;

	if ( !$wgDBerrorLog ) {
		return;
	}

	$host = wfHostname();
	$wiki = wfWikiID();

	if ( $wgDBerrorLogTZ && !$timeZone ) {
		$timeZone = new DateTimeZone( $wgDBerrorLogTZ );
	}

	// Workaround for https://bugs.php.net/bug.php?id=52063
	// Can be removed when min PHP > 5.3.2
	$now = $timeZone === null
		? date_create( "now" )
		: date_create( "now", $timeZone );

	$stamp = $now->format( 'D M j G:i:s T Y' );
	wfErrorLog( "$stamp\t$host\t$wiki\t$text", $wgDBerrorLog );
}
1113
/**
 * Throws a warning that $function is deprecated.
 *
 * Thin wrapper that forwards to MWDebug::deprecated() with the caller
 * offset increased by one (presumably to skip this wrapper's own stack
 * frame). Nothing is returned.
 *
 * @param string $function Name of the deprecated function
 * @param string|bool $version Version of MediaWiki that the function
 *   was deprecated in (Added in 1.19).
 * @param string|bool $component Added in 1.19.
 * @param int $callerOffset How far up the call stack is the original
 *   caller. 2 = function that called the function that called
 *   wfDeprecated (Added in 1.20)
 */
function wfDeprecated( $function, $version = false, $component = false, $callerOffset = 2 ) {
	$forwardedOffset = $callerOffset + 1;
	MWDebug::deprecated( $function, $version, $component, $forwardedOffset );
}
1130
/**
 * Send a warning either to the debug log or in a PHP error depending on
 * $wgDevelopmentWarnings. To log warnings in production, use wfLogWarning()
 * instead.
 *
 * Forwards to MWDebug::warning() in 'auto' mode with the caller offset
 * increased by one.
 *
 * @param string $msg message to send
 * @param int $callerOffset number of items to go back in the backtrace to
 *   find the correct caller (1 = function calling wfWarn, ...)
 * @param int $level PHP error level; defaults to E_USER_NOTICE;
 *   only used when $wgDevelopmentWarnings is true
 */
function wfWarn( $msg, $callerOffset = 1, $level = E_USER_NOTICE ) {
	$forwardedOffset = $callerOffset + 1;
	MWDebug::warning( $msg, $forwardedOffset, $level, 'auto' );
}
1144
/**
 * Send a warning as a PHP error and the debug log. This is intended for
 * logging warnings in production. For logging development warnings, use
 * wfWarn() instead.
 *
 * Forwards to MWDebug::warning() in 'production' mode with the caller
 * offset increased by one.
 *
 * @param string $msg message to send
 * @param int $callerOffset number of items to go back in the backtrace to
 *   find the correct caller (1 = function calling wfLogWarning, ...)
 * @param int $level PHP error level; defaults to E_USER_WARNING
 */
function wfLogWarning( $msg, $callerOffset = 1, $level = E_USER_WARNING ) {
	$forwardedOffset = $callerOffset + 1;
	MWDebug::warning( $msg, $forwardedOffset, $level, 'production' );
}
1157
/**
 * Log to a file without getting "file size exceeded" signals.
 *
 * Destinations starting with "udp:" are sent as a single UDP datagram
 * instead, using the syntax udp://host:port/prefix (the host may be a
 * bracketed IPv6 address). When a prefix is given, every line of the text
 * is prefixed by it and a space. Although the parsing patterns also mention
 * "tcp", only destinations beginning with "udp:" reach the socket code.
 *
 * For ordinary files the text is appended only if the file does not exist
 * yet or the resulting size stays below 0x7fffffff bytes; warnings from the
 * file functions are suppressed.
 *
 * @param string $text Text to log
 * @param string $file filename, or UDP specification
 * @throws MWException If a "udp:" destination cannot be parsed
 */
function wfErrorLog( $text, $file ) {
	if ( substr( $file, 0, 4 ) != 'udp:' ) {
		// Plain file destination
		wfSuppressWarnings();
		$exists = file_exists( $file );
		$size = $exists ? filesize( $file ) : false;
		if ( !$exists || ( $size !== false && $size + strlen( $text ) < 0x7fffffff ) ) {
			file_put_contents( $file, $text, FILE_APPEND );
		}
		wfRestoreWarnings();
		return;
	}

	# Needs the sockets extension
	$bracketedV6 = '!^(tcp|udp):(?://)?\[([0-9a-fA-F:]+)\]:(\d+)(?:/(.*))?$!';
	$nameOrV4 = '!^(tcp|udp):(?://)?([a-zA-Z0-9.-]+):(\d+)(?:/(.*))?$!';
	$parts = array();
	if ( preg_match( $bracketedV6, $file, $parts ) ) {
		// IPv6 bracketed host
		$domain = AF_INET6;
		$host = $parts[2];
	} elseif ( preg_match( $nameOrV4, $file, $parts ) ) {
		$domain = AF_INET;
		$host = $parts[2];
		if ( !IP::isIPv4( $host ) ) {
			$host = gethostbyname( $host );
		}
	} else {
		throw new MWException( __METHOD__ . ': Invalid UDP specification' );
	}
	$port = intval( $parts[3] );
	$prefix = isset( $parts[4] ) ? $parts[4] : false;

	if ( strval( $prefix ) === '' ) {
		// No prefix: just cap the payload
		if ( strlen( $text ) > 65507 ) {
			$text = substr( $text, 0, 65507 );
		}
	} else {
		// Clean it up for the multiplexer
		$text = preg_replace( '/^/m', $prefix . ' ', $text );

		// Limit to 64KB, leaving one byte for the newline added below
		if ( strlen( $text ) > 65506 ) {
			$text = substr( $text, 0, 65506 );
		}

		if ( substr( $text, -1 ) != "\n" ) {
			$text .= "\n";
		}
	}

	$sock = socket_create( $domain, SOCK_DGRAM, SOL_UDP );
	if ( !$sock ) {
		return;
	}

	socket_sendto( $sock, $text, strlen( $text ), 0, $host, $port );
	socket_close( $sock );
}
1222
/**
 * Flush the statistics counters and, if profiling is active, log the
 * profiling data of the current request.
 *
 * Steps, in order:
 *  - StatCounter is flushed unconditionally.
 *  - Nothing more happens if the profiler is a stub, or if the request took
 *    no longer than $wgProfileLimit seconds.
 *  - The profiler's own logData() is invoked.
 *  - Unless $wgDebugLogFile is empty, or this is a raw page and
 *    $wgDebugRawPage is off, a summary line (UTC timestamp, elapsed seconds,
 *    request URL plus proxy/anon information) followed by the profiler
 *    output is written to $wgDebugLogFile.
 */
function wfLogProfilingData() {
	global $wgRequestTime, $wgDebugLogFile, $wgDebugRawPage, $wgRequest;
	global $wgProfileLimit, $wgUser;

	StatCounter::singleton()->flush();

	$profiler = Profiler::instance();

	# Profiling must actually be enabled...
	if ( $profiler->isStub() ) {
		return;
	}

	// Only report requests that took longer than $wgProfileLimit
	$elapsed = microtime( true ) - $wgRequestTime;
	if ( $elapsed <= $wgProfileLimit ) {
		return;
	}

	$profiler->logData();

	// Check whether this should be logged in the debug file.
	if ( $wgDebugLogFile == '' ) {
		return;
	}
	if ( !$wgDebugRawPage && wfIsDebugRawPage() ) {
		return;
	}

	// Collect whichever forwarding-related request headers are present
	$headerLabels = array(
		'HTTP_X_FORWARDED_FOR' => ' forwarded for ',
		'HTTP_CLIENT_IP' => ' client IP ',
		'HTTP_FROM' => ' from ',
	);
	$forward = '';
	foreach ( $headerLabels as $header => $label ) {
		if ( !empty( $_SERVER[$header] ) ) {
			$forward .= $label . $_SERVER[$header];
		}
	}
	if ( $forward ) {
		$forward = "\t(proxied via {$_SERVER['REMOTE_ADDR']}{$forward})";
	}

	// Don't load $wgUser at this late stage just for statistics purposes
	// @todo FIXME: We can detect some anons even if it is not loaded. See User::getId()
	if ( $wgUser->isItemLoaded( 'id' ) && $wgUser->isAnon() ) {
		$forward .= ' anon';
	}

	// Command line script uses a FauxRequest object which does not have
	// any knowledge about an URL and throw an exception instead.
	try {
		$requestUrl = $wgRequest->getRequestURL();
	} catch ( MWException $e ) {
		$requestUrl = 'n/a';
	}

	$summary = sprintf(
		"%s\t%04.3f\t%s\n",
		gmdate( 'YmdHis' ),
		$elapsed,
		urldecode( $requestUrl . $forward )
	);

	wfErrorLog( $summary . $profiler->getOutput(), $wgDebugLogFile );
}
1286
/**
 * Increment a statistics counter through the StatCounter singleton.
 *
 * @param string $key Name of the counter
 * @param int $count Amount to add (default: 1)
 * @return void
 */
function wfIncrStats( $key, $count = 1 ) {
	$counter = StatCounter::singleton();
	$counter->incr( $key, $count );
}
1297
/**
 * Check whether the wiki is in read-only mode, i.e. whether
 * wfReadOnlyReason() returns anything other than false.
 *
 * @return bool
 */
function wfReadOnly() {
	$reason = wfReadOnlyReason();
	return $reason !== false;
}
1306
/**
 * Get the value of $wgReadOnly or the contents of $wgReadOnlyFile.
 *
 * When $wgReadOnly is null it is initialised here: to the contents of
 * $wgReadOnlyFile if that is a non-empty regular file, to false otherwise.
 * The global keeps that value, so later calls skip the file check.
 *
 * @return string|bool String when in read-only mode; false otherwise
 */
function wfReadOnlyReason() {
	global $wgReadOnly, $wgReadOnlyFile;

	if ( $wgReadOnly !== null ) {
		return $wgReadOnly;
	}

	// Set $wgReadOnly for faster access next time
	$hasReasonFile = is_file( $wgReadOnlyFile ) && filesize( $wgReadOnlyFile ) > 0;
	$wgReadOnly = $hasReasonFile ? file_get_contents( $wgReadOnlyFile ) : false;

	return $wgReadOnly;
}
1326
/**
 * Return a Language object from $langcode
 *
 * @param mixed $langcode Either:
 *   - an object (a Language object or a stub for one), which is returned
 *     unchanged
 *   - true, or the value of $wgLanguageCode: the content language object
 *     $wgContLang is returned
 *   - false, or the code of $wgLang: the user language object $wgLang is
 *     returned (false is the fallback for the old parameter functionality)
 *   - any other code listed by Language::fetchLanguageNames(): a language
 *     object for that code is created with Language::factory()
 *   - anything else: a debug line is logged and the content language
 *     object is returned
 * @return Language object
 */
function wfGetLangObj( $langcode = false ) {
	# Identify which language to get or create a language object for.
	# Using is_object here due to Stub objects.
	if ( is_object( $langcode ) ) {
		# Great, we already have the object (hopefully)!
		return $langcode;
	}

	global $wgContLang, $wgLanguageCode;
	if ( $langcode === true || $langcode === $wgLanguageCode ) {
		# $langcode is the language code of the wikis content language object.
		# or it is a boolean and value is true
		return $wgContLang;
	}

	global $wgLang;
	if ( $langcode === false || $langcode === $wgLang->getCode() ) {
		# $langcode is the language code of user language object.
		# or it was a boolean and value is false
		return $wgLang;
	}

	# Strict comparison: with loose comparison a non-string value such as
	# the integer 0 compares equal to any non-numeric code on older PHP
	# versions and would wrongly be treated as a valid language code.
	$validCodes = array_keys( Language::fetchLanguageNames() );
	if ( in_array( $langcode, $validCodes, true ) ) {
		# $langcode corresponds to a valid language.
		return Language::factory( $langcode );
	}

	# $langcode is not a valid language code; use content language.
	wfDebug( "Invalid language code passed to wfGetLangObj, falling back to content language.\n" );
	return $wgContLang;
}
1374
/**
 * This is the function for getting translated interface messages.
 *
 * @see Message class for documentation how to use them.
 * @see https://www.mediawiki.org/wiki/Manual:Messages_API
 *
 * This function replaces all old wfMsg* functions.
 *
 * Message parameters may be passed either one per argument after the key,
 * or as a single array in the second argument.
 *
 * @param string $key Message key.
 * Varargs: normal message parameters.
 * @return Message
 * @since 1.17
 */
function wfMessage( $key /*...*/) {
	// Everything after the key is a message parameter
	$params = array_slice( func_get_args(), 1 );
	if ( isset( $params[0] ) && is_array( $params[0] ) ) {
		$params = $params[0];
	}
	return new Message( $key, $params );
}
1396
/**
 * This function accepts multiple message keys and returns a message instance
 * for the first message which is non-empty. If all messages are empty then an
 * instance of the first message key is returned.
 *
 * All arguments are passed on unchanged to Message::newFallbackSequence().
 *
 * @param varargs: message keys
 * @return Message
 * @since 1.18
 */
function wfMessageFallback( /*...*/ ) {
	$keys = func_get_args();
	return call_user_func_array( array( 'Message', 'newFallbackSequence' ), $keys );
}
1409
/**
 * Get a message from anywhere, for the current user language.
 *
 * Use wfMsgForContent() instead if the message should NOT
 * change depending on the user preferences.
 *
 * @deprecated since 1.18
 *
 * @param string $key lookup key for the message, usually
 *   defined in languages/Language.php
 *
 * Parameters to the message, which can be used to insert variable text into
 * it, can be passed to this function in the following formats:
 * - One per argument, starting at the second parameter
 * - As an array in the second parameter
 * These are not shown in the function definition.
 *
 * @return string
 */
function wfMsg( $key ) {
	wfDeprecated( __METHOD__, '1.21' );

	// Everything after the key is a message parameter
	$params = array_slice( func_get_args(), 1 );
	return wfMsgReal( $key, $params );
}
1436
/**
 * Like wfMsg(), except that the message is not transformed: wfMsgReal() is
 * called with $transform set to false.
 *
 * @deprecated since 1.18
 *
 * @param string $key Message key; further arguments are message parameters
 * @return string
 */
function wfMsgNoTrans( $key ) {
	wfDeprecated( __METHOD__, '1.21' );

	$params = array_slice( func_get_args(), 1 );
	return wfMsgReal( $key, $params, true, false, false );
}
1452
/**
 * Get a message from anywhere, for the current global language
 * set with $wgLanguageCode.
 *
 * Use this if the message should NOT change dependent on the
 * language set in the user's preferences. This is the case for
 * most text written into logs, as well as link targets (such as
 * the name of the copyright policy page). Link titles, on the
 * other hand, should be shown in the UI language.
 *
 * Note that MediaWiki allows users to change the user interface
 * language in their preferences, but a single installation
 * typically only contains content in one language.
 *
 * Be wary of this distinction: If you use wfMsg() where you should
 * use wfMsgForContent(), a user of the software may have to
 * customize potentially hundreds of messages in
 * order to, e.g., fix a link in every possible language.
 *
 * Keys listed in $wgForceUIMsgAsContentMsg are fetched in the user
 * language instead.
 *
 * @deprecated since 1.18
 *
 * @param string $key lookup key for the message, usually
 *   defined in languages/Language.php
 * @return string
 */
function wfMsgForContent( $key ) {
	wfDeprecated( __METHOD__, '1.21' );

	global $wgForceUIMsgAsContentMsg;
	$params = array_slice( func_get_args(), 1 );
	$forceUserLang = is_array( $wgForceUIMsgAsContentMsg )
		&& in_array( $key, $wgForceUIMsgAsContentMsg );
	return wfMsgReal( $key, $params, true, !$forceUserLang );
}
1492
/**
 * Like wfMsgForContent(), except that the message is not transformed:
 * wfMsgReal() is called with $transform set to false.
 *
 * Keys listed in $wgForceUIMsgAsContentMsg are fetched in the user
 * language instead of the content language.
 *
 * @deprecated since 1.18
 *
 * @param string $key Message key; further arguments are message parameters
 * @return string
 */
function wfMsgForContentNoTrans( $key ) {
	wfDeprecated( __METHOD__, '1.21' );

	global $wgForceUIMsgAsContentMsg;
	$params = array_slice( func_get_args(), 1 );
	$forceUserLang = is_array( $wgForceUIMsgAsContentMsg )
		&& in_array( $key, $wgForceUIMsgAsContentMsg );
	return wfMsgReal( $key, $params, true, !$forceUserLang, false );
}
1515
/**
 * Really get a message: fetch it with wfMsgGetKey() and substitute the
 * parameters with wfMsgReplaceArgs(). The work is wrapped in a profiling
 * section.
 *
 * @deprecated since 1.18
 *
 * @param string $key key to get.
 * @param array $args Message parameters
 * @param bool $useDB Passed through to wfMsgGetKey()
 * @param mixed $forContent Language code, or false for user lang, true for content lang.
 * @param bool $transform Whether or not to transform the message.
 * @return string the requested message.
 */
function wfMsgReal( $key, $args, $useDB = true, $forContent = false, $transform = true ) {
	wfDeprecated( __METHOD__, '1.21' );

	wfProfileIn( __METHOD__ );
	$text = wfMsgReplaceArgs(
		wfMsgGetKey( $key, $useDB, $forContent, $transform ),
		$args
	);
	wfProfileOut( __METHOD__ );
	return $text;
}
1537
/**
 * Fetch a message string value, but don't replace any keys yet.
 *
 * The 'NormalizeMessageKey' hook is run first and may modify all four
 * arguments. If the message cache has no entry for the key, the
 * HTML-escaped key wrapped in &lt; and &gt; is returned instead.
 *
 * @deprecated since 1.18
 *
 * @param string $key Message key
 * @param bool $useDB Passed through to MessageCache::get()
 * @param string|bool $langCode Code of the language to get the message for, or
 *   behaves as a content language switch if it is a boolean.
 * @param bool $transform whether to parse magic words, etc.
 * @return string
 */
function wfMsgGetKey( $key, $useDB = true, $langCode = false, $transform = true ) {
	wfDeprecated( __METHOD__, '1.21' );

	wfRunHooks( 'NormalizeMessageKey', array( &$key, &$useDB, &$langCode, &$transform ) );

	$messageCache = MessageCache::singleton();
	$text = $messageCache->get( $key, $useDB, $langCode );
	if ( $text === false ) {
		// Unknown message: return a visible placeholder
		return '&lt;' . htmlspecialchars( $key ) . '&gt;';
	}

	return $transform ? $messageCache->transform( $text ) : $text;
}
1564
/**
 * Replace message parameter keys on the given formatted output.
 *
 * Carriage returns are stripped from the message first. Then each entry of
 * $args replaces the placeholder "$<index + 1>", i.e. the entry at index 0
 * replaces "$1". If the first entry of $args is itself an array, its values
 * are used as the parameter list instead.
 *
 * A non-array or empty $args leaves the placeholders untouched.
 *
 * @param string $message Message text containing $1, $2, ... placeholders
 * @param array $args Replacement values
 * @return string
 * @private
 */
function wfMsgReplaceArgs( $message, $args ) {
	# Fix windows line-endings
	# Some messages are split with explode("\n", $msg)
	$message = str_replace( "\r", '', $message );

	// Nothing to substitute. Checking is_array() rather than calling count()
	// avoids the warning / TypeError newer PHP versions raise for count() on
	// a non-countable value such as null.
	if ( !is_array( $args ) || !$args ) {
		return $message;
	}

	// Parameters may have been passed as one array in the first slot.
	// isset() avoids an undefined-offset notice for lists not starting at 0.
	if ( isset( $args[0] ) && is_array( $args[0] ) ) {
		$args = array_values( $args[0] );
	}

	$replacementKeys = array();
	foreach ( $args as $n => $param ) {
		$replacementKeys['$' . ( $n + 1 )] = $param;
	}

	return strtr( $message, $replacementKeys );
}
1592
/**
 * Return an HTML-escaped version of a message.
 * Parameter replacements, if any, are done *after* the HTML-escaping,
 * so parameters may contain HTML (eg links or form controls). Be sure
 * to pre-escape them if you really do want plaintext, or just wrap
 * the whole thing in htmlspecialchars().
 *
 * @deprecated since 1.18
 *
 * @param string $key Message key
 * @param string ... parameters
 * @return string
 */
function wfMsgHtml( $key ) {
	wfDeprecated( __METHOD__, '1.21' );

	$params = array_slice( func_get_args(), 1 );
	$escaped = htmlspecialchars( wfMsgGetKey( $key ) );
	return wfMsgReplaceArgs( $escaped, $params );
}
1613
/**
 * Return an HTML version of message
 * Parameter replacements, if any, are done *after* parsing the wiki-text message,
 * so parameters may contain HTML (eg links or form controls). Be sure
 * to pre-escape them if you really do want plaintext, or just wrap
 * the whole thing in htmlspecialchars().
 *
 * @deprecated since 1.18
 *
 * @param string $key Message key
 * @param string ... parameters
 * @return string
 */
function wfMsgWikiHtml( $key ) {
	wfDeprecated( __METHOD__, '1.21' );

	$args = func_get_args();
	array_shift( $args );

	$parsed = MessageCache::singleton()->parse( wfMsgGetKey( $key ), null,
		/* can't be set to false */ true, /* interface */ true );
	// Same guard as wfMsgExt(): only call getText() when a ParserOutput came
	// back, so a plain-string result does not cause a fatal method call.
	if ( $parsed instanceof ParserOutput ) {
		$parsed = $parsed->getText();
	}

	return wfMsgReplaceArgs( $parsed, $args );
}
1637
/**
 * Returns message in the requested format
 *
 * @deprecated since 1.18
 *
 * @param string $key key of the message
 * @param array $options processing rules.
 *   Can take the following options:
 *     parse: parses wikitext to HTML
 *     parseinline: parses wikitext to HTML and removes the surrounding
 *       p's added by parser or tidy
 *     escape: filters message through htmlspecialchars
 *     escapenoentities: same, but allows entity references like &#160; through
 *     replaceafter: parameters are substituted after parsing or escaping
 *     parsemag: transform the message using magic phrases
 *     content: fetch message for content language instead of interface
 *   Also can accept a single associative argument, of the form 'language' => 'xx':
 *     language: Language object or language code to fetch message for
 *       (overridden by content).
 *   Behavior for conflicting options (e.g., parse+parseinline) is undefined.
 *   A warning is raised through wfWarn() for any option key that is neither
 *   numeric nor "language", and for any unknown option name.
 *
 * Any further arguments are message parameters.
 *
 * @return string
 */
function wfMsgExt( $key, $options ) {
	wfDeprecated( __METHOD__, '1.21' );

	$args = func_get_args();
	array_shift( $args );
	array_shift( $args );
	$options = (array)$options;

	$knownOptions = array( 'parse', 'parseinline', 'escape', 'escapenoentities',
		'replaceafter', 'parsemag', 'content' );
	foreach ( $options as $arrayKey => $option ) {
		// The alternation is grouped so that both anchors apply to both
		// branches; ungrouped, "^[0-9]+" and "language$" were anchored
		// separately and keys such as "12abc" or "xlanguage" slipped through.
		if ( !preg_match( '/^(?:[0-9]+|language)$/', $arrayKey ) ) {
			# An unknown index, neither numeric nor "language"
			wfWarn( "wfMsgExt called with incorrect parameter key $arrayKey", 1, E_USER_WARNING );
		} elseif ( preg_match( '/^[0-9]+$/', $arrayKey ) && !in_array( $option, $knownOptions ) ) {
			# A numeric index with unknown value
			wfWarn( "wfMsgExt called with incorrect parameter $option", 1, E_USER_WARNING );
		}
	}

	if ( in_array( 'content', $options, true ) ) {
		$forContent = true;
		$langCode = true;
		$langCodeObj = null;
	} elseif ( array_key_exists( 'language', $options ) ) {
		$forContent = false;
		$langCode = wfGetLangObj( $options['language'] );
		$langCodeObj = $langCode;
	} else {
		$forContent = false;
		$langCode = false;
		$langCodeObj = null;
	}

	$string = wfMsgGetKey( $key, /*DB*/true, $langCode, /*Transform*/false );

	// Default: substitute parameters before any parsing or escaping
	if ( !in_array( 'replaceafter', $options, true ) ) {
		$string = wfMsgReplaceArgs( $string, $args );
	}

	$messageCache = MessageCache::singleton();
	$parseInline = in_array( 'parseinline', $options, true );
	if ( in_array( 'parse', $options, true ) || $parseInline ) {
		$string = $messageCache->parse( $string, null, true, !$forContent, $langCodeObj );
		if ( $string instanceof ParserOutput ) {
			$string = $string->getText();
		}

		if ( $parseInline ) {
			// Strip a single wrapping <p>...</p>
			$m = array();
			if ( preg_match( '/^<p>(.*)\n?<\/p>\n?$/sU', $string, $m ) ) {
				$string = $m[1];
			}
		}
	} elseif ( in_array( 'parsemag', $options, true ) ) {
		$string = $messageCache->transform( $string,
			!$forContent, $langCodeObj );
	}

	if ( in_array( 'escape', $options, true ) ) {
		$string = htmlspecialchars( $string );
	} elseif ( in_array( 'escapenoentities', $options, true ) ) {
		$string = Sanitizer::escapeHtmlAllowEntities( $string );
	}

	if ( in_array( 'replaceafter', $options, true ) ) {
		$string = wfMsgReplaceArgs( $string, $args );
	}

	return $string;
}
1732
/**
 * Since wfMsg() and co suck, they don't return false if the message key they
 * looked up didn't exist but instead the key wrapped in <>'s, this function checks for the
 * nonexistence of messages by checking the MessageCache::get() result directly.
 *
 * @deprecated since 1.18. Use Message::isDisabled().
 *
 * @param string $key the message key looked up
 * @return bool True if the message *doesn't* exist.
 */
function wfEmptyMsg( $key ) {
	wfDeprecated( __METHOD__, '1.21' );

	$cached = MessageCache::singleton()->get( $key, /*useDB*/true, /*content*/false );
	return $cached === false;
}
1748
/**
 * Throw a debugging exception. This function previously once exited the process,
 * but now throws an exception instead, with similar results.
 *
 * @deprecated since 1.22; just throw an MWException yourself
 * @param string $msg message shown when dying.
 * @throws MWException Always
 */
function wfDebugDieBacktrace( $msg = '' ) {
	wfDeprecated( __FUNCTION__, '1.22' );

	$exception = new MWException( $msg );
	throw $exception;
}
1761
/**
 * Fetch server name for use in error reporting etc.
 * Use real server name if available, so we know which machine
 * in a server farm generated the current page.
 *
 * The value is determined once and kept in a static variable. Sources, in
 * order of preference: $wgOverrideHostname (unless it is false), the
 * 'nodename' reported by posix_uname(), the COMPUTERNAME environment
 * variable, and finally $_SERVER['SERVER_NAME'].
 *
 * @return string
 */
function wfHostname() {
	static $cachedHost;

	if ( !is_null( $cachedHost ) ) {
		return $cachedHost;
	}

	# Hostname overriding
	global $wgOverrideHostname;
	if ( $wgOverrideHostname !== false ) {
		# Set static and skip any detection
		$cachedHost = $wgOverrideHostname;
		return $cachedHost;
	}

	// posix_uname() is not present on Windows
	$uname = function_exists( 'posix_uname' ) ? posix_uname() : false;
	if ( is_array( $uname ) && isset( $uname['nodename'] ) ) {
		$cachedHost = $uname['nodename'];
		return $cachedHost;
	}

	# Windows computer name
	$computerName = getenv( 'COMPUTERNAME' );
	if ( $computerName ) {
		$cachedHost = $computerName;
	} else {
		# This may be a virtual server.
		$cachedHost = $_SERVER['SERVER_NAME'];
	}

	return $cachedHost;
}
1799
/**
 * Returns a HTML comment with the elapsed time since request.
 * This method has no side effects.
 *
 * The elapsed time is measured from $wgRequestTime and printed with three
 * decimals. The host name from wfHostname() is included only when
 * $wgShowHostnames is truthy.
 *
 * @return string
 */
function wfReportTime() {
	global $wgRequestTime, $wgShowHostnames;

	$elapsed = microtime( true ) - $wgRequestTime;

	if ( !$wgShowHostnames ) {
		return sprintf( '<!-- Served in %01.3f secs. -->', $elapsed );
	}

	return sprintf( '<!-- Served by %s in %01.3f secs. -->', wfHostname(), $elapsed );
}
1815
/**
 * Safety wrapper for debug_backtrace().
 *
 * With Zend Optimizer 3.2.0 loaded, this causes segfaults under somewhat
 * murky circumstances, which may be triggered in part by stub objects
 * or other fancy talking'.
 *
 * Will return an empty array if Zend Optimizer is detected or if
 * debug_backtrace is disabled, otherwise the output from
 * debug_backtrace() (trimmed: the frame for this function is removed).
 * Whether debug_backtrace is listed in the disable_functions ini setting is
 * checked once and remembered in a static variable.
 *
 * @param int $limit This parameter can be used to limit the number of stack
 *   frames returned; it only takes effect on PHP 5.4.0 and later
 *
 * @return array of backtrace information
 */
function wfDebugBacktrace( $limit = 0 ) {
	static $disabled = null;

	if ( extension_loaded( 'Zend Optimizer' ) ) {
		wfDebug( "Zend Optimizer detected; skipping debug_backtrace for safety.\n" );
		return array();
	}

	if ( $disabled === null ) {
		$disabled = false;
		$disabledFunctions = array_map(
			'strtolower',
			array_map( 'trim', explode( ',', ini_get( 'disable_functions' ) ) )
		);
		if ( in_array( 'debug_backtrace', $disabledFunctions ) ) {
			wfDebug( "debug_backtrace is in disabled_functions\n" );
			$disabled = true;
		}
	}
	if ( $disabled ) {
		return array();
	}

	// One frame more than requested is fetched because the first frame
	// (this function itself) is dropped below.
	$frames = ( $limit && version_compare( PHP_VERSION, '5.4.0', '>=' ) )
		? debug_backtrace( DEBUG_BACKTRACE_PROVIDE_OBJECT, $limit + 1 )
		: debug_backtrace();

	return array_slice( $frames, 1 );
}
1859
/**
 * Get a debug backtrace as a string
 *
 * In command line mode ($wgCommandLineMode) the result is plain text with
 * one line per frame followed by an empty line; otherwise it is an HTML
 * unordered list with one item per frame. Each entry names the file (base
 * name only) and line of the call, and the function or method called;
 * missing file or line information is shown as "-".
 *
 * @return string
 */
function wfBacktrace() {
	global $wgCommandLineMode;

	$msg = $wgCommandLineMode ? '' : "<ul>\n";

	foreach ( wfDebugBacktrace() as $frame ) {
		if ( isset( $frame['file'] ) ) {
			// Keep only the last path component
			$pathParts = explode( DIRECTORY_SEPARATOR, $frame['file'] );
			$file = end( $pathParts );
		} else {
			$file = '-';
		}
		$line = isset( $frame['line'] ) ? $frame['line'] : '-';

		$callee = $frame['function'] . '()';
		if ( !empty( $frame['class'] ) ) {
			$callee = $frame['class'] . $frame['type'] . $callee;
		}

		if ( $wgCommandLineMode ) {
			$msg .= "$file line $line calls $callee\n";
		} else {
			$msg .= '<li>' . $file . ' line ' . $line . ' calls ' . $callee . "</li>\n";
		}
	}

	$msg .= $wgCommandLineMode ? "\n" : "</ul>\n";

	return $msg;
}
1910
/**
 * Get the name of the function which called this function
 * wfGetCaller( 1 ) is the function with the wfGetCaller() call (ie. __FUNCTION__)
 * wfGetCaller( 2 ) [default] is the caller of the function running wfGetCaller()
 * wfGetCaller( 3 ) is the parent of that.
 *
 * @param int $level Which frame of the backtrace to report
 * @return string Frame formatted by wfFormatStackFrame(), or 'unknown' if
 *   the backtrace has no frame at that level
 */
function wfGetCaller( $level = 2 ) {
	$frames = wfDebugBacktrace( $level + 1 );

	return isset( $frames[$level] )
		? wfFormatStackFrame( $frames[$level] )
		: 'unknown';
}
1928
/**
 * Return a string consisting of callers in the stack. Useful sometimes
 * for profiling specific points.
 *
 * The frames are listed outermost first, formatted with
 * wfFormatStackFrame() and joined with "/". The innermost frame of the
 * backtrace is never included.
 *
 * @param int $limit The maximum depth of the stack frame to return, or false for
 *   the entire stack.
 * @return string
 */
function wfGetAllCallers( $limit = 3 ) {
	$frames = array_reverse( wfDebugBacktrace() );

	$maxDepth = count( $frames ) - 1;
	if ( !$limit || $limit > $maxDepth ) {
		$limit = $maxDepth;
	}

	// Take $limit frames ending just before the last (innermost) one
	$selected = array_slice( $frames, -$limit - 1, $limit );

	return implode( '/', array_map( 'wfFormatStackFrame', $selected ) );
}
1945
/**
 * Return a string representation of frame
 *
 * @param array $frame Backtrace frame; 'function' is required, 'class' is
 *   optional
 * @return string "Class::function" when the frame has a class, otherwise
 *   just the function name
 */
function wfFormatStackFrame( $frame ) {
	if ( isset( $frame['class'] ) ) {
		return $frame['class'] . '::' . $frame['function'];
	}

	return $frame['function'];
}
1957
1958 /* Some generic result counters, pulled out of SearchEngine */
1959
/**
 * Return the parsed 'showingresults' interface message.
 *
 * The message receives two numeric parameters: $limit and $offset + 1.
 *
 * @param int $offset Zero-based offset of the first result shown
 * @param int $limit Number of results per page
 * @return string
 */
function wfShowingResults( $offset, $limit ) {
	$message = wfMessage( 'showingresults' )->numParams( $limit, $offset + 1 );
	return $message->parse();
}
1970
/**
 * Generate (prev x| next x) (20|50|100...) type links for paging
 *
 * Delegates to $wgLang->viewPrevNext() after converting $query with
 * wfCgiToArray() and turning $link into a title object.
 *
 * @param string $offset
 * @param int $limit
 * @param string|object $link Page name, or an object which is used as the
 *   title as-is
 * @param string $query optional URL query parameter string
 * @param bool $atend optional param for specified if this is the last page
 * @return string|bool The links, or false if $link is not a valid title
 * @deprecated in 1.19; use Language::viewPrevNext() instead
 */
function wfViewPrevNext( $offset, $limit, $link, $query = '', $atend = false ) {
	wfDeprecated( __METHOD__, '1.19' );

	global $wgLang;

	$query = wfCgiToArray( $query );

	$title = is_object( $link ) ? $link : Title::newFromText( $link );
	if ( is_null( $title ) ) {
		return false;
	}

	return $wgLang->viewPrevNext( $title, $offset, $limit, $query, $atend );
}
2000
/**
 * Check whether the client declared gzip as an acceptable content encoding.
 *
 * The Accept-Encoding request header is inspected for a "gzip" token. A
 * token carrying a quality value of zero ("gzip;q=0", "gzip; q=0.0", ...)
 * counts as a refusal. The answer is kept in a static variable and reused
 * by later calls unless $force is set.
 *
 * @todo FIXME: We may want to blacklist some broken browsers
 *
 * @param bool $force Re-evaluate the header even if a result is cached
 * @return bool Whether the client accepts gzip compression
 */
function wfClientAcceptsGzip( $force = false ) {
	static $result = null;
	if ( $result === null || $force ) {
		$result = false;
		if ( isset( $_SERVER['HTTP_ACCEPT_ENCODING'] ) ) {
			# @todo FIXME: We may want to blacklist some broken browsers
			$m = array();
			// The fractional part of the q-value is optional ("q=0" is as
			// valid as "q=0.0") and whitespace may surround the ";".
			if ( preg_match(
					'/\bgzip(?:\s*;\s*(q)=([0-9]+(?:\.[0-9]+)?))?\b/',
					$_SERVER['HTTP_ACCEPT_ENCODING'],
					$m
				)
			) {
				if ( isset( $m[2] ) && ( $m[1] == 'q' ) && ( $m[2] == 0 ) ) {
					// gzip explicitly refused with a zero quality value
					$result = false;
					return $result;
				}
				wfDebug( "wfClientAcceptsGzip: client accepts gzip.\n" );
				$result = true;
			}
		}
	}
	return $result;
}
2032
/**
 * Obtain the offset and limit values from the request string;
 * used in special pages
 *
 * Delegates to $wgRequest->getLimitOffset().
 *
 * @param int $deflimit default limit if none supplied
 * @param string $optionname Name of a user preference to check against
 * @return array
 */
function wfCheckLimits( $deflimit = 50, $optionname = 'rclimit' ) {
	global $wgRequest;

	$limitAndOffset = $wgRequest->getLimitOffset( $deflimit, $optionname );
	return $limitAndOffset;
}
2046
/**
 * Escapes the given text so that it may be output using addWikiText()
 * without any linking, formatting, etc. making its way through. This
 * is achieved by substituting certain characters with HTML entities.
 * As required by the callers, "<nowiki>" is not used.
 *
 * The substitution table and the protocol regex are built on the first call
 * and kept in static variables, so $wgUrlProtocols is only read once.
 *
 * @param string $text Text to be escaped
 * @return string
 */
function wfEscapeWikiText( $text ) {
	static $table = null, $protocolRegex = null;

	if ( $table === null ) {
		// Sequences escaped wherever they occur
		$table = array(
			'"' => '&#34;', '&' => '&#38;', "'" => '&#39;', '<' => '&#60;',
			'=' => '&#61;', '>' => '&#62;', '[' => '&#91;', ']' => '&#93;',
			'{' => '&#123;', '|' => '&#124;', '}' => '&#125;', ';' => '&#59;',
			'__' => '_&#95;', '://' => '&#58;//',
			// Consecutive line breaks
			"\n\n" => "\n&#10;", "\r\n" => "&#13;\n",
			"\n\r" => "\n&#13;", "\r\r" => "\r&#13;",
		);

		// Sequences escaped only directly after a line break.
		// "\n\t\n" is treated like "\n\n", hence the tab entry.
		$afterLineBreak = array(
			'#' => '&#35;',
			'*' => '&#42;',
			':' => '&#58;',
			' ' => '&#32;',
			"\t" => '&#9;',
			'----' => '&#45;---',
		);
		foreach ( array( "\n", "\r" ) as $lineBreak ) {
			foreach ( $afterLineBreak as $plain => $entity ) {
				$table[$lineBreak . $plain] = $lineBreak . $entity;
			}
		}

		// We have to catch everything "\s" matches in PCRE
		$whitespace = array(
			' ' => '&#32;',
			"\t" => '&#9;',
			"\r" => '&#13;',
			"\n" => '&#10;',
			"\f" => '&#12;',
		);
		foreach ( array( 'ISBN', 'RFC', 'PMID' ) as $magic ) {
			foreach ( $whitespace as $space => $entity ) {
				$table[$magic . $space] = $magic . $entity;
			}
		}

		// And handle protocols that don't use "://"
		global $wgUrlProtocols;
		$schemes = array();
		foreach ( $wgUrlProtocols as $prot ) {
			if ( substr( $prot, -1 ) === ':' ) {
				$schemes[] = preg_quote( substr( $prot, 0, -1 ), '/' );
			}
		}
		// With no such protocol configured, use a pattern that can never match
		$protocolRegex = $schemes
			? '/\b(' . implode( '|', $schemes ) . '):/i'
			: '/^(?!)/';
	}

	// A line break is prepended so that the "after a line break" entries also
	// apply at the very start of the text; it is stripped again afterwards.
	$escaped = substr( strtr( "\n$text", $table ), 1 );
	return preg_replace( $protocolRegex, '$1&#58;', $escaped );
}
2097
/**
 * Get the current unix timestamp with microseconds. Useful for profiling.
 *
 * @deprecated since 1.22; call microtime() directly
 * @return float Result of microtime( true )
 */
function wfTime() {
	wfDeprecated( __FUNCTION__, '1.22' );

	$asFloat = true;
	return microtime( $asFloat );
}
2107
/**
 * Assign $source to $dest and hand back the value $dest had before.
 *
 * A null $source leaves $dest untouched (the old value is still returned)
 * unless $force is true, in which case $dest is set to null.
 *
 * @param mixed &$dest Variable to update
 * @param mixed $source New value
 * @param bool $force Assign even when $source is null
 * @return mixed Previous value of $dest
 */
function wfSetVar( &$dest, $source, $force = false ) {
	$previous = $dest;

	$shouldAssign = $force || $source !== null;
	if ( $shouldAssign ) {
		$dest = $source;
	}

	return $previous;
}
2125
/**
 * As for wfSetVar except setting a bit.
 *
 * Turns the bit(s) in $bit on or off in $dest according to $state and
 * reports whether any of them was set beforehand. A null $state leaves
 * $dest unchanged.
 *
 * @param int &$dest Bit field to modify
 * @param int $bit Bit mask to set or clear
 * @param bool|null $state True to set, false to clear, null to only query
 * @return bool Whether ( $dest & $bit ) was non-zero before the call
 */
function wfSetBit( &$dest, $bit, $state = true ) {
	$wasSet = ( $dest & $bit ) ? true : false;

	if ( $state === null ) {
		return $wasSet;
	}

	$dest = $state ? ( $dest | $bit ) : ( $dest & ~$bit );
	return $wasSet;
}
2146
/**
 * A wrapper around the PHP function var_export().
 *
 * The export has its line breaks turned into "<br />" and is then either
 * printed directly (when headers were already sent or $wgOut is not a usable
 * object) or added to the regular output via $wgOut->addHTML().
 *
 * NOTE(review): the exported text is not HTML-escaped before being output.
 *
 * @param mixed $var A PHP variable to dump.
 */
function wfVarDump( $var ) {
	global $wgOut;

	$export = var_export( $var, true ) . "\n";
	$html = str_replace( "\n", "<br />\n", $export );

	$canUseOutputPage = !headers_sent() && isset( $wgOut ) && is_object( $wgOut );
	if ( $canUseOutputPage ) {
		$wgOut->addHTML( $html );
	} else {
		print $html;
	}
}
2162
/**
 * Provide a simple HTTP error.
 *
 * Disables $wgOut, sends the status headers and the cache control headers,
 * then prints a minimal HTML page with $label as title and heading and
 * $desc (line breaks preserved) as body text.
 *
 * @param int|string $code HTTP status code
 * @param string $label Short status text, used in the headers and the page
 * @param string $desc Longer description shown in the page body
 */
function wfHttpError( $code, $label, $desc ) {
	global $wgOut;

	$wgOut->disable();
	$status = "$code $label";
	header( "HTTP/1.0 $status" );
	header( "Status: $status" );
	$wgOut->sendCacheControl();

	header( 'Content-type: text/html; charset=utf-8' );

	// Both values end up inside markup, so escape them first
	$safeLabel = htmlspecialchars( $label );
	$safeDesc = nl2br( htmlspecialchars( $desc ) );

	$page = "<!doctype html>" .
		'<html><head><title>' .
		$safeLabel .
		'</title></head><body><h1>' .
		$safeLabel .
		'</h1><p>' .
		$safeDesc .
		"</p></body></html>\n";
	print $page;
}
2187
/**
 * Clear away any user-level output buffers, discarding contents.
 *
 * Suitable for 'starting afresh', for instance when streaming
 * relatively large amounts of data without buffering, or wanting to
 * output image files without ob_gzhandler's compression.
 *
 * When $resetGzipEncoding is true (the default), the global
 * $wgDisableOutputCompression is switched on, and if an 'ob_gzhandler'
 * buffer is removed its Content-Encoding header is removed too and the
 * function stops there. Pass false (or use wfClearOutputBuffers()) to keep
 * that header.
 *
 * Note that some PHP configuration options may add output buffer
 * layers which cannot be removed; these are left in place.
 *
 * @param bool $resetGzipEncoding Whether to also suppress gzip encoding
 */
function wfResetOutputBuffers( $resetGzipEncoding = true ) {
	if ( $resetGzipEncoding ) {
		// Suppress Content-Encoding and Content-Length
		// headers from 1.10+s wfOutputHandler
		global $wgDisableOutputCompression;
		$wgDisableOutputCompression = true;
	}

	// ob_get_status() yields an empty array once no buffer is left
	for ( $status = ob_get_status(); $status; $status = ob_get_status() ) {
		if ( $status['type'] == 0 /* PHP_OUTPUT_HANDLER_INTERNAL */ ) {
			// Probably from zlib.output_compression or other
			// PHP-internal setting which can't be removed.
			//
			// Give up, and hope the result doesn't break
			// output behavior.
			break;
		}

		if ( !ob_end_clean() ) {
			// Could not remove output buffer handler; abort now
			// to avoid getting in some kind of infinite loop.
			break;
		}

		if ( $resetGzipEncoding && $status['name'] == 'ob_gzhandler' ) {
			// Reset the 'Content-Encoding' field set by this handler
			// so we can start fresh.
			header_remove( 'Content-Encoding' );
			break;
		}
	}
}
2236
/**
 * More legible than passing a 'false' parameter to wfResetOutputBuffers():
 *
 * Clear away output buffers, but keep the Content-Encoding header
 * produced by ob_gzhandler, if any.
 *
 * This should be used for HTTP 304 responses, where you need to
 * preserve the Content-Encoding header of the real result, but
 * also need to suppress the output of ob_gzhandler to keep to spec
 * and avoid breaking Firefox in rare cases where the headers and
 * body are broken over two packets.
 */
function wfClearOutputBuffers() {
	$resetGzipEncoding = false;
	wfResetOutputBuffers( $resetGzipEncoding );
}
2252
/**
 * Converts an Accept-* header into an array mapping string values to quality
 * factors.
 *
 * Each comma-separated entry contributes one key. Its quality factor is taken
 * from the first "q=" parameter found among the entry's ';'-separated
 * parameters, and is 1.0 when there is none. Other parameters (such as
 * "level=1") are ignored and not kept in the key. Entries whose "q=" value is
 * not a number, and empty entries, are skipped.
 *
 * @param string $accept Header value; an empty value means "accept anything"
 * @param string $def Key to use when $accept is empty
 * @return array Map of value => quality factor (float)
 */
function wfAcceptToPrefs( $accept, $def = '*/*' ) {
	# No arg means accept anything (per HTTP spec)
	if ( !$accept ) {
		return array( $def => 1.0 );
	}

	$prefs = array();

	foreach ( explode( ',', $accept ) as $part ) {
		$params = array_map( 'trim', explode( ';', $part ) );
		$value = array_shift( $params );
		if ( $value === '' ) {
			// e.g. a stray trailing comma
			continue;
		}

		$quality = 1.0;
		$valid = true;
		foreach ( $params as $param ) {
			$match = array();
			if ( !preg_match( '/^q\s*=\s*(.*)$/i', $param, $match ) ) {
				// Not a quality parameter
				continue;
			}
			// Accept "1", "0", "0.5", ".5" and "1." alike
			if ( preg_match( '/^(?:\d+(?:\.\d*)?|\.\d+)$/', $match[1] ) ) {
				$quality = floatval( $match[1] );
			} else {
				$valid = false;
			}
			break;
		}

		if ( $valid ) {
			$prefs[$value] = $quality;
		}
	}

	return $prefs;
}
2284
/**
 * Checks if a given MIME type matches any of the keys in the given
 * array. Basic wildcards are accepted in the array keys.
 *
 * The exact type is tried first, then "<major>/*", then "*" . "/*".
 *
 * @param string $type MIME type to look up
 * @param array $avail Array keyed by MIME type or wildcard
 * @return string|null The matching key (type or wildcard), or null if none
 * @private
 */
function mimeTypeMatch( $type, $avail ) {
	if ( array_key_exists( $type, $avail ) ) {
		return $type;
	}

	$parts = explode( '/', $type );
	$majorWildcard = $parts[0] . '/*';
	if ( array_key_exists( $majorWildcard, $avail ) ) {
		return $majorWildcard;
	}

	if ( array_key_exists( '*/*', $avail ) ) {
		return '*/*';
	}

	return null;
}

/**
 * Returns the 'best' match between a client's requested internet media types
 * and the server's list of available types. Each list should be an associative
 * array of type to preference (preference is a float between 0.0 and 1.0).
 * Wildcards in the types are acceptable.
 *
 * Only concrete types (no "*" subtype) can be returned. Keys that do not
 * have the "type/subtype" form are ignored, so a malformed entry in a client
 * header can neither raise an undefined-offset notice nor be picked as the
 * result.
 *
 * @param array $cprefs Client's acceptable type list
 * @param array $sprefs Server's offered types
 * @return string|null The concrete type with the highest combined preference,
 *   or null when nothing matches with a preference above zero
 *
 * @todo FIXME: Doesn't handle params like 'text/plain; charset=UTF-8'
 * XXX: generalize to negotiate other stuff
 */
function wfNegotiateType( $cprefs, $sprefs ) {
	$combine = array();

	// Concrete server types, matched against what the client accepts
	foreach ( array_keys( $sprefs ) as $type ) {
		$parts = explode( '/', $type );
		if ( count( $parts ) < 2 || $parts[1] == '*' ) {
			continue;
		}
		$ckey = mimeTypeMatch( $type, $cprefs );
		if ( $ckey !== null ) {
			$combine[$type] = $sprefs[$type] * $cprefs[$ckey];
		}
	}

	// Concrete client types the server only covers through a wildcard
	foreach ( array_keys( $cprefs ) as $type ) {
		$parts = explode( '/', $type );
		if ( count( $parts ) < 2 || $parts[1] == '*' || array_key_exists( $type, $sprefs ) ) {
			continue;
		}
		$skey = mimeTypeMatch( $type, $sprefs );
		if ( $skey !== null ) {
			$combine[$type] = $sprefs[$skey] * $cprefs[$type];
		}
	}

	$bestq = 0;
	$besttype = null;

	foreach ( $combine as $type => $quality ) {
		if ( $quality > $bestq ) {
			$besttype = $type;
			$bestq = $quality;
		}
	}

	return $besttype;
}
2360
/**
 * Reference-counted warning suppression.
 *
 * The first un-ended call lowers error_reporting() so that warnings, notices,
 * deprecation and strict-standards messages are no longer reported, and
 * remembers the previous level. Further calls only increase a counter.
 * Calls with $end = true decrease it; the remembered level is restored when
 * the counter reaches zero. Surplus "end" calls are ignored.
 *
 * @param bool $end True to end one level of suppression instead of starting one
 */
function wfSuppressWarnings( $end = false ) {
	static $suppressCount = 0;
	static $originalLevel = false;

	if ( !$end ) {
		if ( $suppressCount == 0 ) {
			$silenced = E_WARNING |
				E_NOTICE |
				E_USER_WARNING |
				E_USER_NOTICE |
				E_DEPRECATED |
				E_USER_DEPRECATED |
				E_STRICT;
			$originalLevel = error_reporting( E_ALL & ~$silenced );
		}
		$suppressCount++;
		return;
	}

	if ( $suppressCount > 0 ) {
		$suppressCount--;
		if ( $suppressCount == 0 ) {
			error_reporting( $originalLevel );
		}
	}
}
2392
/**
 * Restore error level to previous value.
 *
 * Ends one level of suppression started by wfSuppressWarnings().
 */
function wfRestoreWarnings() {
	$end = true;
	wfSuppressWarnings( $end );
}
2399
# Timestamp format identifiers: the values accepted as the $outputtype
# argument of wfTimestamp() and wfTimestampOrNull() below.
# NOTE(review): the values run 0-7 and then 9; no constant with value 8 is
# defined in this section.

/**
 * Unix time - the number of seconds since 1970-01-01 00:00:00 UTC
 */
define( 'TS_UNIX', 0 );

/**
 * MediaWiki concatenated string timestamp (YYYYMMDDHHMMSS)
 */
define( 'TS_MW', 1 );

/**
 * MySQL DATETIME (YYYY-MM-DD HH:MM:SS)
 */
define( 'TS_DB', 2 );

/**
 * RFC 2822 format, for E-mail and HTTP headers
 */
define( 'TS_RFC2822', 3 );

/**
 * ISO 8601 format with no timezone offset, e.g. 1986-02-09T20:00:00Z
 *
 * This is used by Special:Export
 */
define( 'TS_ISO_8601', 4 );

/**
 * An Exif timestamp (YYYY:MM:DD HH:MM:SS)
 *
 * @see http://exif.org/Exif2-2.PDF The Exif 2.2 spec, see page 28 for the
 * DateTime tag and page 36 for the DateTimeOriginal and
 * DateTimeDigitized tags.
 */
define( 'TS_EXIF', 5 );

/**
 * Oracle format time.
 */
define( 'TS_ORACLE', 6 );

/**
 * Postgres format time.
 */
define( 'TS_POSTGRES', 7 );

/**
 * ISO 8601 basic format with no timezone offset, e.g. 19860209T200000Z.
 * This is used by ResourceLoader
 */
define( 'TS_ISO_8601_BASIC', 9 );
2452
/**
 * Get a timestamp string in one of various formats.
 *
 * The input is handed to MWTimestamp and the result of its getTimestamp()
 * method is returned. A TimestampException from either step is logged
 * through wfDebug() and turned into a false return value.
 *
 * @param mixed $outputtype Desired output format, passed to
 *   MWTimestamp::getTimestamp() (default TS_UNIX)
 * @param mixed $ts Optional timestamp to convert, passed to the MWTimestamp
 *   constructor; default 0 for the current time
 * @return string|bool The same date in the format specified in $outputtype,
 *   or false
 */
function wfTimestamp( $outputtype = TS_UNIX, $ts = 0 ) {
	$formatted = false;

	try {
		$converter = new MWTimestamp( $ts );
		$formatted = $converter->getTimestamp( $outputtype );
	} catch ( TimestampException $e ) {
		wfDebug( "wfTimestamp() fed bogus time value: TYPE=$outputtype; VALUE=$ts\n" );
	}

	return $formatted;
}
2471
/**
 * Return a formatted timestamp, or null if input is null.
 * For dealing with nullable timestamp columns in the database.
 *
 * @param int $outputtype Output format, as for wfTimestamp()
 * @param string|null $ts Timestamp to convert, or null
 * @return string|bool|null Null for a null $ts, otherwise the result of
 *   wfTimestamp()
 */
function wfTimestampOrNull( $outputtype = TS_UNIX, $ts = null ) {
	return $ts === null ? null : wfTimestamp( $outputtype, $ts );
}
2487
/**
 * Convenience function; returns MediaWiki timestamp for the present time.
 *
 * @return string Result of wfTimestamp( TS_MW, time() )
 */
function wfTimestampNow() {
	$now = time();
	return wfTimestamp( TS_MW, $now );
}
2497
/**
 * Check if the operating system is Windows.
 *
 * The answer is derived from php_uname() on the first call and cached.
 *
 * @return bool True if php_uname() starts with "Windows", false otherwise.
 */
function wfIsWindows() {
	static $isWindows = null;

	if ( $isWindows !== null ) {
		return $isWindows;
	}

	$isWindows = ( strncmp( php_uname(), 'Windows', 7 ) === 0 );
	return $isWindows;
}
2510
/**
 * Check if we are running under HHVM.
 *
 * @return bool Whether the HHVM_VERSION constant is defined
 */
function wfIsHHVM() {
	$underHhvm = defined( 'HHVM_VERSION' );
	return $underHhvm;
}
2519
/**
 * Swap two variables.
 *
 * @param mixed &$x Receives the value of $y
 * @param mixed &$y Receives the value of $x
 */
function swap( &$x, &$y ) {
	// Both values are copied into the temporary array before either is overwritten
	list( $x, $y ) = array( $y, $x );
}
2531
/**
 * Tries to get the system directory for temporary files.
 *
 * $wgTmpDirectory wins whenever it is not false. Otherwise the TMPDIR, TMP
 * and TEMP environment variables are checked in that order and the first one
 * naming an existing, writable directory is used. If none qualifies,
 * sys_get_temp_dir() is returned.
 *
 * NOTE: When possible, use instead the tmpfile() function to create
 * temporary files to avoid race conditions on file creation, etc.
 *
 * @return string
 */
function wfTempDir() {
	global $wgTmpDirectory;

	if ( $wgTmpDirectory !== false ) {
		return $wgTmpDirectory;
	}

	foreach ( array( 'TMPDIR', 'TMP', 'TEMP' ) as $envName ) {
		$candidate = getenv( $envName );
		if ( !$candidate ) {
			// Unset or empty
			continue;
		}
		if ( file_exists( $candidate ) && is_dir( $candidate ) && is_writable( $candidate ) ) {
			return $candidate;
		}
	}

	return sys_get_temp_dir();
}
2559
/**
 * Make directory, and make all parent directories if they don't exist.
 *
 * An empty $dir and an already existing directory both count as success.
 * A failed mkdir() is still reported as success when the directory exists
 * afterwards; otherwise a warning naming the path and mode is logged.
 *
 * @param string $dir Full path to directory to create
 * @param int $mode Chmod value to use, default is $wgDirectoryMode
 * @param string $caller Optional caller param for debugging.
 * @throws MWException When $dir is a storage path
 * @return bool
 */
function wfMkdirParents( $dir, $mode = null, $caller = null ) {
	global $wgDirectoryMode;

	if ( FileBackend::isStoragePath( $dir ) ) { // sanity
		throw new MWException( __FUNCTION__ . " given storage path '$dir'." );
	}

	if ( $caller !== null ) {
		wfDebug( "$caller: called wfMkdirParents($dir)\n" );
	}

	// Nothing to do
	if ( strval( $dir ) === '' ) {
		return true;
	}
	if ( file_exists( $dir ) && is_dir( $dir ) ) {
		return true;
	}

	$dir = str_replace( array( '\\', '/' ), DIRECTORY_SEPARATOR, $dir );
	$mode = ( $mode === null ) ? $wgDirectoryMode : $mode;

	// Turn off the normal warning, we're doing our own below
	wfSuppressWarnings();
	$created = mkdir( $dir, $mode, true ); // PHP5 <3
	wfRestoreWarnings();

	if ( $created ) {
		return $created;
	}

	// Directory may have been created on another request since we last checked
	if ( is_dir( $dir ) ) {
		return true;
	}

	// PHP doesn't report the path in its warning message, so add our own to aid in diagnosis.
	wfLogWarning( sprintf( "failed to mkdir \"%s\" mode 0%o", $dir, $mode ) );
	return $created;
}
2606
/**
 * Remove a directory and all its content.
 * Does not hide error.
 *
 * Does nothing (apart from the debug log entry) when $dir is not a
 * directory. Entries whose filetype() is "dir" are removed recursively;
 * everything else is unlink()ed.
 *
 * @param string $dir Path of the directory to remove
 */
function wfRecursiveRemoveDir( $dir ) {
	wfDebug( __FUNCTION__ . "( $dir )\n" );
	// taken from http://de3.php.net/manual/en/function.rmdir.php#98622
	if ( !is_dir( $dir ) ) {
		return;
	}

	$objects = scandir( $dir );
	if ( $objects === false ) {
		// scandir() has already raised its own warning. Don't iterate over
		// false; still try rmdir() below so its outcome is reported as before.
		$objects = array();
	}

	foreach ( $objects as $object ) {
		if ( $object === '.' || $object === '..' ) {
			continue;
		}
		$path = $dir . '/' . $object;
		if ( filetype( $path ) == "dir" ) {
			wfRecursiveRemoveDir( $path );
		} else {
			unlink( $path );
		}
	}

	rmdir( $dir );
}
2629
/**
 * Format a number as a percentage string.
 *
 * The number is first formatted with $acc decimals. With $round enabled the
 * result is passed through round(), which drops trailing zeros
 * (e.g. "33.3%"); without it the fixed number of decimals is kept
 * (e.g. "33.30%").
 *
 * @param mixed $nr The number to format
 * @param int $acc The number of digits after the decimal point, default 2
 * @param bool $round Whether or not to round the value, default true
 * @return string The formatted number followed by '%'
 */
function wfPercent( $nr, $acc = 2, $round = true ) {
	// Built by concatenation: "${acc}" interpolation is deprecated in newer PHP
	$ret = sprintf( '%.' . $acc . 'f', $nr );
	return $round ? round( (float)$ret, $acc ) . '%' : "$ret%";
}
2640
/**
 * Safety wrapper around ini_get() for boolean settings.
 * The values returned from ini_get() are pre-normalized for settings
 * set via php.ini or php_flag/php_admin_flag... but *not*
 * for those set via php_value/php_admin_value.
 *
 * It's fairly common for people to use php_value instead of php_flag,
 * which can leave you with an 'off' setting giving a false positive
 * for code that just takes the ini_get() return value as a boolean.
 *
 * To make things extra interesting, setting via php_value accepts
 * "true" and "yes" as true, but php.ini and php_flag consider them false. :)
 * Unrecognized values go false... again opposite PHP's own coercion
 * from string to bool.
 *
 * Luckily, 'properly' set settings will always come back as '0' or '1',
 * so we only have to worry about them and the 'improper' settings.
 *
 * Treated as true here (case-insensitively): "on", "true", "yes", and any
 * value that starts with a non-zero integer, optionally signed and
 * optionally preceded by whitespace.
 *
 * @param string $setting Name of the ini setting
 * @return bool
 */
function wfIniGetBool( $setting ) {
	$value = strtolower( ini_get( $setting ) );

	// 'on' and 'true' can't have whitespace around them, but '1' can.
	if ( in_array( $value, array( 'on', 'true', 'yes' ), true ) ) {
		return true;
	}

	// approx C atoi() function
	return (bool)preg_match( "/^\s*[+-]?0*[1-9]/", $value );
}
2672
/**
 * Windows-compatible version of escapeshellarg()
 * Windows doesn't recognise single-quotes in the shell, but the escapeshellarg()
 * function puts single quotes in regardless of OS.
 *
 * Also fixes the locale problems on Linux in PHP 5.2.6+ (bug backported to
 * earlier distro releases of PHP)
 *
 * Every argument is escaped on its own and the results are joined with
 * single spaces. Without arguments an empty string is returned.
 *
 * @param varargs Any number of arguments to escape
 * @return string
 */
function wfEscapeShellArg() {
	wfInitShellLocale();

	$escaped = array();
	foreach ( func_get_args() as $arg ) {
		if ( !wfIsWindows() ) {
			$escaped[] = escapeshellarg( $arg );
			continue;
		}

		// Escaping for an MSVC-style command line parser and CMD.EXE
		// @codingStandardsIgnoreStart For long URLs
		// Refs:
		//  * http://web.archive.org/web/20020708081031/http://mailman.lyra.org/pipermail/scite-interest/2002-March/000436.html
		//  * http://technet.microsoft.com/en-us/library/cc723564.aspx
		//  * Bug #13518
		//  * CR r63214
		// Double the backslashes before any double quotes. Escape the double quotes.
		// @codingStandardsIgnoreEnd
		$tokens = preg_split( '/(\\\\*")/', $arg, -1, PREG_SPLIT_DELIM_CAPTURE );
		$quoted = '';
		// Even positions hold text, odd positions hold the captured delimiters
		foreach ( $tokens as $position => $token ) {
			if ( $position % 2 == 1 ) {
				// Delimiter, a double quote preceded by zero or more slashes
				$quoted .= str_replace( '\\', '\\\\', substr( $token, 0, -1 ) ) . '\\"';
			} elseif ( $position % 4 == 2 ) {
				// ^ in $token will be outside quotes, need to be escaped
				$quoted .= str_replace( '^', '^^', $token );
			} else { // $position % 4 == 0
				// ^ in $token will appear inside double quotes, so leave as is
				$quoted .= $token;
			}
		}

		// Double the backslashes before the end of the string, because
		// we will soon add a quote
		$m = array();
		if ( preg_match( '/^(.*?)(\\\\+)$/', $quoted, $m ) ) {
			$quoted = $m[1] . str_replace( '\\', '\\\\', $m[2] );
		}

		// Add surrounding quotes
		$escaped[] = '"' . $quoted . '"';
	}

	return implode( ' ', $escaped );
}
2738
/**
 * Check if wfShellExec() is effectively disabled via php.ini config.
 *
 * The result is computed once and cached: 'safemode' when safe_mode is on,
 * 'disabled' when proc_open is listed in disable_functions, false otherwise.
 *
 * @return bool|string False or one of (safemode,disabled)
 * @since 1.22
 */
function wfShellExecDisabled() {
	static $disabled = null;

	if ( $disabled !== null ) {
		return $disabled;
	}

	$disabled = false;

	if ( wfIniGetBool( 'safe_mode' ) ) {
		wfDebug( "wfShellExec can't run in safe_mode, PHP's exec functions are too broken.\n" );
		$disabled = 'safemode';
		return $disabled;
	}

	// Normalise the comma-separated list before looking for proc_open
	$functions = array();
	foreach ( explode( ',', ini_get( 'disable_functions' ) ) as $name ) {
		$functions[] = strtolower( trim( $name ) );
	}
	if ( in_array( 'proc_open', $functions ) ) {
		wfDebug( "proc_open is in disabled_functions\n" );
		$disabled = 'disabled';
	}

	return $disabled;
}
2763
/**
 * Execute a shell command, with time and memory limits mirrored from the PHP
 * configuration if supported.
 *
 * Outline:
 *  - If wfShellExecDisabled() reports a reason, $retval is set to 1 and an
 *    explanatory message is returned instead of running anything.
 *  - The $environ variables are prepended to the command line.
 *  - On Linux, when at least one limit is greater than zero, the command is
 *    run through includes/limit.sh, which also gets an extra descriptor (3)
 *    whose lines are forwarded to the 'exec' debug log.
 *  - The command is started with proc_open(); its stdout is collected until
 *    the process has stopped or all pipes are closed.
 *
 * @param string $cmd Command line, properly escaped for shell.
 * @param &$retval null|Mixed optional, will receive the program's exit code.
 *                 (non-zero is usually failure). If there is an error from
 *                 read, select, or proc_open(), this will be set to -1.
 *                 For a process terminated by a signal it is 128 plus the
 *                 signal number.
 * @param array $environ optional environment variables which should be
 *                 added to the executed command environment.
 * @param array $limits optional array with limits(filesize, memory, time, walltime)
 *                 this overwrites the global wgMaxShell* limits. If 'walltime'
 *                 is absent but 'time' is given, 'time' is used for both.
 * @param array $options Array of options:
 *    - duplicateStderr: Set this to true to duplicate stderr to stdout,
 *      including errors from limit.sh
 *
 * @return string collected stdout as a string
 */
function wfShellExec( $cmd, &$retval = null, $environ = array(),
	$limits = array(), $options = array()
) {
	global $IP, $wgMaxShellMemory, $wgMaxShellFileSize, $wgMaxShellTime,
		$wgMaxShellWallClockTime, $wgShellCgroup;

	// Refuse early when PHP is configured in a way that makes this impossible
	$disabled = wfShellExecDisabled();
	if ( $disabled ) {
		$retval = 1;
		return $disabled == 'safemode' ?
			'Unable to run external programs in safe mode.' :
			'Unable to run external programs, proc_open() is disabled.';
	}

	$includeStderr = isset( $options['duplicateStderr'] ) && $options['duplicateStderr'];

	wfInitShellLocale();

	// Build the environment prefix for the command line.
	// NOTE(review): the variable names ($k) are inserted unescaped; only the
	// values are escaped.
	$envcmd = '';
	foreach ( $environ as $k => $v ) {
		if ( wfIsWindows() ) {
			/* Surrounding a set in quotes (method used by wfEscapeShellArg) makes the quotes themselves
			 * appear in the environment variable, so we must use caret escaping as documented in
			 * http://technet.microsoft.com/en-us/library/cc723564.aspx
			 * Note however that the quote isn't listed there, but is needed, and the parentheses
			 * are listed there but don't appear to need it.
			 */
			$envcmd .= "set $k=" . preg_replace( '/([&|()<>^"])/', '^\\1', $v ) . '&& ';
		} else {
			/* Assume this is a POSIX shell, thus required to accept variable assignments before the command
			 * http://www.opengroup.org/onlinepubs/009695399/utilities/xcu_chap02.html#tag_02_09_01
			 */
			$envcmd .= "$k=" . escapeshellarg( $v ) . ' ';
		}
	}
	$cmd = $envcmd . $cmd;

	$useLogPipe = false;
	if ( php_uname( 's' ) == 'Linux' ) {
		// Per-call limits take precedence over the global defaults
		$time = intval ( isset( $limits['time'] ) ? $limits['time'] : $wgMaxShellTime );
		if ( isset( $limits['walltime'] ) ) {
			$wallTime = intval( $limits['walltime'] );
		} elseif ( isset( $limits['time'] ) ) {
			// Only a CPU time limit was given: reuse it as wall clock limit
			$wallTime = $time;
		} else {
			$wallTime = intval( $wgMaxShellWallClockTime );
		}
		$mem = intval ( isset( $limits['memory'] ) ? $limits['memory'] : $wgMaxShellMemory );
		$filesize = intval ( isset( $limits['filesize'] ) ? $limits['filesize'] : $wgMaxShellFileSize );

		if ( $time > 0 || $mem > 0 || $filesize > 0 || $wallTime > 0 ) {
			// Wrap the command: limit.sh receives the original command line
			// and a string of MW_* settings as its two arguments.
			$cmd = '/bin/bash ' . escapeshellarg( "$IP/includes/limit.sh" ) . ' ' .
				escapeshellarg( $cmd ) . ' ' .
				escapeshellarg(
					"MW_INCLUDE_STDERR=" . ( $includeStderr ? '1' : '' ) . ';' .
					"MW_CPU_LIMIT=$time; " .
					'MW_CGROUP=' . escapeshellarg( $wgShellCgroup ) . '; ' .
					"MW_MEM_LIMIT=$mem; " .
					"MW_FILE_SIZE_LIMIT=$filesize; " .
					"MW_WALL_CLOCK_LIMIT=$wallTime; " .
					"MW_USE_LOG_PIPE=yes"
				);
			$useLogPipe = true;
		} elseif ( $includeStderr ) {
			$cmd .= ' 2>&1';
		}
	} elseif ( $includeStderr ) {
		$cmd .= ' 2>&1';
	}
	wfDebug( "wfShellExec: $cmd\n" );

	// Descriptors for the child: stdin and stderr are passed through, stdout
	// is captured, and descriptor 3 (if used) carries log lines.
	$desc = array(
		0 => array( 'file', 'php://stdin', 'r' ),
		1 => array( 'pipe', 'w' ),
		2 => array( 'file', 'php://stderr', 'w' ) );
	if ( $useLogPipe ) {
		$desc[3] = array( 'pipe', 'w' );
	}

	# TODO/FIXME: This is a bad hack to workaround an HHVM bug that prevents
	# proc_open() from opening the standard streams (descriptors 0 and 2 are
	# replaced here), so use /dev/null *for now*
	# See bug 56597 / https://github.com/facebook/hhvm/issues/1247 for more info
	if ( wfIsHHVM() ) {
		$desc[0] = array( 'file', '/dev/null', 'r' );
		$desc[2] = array( 'file', '/dev/null', 'w' );
	}

	$pipes = null;
	$proc = proc_open( $cmd, $desc, $pipes );
	if ( !$proc ) {
		wfDebugLog( 'exec', "proc_open() failed: $cmd" );
		$retval = -1;
		return '';
	}
	$outBuffer = $logBuffer = '';
	$emptyArray = array();
	// $status stays false unless the loop below sees the process stopped
	$status = false;
	// $logMsg becomes a string when something worth logging happened
	$logMsg = false;

	// According to the documentation, it is possible for stream_select()
	// to fail due to EINTR. I haven't managed to induce this in testing
	// despite sending various signals. If it did happen, the error
	// message would take the form:
	//
	// stream_select(): unable to select [4]: Interrupted system call (max_fd=5)
	//
	// where [4] is the value of the macro EINTR and "Interrupted system
	// call" is string which according to the Linux manual is "possibly"
	// localised according to LC_MESSAGES.
	$eintr = defined( 'SOCKET_EINTR' ) ? SOCKET_EINTR : 4;
	$eintrMessage = "stream_select(): unable to select [$eintr]";

	// Build a table mapping resource IDs to pipe FDs to work around a
	// PHP 5.3 issue in which stream_select() does not preserve array keys
	// <https://bugs.php.net/bug.php?id=53427>.
	$fds = array();
	foreach ( $pipes as $fd => $pipe ) {
		$fds[(int)$pipe] = $fd;
	}

	while ( true ) {
		$status = proc_get_status( $proc );
		if ( !$status['running'] ) {
			// Keep this $status: it is used after the loop
			break;
		}
		$status = false;

		// stream_select() modifies its first argument, so work on a copy
		$readyPipes = $pipes;

		// Clear last error
		@trigger_error( '' );
		if ( @stream_select( $readyPipes, $emptyArray, $emptyArray, null ) === false ) {
			$error = error_get_last();
			if ( strncmp( $error['message'], $eintrMessage, strlen( $eintrMessage ) ) == 0 ) {
				// Interrupted by a signal: just try again
				continue;
			} else {
				trigger_error( $error['message'], E_USER_WARNING );
				$logMsg = $error['message'];
				break;
			}
		}
		foreach ( $readyPipes as $pipe ) {
			$block = fread( $pipe, 65536 );
			$fd = $fds[(int)$pipe];
			if ( $block === '' ) {
				// End of file
				fclose( $pipes[$fd] );
				unset( $pipes[$fd] );
				if ( !$pipes ) {
					// Nothing left to read from: leave both loops
					break 2;
				}
			} elseif ( $block === false ) {
				// Read error
				$logMsg = "Error reading from pipe";
				break 2;
			} elseif ( $fd == 1 ) {
				// From stdout
				$outBuffer .= $block;
			} elseif ( $fd == 3 ) {
				// From log FD: forward complete lines, keep the unfinished
				// remainder in $logBuffer for the next block.
				// NOTE(review): a remainder without trailing newline is not
				// logged after the loop ends.
				$logBuffer .= $block;
				if ( strpos( $block, "\n" ) !== false ) {
					$lines = explode( "\n", $logBuffer );
					$logBuffer = array_pop( $lines );
					foreach ( $lines as $line ) {
						wfDebugLog( 'exec', $line );
					}
				}
			}
		}
	}

	// Close whatever pipes are still open
	foreach ( $pipes as $pipe ) {
		fclose( $pipe );
	}

	// Use the status previously collected if possible, since proc_get_status()
	// just calls waitpid() which will not return anything useful the second time.
	if ( $status === false ) {
		$status = proc_get_status( $proc );
	}

	// Work out the exit code to report
	if ( $logMsg !== false ) {
		// Read/select error
		$retval = -1;
		proc_close( $proc );
	} elseif ( $status['signaled'] ) {
		$logMsg = "Exited with signal {$status['termsig']}";
		$retval = 128 + $status['termsig'];
		proc_close( $proc );
	} else {
		if ( $status['running'] ) {
			// Still running: proc_close() waits and returns the exit code
			$retval = proc_close( $proc );
		} else {
			$retval = $status['exitcode'];
			proc_close( $proc );
		}
		if ( $retval == 127 ) {
			$logMsg = "Possibly missing executable file";
		} elseif ( $retval >= 129 && $retval <= 192 ) {
			$logMsg = "Probably exited with signal " . ( $retval - 128 );
		}
	}

	if ( $logMsg !== false ) {
		wfDebugLog( 'exec', "$logMsg: $cmd" );
	}

	return $outBuffer;
}
2991
/**
 * Execute a shell command, returning both stdout and stderr. Convenience
 * function, as all the arguments to wfShellExec can become unwieldy.
 *
 * Equivalent to calling wfShellExec() with the 'duplicateStderr' option set.
 *
 * @note This also includes errors from limit.sh, e.g. if $wgMaxShellFileSize is exceeded.
 * @param string $cmd Command line, properly escaped for shell.
 * @param &$retval null|Mixed optional, will receive the program's exit code.
 *                 (non-zero is usually failure)
 * @param array $environ optional environment variables which should be
 *                 added to the executed command environment.
 * @param array $limits optional array with limits(filesize, memory, time, walltime)
 *                 this overwrites the global wgMaxShell* limits.
 * @return string collected stdout and stderr as a string
 */
function wfShellExecWithStderr( $cmd, &$retval = null, $environ = array(), $limits = array() ) {
	$options = array( 'duplicateStderr' => true );
	return wfShellExec( $cmd, $retval, $environ, $limits, $options );
}
3009
/**
 * Workaround for http://bugs.php.net/bug.php?id=45132
 * escapeshellarg() destroys non-ASCII characters if LANG is not a UTF-8 locale
 *
 * On the first call only, and only when safe_mode is off, LC_CTYPE is set
 * to $wgShellLocale both in the environment and through setlocale().
 */
function wfInitShellLocale() {
	static $done = false;
	global $wgShellLocale;

	if ( $done ) {
		return;
	}
	$done = true;

	if ( wfIniGetBool( 'safe_mode' ) ) {
		return;
	}

	putenv( "LC_CTYPE=$wgShellLocale" );
	setlocale( LC_CTYPE, $wgShellLocale );
}
3026
/**
 * Alias to wfShellWikiCmd(); all arguments are passed through unchanged.
 *
 * @see wfShellWikiCmd()
 */
function wfShellMaintenanceCmd( $script, array $parameters = array(), array $options = array() ) {
	$commandLine = wfShellWikiCmd( $script, $parameters, $options );
	return $commandLine;
}
3034
/**
 * Generate a shell-escaped command line string to run a MediaWiki cli script.
 * Note that $parameters should be a flat array and an option with an argument
 * should consist of two consecutive items in the array (do not use "--option value").
 *
 * The command line consists of the php executable, the optional wrapper,
 * the script and the parameters, each escaped with wfEscapeShellArg() and
 * joined with spaces.
 *
 * @param string $script MediaWiki cli script path
 * @param array $parameters Arguments and options to the script
 * @param array $options Associative array of options:
 *     'php': The path to the php executable (default: $wgPhpCli)
 *     'wrapper': Path to a PHP wrapper to handle the maintenance script
 * @return string The escaped command line
 */
function wfShellWikiCmd( $script, array $parameters = array(), array $options = array() ) {
	global $wgPhpCli;

	// Give site config file a chance to run the script in a wrapper.
	// The caller may likely want to call wfBasename() on $script.
	wfRunHooks( 'wfShellWikiCmd', array( &$script, &$parameters, &$options ) );

	$cmd = array( isset( $options['php'] ) ? $options['php'] : $wgPhpCli );
	if ( isset( $options['wrapper'] ) ) {
		$cmd[] = $options['wrapper'];
	}
	$cmd[] = $script;

	// Escape each parameter for shell
	$escaped = array();
	foreach ( array_merge( $cmd, $parameters ) as $piece ) {
		$escaped[] = wfEscapeShellArg( $piece );
	}

	return implode( " ", $escaped );
}
3059
/**
 * Attempt a three-way merge of three texts by running the diff3 binary
 * configured in $wgDiff3.
 *
 * @param string $old Text passed to diff3 as the middle (old) file
 * @param string $mine Text passed to diff3 as the first file
 * @param string $yours Text passed to diff3 as the third file
 * @param string &$result Receives the output of the "diff3 -a -e --merge" run
 * @return bool True for a clean merge; false if diff3 is not available,
 *   an overlap (conflict) was reported, or the merge output was unexpectedly empty
 */
function wfMerge( $old, $mine, $yours, &$result ) {
	global $wgDiff3;

	# Checking that the binary exists may also protect against code
	# injection in case of broken installations.
	wfSuppressWarnings();
	$haveDiff3 = $wgDiff3 && file_exists( $wgDiff3 );
	wfRestoreWarnings();

	if ( !$haveDiff3 ) {
		wfDebug( "diff3 not found\n" );
		return false;
	}

	# Create one temporary file per text
	$tmpDir = wfTempDir();
	$oldtextName = tempnam( $tmpDir, 'merge-old-' );
	$oldtextFile = fopen( $oldtextName, 'w' );
	$mytextName = tempnam( $tmpDir, 'merge-mine-' );
	$mytextFile = fopen( $mytextName, 'w' );
	$yourtextName = tempnam( $tmpDir, 'merge-your-' );
	$yourtextFile = fopen( $yourtextName, 'w' );

	# NOTE: diff3 issues a warning to stderr if any of the files does not end with
	# a newline character. To avoid this, the trailing whitespace is normalized
	# before the files are written.
	fwrite( $oldtextFile, rtrim( $old ) . "\n" );
	fclose( $oldtextFile );
	fwrite( $mytextFile, rtrim( $mine ) . "\n" );
	fclose( $mytextFile );
	fwrite( $yourtextFile, rtrim( $yours ) . "\n" );
	fclose( $yourtextFile );

	# First pass: any output from --overlap-only is treated as a conflict
	$overlapCmd = wfEscapeShellArg( $wgDiff3 ) . ' -a --overlap-only ' .
		wfEscapeShellArg( $mytextName ) . ' ' .
		wfEscapeShellArg( $oldtextName ) . ' ' .
		wfEscapeShellArg( $yourtextName );
	$pipe = popen( $overlapCmd, 'r' );
	$conflict = (bool)fgets( $pipe, 1024 );
	pclose( $pipe );

	# Second pass: run the merge and slurp everything it prints
	$cmd = wfEscapeShellArg( $wgDiff3 ) . ' -a -e --merge ' .
		wfEscapeShellArg( $mytextName, $oldtextName, $yourtextName );
	$pipe = popen( $cmd, 'r' );
	$result = '';
	while ( true ) {
		$chunk = fread( $pipe, 8192 );
		if ( strlen( $chunk ) == 0 ) {
			break;
		}
		$result .= $chunk;
	}
	pclose( $pipe );

	# Remove the temporary files
	unlink( $mytextName );
	unlink( $oldtextName );
	unlink( $yourtextName );

	# An empty result for non-empty input is treated as a failed merge
	if ( !$conflict && $result === '' && $old !== '' ) {
		wfDebug( "Unexpected null result from diff3. Command: $cmd\n" );
		$conflict = true;
	}

	return !$conflict;
}
3138
/**
 * Returns unified plain-text diff of two texts.
 * Useful for machine processing of diffs.
 *
 * Uses the external program configured in $wgDiff when it exists; otherwise
 * falls back to the PHP Diff class with a UnifiedDiffFormatter.
 *
 * @param string $before The text before the changes.
 * @param string $after The text after the changes.
 * @param string $params Command-line options for the diff command
 *   (passed to the shell unescaped).
 * @return string Unified diff of $before and $after; '' if both texts are identical
 */
function wfDiff( $before, $after, $params = '-u' ) {
	// Compare as strings with ===. A loose == treats numeric-looking texts
	// such as "1e3" and "1000" as equal and would wrongly report no difference.
	if ( (string)$before === (string)$after ) {
		return '';
	}

	global $wgDiff;
	wfSuppressWarnings();
	$haveDiff = $wgDiff && file_exists( $wgDiff );
	wfRestoreWarnings();

	# This check may also protect against code injection in
	# case of broken installations.
	if ( !$haveDiff ) {
		wfDebug( "diff executable not found\n" );
		$diffs = new Diff( explode( "\n", $before ), explode( "\n", $after ) );
		$format = new UnifiedDiffFormatter();
		return $format->format( $diffs );
	}

	# Make temporary files
	$td = wfTempDir();
	$oldtextFile = fopen( $oldtextName = tempnam( $td, 'merge-old-' ), 'w' );
	$newtextFile = fopen( $newtextName = tempnam( $td, 'merge-your-' ), 'w' );

	fwrite( $oldtextFile, $before );
	fclose( $oldtextFile );
	fwrite( $newtextFile, $after );
	fclose( $newtextFile );

	// Get the diff of the two files
	$cmd = "$wgDiff " . $params . ' ' . wfEscapeShellArg( $oldtextName, $newtextName );

	$h = popen( $cmd, 'r' );

	$diff = '';

	do {
		$data = fread( $h, 8192 );
		if ( strlen( $data ) == 0 ) {
			break;
		}
		$diff .= $data;
	} while ( true );

	// Clean up
	pclose( $h );
	unlink( $oldtextName );
	unlink( $newtextName );

	// Kill the --- and +++ lines. They're not useful.
	// The output may be empty or a single line (e.g. when the command fails),
	// so check that each header line exists before inspecting it.
	$diff_lines = explode( "\n", $diff );
	if ( isset( $diff_lines[0] ) && strpos( $diff_lines[0], '---' ) === 0 ) {
		unset( $diff_lines[0] );
	}
	if ( isset( $diff_lines[1] ) && strpos( $diff_lines[1], '+++' ) === 0 ) {
		unset( $diff_lines[1] );
	}

	$diff = implode( "\n", $diff_lines );

	return $diff;
}
3210
/**
 * Require a minimum PHP version, in the spirit of Perl's "use VERSION":
 * an exception is thrown if the running PHP is older than the version given.
 *
 * This is useful for extensions which due to their nature are not kept in sync
 * with releases, and might depend on other versions of PHP than the main code.
 *
 * Note: PHP might die due to parsing errors in some cases before it ever
 * manages to call this function, such is life.
 *
 * @see perldoc -f use
 *
 * @param mixed $req_ver The version to check; can be a string, an integer, or
 *   a float (it is cast to string before comparing)
 * @throws MWException If PHP_VERSION compares lower than $req_ver
 */
function wfUsePHP( $req_ver ) {
	$installed = PHP_VERSION;
	$tooOld = version_compare( $installed, (string)$req_ver, '<' );

	if ( $tooOld ) {
		throw new MWException( "PHP $req_ver required--this is only $installed" );
	}
}
3234
/**
 * Require a minimum MediaWiki version, in the spirit of Perl's "use VERSION":
 * an exception is thrown if $wgVersion is older than the version given.
 *
 * This is useful for extensions which due to their nature are not kept in sync
 * with releases.
 *
 * Note: Due to the behavior of PHP's version_compare() which is used in this
 * function, if you want to allow the 'wmf' development versions add a 'c' (or
 * any single letter other than 'a', 'b' or 'p') as a post-fix to your
 * targeted version number. For example if you wanted to allow any variation
 * of 1.22 use `wfUseMW( '1.22c' )`. Using an 'a' or 'b' instead of 'c' will
 * not result in the same comparison due to the internal logic of
 * version_compare().
 *
 * @see perldoc -f use
 *
 * @param mixed $req_ver The version to check; can be a string, an integer, or
 *   a float (it is cast to string before comparing)
 * @throws MWException If $wgVersion compares lower than $req_ver
 */
function wfUseMW( $req_ver ) {
	global $wgVersion;

	$tooOld = version_compare( $wgVersion, (string)$req_ver, '<' );

	if ( $tooOld ) {
		throw new MWException( "MediaWiki $req_ver required--this is only $wgVersion" );
	}
}
3264
/**
 * Return the final portion of a pathname.
 * Reimplemented because PHP5's "basename()" is buggy with multibyte text.
 * http://bugs.php.net/bug.php?id=33898
 *
 * PHP's basename() only considers '\' a pathchar on Windows and Netware.
 * Here it is always treated as one, as '\s' are not wanted in Unix paths either.
 * Trailing slashes and backslashes are ignored.
 *
 * @param string $path
 * @param string $suffix Suffix to remove if present
 * @return string The last path component, or '' if the pattern does not match
 */
function wfBaseName( $path, $suffix = '' ) {
	// An optional, non-capturing group for the suffix (empty when none was given).
	$suffixPattern = ( $suffix == '' )
		? ''
		: '(?:' . preg_quote( $suffix, '#' ) . ')?';

	$found = array();
	$matched = preg_match( "#([^/\\\\]*?){$suffixPattern}[/\\\\]*$#", $path, $found );

	return $matched ? $found[1] : '';
}
3291
/**
 * Generate a relative path name to the given file.
 * May explode on non-matching case-insensitive paths,
 * funky symlinks, etc.
 *
 * @param string $path Absolute destination path including target filename
 * @param string $from Absolute source path, directory only
 * @return string Path to $path relative to $from, or the normalized $path itself
 *   when the first path components differ
 */
function wfRelativePath( $path, $from ) {
	$sep = DIRECTORY_SEPARATOR;

	// Normalize mixed input on Windows, then trim trailing
	// separators (fix for drive root).
	$path = rtrim( str_replace( '/', $sep, $path ), $sep );
	$from = rtrim( str_replace( '/', $sep, $from ), $sep );

	$pieces = explode( $sep, dirname( $path ) );
	$against = explode( $sep, $from );

	if ( $pieces[0] !== $against[0] ) {
		// Non-matching Windows drive letters?
		// Return a full path.
		return $path;
	}

	// Count how many leading components both paths share.
	$shared = 0;
	$limit = min( count( $pieces ), count( $against ) );
	while ( $shared < $limit && $pieces[$shared] == $against[$shared] ) {
		$shared++;
	}

	// One '..' for every remaining component of $from, followed by the
	// remaining directories of $path and finally the file name.
	$climb = array_pad( array(), count( $against ) - $shared, '..' );
	$relative = array_merge( $climb, array_slice( $pieces, $shared ) );
	$relative[] = wfBaseName( $path );

	return implode( $sep, $relative );
}
3336
/**
 * Convert an arbitrarily-long digit string from one numeric base
 * to another, optionally zero-padding to a minimum column width.
 *
 * Supports base 2 through 36; digit values 10-35 are represented
 * as lowercase letters a-z. Input is case-insensitive.
 *
 * @param string $input Input number
 * @param int $sourceBase Base of the input number
 * @param int $destBase Desired base of the output
 * @param int $pad Minimum number of digits in the output (pad with zeroes)
 * @param bool $lowercase Whether to output in lowercase or uppercase
 * @param string $engine Either "gmp", "bcmath", or "php"; the default "auto"
 *   uses gmp if loaded, else bcmath if loaded, else the pure PHP code
 * @return string|bool The output number as a string, or false on error
 */
function wfBaseConvert( $input, $sourceBase, $destBase, $pad = 1,
	$lowercase = true, $engine = 'auto'
) {
	$digitChars = '0123456789abcdefghijklmnopqrstuvwxyz';
	$input = (string)$input;

	// Both bases must lie within the supported range.
	if ( $sourceBase < 2 || $sourceBase > 36 || $destBase < 2 || $destBase > 36 ) {
		return false;
	}

	// Bases and pad width must be whole numbers.
	if ( $sourceBase != (int)$sourceBase || $destBase != (int)$destBase || $pad != (int)$pad ) {
		return false;
	}

	// Every input character must be a digit of the source base (any letter case).
	$allowed = substr( $digitChars, 0, $sourceBase );
	if ( !preg_match( "/^[" . $allowed . "]+$/i", $input ) ) {
		return false;
	}

	// Lookup tables: digit value => character, and character => digit value.
	$charOf = str_split( $digitChars );
	$valueOf = array_flip( $charOf );

	$auto = ( $engine == 'auto' );

	if ( extension_loaded( 'gmp' ) && ( $auto || $engine == 'gmp' ) ) {
		$result = gmp_strval( gmp_init( $input, $sourceBase ), $destBase );
	} elseif ( extension_loaded( 'bcmath' ) && ( $auto || $engine == 'bcmath' ) ) {
		// Accumulate the value as a decimal string...
		$decimal = '0';
		foreach ( str_split( strtolower( $input ) ) as $char ) {
			$decimal = bcadd( bcmul( $decimal, $sourceBase ), $valueOf[$char] );
		}

		// ...then peel off output digits, least significant first.
		$result = '';
		while ( bccomp( $decimal, 0 ) ) {
			$result .= $charOf[bcmod( $decimal, $destBase )];
			$decimal = bcdiv( $decimal, $destBase, 0 );
		}

		$result = strrev( $result );
	} else {
		$remaining = array();
		foreach ( str_split( strtolower( $input ) ) as $char ) {
			$remaining[] = $valueOf[$char];
		}

		// Repeatedly long-divide the digit list by the destination base;
		// each pass yields one output digit (the remainder) and a shorter
		// quotient, until nothing is left.
		$result = '';
		while ( $remaining ) {
			$carry = 0;
			$quotient = array();

			foreach ( $remaining as $digit ) {
				$carry = $carry * $sourceBase + $digit;

				// Skip leading zeroes of the quotient.
				if ( $quotient || $carry >= $destBase ) {
					$quotient[] = (int)( $carry / $destBase );
				}
				$carry %= $destBase;
			}

			$result .= $charOf[$carry];
			$remaining = $quotient;
		}

		$result = strrev( $result );
	}

	$result = $lowercase ? $result : strtoupper( $result );

	return str_pad( $result, $pad, '0', STR_PAD_LEFT );
}
3442
/**
 * Check the request's user agent against $wgHttpOnlyBlacklist.
 *
 * @return bool False if the User-Agent header matches any regex in
 *   $wgHttpOnlyBlacklist; true otherwise, including when no
 *   User-Agent header is set
 */
function wfHttpOnlySafe() {
	global $wgHttpOnlyBlacklist;

	if ( !isset( $_SERVER['HTTP_USER_AGENT'] ) ) {
		return true;
	}

	$agent = $_SERVER['HTTP_USER_AGENT'];
	foreach ( $wgHttpOnlyBlacklist as $regex ) {
		if ( preg_match( $regex, $agent ) ) {
			return false;
		}
	}

	return true;
}
3459
/**
 * Check if there is sufficient entropy in php's built-in session generation.
 *
 * An entropy source counts as present on Windows with PHP 5.3.3 or later,
 * or when the 'session.entropy_file' ini setting is set; in addition
 * 'session.entropy_length' must be at least 32.
 *
 * @return bool true = there is sufficient entropy
 */
function wfCheckEntropy() {
	$hasSource = wfIsWindows() && version_compare( PHP_VERSION, '5.3.3', '>=' );
	if ( !$hasSource ) {
		$hasSource = (bool)ini_get( 'session.entropy_file' );
	}

	if ( !$hasSource ) {
		return false;
	}

	return intval( ini_get( 'session.entropy_length' ) ) >= 32;
}
3471
/**
 * Override session_id before session startup if php's built-in
 * session generation code is not secure.
 *
 * Does nothing when a session cookie or a session id is already present,
 * or when wfCheckEntropy() reports sufficient entropy.
 */
function wfFixSessionID() {
	// A cookie or session id that is already set means a session exists: abort.
	$haveSession = isset( $_COOKIE[session_name()] ) || session_id();
	if ( $haveSession ) {
		return;
	}

	// PHP's built-in session entropy is enabled if:
	// - entropy_file is set or you're on Windows with php 5.3.3+
	// - AND entropy_length is > 0
	// It is treated as disabled if the entropy length is below 32.
	if ( wfCheckEntropy() ) {
		return;
	}

	// Built-in entropy is missing or insufficient: supply our own session id.
	wfDebug( __METHOD__ . ": PHP's built in entropy is disabled or not sufficient, " .
		"overriding session id generation using our cryptrand source.\n" );
	session_id( MWCryptRand::generateHex( 32 ) );
}
3496
/**
 * Reset the session_id.
 *
 * Uses session_regenerate_id() when wfCheckEntropy() passes and the current
 * cookie's 'secure' flag equals $wgCookieSecure. Otherwise the session is
 * destroyed and set up again under a new id from MWCryptRand, with the
 * $_SESSION contents carried over. Finally the 'ResetSessionID' hook is run
 * with the old and the new id.
 *
 * @since 1.22
 */
function wfResetSessionID() {
	global $wgCookieSecure;

	$previousId = session_id();
	$cookieParams = session_get_cookie_params();
	$canRegenerate = wfCheckEntropy() && $wgCookieSecure == $cookieParams['secure'];

	if ( !$canRegenerate ) {
		// Keep the session data across the destroy/setup cycle.
		$saved = $_SESSION;
		session_destroy();
		wfSetupSession( MWCryptRand::generateHex( 32 ) );
		$_SESSION = $saved;
	} else {
		session_regenerate_id( false );
	}

	wfRunHooks( 'ResetSessionID', array( $previousId, session_id() ) );
}
3516
/**
 * Initialise php session.
 *
 * Installs the configured session handler, sets the session cookie
 * parameters and cache limiter, chooses the session id and starts the
 * session (with warnings suppressed).
 *
 * @param string|bool $sessionId Session id to use; if false (the default),
 *   wfFixSessionID() decides whether an id needs to be set
 */
function wfSetupSession( $sessionId = false ) {
	global $wgSessionsInMemcached, $wgSessionsInObjectCache, $wgCookiePath, $wgCookieDomain,
		$wgCookieSecure, $wgCookieHttpOnly, $wgSessionHandler;

	$useObjectCache = $wgSessionsInObjectCache || $wgSessionsInMemcached;
	if ( $useObjectCache ) {
		ObjectCacheSessionHandler::install();
	} elseif ( $wgSessionHandler && $wgSessionHandler != ini_get( 'session.save_handler' ) ) {
		# Only set this if $wgSessionHandler isn't null and session.save_handler
		# hasn't already been set to the desired value (that causes errors)
		ini_set( 'session.save_handler', $wgSessionHandler );
	}

	$httpOnlySafe = wfHttpOnlySafe() && $wgCookieHttpOnly;

	// Log exactly the values handed to session_set_cookie_params() below.
	$cookieArgs = array( 0, $wgCookiePath, $wgCookieDomain, $wgCookieSecure, $httpOnlySafe );
	wfDebugLog( 'cookie',
		'session_set_cookie_params: "' . implode( '", "', $cookieArgs ) . '"' );

	session_set_cookie_params( 0, $wgCookiePath, $wgCookieDomain, $wgCookieSecure, $httpOnlySafe );
	session_cache_limiter( 'private, must-revalidate' );

	if ( !$sessionId ) {
		wfFixSessionID();
	} else {
		session_id( $sessionId );
	}

	wfSuppressWarnings();
	session_start();
	wfRestoreWarnings();
}
3552
/**
 * Get an object from the precompiled serialized directory.
 *
 * Reads "$IP/serialized/$name" and unserializes its contents.
 *
 * @param string $name File name inside the serialized directory
 * @return mixed The variable on success, false on failure (file missing or empty)
 */
function wfGetPrecompiledData( $name ) {
	global $IP;

	$file = "$IP/serialized/$name";
	if ( !file_exists( $file ) ) {
		return false;
	}

	$blob = file_get_contents( $file );

	return $blob ? unserialize( $blob ) : false;
}
3571
/**
 * Get a cache key.
 *
 * The key is the prefix ($wgCachePrefix, or wfWikiID() if that is false)
 * followed by all arguments, joined with ':'; spaces become underscores.
 *
 * @param varargs Key components
 * @return string
 */
function wfMemcKey( /*... */ ) {
	global $wgCachePrefix;

	$segments = func_get_args();
	$prefix = ( $wgCachePrefix === false ) ? wfWikiID() : $wgCachePrefix;

	return str_replace( ' ', '_', $prefix . ':' . implode( ':', $segments ) );
}
3586
/**
 * Get a cache key for a foreign DB.
 *
 * The key starts with "$db-$prefix" (or just $db when $prefix is empty),
 * followed by the remaining arguments, joined with ':'; spaces become
 * underscores.
 *
 * @param string $db
 * @param string $prefix
 * @param varargs string Further key components
 * @return string
 */
function wfForeignMemcKey( $db, $prefix /*, ... */ ) {
	$tail = implode( ':', array_slice( func_get_args(), 2 ) );
	$head = $prefix ? "$db-$prefix" : $db;

	return str_replace( ' ', '_', $head . ':' . $tail );
}
3604
/**
 * Get an ASCII string identifying this wiki.
 * This is used as a prefix in memcached keys.
 *
 * @return string "$wgDBname-$wgDBprefix" if a table prefix is set, otherwise $wgDBname
 */
function wfWikiID() {
	global $wgDBprefix, $wgDBname;

	return $wgDBprefix ? "$wgDBname-$wgDBprefix" : $wgDBname;
}
3619
/**
 * Split a wiki ID into DB name and table prefix.
 *
 * The ID is split at the first '-'; without one the prefix is ''.
 *
 * @param string $wiki
 *
 * @return array Two elements: DB name, then table prefix
 */
function wfSplitWikiID( $wiki ) {
	return array_pad( explode( '-', $wiki, 2 ), 2, '' );
}
3634
/**
 * Get a Database object.
 *
 * Shortcut for wfGetLB( $wiki )->getConnection( $db, $groups, $wiki ).
 *
 * @param int $db Index of the connection to get. May be DB_MASTER for the
 *   master (for write queries), DB_SLAVE for potentially lagged read
 *   queries, or an integer >= 0 for a particular server.
 *
 * @param mixed $groups Query groups. An array of group names that this query
 *   belongs to. May contain a single string if the query is only
 *   in one group.
 *
 * @param string|bool $wiki The wiki ID, or false for the current wiki
 *
 * Note: multiple calls to wfGetDB(DB_SLAVE) during the course of one request
 * will always return the same object, unless the underlying connection or load
 * balancer is manually destroyed.
 *
 * Note 2: use $this->getDB() in maintenance scripts that may be invoked by
 * updater to ensure that a proper database is being updated.
 *
 * @return DatabaseBase
 */
function &wfGetDB( $db, $groups = array(), $wiki = false ) {
	$loadBalancer = wfGetLB( $wiki );

	return $loadBalancer->getConnection( $db, $groups, $wiki );
}
3660
/**
 * Get a load balancer object.
 *
 * Shortcut for wfGetLBFactory()->getMainLB( $wiki ).
 *
 * @param string|bool $wiki Wiki ID, or false for the current wiki
 * @return LoadBalancer
 */
function wfGetLB( $wiki = false ) {
	$factory = wfGetLBFactory();

	return $factory->getMainLB( $wiki );
}
3670
/**
 * Get the load balancer factory object.
 *
 * Hands back whatever LBFactory::singleton() returns. The function is
 * declared to return by reference, so the call result is returned
 * directly rather than through a local variable.
 *
 * @return LBFactory
 */
function &wfGetLBFactory() {
	return LBFactory::singleton();
}
3679
/**
 * Find a file.
 * Shortcut for RepoGroup::singleton()->findFile()
 *
 * @param string|Title $title Title string or Title object
 * @param array $options Associative array of options:
 *   time: requested time for an archived image, or false for the
 *     current version. An image object will be returned which was
 *     created at the specified time.
 *
 *   ignoreRedirect: If true, do not follow file redirects
 *
 *   private: If true, return restricted (deleted) files if the current
 *     user is allowed to view them. Otherwise, such files will not
 *     be found.
 *
 *   bypassCache: If true, do not use the process-local cache of File objects
 *
 * @return File|bool File, or false if the file does not exist
 */
function wfFindFile( $title, $options = array() ) {
	$repoGroup = RepoGroup::singleton();

	return $repoGroup->findFile( $title, $options );
}
3703
/**
 * Get an object referring to a locally registered file.
 * Returns a valid placeholder object if the file does not exist.
 *
 * Shortcut for RepoGroup::singleton()->getLocalRepo()->newFile().
 *
 * @param Title|string $title
 * @return LocalFile|null A File, or null if passed an invalid Title
 */
function wfLocalFile( $title ) {
	$localRepo = RepoGroup::singleton()->getLocalRepo();

	return $localRepo->newFile( $title );
}
3714
/**
 * Should low-performance queries be disabled?
 *
 * True when $wgMiserMode is on, or when the site statistics exceed all of
 * 100000 pages, 1000000 edits and 10000 users.
 *
 * @return bool
 * @codeCoverageIgnore
 */
function wfQueriesMustScale() {
	global $wgMiserMode;

	if ( $wgMiserMode ) {
		return true;
	}

	return SiteStats::pages() > 100000
		&& SiteStats::edits() > 1000000
		&& SiteStats::users() > 10000;
}
3728
/**
 * Get the path to a specified script file, respecting file
 * extensions; this is a wrapper around $wgScriptExtension etc.
 * except for 'index' and 'load' which use $wgScript/$wgLoadScript
 *
 * @param string $script Script filename, sans extension
 * @return string
 */
function wfScript( $script = 'index' ) {
	global $wgScriptPath, $wgScriptExtension, $wgScript, $wgLoadScript;

	if ( $script === 'index' ) {
		return $wgScript;
	}

	if ( $script === 'load' ) {
		return $wgLoadScript;
	}

	return "{$wgScriptPath}/{$script}{$wgScriptExtension}";
}
3747
/**
 * Get the script URL.
 *
 * @return string $_SERVER['SCRIPT_NAME'] if it is set, otherwise $_SERVER['URL']
 */
function wfGetScriptUrl() {
	# Background, from the original comment: some sites use Apache rewrite
	# rules to handle subdomains, and have PHP set up in a weird way that
	# causes PHP_SELF to contain the rewritten URL instead of the one that
	# the outside world sees; mod_rewrite provides SCRIPT_URL containing the
	# "before" URL.
	# NOTE(review): that comment talks about PHP_SELF and SCRIPT_URL, but the
	# code reads SCRIPT_NAME - confirm which variable is intended.
	return isset( $_SERVER['SCRIPT_NAME'] )
		? $_SERVER['SCRIPT_NAME']
		: $_SERVER['URL'];
}
3770
/**
 * Convenience function converts boolean values into "true"
 * or "false" (string) values
 *
 * @param bool $value Any value; it is tested for truthiness
 * @return string 'true' or 'false'
 */
function wfBoolToStr( $value ) {
	if ( $value ) {
		return 'true';
	}

	return 'false';
}
3781
/**
 * Get a platform-independent path to the null file, e.g. /dev/null
 *
 * @return string 'NUL' when wfIsWindows() is true, otherwise '/dev/null'
 */
function wfGetNull() {
	if ( wfIsWindows() ) {
		return 'NUL';
	}

	return '/dev/null';
}
3790
/**
 * Modern version of wfWaitForSlaves(). Instead of looking at replication lag
 * and waiting for it to go down, this waits for the slaves to catch up to the
 * master position. Use this when updating very large numbers of rows, as
 * in maintenance scripts, to avoid causing too much lag. Of course, this is
 * a no-op if there are no slaves.
 *
 * @param int|bool $maxLag (deprecated; not used by this function)
 * @param mixed $wiki Wiki identifier accepted by wfGetLB
 * @param string|bool $cluster Cluster name accepted by LBFactory. Default: false.
 */
function wfWaitForSlaves( $maxLag = false, $wiki = false, $cluster = false ) {
	$lb = ( $cluster !== false )
		? wfGetLBFactory()->getExternalLB( $cluster )
		: wfGetLB( $wiki );

	// bug 27975 - Don't try to wait for slaves if there are none
	// Prevents permission error when getting master position
	if ( $lb->getServerCount() <= 1 ) {
		return;
	}

	$pos = $lb->getConnection( DB_MASTER, array(), $wiki )->getMasterPos();

	// The DBMS may not support getMasterPos() or the whole
	// load balancer might be fake (e.g. $wgAllDBsAreLocalhost).
	if ( $pos !== false ) {
		$lb->waitForAll( $pos );
	}
}
3821
/**
 * Count down from $n to zero on the terminal, with a one-second pause
 * between showing each number. For use in command-line scripts.
 *
 * Each number after the first is preceded by backspace characters that
 * cover the previously printed number; a newline is printed at the end.
 *
 * @codeCoverageIgnore
 * @param int $n
 */
function wfCountDown( $n ) {
	$i = $n;
	while ( $i >= 0 ) {
		if ( $i != $n ) {
			// Back up over the previous number ($i + 1).
			echo str_repeat( "\x08", strlen( $i + 1 ) );
		}
		echo $i;
		flush();

		// No pause after the final zero.
		if ( $i ) {
			sleep( 1 );
		}
		$i--;
	}
	echo "\n";
}
3841
/**
 * Replace all invalid characters with -
 * Additional characters can be defined in $wgIllegalFileChars (see bug 20489)
 * By default, $wgIllegalFileChars = ':'
 *
 * The name is first reduced to its last path component with wfBaseName().
 *
 * @param mixed $name Filename to process
 * @return string
 */
function wfStripIllegalFilenameChars( $name ) {
	global $wgIllegalFileChars;

	// Optional extra alternative matching the configured illegal characters.
	$extraClass = $wgIllegalFileChars ? "|[" . $wgIllegalFileChars . "]" : '';

	$baseName = wfBaseName( $name );
	$pattern = "/[^" . Title::legalChars() . "]" . $extraClass . "/";

	return preg_replace( $pattern, '-', $baseName );
}
3861
/**
 * Set PHP's memory limit to the larger of php.ini or $wgMemoryLimit;
 *
 * A value of -1 on either side means "no limit": if php.ini already has no
 * limit nothing is changed, and if $wgMemoryLimit is -1 the limit is removed.
 *
 * @return int Value memory was set to.
 */
function wfMemoryLimit() {
	global $wgMemoryLimit;

	$memlimit = wfShorthandToInteger( ini_get( 'memory_limit' ) );
	if ( $memlimit == -1 ) {
		// PHP is already unlimited.
		return $memlimit;
	}

	$conflimit = wfShorthandToInteger( $wgMemoryLimit );
	if ( $conflimit == -1 ) {
		$message = "Removing PHP's memory limit\n";
	} elseif ( $conflimit > $memlimit ) {
		$message = "Raising PHP's memory limit to $conflimit bytes\n";
	} else {
		// The configured limit is not larger; leave php.ini's value alone.
		return $memlimit;
	}

	wfDebug( $message );
	wfSuppressWarnings();
	ini_set( 'memory_limit', $conflimit );
	wfRestoreWarnings();

	return $conflimit;
}
3888
/**
 * Converts shorthand byte notation to integer form
 *
 * The integer value of the string is multiplied by 1024 once for a trailing
 * 'k'/'K', twice for 'm'/'M' and three times for 'g'/'G'.
 *
 * @param string $string
 * @return int The value, or -1 if the trimmed string is empty
 */
function wfShorthandToInteger( $string = '' ) {
	// Number of times to multiply by 1024, keyed by the unit suffix.
	$powers = array(
		'k' => 1, 'K' => 1,
		'm' => 2, 'M' => 2,
		'g' => 3, 'G' => 3,
	);

	$string = trim( $string );
	if ( $string === '' ) {
		return -1;
	}

	$unit = $string[strlen( $string ) - 1];
	$val = intval( $string );

	if ( isset( $powers[$unit] ) ) {
		for ( $step = 0; $step < $powers[$unit]; $step++ ) {
			$val *= 1024;
		}
	}

	return $val;
}
3918
/**
 * Get the normalised IETF language tag
 * See unit test for examples.
 *
 * Casing rules per '-'-separated segment: the first segment is lowercased;
 * a segment following an 'x' segment is lowercased (private use); other
 * two-letter segments are uppercased (ISO 3166 country code); other
 * four-letter segments get an initial capital (ISO 15924 script code);
 * everything else is lowercased.
 *
 * @param string $code The language code.
 * @return string The language code which complying with BCP 47 standards.
 */
function wfBCP47( $code ) {
	$normalised = array();
	$previous = null;

	foreach ( explode( '-', $code ) as $index => $segment ) {
		$lower = strtolower( $segment );
		$length = strlen( $segment );

		if ( $index == 0 ) {
			$normalised[$index] = $lower;
		} elseif ( strtolower( $previous ) == 'x' ) {
			// Private-use segment
			$normalised[$index] = $lower;
		} elseif ( $length == 2 ) {
			// ISO 3166 country code
			$normalised[$index] = strtoupper( $segment );
		} elseif ( $length == 4 ) {
			// ISO 15924 script code
			$normalised[$index] = ucfirst( $lower );
		} else {
			$normalised[$index] = $lower;
		}

		$previous = $segment;
	}

	return implode( '-', $normalised );
}
3947
/**
 * Get a cache object.
 *
 * Shortcut for ObjectCache::getInstance().
 *
 * @param int $inputType Cache type, one of the CACHE_* constants.
 * @return BagOStuff
 */
function wfGetCache( $inputType ) {
	$cache = ObjectCache::getInstance( $inputType );

	return $cache;
}
3957
/**
 * Get the main cache object, i.e. the ObjectCache instance
 * for the type configured in $wgMainCacheType.
 *
 * @return BagOStuff
 */
function wfGetMainCache() {
	global $wgMainCacheType;

	$cache = ObjectCache::getInstance( $wgMainCacheType );

	return $cache;
}
3967
/**
 * Get the cache object used by the message cache, i.e. the ObjectCache
 * instance for the type configured in $wgMessageCacheType.
 *
 * @return BagOStuff
 */
function wfGetMessageCacheStorage() {
	global $wgMessageCacheType;

	$cache = ObjectCache::getInstance( $wgMessageCacheType );

	return $cache;
}
3977
/**
 * Get the cache object used by the parser cache, i.e. the ObjectCache
 * instance for the type configured in $wgParserCacheType.
 *
 * @return BagOStuff
 */
function wfGetParserCacheStorage() {
	global $wgParserCacheType;

	$cache = ObjectCache::getInstance( $wgParserCacheType );

	return $cache;
}
3987
/**
 * Get the cache object used by the language converter, i.e. the ObjectCache
 * instance for the type configured in $wgLanguageConverterCacheType.
 *
 * @return BagOStuff
 */
function wfGetLangConverterCacheStorage() {
	global $wgLanguageConverterCacheType;

	$cache = ObjectCache::getInstance( $wgLanguageConverterCacheType );

	return $cache;
}
3997
/**
 * Call hook functions defined in $wgHooks
 *
 * Shortcut for Hooks::run().
 *
 * @param string $event Event name
 * @param array $args Parameters passed to hook functions
 * @param string|null $deprecatedVersion Optionally mark hook as deprecated with version number
 *
 * @return bool True if no handler aborted the hook
 */
function wfRunHooks( $event, array $args = array(), $deprecatedVersion = null ) {
	$notAborted = Hooks::run( $event, $args, $deprecatedVersion );

	return $notAborted;
}
4010
/**
 * Wrapper around php's unpack.
 *
 * @param string $format The format string (See php's docs)
 * @param string $data A binary string of binary data
 * @param int|bool $length The minimum length of $data. This is to
 *   prevent reading beyond the end of $data. false to disable the check.
 *
 * Also be careful when using this function to read unsigned 32 bit integer
 * because php might make it negative.
 *
 * @throws MWException if $data not long enough, or if unpack fails
 * @return array Associative array of the extracted data
 */
function wfUnpack( $format, $data, $length = false ) {
	// Optional guard against reading past the end of $data.
	if ( $length !== false ) {
		$realLen = strlen( $data );
		if ( $realLen < $length ) {
			$message = "Tried to use wfUnpack on a "
				. "string of length $realLen, but needed one "
				. "of at least length $length.";
			throw new MWException( $message );
		}
	}

	// unpack() reports bad input via warnings; silence them and
	// check the return value instead.
	wfSuppressWarnings();
	$unpacked = unpack( $format, $data );
	wfRestoreWarnings();

	if ( $unpacked === false ) {
		// If it cannot extract the packed data.
		throw new MWException( "unpack could not unpack binary data" );
	}

	return $unpacked;
}
4046
/**
 * Determine if an image exists on the 'bad image list'.
 *
 * The format of MediaWiki:Bad_image_list is as follows:
 *    * Only list items (lines starting with "*") are considered
 *    * The first link on a line must be a link to a bad image
 *    * Any subsequent links on the same line are considered to be exceptions,
 *      i.e. articles where the image may occur inline.
 *
 * The parsed site list (used when $blacklist is null) is kept in a static
 * variable and reused by later calls; an explicitly passed $blacklist is
 * parsed on every call and never cached.
 *
 * @param string $name The image name to check
 * @param Title|bool $contextTitle The page on which the image occurs, if known
 * @param string|null $blacklist Wikitext of a file blacklist, or null to use
 *   the 'bad_image_list' message in the content language
 * @return bool True if the image is listed as bad and the context page (if
 *   any) is not among its exceptions; or whatever a 'BadImage' hook handler
 *   decided when it aborted the hook
 */
function wfIsBadImage( $name, $contextTitle = false, $blacklist = null ) {
	static $badImageCache = null; // based on bad_image_list msg
	wfProfileIn( __METHOD__ );

	# Handle redirects
	$redirectTitle = RepoGroup::singleton()->checkRedirect( Title::makeTitle( NS_FILE, $name ) );
	if ( $redirectTitle ) {
		$name = $redirectTitle->getDBkey();
	}

	# Run the extension hook; a handler that aborts it supplies the answer in $bad
	$bad = false;
	if ( !wfRunHooks( 'BadImage', array( $name, &$bad ) ) ) {
		wfProfileOut( __METHOD__ );
		return $bad;
	}

	# Only the site-wide list may be cached, a caller-supplied list never is
	$cacheable = ( $blacklist === null );
	if ( $cacheable && $badImageCache !== null ) {
		$badImages = $badImageCache;
	} else { // cache miss
		if ( $blacklist === null ) {
			$blacklist = wfMessage( 'bad_image_list' )->inContentLanguage()->plain(); // site list
		}
		# Build the list now: image DB key => array( exception page key => true )
		$badImages = array();
		$lines = explode( "\n", $blacklist );
		foreach ( $lines as $line ) {
			# List items only
			if ( substr( $line, 0, 1 ) !== '*' ) {
				continue;
			}

			# Find all links
			$m = array();
			if ( !preg_match_all( '/\[\[:?(.*?)\]\]/', $line, $m ) ) {
				continue;
			}

			$exceptions = array();
			$imageDBkey = false;
			foreach ( $m[1] as $i => $titleText ) {
				$title = Title::newFromText( $titleText );
				if ( !is_null( $title ) ) {
					if ( $i == 0 ) {
						# First link on the line names the bad image itself
						$imageDBkey = $title->getDBkey();
					} else {
						# Every further link is a page where the image is allowed
						$exceptions[$title->getPrefixedDBkey()] = true;
					}
				}
			}

			if ( $imageDBkey !== false ) {
				$badImages[$imageDBkey] = $exceptions;
			}
		}
		if ( $cacheable ) {
			$badImageCache = $badImages;
		}
	}

	$contextKey = $contextTitle ? $contextTitle->getPrefixedDBkey() : false;
	# Exceptions can only apply when the context page is known. Do not use the
	# "false" placeholder as an array key: PHP casts it to 0, which is the same
	# key an exception for a page titled "0" is stored under, so such an image
	# would wrongly be reported as allowed everywhere the context is unknown.
	$bad = isset( $badImages[$name] )
		&& ( $contextKey === false || !isset( $badImages[$name][$contextKey] ) );
	wfProfileOut( __METHOD__ );
	return $bad;
}
4127
/**
 * Decide whether a client connecting from the given source IP is likely
 * to be able to reach the wiki over HTTPS.
 *
 * The answer defaults to true; handlers of the 'CanIPUseHTTPS' hook receive
 * it by reference and may change it.
 *
 * @param string $ip The IPv4/6 address in the normal human-readable form
 * @return bool
 */
function wfCanIPUseHTTPS( $ip ) {
	$httpsCapable = true;
	wfRunHooks( 'CanIPUseHTTPS', array( $ip, &$httpsCapable ) );

	// Handlers may have stored any value; normalise it to a real boolean
	return (bool)$httpsCapable;
}
4140
/**
 * Get the IP address of the current request, as reported by
 * $wgRequest->getIP().
 *
 * Calling this function logs a deprecation notice.
 *
 * @deprecated in 1.19; call $wgRequest->getIP() directly.
 * @return string
 */
function wfGetIP() {
	global $wgRequest;

	wfDeprecated( __METHOD__, '1.19' );

	$clientIp = $wgRequest->getIP();
	return $clientIp;
}
4153
/**
 * Check whether an IP address belongs to a trusted proxy provider.
 * Useful to tell if X-Forwarded-For data is possibly bogus.
 *
 * The initial verdict comes from wfIsConfiguredProxy(); handlers of the
 * 'IsTrustedProxy' hook receive both the IP and the verdict by reference
 * and may change them.
 *
 * @param string $ip
 * @return bool
 */
function wfIsTrustedProxy( $ip ) {
	// Start from the configured proxy lists, then let hook handlers adjust the result
	$isTrusted = wfIsConfiguredProxy( $ip );
	wfRunHooks( 'IsTrustedProxy', array( &$ip, &$isTrusted ) );

	return $isTrusted;
}
4167
/**
 * Check whether an IP address matches one of the configured proxies.
 *
 * An address matches when it is listed literally in $wgSquidServers or
 * $wgSquidServersNoPurge, or when it falls inside a CIDR block listed in
 * $wgSquidServersNoPurge.
 *
 * @param string $ip
 * @return bool
 * @since 1.23 Supports CIDR ranges in $wgSquidServersNoPurge
 */
function wfIsConfiguredProxy( $ip ) {
	global $wgSquidServers, $wgSquidServersNoPurge;

	// Quick check: is the address listed literally in either proxy list?
	if ( in_array( $ip, $wgSquidServers ) || in_array( $ip, $wgSquidServersNoPurge ) ) {
		return true;
	}

	// Slightly slower check: does any CIDR block in $wgSquidServersNoPurge contain it?
	foreach ( $wgSquidServersNoPurge as $range ) {
		if ( strpos( $range, '/' ) === false ) {
			// Plain address, already covered by the quick check above
			continue;
		}
		if ( IP::isInRange( $ip, $range ) ) {
			return true;
		}
	}

	return false;
}