displaytitle: reject some CSS if $wgRestrictDisplayTitle set

author MatmaRex <matma.rex@gmail.com>

Wed, 22 May 2013 08:48:14 +0000 (10:48 +0200)

committer MatmaRex <matma.rex@gmail.com>

Fri, 24 May 2013 13:05:37 +0000 (15:05 +0200)
author MatmaRex <matma.rex@gmail.com>
Wed, 22 May 2013 08:48:14 +0000 (10:48 +0200)
committer MatmaRex <matma.rex@gmail.com>
Fri, 24 May 2013 13:05:37 +0000 (15:05 +0200)
diff --git a/includes/DefaultSettings.php b/includes/DefaultSettings.php

index 9221784..173605c 100644 (file)
--- a/includes/DefaultSettings.php
+++ b/includes/DefaultSettings.php
@@ -3497,8 +3497,9 @@ $wgNoFollowDomainExceptions = array();
  $wgAllowDisplayTitle = true;
  
  /**
  $wgAllowDisplayTitle = true;
  
  /**
- * For consistency, restrict DISPLAYTITLE to titles that normalize to the same
- * canonical DB key.
+ * For consistency, restrict DISPLAYTITLE to text that normalizes to the same
+ * canonical DB key. Also disallow some inline CSS rules like display: none;
+ * which can cause the text to be hidden or unselectable.
   */
  $wgRestrictDisplayTitle = true;
  
   */
  $wgRestrictDisplayTitle = true;
  
diff --git a/includes/Sanitizer.php b/includes/Sanitizer.php

index ed01235..b4a1c62 100644 (file)
--- a/includes/Sanitizer.php
+++ b/includes/Sanitizer.php
@@ -813,9 +813,10 @@ class Sanitizer {
         /**
          * Pick apart some CSS and check it for forbidden or unsafe structures.
          * Returns a sanitized string. This sanitized string will have
         /**
          * Pick apart some CSS and check it for forbidden or unsafe structures.
          * Returns a sanitized string. This sanitized string will have
-        * character references and escape sequences decoded, and comments
-        * stripped. If the input is just too evil, only a comment complaining
-        * about evilness will be returned.
+        * character references and escape sequences decoded and comments
+        * stripped (unless it is itself one valid comment, in which case the value
+        * will be passed through). If the input is just too evil, only a comment
+        * complaining about evilness will be returned.
          *
          * Currently URL references, 'expression', 'tps' are forbidden.
          *
          *
          * Currently URL references, 'expression', 'tps' are forbidden.
          *
@@ -856,19 +857,24 @@ class Sanitizer {
                 $value = preg_replace_callback( $decodeRegex,
                         array( __CLASS__, 'cssDecodeCallback' ), $value );
  
                 $value = preg_replace_callback( $decodeRegex,
                         array( __CLASS__, 'cssDecodeCallback' ), $value );
  
-               // Remove any comments; IE gets token splitting wrong
-               // This must be done AFTER decoding character references and
-               // escape sequences, because those steps can introduce comments
-               // This step cannot introduce character references or escape
-               // sequences, because it replaces comments with spaces rather
-               // than removing them completely.
-               $value = StringUtils::delimiterReplace( '/*', '*/', ' ', $value );
-
-               // Remove anything after a comment-start token, to guard against
-               // incorrect client implementations.
-               $commentPos = strpos( $value, '/*' );
-               if ( $commentPos !== false ) {
-                       $value = substr( $value, 0, $commentPos );
+               // Let the value through if it's nothing but a single comment, to
+               // allow other functions which may reject it to pass some error
+               // message through.
+               if ( !preg_match( '! ^ \s* /\* [^*\\/]* \*/ \s* $ !x', $value ) ) {
+                       // Remove any comments; IE gets token splitting wrong
+                       // This must be done AFTER decoding character references and
+                       // escape sequences, because those steps can introduce comments
+                       // This step cannot introduce character references or escape
+                       // sequences, because it replaces comments with spaces rather
+                       // than removing them completely.
+                       $value = StringUtils::delimiterReplace( '/*', '*/', ' ', $value );
+
+                       // Remove anything after a comment-start token, to guard against
+                       // incorrect client implementations.
+                       $commentPos = strpos( $value, '/*' );
+                       if ( $commentPos !== false ) {
+                               $value = substr( $value, 0, $commentPos );
+                       }
                 }
  
                 // Reject problematic keywords and control characters
                 }
  
                 // Reject problematic keywords and control characters
@@ -932,14 +938,7 @@ class Sanitizer {
                 $decoded = Sanitizer::decodeTagAttributes( $text );
                 $stripped = Sanitizer::validateTagAttributes( $decoded, $element );
  
                 $decoded = Sanitizer::decodeTagAttributes( $text );
                 $stripped = Sanitizer::validateTagAttributes( $decoded, $element );
  
-               $attribs = array();
-               foreach ( $stripped as $attribute => $value ) {
-                       $encAttribute = htmlspecialchars( $attribute );
-                       $encValue = Sanitizer::safeEncodeAttribute( $value );
-
-                       $attribs[] = "$encAttribute=\"$encValue\"";
-               }
-               return count( $attribs ) ? ' ' . implode( ' ', $attribs ) : '';
+               return Sanitizer::safeEncodeTagAttributes( $stripped );
         }
  
         /**
         }
  
         /**
@@ -1139,6 +1138,24 @@ class Sanitizer {
                 return $attribs;
         }
  
                 return $attribs;
         }
  
+       /**
+        * Build a partial tag string (' name="value" name2="value2"') from an
+        * associative array of attribute names and values, e.g. from decodeTagAttributes.
+        * Names go through htmlspecialchars(), values through safeEncodeAttribute().
+        *
+        * @param array $assoc_array Attribute name => attribute value
+        * @return string Leading space plus space-separated pairs, or '' if there are none
+        */
+       public static function safeEncodeTagAttributes( $assoc_array ) {
+               $attribs = array();
+               foreach ( $assoc_array as $attribute => $value ) {
+                       $encAttribute = htmlspecialchars( $attribute );
+                       $encValue = Sanitizer::safeEncodeAttribute( $value );
+
+                       $attribs[] = "$encAttribute=\"$encValue\"";
+               }
+               return count( $attribs ) ? ' ' . implode( ' ', $attribs ) : '';
+       }
+
         /**
          * Pick the appropriate attribute value from a match set from the
          * attribs regex matches.
         /**
          * Pick the appropriate attribute value from a match set from the
          * attribs regex matches.
diff --git a/includes/parser/CoreParserFunctions.php b/includes/parser/CoreParserFunctions.php

index be945f7..375ff2b 100644 (file)
--- a/includes/parser/CoreParserFunctions.php
+++ b/includes/parser/CoreParserFunctions.php
@@ -363,22 +363,43 @@ class CoreParserFunctions {
         static function displaytitle( $parser, $text = '' ) {
                 global $wgRestrictDisplayTitle;
  
         static function displaytitle( $parser, $text = '' ) {
                 global $wgRestrictDisplayTitle;
  
-               #parse a limited subset of wiki markup (just the single quote items)
+               // parse a limited subset of wiki markup (just the single quote items)
                 $text = $parser->doQuotes( $text );
  
                 $text = $parser->doQuotes( $text );
  
-               #remove stripped text (e.g. the UNIQ-QINU stuff) that was generated by tag extensions/whatever
+               // remove stripped text (e.g. the UNIQ-QINU stuff) that was generated by tag extensions/whatever
                 $text = preg_replace( '/' . preg_quote( $parser->uniqPrefix(), '/' ) . '.*?'
                         . preg_quote( Parser::MARKER_SUFFIX, '/' ) . '/', '', $text );
  
                 $text = preg_replace( '/' . preg_quote( $parser->uniqPrefix(), '/' ) . '.*?'
                         . preg_quote( Parser::MARKER_SUFFIX, '/' ) . '/', '', $text );
  
-               #list of disallowed tags for DISPLAYTITLE
-               #these will be escaped even though they are allowed in normal wiki text
+               // list of disallowed tags for DISPLAYTITLE
+               // these will be escaped even though they are allowed in normal wiki text
                 $bad = array( 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'div', 'blockquote', 'ol', 'ul', 'li', 'hr',
                         'table', 'tr', 'th', 'td', 'dl', 'dd', 'caption', 'p', 'ruby', 'rb', 'rt', 'rp', 'br' );
  
                 $bad = array( 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'div', 'blockquote', 'ol', 'ul', 'li', 'hr',
                         'table', 'tr', 'th', 'td', 'dl', 'dd', 'caption', 'p', 'ruby', 'rb', 'rt', 'rp', 'br' );
  
-               #only requested titles that normalize to the actual title are allowed through
-               #if $wgRestrictDisplayTitle is true (it is by default)
-               #mimic the escaping process that occurs in OutputPage::setPageTitle
-               $text = Sanitizer::normalizeCharReferences( Sanitizer::removeHTMLtags( $text, null, array(), array(), $bad ) );
+               // disallow some styles that could be used to bypass $wgRestrictDisplayTitle
+               if ( $wgRestrictDisplayTitle ) {
+                       $htmlTagsCallback = function ( &$params ) { // by reference: result is written back to $params
+                               $decoded = Sanitizer::decodeTagAttributes( $params );
+
+                               if ( isset( $decoded['style'] ) ) {
+                                       // this is called later anyway, but we need it right now for the regexes below to be safe
+                                       // calling it twice doesn't hurt
+                                       $decoded['style'] = Sanitizer::checkCss( $decoded['style'] );
+
+                                       if ( preg_match( '/(display|user-select|visibility)\s*:/i', $decoded['style'] ) ) {
+                                               $decoded['style'] = '/* attempt to bypass $wgRestrictDisplayTitle */';
+                                       }
+                               }
+
+                               $params = Sanitizer::safeEncodeTagAttributes( $decoded );
+                       };
+               } else {
+                       $htmlTagsCallback = null;
+               }
+
+               // only requested titles that normalize to the actual title are allowed through
+               // if $wgRestrictDisplayTitle is true (it is by default)
+               // mimic the escaping process that occurs in OutputPage::setPageTitle
+               $text = Sanitizer::normalizeCharReferences( Sanitizer::removeHTMLtags( $text, $htmlTagsCallback, array(), array(), $bad ) );
                 $title = Title::newFromText( Sanitizer::stripAllTags( $text ) );
  
                 if ( !$wgRestrictDisplayTitle ) {
                 $title = Title::newFromText( Sanitizer::stripAllTags( $text ) );
  
                 if ( !$wgRestrictDisplayTitle ) {
diff --git a/tests/parser/parserTests.txt b/tests/parser/parserTests.txt

index d5e221a..8995593 100644 (file)
--- a/tests/parser/parserTests.txt
+++ b/tests/parser/parserTests.txt
@@ -13289,6 +13289,40 @@ Screen
  </p>
  !! end
  
  </p>
  !! end
  
+!! test
+Verify that displaytitle handles inline CSS styles (bug 26547) - rejected value
+!! options
+showtitle
+title=[[Screen]]
+!! config
+wgAllowDisplayTitle=true
+wgRestrictDisplayTitle=true
+!! input
+this is not the the title
+{{DISPLAYTITLE:<span style="display: none;">s</span>creen}}
+!! result
+<span style="/* attempt to bypass $wgRestrictDisplayTitle */">s</span>creen
+<p>this is not the the title
+</p>
+!! end
+
+!! test
+Verify that displaytitle handles inline CSS styles (bug 26547) - accepted value
+!! options
+showtitle
+title=[[Screen]]
+!! config
+wgAllowDisplayTitle=true
+wgRestrictDisplayTitle=true
+!! input
+this is not the the title
+{{DISPLAYTITLE:<span style="color: red;">s</span>creen}}
+!! result
+<span style="color: red;">s</span>creen
+<p>this is not the the title
+</p>
+!! end
+
  !! test
  preload: check <noinclude> and <includeonly>
  !! options
  !! test
  preload: check <noinclude> and <includeonly>
  !! options
diff --git a/tests/phpunit/includes/SanitizerTest.php b/tests/phpunit/includes/SanitizerTest.php

index b745423..38c15ee 100644 (file)
--- a/tests/phpunit/includes/SanitizerTest.php
+++ b/tests/phpunit/includes/SanitizerTest.php
@@ -227,10 +227,14 @@ class SanitizerTest extends MediaWikiTestCase {
         public static function provideCssCommentsFixtures() {
                 /** array( <expected>, <css>, [message] ) */
                 return array(
         public static function provideCssCommentsFixtures() {
                 /** array( <expected>, <css>, [message] ) */
                 return array(
-                       array( ' ', '/**/' ),
+                       // Valid comments spanning entire input
+                       array( '/**/', '/**/' ),
+                       array( '/* comment */', '/* comment */' ),
+                       // Weird stuff
                         array( ' ', '/****/' ),
                         array( ' ', '/****/' ),
-                       array( ' ', '/* comment */' ),
-                       array( ' ', "\\2f\\2a foo \\2a\\2f",
+                       array( ' ', '/* /* */' ),
+                       array( 'display: block;', "display:/* foo */block;" ),
+                       array( 'display: block;', "display:\\2f\\2a foo \\2a\\2f block;",
                                 'Backslash-escaped comments must be stripped (bug 28450)' ),
                         array( '', '/* unfinished comment structure',
                                 'Remove anything after a comment-start token' ),
                                 'Backslash-escaped comments must be stripped (bug 28450)' ),
                         array( '', '/* unfinished comment structure',
                                 'Remove anything after a comment-start token' ),
author	MatmaRex <matma.rex@gmail.com>
	Wed, 22 May 2013 08:48:14 +0000 (10:48 +0200)
committer	MatmaRex <matma.rex@gmail.com>
	Fri, 24 May 2013 13:05:37 +0000 (15:05 +0200)
includes/DefaultSettings.php		patch \| blob \| history
includes/Sanitizer.php		patch \| blob \| history
includes/parser/CoreParserFunctions.php		patch \| blob \| history
tests/parser/parserTests.txt		patch \| blob \| history
tests/phpunit/includes/SanitizerTest.php		patch \| blob \| history