Don't look for pipes in the root node.
[lhc/web/wiklou.git] / includes / MagicWord.php
index b5a58c2..4698960 100644 (file)
 <?php
 /**
  * File for magic words
- * @package MediaWiki
- * @subpackage Parser
- */
-
-/**
- * private
+ *
+ * See docs/magicword.txt
+ *
+ * @file
+ * @ingroup Parser
  */
-$wgMagicFound = false;
-
-/** Actual keyword to be used is set in Language.php */
-
-$magicWords = array(
-       'MAG_REDIRECT',
-       'MAG_NOTOC',
-       'MAG_START',
-       'MAG_CURRENTMONTH',
-       'MAG_CURRENTMONTHNAME',
-       'MAG_CURRENTMONTHNAMEGEN',
-       'MAG_CURRENTMONTHABBREV',
-       'MAG_CURRENTDAY',
-       'MAG_CURRENTDAY2',
-       'MAG_CURRENTDAYNAME',
-       'MAG_CURRENTYEAR',
-       'MAG_CURRENTTIME',
-       'MAG_NUMBEROFARTICLES',
-       'MAG_SUBST',
-       'MAG_MSG',
-       'MAG_MSGNW',
-       'MAG_NOEDITSECTION',
-       'MAG_END',
-       'MAG_IMG_THUMBNAIL',
-       'MAG_IMG_RIGHT',
-       'MAG_IMG_LEFT',
-       'MAG_IMG_NONE',
-       'MAG_IMG_WIDTH',
-       'MAG_IMG_CENTER',
-       'MAG_INT',
-       'MAG_FORCETOC',
-       'MAG_SITENAME',
-       'MAG_NS',
-       'MAG_LOCALURL',
-       'MAG_LOCALURLE',
-       'MAG_SERVER',
-       'MAG_IMG_FRAMED',
-       'MAG_PAGENAME',
-       'MAG_PAGENAMEE',
-       'MAG_NAMESPACE',
-       'MAG_NAMESPACEE',
-       'MAG_TOC',
-       'MAG_GRAMMAR',
-       'MAG_NOTITLECONVERT',
-       'MAG_NOCONTENTCONVERT',
-       'MAG_CURRENTWEEK',
-       'MAG_CURRENTDOW',
-       'MAG_REVISIONID',
-       'MAG_SCRIPTPATH',
-       'MAG_SERVERNAME',
-       'MAG_NUMBEROFFILES',
-       'MAG_IMG_MANUALTHUMB',
-       'MAG_PLURAL',
-       'MAG_FULLURL',
-       'MAG_FULLURLE',
-       'MAG_LCFIRST',
-       'MAG_UCFIRST',
-       'MAG_LC',
-       'MAG_UC',
-       'MAG_FULLPAGENAME',
-       'MAG_FULLPAGENAMEE',
-       'MAG_RAW',
-       'MAG_SUBPAGENAME',
-       'MAG_SUBPAGENAMEE',
-       'MAG_DISPLAYTITLE',
-       'MAG_TALKSPACE',
-       'MAG_TALKSPACEE',
-       'MAG_SUBJECTSPACE',
-       'MAG_SUBJECTSPACEE',
-       'MAG_TALKPAGENAME',
-       'MAG_TALKPAGENAMEE',
-       'MAG_SUBJECTPAGENAME',
-       'MAG_SUBJECTPAGENAMEE', 
-       'MAG_NUMBEROFUSERS',
-       'MAG_RAWSUFFIX',
-       'MAG_NEWSECTIONLINK',
-       'MAG_NUMBEROFPAGES',
-       'MAG_CURRENTVERSION',
-       'MAG_BASEPAGENAME',
-       'MAG_BASEPAGENAMEE',
-       'MAG_URLENCODE',
-       'MAG_CURRENTTIMESTAMP',
-       'MAG_DIRECTIONMARK',
-       'MAG_LANGUAGE',
-       'MAG_CONTENTLANGUAGE',
-       'MAG_PAGESINNAMESPACE',
-       'MAG_NOGALLERY',
-);
-if ( ! defined( 'MEDIAWIKI_INSTALL' ) )
-       wfRunHooks( 'MagicWordMagicWords', array( &$magicWords ) );
-
-for ( $i = 0; $i < count( $magicWords ); ++$i )
-       define( $magicWords[$i], $i );
-
-$wgVariableIDs = array(
-       MAG_CURRENTMONTH,
-       MAG_CURRENTMONTHNAME,
-       MAG_CURRENTMONTHNAMEGEN,
-       MAG_CURRENTMONTHABBREV,
-       MAG_CURRENTDAY,
-       MAG_CURRENTDAY2,
-       MAG_CURRENTDAYNAME,
-       MAG_CURRENTYEAR,
-       MAG_CURRENTTIME,
-       MAG_NUMBEROFARTICLES,
-       MAG_NUMBEROFFILES,
-       MAG_SITENAME,
-       MAG_SERVER,
-       MAG_SERVERNAME,
-       MAG_SCRIPTPATH,
-       MAG_PAGENAME,
-       MAG_PAGENAMEE,
-       MAG_FULLPAGENAME,
-       MAG_FULLPAGENAMEE,
-       MAG_NAMESPACE,
-       MAG_NAMESPACEE,
-       MAG_CURRENTWEEK,
-       MAG_CURRENTDOW,
-       MAG_REVISIONID,
-       MAG_SUBPAGENAME,
-       MAG_SUBPAGENAMEE,
-       MAG_DISPLAYTITLE,
-       MAG_TALKSPACE,
-       MAG_TALKSPACEE,
-       MAG_SUBJECTSPACE,
-       MAG_SUBJECTSPACEE,
-       MAG_TALKPAGENAME,
-       MAG_TALKPAGENAMEE,
-       MAG_SUBJECTPAGENAME,
-       MAG_SUBJECTPAGENAMEE,
-       MAG_NUMBEROFUSERS,
-       MAG_RAWSUFFIX,
-       MAG_NEWSECTIONLINK,
-       MAG_NUMBEROFPAGES,
-       MAG_CURRENTVERSION,
-       MAG_BASEPAGENAME,
-       MAG_BASEPAGENAMEE,
-       MAG_URLENCODE,
-       MAG_CURRENTTIMESTAMP,
-       MAG_DIRECTIONMARK,
-       MAG_LANGUAGE,
-       MAG_CONTENTLANGUAGE,
-       MAG_PAGESINNAMESPACE,
-);
-if ( ! defined( 'MEDIAWIKI_INSTALL' ) )
-       wfRunHooks( 'MagicWordwgVariableIDs', array( &$wgVariableIDs ) );
 
 /**
  * This class encapsulates "magic words" such as #redirect, __NOTOC__, etc.
  * Usage:
- *     if (MagicWord::get( MAG_REDIRECT )->match( $text ) )
+ *     if (MagicWord::get( 'redirect' )->match( $text ) )
  *
  * Possible future improvements:
  *   * Simultaneous searching for a number of magic words
- *   * $wgMagicWords in shared memory
+ *   * MagicWord::$mObjects in shared memory
  *
  * Please avoid reading the data out of one of these objects and then writing
  * special case code. If possible, add another match()-like function here.
  *
- * @package MediaWiki
+ * To add magic words in an extension, use the LanguageGetMagic hook. For
+ * magic words which are also Parser variables, add a MagicWordwgVariableIDs
+ * hook. Use string keys.
+ *
+ * @ingroup Parser
  */
 class MagicWord {
        /**#@+
@@ -175,10 +32,153 @@ class MagicWord {
         */
        var $mId, $mSynonyms, $mCaseSensitive, $mRegex;
        var $mRegexStart, $mBaseRegex, $mVariableRegex;
-       var $mModified;
+       var $mModified, $mFound;
+
+       static public $mVariableIDsInitialised = false;
+       static public $mVariableIDs = array(
+               'currentmonth',
+               'currentmonth1',
+               'currentmonthname',
+               'currentmonthnamegen',
+               'currentmonthabbrev',
+               'currentday',
+               'currentday2',
+               'currentdayname',
+               'currentyear',
+               'currenttime',
+               'currenthour',
+               'localmonth',
+               'localmonth1',
+               'localmonthname',
+               'localmonthnamegen',
+               'localmonthabbrev',
+               'localday',
+               'localday2',
+               'localdayname',
+               'localyear',
+               'localtime',
+               'localhour',
+               'numberofarticles',
+               'numberoffiles',
+               'numberofedits',
+               'articlepath',
+               'sitename',
+               'server',
+               'servername',
+               'scriptpath',
+               'stylepath',
+               'pagename',
+               'pagenamee',
+               'fullpagename',
+               'fullpagenamee',
+               'namespace',
+               'namespacee',
+               'currentweek',
+               'currentdow',
+               'localweek',
+               'localdow',
+               'revisionid',
+               'revisionday',
+               'revisionday2',
+               'revisionmonth',
+               'revisionmonth1',
+               'revisionyear',
+               'revisiontimestamp',
+               'revisionuser',
+               'subpagename',
+               'subpagenamee',
+               'talkspace',
+               'talkspacee',
+               'subjectspace',
+               'subjectspacee',
+               'talkpagename',
+               'talkpagenamee',
+               'subjectpagename',
+               'subjectpagenamee',
+               'numberofusers',
+               'numberofactiveusers',
+               'numberofpages',
+               'currentversion',
+               'basepagename',
+               'basepagenamee',
+               'currenttimestamp',
+               'localtimestamp',
+               'directionmark',
+               'contentlanguage',
+               'numberofadmins',
+               'numberofviews',
+       );
+
+       /* Array of caching hints for ParserCache */
+       static public $mCacheTTLs = array (
+               'currentmonth' => 86400,
+               'currentmonth1' => 86400,
+               'currentmonthname' => 86400,
+               'currentmonthnamegen' => 86400,
+               'currentmonthabbrev' => 86400,
+               'currentday' => 3600,
+               'currentday2' => 3600,
+               'currentdayname' => 3600,
+               'currentyear' => 86400,
+               'currenttime' => 3600,
+               'currenthour' => 3600,
+               'localmonth' => 86400,
+               'localmonth1' => 86400,
+               'localmonthname' => 86400,
+               'localmonthnamegen' => 86400,
+               'localmonthabbrev' => 86400,
+               'localday' => 3600,
+               'localday2' => 3600,
+               'localdayname' => 3600,
+               'localyear' => 86400,
+               'localtime' => 3600,
+               'localhour' => 3600,
+               'numberofarticles' => 3600,
+               'numberoffiles' => 3600,
+               'numberofedits' => 3600,
+               'currentweek' => 3600,
+               'currentdow' => 3600,
+               'localweek' => 3600,
+               'localdow' => 3600,
+               'numberofusers' => 3600,
+               'numberofactiveusers' => 3600,
+               'numberofpages' => 3600,
+               'currentversion' => 86400,
+               'currenttimestamp' => 3600,
+               'localtimestamp' => 3600,
+               'pagesinnamespace' => 3600,
+               'numberofadmins' => 3600,
+               'numberofviews' => 3600,
+               'numberingroup' => 3600,
+               );
+
+       static public $mDoubleUnderscoreIDs = array(
+               'notoc',
+               'nogallery',
+               'forcetoc',
+               'toc',
+               'noeditsection',
+               'newsectionlink',
+               'nonewsectionlink',
+               'hiddencat',
+               'index',
+               'noindex',
+               'staticredirect',
+               'notitleconvert',
+               'nocontentconvert',
+       );
+
+       static public $mSubstIDs = array(
+               'subst',
+               'safesubst',
+       );
+
+       static public $mObjects = array();
+       static public $mDoubleUnderscoreArray = null;
+
        /**#@-*/
 
-       function MagicWord($id = 0, $syn = '', $cs = false) {
+       function __construct($id = 0, $syn = '', $cs = false) {
                $this->mId = $id;
                $this->mSynonyms = (array)$syn;
                $this->mCaseSensitive = $cs;
@@ -193,18 +193,66 @@ class MagicWord {
         * Factory: creates an object representing an ID
         * @static
         */
-       function &get( $id ) {
-               global $wgMagicWords;
-
-               if ( !is_array( $wgMagicWords ) ) {
-                       throw new MWException( "Incorrect initialisation order, \$wgMagicWords does not exist\n" );
-               }
-               if (!array_key_exists( $id, $wgMagicWords ) ) {
+       static function &get( $id ) {
+               wfProfileIn( __METHOD__ );
+               if ( !isset( self::$mObjects[$id] ) ) {
                        $mw = new MagicWord();
                        $mw->load( $id );
-                       $wgMagicWords[$id] = $mw;
+                       self::$mObjects[$id] = $mw;
+               }
+               wfProfileOut( __METHOD__ );
+               return self::$mObjects[$id];
+       }
+
+       /**
+        * Get an array of parser variable IDs
+        */
+       static function getVariableIDs() {
+               if ( !self::$mVariableIDsInitialised ) {
+                       # Deprecated constant definition hook, available for extensions that need it
+                       $magicWords = array();
+                       wfRunHooks( 'MagicWordMagicWords', array( &$magicWords ) );
+                       foreach ( $magicWords as $word ) {
+                               define( $word, $word );
+                       }
+
+                       # Get variable IDs
+                       wfRunHooks( 'MagicWordwgVariableIDs', array( &self::$mVariableIDs ) );
+                       self::$mVariableIDsInitialised = true;
+               }
+               return self::$mVariableIDs;
+       }
+
+       /**
+        * Get an array of parser substitution modifier IDs
+        */
+       static function getSubstIDs() {
+               return self::$mSubstIDs; 
+       }
+
+       /* Allow external reads of TTL array */
+       static function getCacheTTL($id) {
+               if (array_key_exists($id,self::$mCacheTTLs)) {
+                       return self::$mCacheTTLs[$id];
+               } else {
+                       return -1;
                }
-               return $wgMagicWords[$id];
+       }
+
+       /** Get a MagicWordArray of double-underscore entities */
+       static function getDoubleUnderscoreArray() {
+               if ( is_null( self::$mDoubleUnderscoreArray ) ) {
+                       self::$mDoubleUnderscoreArray = new MagicWordArray( self::$mDoubleUnderscoreIDs );
+               }
+               return self::$mDoubleUnderscoreArray;
+       }
+
+       /**
+        * Clear the self::$mObjects variable
+        * For use in parser tests
+        */
+       public static function clearCache() {
+               self::$mObjects = array();
        }
 
        # Initialises this object with an ID
@@ -212,6 +260,11 @@ class MagicWord {
                global $wgContLang;
                $this->mId = $id;
                $wgContLang->getMagic( $this );
+               if ( !$this->mSynonyms ) {
+                       $this->mSynonyms = array( 'dkjsagfjsgashfajsh' );
+                       #throw new MWException( "Error: invalid magic word '$id'" );
+                       wfDebugLog( 'exception', "Error: invalid magic word '$id'\n" );
+               }
        }
 
        /**
@@ -223,14 +276,14 @@ class MagicWord {
                # This was used for matching "$1" variables, but different uses of the feature will have
                # different restrictions, which should be checked *after* the MagicWord has been matched,
                # not here. - IMSoP
-               
+
                $escSyn = array();
                foreach ( $this->mSynonyms as $synonym )
                        // In case a magic word contains /, like that's going to happen;)
                        $escSyn[] = preg_quote( $synonym, '/' );
                $this->mBaseRegex = implode( '|', $escSyn );
-               
-               $case = $this->mCaseSensitive ? '' : 'i';
+
+               $case = $this->mCaseSensitive ? '' : 'iu';
                $this->mRegex = "/{$this->mBaseRegex}/{$case}";
                $this->mRegexStart = "/^(?:{$this->mBaseRegex})/{$case}";
                $this->mVariableRegex = str_replace( "\\$1", "(.*?)", $this->mRegex );
@@ -257,7 +310,7 @@ class MagicWord {
                if ( $this->mRegex === '' )
                        $this->initRegex();
 
-               return $this->mCaseSensitive ? '' : 'i';
+               return $this->mCaseSensitive ? '' : 'iu';
        }
 
        /**
@@ -285,7 +338,7 @@ class MagicWord {
         * @return bool
         */
        function match( $text ) {
-               return preg_match( $this->getRegex(), $text );
+               return (bool)preg_match( $this->getRegex(), $text );
        }
 
        /**
@@ -293,7 +346,7 @@ class MagicWord {
         * @return bool
         */
        function matchStart( $text ) {
-               return preg_match( $this->getRegexStart(), $text );
+               return (bool)preg_match( $this->getRegexStart(), $text );
        }
 
        /**
@@ -306,14 +359,17 @@ class MagicWord {
                $matches = array();
                $matchcount = preg_match( $this->getVariableStartToEndRegex(), $text, $matches );
                if ( $matchcount == 0 ) {
-                       return NULL;
-               } elseif ( count($matches) == 1 ) {
-                       return $matches[0];
+                       return null;
                } else {
-                       # multiple matched parts (variable match); some will be empty because of synonyms
-                       # the variable will be the second non-empty one so remove any blank elements and re-sort the indices
+                       # multiple matched parts (variable match); some will be empty because of
+                       # synonyms. The variable will be the second non-empty one so remove any
+                       # blank elements and re-sort the indices.
+                       # See also bug 6526
+
                        $matches = array_values(array_filter($matches));
-                       return $matches[1];
+
+                       if ( count($matches) == 1 ) { return $matches[0]; }
+                       else { return $matches[1]; }
                }
        }
 
@@ -323,25 +379,31 @@ class MagicWord {
         * input string, removing all instances of the word
         */
        function matchAndRemove( &$text ) {
-               global $wgMagicFound;
-               $wgMagicFound = false;
-               $text = preg_replace_callback( $this->getRegex(), 'pregRemoveAndRecord', $text );
-               return $wgMagicFound;
+               $this->mFound = false;
+               $text = preg_replace_callback( $this->getRegex(), array( &$this, 'pregRemoveAndRecord' ), $text );
+               return $this->mFound;
        }
 
        function matchStartAndRemove( &$text ) {
-               global $wgMagicFound;
-               $wgMagicFound = false;
-               $text = preg_replace_callback( $this->getRegexStart(), 'pregRemoveAndRecord', $text );
-               return $wgMagicFound;
+               $this->mFound = false;
+               $text = preg_replace_callback( $this->getRegexStart(), array( &$this, 'pregRemoveAndRecord' ), $text );
+               return $this->mFound;
        }
 
+       /**
+        * Used in matchAndRemove()
+        * @private
+        **/
+       function pregRemoveAndRecord( ) {
+               $this->mFound = true;
+               return '';
+       }
 
        /**
         * Replaces the word with something else
         */
        function replace( $replacement, $subject, $limit=-1 ) {
-               $res = preg_replace( $this->getRegex(), wfRegexReplacement( $replacement ), $subject, $limit );
+               $res = preg_replace( $this->getRegex(), StringUtils::escapeRegexReplacement( $replacement ), $subject, $limit );
                $this->mModified = !($res === $subject);
                return $res;
        }
@@ -384,6 +446,10 @@ class MagicWord {
                return $this->mSynonyms[$i];
        }
 
+       function getSynonyms() {
+               return $this->mSynonyms;
+       }
+
        /**
         * Returns true if the last call to replace() or substituteCallback()
         * returned a modified text, otherwise false.
@@ -417,20 +483,252 @@ class MagicWord {
         * lookup in a list of magic words
         */
        function addToArray( &$array, $value ) {
+               global $wgContLang;
                foreach ( $this->mSynonyms as $syn ) {
-                       $array[$syn] = $value;
+                       $array[$wgContLang->lc($syn)] = $value;
                }
        }
+
+       function isCaseSensitive() {
+               return $this->mCaseSensitive;
+       }
+
+       function getId() {
+               return $this->mId;
+       }
 }
 
 /**
- * Used in matchAndRemove()
- * @private
- **/
-function pregRemoveAndRecord( $match ) {
-       global $wgMagicFound;
-       $wgMagicFound = true;
-       return '';
-}
+ * Class for handling an array of magic words
+ * @ingroup Parser
+ */
+class MagicWordArray {
+       var $names = array();
+       var $hash;
+       var $baseRegex, $regex;
+       var $matches;
+
+       function __construct( $names = array() ) {
+               $this->names = $names;
+       }
+
+       /**
+        * Add a magic word by name
+        */
+       public function add( $name ) {
+               $this->names[] = $name;
+               $this->hash = $this->baseRegex = $this->regex = null;
+       }
+
+       /**
+        * Add a number of magic words by name
+        */
+       public function addArray( $names ) {
+               $this->names = array_merge( $this->names, array_values( $names ) );
+               $this->hash = $this->baseRegex = $this->regex = null;
+       }
+
+       /**
+        * Get a 2-d hashtable for this array
+        */
+       function getHash() {
+               if ( is_null( $this->hash ) ) {
+                       global $wgContLang;
+                       $this->hash = array( 0 => array(), 1 => array() );
+                       foreach ( $this->names as $name ) {
+                               $magic = MagicWord::get( $name );
+                               $case = intval( $magic->isCaseSensitive() );
+                               foreach ( $magic->getSynonyms() as $syn ) {
+                                       if ( !$case ) {
+                                               $syn = $wgContLang->lc( $syn );
+                                       }
+                                       $this->hash[$case][$syn] = $name;
+                               }
+                       }
+               }
+               return $this->hash;
+       }
+
+       /**
+        * Get the base regex
+        */
+       function getBaseRegex() {
+               if ( is_null( $this->baseRegex ) ) {
+                       $this->baseRegex = array( 0 => '', 1 => '' );
+                       foreach ( $this->names as $name ) {
+                               $magic = MagicWord::get( $name );
+                               $case = intval( $magic->isCaseSensitive() );
+                               foreach ( $magic->getSynonyms() as $i => $syn ) {
+                                       $group = "(?P<{$i}_{$name}>" . preg_quote( $syn, '/' ) . ')';
+                                       if ( $this->baseRegex[$case] === '' ) {
+                                               $this->baseRegex[$case] = $group;
+                                       } else {
+                                               $this->baseRegex[$case] .= '|' . $group;
+                                       }
+                               }
+                       }
+               }
+               return $this->baseRegex;
+       }
+
+       /**
+        * Get an unanchored regex that does not match parameters
+        */
+       function getRegex() {
+               if ( is_null( $this->regex ) ) {
+                       $base = $this->getBaseRegex();
+                       $this->regex = array( '', '' );
+                       if ( $this->baseRegex[0] !== '' ) {
+                               $this->regex[0] = "/{$base[0]}/iuS";
+                       }
+                       if ( $this->baseRegex[1] !== '' ) {
+                               $this->regex[1] = "/{$base[1]}/S";
+                       }
+               }
+               return $this->regex;
+       }
+
+       /**
+        * Get a regex for matching variables with parameters
+        */
+       function getVariableRegex() {
+               return str_replace( "\\$1", "(.*?)", $this->getRegex() );
+       }
 
-?>
+       /**
+        * Get a regex anchored to the start of the string that does not match parameters
+        */
+       function getRegexStart() {
+               $base = $this->getBaseRegex();
+               $newRegex = array( '', '' );
+               if ( $base[0] !== '' ) {
+                       $newRegex[0] = "/^(?:{$base[0]})/iuS";
+               }
+               if ( $base[1] !== '' ) {
+                       $newRegex[1] = "/^(?:{$base[1]})/S"; 
+               }
+               return $newRegex;
+       }
+
+       /**
+        * Get an anchored regex for matching variables with parameters
+        */
+       function getVariableStartToEndRegex() {
+               $base = $this->getBaseRegex();
+               $newRegex = array( '', '' );
+               if ( $base[0] !== '' ) {
+                       $newRegex[0] = str_replace( "\\$1", "(.*?)", "/^(?:{$base[0]})$/iuS" );
+               }
+               if ( $base[1] !== '' ) {
+                       $newRegex[1] = str_replace( "\\$1", "(.*?)", "/^(?:{$base[1]})$/S" );
+               }
+               return $newRegex;
+       }
+
+       /**
+        * Parse a match array from preg_match
+        * Returns array(magic word ID, parameter value)
+        * If there is no parameter value, that element will be false.
+        */
+       function parseMatch( $m ) {
+               reset( $m );
+               while ( list( $key, $value ) = each( $m ) ) {
+                       if ( $key === 0 || $value === '' ) {
+                               continue;
+                       }
+                       $parts = explode( '_', $key, 2 );
+                       if ( count( $parts ) != 2 ) {
+                               // This shouldn't happen
+                               // continue;
+                               throw new MWException( __METHOD__ . ': bad parameter name' );
+                       }
+                       list( /* $synIndex */, $magicName ) = $parts;
+                       $paramValue = next( $m );
+                       return array( $magicName, $paramValue );
+               }
+               // This shouldn't happen either
+               throw new MWException( __METHOD__.': parameter not found' );
+       }
+
+       /**
+        * Match some text, with parameter capture
+        * Returns an array with the magic word name in the first element and the
+        * parameter in the second element.
+        * Both elements are false if there was no match.
+        */
+       public function matchVariableStartToEnd( $text ) {
+               $regexes = $this->getVariableStartToEndRegex();
+               foreach ( $regexes as $regex ) {
+                       if ( $regex !== '' ) {
+                               $m = false;
+                               if ( preg_match( $regex, $text, $m ) ) {
+                                       return $this->parseMatch( $m );
+                               }
+                       }
+               }
+               return array( false, false );
+       }
+
+       /**
+        * Match some text, without parameter capture
+        * Returns the magic word name, or false if there was no capture
+        */
+       public function matchStartToEnd( $text ) {
+               $hash = $this->getHash();
+               if ( isset( $hash[1][$text] ) ) {
+                       return $hash[1][$text];
+               }
+               global $wgContLang;
+               $lc = $wgContLang->lc( $text );
+               if ( isset( $hash[0][$lc] ) ) {
+                       return $hash[0][$lc];
+               }
+               return false;
+       }
+
+       /**
+        * Returns an associative array, ID => param value, for all items that match
+        * Removes the matched items from the input string (passed by reference)
+        */
+       public function matchAndRemove( &$text ) {
+               $found = array();
+               $regexes = $this->getRegex();
+               foreach ( $regexes as $regex ) {
+                       if ( $regex === '' ) {
+                               continue;
+                       }
+                       preg_match_all( $regex, $text, $matches, PREG_SET_ORDER );
+                       foreach ( $matches as $m ) {
+                               list( $name, $param ) = $this->parseMatch( $m );
+                               $found[$name] = $param;
+                       }
+                       $text = preg_replace( $regex, '', $text );
+               }
+               return $found;
+       }
+
+       /**
+        * Return the ID of the magic word at the start of $text, and remove
+        * the prefix from $text.
+        * Return false if no match found and $text is not modified.
+        * Does not match parameters.
+        */
+       public function matchStartAndRemove( &$text ) {
+               $regexes = $this->getRegexStart();
+               foreach ( $regexes as $regex ) {
+                       if ( $regex === '' ) {
+                               continue;
+                       }
+                       if ( preg_match( $regex, $text, $m ) ) {
+                               list( $id, ) = $this->parseMatch( $m );
+                               if ( strlen( $m[0] ) >= strlen( $text ) ) {
+                                       $text = '';
+                               } else {
+                                       $text = substr( $text, strlen( $m[0] ) );
+                               }
+                               return $id;
+                       }
+               }
+               return false;
+       }
+}