Merge "More debug diagnostics for upload by URL"
[lhc/web/wiklou.git] / includes / parser / StripState.php
1 <?php
2 /**
3 * Holder for stripped items when parsing wiki markup.
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
19 *
20 * @file
21 * @ingroup Parser
22 */
23
/**
 * Stores the text that strip markers stand for and substitutes it back on request.
 *
 * A marker is the prefix given to the constructor, followed by a key that
 * contains no \x7f byte, followed by Parser::MARKER_SUFFIX. Items are kept in
 * two separate groups, 'nowiki' and 'general', each indexed by marker key.
 *
 * @ingroup Parser
 */
class StripState {
	/** @var string Literal text that every marker of this state starts with */
	protected $prefix;

	/** @var array Map of item type ('nowiki' or 'general') to array( key => replacement text ) */
	protected $data;

	/** @var string PCRE pattern matching one marker; capture group 1 is the marker key */
	protected $regex;

	/** @var string|null Item type in effect while unstripCallback() is running */
	protected $tempType;

	/** @var string|null Key prefix in effect while mergeCallback() is running */
	protected $tempMergePrefix;

	/** @var array Set (key => true) of the markers that are currently being expanded */
	protected $circularRefGuard;

	/** @var int Current nesting depth of marker expansion in unstripCallback() */
	protected $recursionLevel = 0;

	const UNSTRIP_RECURSION_LIMIT = 20;

	/**
	 * @param string $prefix Literal text that starts every marker handled by this object
	 */
	public function __construct( $prefix ) {
		$this->prefix = $prefix;
		$this->data = array(
			'nowiki' => array(),
			'general' => array()
		);
		// The prefix and suffix are literal text (mergeCallback() emits them
		// verbatim), so quote them to keep the pattern valid and literal
		// whatever characters they contain.
		$this->regex = '/' . preg_quote( $prefix, '/' ) . "([^\x7f]+)"
			. preg_quote( Parser::MARKER_SUFFIX, '/' ) . '/';
		$this->circularRefGuard = array();
	}

	/**
	 * Add a nowiki strip item
	 * @param string $marker Complete marker text
	 * @param string $value Text the marker stands for
	 * @throws MWException If $marker does not match the marker pattern
	 */
	public function addNoWiki( $marker, $value ) {
		$this->addItem( 'nowiki', $marker, $value );
	}

	/**
	 * Add a general strip item
	 * @param string $marker Complete marker text
	 * @param string $value Text the marker stands for
	 * @throws MWException If $marker does not match the marker pattern
	 */
	public function addGeneral( $marker, $value ) {
		$this->addItem( 'general', $marker, $value );
	}

	/**
	 * Store $value under the key extracted from $marker.
	 *
	 * @throws MWException If $marker does not match the marker pattern
	 * @param string $type Item type, 'nowiki' or 'general'
	 * @param string $marker Complete marker text
	 * @param string $value Text the marker stands for
	 */
	protected function addItem( $type, $marker, $value ) {
		if ( !preg_match( $this->regex, $marker, $m ) ) {
			throw new MWException( "Invalid marker: $marker" );
		}

		$this->data[$type][$m[1]] = $value;
	}

	/**
	 * Replace the markers of 'general' items in $text with their stored text.
	 *
	 * @param string $text
	 * @return string
	 */
	public function unstripGeneral( $text ) {
		return $this->unstripType( 'general', $text );
	}

	/**
	 * Replace the markers of 'nowiki' items in $text with their stored text.
	 *
	 * @param string $text
	 * @return string
	 */
	public function unstripNoWiki( $text ) {
		return $this->unstripType( 'nowiki', $text );
	}

	/**
	 * Replace the markers of 'general' items, then those of 'nowiki' items.
	 *
	 * @param string $text
	 * @return string
	 */
	public function unstripBoth( $text ) {
		$text = $this->unstripType( 'general', $text );
		$text = $this->unstripType( 'nowiki', $text );
		return $text;
	}

	/**
	 * Replace every marker in $text that has an item of the given type.
	 * Markers without such an item are left in place.
	 *
	 * @param string $type Item type, 'nowiki' or 'general'
	 * @param string $text
	 * @return string
	 */
	protected function unstripType( $type, $text ) {
		// Shortcut: nothing of this type has been stored
		if ( !count( $this->data[$type] ) ) {
			return $text;
		}

		// unstripCallback() re-enters this method for nested markers, so the
		// previous type is saved here and put back afterwards.
		$oldType = $this->tempType;
		$this->tempType = $type;
		$text = preg_replace_callback( $this->regex, array( $this, 'unstripCallback' ), $text );
		$this->tempType = $oldType;
		return $text;
	}

	/**
	 * preg_replace_callback() handler for unstripType().
	 *
	 * @param array $m Match data: $m[0] is the whole marker, $m[1] its key
	 * @return string The stored text with its own markers expanded, an error
	 *  message wrapped in a span when the marker is already being expanded or
	 *  the nesting limit is reached, or the marker itself when no item of the
	 *  current type is stored for it
	 */
	protected function unstripCallback( $m ) {
		$marker = $m[1];
		if ( isset( $this->data[$this->tempType][$marker] ) ) {
			if ( isset( $this->circularRefGuard[$marker] ) ) {
				return '<span class="error">'
					. wfMessage( 'parser-unstrip-loop-warning' )->inContentLanguage()->text()
					. '</span>';
			}
			if ( $this->recursionLevel >= self::UNSTRIP_RECURSION_LIMIT ) {
				return '<span class="error">' .
					wfMessage( 'parser-unstrip-recursion-limit' )
						->numParams( self::UNSTRIP_RECURSION_LIMIT )->inContentLanguage()->text() .
					'</span>';
			}
			// Mark this key as in progress for the duration of the nested expansion
			$this->circularRefGuard[$marker] = true;
			$this->recursionLevel++;
			$ret = $this->unstripType( $this->tempType, $this->data[$this->tempType][$marker] );
			$this->recursionLevel--;
			unset( $this->circularRefGuard[$marker] );
			return $ret;
		} else {
			return $m[0];
		}
	}

	/**
	 * Get a StripState object holding the items whose markers occur in the
	 * given text. Only markers found literally in $text are copied; markers
	 * inside the copied values are not followed.
	 *
	 * @param string $text
	 *
	 * @return StripState
	 */
	public function getSubState( $text ) {
		$subState = new StripState( $this->prefix );

		// A single regex scan always terminates, including on text that holds
		// a stray suffix or a prefix without a well-formed marker behind it.
		if ( !preg_match_all( $this->regex, $text, $matches ) ) {
			return $subState;
		}

		foreach ( $matches[1] as $key ) {
			if ( isset( $this->data['nowiki'][$key] ) ) {
				$subState->data['nowiki'][$key] = $this->data['nowiki'][$key];
			} elseif ( isset( $this->data['general'][$key] ) ) {
				$subState->data['general'][$key] = $this->data['general'][$key];
			}
		}
		return $subState;
	}

	/**
	 * Merge another StripState object into this one. The strip marker keys
	 * will not be preserved. The strings in the $texts array will have their
	 * strip markers rewritten, the resulting array of strings will be returned.
	 *
	 * @param StripState $otherState
	 * @param array $texts
	 * @return array
	 */
	public function merge( $otherState, $texts ) {
		// Every imported key gets the same fresh prefix from Parser::getRandomString()
		$mergePrefix = Parser::getRandomString();

		foreach ( $otherState->data as $type => $items ) {
			foreach ( $items as $key => $value ) {
				$this->data[$type]["$mergePrefix-$key"] = $value;
			}
		}

		// Rewrite the other state's markers in $texts to the keys stored above
		$this->tempMergePrefix = $mergePrefix;
		$texts = preg_replace_callback( $otherState->regex, array( $this, 'mergeCallback' ), $texts );
		$this->tempMergePrefix = null;
		return $texts;
	}

	/**
	 * preg_replace_callback() handler for merge().
	 *
	 * @param array $m Match data: $m[1] is the key used by the other state
	 * @return string Marker of this state carrying the merged key
	 */
	protected function mergeCallback( $m ) {
		$key = $m[1];
		return "{$this->prefix}{$this->tempMergePrefix}-$key" . Parser::MARKER_SUFFIX;
	}

	/**
	 * Remove any strip markers found in the given text.
	 *
	 * @param string $text Input string
	 * @return string
	 */
	public function killMarkers( $text ) {
		return preg_replace( $this->regex, '', $text );
	}
}