Merge "Add two new debug log groups"
[lhc/web/wiklou.git] / includes / content / TextContent.php
1 <?php
2 /**
3 * Content object implementation for representing flat text.
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
19 *
20 * @since 1.21
21 *
22 * @file
23 * @ingroup Content
24 *
25 * @author Daniel Kinzler
26 */
27
28 /**
29 * Content object implementation for representing flat text.
30 *
31 * TextContent instances are immutable
32 *
33 * @ingroup Content
34 */
class TextContent extends AbstractContent {

	/**
	 * The raw text wrapped by this object. Assigned exactly once, in the
	 * constructor, and never modified afterwards.
	 *
	 * Declared explicitly so that it is not created as a dynamic property
	 * (creating dynamic properties is deprecated as of PHP 8.2). Code outside
	 * this class hierarchy should read the text through getNativeData().
	 *
	 * @var string
	 */
	protected $mText;

	/**
	 * @param string $text The text to wrap. Null and false are tolerated for
	 *  the benefit of sloppy callers: they trigger a warning and are treated
	 *  as the empty string.
	 * @param string $model_id The content model ID, passed on to the parent
	 *  constructor.
	 *
	 * @throws MWException If $text is neither a string, null nor false.
	 */
	public function __construct( $text, $model_id = CONTENT_MODEL_TEXT ) {
		parent::__construct( $model_id );

		if ( $text === null || $text === false ) {
			wfWarn( "TextContent constructed with \$text = " . var_export( $text, true ) . "! "
				. "This may indicate an error in the caller's scope.", 2 );

			$text = '';
		}

		if ( !is_string( $text ) ) {
			throw new MWException( "TextContent expects a string in the constructor." );
		}

		$this->mText = $text;
	}

	/**
	 * Returns this very object rather than a clone.
	 *
	 * @note Mutable subclasses MUST override this to return a copy!
	 *
	 * @return TextContent $this
	 */
	public function copy() {
		// Sharing the instance is safe because TextContent objects are immutable.
		return $this;
	}

	/**
	 * Returns a single-line, truncated version of the text.
	 *
	 * Every newline and carriage return is replaced by a space, then the
	 * result is shortened using the content language's truncate() method.
	 *
	 * @param int $maxlength Maximum length passed to truncate(); negative
	 *  values are clamped to 0.
	 *
	 * @return string
	 */
	public function getTextForSummary( $maxlength = 250 ) {
		global $wgContLang;

		$singleLine = preg_replace( "/[\n\r]/", ' ', $this->getNativeData() );

		return $wgContLang->truncate( $singleLine, max( 0, $maxlength ) );
	}

	/**
	 * Returns the text's size in bytes.
	 *
	 * @return int The size
	 */
	public function getSize() {
		return strlen( $this->getNativeData() );
	}

	/**
	 * Returns true if this content is not a redirect, and $wgArticleCountMethod
	 * is "any".
	 *
	 * @param bool $hasLinks If it is known whether this content contains links,
	 *  provide this information here, to avoid redundant parsing to find out.
	 *  This implementation does not use the value.
	 *
	 * @return bool
	 */
	public function isCountable( $hasLinks = null ) {
		global $wgArticleCountMethod;

		// Check the redirect status first, exactly as before, so that the
		// global setting is only consulted for non-redirects.
		return !$this->isRedirect() && $wgArticleCountMethod === 'any';
	}

	/**
	 * Returns the text represented by this Content object, as a string.
	 *
	 * @return string The raw text.
	 */
	public function getNativeData() {
		return $this->mText;
	}

	/**
	 * Returns the text to be used for search indexing, which for this
	 * implementation is simply the raw text.
	 *
	 * @return string The raw text.
	 */
	public function getTextForSearchIndex() {
		return $this->getNativeData();
	}

	/**
	 * Attempts to convert this content object to wikitext, and returns the
	 * resulting text string. The conversion may be lossy.
	 *
	 * @note This allows any text-based content to be transcluded as if it was wikitext.
	 *
	 * @return string|bool The raw text, or false if the conversion failed.
	 */
	public function getWikitextForTransclusion() {
		$wikitext = $this->convert( CONTENT_MODEL_WIKITEXT, 'lossy' );

		// convert() yields false when no conversion is possible.
		return $wikitext ? $wikitext->getNativeData() : false;
	}

	/**
	 * Returns a Content object with pre-save transformations applied.
	 * This implementation just trims trailing whitespace.
	 *
	 * If trimming changes nothing, this object itself is returned. Otherwise a
	 * new instance of the same class is created, carrying the same content
	 * model as this object.
	 *
	 * @param Title $title
	 * @param User $user
	 * @param ParserOptions $popts
	 *
	 * @return Content
	 */
	public function preSaveTransform( Title $title, User $user, ParserOptions $popts ) {
		$text = $this->getNativeData();
		$pst = rtrim( $text );

		if ( $text === $pst ) {
			return $this;
		}

		// Hand the model on explicitly: without it a TextContent constructed
		// with a non-default model would silently fall back to the default
		// model of the constructor. Subclasses whose constructor only accepts
		// the text simply ignore the extra argument.
		return new static( $pst, $this->getModel() );
	}

	/**
	 * Diff this content object with another content object.
	 *
	 * @since 1.21
	 *
	 * @param Content $that The other content object to compare this content
	 *  object to. Its model is checked with checkModelID() before diffing.
	 * @param Language $lang The language object to use for text segmentation.
	 *  If not given, $wgContLang is used.
	 *
	 * @return Diff A diff representing the changes that would have to be
	 *  made to this content object to make it equal to $that.
	 */
	public function diff( Content $that, Language $lang = null ) {
		global $wgContLang;

		$this->checkModelID( $that->getModel() );

		// @todo could implement this in DifferenceEngine and just delegate here?

		if ( !$lang ) {
			$lang = $wgContLang;
		}

		# Note: Use native PHP diff, external engines don't give us abstract output
		$oldLines = explode( "\n", $lang->segmentForDiff( $this->getNativeData() ) );
		$newLines = explode( "\n", $lang->segmentForDiff( $that->getNativeData() ) );

		return new Diff( $oldLines, $newLines );
	}

	/**
	 * Returns a generic ParserOutput object, wrapping the HTML returned by
	 * getHtml().
	 *
	 * If this content's model is listed in $wgTextModelsToParse, the text is
	 * additionally run through the parser; the text of the resulting
	 * ParserOutput is then still replaced by the output of getHtml().
	 *
	 * @param Title $title Context title for parsing
	 * @param int $revId Revision ID (for {{REVISIONID}})
	 * @param ParserOptions $options Parser options. If omitted, canonical
	 *  options are obtained from the content handler.
	 * @param bool $generateHtml Whether or not to generate HTML. If false, the
	 *  text of the returned ParserOutput is the empty string.
	 *
	 * @return ParserOutput Representing the HTML form of the text.
	 */
	public function getParserOutput( Title $title, $revId = null,
		ParserOptions $options = null, $generateHtml = true ) {
		global $wgParser, $wgTextModelsToParse;

		if ( !$options ) {
			// NOTE: use canonical options per default to produce cacheable output
			$options = $this->getContentHandler()->makeParserOptions( 'canonical' );
		}

		// Model IDs are strings, so compare strictly to rule out type juggling.
		if ( in_array( $this->getModel(), $wgTextModelsToParse, true ) ) {
			// parse just to get links etc into the database
			$po = $wgParser->parse( $this->getNativeData(), $title, $options, true, true, $revId );
		} else {
			$po = new ParserOutput();
		}

		$po->setText( $generateHtml ? $this->getHtml() : '' );

		return $po;
	}

	/**
	 * Generates an HTML version of the content, for display. Used by
	 * getParserOutput() to construct a ParserOutput object.
	 *
	 * This default implementation just calls getHighlightHtml(). Content
	 * models that have another mapping to HTML (as is the case for markup
	 * languages like wikitext) should override this method to generate the
	 * appropriate HTML.
	 *
	 * @return string An HTML representation of the content
	 */
	protected function getHtml() {
		return $this->getHighlightHtml();
	}

	/**
	 * Generates a syntax-highlighted version of the content, as HTML.
	 * Used by the default implementation of getHtml().
	 *
	 * No highlighting is performed yet: the raw text is merely escaped with
	 * htmlspecialchars().
	 *
	 * @return string An HTML representation of the content's markup
	 */
	protected function getHighlightHtml() {
		# TODO: make Highlighter interface, use highlighter here, if available
		return htmlspecialchars( $this->getNativeData() );
	}

	/**
	 * This implementation provides lossless conversion between content models based
	 * on TextContent.
	 *
	 * The parent implementation is tried first. Only if it returns false, and
	 * the handler of the target model is a TextContentHandler, is the raw text
	 * handed to that handler's unserializeContent().
	 *
	 * @param string $toModel The ID of the content model to convert to.
	 * @param string $lossy Passed through to the parent implementation;
	 *  getWikitextForTransclusion() passes 'lossy' here.
	 *
	 * @return Content|bool The converted content, or false if neither the
	 *  parent implementation nor the text-based fallback applies.
	 *
	 * @see Content::convert()
	 */
	public function convert( $toModel, $lossy = '' ) {
		$converted = parent::convert( $toModel, $lossy );

		if ( $converted !== false ) {
			return $converted;
		}

		$toHandler = ContentHandler::getForModelID( $toModel );

		if ( $toHandler instanceof TextContentHandler ) {
			// NOTE: ignore content serialization format - it's just text anyway.
			$converted = $toHandler->unserializeContent( $this->getNativeData() );
		}

		return $converted;
	}

}