Merge "Parser: Refactor parsing of [[File:...|link=...]] syntax for reusability"
[lhc/web/wiklou.git] / includes / actions / RawAction.php
1 <?php
2 /**
3 * Raw page text accessor
4 *
5 * Copyright © 2004 Gabriel Wicke <wicke@wikidev.net>
6 * http://wikidev.net/
7 *
8 * Based on HistoryAction and SpecialExport
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License along
21 * with this program; if not, write to the Free Software Foundation, Inc.,
22 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
23 * http://www.gnu.org/copyleft/gpl.html
24 *
25 * @author Gabriel Wicke <wicke@wikidev.net>
26 * @file
27 */
28
29 use MediaWiki\Logger\LoggerFactory;
30
31 /**
32 * A simple method to retrieve the plain source of an article,
33 * using "action=raw" in the GET request string.
34 *
35 * @ingroup Actions
36 */
class RawAction extends FormlessAction {
	/**
	 * Name of this action, as used in "action=raw".
	 *
	 * @return string
	 */
	public function getName() {
		return 'raw';
	}

	/**
	 * @return bool Always false
	 */
	public function requiresWrite() {
		return false;
	}

	/**
	 * @return bool Always false
	 */
	public function requiresUnblock() {
		return false;
	}

	/**
	 * Send the raw text of the page together with its cache-control and
	 * content-type headers.
	 *
	 * Normal OutputPage rendering is disabled and the text is echoed directly,
	 * so nothing is returned.
	 *
	 * @suppress SecurityCheck-XSS Non html mime type
	 * @throws HttpError 403 when a user JS/CSS/Json config page is requested
	 *  with a non-wikitext content type and no registered user owns it
	 */
	public function onView() {
		$output = $this->getOutput();
		$output->disable();
		$request = $this->getRequest();
		$response = $request->response();
		// Go through the accessor, like the rest of this class, instead of
		// reading the $context property directly.
		$config = $this->getContext()->getConfig();

		if ( !$request->checkUrlExtension() ) {
			return;
		}

		if ( $output->checkLastModified( $this->page->getTouched() ) ) {
			return; // Client cache fresh and headers sent, nothing more to do.
		}

		$contentType = $this->getContentType();

		$maxage = $request->getInt( 'maxage', $config->get( 'SquidMaxage' ) );
		$smaxage = $request->getIntOrNull( 'smaxage' );
		if ( $smaxage === null ) {
			$cdnCacheableTypes = [ 'text/css', 'application/json', 'text/javascript' ];
			if ( in_array( $contentType, $cdnCacheableTypes, true ) ) {
				// CSS/JSON/JS raw content has its own CDN max age configuration.
				// Note: Title::getCdnUrls() includes action=raw for css/json/js
				// pages, so if using the canonical url, this will get HTCP purges.
				$smaxage = intval( $config->get( 'ForcedRawSMaxage' ) );
			} else {
				// No CDN cache for anything else
				$smaxage = 0;
			}
		}

		// Set standard Vary headers so cache varies on cookies and such (T125283)
		$response->header( $output->getVaryHeader() );
		if ( $config->get( 'UseKeyHeader' ) ) {
			$response->header( $output->getKeyHeader() );
		}

		// Output may contain user-specific data;
		// vary generated content for open sessions on private wikis
		$privateCache = !User::isEveryoneAllowed( 'read' ) &&
			( $smaxage == 0 || MediaWiki\Session\SessionManager::getGlobalSession()->isPersistent() );
		// Don't accidentally cache cookies if user is logged in (T55032)
		$privateCache = $privateCache || $this->getUser()->isLoggedIn();
		$mode = $privateCache ? 'private' : 'public';
		$response->header(
			'Cache-Control: ' . $mode . ', s-maxage=' . $smaxage . ', max-age=' . $maxage
		);

		// In the event of user JS, don't allow loading a user JS/CSS/Json
		// subpage that has no registered user associated with, as
		// someone could register the account and take control of the
		// JS/CSS/Json page.
		$title = $this->getTitle();
		if ( $title->isUserConfigPage() && $contentType !== 'text/x-wiki' ) {
			// not using getRootText() as we want this to work
			// even if subpages are disabled.
			$rootPage = strtok( $title->getText(), '/' );
			$userFromTitle = User::newFromName( $rootPage, 'usable' );
			if ( !$userFromTitle || $userFromTitle->getId() === 0 ) {
				// Record the attempt in the "security" log channel before refusing it.
				$elevated = $this->getUser()->isAllowed( 'editinterface' );
				$elevatedText = $elevated ? 'by elevated ' : '';
				$log = LoggerFactory::getInstance( "security" );
				$log->warning(
					"Unsafe JS/CSS/Json $elevatedText" . "load - {user} loaded {title} with {ctype}",
					[
						'user' => $this->getUser()->getName(),
						'title' => $title->getPrefixedDBKey(),
						'ctype' => $contentType,
						'elevated' => $elevated
					]
				);
				$msg = wfMessage( 'unregistered-user-config' );
				throw new HttpError( 403, $msg );
			}
		}

		$response->header( 'Content-type: ' . $contentType . '; charset=UTF-8' );

		$text = $this->getRawText();

		// Don't return a 404 response for CSS or JavaScript;
		// 404s aren't generally cached and it would create
		// extra hits when user CSS/JS are on and the user doesn't
		// have the pages.
		if ( $text === false && $contentType == 'text/x-wiki' ) {
			$response->statusHeader( 404 );
		}

		// Avoid PHP 7.1 warning of passing $this by reference
		$rawAction = $this;
		if ( !Hooks::run( 'RawPageViewBeforeOutput', [ &$rawAction, &$text ] ) ) {
			wfDebug( __METHOD__ . ": RawPageViewBeforeOutput hook broke raw page output.\n" );
		}

		echo $text;
	}

	/**
	 * Get the text that should be returned, or false if the page or revision
	 * was not found.
	 *
	 * The text comes from the message cache when "usemsgcache" is set on a
	 * MediaWiki-namespace title, otherwise from the revision selected by
	 * getOldId(), optionally narrowed to one "section". As a side effect a
	 * Last-modified header is sent when a revision is found. With
	 * "templates=expand" the non-empty text is run through the preprocessor.
	 *
	 * @return string|bool The text, or false if the page, revision or section
	 *  could not be found
	 */
	public function getRawText() {
		global $wgParser;

		$text = false;
		$title = $this->getTitle();
		$request = $this->getRequest();

		// If it's a MediaWiki message we can just hit the message cache
		if ( $request->getBool( 'usemsgcache' ) && $title->getNamespace() == NS_MEDIAWIKI ) {
			// The first "true" is to use the database, the second is to use
			// the content language and the last one is to specify the message
			// key already contains the language in it ("/de", etc.).
			$text = MessageCache::singleton()->get( $title->getDBkey(), true, true, true );
			// If the message doesn't exist, return a blank
			if ( $text === false ) {
				$text = '';
			}
		} else {
			// Get it from the DB
			$rev = Revision::newFromTitle( $title, $this->getOldId() );
			if ( $rev ) {
				$lastmod = wfTimestamp( TS_RFC2822, $rev->getTimestamp() );
				$request->response()->header( "Last-modified: $lastmod" );

				// Public-only due to cache headers
				$content = $rev->getContent();

				if ( $content === null ) {
					// revision not found (or suppressed)
					$text = false;
				} elseif ( !$content instanceof TextContent ) {
					// non-text content
					wfHttpError( 415, "Unsupported Media Type", "The requested page uses the content model `"
						. $content->getModel() . "` which is not supported via this interface." );
					die();
				} else {
					// want a section?
					$section = $request->getIntOrNull( 'section' );
					if ( $section !== null ) {
						$content = $content->getSection( $section );
					}

					if ( $content === null || $content === false ) {
						// section not found (or section not supported, e.g. for JS, JSON, and CSS)
						$text = false;
					} else {
						$text = $content->getNativeData();
					}
				}
			}
		}

		if ( $text !== false && $text !== '' && $request->getRawVal( 'templates' ) === 'expand' ) {
			$text = $wgParser->preprocess(
				$text,
				$title,
				ParserOptions::newFromContext( $this->getContext() )
			);
		}

		return $text;
	}

	/**
	 * Get the ID of the revision that should be used to get the text.
	 *
	 * Starts from the "oldid" request parameter and adjusts it according to
	 * the "direction" parameter ("next", "prev" or "cur").
	 *
	 * @return int The revision ID; 0 when "cur" is requested or no oldid was
	 *  given, -1 when there is no revision in the requested direction
	 */
	public function getOldId() {
		$oldid = $this->getRequest()->getInt( 'oldid' );
		switch ( $this->getRequest()->getText( 'direction' ) ) {
			case 'next':
				# output next revision, or nothing if there isn't one
				$nextid = 0;
				if ( $oldid ) {
					$nextid = $this->getTitle()->getNextRevisionID( $oldid );
				}
				$oldid = $nextid ?: -1;
				break;
			case 'prev':
				# output previous revision, or nothing if there isn't one
				if ( !$oldid ) {
					# get the current revision so we can get the penultimate one
					$oldid = $this->page->getLatest();
				}
				$previd = $this->getTitle()->getPreviousRevisionID( $oldid );
				$oldid = $previd ?: -1;
				break;
			case 'cur':
				$oldid = 0;
				break;
		}

		return $oldid;
	}

	/**
	 * Get the content type to use for the response
	 *
	 * Taken from the "ctype" request parameter, or derived from the legacy
	 * "gen" parameter when "ctype" is empty. Anything that is not on the
	 * whitelist falls back to 'text/x-wiki'.
	 *
	 * @return string One of the whitelisted content types
	 */
	public function getContentType() {
		// Use getRawVal instead of getVal because we only
		// need to match against known strings, there is no
		// storing of localised content or other user input.
		$ctype = $this->getRequest()->getRawVal( 'ctype' );

		if ( $ctype == '' ) {
			// Legacy compatibility
			$gen = $this->getRequest()->getRawVal( 'gen' );
			if ( $gen == 'js' ) {
				$ctype = 'text/javascript';
			} elseif ( $gen == 'css' ) {
				$ctype = 'text/css';
			}
		}

		$allowedCTypes = [
			'text/x-wiki',
			'text/javascript',
			'text/css',
			// FIXME: Should we still allow Zope editing? External editing feature was dropped
			'application/x-zope-edit',
			'application/json'
		];
		// Strict comparison: only an exact string match may pass the whitelist.
		if ( $ctype == '' || !in_array( $ctype, $allowedCTypes, true ) ) {
			$ctype = 'text/x-wiki';
		}

		return $ctype;
	}
}