Merge "maintenance: Document secondary purpose of --server"
[lhc/web/wiklou.git] / includes / specials / SpecialMediaStatistics.php
1 <?php
2 /**
3 * Implements Special:MediaStatistics
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
19 *
20 * @file
21 * @ingroup SpecialPage
22 * @author Brian Wolff
23 */
24
25 use Wikimedia\Rdbms\IResultWrapper;
26 use Wikimedia\Rdbms\IDatabase;
27
28 /**
29 * @ingroup SpecialPage
30 */
31 class MediaStatisticsPage extends QueryPage {
32 protected $totalCount = 0, $totalBytes = 0;
33
34 /**
35 * @var int $totalPerType Combined file size of all files in a section
36 */
37 protected $totalPerType = 0;
38
39 /**
40 * @var int $totalSize Combined file size of all files
41 */
42 protected $totalSize = 0;
43
44 function __construct( $name = 'MediaStatistics' ) {
45 parent::__construct( $name );
46 // Generally speaking there is only a small number of file types,
47 // so just show all of them.
48 $this->limit = 5000;
49 $this->shownavigation = false;
50 }
51
52 public function isExpensive() {
53 return true;
54 }
55
56 /**
57 * Query to do.
58 *
59 * This abuses the query cache table by storing mime types as "titles".
60 *
61 * This will store entries like [[Media:BITMAP;image/jpeg;200;20000]]
62 * where the form is Media type;mime type;count;bytes.
63 *
64 * This relies on the behaviour that when value is tied, the order things
65 * come out of querycache table is the order they went in. Which is hacky.
66 * However, other special pages like Special:Deadendpages and
67 * Special:BrokenRedirects also rely on this.
68 * @return array
69 */
70 public function getQueryInfo() {
71 $dbr = wfGetDB( DB_REPLICA );
72 $fakeTitle = $dbr->buildConcat( [
73 'img_media_type',
74 $dbr->addQuotes( ';' ),
75 'img_major_mime',
76 $dbr->addQuotes( '/' ),
77 'img_minor_mime',
78 $dbr->addQuotes( ';' ),
79 'COUNT(*)',
80 $dbr->addQuotes( ';' ),
81 'SUM( img_size )'
82 ] );
83 return [
84 'tables' => [ 'image' ],
85 'fields' => [
86 'title' => $fakeTitle,
87 'namespace' => NS_MEDIA, /* needs to be something */
88 'value' => '1'
89 ],
90 'options' => [
91 'GROUP BY' => [
92 'img_media_type',
93 'img_major_mime',
94 'img_minor_mime',
95 ]
96 ]
97 ];
98 }
99
100 /**
101 * How to sort the results
102 *
103 * It's important that img_media_type come first, otherwise the
104 * tables will be fragmented.
105 * @return Array Fields to sort by
106 */
107 function getOrderFields() {
108 return [ 'img_media_type', 'count(*)', 'img_major_mime', 'img_minor_mime' ];
109 }
110
111 /**
112 * Output the results of the query.
113 *
114 * @param OutputPage $out
115 * @param Skin $skin (deprecated presumably)
116 * @param IDatabase $dbr
117 * @param IResultWrapper $res Results from query
118 * @param int $num Number of results
119 * @param int $offset Paging offset (Should always be 0 in our case)
120 */
121 protected function outputResults( $out, $skin, $dbr, $res, $num, $offset ) {
122 $prevMediaType = null;
123 foreach ( $res as $row ) {
124 $mediaStats = $this->splitFakeTitle( $row->title );
125 if ( count( $mediaStats ) < 4 ) {
126 continue;
127 }
128 list( $mediaType, $mime, $totalCount, $totalBytes ) = $mediaStats;
129 if ( $prevMediaType !== $mediaType ) {
130 if ( $prevMediaType !== null ) {
131 // We're not at beginning, so we have to
132 // close the previous table.
133 $this->outputTableEnd();
134 }
135 $this->outputMediaType( $mediaType );
136 $this->totalPerType = 0;
137 $this->outputTableStart( $mediaType );
138 $prevMediaType = $mediaType;
139 }
140 $this->outputTableRow( $mime, intval( $totalCount ), intval( $totalBytes ) );
141 }
142 if ( $prevMediaType !== null ) {
143 $this->outputTableEnd();
144 // add total size of all files
145 $this->outputMediaType( 'total' );
146 $this->getOutput()->addWikiText(
147 $this->msg( 'mediastatistics-allbytes' )
148 ->numParams( $this->totalSize )
149 ->sizeParams( $this->totalSize )
150 ->text()
151 );
152 }
153 }
154
155 /**
156 * Output closing </table>
157 */
158 protected function outputTableEnd() {
159 $this->getOutput()->addHTML( Html::closeElement( 'table' ) );
160 $this->getOutput()->addWikiText(
161 $this->msg( 'mediastatistics-bytespertype' )
162 ->numParams( $this->totalPerType )
163 ->sizeParams( $this->totalPerType )
164 ->numParams( $this->makePercentPretty( $this->totalPerType / $this->totalBytes ) )
165 ->text()
166 );
167 $this->totalSize += $this->totalPerType;
168 }
169
170 /**
171 * Output a row of the stats table
172 *
173 * @param string $mime mime type (e.g. image/jpeg)
174 * @param int $count Number of images of this type
175 * @param int $bytes Total space for images of this type
176 */
177 protected function outputTableRow( $mime, $count, $bytes ) {
178 $mimeSearch = SpecialPage::getTitleFor( 'MIMEsearch', $mime );
179 $linkRenderer = $this->getLinkRenderer();
180 $row = Html::rawElement(
181 'td',
182 [],
183 $linkRenderer->makeLink( $mimeSearch, $mime )
184 );
185 $row .= Html::element(
186 'td',
187 [],
188 $this->getExtensionList( $mime )
189 );
190 $row .= Html::rawElement(
191 'td',
192 // Make sure js sorts it in numeric order
193 [ 'data-sort-value' => $count ],
194 $this->msg( 'mediastatistics-nfiles' )
195 ->numParams( $count )
196 /** @todo Check to be sure this really should have number formatting */
197 ->numParams( $this->makePercentPretty( $count / $this->totalCount ) )
198 ->parse()
199 );
200 $row .= Html::rawElement(
201 'td',
202 // Make sure js sorts it in numeric order
203 [ 'data-sort-value' => $bytes ],
204 $this->msg( 'mediastatistics-nbytes' )
205 ->numParams( $bytes )
206 ->sizeParams( $bytes )
207 /** @todo Check to be sure this really should have number formatting */
208 ->numParams( $this->makePercentPretty( $bytes / $this->totalBytes ) )
209 ->parse()
210 );
211 $this->totalPerType += $bytes;
212 $this->getOutput()->addHTML( Html::rawElement( 'tr', [], $row ) );
213 }
214
215 /**
216 * @param float $decimal A decimal percentage (ie for 12.3%, this would be 0.123)
217 * @return String The percentage formatted so that 3 significant digits are shown.
218 */
219 protected function makePercentPretty( $decimal ) {
220 $decimal *= 100;
221 // Always show three useful digits
222 if ( $decimal == 0 ) {
223 return '0';
224 }
225 if ( $decimal >= 100 ) {
226 return '100';
227 }
228 $percent = sprintf( "%." . max( 0, 2 - floor( log10( $decimal ) ) ) . "f", $decimal );
229 // Then remove any trailing 0's
230 return preg_replace( '/\.?0*$/', '', $percent );
231 }
232
233 /**
234 * Given a mime type, return a comma separated list of allowed extensions.
235 *
236 * @param string $mime mime type
237 * @return string Comma separated list of allowed extensions (e.g. ".ogg, .oga")
238 */
239 private function getExtensionList( $mime ) {
240 $exts = MediaWiki\MediaWikiServices::getInstance()->getMimeAnalyzer()
241 ->getExtensionsForType( $mime );
242 if ( $exts === null ) {
243 return '';
244 }
245 $extArray = explode( ' ', $exts );
246 $extArray = array_unique( $extArray );
247 foreach ( $extArray as &$ext ) {
248 $ext = '.' . $ext;
249 }
250
251 return $this->getLanguage()->commaList( $extArray );
252 }
253
254 /**
255 * Output the start of the table
256 *
257 * Including opening <table>, and first <tr> with column headers.
258 * @param string $mediaType
259 */
260 protected function outputTableStart( $mediaType ) {
261 $this->getOutput()->addHTML(
262 Html::openElement(
263 'table',
264 [ 'class' => [
265 'mw-mediastats-table',
266 'mw-mediastats-table-' . strtolower( $mediaType ),
267 'sortable',
268 'wikitable'
269 ] ]
270 )
271 );
272 $this->getOutput()->addHTML( $this->getTableHeaderRow() );
273 }
274
275 /**
276 * Get (not output) the header row for the table
277 *
278 * @return String the header row of the able
279 */
280 protected function getTableHeaderRow() {
281 $headers = [ 'mimetype', 'extensions', 'count', 'totalbytes' ];
282 $ths = '';
283 foreach ( $headers as $header ) {
284 $ths .= Html::rawElement(
285 'th',
286 [],
287 // for grep:
288 // mediastatistics-table-mimetype, mediastatistics-table-extensions
289 // tatistics-table-count, mediastatistics-table-totalbytes
290 $this->msg( 'mediastatistics-table-' . $header )->parse()
291 );
292 }
293 return Html::rawElement( 'tr', [], $ths );
294 }
295
296 /**
297 * Output a header for a new media type section
298 *
299 * @param string $mediaType A media type (e.g. from the MEDIATYPE_xxx constants)
300 */
301 protected function outputMediaType( $mediaType ) {
302 $this->getOutput()->addHTML(
303 Html::element(
304 'h2',
305 [ 'class' => [
306 'mw-mediastats-mediatype',
307 'mw-mediastats-mediatype-' . strtolower( $mediaType )
308 ] ],
309 // for grep
310 // mediastatistics-header-unknown, mediastatistics-header-bitmap,
311 // mediastatistics-header-drawing, mediastatistics-header-audio,
312 // mediastatistics-header-video, mediastatistics-header-multimedia,
313 // mediastatistics-header-office, mediastatistics-header-text,
314 // mediastatistics-header-executable, mediastatistics-header-archive,
315 // mediastatistics-header-3d,
316 $this->msg( 'mediastatistics-header-' . strtolower( $mediaType ) )->text()
317 )
318 );
319 /** @todo Possibly could add a message here explaining what the different types are.
320 * not sure if it is needed though.
321 */
322 }
323
324 /**
325 * parse the fake title format that this special page abuses querycache with.
326 *
327 * @param string $fakeTitle A string formatted as <media type>;<mime type>;<count>;<bytes>
328 * @return array The constituant parts of $fakeTitle
329 */
330 private function splitFakeTitle( $fakeTitle ) {
331 return explode( ';', $fakeTitle, 4 );
332 }
333
334 /**
335 * What group to put the page in
336 * @return string
337 */
338 protected function getGroupName() {
339 return 'media';
340 }
341
342 /**
343 * This method isn't used, since we override outputResults, but
344 * we need to implement since abstract in parent class.
345 *
346 * @param Skin $skin
347 * @param stdClass $result Result row
348 * @return bool|string|void
349 * @throws MWException
350 */
351 public function formatResult( $skin, $result ) {
352 throw new MWException( "unimplemented" );
353 }
354
355 /**
356 * Initialize total values so we can figure out percentages later.
357 *
358 * @param IDatabase $dbr
359 * @param IResultWrapper $res
360 */
361 public function preprocessResults( $dbr, $res ) {
362 $this->executeLBFromResultWrapper( $res );
363 $this->totalCount = $this->totalBytes = 0;
364 foreach ( $res as $row ) {
365 $mediaStats = $this->splitFakeTitle( $row->title );
366 $this->totalCount += isset( $mediaStats[2] ) ? $mediaStats[2] : 0;
367 $this->totalBytes += isset( $mediaStats[3] ) ? $mediaStats[3] : 0;
368 }
369 $res->seek( 0 );
370 }
371 }