Merge "Print chained exceptions when maintenance script fails."
[lhc/web/wiklou.git] / maintenance / refreshExternallinksIndex.php
1 <?php
2 /**
3 * Refresh the externallinks table el_index and el_index_60 from el_to
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
19 *
20 * @file
21 * @ingroup Maintenance
22 */
23
24 require_once __DIR__ . '/Maintenance.php';
25
26 /**
27 * Maintenance script that refreshes the externallinks table el_index and
28 * el_index_60 from el_to
29 *
30 * @ingroup Maintenance
31 * @since 1.33
32 */
class RefreshExternallinksIndex extends LoggedUpdateMaintenance {
	/**
	 * Register the script description and set the default batch size.
	 */
	public function __construct() {
		parent::__construct();
		$this->addDescription(
			'Refresh the externallinks table el_index and el_index_60 from el_to' );
		$this->setBatchSize( 10000 );
	}

	/**
	 * Build the update key for this script.
	 *
	 * The key embeds LinkFilter::VERSION and a +/- flag for whether
	 * LinkFilter::supportsIDN() is true, so a change in either produces a
	 * different key.
	 *
	 * @return string
	 */
	protected function getUpdateKey() {
		return static::class
			. ' v' . LinkFilter::VERSION
			. ( LinkFilter::supportsIDN() ? '+' : '-' ) . 'IDN';
	}

	/**
	 * @return string Message stating that the indexes are already up to date
	 */
	protected function updateSkippedMessage() {
		return 'externallinks table indexes up to date';
	}

	/**
	 * Walk the externallinks table in el_id batches and bring el_index and
	 * el_index_60 in line with what LinkFilter::makeIndexes() yields for el_to.
	 *
	 * Rows for which no index can be generated are deleted. Rows whose
	 * el_index already is one of the generated indexes are left untouched.
	 *
	 * @return bool False if the externallinks table does not exist, true otherwise
	 */
	protected function doDBUpdates() {
		$dbw = $this->getDB( DB_MASTER );
		if ( !$dbw->tableExists( 'externallinks' ) ) {
			$this->error( "externallinks table does not exist" );
			return false;
		}
		$this->output( "Updating externallinks table index fields\n" );

		$minmax = $dbw->selectRow(
			'externallinks',
			[ 'min' => 'MIN(el_id)', 'max' => 'MAX(el_id)' ],
			'',
			__METHOD__
		);

		$updated = 0;
		$deleted = 0;
		if ( $minmax && $minmax->min !== null && $minmax->max !== null ) {
			// Start one below the smallest id because each batch selects el_id > $start.
			$start = $minmax->min - 1;
			$last = $minmax->max;
		} else {
			// MIN()/MAX() are NULL when the table has no rows: nothing to scan.
			// Stated explicitly instead of relying on how PHP compares int with null.
			$start = 0;
			$last = 0;
		}

		while ( $start < $last ) {
			$end = min( $start + $this->mBatchSize, $last );
			$this->output( "el_id $start - $end of $last\n" );
			$res = $dbw->select( 'externallinks', [ 'el_id', 'el_to', 'el_index' ],
				[
					"el_id > $start",
					"el_id <= $end",
				],
				__METHOD__,
				[ 'ORDER BY' => 'el_id' ]
			);
			foreach ( $res as $row ) {
				$newIndexes = LinkFilter::makeIndexes( $row->el_to );
				if ( !$newIndexes ) {
					// No index can be generated for this el_to, so drop the row.
					$dbw->delete( 'externallinks', [ 'el_id' => $row->el_id ], __METHOD__ );
					$deleted++;
					continue;
				}
				if ( in_array( $row->el_index, $newIndexes, true ) ) {
					// The stored index is already one of the generated ones.
					continue;
				}

				$newIndex = $this->chooseIndex( $row->el_index, $newIndexes );
				$dbw->update( 'externallinks',
					[
						'el_index' => $newIndex,
						'el_index_60' => substr( $newIndex, 0, 60 ),
					],
					[ 'el_id' => $row->el_id ],
					__METHOD__
				);
				$updated++;
			}
			wfWaitForSlaves();
			$start = $end;
		}
		$this->output( "Done, $updated rows updated, $deleted deleted.\n" );

		return true;
	}

	/**
	 * Pick the index to store for a row whose current el_index is not among
	 * the freshly generated ones.
	 *
	 * @param string $currentIndex The row's existing el_index value
	 * @param string[] $newIndexes Non-empty list of generated indexes
	 * @return string
	 */
	private function chooseIndex( $currentIndex, array $newIndexes ) {
		if ( count( $newIndexes ) === 1 ) {
			return $newIndexes[0];
		}

		$schemeEnd = strpos( $currentIndex, ':' );
		if ( $schemeEnd === false || $schemeEnd === 0 ) {
			// The stored value has no scheme to keep (empty, or nothing before the
			// colon). Splicing it in would write a scheme-less "://..." index, so
			// use the first generated index unchanged instead.
			return $newIndexes[0];
		}

		// Assume the scheme is the only difference between the different $newIndexes.
		// Keep this row's scheme, assuming there's another row with the other scheme.
		return substr( $currentIndex, 0, $schemeEnd ) .
			substr( $newIndexes[0], strpos( $newIndexes[0], ':' ) );
	}
}
118
// Publish this script's class name in $maintClass, then include the file named
// by RUN_MAINTENANCE_IF_MAIN (presumably the runner that reads $maintClass;
// confirm against Maintenance.php).
$maintClass = RefreshExternallinksIndex::class;
require_once RUN_MAINTENANCE_IF_MAIN;