<?php
-require_once 'counter.php';
/**
 * Functions for rebuilding link-table rows by re-parsing pages, and for
 * deleting link-table rows that belong to non-existent pages.
 *
 * @todo document
 * @addtogroup Maintenance
 */
/** */
# Number of pages handled between two progress reports; the replication-lag
# wait in refreshLinks() is performed at the same interval.
define( 'REPORTING_INTERVAL', 100 );
# Alternate setting kept from the original: report after every single page.
#define( 'REPORTING_INTERVAL', 1 );
/**
 * Re-parse pages and rebuild their link-table rows.
 *
 * In new-only mode, pages flagged page_is_new whose page_id is greater than
 * $start are processed. Otherwise every page_id from $start up to and
 * including $end is visited in ascending order.
 *
 * A progress line is printed and wfWaitForSlaves() is called once every
 * REPORTING_INTERVAL pages.
 *
 * @param int   $start   Starting page_id (exclusive lower bound in new-only mode,
 *                       inclusive otherwise); passed through intval().
 * @param bool  $newOnly Only process pages flagged as new.
 * @param mixed $maxLag  Handed unchanged to wfWaitForSlaves().
 * @param int   $end     Last page_id to process; a falsy value means
 *                       "use max(page_id)". Not used in new-only mode.
 */
function refreshLinks( $start, $newOnly = false, $maxLag = false, $end = 0 ) {
	global $wgUser, $wgParser, $wgUseImageResize, $wgUseTidy;

	$fname = 'refreshLinks';
	$dbr = wfGetDB( DB_SLAVE );
	$start = intval( $start );

	# Don't generate TeX PNGs (lack of a sensible current directory causes errors anyway)
	$wgUser->setOption( 'math', MW_MATH_SOURCE );

	# Don't generate extension images (e.g. Timeline)
	$wgParser->mTagHooks = array();

	# Don't generate thumbnail images
	$wgUseImageResize = false;

	# Turn Tidy off for this run
	$wgUseTidy = false;

	if ( $newOnly ) {
		print "Refreshing links from ";
		$res = $dbr->select( 'page',
			array( 'page_id' ),
			array(
				'page_is_new' => 1,
				"page_id > $start" ),
			$fname
		);
		$num = $dbr->numRows( $res );
		print "$num new articles...\n";

		$i = 0;
		while ( $row = $dbr->fetchObject( $res ) ) {
			if ( !( ++$i % REPORTING_INTERVAL ) ) {
				print "$i\n";
				wfWaitForSlaves( $maxLag );
			}

			# Without this call the new-only mode would merely count rows.
			fixLinksFromArticle( $row->page_id );
		}
	} else {
		print "Refreshing link table.\n";
		if ( !$end ) {
			# No explicit upper bound given: run up to the highest existing page_id.
			$end = $dbr->selectField( 'page', 'max(page_id)', false );
		}
		print( "Starting from page_id $start of $end.\n" );

		for ( $id = $start; $id <= $end; $id++ ) {
			if ( !( $id % REPORTING_INTERVAL ) ) {
				print "$id\n";
				wfWaitForSlaves( $maxLag );
			}
			fixLinksFromArticle( $id );
		}
	}
}
/**
 * Re-parse one page and rewrite its link-table rows.
 *
 * The text of the revision returned by Revision::newFromTitle() is parsed
 * with default ParserOptions, and the resulting parser output is fed to a
 * LinksUpdate. Nothing is written when no title exists for $id or when no
 * revision can be loaded for the title.
 *
 * Side effects visible in this function: the global $wgTitle is overwritten
 * and the shared LinkCache instance is cleared on every call.
 *
 * @param int $id page_id of the page to refresh
 */
function fixLinksFromArticle( $id ) {
	global $wgTitle, $wgParser;

	$wgTitle = Title::newFromID( $id );
	$dbw = wfGetDB( DB_MASTER );

	# Start every page with an empty link cache
	$linkCache =& LinkCache::singleton();
	$linkCache->clear();

	if ( is_null( $wgTitle ) ) {
		return;
	}

	# Load the revision before opening the transaction, so that bailing out
	# here cannot leave a transaction open on the master connection.
	$revision = Revision::newFromTitle( $wgTitle );
	if ( !$revision ) {
		return;
	}

	$dbw->begin();

	$options = new ParserOptions;
	$parserOutput = $wgParser->parse(
		$revision->getText(),
		$wgTitle,
		$options,
		true,
		true,
		$revision->getId()
	);

	$update = new LinksUpdate( $wgTitle, $parserOutput, false );
	$update->doUpdate();

	$dbw->immediateCommit();
}
function deleteLinksFromNonexistent( $maxLag = 0 ) {
$fname = 'deleteLinksFromNonexistent';
-
+
wfWaitForSlaves( $maxLag );
- $dbw =& wfGetDB( DB_WRITE );
-
- $linksTables = array(
+ $dbw = wfGetDB( DB_WRITE );
+
+ $linksTables = array(
'pagelinks' => 'pl_from',
'imagelinks' => 'il_from',
'categorylinks' => 'cl_from',
+ 'templatelinks' => 'tl_from',
+ 'externallinks' => 'el_from',
);
$page = $dbw->tableName( 'page' );
$pTable = $dbw->tableName( $table );
$sql = "DELETE $pTable FROM $pTable LEFT JOIN $page ON page_id=$field WHERE page_id IS NULL";
-
+
print "Deleting $table from non-existent articles...";
$dbw->query( $sql, $fname );
print " fixed " .$dbw->affectedRows() . " row(s)\n";