<?php
/**
 * Refresh the externallinks table el_index and el_index_60 from el_to
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 * @ingroup Maintenance
 */

require_once __DIR__ . '/Maintenance.php';

use MediaWiki\MediaWikiServices;

/**
 * Maintenance script that refreshes the externallinks table el_index and
 * el_index_60 from el_to
 *
 * @ingroup Maintenance
 * @since 1.33
 */
class RefreshExternallinksIndex extends LoggedUpdateMaintenance {

	/**
	 * Set the script description and a default batch size of 10000 el_id values.
	 */
	public function __construct() {
		parent::__construct();
		$this->addDescription(
			'Refresh the externallinks table el_index and el_index_60 from el_to'
		);
		$this->setBatchSize( 10000 );
	}

	/**
	 * Build the key identifying this update.
	 *
	 * The key combines the class name, LinkFilter::VERSION and whether
	 * LinkFilter reports IDN support, so it differs whenever either of those
	 * differs. NOTE(review): presumably the parent class uses this key to
	 * decide whether the update already ran; confirm against
	 * LoggedUpdateMaintenance.
	 *
	 * @return string
	 */
	protected function getUpdateKey() {
		return static::class
			. ' v' . LinkFilter::VERSION
			. ( LinkFilter::supportsIDN() ? '+' : '-' ) . 'IDN';
	}

	/**
	 * @return string Message describing that nothing needed to be done
	 */
	protected function updateSkippedMessage() {
		return 'externallinks table indexes up to date';
	}

	/**
	 * Walk the externallinks table in el_id ranges of the batch size and
	 * bring el_index / el_index_60 in line with what LinkFilter::makeIndexes()
	 * produces for el_to. Rows for which no index can be generated are deleted.
	 *
	 * @return bool False if the externallinks table does not exist, true otherwise
	 */
	protected function doDBUpdates() {
		$dbw = $this->getDB( DB_MASTER );
		if ( !$dbw->tableExists( 'externallinks', __METHOD__ ) ) {
			$this->error( "externallinks table does not exist" );
			return false;
		}
		$this->output( "Updating externallinks table index fields\n" );

		$minmax = $dbw->selectRow(
			'externallinks',
			[ 'min' => 'MIN(el_id)', 'max' => 'MAX(el_id)' ],
			'',
			__METHOD__
		);

		$updated = 0;
		$deleted = 0;
		// Ranges are ( $start, $end ], so begin one below the smallest el_id.
		$start = $minmax->min - 1;
		$last = $minmax->max;

		$lbFactory = MediaWikiServices::getInstance()->getDBLoadBalancerFactory();

		while ( $start < $last ) {
			$end = min( $start + $this->mBatchSize, $last );
			$this->output( "el_id $start - $end of $last\n" );
			$res = $dbw->select(
				'externallinks',
				[ 'el_id', 'el_to', 'el_index' ],
				[
					"el_id > $start",
					"el_id <= $end",
				],
				__METHOD__,
				[ 'ORDER BY' => 'el_id' ]
			);

			foreach ( $res as $row ) {
				$newIndexes = LinkFilter::makeIndexes( $row->el_to );
				if ( !$newIndexes ) {
					// No index can be generated for this URL, drop the row.
					$dbw->delete( 'externallinks', [ 'el_id' => $row->el_id ], __METHOD__ );
					$deleted++;
					continue;
				}
				if ( in_array( $row->el_index, $newIndexes, true ) ) {
					// Stored value is already one of the valid indexes.
					continue;
				}

				$newIndex = $this->chooseIndex( $row->el_index, $newIndexes );
				$dbw->update(
					'externallinks',
					[
						'el_index' => $newIndex,
						'el_index_60' => substr( $newIndex, 0, 60 ),
					],
					[ 'el_id' => $row->el_id ],
					__METHOD__
				);
				$updated++;
			}

			// Let replicas catch up before starting the next range.
			$lbFactory->waitForReplication();
			$start = $end;
		}

		$this->output( "Done, $updated rows updated, $deleted deleted.\n" );

		return true;
	}

	/**
	 * Pick the el_index value to store for a row whose current value is stale.
	 *
	 * @param string $oldIndex The row's current el_index
	 * @param string[] $newIndexes Non-empty result of LinkFilter::makeIndexes()
	 * @return string
	 */
	private function chooseIndex( $oldIndex, array $newIndexes ) {
		if ( count( $newIndexes ) === 1 ) {
			return $newIndexes[0];
		}

		// Assume the scheme is the only difference between the different $newIndexes.
		// Keep this row's scheme, assuming there's another row with the other scheme.
		$oldColon = strpos( $oldIndex, ':' );
		$newColon = strpos( $newIndexes[0], ':' );
		if ( $oldColon === false || $oldColon === 0 || $newColon === false ) {
			// The stored value has no scheme to keep (or the new index has no
			// colon to splice at). Splicing anyway would store a scheme-less
			// value such as "://com.example./", so use a generated index as is.
			return $newIndexes[0];
		}

		return substr( $oldIndex, 0, $oldColon ) . substr( $newIndexes[0], $newColon );
	}
}

$maintClass = RefreshExternallinksIndex::class;
require_once RUN_MAINTENANCE_IF_MAIN;