wiki.techinc.nl/maintenance/removeUnusedAccounts.php
Brad Jorsch c29909e59f Mostly drop old pre-actor user schemas
This removes most of the pre-actor user and user_text columns, and the
$wgActorTableSchemaMigrationStage setting that used to determine
whether the columns were used.

rev_user and rev_user_text remain in the code, as on Wikimedia wikis the
revision table is too large to alter at this time. A future change will
combine that with the removal of rev_comment, rev_content_model, and
rev_content_format (and the addition of rev_comment_id and rev_actor).

ActorMigration's constructor continues to take a $stage parameter, and
continues to have the logic for handling it, for the benefit of
extensions that might need their own migration process. Code using
ActorMigration for accessing the core fields should be updated to use
the new actor fields directly. That will be done in a followup.

Bug: T188327
Change-Id: Id35544b879af1cd708f3efd303fce8d9a1b9eb02
2019-09-09 11:38:36 -04:00

181 lines
6 KiB
PHP

<?php
/**
* Remove unused user accounts from the database
* An unused account is one which has made no edits
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
* http://www.gnu.org/copyleft/gpl.html
*
* @file
* @ingroup Maintenance
* @author Rob Church <robchur@gmail.com>
*/
require_once __DIR__ . '/Maintenance.php';
/**
 * Maintenance script that removes unused user accounts from the database.
 *
 * An account is reported as unused when it has no rows in revision, archive,
 * image, oldimage or filearchive, no log entries of a type other than
 * 'newusers', is not in any of the --ignore-groups groups and was last
 * touched before the --ignore-touched cutoff. Nothing is deleted unless
 * --delete is given.
 *
 * @ingroup Maintenance
 */
class RemoveUnusedAccounts extends Maintenance {
	/**
	 * Register the command line options understood by this script.
	 */
	public function __construct() {
		parent::__construct();
		$this->addOption( 'delete', 'Actually delete the account' );
		$this->addOption( 'ignore-groups', 'List of comma-separated groups to exclude', false, true );
		$this->addOption( 'ignore-touched', 'Skip accounts touched in last N days', false, true );
	}

	/**
	 * Scan all user accounts, list the unused ones and, when --delete is
	 * set, remove them together with their dependent rows.
	 */
	public function execute() {
		$this->output( "Remove unused accounts\n\n" );

		# Validate the options first so that a bad value fails before the
		# whole user table has been scanned.
		if ( $this->hasOption( 'ignore-groups' ) ) {
			# Trim each name so that "sysop, bot" behaves like "sysop,bot"
			$excludedGroups = array_map( 'trim', explode( ',', $this->getOption( 'ignore-groups' ) ) );
		} else {
			$excludedGroups = [];
		}
		$touched = $this->getOption( 'ignore-touched', "1" );
		if ( !ctype_digit( $touched ) ) {
			$this->fatalError( "Please put a valid positive integer on the --ignore-touched parameter." );
		}
		$touchedSeconds = 86400 * $touched;
		# Computed once so that every account is compared with the same cutoff
		$cutoff = wfTimestamp( TS_UNIX, time() - $touchedSeconds );

		# Do an initial scan for inactive accounts and report the result
		$this->output( "Checking for unused user accounts...\n" );
		$delUser = [];
		$delActor = [];
		$dbr = $this->getDB( DB_REPLICA );
		# LEFT JOIN: a user without an actor row is still returned, with a
		# NULL actor_id.
		$res = $dbr->select(
			[ 'user', 'actor' ],
			[ 'user_id', 'user_name', 'user_touched', 'actor_id' ],
			'',
			__METHOD__,
			[],
			[ 'actor' => [ 'LEFT JOIN', 'user_id = actor_user' ] ]
		);

		foreach ( $res as $row ) {
			# The checks run from cheapest to most expensive; an account
			# is only flagged when it passes all three.

			# Ignore the account if it was touched within the last
			# $touchedSeconds seconds.
			if ( !( wfTimestamp( TS_UNIX, $row->user_touched ) < $cutoff ) ) {
				continue;
			}

			# Ignore the account if it is within an $excludedGroups group
			$instance = User::newFromId( $row->user_id );
			if ( count( array_intersect( $instance->getEffectiveGroups(), $excludedGroups ) ) != 0 ) {
				continue;
			}

			$actorId = $row->actor_id ?? null;
			if ( !$this->isInactiveAccount( $row->user_id, $actorId, true ) ) {
				continue;
			}

			# Inactive; print out the name and flag it
			$delUser[] = $row->user_id;
			if ( $actorId ) {
				$delActor[] = $actorId;
			}
			$this->output( $row->user_name . "\n" );
		}

		$count = count( $delUser );
		$this->output( "...found {$count}.\n" );

		# If required, go back and delete each marked account
		if ( $count > 0 && $this->hasOption( 'delete' ) ) {
			$this->output( "\nDeleting unused accounts..." );
			$this->deleteAccounts( $delUser, $delActor );
			$this->output( "done.\n" );
		} elseif ( $count > 0 ) {
			$this->output( "\nRun the script again with --delete to remove them from the database.\n" );
		}
		$this->output( "\n" );
	}

	/**
	 * Delete the given accounts and their dependent rows, then refresh
	 * site_stats.ss_users.
	 *
	 * @param array $delUser Non-empty list of user IDs to delete
	 * @param array $delActor Actor IDs belonging to those users; may be
	 *  empty when none of the users has an actor row
	 */
	private function deleteAccounts( array $delUser, array $delActor ) {
		$dbw = $this->getDB( DB_MASTER );

		# Rows keyed by user ID
		$dbw->delete( 'user', [ 'user_id' => $delUser ], __METHOD__ );
		$dbw->delete( 'user_groups', [ 'ug_user' => $delUser ], __METHOD__ );
		$dbw->delete( 'user_former_groups', [ 'ufg_user' => $delUser ], __METHOD__ );
		$dbw->delete( 'user_properties', [ 'up_user' => $delUser ], __METHOD__ );

		# Rows keyed by actor ID. An empty list must never be used as a
		# condition value: the database layer rejects it, which would abort
		# the script after the user rows above are already gone.
		if ( $delActor ) {
			# Keep actor rows referenced from ipblocks
			$keep = $dbw->selectFieldValues(
				'ipblocks', 'ipb_by_actor', [ 'ipb_by_actor' => $delActor ], __METHOD__
			);
			$del = array_diff( $delActor, $keep );
			if ( $del ) {
				$dbw->delete( 'actor', [ 'actor_id' => $del ], __METHOD__ );
			}
			if ( $keep ) {
				# Detach the kept actors from the deleted users.
				# NOTE(review): if the actor table enforces uniqueness on
				# actor_user, writing 0 to more than one row would collide
				# and NULL may be the intended value - confirm against the
				# schema before changing.
				$dbw->update( 'actor', [ 'actor_user' => 0 ], [ 'actor_id' => $keep ], __METHOD__ );
			}
			$dbw->delete( 'logging', [ 'log_actor' => $delActor ], __METHOD__ );
			$dbw->delete( 'recentchanges', [ 'rc_actor' => $delActor ], __METHOD__ );
		}

		# Update the site_stats.ss_users field
		$users = $dbw->selectField( 'user', 'COUNT(*)', [], __METHOD__ );
		$dbw->update(
			'site_stats',
			[ 'ss_users' => $users ],
			[ 'ss_row_id' => 1 ],
			__METHOD__
		);
	}

	/**
	 * Could the specified user account be deemed inactive?
	 * (No edits, no deleted edits, no log entries, no current/old uploads)
	 *
	 * Log entries of type 'newusers' are not counted as activity.
	 *
	 * @param int $id User's ID
	 * @param int|null $actor User's actor ID
	 * @param bool $master Perform checking on the master
	 * @return bool True when no matching row was found in any checked table
	 */
	private function isInactiveAccount( $id, $actor, $master = false ) {
		$dbo = $this->getDB( $master ? DB_MASTER : DB_REPLICA );
		# Table name => column prefix of each table checked for contributions
		$checks = [
			'revision' => 'rev',
			'archive' => 'ar',
			'image' => 'img',
			'oldimage' => 'oi',
			'filearchive' => 'fa'
		];
		$count = 0;

		$migration = ActorMigration::newMigration();

		$user = User::newFromAnyId( $id, null, $actor );

		# All counting queries run inside a single transaction
		$this->beginTransaction( $dbo, __METHOD__ );
		foreach ( $checks as $table => $prefix ) {
			# The last argument is false for oldimage and filearchive only.
			# NOTE(review): presumably ActorMigration's "query by user ID"
			# switch - confirm against ActorMigration::getWhere().
			$actorQuery = $migration->getWhere(
				$dbo, $prefix . '_user', $user, $prefix !== 'oi' && $prefix !== 'fa'
			);
			$count += (int)$dbo->selectField(
				[ $table ] + $actorQuery['tables'],
				'COUNT(*)',
				$actorQuery['conds'],
				__METHOD__,
				[],
				$actorQuery['joins']
			);
		}

		# Log entries, ignoring the 'newusers' log type
		$actorQuery = $migration->getWhere( $dbo, 'log_user', $user, false );
		$count += (int)$dbo->selectField(
			[ 'logging' ] + $actorQuery['tables'],
			'COUNT(*)',
			[
				$actorQuery['conds'],
				'log_type != ' . $dbo->addQuotes( 'newusers' )
			],
			__METHOD__,
			[],
			$actorQuery['joins']
		);

		$this->commitTransaction( $dbo, __METHOD__ );

		return $count == 0;
	}
}
# Name of the maintenance class defined in this file, set before the include below
$maintClass = RemoveUnusedAccounts::class;
# NOTE(review): RUN_MAINTENANCE_IF_MAIN is defined outside this file (presumably
# by Maintenance.php); it is expected to run $maintClass when this script is the
# entry point - confirm against Maintenance.php.
require_once RUN_MAINTENANCE_IF_MAIN;