summaryrefslogtreecommitdiff
path: root/www/wiki/maintenance/removeUnusedAccounts.php
diff options
context:
space:
mode:
Diffstat (limited to 'www/wiki/maintenance/removeUnusedAccounts.php')
-rw-r--r--www/wiki/maintenance/removeUnusedAccounts.php195
1 files changed, 195 insertions, 0 deletions
diff --git a/www/wiki/maintenance/removeUnusedAccounts.php b/www/wiki/maintenance/removeUnusedAccounts.php
new file mode 100644
index 00000000..3fa30cbd
--- /dev/null
+++ b/www/wiki/maintenance/removeUnusedAccounts.php
@@ -0,0 +1,195 @@
+<?php
+/**
+ * Remove unused user accounts from the database
+ * An unused account is one which has made no edits
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License along
+ * with this program; if not, write to the Free Software Foundation, Inc.,
+ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
+ * http://www.gnu.org/copyleft/gpl.html
+ *
+ * @file
+ * @ingroup Maintenance
+ * @author Rob Church <robchur@gmail.com>
+ */
+
+require_once __DIR__ . '/Maintenance.php';
+
+/**
+ * Maintenance script that removes unused user accounts from the database.
+ *
+ * @ingroup Maintenance
+ */
+class RemoveUnusedAccounts extends Maintenance {
+ public function __construct() {
+ parent::__construct();
+ $this->addOption( 'delete', 'Actually delete the account' );
+ $this->addOption( 'ignore-groups', 'List of comma-separated groups to exclude', false, true );
+ $this->addOption( 'ignore-touched', 'Skip accounts touched in last N days', false, true );
+ }
+
+ public function execute() {
+ global $wgActorTableSchemaMigrationStage;
+
+ $this->output( "Remove unused accounts\n\n" );
+
+ # Do an initial scan for inactive accounts and report the result
+ $this->output( "Checking for unused user accounts...\n" );
+ $delUser = [];
+ $delActor = [];
+ $dbr = $this->getDB( DB_REPLICA );
+ if ( $wgActorTableSchemaMigrationStage > MIGRATION_OLD ) {
+ $res = $dbr->select(
+ [ 'user', 'actor' ],
+ [ 'user_id', 'user_name', 'user_touched', 'actor_id' ],
+ '',
+ __METHOD__,
+ [],
+ [ 'actor' => [ 'LEFT JOIN', 'user_id = actor_user' ] ]
+ );
+ } else {
+ $res = $dbr->select( 'user', [ 'user_id', 'user_name', 'user_touched' ], '', __METHOD__ );
+ }
+ if ( $this->hasOption( 'ignore-groups' ) ) {
+ $excludedGroups = explode( ',', $this->getOption( 'ignore-groups' ) );
+ } else {
+ $excludedGroups = [];
+ }
+ $touched = $this->getOption( 'ignore-touched', "1" );
+ if ( !ctype_digit( $touched ) ) {
+ $this->fatalError( "Please put a valid positive integer on the --ignore-touched parameter." );
+ }
+ $touchedSeconds = 86400 * $touched;
+ foreach ( $res as $row ) {
+ # Check the account, but ignore it if it's within a $excludedGroups
+ # group or if it's touched within the $touchedSeconds seconds.
+ $instance = User::newFromId( $row->user_id );
+ if ( count( array_intersect( $instance->getEffectiveGroups(), $excludedGroups ) ) == 0
+ && $this->isInactiveAccount( $row->user_id, $row->actor_id ?? null, true )
+ && wfTimestamp( TS_UNIX, $row->user_touched ) < wfTimestamp( TS_UNIX, time() - $touchedSeconds )
+ ) {
+ # Inactive; print out the name and flag it
+ $delUser[] = $row->user_id;
+ if ( isset( $row->actor_id ) && $row->actor_id ) {
+ $delActor[] = $row->actor_id;
+ }
+ $this->output( $row->user_name . "\n" );
+ }
+ }
+ $count = count( $delUser );
+ $this->output( "...found {$count}.\n" );
+
+ # If required, go back and delete each marked account
+ if ( $count > 0 && $this->hasOption( 'delete' ) ) {
+ $this->output( "\nDeleting unused accounts..." );
+ $dbw = $this->getDB( DB_MASTER );
+ $dbw->delete( 'user', [ 'user_id' => $delUser ], __METHOD__ );
+ if ( $wgActorTableSchemaMigrationStage > MIGRATION_OLD ) {
+ # Keep actor rows referenced from ipblocks
+ $keep = $dbw->selectFieldValues(
+ 'ipblocks', 'ipb_by_actor', [ 'ipb_by_actor' => $delActor ], __METHOD__
+ );
+ $del = array_diff( $delActor, $keep );
+ if ( $del ) {
+ $dbw->delete( 'actor', [ 'actor_id' => $del ], __METHOD__ );
+ }
+ if ( $keep ) {
+ $dbw->update( 'actor', [ 'actor_user' => 0 ], [ 'actor_id' => $keep ], __METHOD__ );
+ }
+ }
+ $dbw->delete( 'user_groups', [ 'ug_user' => $delUser ], __METHOD__ );
+ $dbw->delete( 'user_former_groups', [ 'ufg_user' => $delUser ], __METHOD__ );
+ $dbw->delete( 'user_properties', [ 'up_user' => $delUser ], __METHOD__ );
+ if ( $wgActorTableSchemaMigrationStage > MIGRATION_OLD ) {
+ $dbw->delete( 'logging', [ 'log_actor' => $delActor ], __METHOD__ );
+ $dbw->delete( 'recentchanges', [ 'rc_actor' => $delActor ], __METHOD__ );
+ }
+ if ( $wgActorTableSchemaMigrationStage < MIGRATION_NEW ) {
+ $dbw->delete( 'logging', [ 'log_user' => $delUser ], __METHOD__ );
+ $dbw->delete( 'recentchanges', [ 'rc_user' => $delUser ], __METHOD__ );
+ }
+ $this->output( "done.\n" );
+ # Update the site_stats.ss_users field
+ $users = $dbw->selectField( 'user', 'COUNT(*)', [], __METHOD__ );
+ $dbw->update(
+ 'site_stats',
+ [ 'ss_users' => $users ],
+ [ 'ss_row_id' => 1 ],
+ __METHOD__
+ );
+ } elseif ( $count > 0 ) {
+ $this->output( "\nRun the script again with --delete to remove them from the database.\n" );
+ }
+ $this->output( "\n" );
+ }
+
+ /**
+ * Could the specified user account be deemed inactive?
+ * (No edits, no deleted edits, no log entries, no current/old uploads)
+ *
+ * @param int $id User's ID
+ * @param int|null $actor User's actor ID
+ * @param bool $master Perform checking on the master
+ * @return bool
+ */
+ private function isInactiveAccount( $id, $actor, $master = false ) {
+ $dbo = $this->getDB( $master ? DB_MASTER : DB_REPLICA );
+ $checks = [
+ 'revision' => 'rev',
+ 'archive' => 'ar',
+ 'image' => 'img',
+ 'oldimage' => 'oi',
+ 'filearchive' => 'fa'
+ ];
+ $count = 0;
+
+ $migration = ActorMigration::newMigration();
+
+ $user = User::newFromAnyId( $id, null, $actor );
+
+ $this->beginTransaction( $dbo, __METHOD__ );
+ foreach ( $checks as $table => $prefix ) {
+ $actorQuery = $migration->getWhere(
+ $dbo, $prefix . '_user', $user, $prefix !== 'oi' && $prefix !== 'fa'
+ );
+ $count += (int)$dbo->selectField(
+ [ $table ] + $actorQuery['tables'],
+ 'COUNT(*)',
+ $actorQuery['conds'],
+ __METHOD__,
+ [],
+ $actorQuery['joins']
+ );
+ }
+
+ $actorQuery = $migration->getWhere( $dbo, 'log_user', $user, false );
+ $count += (int)$dbo->selectField(
+ [ 'logging' ] + $actorQuery['tables'],
+ 'COUNT(*)',
+ [
+ $actorQuery['conds'],
+ 'log_type != ' . $dbo->addQuotes( 'newusers' )
+ ],
+ __METHOD__,
+ [],
+ $actorQuery['joins']
+ );
+
+ $this->commitTransaction( $dbo, __METHOD__ );
+
+ return $count == 0;
+ }
+}
+
+$maintClass = RemoveUnusedAccounts::class;
+require_once RUN_MAINTENANCE_IF_MAIN;