mDescription = "Cleanup all spam from a given hostname"; $this->addOption( 'all', 'Check all wikis in $wgLocalDatabases' ); $this->addOption( 'delete', 'Delete pages containing only spam instead of blanking them' ); $this->addArg( 'hostname', 'Hostname that was spamming, single * wildcard in the beginning allowed' ); } public function execute() { global $IP, $wgLocalDatabases, $wgUser; $username = wfMessage( 'spambot_username' )->text(); $wgUser = User::newFromName( $username ); if ( !$wgUser ) { $this->error( "Invalid username specified in 'spambot_username' message: $username", true ); } // Create the user if necessary if ( !$wgUser->getId() ) { $wgUser->addToDatabase(); } $spec = $this->getArg(); $like = LinkFilter::makeLikeArray( $spec ); if ( !$like ) { $this->error( "Not a valid hostname specification: $spec", true ); } if ( $this->hasOption( 'all' ) ) { // Clean up spam on all wikis $this->output( "Finding spam on " . count( $wgLocalDatabases ) . " wikis\n" ); $found = false; foreach ( $wgLocalDatabases as $wikiID ) { $dbr = wfGetDB( DB_SLAVE, array(), $wikiID ); $count = $dbr->selectField( 'externallinks', 'COUNT(*)', array( 'el_index' . $dbr->buildLike( $like ) ), __METHOD__ ); if ( $count ) { $found = true; $cmd = wfShellWikiCmd( "$IP/maintenance/cleanupSpam.php", array( '--wiki', $wikiID, $spec ) ); passthru( "$cmd | sed 's/^/$wikiID: /'" ); } } if ( $found ) { $this->output( "All done\n" ); } else { $this->output( "None found\n" ); } } else { // Clean up spam on this wiki $dbr = wfGetDB( DB_SLAVE ); $res = $dbr->select( 'externallinks', array( 'DISTINCT el_from' ), array( 'el_index' . $dbr->buildLike( $like ) ), __METHOD__ ); $count = $dbr->numRows( $res ); $this->output( "Found $count articles containing $spec\n" ); foreach ( $res as $row ) { $this->cleanupArticle( $row->el_from, $spec ); } if ( $count ) { $this->output( "Done\n" ); } } } private function cleanupArticle( $id, $domain ) { $title = Title::newFromID( $id ); if ( !$title ) { $this->error( "Internal error: no page for ID $id" ); return; } $this->output( $title->getPrefixedDBkey() . " ..." ); $rev = Revision::newFromTitle( $title ); $currentRevId = $rev->getId(); while ( $rev && ( $rev->isDeleted( Revision::DELETED_TEXT ) || LinkFilter::matchEntry( $rev->getContent( Revision::RAW ), $domain ) ) ) { $rev = $rev->getPrevious(); } if ( $rev && $rev->getId() == $currentRevId ) { // The regex didn't match the current article text // This happens e.g. when a link comes from a template rather than the page itself $this->output( "False match\n" ); } else { $dbw = wfGetDB( DB_MASTER ); $dbw->begin( __METHOD__ ); $page = WikiPage::factory( $title ); if ( $rev ) { // Revert to this revision $content = $rev->getContent( Revision::RAW ); $this->output( "reverting\n" ); $page->doEditContent( $content, wfMessage( 'spam_reverting', $domain )->inContentLanguage()->text(), EDIT_UPDATE, $rev->getId() ); } elseif ( $this->hasOption( 'delete' ) ) { // Didn't find a non-spammy revision, blank the page $this->output( "deleting\n" ); $page->doDeleteArticle( wfMessage( 'spam_deleting', $domain )->inContentLanguage()->text() ); } else { // Didn't find a non-spammy revision, blank the page $handler = ContentHandler::getForTitle( $title ); $content = $handler->makeEmptyContent(); $this->output( "blanking\n" ); $page->doEditContent( $content, wfMessage( 'spam_blanking', $domain )->inContentLanguage()->text() ); } $dbw->commit( __METHOD__ ); } } } $maintClass = "CleanupSpam"; require_once RUN_MAINTENANCE_IF_MAIN;