summaryrefslogtreecommitdiff
path: root/maintenance/initEditCount.php
blob: d26349bbe40c85bfbe059f9c5738503332f9492c (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
<?php
/**
 * @file
 * @ingroup Maintenance
 */

require_once "commandLine.inc";

// --help: print the usage summary and terminate the script.
$helpRequested = isset( $options['help'] );
if( $helpRequested ) {
	$usage = "Batch-recalculate user_editcount fields from the revision table.
Options:
  --quick        Force the update to be done in a single query.
  --background   Force replication-friendly mode; may be inefficient but
                 avoids locking tables or lagging slaves with large updates;
                 calculates counts on a slave if possible.

Background mode will be automatically used if the server is MySQL 4.0
(which does not support subqueries) or if multiple servers are listed
in \$wgDBservers, usually indicating a replication environment.

";
	echo $usage;
	// die() with a string argument exits with status 0; keep that status.
	exit( 0 );
}
// Master connection: used for every write, and for resolving the table
// names that are interpolated into the raw SQL further down.
$dbw = wfGetDB( DB_MASTER );
$user = $dbw->tableName( 'user' );
$revision = $dbw->tableName( 'revision' );

$dbver = $dbw->getServerVersion();

// Autodetect mode...
// $wgDBservers is not necessarily an array (MediaWiki's default is false),
// so it must be checked before being handed to count().
$hasMultipleServers = is_array( $wgDBservers ) && count( $wgDBservers ) > 1;
// MySQL older than 4.1 cannot run the subquery used by single-query mode.
$lacksSubqueries = $dbw instanceof DatabaseMySql
	&& version_compare( $dbver, '4.1' ) < 0;
$backgroundMode = $hasMultipleServers || $lacksSubqueries;

// Explicit command-line switches override the autodetected mode;
// --background wins if both are given.
if( isset( $options['background'] ) ) {
	$backgroundMode = true;
} elseif( isset( $options['quick'] ) ) {
	$backgroundMode = false;
}

// Caller label handed to the database layer with every query below.
// __FUNCTION__ is an empty string at file scope, so name the script explicitly.
$fname = 'initEditCount';

if( $backgroundMode ) {
	echo "Using replication-friendly background mode...\n";

	// Counts are read from a slave connection; only the per-user updates
	// are sent to the master.
	$dbr = wfGetDB( DB_SLAVE );
	$chunkSize = 100;
	// MAX() yields NULL on an empty table; the cast turns that into 0 so
	// the loop below is skipped instead of dividing by zero.
	$lastUser = (int)$dbr->selectField( 'user', 'MAX(user_id)', '', $fname );

	$start = microtime( true );
	$migrated = 0;
	// Each pass covers the ids in ($min, $max]. The strict bound stops as
	// soon as the highest id has been covered, so no trailing empty chunk
	// is queried when $lastUser is a multiple of $chunkSize.
	for( $min = 0; $min < $lastUser; $min += $chunkSize ) {
		$max = $min + $chunkSize;
		// LEFT OUTER JOIN plus COUNT(rev_user) gives 0 for users that have
		// no revisions, so those rows are reset as well.
		$result = $dbr->query(
			"SELECT
				user_id,
				COUNT(rev_user) AS user_editcount
			FROM $user
			LEFT OUTER JOIN $revision ON user_id=rev_user
			WHERE user_id > $min AND user_id <= $max
			GROUP BY user_id",
			$fname );

		while( $row = $dbr->fetchObject( $result ) ) {
			$dbw->update( 'user',
				array( 'user_editcount' => $row->user_editcount ),
				array( 'user_id' => $row->user_id ),
				$fname );
			++$migrated;
		}
		$dbr->freeResult( $result );

		// Progress report: percentage is based on the id range covered so
		// far, the rate on the number of rows actually updated.
		$delta = microtime( true ) - $start;
		$rate = ($delta == 0.0) ? 0.0 : $migrated / $delta;
		printf( "%s %d (%0.1f%%) done in %0.1f secs (%0.3f accounts/sec).\n",
			$wgDBname,
			$migrated,
			min( $max, $lastUser ) / $lastUser * 100.0,
			$delta,
			$rate );

		// Pause between chunks so the slaves can keep up with the writes.
		wfWaitForSlaves( 10 );
	}
} else {
	// Subselect should work on modern MySQLs etc
	echo "Using single-query mode...\n";
	$sql = "UPDATE $user SET user_editcount=(SELECT COUNT(*) FROM $revision WHERE rev_user=user_id)";
	$dbw->query( $sql, $fname );
}

echo "Done!\n";