summaryrefslogtreecommitdiff
path: root/www/wiki/maintenance/updateSearchIndex.php
diff options
context:
space:
mode:
Diffstat (limited to 'www/wiki/maintenance/updateSearchIndex.php')
-rw-r--r--www/wiki/maintenance/updateSearchIndex.php125
1 files changed, 125 insertions, 0 deletions
diff --git a/www/wiki/maintenance/updateSearchIndex.php b/www/wiki/maintenance/updateSearchIndex.php
new file mode 100644
index 00000000..af2d8287
--- /dev/null
+++ b/www/wiki/maintenance/updateSearchIndex.php
@@ -0,0 +1,125 @@
+<?php
+/**
+ * Periodic off-peak updating of the search index.
+ *
+ * Usage: php updateSearchIndex.php [-s START] [-e END] [-p POSFILE] [-l LOCKTIME] [-q]
+ * Where START is the starting timestamp
+ * END is the ending timestamp
+ * POSFILE is a file to load timestamps from and save them to, searchUpdate.WIKI_ID.pos by default
+ * LOCKTIME is how long the searchindex and revision tables will be locked for
+ * -q means quiet
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License along
+ * with this program; if not, write to the Free Software Foundation, Inc.,
+ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
+ * http://www.gnu.org/copyleft/gpl.html
+ *
+ * @file
+ * @ingroup Maintenance
+ */
+
+require_once __DIR__ . '/Maintenance.php';
+
+/**
+ * Maintenance script for periodic off-peak updating of the search index.
+ *
+ * @ingroup Maintenance
+ */
+class UpdateSearchIndex extends Maintenance {
+
+ public function __construct() {
+ parent::__construct();
+ $this->addDescription( 'Script for periodic off-peak updating of the search index' );
+ $this->addOption( 's', 'starting timestamp', false, true );
+ $this->addOption( 'e', 'Ending timestamp', false, true );
+ $this->addOption(
+ 'p',
+ 'File for saving/loading timestamps, searchUpdate.WIKI_ID.pos by default',
+ false,
+ true
+ );
+ $this->addOption(
+ 'l',
+ 'How long the searchindex and revision tables will be locked for',
+ false,
+ true
+ );
+ }
+
+ public function getDbType() {
+ return Maintenance::DB_ADMIN;
+ }
+
+ public function execute() {
+ $posFile = $this->getOption( 'p', 'searchUpdate.' . wfWikiID() . '.pos' );
+ $end = $this->getOption( 'e', wfTimestampNow() );
+ if ( $this->hasOption( 's' ) ) {
+ $start = $this->getOption( 's' );
+ } elseif ( is_readable( 'searchUpdate.pos' ) ) {
+ # B/c to the old position file name which was hardcoded
+ # We can safely delete the file when we're done though.
+ $start = file_get_contents( 'searchUpdate.pos' );
+ unlink( 'searchUpdate.pos' );
+ } elseif ( is_readable( $posFile ) ) {
+ $start = file_get_contents( $posFile );
+ } else {
+ $start = wfTimestamp( TS_MW, time() - 86400 );
+ }
+ $lockTime = $this->getOption( 'l', 20 );
+
+ $this->doUpdateSearchIndex( $start, $end, $lockTime );
+ if ( is_writable( dirname( realpath( $posFile ) ) ) ) {
+ $file = fopen( $posFile, 'w' );
+ if ( $file !== false ) {
+ fwrite( $file, $end );
+ fclose( $file );
+ } else {
+ $this->error( "*** Couldn't write to the $posFile!\n" );
+ }
+ } else {
+ $this->error( "*** Couldn't write to the $posFile!\n" );
+ }
+ }
+
+ private function doUpdateSearchIndex( $start, $end, $maxLockTime ) {
+ global $wgDisableSearchUpdate;
+
+ $wgDisableSearchUpdate = false;
+
+ $dbw = $this->getDB( DB_MASTER );
+ $recentchanges = $dbw->tableName( 'recentchanges' );
+
+ $this->output( "Updating searchindex between $start and $end\n" );
+
+ # Select entries from recentchanges which are on top and between the specified times
+ $start = $dbw->timestamp( $start );
+ $end = $dbw->timestamp( $end );
+
+ $page = $dbw->tableName( 'page' );
+ $sql = "SELECT rc_cur_id FROM $recentchanges
+ JOIN $page ON rc_cur_id=page_id AND rc_this_oldid=page_latest
+ WHERE rc_type != " . RC_LOG . " AND rc_timestamp BETWEEN '$start' AND '$end'";
+ $res = $dbw->query( $sql, __METHOD__ );
+
+ $this->updateSearchIndex( $maxLockTime, [ $this, 'searchIndexUpdateCallback' ], $dbw, $res );
+
+ $this->output( "Done\n" );
+ }
+
+ public function searchIndexUpdateCallback( $dbw, $row ) {
+ $this->updateSearchIndexForPage( $dbw, $row->rc_cur_id );
+ }
+}
+
+$maintClass = UpdateSearchIndex::class;
+require_once RUN_MAINTENANCE_IF_MAIN;