diff options
Diffstat (limited to 'www/wiki/maintenance/preprocessDump.php')
-rw-r--r-- | www/wiki/maintenance/preprocessDump.php | 98 |
1 files changed, 98 insertions, 0 deletions
diff --git a/www/wiki/maintenance/preprocessDump.php b/www/wiki/maintenance/preprocessDump.php new file mode 100644 index 00000000..d540e8f9 --- /dev/null +++ b/www/wiki/maintenance/preprocessDump.php @@ -0,0 +1,98 @@ +<?php +/** + * Take page text out of an XML dump file and preprocess it to obj. + * It may be useful for getting preprocessor statistics or filling the + * preprocessor cache. + * + * Copyright © 2011 Platonides - https://www.mediawiki.org/ + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. + * http://www.gnu.org/copyleft/gpl.html + * + * @file + * @ingroup Maintenance + */ + +require_once __DIR__ . '/dumpIterator.php'; + +/** + * Maintenance script that takes page text out of an XML dump file and + * preprocesses it to obj. + * + * @ingroup Maintenance + */ +class PreprocessDump extends DumpIterator { + + /* Variables for dressing up as a parser */ + public $mTitle = 'PreprocessDump'; + public $mPPNodeCount = 0; + + public function getStripList() { + global $wgParser; + + return $wgParser->getStripList(); + } + + public function __construct() { + parent::__construct(); + $this->addOption( 'cache', 'Use and populate the preprocessor cache.', false, false ); + $this->addOption( 'preprocessor', 'Preprocessor to use.', false, false ); + } + + public function getDbType() { + return Maintenance::DB_NONE; + } + + public function checkOptions() { + global $wgParser, $wgParserConf, $wgPreprocessorCacheThreshold; + + if ( !$this->hasOption( 'cache' ) ) { + $wgPreprocessorCacheThreshold = false; + } + + if ( $this->hasOption( 'preprocessor' ) ) { + $name = $this->getOption( 'preprocessor' ); + } elseif ( isset( $wgParserConf['preprocessorClass'] ) ) { + $name = $wgParserConf['preprocessorClass']; + } else { + $name = Preprocessor_DOM::class; + } + + $wgParser->firstCallInit(); + $this->mPreprocessor = new $name( $this ); + } + + /** + * Callback function for each revision, preprocessToObj() + * @param Revision $rev + */ + public function processRevision( $rev ) { + $content = $rev->getContent( Revision::RAW ); + + if ( $content->getModel() !== CONTENT_MODEL_WIKITEXT ) { + return; + } + + try { + $this->mPreprocessor->preprocessToObj( strval( $content->getNativeData() ), 0 ); + } catch ( Exception $e ) { + $this->error( "Caught exception " . $e->getMessage() . " in " + . $rev->getTitle()->getPrefixedText() ); + } + } +} + +$maintClass = PreprocessDump::class; +require_once RUN_MAINTENANCE_IF_MAIN; |