<?php
-# Copyright (C) 2005 Brion Vibber <brion@pobox.com>
+# Copyright (C) 2005-2007 Brion Vibber <brion@pobox.com>
# http://www.mediawiki.org/
-#
+#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or
+# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
-#
+#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
-#
+#
# You should have received a copy of the GNU General Public License along
# with this program; if not, write to the Free Software Foundation, Inc.,
-# 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
# http://www.gnu.org/copyleft/gpl.html
-$options = array( 'fix', 'suffix' );
+/**
+ * @file
+ * @ingroup Maintenance
+ */
+
+$options = array( 'fix', 'suffix', 'help' );
/** */
require_once( 'commandLine.inc' );
-#require_once( 'maintenance/userDupes.inc' );
+
+if(isset( $options['help'] ) ) {
+print <<<ENDS
+usage: namespaceDupes.php [--fix] [--suffix=<text>] [--help]
+ --help : this help message
+ --fix : attempt to automatically fix errors
+ --suffix=<text> : dupes will be renamed with correct namespace with <text>
+ appended after the article name.
+ --prefix=<text> : Do an explicit check for the given title prefix
+ in place of the standard namespace list.
+ --verbose : Display output for checked namespaces without conflicts
+
+ENDS;
+die;
+}
class NamespaceConflictChecker {
- function NamespaceConflictChecker( &$db ) {
- $this->db =& $db;
+ function NamespaceConflictChecker( $db, $verbose=false ) {
+ $this->db = $db;
+ $this->verbose = $verbose;
}
-
+
function checkAll( $fix, $suffix = '' ) {
- global $wgContLang;
- $spaces = $wgContLang->getNamespaces();
+ global $wgContLang, $wgNamespaceAliases, $wgCanonicalNamespaceNames;
+ global $wgCapitalLinks;
+
+ $spaces = array();
+
+ // List interwikis first, so they'll be overridden
+ // by any conflicting local namespaces.
+ foreach( $this->getInterwikiList() as $prefix ) {
+ $name = $wgContLang->ucfirst( $prefix );
+ $spaces[$name] = 0;
+ }
+
+ // Now pull in all canonical and alias namespaces...
+ foreach( $wgCanonicalNamespaceNames as $ns => $name ) {
+ // This includes $wgExtraNamespaces
+ if( $name !== '' ) {
+ $spaces[$name] = $ns;
+ }
+ }
+ foreach( $wgContLang->getNamespaces() as $ns => $name ) {
+ if( $name !== '' ) {
+ $spaces[$name] = $ns;
+ }
+ }
+ foreach( $wgNamespaceAliases as $name => $ns ) {
+ $spaces[$name] = $ns;
+ }
+ foreach( $wgContLang->namespaceAliases as $name => $ns ) {
+ $spaces[$name] = $ns;
+ }
+
+ // We'll need to check for lowercase keys as well,
+ // since we're doing case-sensitive searches in the db.
+ foreach( $spaces as $name => $ns ) {
+ $moreNames = array();
+ $moreNames[] = $wgContLang->uc( $name );
+ $moreNames[] = $wgContLang->ucfirst( $wgContLang->lc( $name ) );
+ $moreNames[] = $wgContLang->ucwords( $name );
+ $moreNames[] = $wgContLang->ucwords( $wgContLang->lc( $name ) );
+ $moreNames[] = $wgContLang->ucwordbreaks( $name );
+ $moreNames[] = $wgContLang->ucwordbreaks( $wgContLang->lc( $name ) );
+ if( !$wgCapitalLinks ) {
+ foreach( $moreNames as $altName ) {
+ $moreNames[] = $wgContLang->lcfirst( $altName );
+ }
+ $moreNames[] = $wgContLang->lcfirst( $name );
+ }
+ foreach( array_unique( $moreNames ) as $altName ) {
+ if( $altName !== $name ) {
+ $spaces[$altName] = $ns;
+ }
+ }
+ }
+
+ ksort( $spaces );
+ asort( $spaces );
+
$ok = true;
- foreach( $spaces as $ns => $name ) {
+ foreach( $spaces as $name => $ns ) {
$ok = $this->checkNamespace( $ns, $name, $fix, $suffix ) && $ok;
}
return $ok;
}
+ private function getInterwikiList() {
+ $result = $this->db->select( 'interwiki', array( 'iw_prefix' ) );
+ while( $row = $this->db->fetchObject( $result ) ) {
+ $prefixes[] = $row->iw_prefix;
+ }
+ $this->db->freeResult( $result );
+ return $prefixes;
+ }
+
function checkNamespace( $ns, $name, $fix, $suffix = '' ) {
- echo "Checking namespace $ns: \"$name\"\n";
- if( $name == '' ) {
- echo "... skipping article namespace\n";
- return true;
+ if( $ns == 0 ) {
+ $header = "Checking interwiki prefix: \"$name\"\n";
+ } else {
+ $header = "Checking namespace $ns: \"$name\"\n";
}
-
+
$conflicts = $this->getConflicts( $ns, $name );
$count = count( $conflicts );
if( $count == 0 ) {
- echo "... no conflicts detected!\n";
+ if( $this->verbose ) {
+ echo $header;
+ echo "... no conflicts detected!\n";
+ }
return true;
}
-
+
+ echo $header;
echo "... $count conflicts detected:\n";
$ok = true;
foreach( $conflicts as $row ) {
return $ok;
}
+ /**
+ * @todo: do this for reals
+ */
+ function checkPrefix( $key, $prefix, $fix, $suffix = '' ) {
+ echo "Checking prefix \"$prefix\" vs namespace $key\n";
+ return $this->checkNamespace( $key, $prefix, $fix, $suffix );
+ }
+
function getConflicts( $ns, $name ) {
- $page = $this->newSchema() ? 'page' : 'cur';
+ $page = 'page';
$table = $this->db->tableName( $page );
-
+
$prefix = $this->db->strencode( $name );
$likeprefix = str_replace( '_', '\\_', $prefix);
-
- $sql = "SELECT {$page}_id AS id,
- {$page}_title AS oldtitle,
- $ns AS namespace,
- TRIM(LEADING '$prefix:' FROM {$page}_title) AS title
+ $encNamespace = $this->db->addQuotes( $ns );
+
+ $titleSql = "TRIM(LEADING '$prefix:' FROM {$page}_title)";
+ if( $ns == 0 ) {
+ // An interwiki; try an alternate encoding with '-' for ':'
+ $titleSql = "CONCAT('$prefix-',$titleSql)";
+ }
+
+ $sql = "SELECT {$page}_id AS id,
+ {$page}_title AS oldtitle,
+ $encNamespace AS namespace,
+ $titleSql AS title
FROM {$table}
WHERE {$page}_namespace=0
AND {$page}_title LIKE '$likeprefix:%'";
-
+
$result = $this->db->query( $sql, 'NamespaceConflictChecker::getConflicts' );
-
+
$set = array();
while( $row = $this->db->fetchObject( $result ) ) {
$set[] = $row;
}
$this->db->freeResult( $result );
-
+
return $set;
}
-
+
function reportConflict( $row, $suffix ) {
- $newTitle = Title::makeTitle( $row->namespace, $row->title );
+ $newTitle = Title::makeTitleSafe( $row->namespace, $row->title );
+ if( is_null($newTitle) || !$newTitle->canExist() ) {
+ // Title is also an illegal title...
+ // For the moment we'll let these slide to cleanupTitles or whoever.
+ printf( "... %d (0,\"%s\")\n",
+ $row->id,
+ $row->oldtitle );
+ echo "... *** cannot resolve automatically; illegal title ***\n";
+ return false;
+ }
+
printf( "... %d (0,\"%s\") -> (%d,\"%s\") [[%s]]\n",
$row->id,
$row->oldtitle,
- $row->namespace,
- $row->title,
+ $newTitle->getNamespace(),
+ $newTitle->getDBkey(),
$newTitle->getPrefixedText() );
-
+
$id = $newTitle->getArticleId();
if( $id ) {
echo "... *** cannot resolve automatically; page exists with ID $id ***\n";
return true;
}
}
-
+
function resolveConflict( $row, $resolvable, $suffix ) {
if( !$resolvable ) {
- $row->title .= $suffix;
- $title = Title::makeTitle( $row->namespace, $row->title );
+ echo "... *** old title {$row->title}\n";
+ while( true ) {
+ $row->title .= $suffix;
+ echo "... *** new title {$row->title}\n";
+ $title = Title::makeTitleSafe( $row->namespace, $row->title );
+ if ( ! $title ) {
+ echo "... !!! invalid title\n";
+ return false;
+ }
+ if ( $id = $title->getArticleId() ) {
+ echo "... *** page exists with ID $id ***\n";
+ } else {
+ break;
+ }
+ }
echo "... *** using suffixed form [[" . $title->getPrefixedText() . "]] ***\n";
}
- $tables = $this->newSchema()
- ? array( 'page' )
- : array( 'cur', 'old' );
+ $tables = array( 'page' );
foreach( $tables as $table ) {
$this->resolveConflictOn( $row, $table );
}
return true;
}
-
+
function resolveConflictOn( $row, $table ) {
- $fname = 'NamespaceConflictChecker::resolveConflictOn';
echo "... resolving on $table... ";
+ $newTitle = Title::makeTitleSafe( $row->namespace, $row->title );
$this->db->update( $table,
array(
- "{$table}_namespace" => $row->namespace,
- "{$table}_title" => $row->title,
+ "{$table}_namespace" => $newTitle->getNamespace(),
+ "{$table}_title" => $newTitle->getDBkey(),
),
array(
"{$table}_namespace" => 0,
"{$table}_title" => $row->oldtitle,
),
- $fname );
+ __METHOD__ );
echo "ok.\n";
return true;
}
-
- function newSchema() {
- return class_exists( 'Revision' );
- }
}
$wgTitle = Title::newFromText( 'Namespace title conflict cleanup script' );
+$verbose = isset( $options['verbose'] );
$fix = isset( $options['fix'] );
$suffix = isset( $options['suffix'] ) ? $options['suffix'] : '';
-$dbw =& wfGetDB( DB_MASTER );
-$duper = new NamespaceConflictChecker( $dbw );
-$retval = $duper->checkAll( $fix, $suffix );
+$prefix = isset( $options['prefix'] ) ? $options['prefix'] : '';
+$key = isset( $options['key'] ) ? intval( $options['key'] ) : 0;
+
+$dbw = wfGetDB( DB_MASTER );
+$duper = new NamespaceConflictChecker( $dbw, $verbose );
+
+if( $prefix ) {
+ $retval = $duper->checkPrefix( $key, $prefix, $fix, $suffix );
+} else {
+ $retval = $duper->checkAll( $fix, $suffix );
+}
if( $retval ) {
echo "\nLooks good!\n";
exit( -1 );
}
-?>
\ No newline at end of file
+