2003-08-31 09:46:37 +00:00
|
|
|
<?
|
|
|
|
|
|
|
|
|
|
# This class encapsulates "magic words" such as #redirect, __NOTOC__, etc.
# Usage:
#     if (MagicWord::get( MAG_REDIRECT )->match( $text ) )
#
# Possible future improvements:
#   * Simultaneous searching for a number of magic words
#   * $wgMagicWords in shared memory
#
# Please avoid reading the data out of one of these objects and then writing
# special case code. If possible, add another match()-like function here.
|
|
|
|
|
|
|
|
|
|
# Scratch flag shared by MagicWord::matchAndRemove() and pregRemoveAndRecord():
# matchAndRemove() resets it to false before each removal pass and the
# callback sets it to true when it is invoked for a match.
/*private*/ $wgMagicFound = false;
|
|
|
|
|
|
|
|
|
|
# Represents one "magic word": an ID plus a list of textual synonyms, with
# lazily built regular expressions for finding, removing and replacing the
# word in text.
class MagicWord {
	# mId: magic word ID; mSynonyms: array of literal spellings;
	# mCaseSensitive: whether matching is case sensitive;
	# mRegex: "/syn1|syn2/" pattern, "" until initRegex() has run.
	/*private*/ var $mId, $mSynonyms, $mCaseSensitive, $mRegex;
	# mRegexStart: pattern anchored at the string start;
	# mBaseRegex: the bare alternation without delimiters or flags;
	# mVariableRegex: mRegex with the "$1" placeholder turned into a capture group.
	/*private*/ var $mRegexStart, $mBaseRegex, $mVariableRegex;
	# Like mVariableRegex, but anchored at both ends of the string.
	/*private*/ var $mVariableStartToEndRegex;
	# True if the last replace()/substituteCallback() call changed its input.
	/*private*/ var $mModified;

	# Constructor.
	#   $id  - magic word ID
	#   $syn - a synonym string or an array of synonym strings
	#   $cs  - true if matching should be case sensitive
	# Declared before MagicWord() so that PHP 5 does not complain about a
	# redefined constructor; PHP 8 only recognises this form.
	function __construct($id = 0, $syn = "", $cs = false)
	{
		$this->mId = $id;
		$this->mSynonyms = (array)$syn;
		$this->mCaseSensitive = $cs;
		$this->mRegex = "";
		$this->mRegexStart = "";
		$this->mBaseRegex = "";
		$this->mVariableRegex = "";
		$this->mVariableStartToEndRegex = "";
		$this->mModified = false;
	}

	# Old-style (PHP 4) constructor, kept so existing callers and PHP 4 keep
	# working. It simply delegates to __construct().
	function MagicWord($id = 0, $syn = "", $cs = false)
	{
		$this->__construct( $id, $syn, $cs );
	}

	# Factory: creates an object representing an ID
	# Objects are cached in the global $wgMagicWords, keyed by ID, so each
	# magic word is only loaded once.
	/*static*/ function &get( $id )
	{
		global $wgMagicWords;

		# The cache is not initialised in this file; make sure it is an
		# array before array_key_exists() is applied to it.
		if ( !is_array( $wgMagicWords ) ) {
			$wgMagicWords = array();
		}

		if (!array_key_exists( $id, $wgMagicWords ) ) {
			$mw = new MagicWord();
			$mw->load( $id );
			$wgMagicWords[$id] = $mw;
		}
		return $wgMagicWords[$id];
	}

	# Initialises this object with an ID
	# The remaining data is filled in by $wgLang->getMagic(), which receives
	# this object.
	function load( $id )
	{
		global $wgLang;
		$this->mId = $id;
		$wgLang->getMagic( $this );
	}

	# Preliminary initialisation
	# Builds all regex variants from the synonym list.
	/* private */ function initRegex()
	{
		# Characters allowed in the variable ($1) part of a word
		$variableClass = "A-Za-z0-9_\-\x80-\xff";

		# Quote each synonym, including the "/" delimiter used below, so that
		# a synonym containing a slash cannot terminate the pattern early.
		$escSyn = array();
		foreach ( (array)$this->mSynonyms as $syn ) {
			$escSyn[] = preg_quote( $syn, "/" );
		}
		$this->mBaseRegex = implode( "|", $escSyn );
		$case = $this->mCaseSensitive ? "" : "i";
		$this->mRegex = "/{$this->mBaseRegex}/{$case}";

		# The alternation must be grouped, otherwise "^" would only apply to
		# the first synonym and "$" only to the last one.
		$this->mRegexStart = "/^(?:{$this->mBaseRegex})/{$case}";

		# preg_quote() turned "$1" into "\$1"; swap it for a capture group.
		$this->mVariableRegex = str_replace( "\\$1", "([$variableClass]*)", $this->mRegex );
		$this->mVariableStartToEndRegex = str_replace( "\\$1", "([$variableClass]*)",
			"/^(?:{$this->mBaseRegex})$/{$case}" );
	}

	# Gets a regex representing matching the word
	function getRegex()
	{
		if ($this->mRegex == "" ) {
			$this->initRegex();
		}
		return $this->mRegex;
	}

	# Gets a regex matching the word, if it is at the
	# string start
	function getRegexStart()
	{
		if ($this->mRegex == "" ) {
			$this->initRegex();
		}
		return $this->mRegexStart;
	}

	# regex without the slashes and what not
	function getBaseRegex()
	{
		if ($this->mRegex == "") {
			$this->initRegex();
		}
		return $this->mBaseRegex;
	}

	# Returns true if the text contains the word
	# (the raw preg_match() result is returned: 1 on match, 0 otherwise)
	function match( $text ) {
		return preg_match( $this->getRegex(), $text );
	}

	# Returns true if the text starts with the word
	# (the raw preg_match() result is returned: 1 on match, 0 otherwise)
	function matchStart( $text )
	{
		return preg_match( $this->getRegexStart(), $text );
	}

	# Returns NULL if there's no match, the value of $1 otherwise
	# The return code is the matched string, if there's no variable
	# part in the regex and the matched variable part ($1) if there
	# is one.
	function matchVariableStartToEnd( $text ) {
		$matches = array();
		$matchcount = preg_match( $this->getVariableStartToEndRegex(), $text, $matches );
		if ( !$matchcount ) {
			return NULL;
		}
		$groups = count( $matches );
		if ( $groups == 1 ) {
			# No variable part: return the whole match
			return $matches[0];
		}
		# Every synonym contributes its own capture group, and the groups of
		# synonyms that did not match are blank. Return the first group that
		# actually captured something.
		for ( $i = 1; $i < $groups; $i++ ) {
			if ( $matches[$i] !== "" ) {
				return $matches[$i];
			}
		}
		# The variable part itself was empty
		return $matches[1];
	}

	# Returns true if the text matches the word, and alters the
	# input string, removing all instances of the word
	# The result is communicated through the global $wgMagicFound, which the
	# pregRemoveAndRecord() callback sets for every match.
	function matchAndRemove( &$text )
	{
		global $wgMagicFound;
		$wgMagicFound = false;
		$text = preg_replace_callback( $this->getRegex(), "pregRemoveAndRecord", $text );
		return $wgMagicFound;
	}

	# Replaces the word with something else
	# Records whether anything changed; see getWasModified().
	function replace( $replacement, $subject )
	{
		$res = preg_replace( $this->getRegex(), $replacement, $subject );
		$this->mModified = !($res === $subject);
		return $res;
	}

	# Variable handling: {{SUBST:xxx}} style words
	# Calls back a function to determine what to replace xxx with
	# Input word must contain $1
	# Records whether anything changed; see getWasModified().
	function substituteCallback( $text, $callback ) {
		$regex = $this->getVariableRegex();
		$res = preg_replace_callback( $regex, $callback, $text );
		$this->mModified = !($res === $text);
		return $res;
	}

	# Matches the word, where $1 is a wildcard
	function getVariableRegex()
	{
		if ( $this->mVariableRegex == "" ) {
			$this->initRegex();
		}
		return $this->mVariableRegex;
	}

	# Matches the entire string, where $1 is a wildcard
	function getVariableStartToEndRegex()
	{
		if ( $this->mVariableStartToEndRegex == "" ) {
			$this->initRegex();
		}
		return $this->mVariableStartToEndRegex;
	}

	# Accesses the synonym list directly
	function getSynonym( $i ) {
		return $this->mSynonyms[$i];
	}

	# Returns true if the last call to replace() or substituteCallback()
	# returned a modified text, otherwise false.
	function getWasModified(){
		return $this->mModified;
	}

	# $magicarr is an associative array of (magic word ID => replacement)
	# This method uses the php feature to do several replacements at the same time,
	# thereby gaining some efficiency. The result is placed in the out variable
	# $result. The return value is true if something was replaced.
	/* static */ function replaceMultiple( $magicarr, $subject, &$result ){
		$search = array();
		$replace = array();
		foreach( $magicarr as $id => $replacement ){
			$mw = MagicWord::get( $id );
			$search[] = $mw->getRegex();
			$replace[] = $replacement;
		}

		$result = preg_replace( $search, $replace, $subject );
		return !($result === $subject);
	}
}
|
|
|
|
|
|
2003-12-14 14:25:44 +00:00
|
|
|
# Callback handed to preg_replace_callback() by MagicWord::matchAndRemove().
# Records in the global $wgMagicFound that it was invoked for a match and
# returns the empty string, so the matched text is dropped from the subject.
/*private*/ function pregRemoveAndRecord( $match )
{
	$GLOBALS['wgMagicFound'] = true;
	return "";
}
|
|
|
|
|
|
2003-09-01 13:13:56 +00:00
|
|
|
?>
|