2004-02-18 02:15:00 +00:00
|
|
|
<?php
|
2004-09-02 23:28:24 +00:00
|
|
|
/**
|
|
|
|
|
* File for magic words
|
2010-08-08 14:23:14 +00:00
|
|
|
*
|
2008-03-12 17:37:03 +00:00
|
|
|
* See docs/magicword.txt
|
|
|
|
|
*
|
WARNING: HUGE COMMIT
Doxygen documentation update:
* Changed alls @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitely decalred for file descriptions, otherwise doxygen will think that the comment document the first class, variabled, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>
Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage
One more thing: there are still a lot of warnings when generating the doc.
2008-05-20 17:13:28 +00:00
|
|
|
* @file
|
|
|
|
|
* @ingroup Parser
|
2004-09-02 23:28:24 +00:00
|
|
|
*/
|
2003-08-31 09:46:37 +00:00
|
|
|
|
2004-09-02 23:28:24 +00:00
|
|
|
/**
|
|
|
|
|
* This class encapsulates "magic words" such as #redirect, __NOTOC__, etc.
|
|
|
|
|
* Usage:
|
2006-07-14 15:39:23 +00:00
|
|
|
* if (MagicWord::get( 'redirect' )->match( $text ) )
|
2006-01-07 13:09:30 +00:00
|
|
|
*
|
|
|
|
|
* Possible future improvements:
|
2004-09-02 23:28:24 +00:00
|
|
|
* * Simultaneous searching for a number of magic words
|
2006-07-14 16:36:35 +00:00
|
|
|
* * MagicWord::$mObjects in shared memory
|
2004-09-02 23:28:24 +00:00
|
|
|
*
|
2006-01-07 13:09:30 +00:00
|
|
|
* Please avoid reading the data out of one of these objects and then writing
|
2004-09-02 23:28:24 +00:00
|
|
|
* special case code. If possible, add another match()-like function here.
|
2004-09-03 23:00:01 +00:00
|
|
|
*
|
2008-04-14 07:45:50 +00:00
|
|
|
* To add magic words in an extension, use the LanguageGetMagic hook. For
|
2006-07-14 16:36:35 +00:00
|
|
|
* magic words which are also Parser variables, add a MagicWordwgVariableIDs
|
|
|
|
|
* hook. Use string keys.
|
|
|
|
|
*
|
WARNING: HUGE COMMIT
Doxygen documentation update:
* Changed alls @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitely decalred for file descriptions, otherwise doxygen will think that the comment document the first class, variabled, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>
Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage
One more thing: there are still a lot of warnings when generating the doc.
2008-05-20 17:13:28 +00:00
|
|
|
* @ingroup Parser
|
2004-09-02 23:28:24 +00:00
|
|
|
*/
|
2003-08-31 09:46:37 +00:00
|
|
|
class MagicWord {
	/**#@+
	 * @private
	 */
	/** Magic word ID, list of synonyms, case-sensitivity flag and full regex */
	public $mId, $mSynonyms, $mCaseSensitive, $mRegex;
	/** Lazily built regex fragments; empty string means "not built yet" */
	public $mRegexStart, $mBaseRegex, $mVariableRegex;
	/**
	 * Anchored variable regex. Declared explicitly: it used to be created
	 * on the fly by the constructor as an undeclared (dynamic) property.
	 */
	public $mVariableStartToEndRegex;
	/** Result flags of the last replace()/substituteCallback() and match*AndRemove() calls */
	public $mModified, $mFound;

	/** Whether the MagicWordwgVariableIDs hook has already been run */
	static public $mVariableIDsInitialised = false;

	/** IDs of the magic words which are also parser variables */
	static public $mVariableIDs = array(
		'currentmonth',
		'currentmonth1',
		'currentmonthname',
		'currentmonthnamegen',
		'currentmonthabbrev',
		'currentday',
		'currentday2',
		'currentdayname',
		'currentyear',
		'currenttime',
		'currenthour',
		'localmonth',
		'localmonth1',
		'localmonthname',
		'localmonthnamegen',
		'localmonthabbrev',
		'localday',
		'localday2',
		'localdayname',
		'localyear',
		'localtime',
		'localhour',
		'numberofarticles',
		'numberoffiles',
		'numberofedits',
		'articlepath',
		'sitename',
		'server',
		'servername',
		'scriptpath',
		'stylepath',
		'pagename',
		'pagenamee',
		'fullpagename',
		'fullpagenamee',
		'namespace',
		'namespacee',
		'currentweek',
		'currentdow',
		'localweek',
		'localdow',
		'revisionid',
		'revisionday',
		'revisionday2',
		'revisionmonth',
		'revisionmonth1',
		'revisionyear',
		'revisiontimestamp',
		'revisionuser',
		'subpagename',
		'subpagenamee',
		'talkspace',
		'talkspacee',
		'subjectspace',
		'subjectspacee',
		'talkpagename',
		'talkpagenamee',
		'subjectpagename',
		'subjectpagenamee',
		'numberofusers',
		'numberofactiveusers',
		'numberofpages',
		'currentversion',
		'basepagename',
		'basepagenamee',
		'currenttimestamp',
		'localtimestamp',
		'directionmark',
		'contentlanguage',
		'numberofadmins',
		'numberofviews',
	);

	/* Array of caching hints for ParserCache */
	static public $mCacheTTLs = array (
		'currentmonth' => 86400,
		'currentmonth1' => 86400,
		'currentmonthname' => 86400,
		'currentmonthnamegen' => 86400,
		'currentmonthabbrev' => 86400,
		'currentday' => 3600,
		'currentday2' => 3600,
		'currentdayname' => 3600,
		'currentyear' => 86400,
		'currenttime' => 3600,
		'currenthour' => 3600,
		'localmonth' => 86400,
		'localmonth1' => 86400,
		'localmonthname' => 86400,
		'localmonthnamegen' => 86400,
		'localmonthabbrev' => 86400,
		'localday' => 3600,
		'localday2' => 3600,
		'localdayname' => 3600,
		'localyear' => 86400,
		'localtime' => 3600,
		'localhour' => 3600,
		'numberofarticles' => 3600,
		'numberoffiles' => 3600,
		'numberofedits' => 3600,
		'currentweek' => 3600,
		'currentdow' => 3600,
		'localweek' => 3600,
		'localdow' => 3600,
		'numberofusers' => 3600,
		'numberofactiveusers' => 3600,
		'numberofpages' => 3600,
		'currentversion' => 86400,
		'currenttimestamp' => 3600,
		'localtimestamp' => 3600,
		'pagesinnamespace' => 3600,
		'numberofadmins' => 3600,
		'numberofviews' => 3600,
		'numberingroup' => 3600,
	);

	/** IDs of the double-underscore behaviour switches */
	static public $mDoubleUnderscoreIDs = array(
		'notoc',
		'nogallery',
		'forcetoc',
		'toc',
		'noeditsection',
		'newsectionlink',
		'nonewsectionlink',
		'hiddencat',
		'index',
		'noindex',
		'staticredirect',
		'notitleconvert',
		'nocontentconvert',
	);

	/** IDs of the substitution modifiers */
	static public $mSubstIDs = array(
		'subst',
		'safesubst',
	);

	/** Cache of MagicWord objects created by get(), keyed by ID */
	static public $mObjects = array();
	/** Lazily created MagicWordArray of the double-underscore words */
	static public $mDoubleUnderscoreArray = null;

	/**#@-*/

	/**
	 * @param $id Mixed: magic word ID
	 * @param $syn Mixed: a synonym or an array of synonyms (cast to array)
	 * @param $cs Boolean: whether matching is case-sensitive
	 */
	public function __construct( $id = 0, $syn = '', $cs = false ) {
		$this->mId = $id;
		$this->mSynonyms = (array)$syn;
		$this->mCaseSensitive = $cs;
		// Empty strings mark the regexes as "not built yet"; see initRegex()
		$this->mRegex = '';
		$this->mRegexStart = '';
		$this->mVariableRegex = '';
		$this->mVariableStartToEndRegex = '';
		$this->mModified = false;
	}

	/**
	 * Factory: creates an object representing an ID.
	 * Objects are cached in self::$mObjects, so each ID is loaded only once.
	 * @static
	 * @param $id Mixed: magic word ID
	 * @return MagicWord
	 */
	public static function &get( $id ) {
		wfProfileIn( __METHOD__ );
		if ( !isset( self::$mObjects[$id] ) ) {
			$mw = new MagicWord();
			$mw->load( $id );
			self::$mObjects[$id] = $mw;
		}
		wfProfileOut( __METHOD__ );
		return self::$mObjects[$id];
	}

	/**
	 * Get an array of parser variable IDs.
	 * The hooks are run on the first call only.
	 * @return Array
	 */
	public static function getVariableIDs() {
		if ( !self::$mVariableIDsInitialised ) {
			# Deprecated constant definition hook, available for extensions that need it
			$magicWords = array();
			wfRunHooks( 'MagicWordMagicWords', array( &$magicWords ) );
			foreach ( $magicWords as $word ) {
				define( $word, $word );
			}

			# Get variable IDs
			wfRunHooks( 'MagicWordwgVariableIDs', array( &self::$mVariableIDs ) );
			self::$mVariableIDsInitialised = true;
		}
		return self::$mVariableIDs;
	}

	/**
	 * Get an array of parser substitution modifier IDs
	 * @return Array
	 */
	public static function getSubstIDs() {
		return self::$mSubstIDs;
	}

	/**
	 * Allow external reads of TTL array
	 * @param $id String: magic word ID
	 * @return Integer: the caching hint for $id, or -1 if there is none
	 */
	public static function getCacheTTL( $id ) {
		if ( array_key_exists( $id, self::$mCacheTTLs ) ) {
			return self::$mCacheTTLs[$id];
		} else {
			return -1;
		}
	}

	/**
	 * Get a MagicWordArray of double-underscore entities
	 * @return MagicWordArray
	 */
	public static function getDoubleUnderscoreArray() {
		if ( is_null( self::$mDoubleUnderscoreArray ) ) {
			self::$mDoubleUnderscoreArray = new MagicWordArray( self::$mDoubleUnderscoreIDs );
		}
		return self::$mDoubleUnderscoreArray;
	}

	/**
	 * Clear the self::$mObjects variable
	 * For use in parser tests
	 */
	public static function clearCache() {
		self::$mObjects = array();
	}

	/**
	 * Initialises this object with an ID.
	 * The content language is asked to fill in the data for the word.
	 * @param $id Mixed: magic word ID
	 */
	public function load( $id ) {
		global $wgContLang;
		$this->mId = $id;
		$wgContLang->getMagic( $this );
		if ( !$this->mSynonyms ) {
			// Unknown magic word: log it rather than throwing, and fall back
			// to a placeholder synonym so the regexes can still be built.
			$this->mSynonyms = array( 'dkjsagfjsgashfajsh' );
			wfDebugLog( 'exception', "Error: invalid magic word '$id'\n" );
		}
	}

	/**
	 * Preliminary initialisation: builds all regexes from the synonym list
	 * @private
	 */
	public function initRegex() {
		// Sort the synonyms by length, descending, so that the longest synonym
		// matches in precedence to the shortest
		$synonyms = $this->mSynonyms;
		usort( $synonyms, array( $this, 'compareStringLength' ) );

		$escSyn = array();
		foreach ( $synonyms as $synonym ) {
			// In case a magic word contains /, like that's going to happen;)
			$escSyn[] = preg_quote( $synonym, '/' );
		}
		$this->mBaseRegex = implode( '|', $escSyn );

		$case = $this->mCaseSensitive ? '' : 'iu';
		$this->mRegex = "/{$this->mBaseRegex}/{$case}";
		$this->mRegexStart = "/^(?:{$this->mBaseRegex})/{$case}";
		// preg_quote() turned "$1" into "\$1"; swap it for a capturing wildcard
		$this->mVariableRegex = str_replace( "\\$1", "(.*?)", $this->mRegex );
		$this->mVariableStartToEndRegex = str_replace( "\\$1", "(.*?)",
			"/^(?:{$this->mBaseRegex})$/{$case}" );
	}

	/**
	 * A comparison function that returns -1, 0 or 1 depending on whether the
	 * first string is longer, the same length or shorter than the second
	 * string.
	 * @param $s1 String
	 * @param $s2 String
	 * @return Integer
	 */
	public function compareStringLength( $s1, $s2 ) {
		$l1 = strlen( $s1 );
		$l2 = strlen( $s2 );
		if ( $l1 < $l2 ) {
			return 1;
		} elseif ( $l1 > $l2 ) {
			return -1;
		} else {
			return 0;
		}
	}

	/**
	 * Gets a regex representing matching the word
	 * @return String
	 */
	public function getRegex() {
		if ( $this->mRegex == '' ) {
			$this->initRegex();
		}
		return $this->mRegex;
	}

	/**
	 * Gets the regexp case modifier to use, i.e. i or nothing, to be used if
	 * one is using MagicWord::getBaseRegex(), otherwise it'll be included in
	 * the complete expression
	 * @return String
	 */
	public function getRegexCase() {
		if ( $this->mRegex === '' ) {
			$this->initRegex();
		}

		return $this->mCaseSensitive ? '' : 'iu';
	}

	/**
	 * Gets a regex matching the word, if it is at the string start
	 * @return String
	 */
	public function getRegexStart() {
		if ( $this->mRegex == '' ) {
			$this->initRegex();
		}
		return $this->mRegexStart;
	}

	/**
	 * regex without the slashes and what not
	 * @return String
	 */
	public function getBaseRegex() {
		if ( $this->mRegex == '' ) {
			$this->initRegex();
		}
		return $this->mBaseRegex;
	}

	/**
	 * Returns true if the text contains the word
	 * @param $text String
	 * @return bool
	 */
	public function match( $text ) {
		return (bool)preg_match( $this->getRegex(), $text );
	}

	/**
	 * Returns true if the text starts with the word
	 * @param $text String
	 * @return bool
	 */
	public function matchStart( $text ) {
		return (bool)preg_match( $this->getRegexStart(), $text );
	}

	/**
	 * Returns NULL if there's no match, the value of $1 otherwise
	 * The return code is the matched string, if there's no variable
	 * part in the regex and the matched variable part ($1) if there
	 * is one.
	 * @param $text String
	 * @return String|null
	 */
	public function matchVariableStartToEnd( $text ) {
		$matches = array();
		$matchcount = preg_match( $this->getVariableStartToEndRegex(), $text, $matches );
		if ( $matchcount == 0 ) {
			return null;
		}

		# multiple matched parts (variable match); some will be empty because of
		# synonyms. The variable will be the second non-empty one so remove any
		# blank elements and re-sort the indices.
		# See also bug 6526
		#
		# Only empty strings are dropped. A bare array_filter() would also
		# throw away the string "0", losing a legitimate variable value.
		$nonEmpty = array();
		foreach ( $matches as $part ) {
			if ( $part !== '' ) {
				$nonEmpty[] = $part;
			}
		}

		if ( count( $nonEmpty ) > 1 ) {
			return $nonEmpty[1];
		}
		// A completely empty match yields null, as it always has
		return isset( $nonEmpty[0] ) ? $nonEmpty[0] : null;
	}

	/**
	 * Returns true if the text matches the word, and alters the
	 * input string, removing all instances of the word
	 * @param $text String: modified in place
	 * @return bool
	 */
	public function matchAndRemove( &$text ) {
		$this->mFound = false;
		$text = preg_replace_callback( $this->getRegex(), array( $this, 'pregRemoveAndRecord' ), $text );
		return $this->mFound;
	}

	/**
	 * Returns true if the text starts with the word, and alters the
	 * input string, removing the word from its start
	 * @param $text String: modified in place
	 * @return bool
	 */
	public function matchStartAndRemove( &$text ) {
		$this->mFound = false;
		$text = preg_replace_callback( $this->getRegexStart(), array( $this, 'pregRemoveAndRecord' ), $text );
		return $this->mFound;
	}

	/**
	 * Used in matchAndRemove(): records that a match happened and
	 * replaces it with nothing
	 * @private
	 * @return String: always the empty string
	 **/
	public function pregRemoveAndRecord() {
		$this->mFound = true;
		return '';
	}

	/**
	 * Replaces the word with something else
	 * @param $replacement String: literal replacement text
	 * @param $subject String
	 * @param $limit Integer: maximum number of replacements, -1 for no limit
	 * @return String
	 */
	public function replace( $replacement, $subject, $limit = -1 ) {
		$res = preg_replace( $this->getRegex(), StringUtils::escapeRegexReplacement( $replacement ), $subject, $limit );
		$this->mModified = !( $res === $subject );
		return $res;
	}

	/**
	 * Variable handling: {{SUBST:xxx}} style words
	 * Calls back a function to determine what to replace xxx with
	 * Input word must contain $1
	 * @param $text String
	 * @param $callback Callback
	 * @return String
	 */
	public function substituteCallback( $text, $callback ) {
		$res = preg_replace_callback( $this->getVariableRegex(), $callback, $text );
		$this->mModified = !( $res === $text );
		return $res;
	}

	/**
	 * Matches the word, where $1 is a wildcard
	 * @return String
	 */
	public function getVariableRegex() {
		if ( $this->mVariableRegex == '' ) {
			$this->initRegex();
		}
		return $this->mVariableRegex;
	}

	/**
	 * Matches the entire string, where $1 is a wildcard
	 * @return String
	 */
	public function getVariableStartToEndRegex() {
		if ( $this->mVariableStartToEndRegex == '' ) {
			$this->initRegex();
		}
		return $this->mVariableStartToEndRegex;
	}

	/**
	 * Accesses the synonym list directly
	 * @param $i Integer: index into the synonym list
	 * @return String
	 */
	public function getSynonym( $i ) {
		return $this->mSynonyms[$i];
	}

	/**
	 * @return Array: the full synonym list
	 */
	public function getSynonyms() {
		return $this->mSynonyms;
	}

	/**
	 * Returns true if the last call to replace() or substituteCallback()
	 * returned a modified text, otherwise false.
	 * @return bool
	 */
	public function getWasModified() {
		return $this->mModified;
	}

	/**
	 * $magicarr is an associative array of (magic word ID => replacement)
	 * This method uses the php feature to do several replacements at the same time,
	 * thereby gaining some efficiency. The result is placed in the out variable
	 * $result. The return value is true if something was replaced.
	 *
	 * Declared static to match its documentation; it never used $this, and
	 * calls through an instance keep working.
	 * @static
	 * @param $magicarr Array
	 * @param $subject String
	 * @param $result String: out parameter
	 * @return bool
	 **/
	public static function replaceMultiple( $magicarr, $subject, &$result ) {
		$search = array();
		$replace = array();
		foreach ( $magicarr as $id => $replacement ) {
			$mw = MagicWord::get( $id );
			$search[] = $mw->getRegex();
			$replace[] = $replacement;
		}

		$result = preg_replace( $search, $replace, $subject );
		return !( $result === $subject );
	}

	/**
	 * Adds all the synonyms of this MagicWord to an array, to allow quick
	 * lookup in a list of magic words
	 * @param $array Array: modified in place, keyed by lower-cased synonym
	 * @param $value Mixed: value stored under every synonym
	 */
	public function addToArray( &$array, $value ) {
		global $wgContLang;
		foreach ( $this->mSynonyms as $syn ) {
			$array[$wgContLang->lc( $syn )] = $value;
		}
	}

	/**
	 * @return bool
	 */
	public function isCaseSensitive() {
		return $this->mCaseSensitive;
	}

	/**
	 * @return Mixed: the magic word ID
	 */
	public function getId() {
		return $this->mId;
	}
}
|
|
|
|
|
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
/**
|
|
|
|
|
* Class for handling an array of magic words
|
WARNING: HUGE COMMIT
Doxygen documentation update:
* Changed alls @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitely decalred for file descriptions, otherwise doxygen will think that the comment document the first class, variabled, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>
Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage
One more thing: there are still a lot of warnings when generating the doc.
2008-05-20 17:13:28 +00:00
|
|
|
* @ingroup Parser
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
*/
|
|
|
|
|
class MagicWordArray {
|
|
|
|
|
var $names = array();
|
|
|
|
|
var $hash;
|
|
|
|
|
var $baseRegex, $regex;
|
2008-02-20 08:53:12 +00:00
|
|
|
var $matches;
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
|
|
|
|
|
function __construct( $names = array() ) {
	// Initial list of magic word names; the derived lookup structures
	// are only built when first requested.
	$initialNames = $names;
	$this->names = $initialNames;
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Add a magic word by name
|
|
|
|
|
*/
|
|
|
|
|
public function add( $name ) {
|
|
|
|
|
$this->names[] = $name;
|
|
|
|
|
$this->hash = $this->baseRegex = $this->regex = null;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Add a number of magic words by name
|
|
|
|
|
*/
|
|
|
|
|
public function addArray( $names ) {
|
|
|
|
|
$this->names = array_merge( $this->names, array_values( $names ) );
|
|
|
|
|
$this->hash = $this->baseRegex = $this->regex = null;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Get a 2-d hashtable for this array
|
|
|
|
|
*/
|
|
|
|
|
function getHash() {
|
|
|
|
|
if ( is_null( $this->hash ) ) {
|
|
|
|
|
global $wgContLang;
|
|
|
|
|
$this->hash = array( 0 => array(), 1 => array() );
|
|
|
|
|
foreach ( $this->names as $name ) {
|
|
|
|
|
$magic = MagicWord::get( $name );
|
|
|
|
|
$case = intval( $magic->isCaseSensitive() );
|
|
|
|
|
foreach ( $magic->getSynonyms() as $syn ) {
|
|
|
|
|
if ( !$case ) {
|
|
|
|
|
$syn = $wgContLang->lc( $syn );
|
|
|
|
|
}
|
|
|
|
|
$this->hash[$case][$syn] = $name;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return $this->hash;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Get the base regex
|
|
|
|
|
*/
|
|
|
|
|
function getBaseRegex() {
|
|
|
|
|
if ( is_null( $this->baseRegex ) ) {
|
|
|
|
|
$this->baseRegex = array( 0 => '', 1 => '' );
|
|
|
|
|
foreach ( $this->names as $name ) {
|
|
|
|
|
$magic = MagicWord::get( $name );
|
|
|
|
|
$case = intval( $magic->isCaseSensitive() );
|
|
|
|
|
foreach ( $magic->getSynonyms() as $i => $syn ) {
|
|
|
|
|
$group = "(?P<{$i}_{$name}>" . preg_quote( $syn, '/' ) . ')';
|
|
|
|
|
if ( $this->baseRegex[$case] === '' ) {
|
|
|
|
|
$this->baseRegex[$case] = $group;
|
|
|
|
|
} else {
|
|
|
|
|
$this->baseRegex[$case] .= '|' . $group;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return $this->baseRegex;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2010-02-15 09:34:51 +00:00
|
|
|
* Get an unanchored regex that does not match parameters
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
*/
|
|
|
|
|
function getRegex() {
|
|
|
|
|
if ( is_null( $this->regex ) ) {
|
|
|
|
|
$base = $this->getBaseRegex();
|
|
|
|
|
$this->regex = array( '', '' );
|
|
|
|
|
if ( $this->baseRegex[0] !== '' ) {
|
|
|
|
|
$this->regex[0] = "/{$base[0]}/iuS";
|
|
|
|
|
}
|
|
|
|
|
if ( $this->baseRegex[1] !== '' ) {
|
|
|
|
|
$this->regex[1] = "/{$base[1]}/S";
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return $this->regex;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2010-02-15 09:34:51 +00:00
|
|
|
* Get a regex for matching variables with parameters
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
*/
|
|
|
|
|
function getVariableRegex() {
|
|
|
|
|
return str_replace( "\\$1", "(.*?)", $this->getRegex() );
|
|
|
|
|
}
|
|
|
|
|
|
2010-01-30 12:46:16 +00:00
|
|
|
/**
|
2010-02-15 09:34:51 +00:00
|
|
|
* Get a regex anchored to the start of the string that does not match parameters
|
2010-01-30 12:46:16 +00:00
|
|
|
*/
|
|
|
|
|
function getRegexStart() {
|
|
|
|
|
$base = $this->getBaseRegex();
|
|
|
|
|
$newRegex = array( '', '' );
|
|
|
|
|
if ( $base[0] !== '' ) {
|
2010-02-15 09:34:51 +00:00
|
|
|
$newRegex[0] = "/^(?:{$base[0]})/iuS";
|
2010-01-30 12:46:16 +00:00
|
|
|
}
|
|
|
|
|
if ( $base[1] !== '' ) {
|
2010-02-15 09:34:51 +00:00
|
|
|
$newRegex[1] = "/^(?:{$base[1]})/S";
|
2010-01-30 12:46:16 +00:00
|
|
|
}
|
|
|
|
|
return $newRegex;
|
|
|
|
|
}
|
|
|
|
|
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
/**
|
2010-02-15 09:34:51 +00:00
|
|
|
* Get an anchored regex for matching variables with parameters
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
*/
|
|
|
|
|
function getVariableStartToEndRegex() {
|
|
|
|
|
$base = $this->getBaseRegex();
|
|
|
|
|
$newRegex = array( '', '' );
|
|
|
|
|
if ( $base[0] !== '' ) {
|
|
|
|
|
$newRegex[0] = str_replace( "\\$1", "(.*?)", "/^(?:{$base[0]})$/iuS" );
|
|
|
|
|
}
|
|
|
|
|
if ( $base[1] !== '' ) {
|
|
|
|
|
$newRegex[1] = str_replace( "\\$1", "(.*?)", "/^(?:{$base[1]})$/S" );
|
|
|
|
|
}
|
|
|
|
|
return $newRegex;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Parse a match array from preg_match
|
2008-02-20 08:53:12 +00:00
|
|
|
* Returns array(magic word ID, parameter value)
|
|
|
|
|
* If there is no parameter value, that element will be false.
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
*/
|
|
|
|
|
function parseMatch( $m ) {
|
|
|
|
|
reset( $m );
|
|
|
|
|
while ( list( $key, $value ) = each( $m ) ) {
|
|
|
|
|
if ( $key === 0 || $value === '' ) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
$parts = explode( '_', $key, 2 );
|
|
|
|
|
if ( count( $parts ) != 2 ) {
|
|
|
|
|
// This shouldn't happen
|
|
|
|
|
// continue;
|
|
|
|
|
throw new MWException( __METHOD__ . ': bad parameter name' );
|
|
|
|
|
}
|
2007-08-21 03:57:54 +00:00
|
|
|
list( /* $synIndex */, $magicName ) = $parts;
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
$paramValue = next( $m );
|
|
|
|
|
return array( $magicName, $paramValue );
|
|
|
|
|
}
|
|
|
|
|
// This shouldn't happen either
|
|
|
|
|
throw new MWException( __METHOD__.': parameter not found' );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Match some text, with parameter capture
|
2008-04-14 07:45:50 +00:00
|
|
|
* Returns an array with the magic word name in the first element and the
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
* parameter in the second element.
|
|
|
|
|
* Both elements are false if there was no match.
|
|
|
|
|
*/
|
|
|
|
|
public function matchVariableStartToEnd( $text ) {
|
|
|
|
|
$regexes = $this->getVariableStartToEndRegex();
|
2007-08-21 03:57:54 +00:00
|
|
|
foreach ( $regexes as $regex ) {
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
if ( $regex !== '' ) {
|
|
|
|
|
$m = false;
|
|
|
|
|
if ( preg_match( $regex, $text, $m ) ) {
|
|
|
|
|
return $this->parseMatch( $m );
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return array( false, false );
|
|
|
|
|
}
|
2007-06-29 01:19:14 +00:00
|
|
|
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
/**
|
|
|
|
|
* Match some text, without parameter capture
|
|
|
|
|
* Returns the magic word name, or false if there was no capture
|
|
|
|
|
*/
|
|
|
|
|
public function matchStartToEnd( $text ) {
|
|
|
|
|
$hash = $this->getHash();
|
|
|
|
|
if ( isset( $hash[1][$text] ) ) {
|
|
|
|
|
return $hash[1][$text];
|
|
|
|
|
}
|
|
|
|
|
global $wgContLang;
|
|
|
|
|
$lc = $wgContLang->lc( $text );
|
|
|
|
|
if ( isset( $hash[0][$lc] ) ) {
|
|
|
|
|
return $hash[0][$lc];
|
|
|
|
|
}
|
|
|
|
|
return false;
|
|
|
|
|
}
|
2008-02-20 08:53:12 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Returns an associative array, ID => param value, for all items that match
|
|
|
|
|
* Removes the matched items from the input string (passed by reference)
|
|
|
|
|
*/
|
|
|
|
|
public function matchAndRemove( &$text ) {
|
|
|
|
|
$found = array();
|
|
|
|
|
$regexes = $this->getRegex();
|
|
|
|
|
foreach ( $regexes as $regex ) {
|
|
|
|
|
if ( $regex === '' ) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
preg_match_all( $regex, $text, $matches, PREG_SET_ORDER );
|
|
|
|
|
foreach ( $matches as $m ) {
|
|
|
|
|
list( $name, $param ) = $this->parseMatch( $m );
|
|
|
|
|
$found[$name] = $param;
|
|
|
|
|
}
|
|
|
|
|
$text = preg_replace( $regex, '', $text );
|
|
|
|
|
}
|
|
|
|
|
return $found;
|
|
|
|
|
}
|
2010-01-30 12:46:16 +00:00
|
|
|
|
|
|
|
|
/**
|
2010-02-15 09:34:51 +00:00
|
|
|
* Return the ID of the magic word at the start of $text, and remove
|
|
|
|
|
* the prefix from $text.
|
|
|
|
|
* Return false if no match found and $text is not modified.
|
|
|
|
|
* Does not match parameters.
|
2010-01-30 12:46:16 +00:00
|
|
|
*/
|
|
|
|
|
public function matchStartAndRemove( &$text ) {
|
|
|
|
|
$regexes = $this->getRegexStart();
|
|
|
|
|
foreach ( $regexes as $regex ) {
|
|
|
|
|
if ( $regex === '' ) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
2010-02-22 07:02:12 +00:00
|
|
|
if ( preg_match( $regex, $text, $m ) ) {
|
2010-11-30 18:44:50 +00:00
|
|
|
list( $id, ) = $this->parseMatch( $m );
|
2010-02-22 07:02:12 +00:00
|
|
|
if ( strlen( $m[0] ) >= strlen( $text ) ) {
|
|
|
|
|
$text = '';
|
|
|
|
|
} else {
|
|
|
|
|
$text = substr( $text, strlen( $m[0] ) );
|
|
|
|
|
}
|
|
|
|
|
return $id;
|
2010-01-30 12:46:16 +00:00
|
|
|
}
|
|
|
|
|
}
|
2010-02-15 09:34:51 +00:00
|
|
|
return false;
|
2010-01-30 12:46:16 +00:00
|
|
|
}
|
Basic integrated audio/video support, with Ogg implementation.
* JavaScript video player based loosely on Greg Maxwell's player
* Image page text snippet customisation
* Abstraction of transform parameters in the parser. Introduced Linker::makeImageLink2().
* Made canRender(), mustRender() depend on file, not just on handler. Moved width=0, height=0 checking to ImageHandler::canRender(), since audio streams have width=height=0 but should be rendered.
Also:
* Automatic upgrade for oldimage rows on image page view, allows media handler selection based on oi_*_mime
* oi_*_mime unconditionally referenced, REQUIRES SCHEMA UPGRADE
* Don't destroy file info for missing files on upgrade
* Simple, centralised extension message file handling
* Made MessageCache::loadAllMessages non-static, optimised for repeated-call case due to abuse in User.php
* Support for lightweight parser output hooks, with callback whitelist for security
* Moved Linker::formatSize() to Language, to join the new formatTimePeriod() and formatBitrate()
* Introduced MagicWordArray, regex capture trick requires that magic word IDs DO NOT CONTAIN HYPHENS.
2007-08-15 10:50:09 +00:00
|
|
|
}
|