wiki.techinc.nl/languages/classes/LanguageSr.php

<?php

require_once( dirname( __FILE__ ) . '/../LanguageConverter.php' );
require_once( dirname( __FILE__ ) . '/LanguageSr_ec.php' );
require_once( dirname( __FILE__ ) . '/LanguageSr_el.php' );

/**
 * There are two levels of conversion for Serbian: the script level
 * (Cyrillics <-> Latin), and the variant level (ekavian
 * <->iyekavian). The two are orthogonal. So we really only need two
 * dictionaries: one for Cyrillics and Latin, and one for ekavian and
 * iyekavian.
 *
 * @ingroup Language
 */
class SrConverter extends LanguageConverter {
	/**
	 * Replacement table from Serbian Cyrillic letters to their Latin
	 * equivalents. The letters љ, њ and џ expand to the digraphs
	 * lj, nj and dž.
	 */
	var $mToLatin = array(
		'а' => 'a', 'б' => 'b',  'в' => 'v', 'г' => 'g',  'д' => 'd',
		'ђ' => 'đ', 'е' => 'e',  'ж' => 'ž', 'з' => 'z',  'и' => 'i',
		'ј' => 'j', 'к' => 'k',  'л' => 'l', 'љ' => 'lj', 'м' => 'm',
		'н' => 'n', 'њ' => 'nj', 'о' => 'o', 'п' => 'p',  'р' => 'r',
		'с' => 's', 'т' => 't',  'ћ' => 'ć', 'у' => 'u',  'ф' => 'f',
		'х' => 'h', 'ц' => 'c',  'ч' => 'č', 'џ' => 'dž', 'ш' => 'š',

		'А' => 'A', 'Б' => 'B',  'В' => 'V', 'Г' => 'G',  'Д' => 'D',
		'Ђ' => 'Đ', 'Е' => 'E',  'Ж' => 'Ž', 'З' => 'Z',  'И' => 'I',
		'Ј' => 'J', 'К' => 'K',  'Л' => 'L', 'Љ' => 'Lj', 'М' => 'M',
		'Н' => 'N', 'Њ' => 'Nj', 'О' => 'O', 'П' => 'P',  'Р' => 'R',
		'С' => 'S', 'Т' => 'T',  'Ћ' => 'Ć', 'У' => 'U',  'Ф' => 'F',
		'Х' => 'H', 'Ц' => 'C',  'Ч' => 'Č', 'Џ' => 'Dž', 'Ш' => 'Š',
	);

	/**
	 * Replacement table from Latin letters to Serbian Cyrillic.
	 *
	 * Besides the single letters it contains the digraphs (dž, lj, nj)
	 * in their different capitalisations, and "!"-separated forms
	 * (e.g. 'l!j') which map to two separate Cyrillic letters instead
	 * of the single digraph letter.
	 */
	var $mToCyrillics = array(
		'a' => 'а', 'b'  => 'б', 'c' => 'ц', 'č' => 'ч', 'ć'  => 'ћ',
		'd' => 'д', 'dž' => 'џ', 'đ' => 'ђ', 'e' => 'е', 'f'  => 'ф',
		'g' => 'г', 'h'  => 'х', 'i' => 'и', 'j' => 'ј', 'k'  => 'к',
		'l' => 'л', 'lj' => 'љ', 'm' => 'м', 'n' => 'н', 'nj' => 'њ',
		'o' => 'о', 'p'  => 'п', 'r' => 'р', 's' => 'с', 'š'  => 'ш',
		't' => 'т', 'u'  => 'у', 'v' => 'в', 'z' => 'з', 'ž'  => 'ж',

		'A' => 'А', 'B'  => 'Б', 'C' => 'Ц', 'Č' => 'Ч', 'Ć'  => 'Ћ',
		'D' => 'Д', 'Dž' => 'Џ', 'Đ' => 'Ђ', 'E' => 'Е', 'F'  => 'Ф',
		'G' => 'Г', 'H'  => 'Х', 'I' => 'И', 'J' => 'Ј', 'K'  => 'К',
		'L' => 'Л', 'LJ' => 'Љ', 'M' => 'М', 'N' => 'Н', 'NJ' => 'Њ',
		'O' => 'О', 'P'  => 'П', 'R' => 'Р', 'S' => 'С', 'Š'  => 'Ш',
		'T' => 'Т', 'U'  => 'У', 'V' => 'В', 'Z' => 'З', 'Ž'  => 'Ж',

		'DŽ' => 'Џ', 'd!ž' => 'дж', 'D!ž' => 'Дж', 'D!Ž' => 'ДЖ',
		'Lj' => 'Љ', 'l!j' => 'лј', 'L!j' => 'Лј', 'L!J' => 'ЛЈ',
		'Nj' => 'Њ', 'n!j' => 'нј', 'N!j' => 'Нј', 'N!J' => 'НЈ'
	);

	/**
	 * Populate $this->mTables with one ReplacementArray per variant:
	 * 'sr-ec' converts to Cyrillic, 'sr-el' converts to Latin, and the
	 * plain 'sr' table is empty.
	 */
	function loadDefaultTables() {
		$this->mTables = array(
			'sr-ec' => new ReplacementArray( $this->mToCyrillics ),
			'sr-el' => new ReplacementArray( $this->mToLatin ),
			'sr'    => new ReplacementArray()
		);
	}

	/**
	 * rules should be defined as -{ekavian | iyekavian}- -or-
	 * -{code:text | code:text | ...}-
	 *
	 * update: delete all rule parsing because it's not used
	 * currently, and just produces a couple of bugs
	 *
	 * Rules carrying the 'T' flag are handed to the parent
	 * implementation; for every other rule the raw rule text is
	 * returned unchanged for each variant in $this->mVariants.
	 *
	 * @param $rule string
	 * @param $flags array
	 * @return array
	 */
	function parseManualRule( $rule, $flags = array() ) {
		if ( in_array( 'T', $flags ) ) {
			return parent::parseManualRule( $rule, $flags );
		}

		$carray = array();
		// otherwise ignore all formatting
		foreach ( $this->mVariants as $v ) {
			$carray[$v] = $rule;
		}

		return $carray;
	}

	/**
	 * A function wrapper:
	 *   - if the preferred variant is the main language code (no
	 *     specific variant selected), leave the link name as it was
	 *   - do not try to find variants for usernames
	 *
	 * @param $link string
	 * @param $nt Title
	 * @param $ignoreOtherCond bool
	 */
	function findVariantLink( &$link, &$nt, $ignoreOtherCond = false ) {
		// check for user namespace
		if ( is_object( $nt ) ) {
			$ns = $nt->getNamespace();
			if ( $ns == NS_USER || $ns == NS_USER_TALK ) {
				return;
			}
		}

		// Remember the incoming link text: the parent call may rewrite
		// $link by reference, and it is restored below when no specific
		// variant is preferred.
		$oldlink = $link;
		parent::findVariantLink( $link, $nt, $ignoreOtherCond );
		if ( $this->getPreferredVariant() == $this->mMainLanguageCode ) {
			$link = $oldlink;
		}
	}

	/**
	 * We want our external link captions to be converted in variants,
	 * so we return the original text instead -{$text}-, except for URLs
	 *
	 * Text is passed to the parent implementation only when $noParse
	 * is set or the text begins with an http(s)://, ftp:// or irc://
	 * scheme.
	 *
	 * @param $text string
	 * @param $noParse bool
	 *
	 * @return string
	 */
	function markNoConversion( $text, $noParse = false ) {
		// All schemes are grouped under one "^" anchor. Previously the
		// anchor bound only to the first alternative, so "ftp://" or
		// "irc://" anywhere inside a caption was treated as a URL.
		if ( $noParse || preg_match( '/^(?:https?|ftp|irc):\/\//', $text ) ) {
			return parent::markNoConversion( $text );
		}
		return $text;
	}

	/**
	 * An ugly function wrapper for parsing Image titles
	 * (to prevent image name conversion)
	 *
	 * When the global $wgTitle is in the file namespace and $text
	 * starts with that namespace's text followed by a colon, $text is
	 * returned unconverted.
	 *
	 * @param $text string
	 * @param $toVariant bool
	 *
	 * @return string
	 */
	function autoConvert( $text, $toVariant = false ) {
		global $wgTitle;
		if ( is_object( $wgTitle ) && $wgTitle->getNamespace() == NS_FILE ) {
			// Quote the namespace text so that regex metacharacters (or
			// the "/" delimiter) in it cannot break or alter the pattern.
			$imagename = preg_quote( $wgTitle->getNsText(), '/' );
			if ( preg_match( "/^$imagename:/", $text ) ) {
				return $text;
			}
		}
		return parent::autoConvert( $text, $toVariant );
	}

	/**
	 *  It translates text into variant, specials:
	 *    - omitting roman numbers
	 *
	 * The text is split on stand-alone roman numerals (together with
	 * the break characters around them); the pieces in between are
	 * translated and the delimiters are copied through verbatim.
	 *
	 * @param $text string
	 * @param $toVariant string
	 *
	 * @return string
	 */
	function translate( $text, $toVariant ) {
		// A "break" is any byte that is neither a word character nor part
		// of a multi-byte (>= 0x80) sequence.
		$breaks = '[^\w\x80-\xff]';

		// regexp for roman numbers
		// The lookahead requires at least one roman digit. Without it the
		// pattern also matches the empty string, so any two adjacent break
		// characters were treated as a roman-numeral delimiter.
		$roman = '(?=[MDCLXVI])M{0,4}(CM|CD|D?C{0,3})(XC|XL|L?X{0,3})(IX|IV|V?I{0,3})';

		$reg = '/^' . $roman . '$|^' . $roman . $breaks . '|' . $breaks . $roman . '$|' . $breaks . $roman . $breaks . '/';

		// Each element is array( piece, byte offset of piece in $text ).
		$matches = preg_split( $reg, $text, -1, PREG_SPLIT_OFFSET_CAPTURE );

		$m = array_shift( $matches );
		if ( !isset( $this->mTables[$toVariant] ) ) {
			throw new MWException( "Broken variant table: " . implode( ',', array_keys( $this->mTables ) ) );
		}
		$ret = $this->mTables[$toVariant]->replace( $m[0] );
		// $mstart tracks the end of the last translated piece, i.e. the
		// start of the untranslated delimiter that follows it.
		$mstart = $m[1] + strlen( $m[0] );
		foreach ( $matches as $m ) {
			// copy the delimiter (roman numeral and its breaks) unchanged
			$ret .= substr( $text, $mstart, $m[1] - $mstart );
			$ret .= parent::translate( $m[0], $toVariant );
			$mstart = $m[1] + strlen( $m[0] );
		}

		return $ret;
	}
}

/**
 * Serbian (Српски / Srpski)
 *
 * @ingroup Language
 */
class LanguageSr extends LanguageSr_ec {
	/**
	 * Build the Serbian language object, attach an SrConverter for the
	 * 'sr', 'sr-ec' and 'sr-el' variants, and append that converter to
	 * the 'ArticleSaveComplete' entry of $wgHooks.
	 */
	function __construct() {
		global $wgHooks;

		parent::__construct();

		// Variant codes handled by the converter.
		$variantCodes = array( 'sr', 'sr-ec', 'sr-el' );

		// Fallback variant for each variant code.
		$fallbackMap = array(
			'sr'    => 'sr-ec',
			'sr-ec' => 'sr',
			'sr-el' => 'sr',
		);

		// Flag aliases: each key maps to the flag 'S' or 'W'.
		$flagAliases = array(
			'S'     => 'S',
			'писмо' => 'S',
			'pismo' => 'S',
			'W'     => 'W',
			'реч'   => 'W',
			'reč'   => 'W',
			'ријеч' => 'W',
			'riječ' => 'W'
		);

		$converter = new SrConverter( $this, 'sr', $variantCodes, $fallbackMap, $flagAliases );
		$this->mConverter = $converter;
		$wgHooks['ArticleSaveComplete'][] = $this->mConverter;
	}

	/**
	 * Pick the plural form matching $count.
	 *
	 * With exactly two forms the first is used for a count of 1 and the
	 * second otherwise. With any other non-zero number of forms, the forms
	 * are passed through preConvertPlural( $forms, 3 ) and chosen by the
	 * last digits of $count.
	 *
	 * @param $count int
	 * @param $forms array
	 *
	 * @return string
	 */
	function convertPlural( $count, $forms ) {
		$formCount = count( $forms );
		if ( $formCount === 0 ) {
			return '';
		}

		// if no number with word, then use $form[0] for singular and $form[1] for plural or zero
		if ( $formCount === 2 ) {
			if ( $count == 1 ) {
				return $forms[0];
			}
			return $forms[1];
		}

		// @todo FIXME: CLDR defines 4 plural forms. Form with decimals missing.
		// See http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html#ru
		$forms = $this->preConvertPlural( $forms, 3 );

		// Counts above 10 whose tens digit is 1 always take the third form.
		if ( $count > 10 && floor( ( $count % 100 ) / 10 ) == 1 ) {
			return $forms[2];
		}

		$lastDigit = $count % 10;
		if ( $lastDigit == 1 ) {
			return $forms[0];
		}
		if ( $lastDigit == 2 || $lastDigit == 3 || $lastDigit == 4 ) {
			return $forms[1];
		}
		return $forms[2];
	}
}
-												Fix for compatibility with short_open_tag = Off

											
										
										
											2004-02-18 02:15:00 +00:00
+								<?php
-												WARNING: HUGE COMMIT

Doxygen documentation update:
* Changed alls @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitely decalred for file descriptions, otherwise doxygen will think that the comment document the first class, variabled, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>

Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage

One more thing: there are still a lot of warnings when generating the doc.

											
										
										
											2008-05-20 17:13:28 +00:00
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+								require_once( dirname( __FILE__ ) . '/../LanguageConverter.php' );
 								require_once( dirname( __FILE__ ) . '/LanguageSr_ec.php' );
 								require_once( dirname( __FILE__ ) . '/LanguageSr_el.php' );
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
-												WARNING: HUGE COMMIT

Doxygen documentation update:
* Changed alls @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitely decalred for file descriptions, otherwise doxygen will think that the comment document the first class, variabled, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>

Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage

One more thing: there are still a lot of warnings when generating the doc.

											
										
										
											2008-05-20 17:13:28 +00:00
+								/**
 								 * There are two levels of conversion for Serbian: the script level
 								 * (Cyrillics <-> Latin), and the variant level (ekavian
 								 * <->iyekavian). The two are orthogonal. So we really only need two
 								 * dictionaries: one for Cyrillics and Latin, and one for ekavian and
 								 * iyekavian.
 								 *
 								 * @ingroup Language
 								 */
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+								class SrConverter extends LanguageConverter {
 									var $mToLatin = array(
 										'а' => 'a', 'б' => 'b',  'в' => 'v', 'г' => 'g',  'д' => 'd',
 										'ђ' => 'đ', 'е' => 'e',  'ж' => 'ž', 'з' => 'z',  'и' => 'i',
 										'ј' => 'j', 'к' => 'k',  'л' => 'l', 'љ' => 'lj', 'м' => 'm',
 										'н' => 'n', 'њ' => 'nj', 'о' => 'o', 'п' => 'p',  'р' => 'r',
 										'с' => 's', 'т' => 't',  'ћ' => 'ć', 'у' => 'u',  'ф' => 'f',
 										'х' => 'h', 'ц' => 'c',  'ч' => 'č', 'џ' => 'dž', 'ш' => 'š',
 										'А' => 'A', 'Б' => 'B',  'В' => 'V', 'Г' => 'G',  'Д' => 'D',
 										'Ђ' => 'Đ', 'Е' => 'E',  'Ж' => 'Ž', 'З' => 'Z',  'И' => 'I',
 										'Ј' => 'J', 'К' => 'K',  'Л' => 'L', 'Љ' => 'Lj', 'М' => 'M',
 										'Н' => 'N', 'Њ' => 'Nj', 'О' => 'O', 'П' => 'P',  'Р' => 'R',
 										'С' => 'S', 'Т' => 'T',  'Ћ' => 'Ć', 'У' => 'U',  'Ф' => 'F',
 										'Х' => 'H', 'Ц' => 'C',  'Ч' => 'Č', 'Џ' => 'Dž', 'Ш' => 'Š',
 									);
 									var $mToCyrillics = array(
 										'a' => 'а', 'b'  => 'б', 'c' => 'ц', 'č' => 'ч', 'ć'  => 'ћ',
 										'd' => 'д', 'dž' => 'џ', 'đ' => 'ђ', 'e' => 'е', 'f'  => 'ф',
 										'g' => 'г', 'h'  => 'х', 'i' => 'и', 'j' => 'ј', 'k'  => 'к',
 										'l' => 'л', 'lj' => 'љ', 'm' => 'м', 'n' => 'н', 'nj' => 'њ',
 										'o' => 'о', 'p'  => 'п', 'r' => 'р', 's' => 'с', 'š'  => 'ш',
 										't' => 'т', 'u'  => 'у', 'v' => 'в', 'z' => 'з', 'ž'  => 'ж',
 										'A' => 'А', 'B'  => 'Б', 'C' => 'Ц', 'Č' => 'Ч', 'Ć'  => 'Ћ',
 										'D' => 'Д', 'Dž' => 'Џ', 'Đ' => 'Ђ', 'E' => 'Е', 'F'  => 'Ф',
 										'G' => 'Г', 'H'  => 'Х', 'I' => 'И', 'J' => 'Ј', 'K'  => 'К',
 										'L' => 'Л', 'LJ' => 'Љ', 'M' => 'М', 'N' => 'Н', 'NJ' => 'Њ',
 										'O' => 'О', 'P'  => 'П', 'R' => 'Р', 'S' => 'С', 'Š'  => 'Ш',
 										'T' => 'Т', 'U'  => 'У', 'V' => 'В', 'Z' => 'З', 'Ž'  => 'Ж',
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										'DŽ' => 'Џ', 'd!ž' => 'дж', 'D!ž' => 'Дж', 'D!Ž' => 'ДЖ',
 										'Lj' => 'Љ', 'l!j' => 'лј', 'L!j' => 'Лј', 'L!J' => 'ЛЈ',
 										'Nj' => 'Њ', 'n!j' => 'нј', 'N!j' => 'Нј', 'N!J' => 'НЈ'
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+									);
 									function loadDefaultTables() {
-												* Introduced StringUtils.php, populated it with some generic string functions, both new and collected from various other files.
* Removed some backtracking regexes with an O(N^2) worst case, replaced with StringUtils::delimiterReplace(). There is a beneficial functional difference: /*/ is no longer considered to be a complete CSS comment.
* Changed the parser strip state from an array to an object. This should hopefully avoid the PHP bugs with array references. StripState uses the new ReplacementArray to do the replacements, thereby supporting FSS. 
* Removed DatabaseFunctions.php from the default startup sequence. Moved wfGetDB() to GlobalFunctions.php.
* Introduced the SiteStats class, with a collection of cached site stats accessor functions.
* Removed all global functions from Parser.php, they don't belong there.
* Made LanguageConverter use the new ReplacementArray class instead of managing its own FSS objects.

											
										
										
											2006-11-21 09:53:45 +00:00
+										$this->mTables = array(
 											'sr-ec' => new ReplacementArray( $this->mToCyrillics ),
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+											'sr-el' => new ReplacementArray( $this->mToLatin ),
-												* Introduced StringUtils.php, populated it with some generic string functions, both new and collected from various other files.
* Removed some backtracking regexes with an O(N^2) worst case, replaced with StringUtils::delimiterReplace(). There is a beneficial functional difference: /*/ is no longer considered to be a complete CSS comment.
* Changed the parser strip state from an array to an object. This should hopefully avoid the PHP bugs with array references. StripState uses the new ReplacementArray to do the replacements, thereby supporting FSS. 
* Removed DatabaseFunctions.php from the default startup sequence. Moved wfGetDB() to GlobalFunctions.php.
* Introduced the SiteStats class, with a collection of cached site stats accessor functions.
* Removed all global functions from Parser.php, they don't belong there.
* Made LanguageConverter use the new ReplacementArray class instead of managing its own FSS objects.

											
										
										
											2006-11-21 09:53:45 +00:00
+											'sr'    => new ReplacementArray()
 										);
-												Small cleanup to language files, expect the two that got corrupted in the process

											
										
										
											2005-08-15 19:27:58 +00:00
+									}
-												More documentation!

											
										
										
											2011-05-29 16:32:05 +00:00
+									/**
 									 * rules should be defined as -{ekavian | iyekavian-} -or-
 									 * -{code:text | code:text | ...}-
 									 *
 									 * update: delete all rule parsing because it's not used
 									 * currently, and just produces a couple of bugs
 									 *
 									 * @param $rule string
 									 * @param $flags array
 									 * @return array
 									 */
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+									function parseManualRule( $rule, $flags = array() ) {
 										if ( in_array( 'T', $flags ) ) {
 											return parent::parseManualRule( $rule, $flags );
-												More lang variant stuff:
* More parser tests, also added 'variant' option for testing
* Add global $wgDefaultLanguageVariant, can be used to set a default
  fallback variant
* Restructured some of the parser code in LanguageConverter, fix flag
  processing and add some comments to despookify the old zh code :)
* Cleanup of some old hacks in LanguageSr and Kk (do not use the global 
  title object, but the one passed to the parser)

											
										
										
											2007-01-01 17:20:19 +00:00
+										}
-												Bug 3190

											
										
										
											2005-08-19 00:05:06 +00:00
-												Explicitally define some variables

Function documentation

											
										
										
											2011-02-18 23:21:48 +00:00
+										$carray = array();
-												More lang variant stuff:
* More parser tests, also added 'variant' option for testing
* Add global $wgDefaultLanguageVariant, can be used to set a default
  fallback variant
* Restructured some of the parser code in LanguageConverter, fix flag
  processing and add some comments to despookify the old zh code :)
* Cleanup of some old hacks in LanguageSr and Kk (do not use the global 
  title object, but the one passed to the parser)

											
										
										
											2007-01-01 17:20:19 +00:00
+										// otherwise ignore all formatting
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										foreach ( $this->mVariants as $v ) {
-												More lang variant stuff:
* More parser tests, also added 'variant' option for testing
* Add global $wgDefaultLanguageVariant, can be used to set a default
  fallback variant
* Restructured some of the parser code in LanguageConverter, fix flag
  processing and add some comments to despookify the old zh code :)
* Cleanup of some old hacks in LanguageSr and Kk (do not use the global 
  title object, but the one passed to the parser)

											
										
										
											2007-01-01 17:20:19 +00:00
+											$carray[$v] = $rule;
 										}
-												remove EOL whitespace, and excess empty lines

											
										
										
											2008-05-17 17:10:18 +00:00
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+										return $carray;
-												* (bug 3682) LanguageSr.php - added convertPlural

											
										
										
											2005-10-12 07:40:34 +00:00
+									}
-												Bug 3190

											
										
										
											2005-08-19 00:05:06 +00:00
-												Changes to doc-comments. /* to /** in language folder.

											
										
										
											2011-05-22 22:05:18 +00:00
+									/**
-												More language variant stuff:
* Added some basic parser tests for variants
* Enable selflinks to be written in variants
* Prevent username lookup in variants for sr.wiki (per community request)
* Update release notes (also notes for last commit, when I forgot)

											
										
										
											2006-12-26 12:19:45 +00:00
+									 * A function wrapper:
-												remove EOL whitespace, and excess empty lines

											
										
										
											2008-05-17 17:10:18 +00:00
+									 *   - if there is no selected variant, leave the link
-												More language variant stuff:
* Added some basic parser tests for variants
* Enable selflinks to be written in variants
* Prevent username lookup in variants for sr.wiki (per community request)
* Update release notes (also notes for last commit, when I forgot)

											
										
										
											2006-12-26 12:19:45 +00:00
+									 *     names as they were
 									 *   - do not try to find variants for usernames
-												More documentation!

											
										
										
											2011-05-29 16:32:05 +00:00
+									 *
 									 * @param $link string
 									 * @param $nt Title
 									 * @param $ignoreOtherCond bool
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+									 */
-. Use param $ignoreOtherCond instead of $forTemplate and $ignoreSubmitCond in findVariantLink().
2. Drop some duplicate categories produced by findVariantLink().

											
										
										
											2009-02-02 07:54:43 +00:00
+									function findVariantLink( &$link, &$nt, $ignoreOtherCond = false ) {
-												More language variant stuff:
* Added some basic parser tests for variants
* Enable selflinks to be written in variants
* Prevent username lookup in variants for sr.wiki (per community request)
* Update release notes (also notes for last commit, when I forgot)

											
										
										
											2006-12-26 12:19:45 +00:00
+										// check for user namespace
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										if ( is_object( $nt ) ) {
-												More language variant stuff:
* Added some basic parser tests for variants
* Enable selflinks to be written in variants
* Prevent username lookup in variants for sr.wiki (per community request)
* Update release notes (also notes for last commit, when I forgot)

											
										
										
											2006-12-26 12:19:45 +00:00
+											$ns = $nt->getNamespace();
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+											if ( $ns == NS_USER || $ns == NS_USER_TALK )
-												More language variant stuff:
* Added some basic parser tests for variants
* Enable selflinks to be written in variants
* Prevent username lookup in variants for sr.wiki (per community request)
* Update release notes (also notes for last commit, when I forgot)

											
										
										
											2006-12-26 12:19:45 +00:00
+												return;
 										}
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										$oldlink = $link;
-. Use param $ignoreOtherCond instead of $forTemplate and $ignoreSubmitCond in findVariantLink().
2. Drop some duplicate categories produced by findVariantLink().

											
										
										
											2009-02-02 07:54:43 +00:00
+										parent::findVariantLink( $link, $nt, $ignoreOtherCond );
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										if ( $this->getPreferredVariant() == $this->mMainLanguageCode )
 											$link = $oldlink;
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+									}
-												Changes to doc-comments. /* to /** in language folder.

											
										
										
											2011-05-22 22:05:18 +00:00
+									/**
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+									 * We want our external link captions to be converted in variants,
 									 * so we return the original text instead -{$text}-, except for URLs
-												More documentation!

											
										
										
											2011-05-29 15:59:47 +00:00
+									 *
-												More documentation!

											
										
										
											2011-05-29 16:32:05 +00:00
+									 * @param $text string
 									 * @param $noParse bool
 									 *
-												More documentation!

											
										
										
											2011-05-29 15:59:47 +00:00
+									 * @return string
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+									 */
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+									function markNoConversion( $text, $noParse = false ) {
 										if ( $noParse || preg_match( "/^https?:\/\/|ftp:\/\/|irc:\/\//", $text ) )
 											return parent::markNoConversion( $text );
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+										return $text;
 									}
-												Changes to doc-comments. /* to /** in language folder.

											
										
										
											2011-05-22 22:05:18 +00:00
+									/**
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+									 * An ugly function wrapper for parsing Image titles
 									 * (to prevent image name conversion)
-												More documentation!

											
										
										
											2011-05-29 15:59:47 +00:00
+									 *
-												More documentation!

											
										
										
											2011-05-29 16:32:05 +00:00
+									 * @param $text string
 									 * @param $toVariant bool
 									 *
-												More documentation!

											
										
										
											2011-05-29 15:59:47 +00:00
+									 * @return string
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+									 */
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+									function autoConvert( $text, $toVariant = false ) {
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+										global $wgTitle;
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										if ( is_object( $wgTitle ) && $wgTitle->getNameSpace() == NS_FILE ) {
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+											$imagename = $wgTitle->getNsText();
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+											if ( preg_match( "/^$imagename:/", $text ) ) return $text;
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
+										}
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										return parent::autoConvert( $text, $toVariant );
-												remove EOL whitespace, and excess empty lines

											
										
										
											2008-05-17 17:10:18 +00:00
+									}
-												* (bug 6300) Bug fixes for sr: variants
* Patch from Robert Stojnic

											
										
										
											2006-06-16 22:30:39 +00:00
-												* Updates to language variant code for Serbian et al


											
										
										
											2006-09-20 10:22:12 +00:00
+									/**
 									 *  It translates text into variant, specials:
 									 *    - ommiting roman numbers
-												More documentation!

											
										
										
											2011-05-29 15:59:47 +00:00
+									 *
-												More documentation!

											
										
										
											2011-05-29 16:32:05 +00:00
+									 * @param $text string
 									 * @param $toVariant string
 									 *
-												More documentation!

											
										
										
											2011-05-29 15:59:47 +00:00
+									 * @return string
-												* Updates to language variant code for Serbian et al


											
										
										
											2006-09-20 10:22:12 +00:00
+									 */
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+									function translate( $text, $toVariant ) {
-												* Updates to language variant code for Serbian et al


											
										
										
											2006-09-20 10:22:12 +00:00
+										$breaks = '[^\w\x80-\xff]';
 										// regexp for roman numbers
 										$roman = 'M{0,4}(CM|CD|D?C{0,3})(XC|XL|L?X{0,3})(IX|IV|V?I{0,3})';
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										$reg = '/^' . $roman . '$|^' . $roman . $breaks . '|' . $breaks . $roman . '$|' . $breaks . $roman . $breaks . '/';
-												* Updates to language variant code for Serbian et al


											
										
										
											2006-09-20 10:22:12 +00:00
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										$matches = preg_split( $reg, $text, -1, PREG_SPLIT_OFFSET_CAPTURE );
-												remove EOL whitespace, and excess empty lines

											
										
										
											2008-05-17 17:10:18 +00:00
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										$m = array_shift( $matches );
 										if ( !isset( $this->mTables[$toVariant] ) ) {
-												* Make variant table caching a little more robust, using main language code
  in cache key. Probably this is still a bit wonky, though. Was breaking
  parser tests when Chinese tables were getting loaded into Serbian code.


											
										
										
											2006-12-27 01:49:09 +00:00
+											throw new MWException( "Broken variant table: " . implode( ',', array_keys( $this->mTables ) ) );
 										}
-												* Introduced StringUtils.php, populated it with some generic string functions, both new and collected from various other files.
* Removed some backtracking regexes with an O(N^2) worst case, replaced with StringUtils::delimiterReplace(). There is a beneficial functional difference: /*/ is no longer considered to be a complete CSS comment.
* Changed the parser strip state from an array to an object. This should hopefully avoid the PHP bugs with array references. StripState uses the new ReplacementArray to do the replacements, thereby supporting FSS. 
* Removed DatabaseFunctions.php from the default startup sequence. Moved wfGetDB() to GlobalFunctions.php.
* Introduced the SiteStats class, with a collection of cached site stats accessor functions.
* Removed all global functions from Parser.php, they don't belong there.
* Made LanguageConverter use the new ReplacementArray class instead of managing its own FSS objects.

											
										
										
											2006-11-21 09:53:45 +00:00
+										$ret = $this->mTables[$toVariant]->replace( $m[0] );
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										$mstart = $m[1] + strlen( $m[0] );
 										foreach ( $matches as $m ) {
 											$ret .= substr( $text, $mstart, $m[1] -$mstart );
 											$ret .= parent::translate( $m[0], $toVariant );
 											$mstart = $m[1] + strlen( $m[0] );
-												* Updates to language variant code for Serbian et al


											
										
										
											2006-09-20 10:22:12 +00:00
+										}
 										return $ret;
 									}
-												Nov. branch merge, all files copied from stable

											
										
										
											2003-11-09 11:24:43 +00:00
+								}
-												WARNING: HUGE COMMIT

Doxygen documentation update:
* Changed all @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitly declared for file descriptions, otherwise doxygen will think that the comment documents the first class, variable, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>

Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage

One more thing: there are still a lot of warnings when generating the doc.

											
										
										
											2008-05-20 17:13:28 +00:00
+								/**
-												Added description to language classes

											
										
										
											2010-10-10 12:53:37 +00:00
+								 * Serbian (Српски / Srpski)
 								 *
-												WARNING: HUGE COMMIT

Doxygen documentation update:
* Changed all @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitly declared for file descriptions, otherwise doxygen will think that the comment documents the first class, variable, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>

Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage

One more thing: there are still a lot of warnings when generating the doc.

											
										
										
											2008-05-20 17:13:28 +00:00
+								 * @ingroup Language
 								 */
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+								class LanguageSr extends LanguageSr_ec {
-												Using __construct for all the language constructors, and few minor fixes.

											
										
										
											2006-06-24 18:48:58 +00:00
+									function __construct() {
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+										global $wgHooks;
-												* Updates to language variant code for Serbian et al


											
										
										
											2006-09-20 10:22:12 +00:00
-												Merged localisation-work branch:

* Made lines from initialiseMessages() appear as list items during installation
* Moved the bulk of the localisation data from the Language*.php files to the Messages*.php files. Deleted most of the Languages*.php files.
* Introduced "stub global" framework to provide deferred initialisation of core modules. 
* Removed placeholder values for $wgTitle and $wgArticle, these variables will now be null during the initialisation process, until they are set by index.php or another entry point.
* Added DBA cache type, for BDB-style caches. 
* Removed custom date format functions, replacing them with a format string in the style of PHP's date(). Used string identifiers instead of integer identifiers, in both the language files and user preferences. Migration should be transparent in most cases.
* Simplified the initialisation API for LoadBalancer objects.
* Removed the broken altencoding feature.
* Moved default user options and toggles from Language to User. Language objects are still able to define default preference overrides and extra user toggles, via a slightly different interface.
* Don't include the date option in the parser cache rendering hash unless $wgUseDynamicDates is enabled.
* Merged LanguageUtf8 with Language. Removed LanguageUtf8.php. 
* Removed inclusion of language files from the bottom of Language.php. This is now consistently done from Language::factory(). 
* Add the name of the executing maintenance script to the debug log. Start the profiler during maintenance scripts.
* Added "serialized" directory, for storing precompiled data in serialized form. 

											
										
										
											2006-07-26 07:15:39 +00:00
+										parent::__construct();
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										$variants = array( 'sr', 'sr-ec', 'sr-el' );
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+										$variantfallbacks = array(
 											'sr'    => 'sr-ec',
-												More lang variant stuff:
* More parser tests, also added 'variant' option for testing
* Add global $wgDefaultLanguageVariant, can be used to set a default
  fallback variant
* Restructured some of the parser code in LanguageConverter, fix flag
  processing and add some comments to despookify the old zh code :)
* Cleanup of some old hacks in LanguageSr and Kk (do not use the global 
  title object, but the one passed to the parser)

											
										
										
											2007-01-01 17:20:19 +00:00
+											'sr-ec' => 'sr',
 											'sr-el' => 'sr',
-												remove EOL whitespace, and excess empty lines

											
										
										
											2008-05-17 17:10:18 +00:00
+										);
-												* Updates to language variant code for Serbian et al


											
										
										
											2006-09-20 10:22:12 +00:00
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+										$flags = array(
 											'S' => 'S', 'писмо' => 'S', 'pismo' => 'S',
 											'W' => 'W', 'реч'   => 'W', 'reč'   => 'W', 'ријеч' => 'W', 'riječ' => 'W'
 										);
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										$this->mConverter = new SrConverter( $this, 'sr', $variants, $variantfallbacks, $flags );
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+										$wgHooks['ArticleSaveComplete'][] = $this->mConverter;
 									}
-												Update plural forms per http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html. Complete per Date: 2009/05/12 11:24:52 for languages currently supported in MediaWiki.

Added FIXME where CLDR definition is different from MediaWiki's.

											
										
										
											2009-10-02 18:30:23 +00:00
-												Some language love

											
										
										
											2011-05-29 15:21:03 +00:00
+									/**
 									 * @param $count int
 									 * @param $forms array
 									 *
 									 * @return string
 									 */
-												Update plural forms per http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html. Complete per Date: 2009/05/12 11:24:52 for languages currently supported in MediaWiki.

Added FIXME where CLDR definition is different from MediaWiki's.

											
										
										
											2009-10-02 18:30:23 +00:00
+									function convertPlural( $count, $forms ) {
-												Explicitly define some variables

Function documentation

											
										
										
											2011-02-18 23:21:48 +00:00
+										if ( !count( $forms ) ) {
 											return '';
 										}
-												Update plural forms per http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html. Complete per Date: 2009/05/12 11:24:52 for languages currently supported in MediaWiki.

Added FIXME where CLDR definition is different from MediaWiki's.

											
										
										
											2009-10-02 18:30:23 +00:00
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										// if no number with word, then use $form[0] for singular and $form[1] for plural or zero
-												Explicitly define some variables

Function documentation

											
										
										
											2011-02-18 23:21:48 +00:00
+										if ( count( $forms ) === 2 ) {
 											return $count == 1 ? $forms[0] : $forms[1];
 										}
-												Update plural forms per http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html. Complete per Date: 2009/05/12 11:24:52 for languages currently supported in MediaWiki.

Added FIXME where CLDR definition is different from MediaWiki's.

											
										
										
											2009-10-02 18:30:23 +00:00
-												Use consistent notation for "@todo FIXME". Should update http://svn.wikimedia.org/doc/todo.html nicely.

											
										
										
											2011-05-17 22:03:20 +00:00
+										// @todo FIXME: CLDR defines 4 plural forms. Form with decimals missing.
-												Update plural forms per http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html. Complete per Date: 2009/05/12 11:24:52 for languages currently supported in MediaWiki.

Added FIXME where CLDR definition is different from MediaWiki's.

											
										
										
											2009-10-02 18:30:23 +00:00
+										// See http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html#ru
 										$forms = $this->preConvertPlural( $forms, 3 );
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+										if ( $count > 10 && floor( ( $count % 100 ) / 10 ) == 1 ) {
-												Update plural forms per http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html. Complete per Date: 2009/05/12 11:24:52 for languages currently supported in MediaWiki.

Added FIXME where CLDR definition is different from MediaWiki's.

											
										
										
											2009-10-02 18:30:23 +00:00
+											return $forms[2];
 										} else {
-												Stylize languages/*, languages/classes/*, but not languages/messages/*

											
										
										
											2010-07-29 09:43:18 +00:00
+											switch ( $count % 10 ) {
-												Update plural forms per http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html. Complete per Date: 2009/05/12 11:24:52 for languages currently supported in MediaWiki.

Added FIXME where CLDR definition is different from MediaWiki's.

											
										
										
											2009-10-02 18:30:23 +00:00
+												case 1:  return $forms[0];
 												case 2:
 												case 3:
 												case 4:  return $forms[1];
 												default: return $forms[2];
 											}
 										}
 									}
-*BOOM*
* (bug 3993) Variants for Serbian language

											
										
										
											2006-03-02 22:22:18 +00:00
+								}