2007-05-01 15:02:44 +00:00
|
|
|
|
<?php
|
2006-11-06 17:46:58 +00:00
|
|
|
|
|
2010-07-29 09:43:18 +00:00
|
|
|
|
require_once( dirname( __FILE__ ) . '/../LanguageConverter.php' );
|
|
|
|
|
|
require_once( dirname( __FILE__ ) . '/LanguageKk_cyrl.php' );
|
2006-11-06 17:46:58 +00:00
|
|
|
|
|
2007-12-17 15:31:32 +00:00
|
|
|
|
// Alphabets used to build the character classes of the conversion regexes.
// Kazakh Cyrillic, uppercase then lowercase.
define( 'KK_C_UC', 'АӘБВГҒДЕЁЖЗИЙКҚЛМНҢОӨПРСТУҰҮФХҺЦЧШЩЪЫІЬЭЮЯ' );
define( 'KK_C_LC', 'аәбвгғдеёжзийкқлмнңоөпрстуұүфхһцчшщъыіьэюя' );
// Kazakh Latin, uppercase then lowercase.
define( 'KK_L_UC', 'AÄBCÇDEÉFGĞHIİÏJKLMNÑOÖPQRSŞTUÜVWXYÝZ' );
define( 'KK_L_LC', 'aäbcçdeéfgğhıiïjklmnñoöpqrsştuüvwxyýz' );
// Kazakh Arabic alphabet (currently unused, kept for reference):
// define( 'KK_A', 'ٴابپتجحدرزسشعفقكلمنڭەوۇۋۆىيچھ' );

// U+0674 ARABIC LETTER HIGH HAMZA; prefixed to words by the Arabic conversion.
define( 'H_HAMZA', 'ٴ' );
// U+200C ZERO WIDTH NON-JOINER (currently unused, kept for reference):
// define( 'ZWNJ', "\xE2\x80\x8C" );
|
2007-12-17 15:31:32 +00:00
|
|
|
|
|
WARNING: HUGE COMMIT
Doxygen documentation update:
* Changed alls @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitely decalred for file descriptions, otherwise doxygen will think that the comment document the first class, variabled, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>
Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage
One more thing: there are still a lot of warnings when generating the doc.
2008-05-20 17:13:28 +00:00
|
|
|
|
/**
 * Kazakh (Қазақша) converter routines.
 *
 * Converts text between the Cyrillic, Latin and Arabic written variants of
 * Kazakh. Conversion is done in two layers: the per-variant replacement
 * tables stored in $this->mTables (all empty by default, see
 * loadDefaultTables()) and the ordered regular-expression rule lists built
 * by loadRegs().
 *
 * @ingroup Language
 */
class KkConverter extends LanguageConverter {

	/**
	 * Ordered lists of "regex pattern => replacement" rules, filled by
	 * loadRegs(). Rules are applied one after another in array order, so
	 * multi-letter rules must stay ahead of the single-letter ones.
	 */
	protected $mCyrl2Latn, $mLatn2Cyrl, $mCyLa2Arab;

	/**
	 * @param $langobj Language
	 * @param $maincode string
	 * @param $variants array
	 * @param $variantfallbacks array
	 * @param $flags array
	 */
	public function __construct( $langobj, $maincode,
		$variants = array(),
		$variantfallbacks = array(),
		$flags = array()
	) {
		parent::__construct( $langobj, $maincode, $variants, $variantfallbacks, $flags );

		// The regex rules live in code, so there is nothing to gain from
		// loading them lazily. Deferring them to loadDefaultTables() would
		// mean they are never built when the tables come from cache.
		$this->loadRegs();
	}

	/**
	 * Install the (currently empty) word-level replacement tables for every
	 * variant.
	 */
	public function loadDefaultTables() {
		// require( dirname(__FILE__)."/../../includes/KkConversion.php" );
		// Placeholders until KkConversion.php is generated; remove these
		// declarations once that file provides the arrays.
		$kk2Cyrl = array();
		$kk2Latn = array();
		$kk2Arab = array();
		$kk2KZ = array();
		$kk2TR = array();
		$kk2CN = array();

		$this->mTables = array(
			'kk-cyrl' => new ReplacementArray( $kk2Cyrl ),
			'kk-latn' => new ReplacementArray( $kk2Latn ),
			'kk-arab' => new ReplacementArray( $kk2Arab ),
			// Country variants start from the matching script table.
			'kk-kz' => new ReplacementArray( array_merge( $kk2Cyrl, $kk2KZ ) ),
			'kk-tr' => new ReplacementArray( array_merge( $kk2Latn, $kk2TR ) ),
			'kk-cn' => new ReplacementArray( array_merge( $kk2Arab, $kk2CN ) ),
			'kk' => new ReplacementArray()
		);
	}

	/**
	 * Merge each script table into the table of its country variant
	 * (kk-cyrl into kk-kz, kk-latn into kk-tr, kk-arab into kk-cn).
	 */
	public function postLoadTables() {
		$scriptOfCountry = array(
			'kk-kz' => 'kk-cyrl',
			'kk-tr' => 'kk-latn',
			'kk-cn' => 'kk-arab',
		);
		foreach ( $scriptOfCountry as $country => $script ) {
			$this->mTables[$country]->merge( $this->mTables[$script] );
		}
	}

	/**
	 * Build the three regex rule lists used by regsConverter():
	 * Cyrillic -> Latin, Latin -> Cyrillic and Cyrillic -> Arabic.
	 *
	 * The order of the entries is significant because regsConverter()
	 * applies them sequentially to the same string.
	 */
	public function loadRegs() {
		$this->mCyrl2Latn = array(
			// Punctuation
			'/№/u' => 'No.',
			// Е after vowels
			'/([АӘЕЁИОӨҰҮЭЮЯЪЬ])Е/u' => '$1YE',
			'/([АӘЕЁИОӨҰҮЭЮЯЪЬ])е/ui' => '$1ye',
			// leading ЁЮЯЩ
			'/^Ё([' . KK_C_UC . ']|$)/u' => 'YO$1', '/^Ё([' . KK_C_LC . ']|$)/u' => 'Yo$1',
			'/^Ю([' . KK_C_UC . ']|$)/u' => 'YU$1', '/^Ю([' . KK_C_LC . ']|$)/u' => 'Yu$1',
			'/^Я([' . KK_C_UC . ']|$)/u' => 'YA$1', '/^Я([' . KK_C_LC . ']|$)/u' => 'Ya$1',
			'/^Щ([' . KK_C_UC . ']|$)/u' => 'ŞÇ$1', '/^Щ([' . KK_C_LC . ']|$)/u' => 'Şç$1',
			// other ЁЮЯ
			'/Ё/u' => 'YO', '/ё/u' => 'yo',
			'/Ю/u' => 'YU', '/ю/u' => 'yu',
			'/Я/u' => 'YA', '/я/u' => 'ya',
			'/Щ/u' => 'ŞÇ', '/щ/u' => 'şç',
			// soft and hard signs
			'/[ъЪ]/u' => 'ʺ', '/[ьЬ]/u' => 'ʹ',
			// other characters
			'/А/u' => 'A', '/а/u' => 'a', '/Ә/u' => 'Ä', '/ә/u' => 'ä',
			'/Б/u' => 'B', '/б/u' => 'b', '/В/u' => 'V', '/в/u' => 'v',
			'/Г/u' => 'G', '/г/u' => 'g', '/Ғ/u' => 'Ğ', '/ғ/u' => 'ğ',
			'/Д/u' => 'D', '/д/u' => 'd', '/Е/u' => 'E', '/е/u' => 'e',
			'/Ж/u' => 'J', '/ж/u' => 'j', '/З/u' => 'Z', '/з/u' => 'z',
			'/И/u' => 'Ï', '/и/u' => 'ï', '/Й/u' => 'Ý', '/й/u' => 'ý',
			'/К/u' => 'K', '/к/u' => 'k', '/Қ/u' => 'Q', '/қ/u' => 'q',
			'/Л/u' => 'L', '/л/u' => 'l', '/М/u' => 'M', '/м/u' => 'm',
			'/Н/u' => 'N', '/н/u' => 'n', '/Ң/u' => 'Ñ', '/ң/u' => 'ñ',
			'/О/u' => 'O', '/о/u' => 'o', '/Ө/u' => 'Ö', '/ө/u' => 'ö',
			'/П/u' => 'P', '/п/u' => 'p', '/Р/u' => 'R', '/р/u' => 'r',
			'/С/u' => 'S', '/с/u' => 's', '/Т/u' => 'T', '/т/u' => 't',
			'/У/u' => 'W', '/у/u' => 'w', '/Ұ/u' => 'U', '/ұ/u' => 'u',
			'/Ү/u' => 'Ü', '/ү/u' => 'ü', '/Ф/u' => 'F', '/ф/u' => 'f',
			'/Х/u' => 'X', '/х/u' => 'x', '/Һ/u' => 'H', '/һ/u' => 'h',
			'/Ц/u' => 'C', '/ц/u' => 'c', '/Ч/u' => 'Ç', '/ч/u' => 'ç',
			'/Ш/u' => 'Ş', '/ш/u' => 'ş', '/Ы/u' => 'I', '/ы/u' => 'ı',
			'/І/u' => 'İ', '/і/u' => 'i', '/Э/u' => 'É', '/э/u' => 'é',
		);

		$this->mLatn2Cyrl = array(
			// Punctuation
			'/#|No\./' => '№',
			// Şç
			'/ŞÇʹ/u' => 'ЩЬ', '/Şçʹ/u' => 'Щь',
			'/Ş[Çç]/u' => 'Щ', '/şç/u' => 'щ',
			// soft and hard signs
			'/([' . KK_L_UC . '])ʺ([' . KK_L_UC . '])/u' => '$1Ъ$2',
			'/ʺ([' . KK_L_LC . '])/u' => 'ъ$1',
			'/([' . KK_L_UC . '])ʹ([' . KK_L_UC . '])/u' => '$1Ь$2',
			'/ʹ([' . KK_L_LC . '])/u' => 'ь$1',
			'/ʺ/u' => 'ъ',
			'/ʹ/u' => 'ь',
			// Ye Yo Yu Ya.
			'/Y[Ee]/u' => 'Е', '/ye/u' => 'е',
			'/Y[Oo]/u' => 'Ё', '/yo/u' => 'ё',
			'/Y[UWuw]/u' => 'Ю', '/y[uw]/u' => 'ю',
			'/Y[Aa]/u' => 'Я', '/ya/u' => 'я',
			// other characters
			'/A/u' => 'А', '/a/u' => 'а', '/Ä/u' => 'Ә', '/ä/u' => 'ә',
			'/B/u' => 'Б', '/b/u' => 'б', '/C/u' => 'Ц', '/c/u' => 'ц',
			'/Ç/u' => 'Ч', '/ç/u' => 'ч', '/D/u' => 'Д', '/d/u' => 'д',
			'/E/u' => 'Е', '/e/u' => 'е', '/É/u' => 'Э', '/é/u' => 'э',
			'/F/u' => 'Ф', '/f/u' => 'ф', '/G/u' => 'Г', '/g/u' => 'г',
			'/Ğ/u' => 'Ғ', '/ğ/u' => 'ғ', '/H/u' => 'Һ', '/h/u' => 'һ',
			'/I/u' => 'Ы', '/ı/u' => 'ы', '/İ/u' => 'І', '/i/u' => 'і',
			'/Ï/u' => 'И', '/ï/u' => 'и', '/J/u' => 'Ж', '/j/u' => 'ж',
			'/K/u' => 'К', '/k/u' => 'к', '/L/u' => 'Л', '/l/u' => 'л',
			'/M/u' => 'М', '/m/u' => 'м', '/N/u' => 'Н', '/n/u' => 'н',
			'/Ñ/u' => 'Ң', '/ñ/u' => 'ң', '/O/u' => 'О', '/o/u' => 'о',
			'/Ö/u' => 'Ө', '/ö/u' => 'ө', '/P/u' => 'П', '/p/u' => 'п',
			'/Q/u' => 'Қ', '/q/u' => 'қ', '/R/u' => 'Р', '/r/u' => 'р',
			'/S/u' => 'С', '/s/u' => 'с', '/Ş/u' => 'Ш', '/ş/u' => 'ш',
			'/T/u' => 'Т', '/t/u' => 'т', '/U/u' => 'Ұ', '/u/u' => 'ұ',
			'/Ü/u' => 'Ү', '/ü/u' => 'ү', '/V/u' => 'В', '/v/u' => 'в',
			'/W/u' => 'У', '/w/u' => 'у', '/Ý/u' => 'Й', '/ý/u' => 'й',
			'/X/u' => 'Х', '/x/u' => 'х', '/Z/u' => 'З', '/z/u' => 'з',
		);

		$this->mCyLa2Arab = array(
			// Punctuation -> Arabic
			// U+0600 ARABIC NUMBER SIGN, written as UTF-8 byte escapes because
			// the character is an invisible format character that is easily
			// lost when the file is edited or copied.
			'/#|№|No\./u' => "\xD8\x80", # ؀
			'/\,/' => '،', # ،
			'/;/' => '؛', # ؛
			'/\?/' => '؟', # ؟
			'/%/' => '٪', # ٪
			'/\*/' => '٭', # ٭
			// Digits -> Arabic
			'/0/' => '۰', # ۰
			'/1/' => '۱', # ۱
			'/2/' => '۲', # ۲
			'/3/' => '۳', # ۳
			'/4/' => '۴', # ۴
			'/5/' => '۵', # ۵
			'/6/' => '۶', # ۶
			'/7/' => '۷', # ۷
			'/8/' => '۸', # ۸
			'/9/' => '۹', # ۹
			// Cyrillic -> Arabic
			'/Аллаһ/ui' => 'ﷲ',
			'/([АӘЕЁИОӨҰҮЭЮЯЪЬ])е/ui' => '$1يە',
			'/[еэ]/ui' => 'ە', '/[ъь]/ui' => '',
			'/[аә]/ui' => 'ا', '/[оө]/ui' => 'و', '/[ұү]/ui' => 'ۇ', '/[ыі]/ui' => 'ى',
			'/[и]/ui' => 'ىي', '/ё/ui' => 'يو', '/ю/ui' => 'يۋ', '/я/ui' => 'يا', '/[й]/ui' => 'ي',
			'/ц/ui' => 'تس', '/щ/ui' => 'شش',
			'/һ/ui' => 'ح', '/ч/ui' => 'تش',
			# '/һ/ui' => 'ھ', '/ч/ui' => 'چ',
			'/б/ui' => 'ب', '/в/ui' => 'ۆ', '/г/ui' => 'گ', '/ғ/ui' => 'ع',
			'/д/ui' => 'د', '/ж/ui' => 'ج', '/з/ui' => 'ز', '/к/ui' => 'ك',
			'/қ/ui' => 'ق', '/л/ui' => 'ل', '/м/ui' => 'م', '/н/ui' => 'ن',
			'/ң/ui' => 'ڭ', '/п/ui' => 'پ', '/р/ui' => 'ر', '/с/ui' => 'س',
			'/т/ui' => 'ت', '/у/ui' => 'ۋ', '/ф/ui' => 'ف', '/х/ui' => 'ح',
			'/ш/ui' => 'ش',
			// Latin -> Arabic // commented for now...
			/*'/Allah/ui' => 'ﷲ',
			'/[eé]/ui' => 'ە', '/[yý]/ui' => 'ي', '/[ʺʹ]/ui' => '',
			'/[aä]/ui' => 'ا', '/[oö]/ui' => 'و', '/[uü]/ui' => 'ۇ',
			'/[ï]/ui' => 'ىي', '/[ıIiİ]/u' => 'ى',
			'/c/ui' => 'تس',
			'/ç/ui' => 'تش', '/h/ui' => 'ح',
			#'/ç/ui' => 'چ', '/h/ui' => 'ھ',
			'/b/ui' => 'ب','/d/ui' => 'د',
			'/f/ui' => 'ف', '/g/ui' => 'گ', '/ğ/ui' => 'ع',
			'/j/ui' => 'ج', '/k/ui' => 'ك', '/l/ui' => 'ل', '/m/ui' => 'م',
			'/n/ui' => 'ن', '/ñ/ui' => 'ڭ', '/p/ui' => 'پ', '/q/ui' => 'ق',
			'/r/ui' => 'ر', '/s/ui' => 'س', '/ş/ui' => 'ش', '/t/ui' => 'ت',
			'/v/ui' => 'ۆ', '/w/ui' => 'ۋ', '/x/ui' => 'ح', '/z/ui' => 'ز',*/
		);
	}

	/**
	 * Parse a manual conversion rule.
	 *
	 * Only rules carrying the 'T' flag are handed to the parent parser. For
	 * every other rule the markup is ignored and the raw rule text is used
	 * unchanged for each variant.
	 *
	 * @param $rule string
	 * @param $flags array
	 * @return array Map of variant code => text
	 */
	public function parseManualRule( $rule, $flags = array() ) {
		if ( in_array( 'T', $flags ) ) {
			return parent::parseManualRule( $rule, $flags );
		}

		// otherwise ignore all formatting
		$perVariant = array();
		foreach ( $this->mVariants as $variant ) {
			$perVariant[$variant] = $rule;
		}
		return $perVariant;
	}

	/**
	 * A function wrapper:
	 * - if there is no selected variant, leave the link names as they were
	 * - do not try to find variants for usernames
	 *
	 * @param $link string Modified in place by the parent implementation
	 * @param $nt Title
	 * @param bool $ignoreOtherCond
	 */
	public function findVariantLink( &$link, &$nt, $ignoreOtherCond = false ) {
		// Never look for variants of pages in the user namespaces.
		if ( is_object( $nt ) ) {
			$ns = $nt->getNamespace();
			if ( $ns == NS_USER || $ns == NS_USER_TALK ) {
				return;
			}
		}

		$originalLink = $link;
		parent::findVariantLink( $link, $nt, $ignoreOtherCond );

		// With the main language code preferred, undo whatever the parent
		// did to the link text.
		if ( $this->getPreferredVariant() == $this->mMainLanguageCode ) {
			$link = $originalLink;
		}
	}

	/**
	 * An ugly function wrapper for parsing Image titles
	 * (to prevent image name conversion).
	 *
	 * While the current page ($wgTitle) is in the file namespace, text that
	 * starts with "<namespace name>:" is returned unconverted.
	 *
	 * @param $text string
	 * @param $toVariant bool
	 *
	 * @return string
	 */
	public function autoConvert( $text, $toVariant = false ) {
		global $wgTitle;

		if ( is_object( $wgTitle ) && $wgTitle->getNamespace() == NS_FILE ) {
			$prefix = $wgTitle->getNsText() . ':';
			// Literal prefix comparison: the namespace name is data, not a
			// regex, so it must not be interpolated into a pattern unescaped.
			if ( strpos( $text, $prefix ) === 0 ) {
				return $text;
			}
		}

		return parent::autoConvert( $text, $toVariant );
	}

	/**
	 * It translates text into variant.
	 *
	 * After the table-based translation of the parent class, the text is
	 * cut at message placeholders ($1, $2, ...) and the pieces in between
	 * are run through regsConverter().
	 *
	 * NOTE: this method also overwrites the global $wgLanguageCode according
	 * to the target variant.
	 *
	 * @param $text string
	 * @param $toVariant string
	 *
	 * @return string
	 */
	public function translate( $text, $toVariant ) {
		global $wgLanguageCode;

		$text = parent::translate( $text, $toVariant );

		// $letters lists the source-script characters that are allowed to
		// follow a placeholder without becoming part of the split delimiter.
		switch ( $toVariant ) {
			case 'kk-cyrl':
			case 'kk-kz':
				$letters = KK_L_UC . KK_L_LC . 'ʺʹ#0123456789';
				$wgLanguageCode = 'kk';
				break;
			case 'kk-latn':
			case 'kk-tr':
				$letters = KK_C_UC . KK_C_LC . '№0123456789';
				$wgLanguageCode = 'kk-Latn';
				break;
			case 'kk-arab':
			case 'kk-cn':
				$letters = KK_C_UC . KK_C_LC . /*KK_L_UC.KK_L_LC.'ʺʹ'.*/',;\?%\*№0123456789';
				$wgLanguageCode = 'kk-Arab';
				break;
			default:
				$wgLanguageCode = 'kk';
				return $text;
		}

		// disable conversion variables like $1, $2...
		$varsfix = '\$[0-9]';

		$pieces = preg_split(
			'/' . $varsfix . '[^' . $letters . ']+/u',
			$text,
			-1,
			PREG_SPLIT_OFFSET_CAPTURE
		);
		if ( $pieces === false ) {
			// The /u pattern fails on invalid UTF-8. Hand the text back
			// untouched instead of silently returning an empty string.
			return $text;
		}

		$converted = '';
		$cursor = 0;
		foreach ( $pieces as $piece ) {
			list( $chunk, $offset ) = $piece;
			// Copy the delimiter (placeholder plus trailing non-letters)
			// that precedes this piece verbatim.
			$converted .= substr( $text, $cursor, $offset - $cursor );
			$converted .= $this->regsConverter( $chunk, $toVariant );
			$cursor = $offset + strlen( $chunk );
		}
		return $converted;
	}

	/**
	 * Apply the regex rule list of the target variant to a piece of text.
	 *
	 * For the Arabic variants, words that contain a front vowel and none of
	 * the excluded letters first get U+0674 HIGH HAMZA put in front of each
	 * run of Cyrillic letters.
	 *
	 * @param $text string
	 * @param $toVariant string
	 * @return mixed|string
	 */
	public function regsConverter( $text, $toVariant ) {
		if ( $text == '' ) {
			return $text;
		}

		switch ( $toVariant ) {
			case 'kk-arab':
			case 'kk-cn':
				$letters = KK_C_LC . KK_C_UC/*.KK_L_LC.KK_L_UC*/;
				$front = 'әөүіӘӨҮІ'/*.'äöüiÄÖÜİ'*/;
				$excludes = 'еэгғкқЕЭГҒКҚ'/*.'eégğkqEÉGĞKQ'*/;

				// split text to words
				$words = preg_split( '/[\b\s\-\.:]+/', $text, -1, PREG_SPLIT_OFFSET_CAPTURE );
				$marked = '';
				$cursor = 0;
				foreach ( $words as $word ) {
					list( $chunk, $offset ) = $word;
					// Keep the separator that precedes this word.
					$marked .= substr( $text, $cursor, $offset - $cursor );
					// Does the word contain a front vowel? Words that also
					// contain е, э, г, ғ, к or қ are written without hamza.
					if ( preg_match( '/[' . $front . ']/u', $chunk )
						&& !preg_match( '/[' . $excludes . ']/u', $chunk )
					) {
						$marked .= preg_replace( '/[' . $letters . ']+/u', H_HAMZA . '$0', $chunk );
					} else {
						$marked .= $chunk;
					}
					$cursor = $offset + strlen( $chunk );
				}
				$text = $marked;
				$rules = $this->mCyLa2Arab;
				break;
			case 'kk-latn':
			case 'kk-tr':
				$rules = $this->mCyrl2Latn;
				break;
			case 'kk-cyrl':
			case 'kk-kz':
				$rules = $this->mLatn2Cyrl;
				break;
			default:
				return $text;
		}

		// Rules are cumulative: each one works on the output of the previous.
		foreach ( $rules as $pat => $rep ) {
			$text = preg_replace( $pat, $rep, $text );
		}
		return $text;
	}

	/**
	 * We want our external link captions to be converted in variants,
	 * so we return the original text instead -{$text}-, except for URLs.
	 *
	 * @param $text string
	 * @param $noParse string|bool
	 *
	 * @return string
	 */
	public function markNoConversion( $text, $noParse = false ) {
		// The group keeps "^" attached to every scheme; without it only
		// http(s) was anchored and "ftp://" / "irc://" matched anywhere.
		if ( $noParse || preg_match( '/^(?:https?|ftp|irc):\/\//', $text ) ) {
			return parent::markNoConversion( $text );
		}
		return $text;
	}

	/**
	 * @param $key string
	 * @return String The key passed through autoConvert() for variant 'kk'
	 */
	public function convertCategoryKey( $key ) {
		return $this->autoConvert( $key, 'kk' );
	}
}
|
|
|
|
|
|
|
WARNING: HUGE COMMIT
Doxygen documentation update:
* Changed alls @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file description, it seems that it should be explicitely decalred for file descriptions, otherwise doxygen will think that the comment document the first class, variabled, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>
Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage
One more thing: there are still a lot of warnings when generating the doc.
2008-05-20 17:13:28 +00:00
|
|
|
|
/**
 * Class that handles Cyrillic, Latin and Arabic scripts for Kazakh.
 * Right now it only distinguishes kk_cyrl, kk_latn, kk_arab and kk_kz,
 * kk_tr, kk_cn.
 *
 * @ingroup Language
 */
class LanguageKk extends LanguageKk_cyrl {

	/**
	 * Set up the variant list and fallbacks, create the KkConverter and
	 * register it in $wgHooks['ArticleSaveComplete'].
	 */
	public function __construct() {
		global $wgHooks;
		parent::__construct();

		$variants = array( 'kk', 'kk-cyrl', 'kk-latn', 'kk-arab', 'kk-kz', 'kk-tr', 'kk-cn' );
		$variantfallbacks = array(
			'kk' => 'kk-cyrl',
			'kk-cyrl' => 'kk',
			'kk-latn' => 'kk',
			'kk-arab' => 'kk',
			'kk-kz' => 'kk-cyrl',
			'kk-tr' => 'kk-latn',
			'kk-cn' => 'kk-arab'
		);

		$this->mConverter = new KkConverter( $this, 'kk', $variants, $variantfallbacks );

		$wgHooks['ArticleSaveComplete'][] = $this->mConverter;
	}

	/**
	 * Work around for right-to-left direction support in kk-arab and kk-cn
	 *
	 * @return bool
	 */
	public function isRTL() {
		$variant = $this->getPreferredVariant();
		if ( $variant == 'kk-arab' || $variant == 'kk-cn' ) {
			return true;
		}
		return parent::isRTL();
	}

	/**
	 * It fixes issue with ucfirst for transforming 'i' to 'İ'
	 *
	 * @param $string string
	 *
	 * @return string
	 */
	public function ucfirst( $string ) {
		$variant = $this->getPreferredVariant();
		$isLatin = ( $variant == 'kk-latn' || $variant == 'kk-tr' );

		// strncmp() instead of $string[0]: indexing an empty string raises
		// an "Uninitialized string offset" notice/warning.
		if ( $isLatin && strncmp( $string, 'i', 1 ) === 0 ) {
			return 'İ' . substr( $string, 1 );
		}
		return parent::ucfirst( $string );
	}

	/**
	 * It fixes issue with lcfirst for transforming 'I' to 'ı'
	 *
	 * @param $string string
	 *
	 * @return string
	 */
	public function lcfirst( $string ) {
		$variant = $this->getPreferredVariant();
		$isLatin = ( $variant == 'kk-latn' || $variant == 'kk-tr' );

		// strncmp() instead of $string[0]: indexing an empty string raises
		// an "Uninitialized string offset" notice/warning.
		if ( $isLatin && strncmp( $string, 'I', 1 ) === 0 ) {
			return 'ı' . substr( $string, 1 );
		}
		return parent::lcfirst( $string );
	}

	/**
	 * Dispatch grammar conversion to the parent-class routine that matches
	 * the script of the preferred variant.
	 *
	 * @param $word string
	 * @param $case string
	 * @return string
	 */
	public function convertGrammar( $word, $case ) {
		wfProfileIn( __METHOD__ );

		$variant = $this->getPreferredVariant();
		switch ( $variant ) {
			case 'kk-arab':
			case 'kk-cn':
				$word = parent::convertGrammarKk_arab( $word, $case );
				break;
			case 'kk-latn':
			case 'kk-tr':
				$word = parent::convertGrammarKk_latn( $word, $case );
				break;
			default:
				// 'kk-cyrl', 'kk-kz', 'kk' and anything unrecognised use
				// the Cyrillic rules.
				$word = parent::convertGrammarKk_cyrl( $word, $case );
		}

		wfProfileOut( __METHOD__ );
		return $word;
	}
}
|