MediaWiki uses a number of nonstandard codes which do not validate according to the IANA language subtag registry. Some of them have the wrong semantics entirely: MediaWiki's `sr-ec` variant maps to BCP 47 `sr-EC` which is "Serbian as used in Ethiopia" (!). Extend LanguageCode::bcp47() to map our nonstandard codes to valid BCP 47 language codes. Export the mapping so that it can be used in JavaScript's corresponding mw.language.bcp47() implementation as well, and return the standard BCP 47 codes in the siteinfo API. Thanks to TheDJ (I10b4473c7e53f027812bbccf26bb47aec15fddfd) and Fomafix (I93efc190714ba76247d30ba49fc21ae872fc3555) for previous attempts at this! Also removed a fixme for the name of 'Twi', dating back to 2004 (f59c3be23b) -- checking tw.wikipedia.org it certainly appears that the autonym of 'Twi' is correctly 'Twi'. Tracking bugs for invalid language codes are T125073 and T145535. Discussion of zh-XX => zh-HanX-XX mapping is at T198419. This is a replay of an earlier merged patch,8380f0173e, which had to be reverted because it caused regressions in the Babel extension (T199941). Bug: T34483 Bug: T106367 Bug: T120847 Depends-On: I27a5b8e45b34c6b57c1b612b11548001c88cd483 Change-Id: Iebbc604af21d7f2af9c1f1ab2574cb5f309bf6ed
491 lines
22 KiB
PHP
491 lines
22 KiB
PHP
<?php
|
||
/**
|
||
* Language names.
|
||
*
|
||
* This program is free software; you can redistribute it and/or modify
|
||
* it under the terms of the GNU General Public License as published by
|
||
* the Free Software Foundation; either version 2 of the License, or
|
||
* (at your option) any later version.
|
||
*
|
||
* This program is distributed in the hope that it will be useful,
|
||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
* GNU General Public License for more details.
|
||
*
|
||
* You should have received a copy of the GNU General Public License along
|
||
* with this program; if not, write to the Free Software Foundation, Inc.,
|
||
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
||
* http://www.gnu.org/copyleft/gpl.html
|
||
*
|
||
* @file
|
||
* @ingroup Language
|
||
*/
|
||
|
||
namespace MediaWiki\Languages\Data;
|
||
|
||
/**
|
||
* Language names in their own languages (language autonyms).
|
||
*
|
||
* These determine things like interwikis, language selectors, and so on.
|
||
* Safe to change without running scripts on the respective sites.
|
||
*
|
||
* \u{200E} is the left-to-right marker and
|
||
* \u{200F} is the right-to-left marker.
|
||
* They are required for ensuring the correct display of brackets in
|
||
* mixed rtl/ltr environment.
|
||
*
|
||
* Some writing systems require some line-height fixes. This includes
|
||
* most Indic scripts, like Devanagari.
|
||
* If you are adding support for such a language, add it also to
|
||
* the relevant section in shared.css.
|
||
*
|
||
* Do not use this class directly. Use Language::fetchLanguageNames(), which
|
||
* includes support for the CLDR extension.
|
||
*
|
||
* @ingroup Language
|
||
*/
|
||
class Names {
|
||
public static $names = [
|
||
'aa' => 'Qafár af', # Afar
|
||
'ab' => 'Аҧсшәа', # Abkhaz
|
||
'abs' => 'bahasa ambon', # Ambonese Malay, T193566
|
||
'ace' => 'Acèh', # Aceh
|
||
'ady' => 'адыгабзэ', # Adyghe
|
||
'ady-cyrl' => 'адыгабзэ', # Adyghe
|
||
'aeb' => 'تونسي/Tûnsî', # Tunisian Arabic (multiple scripts - defaults to Arabic)
|
||
'aeb-arab' => 'تونسي', # Tunisian Arabic (Arabic Script)
|
||
'aeb-latn' => 'Tûnsî', # Tunisian Arabic (Latin Script)
|
||
'af' => 'Afrikaans', # Afrikaans
|
||
'ak' => 'Akan', # Akan
|
||
'aln' => 'Gegë', # Gheg Albanian
|
||
'als' => 'Alemannisch', # Alemannic -- not a valid code, for compatibility. See gsw.
|
||
'am' => 'አማርኛ', # Amharic
|
||
'an' => 'aragonés', # Aragonese
|
||
'ang' => 'Ænglisc', # Old English, T25283
|
||
'anp' => 'अङ्गिका', # Angika
|
||
'ar' => 'العربية', # Arabic
|
||
'arc' => 'ܐܪܡܝܐ', # Aramaic
|
||
'arn' => 'mapudungun', # Mapuche, Mapudungu, Araucanian (Araucano)
|
||
'arq' => 'جازايرية', # Algerian Spoken Arabic
|
||
'ary' => 'Maġribi', # Moroccan Spoken Arabic
|
||
'arz' => 'مصرى', # Egyptian Spoken Arabic
|
||
'as' => 'অসমীয়া', # Assamese
|
||
'ase' => 'American sign language', # American sign language
|
||
'ast' => 'asturianu', # Asturian
|
||
'atj' => 'Atikamekw', # Atikamekw
|
||
'av' => 'авар', # Avar
|
||
'avk' => 'Kotava', # Kotava
|
||
'awa' => 'अवधी', # Awadhi
|
||
'ay' => 'Aymar aru', # Aymara
|
||
'az' => 'azərbaycanca', # Azerbaijani
|
||
'azb' => 'تۆرکجه', # South Azerbaijani
|
||
'ba' => 'башҡортса', # Bashkir
|
||
'ban' => 'Basa Bali', # Balinese
|
||
'bar' => 'Boarisch', # Bavarian (Austro-Bavarian and South Tyrolean)
|
||
'bat-smg' => 'žemaitėška', # Samogitian (deprecated code, 'sgs' in ISO 639-3 since 2010-06-30 )
|
||
'bbc' => 'Batak Toba', # Batak Toba (falls back to bbc-latn)
|
||
'bbc-latn' => 'Batak Toba', # Batak Toba
|
||
'bcc' => 'جهلسری بلوچی', # Southern Balochi
|
||
'bcl' => 'Bikol Central', # Bikol: Central Bicolano language
|
||
'be' => 'беларуская', # Belarusian normative
|
||
'be-tarask' => "беларуская (тарашкевіца)\u{200E}", # Belarusian in Taraskievica orthography
|
||
'be-x-old' => "беларуская (тарашкевіца)\u{200E}", # (be-tarask compat)
|
||
'bg' => 'български', # Bulgarian
|
||
'bgn' => 'روچ کپتین بلوچی', # Western Balochi
|
||
'bh' => 'भोजपुरी', # Bihari macro language. Falls back to Bhojpuri (bho)
|
||
'bho' => 'भोजपुरी', # Bhojpuri
|
||
'bi' => 'Bislama', # Bislama
|
||
'bjn' => 'Bahasa Banjar', # Banjarese
|
||
'bm' => 'bamanankan', # Bambara
|
||
'bn' => 'বাংলা', # Bengali
|
||
'bo' => 'བོད་ཡིག', # Tibetan
|
||
'bpy' => 'বিষ্ণুপ্রিয়া মণিপুরী', # Bishnupriya Manipuri
|
||
'bqi' => 'بختیاری', # Bakthiari
|
||
'br' => 'brezhoneg', # Breton
|
||
'brh' => 'Bráhuí', # Brahui
|
||
'bs' => 'bosanski', # Bosnian
|
||
'btm' => 'Batak Mandailing', # Batak Mandailing
|
||
'bto' => 'Iriga Bicolano', # Rinconada Bikol
|
||
'bug' => 'ᨅᨔ ᨕᨘᨁᨗ', # Buginese
|
||
'bxr' => 'буряад', # Buryat (Russia)
|
||
'ca' => 'català', # Catalan
|
||
'cbk-zam' => 'Chavacano de Zamboanga', # Zamboanga Chavacano
|
||
'cdo' => 'Mìng-dĕ̤ng-ngṳ̄', # Min Dong
|
||
'ce' => 'нохчийн', # Chechen
|
||
'ceb' => 'Cebuano', # Cebuano
|
||
'ch' => 'Chamoru', # Chamorro
|
||
'cho' => 'Choctaw', # Choctaw
|
||
'chr' => 'ᏣᎳᎩ', # Cherokee
|
||
'chy' => 'Tsetsêhestâhese', # Cheyenne
|
||
'ckb' => 'کوردی', # Central Kurdish
|
||
'co' => 'corsu', # Corsican
|
||
'cps' => 'Capiceño', # Capiznon
|
||
'cr' => 'Nēhiyawēwin / ᓀᐦᐃᔭᐍᐏᐣ', # Cree
|
||
'crh' => 'qırımtatarca', # Crimean Tatar (multiple scripts - defaults to Latin)
|
||
'crh-latn' => "qırımtatarca (Latin)\u{200E}", # Crimean Tatar (Latin)
|
||
'crh-cyrl' => "къырымтатарджа (Кирилл)\u{200E}", # Crimean Tatar (Cyrillic)
|
||
'cs' => 'čeština', # Czech
|
||
'csb' => 'kaszëbsczi', # Cassubian
|
||
'cu' => 'словѣньскъ / ⰔⰎⰑⰂⰡⰐⰠⰔⰍⰟ', # Old Church Slavonic (ancient language)
|
||
'cv' => 'Чӑвашла', # Chuvash
|
||
'cy' => 'Cymraeg', # Welsh
|
||
'da' => 'dansk', # Danish
|
||
'de' => 'Deutsch', # German ("Du")
|
||
'de-at' => 'Österreichisches Deutsch', # Austrian German
|
||
'de-ch' => 'Schweizer Hochdeutsch', # Swiss Standard German
|
||
'de-formal' => "Deutsch (Sie-Form)\u{200E}", # German - formal address ("Sie")
|
||
'din' => 'Thuɔŋjäŋ', # Dinka
|
||
'diq' => 'Zazaki', # Zazaki
|
||
'dsb' => 'dolnoserbski', # Lower Sorbian
|
||
'dtp' => 'Dusun Bundu-liwan', # Central Dusun
|
||
'dty' => 'डोटेली', # Doteli
|
||
'dv' => 'ދިވެހިބަސް', # Dhivehi
|
||
'dz' => 'ཇོང་ཁ', # Dzongkha (Bhutan)
|
||
'ee' => 'eʋegbe', # Éwé
|
||
'egl' => 'Emiliàn', # Emilian
|
||
'el' => 'Ελληνικά', # Greek
|
||
'eml' => 'emiliàn e rumagnòl', # Emiliano-Romagnolo / Sammarinese
|
||
'en' => 'English', # English
|
||
'en-ca' => 'Canadian English', # Canadian English
|
||
'en-gb' => 'British English', # British English
|
||
'eo' => 'Esperanto', # Esperanto
|
||
'es' => 'español', # Spanish
|
||
'es-419' => 'español de América Latina', # Spanish for the Latin America and Caribbean region
|
||
'es-formal' => "español (formal)\u{200E}", # Spanish formal address
|
||
'et' => 'eesti', # Estonian
|
||
'eu' => 'euskara', # Basque
|
||
'ext' => 'estremeñu', # Extremaduran
|
||
'fa' => 'فارسی', # Persian
|
||
'ff' => 'Fulfulde', # Fulfulde, Maasina
|
||
'fi' => 'suomi', # Finnish
|
||
'fit' => 'meänkieli', # Tornedalen Finnish
|
||
'fiu-vro' => 'Võro', # Võro (deprecated code, 'vro' in ISO 639-3 since 2009-01-16)
|
||
'fj' => 'Na Vosa Vakaviti', # Fijian
|
||
'fo' => 'føroyskt', # Faroese
|
||
'fr' => 'français', # French
|
||
'frc' => 'français cadien', # Cajun French
|
||
'frp' => 'arpetan', # Franco-Provençal/Arpitan
|
||
'frr' => 'Nordfriisk', # North Frisian
|
||
'fur' => 'furlan', # Friulian
|
||
'fy' => 'Frysk', # Frisian
|
||
'ga' => 'Gaeilge', # Irish
|
||
'gag' => 'Gagauz', # Gagauz
|
||
'gan' => '贛語', # Gan (multiple scripts - defaults to Traditional)
|
||
'gan-hans' => "赣语(简体)\u{200E}", # Gan (Simplified Han)
|
||
'gan-hant' => "贛語(繁體)\u{200E}", # Gan (Traditional Han)
|
||
'gcr' => 'kréyòl gwiyanè', # Guianan Creole
|
||
'gd' => 'Gàidhlig', # Scots Gaelic
|
||
'gl' => 'galego', # Galician
|
||
'glk' => 'گیلکی', # Gilaki
|
||
'gn' => 'Avañe\'ẽ', # Guaraní, Paraguayan
|
||
'gom' => 'गोंयची कोंकणी / Gõychi Konknni', # Goan Konkani
|
||
'gom-deva' => 'गोंयची कोंकणी', # Goan Konkani (Devanagari script)
|
||
'gom-latn' => 'Gõychi Konknni', # Goan Konkani (Latin script)
|
||
'gor' => 'Bahasa Hulontalo', # Gorontalo
|
||
'got' => '𐌲𐌿𐍄𐌹𐍃𐌺', # Gothic
|
||
'grc' => 'Ἀρχαία ἑλληνικὴ', # Ancient Greek
|
||
'gsw' => 'Alemannisch', # Alemannic
|
||
'gu' => 'ગુજરાતી', # Gujarati
|
||
'gv' => 'Gaelg', # Manx
|
||
'ha' => 'Hausa', # Hausa
|
||
'hak' => '客家語/Hak-kâ-ngî', # Hakka
|
||
'haw' => 'Hawaiʻi', # Hawaiian
|
||
'he' => 'עברית', # Hebrew
|
||
'hi' => 'हिन्दी', # Hindi
|
||
'hif' => 'Fiji Hindi', # Fijian Hindi (multiple scripts - defaults to Latin)
|
||
'hif-latn' => 'Fiji Hindi', # Fiji Hindi (Latin script)
|
||
'hil' => 'Ilonggo', # Hiligaynon
|
||
'ho' => 'Hiri Motu', # Hiri Motu
|
||
'hr' => 'hrvatski', # Croatian
|
||
'hrx' => 'Hunsrik', # Riograndenser Hunsrückisch
|
||
'hsb' => 'hornjoserbsce', # Upper Sorbian
|
||
'ht' => 'Kreyòl ayisyen', # Haitian Creole French
|
||
'hu' => 'magyar', # Hungarian
|
||
'hu-formal' => "magyar (formal)\u{200E}", # Hungarian formal address
|
||
'hy' => 'հայերեն', # Armenian, T202611
|
||
'hyw' => 'արեւմտահայերէն', # Western Armenian, T201276
|
||
'hz' => 'Otsiherero', # Herero
|
||
'ia' => 'interlingua', # Interlingua (IALA)
|
||
'id' => 'Bahasa Indonesia', # Indonesian
|
||
'ie' => 'Interlingue', # Interlingue (Occidental)
|
||
'ig' => 'Igbo', # Igbo
|
||
'ii' => 'ꆇꉙ', # Sichuan Yi
|
||
'ik' => 'Iñupiak', # Inupiak (Inupiatun, Northwest Alaska / Inupiatun, North Alaskan)
|
||
'ike-cans' => 'ᐃᓄᒃᑎᑐᑦ', # Inuktitut, Eastern Canadian (Unified Canadian Aboriginal Syllabics)
|
||
'ike-latn' => 'inuktitut', # Inuktitut, Eastern Canadian (Latin script)
|
||
'ilo' => 'Ilokano', # Ilokano
|
||
'inh' => 'ГӀалгӀай', # Ingush
|
||
'io' => 'Ido', # Ido
|
||
'is' => 'íslenska', # Icelandic
|
||
'it' => 'italiano', # Italian
|
||
'iu' => 'ᐃᓄᒃᑎᑐᑦ/inuktitut', # Inuktitut (macro language, see ike/ikt, falls back to ike-cans)
|
||
'ja' => '日本語', # Japanese
|
||
'jam' => 'Patois', # Jamaican Creole English
|
||
'jbo' => 'la .lojban.', # Lojban
|
||
'jut' => 'jysk', # Jutish / Jutlandic
|
||
'jv' => 'Basa Jawa', # Javanese
|
||
'ka' => 'ქართული', # Georgian
|
||
'kaa' => 'Qaraqalpaqsha', # Karakalpak
|
||
'kab' => 'Taqbaylit', # Kabyle
|
||
'kbd' => 'Адыгэбзэ', # Kabardian
|
||
'kbd-cyrl' => 'Адыгэбзэ', # Kabardian (Cyrillic)
|
||
'kbp' => 'Kabɩyɛ', # Kabiyè
|
||
'kg' => 'Kongo', # Kongo, (FIXME!) should probaly be KiKongo or KiKoongo
|
||
'khw' => 'کھوار', # Khowar
|
||
'ki' => 'Gĩkũyũ', # Gikuyu
|
||
'kiu' => 'Kırmancki', # Kirmanjki
|
||
'kj' => 'Kwanyama', # Kwanyama
|
||
'kk' => 'қазақша', # Kazakh (multiple scripts - defaults to Cyrillic)
|
||
'kk-arab' => "قازاقشا (تٴوتە)\u{200F}", # Kazakh Arabic
|
||
'kk-cyrl' => "қазақша (кирил)\u{200E}", # Kazakh Cyrillic
|
||
'kk-latn' => "qazaqşa (latın)\u{200E}", # Kazakh Latin
|
||
'kk-cn' => "قازاقشا (جۇنگو)\u{200F}", # Kazakh (China)
|
||
'kk-kz' => "қазақша (Қазақстан)\u{200E}", # Kazakh (Kazakhstan)
|
||
'kk-tr' => "qazaqşa (Türkïya)\u{200E}", # Kazakh (Turkey)
|
||
'kl' => 'kalaallisut', # Inuktitut, Greenlandic/Greenlandic/Kalaallisut (kal)
|
||
'km' => 'ភាសាខ្មែរ', # Khmer, Central
|
||
'kn' => 'ಕನ್ನಡ', # Kannada
|
||
'ko' => '한국어', # Korean
|
||
'ko-kp' => '조선말', # Korean (DPRK), T190324
|
||
'koi' => 'Перем Коми', # Komi-Permyak
|
||
'kr' => 'Kanuri', # Kanuri, Central
|
||
'krc' => 'къарачай-малкъар', # Karachay-Balkar
|
||
'kri' => 'Krio', # Krio
|
||
'krj' => 'Kinaray-a', # Kinaray-a
|
||
'krl' => 'karjal', # Karelian
|
||
'ks' => 'कॉशुर / کٲشُر', # Kashmiri (multiple scripts - defaults to Perso-Arabic)
|
||
'ks-arab' => 'کٲشُر', # Kashmiri (Perso-Arabic script)
|
||
'ks-deva' => 'कॉशुर', # Kashmiri (Devanagari script)
|
||
'ksh' => 'Ripoarisch', # Ripuarian
|
||
'ku' => 'kurdî', # Kurdish (multiple scripts - defaults to Latin)
|
||
'ku-latn' => "kurdî (latînî)\u{200E}", # Northern Kurdish (Latin script)
|
||
'ku-arab' => "كوردي (عەرەبی)\u{200F}", # Northern Kurdish (Arabic script) (falls back to ckb)
|
||
'kum' => 'къумукъ', # Kumyk (Cyrillic, 'kum-latn' for Latin script)
|
||
'kv' => 'коми', # Komi-Zyrian (Cyrillic is common script but also written in Latin script)
|
||
'kw' => 'kernowek', # Cornish
|
||
'ky' => 'Кыргызча', # Kirghiz
|
||
'la' => 'Latina', # Latin
|
||
'lad' => 'Ladino', # Ladino
|
||
'lb' => 'Lëtzebuergesch', # Luxembourgish
|
||
'lbe' => 'лакку', # Lak
|
||
'lez' => 'лезги', # Lezgi
|
||
'lfn' => 'Lingua Franca Nova', # Lingua Franca Nova
|
||
'lg' => 'Luganda', # Ganda
|
||
'li' => 'Limburgs', # Limburgian
|
||
'lij' => 'Ligure', # Ligurian
|
||
'liv' => 'Līvõ kēļ', # Livonian
|
||
'lki' => 'لەکی', # Laki
|
||
'lmo' => 'lumbaart', # Lombard
|
||
'ln' => 'lingála', # Lingala
|
||
'lo' => 'ລາວ', # Laotian
|
||
'lrc' => 'لۊری شومالی', # Northern Luri
|
||
'loz' => 'Silozi', # Lozi
|
||
'lt' => 'lietuvių', # Lithuanian
|
||
'ltg' => 'latgaļu', # Latgalian
|
||
'lus' => 'Mizo ţawng', # Mizo/Lushai
|
||
'luz' => 'لئری دوٙمینی', # Southern Luri
|
||
'lv' => 'latviešu', # Latvian
|
||
'lzh' => '文言', # Literary Chinese, T10217
|
||
'lzz' => 'Lazuri', # Laz
|
||
'mai' => 'मैथिली', # Maithili
|
||
'map-bms' => 'Basa Banyumasan', # Banyumasan ('jv-x-bms')
|
||
'mdf' => 'мокшень', # Moksha
|
||
'mg' => 'Malagasy', # Malagasy
|
||
'mh' => 'Ebon', # Marshallese
|
||
'mhr' => 'олык марий', # Eastern Mari
|
||
'mi' => 'Māori', # Maori
|
||
'min' => 'Baso Minangkabau', # Minangkabau
|
||
'mk' => 'македонски', # Macedonian
|
||
'ml' => 'മലയാളം', # Malayalam
|
||
'mn' => 'монгол', # Halh Mongolian (Cyrillic) (ISO 639-3: khk)
|
||
'mni' => 'মেইতেই লোন্', # Manipuri/Meitei
|
||
'mnw' => 'ဘာသာ မန်', # Mon, T201583
|
||
'mo' => 'молдовеняскэ', # Moldovan, deprecated (ISO 639-2: ro-Cyrl-MD)
|
||
'mr' => 'मराठी', # Marathi
|
||
'mrj' => 'кырык мары', # Hill Mari
|
||
'ms' => 'Bahasa Melayu', # Malay
|
||
'mt' => 'Malti', # Maltese
|
||
'mus' => 'Mvskoke', # Muskogee/Creek
|
||
'mwl' => 'Mirandés', # Mirandese
|
||
'my' => 'မြန်မာဘာသာ', # Burmese
|
||
'myv' => 'эрзянь', # Erzya
|
||
'mzn' => 'مازِرونی', # Mazanderani
|
||
'na' => 'Dorerin Naoero', # Nauruan
|
||
'nah' => 'Nāhuatl', # Nahuatl (added to ISO 639-3 on 2006-10-31)
|
||
'nan' => 'Bân-lâm-gú', # Min-nan, T10217
|
||
'nap' => 'Napulitano', # Neapolitan, T45793
|
||
'nb' => 'norsk bokmål', # Norwegian (Bokmal)
|
||
'nds' => 'Plattdüütsch', # Low German ''or'' Low Saxon
|
||
'nds-nl' => 'Nedersaksies', # aka Nedersaksisch: Dutch Low Saxon
|
||
'ne' => 'नेपाली', # Nepali
|
||
'new' => 'नेपाल भाषा', # Newar / Nepal Bhasha
|
||
'ng' => 'Oshiwambo', # Ndonga
|
||
'niu' => 'Niuē', # Niuean
|
||
'nl' => 'Nederlands', # Dutch
|
||
'nl-informal' => "Nederlands (informeel)\u{200E}", # Dutch (informal address ("je"))
|
||
'nn' => 'norsk nynorsk', # Norwegian (Nynorsk)
|
||
'no' => 'norsk', # Norwegian macro language (falls back to nb).
|
||
'nov' => 'Novial', # Novial
|
||
'nrm' => 'Nouormand', # Norman (invalid code; 'nrf' in ISO 639 since 2014)
|
||
'nso' => 'Sesotho sa Leboa', # Northern Sotho
|
||
'nv' => 'Diné bizaad', # Navajo
|
||
'ny' => 'Chi-Chewa', # Chichewa
|
||
'nys' => 'Nyunga', # Nyungar
|
||
'oc' => 'occitan', # Occitan
|
||
'olo' => 'Livvinkarjala', # Livvi-Karelian
|
||
'om' => 'Oromoo', # Oromo
|
||
'or' => 'ଓଡ଼ିଆ', # Oriya
|
||
'os' => 'Ирон', # Ossetic, T31091
|
||
'pa' => 'ਪੰਜਾਬੀ', # Eastern Punjabi (Gurmukhi script) (pan)
|
||
'pag' => 'Pangasinan', # Pangasinan
|
||
'pam' => 'Kapampangan', # Pampanga
|
||
'pap' => 'Papiamentu', # Papiamentu
|
||
'pcd' => 'Picard', # Picard
|
||
'pdc' => 'Deitsch', # Pennsylvania German
|
||
'pdt' => 'Plautdietsch', # Plautdietsch/Mennonite Low German
|
||
'pfl' => 'Pälzisch', # Palatinate German
|
||
'pi' => 'पालि', # Pali
|
||
'pih' => 'Norfuk / Pitkern', # Norfuk/Pitcairn/Norfolk
|
||
'pl' => 'polski', # Polish
|
||
'pms' => 'Piemontèis', # Piedmontese
|
||
'pnb' => 'پنجابی', # Western Punjabi
|
||
'pnt' => 'Ποντιακά', # Pontic/Pontic Greek
|
||
'prg' => 'Prūsiskan', # Prussian
|
||
'ps' => 'پښتو', # Pashto
|
||
'pt' => 'português', # Portuguese
|
||
'pt-br' => 'português do Brasil', # Brazilian Portuguese
|
||
'qu' => 'Runa Simi', # Southern Quechua
|
||
'qug' => 'Runa shimi', # Kichwa/Northern Quechua (temporarily used until Kichwa has its own)
|
||
'rgn' => 'Rumagnôl', # Romagnol
|
||
'rif' => 'Tarifit', # Tarifit
|
||
'rm' => 'rumantsch', # Raeto-Romance
|
||
'rmy' => 'Romani', # Vlax Romany
|
||
'rn' => 'Kirundi', # Rundi/Kirundi/Urundi
|
||
'ro' => 'română', # Romanian
|
||
'roa-rup' => 'armãneashti', # Aromanian (deprecated code, 'rup' exists in ISO 639-3)
|
||
'roa-tara' => 'tarandíne', # Tarantino ('nap-x-tara')
|
||
'ru' => 'русский', # Russian
|
||
'rue' => 'русиньскый', # Rusyn
|
||
'rup' => 'armãneashti', # Aromanian
|
||
'ruq' => 'Vlăheşte', # Megleno-Romanian (multiple scripts - defaults to Latin)
|
||
'ruq-cyrl' => 'Влахесте', # Megleno-Romanian (Cyrillic script)
|
||
# 'ruq-grek' => 'Βλαεστε', # Megleno-Romanian (Greek script)
|
||
'ruq-latn' => 'Vlăheşte', # Megleno-Romanian (Latin script)
|
||
'rw' => 'Kinyarwanda', # Kinyarwanda, should possibly be Kinyarwandi
|
||
'sa' => 'संस्कृतम्', # Sanskrit
|
||
'sah' => 'саха тыла', # Sakha
|
||
'sat' => 'ᱥᱟᱱᱛᱟᱲᱤ', # Santali
|
||
'sc' => 'sardu', # Sardinian
|
||
'scn' => 'sicilianu', # Sicilian
|
||
'sco' => 'Scots', # Scots
|
||
'sd' => 'سنڌي', # Sindhi
|
||
'sdc' => 'Sassaresu', # Sassarese
|
||
'sdh' => 'کوردی خوارگ', # Southern Kurdish
|
||
'se' => 'davvisámegiella', # Northern Sami
|
||
'sei' => 'Cmique Itom', # Seri
|
||
'ses' => 'Koyraboro Senni', # Koyraboro Senni
|
||
'sg' => 'Sängö', # Sango/Sangho
|
||
'sgs' => 'žemaitėška', # Samogitian
|
||
'sh' => 'srpskohrvatski / српскохрватски', # Serbocroatian
|
||
'shi' => 'Tašlḥiyt/ⵜⴰⵛⵍⵃⵉⵜ', # Tachelhit (multiple scripts - defaults to Latin)
|
||
'shi-tfng' => 'ⵜⴰⵛⵍⵃⵉⵜ', # Tachelhit (Tifinagh script)
|
||
'shi-latn' => 'Tašlḥiyt', # Tachelhit (Latin script)
|
||
'shn' => 'ၽႃႇသႃႇတႆး ', # Shan
|
||
'shy-latn' => 'tachawit', # Shawiya (Latin script) - T194047
|
||
'si' => 'සිංහල', # Sinhalese
|
||
'simple' => 'Simple English', # Simple English
|
||
'sk' => 'slovenčina', # Slovak
|
||
'skr' => 'سرائیکی', # Saraiki (multiple scripts - defaults to Arabic)
|
||
'skr-arab' => 'سرائیکی', # Saraiki (Arabic script)
|
||
'sl' => 'slovenščina', # Slovenian
|
||
'sli' => 'Schläsch', # Lower Selisian
|
||
'sm' => 'Gagana Samoa', # Samoan
|
||
'sma' => 'Åarjelsaemien', # Southern Sami
|
||
'sn' => 'chiShona', # Shona
|
||
'so' => 'Soomaaliga', # Somali
|
||
'sq' => 'shqip', # Albanian
|
||
'sr' => 'српски / srpski', # Serbian (multiple scripts - defaults to Cyrillic)
|
||
'sr-ec' => "српски (ћирилица)\u{200E}", # Serbian Cyrillic ekavian
|
||
'sr-el' => "srpski (latinica)\u{200E}", # Serbian Latin ekavian
|
||
'srn' => 'Sranantongo', # Sranan Tongo
|
||
'ss' => 'SiSwati', # Swati
|
||
'st' => 'Sesotho', # Southern Sotho
|
||
'sty' => 'cебертатар', # Siberian Tatar
|
||
'stq' => 'Seeltersk', # Saterland Frisian
|
||
'su' => 'Basa Sunda', # Sundanese
|
||
'sv' => 'svenska', # Swedish
|
||
'sw' => 'Kiswahili', # Swahili
|
||
'szl' => 'ślůnski', # Silesian
|
||
'ta' => 'தமிழ்', # Tamil
|
||
'tay' => 'Tayal', # Atayal
|
||
'tcy' => 'ತುಳು', # Tulu
|
||
'te' => 'తెలుగు', # Telugu
|
||
'tet' => 'tetun', # Tetun
|
||
'tg' => 'тоҷикӣ', # Tajiki (falls back to tg-cyrl)
|
||
'tg-cyrl' => 'тоҷикӣ', # Tajiki (Cyrllic script) (default)
|
||
'tg-latn' => 'tojikī', # Tajiki (Latin script)
|
||
'th' => 'ไทย', # Thai
|
||
'ti' => 'ትግርኛ', # Tigrinya
|
||
'tk' => 'Türkmençe', # Turkmen
|
||
'tl' => 'Tagalog', # Tagalog
|
||
'tly' => 'толышә зывон', # Talysh
|
||
'tn' => 'Setswana', # Setswana
|
||
'to' => 'lea faka-Tonga', # Tonga (Tonga Islands)
|
||
'tpi' => 'Tok Pisin', # Tok Pisin
|
||
'tr' => 'Türkçe', # Turkish
|
||
'tru' => 'Ṫuroyo', # Turoyo
|
||
'ts' => 'Xitsonga', # Tsonga
|
||
'tt' => 'татарча/tatarça', # Tatar (multiple scripts - defaults to Cyrillic)
|
||
'tt-cyrl' => 'татарча', # Tatar (Cyrillic script) (default)
|
||
'tt-latn' => 'tatarça', # Tatar (Latin script)
|
||
'tum' => 'chiTumbuka', # Tumbuka
|
||
'tw' => 'Twi', # Twi
|
||
'ty' => 'reo tahiti', # Tahitian
|
||
'tyv' => 'тыва дыл', # Tyvan
|
||
'tzm' => 'ⵜⴰⵎⴰⵣⵉⵖⵜ', # Tamazight
|
||
'udm' => 'удмурт', # Udmurt
|
||
'ug' => 'ئۇيغۇرچە / Uyghurche', # Uyghur (multiple scripts - defaults to Arabic)
|
||
'ug-arab' => 'ئۇيغۇرچە', # Uyghur (Arabic script) (default)
|
||
'ug-latn' => 'Uyghurche', # Uyghur (Latin script)
|
||
'uk' => 'українська', # Ukrainian
|
||
'ur' => 'اردو', # Urdu
|
||
'uz' => 'oʻzbekcha/ўзбекча', # Uzbek (multiple scripts - defaults to Latin)
|
||
'uz-cyrl' => 'ўзбекча', # Uzbek Cyrillic
|
||
'uz-latn' => 'oʻzbekcha', # Uzbek Latin (default)
|
||
've' => 'Tshivenda', # Venda
|
||
'vec' => 'vèneto', # Venetian
|
||
'vep' => 'vepsän kel’', # Veps
|
||
'vi' => 'Tiếng Việt', # Vietnamese
|
||
'vls' => 'West-Vlams', # West Flemish
|
||
'vmf' => 'Mainfränkisch', # Upper Franconian, Main-Franconian
|
||
'vo' => 'Volapük', # Volapük
|
||
'vot' => 'Vaďďa', # Vod/Votian
|
||
'vro' => 'Võro', # Võro
|
||
'wa' => 'walon', # Walloon
|
||
'war' => 'Winaray', # Waray-Waray
|
||
'wo' => 'Wolof', # Wolof
|
||
'wuu' => '吴语', # Wu Chinese
|
||
'xal' => 'хальмг', # Kalmyk-Oirat
|
||
'xh' => 'isiXhosa', # Xhosan
|
||
'xmf' => 'მარგალური', # Mingrelian
|
||
'yi' => 'ייִדיש', # Yiddish
|
||
'yo' => 'Yorùbá', # Yoruba
|
||
'yue' => '粵語', # Cantonese
|
||
'za' => 'Vahcuengh', # Zhuang
|
||
'zea' => 'Zeêuws', # Zeeuws/Zeaws
|
||
'zgh' => 'ⵜⴰⵎⴰⵣⵉⵖⵜ ⵜⴰⵏⴰⵡⴰⵢⵜ', # Moroccan Amazigh (multiple scripts - defaults to Neo-Tifinagh)
|
||
'zh' => '中文', # (Zhōng Wén) - Chinese
|
||
'zh-classical' => '文言', # Classical Chinese/Literary Chinese -- (see T10217)
|
||
'zh-cn' => "中文(中国大陆)\u{200E}", # Chinese (PRC)
|
||
'zh-hans' => "中文(简体)\u{200E}", # Mandarin Chinese (Simplified Chinese script) (cmn-hans)
|
||
'zh-hant' => "中文(繁體)\u{200E}", # Mandarin Chinese (Traditional Chinese script) (cmn-hant)
|
||
'zh-hk' => "中文(香港)\u{200E}", # Chinese (Hong Kong)
|
||
'zh-min-nan' => 'Bân-lâm-gú', # Min-nan -- (see T10217)
|
||
'zh-mo' => "中文(澳門)\u{200E}", # Chinese (Macau)
|
||
'zh-my' => "中文(马来西亚)\u{200E}", # Chinese (Malaysia)
|
||
'zh-sg' => "中文(新加坡)\u{200E}", # Chinese (Singapore)
|
||
'zh-tw' => "中文(台灣)\u{200E}", # Chinese (Taiwan)
|
||
'zh-yue' => '粵語', # Cantonese -- (see T10217)
|
||
'zu' => 'isiZulu' # Zulu
|
||
];
|
||
}
|