Lang/Data

Lang/Data モジュールの解説
--[[--------------------------< L A N G _ N A M E _ T A B L E >------------------------------------------------  primary table of tables that decode: lang -> language tags and names script -> ISO 15924 script tags region -> ISO 3166 region tags variant -> iana registered variant tags suppressed -> map of scripts tags and their associated language tags  all of these data come from separate modules that are derived from the IANA language-subtag-registry file  key_to_lower() avoids the metatable trap and sets all keys in the subtables to lowercase.  Many language codes have multiple associated names; Module:lang is only concerned with the first name so key_to_lower() only fetches the first name.  TODO: instead of returning: ["key"] = {"name"} where each table has only one name, return ["key"] = "name" requires changes in Module:Lang.  ]]  local function key_to_lower (module, src_type) local out = {}; local source = (('variants' == src_type) and require (module)) or mw.loadData (module);-- fetch data from this module; require() avoids metatable trap for variant data if 'variants' == src_type then for k, v in pairs (source) do out[k:lower()] = v;-- for variant, everything is needed end  elseif 'lang' == src_type and source.active then-- for ~/iana_languages (active) for k, v in pairs (source.active) do out[k:lower()] = {v[1]};-- ignore multiple names; take first name only end  elseif 'lang_dep' == src_type and source.deprecated then-- for ~/iana_languages (deprecated) for k, v in pairs (source.deprecated) do out[k:lower()] = {v[1]};-- ignore multiple names; take first name only end  else-- here for all other sources for k, v in pairs (source) do out[k:lower()] = {v[1]};-- ignore multiple names; take first name only end end return out; end  local lang_name_table = { lang = key_to_lower ('Module:Language/data/iana languages', 'lang'), lang_dep = key_to_lower ('Module:Language/data/iana languages', 'lang_dep'), script = key_to_lower ('Module:Language/data/iana scripts'),-- script keys are capitalized; set to lower region = key_to_lower ('Module:Language/data/iana regions'),-- region keys are uppercase; set to lower variant = key_to_lower ('Module:Language/data/iana variants', 'variants'), suppressed = key_to_lower ('Module:Language/data/iana suppressed scripts'),-- script keys are capitalized; set to lower }   --[[--------------------------< O V E R R I D E >--------------------------------------------------------------  Language codes and names in this table override the BCP47 names in lang_name_table.  indexes in this table shall always be lower case  ]]  local override = { ------------------------------< I S O   6 3 9 - 1 >------------------------------------------------------------  ["ca-valencia"] = {"バレンシア語"}, ["cu"] = {"教会スラヴ語"},-- 2nd IANA name; ["de-at"] = {"オーストリアドイツ語"},-- these code-region and code-variant tags to match en.wiki article names ["de-ch"] = {"スイスドイツ語"}, ["en-au"] = {"オーストラリア英語"}, ["en-ca"] = {"カナダ英語"}, ["en-emodeng"] = {"初期近代英語"}, ["en-gb"] = {"イギリス英語"}, ["en-ie"] = {"アイルランド英語"}, ["en-in"] = {"インド英語"}, ["en-nz"] = {"ニュージーランド英語"}, ["en-us"] = {"アメリカ英語"}, ["en-za"] = {"南アフリカ英語"}, ["fy"] = {"西フリジア語"},-- Western Frisian ["mo"] = {"モルドバ語"},-- Moldavian (deprecated code); to match en.wiki article title ["oc-provenc"] = {"オック語"}, ["ps"] = {"パシュトー語"},-- Pushto ["tw-asante"] = {"アサンテ方言"},  -- these ISO 639-1 language-name overrides imported from Module:Language/data/wp_languages ---- ["av"] = {"アヴァル語"},-- Avaric ["bo"] = {"チベット語"},-- Tibetan ["el"] = {"ギリシア語"},-- Modern Greek --["en-SA"] = {"South African English"},-- English; no; SA is not South Africa it Saudi Arabia;  ZA is South Africa ["ff"] = {"フラニ語"},-- Fulah ["ht"] = {"ハイチ語"},-- Haitian ["hz"] = {"ヘレロ語"},-- Herero ["ii"] = {"四川彝語"},-- Sichuan Yi ["ki"] = {"キクユ語"},-- Kikuyu ["kl"] = {"グリーンランド語"},-- Kalaallisut ["ky"] = {"キルギス語"},-- Kirghiz ["lg"] = {"ガンダ語"},-- Ganda ["li"] = {"リンブルフ語"},-- Limburgan ["mi"] = {"マオリ語"},-- Maori ["na"] = {"ナウル語"},-- Nauru ["nb"] = {"ブークモール"},-- Norwegian Bokmål ["nd"] = {"北ンデベレ語"},-- North Ndebele ["nn"] = {"ニーノシュク"},-- Norwegian Nynorsk ["nr"] = {"南ンデベレ語"},-- South Ndebele ["ny"] = {"チェワ語"},-- Nyanja ["oj"] = {"オジブワ語"},-- Ojibwa ["or"] = {"オリヤー語"},-- Oriya ["pa"] = {"パンジャーブ語"},-- Panjabi ["rn"] = {"ルンディ語"},-- Rundi ["sl"] = {"スロベニア語"},-- Slovenian ["ss"] = {"スワジ語"},-- Swati ["st"] = {"ソト語"},-- Southern Sotho ["to"] = {"トンガ語"},-- Tonga ----   ------------------------------< I S O   6 3 9 - 2,   - 3,   - 5 >----------------------------------------------  ["arc"] = {"Aramaic"},-- Official Aramaic (700-300 BCE), Imperial Aramaic (700-300 BCE); ["art"] = {"constructed"},-- to match en.wiki article; lowercase for category name ["bhd"] = {"Bhadarwahi"},-- Bhadrawahi; to match en.wiki article title ["bla"] = {"Blackfoot"},-- Siksika; to match en.wiki article title ["bua"] = {"Buryat"},-- Buriat; this is a macro language; these four use wp preferred transliteration; ["bxm"] = {"Mongolian Buryat"},-- Mongolia Buriat; these three all redirect to Buryat ["bxr"] = {"Russian Buryat"},-- Russia Buriat; ["bxu"] = {"Chinese Buryat"},-- China Buriat; ["byr"] = {"Yipma"},-- Baruya, Yipma ["egy"] = {"Ancient Egyptian"},-- Egyptian (Ancient); distinguish from contemporary arz: Egyptian Arabic  ["frr"] = {"North Frisian"},-- Northern Frisian ["frs"] = {"East Frisian Low Saxon"},-- Eastern Frisian ["ilo"] = {"Ilocano"},-- Iloko; to match en.wiki article title ["jam"] = {"Jamaican Patois"},-- Jamaican Creole English ["mhr"] = {"Meadow Mari"},-- Eastern Mari ["mid"] = {"Modern Mandaic"},-- Mandaic ["mla"] = {"Tamambo"},-- Malo ['mte'] = {"Mono-Alu"},-- Mono (Solomon Islands) ["nan-tw"] = {"Taiwanese Hokkien"},-- make room for IANA / 639-3 nan Min Nan Chinese; match en.wiki article title ["nrf"] = {"Norman"},-- not quite a collective - IANA name: Jèrriais; categorizes to Norman-language text ["nzi"] = {"Nzema"},-- Nzima; to match en.wiki article title ["orv"] = {"Old East Slavic"},-- Old Russian ["pfl"] = {"Palatine German"},-- Pfaelzisch; to match en.wiki article ["pms"] = {"Piedmontese"},-- Piemontese; to match en.wiki article title ["pnb"] = {"Punjabi (Western)"},-- Western Panjabi; dab added to override import from ~/wp languages and distinguish pnb from pa in reverse look up tag_from_name() ["stq"] = {"Saterland Frisian"},-- Saterfriesisch ["und"] = {"undetermined"},-- capitalization to match existing category ["wrg"] = {"Warrongo"},-- Warungu ["xal-ru"] = {"Kalmyk"},-- to match en.wiki article title ["xgf"] = {"Tongva"},-- ISO 639-3 is Gabrielino-Fernandeño  -- these ISO 639-2, -3 language-name overrides imported from Module:Language/data/wp_languages ---- ["ace"] = {"Acehnese"},-- Achinese ["aec"] = {"Sa'idi Arabic"},-- Saidi Arabic ["akl"] = {"Aklan"},-- Aklanon ["alt"] = {"Altay"},-- Southern Altai ["apm"] = {"Mescalero-Chiricahua"},-- Mescalero-Chiricahua Apache ["bal"] = {"Balochi"},-- Baluchi ["bcl"] = {"Central Bicolano"},-- Central Bikol ["bin"] = {"Edo"},-- Bini ["bpy"] = {"Bishnupriya Manipuri"},-- Bishnupriya ["chg"] = {"Chagatay"},-- Chagatai ["ckb"] = {"Sorani Kurdish"},-- Central Kurdish ["cnu"] = {"Shenwa"},-- Chenoua ["coc"] = {"Cocopah"},-- Cocopa ["diq"] = {"Zazaki"},-- Dimli ["fit"] = {"Meänkieli"},-- Tornedalen Finnish ["fkv"] = {"Kven"},-- Kven Finnish ["frk"] = {"Old Frankish"},-- Frankish ["gez"] = {"Ge'ez"},-- Geez ["gju"] = {"Gujari"},-- Gujari ["gsw"] = {"Alemannic German"},-- Swiss German ["gul"] = {"Gullah"},-- Sea Island Creole English ["hak"] = {"Hakka"},-- Hakka Chinese ["hbo"] = {"Biblical Hebrew"},-- Ancient Hebrew ["hnd"] = {"Hindko"},-- Southern Hindko --["ikt"] = {"Inuvialuk"},-- Inuinnaqtun ["kaa"] = {"Karakalpak"},-- Kara-Kalpak ["khb"] = {"Tai Lü"},-- Lü ["kmr"] = {"Kurmanji Kurdish"},-- Northern Kurdish ["kpo"] = {"Kposo"},-- Ikposo ["krj"] = {"Kinaray-a"},-- Kinaray-A ["ktz"] = {"Juǀ'hoan"},-- Juǀʼhoan ["lez"] = {"Lezgian"},-- Lezghian ["liv"] = {"Livonian"},-- Liv ["lng"] = {"Lombardic"},-- Langobardic ["mia"] = {"Miami-Illinois"},-- Miami ["miq"] = {"Miskito"},-- Mískito ["mix"] = {"Mixtec"},-- Mixtepec Mixtec ["mni"] = {"Meitei"},-- Manipuri ["mrj"] = {"Hill Mari"},-- Western Mari ["mww"] = {"White Hmong"},-- Hmong Daw ["nds-nl"] = {"Dutch Low Saxon"},-- Low German ["new"] = {"Nepal Bhasa"},-- Newari ["nso"] = {"Northern Sotho"},-- Pedi ["nwc"] = {"Classical Nepal Bhasa"},-- Classical Newari ["ood"] = {"O'odham"},-- Tohono O'odham ["otk"] = {"Old Turkic"},-- Old Turkish ["pal"] = {"Middle Persian"},-- Pahlavi ["pam"] = {"Kapampangan"},-- Pampanga ["phr"] = {"Potwari"},-- Pahari-Potwari ["pka"] = {"Jain Prakrit"},-- Ardhamāgadhī Prākrit --["pnb"] = {"Punjabi"},-- Western Panjabi ["psu"] = {"Shauraseni"},-- Sauraseni Prākrit ["rap"] = {"Rapa Nui"},-- Rapanui ["rar"] = {"Cook Islands Māori"},-- Rarotongan ["rmu"] = {"Scandoromani"},-- Tavringer Romani ["rom"] = {"Romani"},-- Romany ["rup"] = {"Aromanian"},-- Macedo-Romanian ["ryu"] = {"Okinawan"},-- Central Okinawan ["sdc"] = {"Sassarese"},-- Sassarese Sardinian ["sdn"] = {"Gallurese"},-- Gallurese Sardinian ["shp"] = {"Shipibo"},-- Shipibo-Conibo ["src"] = {"Logudorese"},-- Logudorese Sardinian ["sro"] = {"Campidanese"},-- Campidanese Sardinian ["tkl"] = {"Tokelauan"},-- Tokelau ["tvl"] = {"Tuvaluan"},-- Tuvalu ["tyv"] = {"Tuvan"},-- Tuvinian ["vls"] = {"West Flemish"},-- Vlaams ["wep"] = {"Westphalian"},-- Westphalien ["xal"] = {"Oirat"},-- Kalmyk ["xcl"] = {"Old Armenian"},-- Classical Armenian ["yua"] = {"Yucatec Maya"},-- Yucateco ----   ------------------------------< P R I V A T E - U S E   T A G S >----------------------------------------------  ["cel-x-proto"] = {"Proto-Celtic"},-- cel in IANA is Celtic languages ["gem-x-proto"] = {"Proto-Germanic"},-- gem in IANA is Germanic languages ["grc-x-aeolic"] = {"Aeolic Greek"},-- these grc-x-... codes are preferred alternates to the non-standard catchall code grc-gre ["grc-x-attic"] = {"Attic Greek"}, ["grc-x-biblical"] = {"Biblical Greek"}, ["grc-x-byzant"] = {"Byzantine Greek"}, ["grc-x-classic"] = {"Classical Greek"}, ["grc-x-doric"] = {"Doric Greek"}, ["grc-x-hellen"] = {"Hellenistic Greek"}, ["grc-x-ionic"] = {"Ionic Greek"}, ["grc-x-koine"] = {"コイネー・ギリシア語"}, ["grc-x-medieval"] = {"Medieval Greek"}, ["grc-x-patris"] = {"Patristic Greek"}, ["grk-x-proto"] = {"Proto-Greek"},-- grk in IANA is Greek languages ["iir-x-proto"] = {"Proto-Indo-Iranian"},-- iir in IANA is Indo-Iranian Languages ["ira-x-proto"] = {"Proto-Iranian"},-- ira in IANA is Iranian languages ["itc-x-proto"] = {"Proto-Italic"},-- itc in IANA is Italic languages ["ksh-x-colog"] = {"Colognian"},-- en.wiki article is Colognian; ksh (Kölsch) redirects there ["mis-x-ripuar"] = {"Ripuarian"},-- replaces improper use of ksh in wp_languages ["sla-x-proto"] = {"Proto-Slavic"},-- sla in IANA is Slavic languages ["yuf-x-hav"] = {"Havasupai"},-- IANA name for these three is Havasupai-Walapai-Yavapai ["yuf-x-wal"] = {"Walapai"}, ["yuf-x-yav"] = {"Yavapai"}, }   --[[--------------------------< A R T I C L E _ L I N K >------------------------------------------------------  for those rare occasions when article titles don't fit with the normal '-language', this table maps language code to article title.  Use of this table should be avoided and the use of redirects preferred as that is the long-standing method of handling article names that don't fit with the normal pattern  ]]  local article_name = { ["lij"] = {"Ligurian (Romance language)"},-- Ligurian; see Template_talk:Lang#Ligurian_dab ['mnh'] = {"Mono language (Congo)"},-- Mono (Democratic Republic of Congo); see Template_talk:Lang#Mono_languages ['mnr'] = {"Mono language (California)"},-- Mono (USA) ['mru'] = {"Mono language (Cameroon)"},-- Mono (Cameroon) ["xlg"] = {"Ligurian (ancient language)"},-- see Template_talk:Lang#Ligurian_dab }   --[=[-------------------------< R T L _ S C R I P T S >--------------------------------------------------------  ISO 15924 scripts that are written right-to-left.  Data in this table taken from [[ISO 15924#List of codes]]  last update to this list: 2017-12-24  ]=]  local rtl_scripts = { 'adlm', 'arab', 'aran', 'armi', 'avst', 'cprt', 'egyd', 'egyh', 'hatr', 'hebr', 'hung', 'inds', 'khar', 'lydi', 'mand', 'mani', 'mend', 'merc', 'mero', 'narb', 'nbat', 'nkoo', 'orkh', 'palm', 'phli', 'phlp', 'phlv', 'phnx', 'prti', 'rohg', 'samr', 'sarb', 'sogd', 'sogo', 'syrc', 'syre', 'syrj', 'syrn', 'thaa', 'wole', };   --[[--------------------------< T R A N S L I T   T I T L E S >------------------------------------------------  This is a table of tables of transliteration standards and the language codes or language scripts that apply to those standards.  This table is used to create the tool-tip text associated with the transliterated text displayed by some of the {{lang-??}} templates.  These tables are more-or-less copied directly from {{transl}}.  The standard 'NO_STD' is a construct to allow for the cases when no |std= parameter value is provided.  ]]  local translit_title_table = { ['ahl'] = { ['default'] = 'Academy of the Hebrew Language transliteration', },  ['ala'] = { ['default'] = 'American Library Association – Library of Congress transliteration', },  ['ala-lc'] = { ['default'] = 'American Library Association – Library of Congress transliteration', },  ['batr'] = { ['default'] = 'Bikdash Arabic Transliteration Rules', },  ['bgn/pcgn'] = { ['default'] = 'Board on Geographic Names / Permanent Committee on Geographical Names transliteration', },  ['din'] = { ['ar'] = 'DIN 31635 Arabic', ['fa'] = 'DIN 31635 Arabic', ['ku'] = 'DIN 31635 Arabic', ['ps'] = 'DIN 31635 Arabic', ['tg'] = 'DIN 31635 Arabic', ['ug'] = 'DIN 31635 Arabic', ['ur'] = 'DIN 31635 Arabic', ['arab'] = 'DIN 31635 Arabic',  ['default'] = 'DIN transliteration', },  ['eae'] = { ['default'] = 'Encyclopaedia Aethiopica transliteration', },  ['hepburn'] = { ['default'] = 'Hepburn transliteration', },  ['hunterian'] = { ['default'] = 'Hunterian transliteration', },  ['iast'] = { ['default'] = 'International Alphabet of Sanskrit transliteration', },  ['iso'] = {-- when a transliteration standard is supplied ['ab'] = 'ISO 9 Cyrillic', ['ba'] = 'ISO 9 Cyrillic', ['be'] = 'ISO 9 Cyrillic', ['bg'] = 'ISO 9 Cyrillic', ['kk'] = 'ISO 9 Cyrillic', ['ky'] = 'ISO 9 Cyrillic', ['mn'] = 'ISO 9 Cyrillic', ['ru'] = 'ISO 9 Cyrillic', ['tg'] = 'ISO 9 Cyrillic', ['uk'] = 'ISO 9 Cyrillic', ['bua'] = 'ISO 9 Cyrillic', ['sah'] = 'ISO 9 Cyrillic', ['tut'] = 'ISO 9 Cyrillic', ['xal'] = 'ISO 9 Cyrillic', ['cyrl'] = 'ISO 9 Cyrillic',  ['ar'] = 'ISO 233 Arabic', ['ku'] = 'ISO 233 Arabic', ['ps'] = 'ISO 233 Arabic', ['ug'] = 'ISO 233 Arabic', ['ur'] = 'ISO 233 Arabic', ['arab'] = 'ISO 233 Arabic',  ['he'] = 'ISO 259 Hebrew', ['yi'] = 'ISO 259 Hebrew', ['hebr'] = 'ISO 259 Hebrew',  ['el'] = 'ISO 843 Greek', ['grc'] = 'ISO 843 Greek',  ['ja'] = 'ISO 3602 Japanese', ['hira'] = 'ISO 3602 Japanese', ['hrkt'] = 'ISO 3602 Japanese', ['jpan'] = 'ISO 3602 Japanese', ['kana'] = 'ISO 3602 Japanese',  ['zh'] = 'ISO 7098 Chinese', ['chi'] = 'ISO 7098 Chinese', ['pny'] = 'ISO 7098 Chinese', ['zho'] = 'ISO 7098 Chinese', --['han'] = 'ISO 7098 Chinese',-- unicode alias of Hani? doesn't belong here? should be Hani? ['hans'] = 'ISO 7098 Chinese', ['hant'] = 'ISO 7098 Chinese',  ['ka'] = 'ISO 9984 Georgian', ['kat'] = 'ISO 9984 Georgian',  ['arm'] = 'ISO 9985 Armenian', ['hy'] = 'ISO 9985 Armenian',  ['th'] = 'ISO 11940 Thai', ['tha'] = 'ISO 11940 Thai',  ['ko'] = 'ISO 11941 Korean', ['kor'] = 'ISO 11941 Korean',  ['awa'] = 'ISO 15919 Indic', ['bho'] = 'ISO 15919 Indic', ['bn'] = 'ISO 15919 Indic', ['bra'] = 'ISO 15919 Indic', ['doi'] = 'ISO 15919 Indic', ['dra'] = 'ISO 15919 Indic', ['gon'] = 'ISO 15919 Indic', ['gu'] = 'ISO 15919 Indic', ['hi'] = 'ISO 15919 Indic', ['inc'] = 'ISO 15919 Indic', ['kn'] = 'ISO 15919 Indic', ['kok'] = 'ISO 15919 Indic', ['ks'] = 'ISO 15919 Indic', ['mag'] = 'ISO 15919 Indic', ['mai'] = 'ISO 15919 Indic', ['ml'] = 'ISO 15919 Indic', ['mr'] = 'ISO 15919 Indic', ['ne'] = 'ISO 15919 Indic', ['new'] = 'ISO 15919 Indic', ['or'] = 'ISO 15919 Indic', ['pa'] = 'ISO 15919 Indic', ['raj'] = 'ISO 15919 Indic', ['sa'] = 'ISO 15919 Indic', ['sat'] = 'ISO 15919 Indic', ['sd'] = 'ISO 15919 Indic', ['si'] = 'ISO 15919 Indic', ['ta'] = 'ISO 15919 Indic', ['tcy'] = 'ISO 15919 Indic', ['te'] = 'ISO 15919 Indic', ['beng'] = 'ISO 15919 Indic', ['brah'] = 'ISO 15919 Indic', ['deva'] = 'ISO 15919 Indic', ['gujr'] = 'ISO 15919 Indic', ['guru'] = 'ISO 15919 Indic', ['knda'] = 'ISO 15919 Indic', ['mlym'] = 'ISO 15919 Indic', ['orya'] = 'ISO 15919 Indic', ['sinh'] = 'ISO 15919 Indic', ['taml'] = 'ISO 15919 Indic', ['telu'] = 'ISO 15919 Indic',  ['default'] = 'ISO transliteration', },  ['jyutping'] = { ['default'] = 'Jyutping transliteration', },  ['mr'] = { ['default'] = 'McCune–Reischauer transliteration', },  ['nihon-shiki'] = { ['default'] = 'Nihon-shiki transliteration', },  ['no_std'] = {-- when no transliteration standard is supplied ['akk'] = 'Semitic transliteration', ['sem'] = 'Semitic transliteration', ['phnx'] = 'Semitic transliteration', ['xsux'] = 'Cuneiform transliteration', },  ['pinyin'] = { ['default'] = 'Pinyin transliteration', },  ['rr'] = { ['default'] = 'Revised Romanization of Korean transliteration', },  ['rtgs'] = { ['default'] = 'Royal Thai General System of Transcription', },  ['satts'] = { ['default'] = 'Standard Arabic Technical Transliteration System transliteration', },  ['ungegn'] = { ['default'] = 'United Nations Group of Experts on Geographical Names transliteration', },  ['wadegile'] = { ['default'] = 'Wade–Giles transliteration', },  ['wehr'] = { ['default'] = 'Hans Wehr transliteration', }, };   return { article_name = article_name, lang_name_table = lang_name_table, override = override, rtl_scripts = rtl_scripts, translit_title_table = translit_title_table, }; 

🔥 Trending searches on Wiki 日本語:

地下鉄サリン事件池田伸子広谷鏡子萩尾匡也東京タワー (小説)FRUITS ZIPPER宮島未奈早川雪洲上沼真平百田尚樹怪異と乙女と神隠し和久井健YOU (タレント)安藤サクラ深津絵里フロリアン・ヴィルツゲゲゲの女房塩﨑実央小松菜奈マフィア千葉科学大学松居一代葛西美空WEST.駿河太郎ジャスティンミラノ立川談志三吉彩花宇多田ヒカル内田雄馬工藤夕貴東京エンカウント高梨沙羅ジャッキー・ロビンソン涙の女王羽瀬川なぎ麻生太郎藤原実資くるり〜誰が私と恋をした?〜蜻蛉日記上杉憲寛イチロー山崎亜美高岡法科大学ユダヤ人伏見寅威ソンドラ・ロック是永千恵武井壮陰裂土谷正実塩谷立鳥居みゆき影木栄貴坂本龍馬松下洸平あぶない刑事の登場人物亀梨和也石井久子島根県第1区全開ガール山﨑福也石井紘基井口裕香木村拓哉浜辺美波青木さやか福士蒼汰LINE (アプリケーション)釘宮理恵メジャーリーグベースボール上田麗奈4月17日トルクメニスタンすずめの戸締まり明石花火大会歩道橋事故蒲島郁夫🡆 More