Module:Lang/data: Difference between revisions
Jump to navigation
Jump to search
-temp_source_get();
imported>Stuwisi m (1 revision imported) |
w>Trappist the monk (-temp_source_get();) |
||
Line 22: | Line 22: | ||
local function key_to_lower (module, src_type) | local function key_to_lower (module, src_type) | ||
local out = {}; | local out = {}; | ||
local | local source_t = (('var_sup' == src_type) and require (module)) or mw.loadData (module); -- fetch data from this module; require() avoids metatable trap for variant data | ||
if 'var_sup' == src_type then | if 'var_sup' == src_type then | ||
for k, v in pairs ( | for k, v in pairs (source_t) do | ||
out[k:lower()] = v; -- for variant and suppressed everything is needed | out[k:lower()] = v; -- for variant and suppressed everything is needed | ||
end | end | ||
elseif 'lang' == src_type and | elseif 'lang' == src_type and source_t.active then -- for ~/iana_languages (active) | ||
for k, v in pairs ( | for k, v in pairs (source_t.active) do | ||
out[k:lower()] = v[1]; -- ignore multiple names; take first name only | out[k:lower()] = v[1]; -- ignore multiple names; take first name only | ||
end | end | ||
elseif 'lang_dep' == src_type and | elseif 'lang_dep' == src_type and source_t.deprecated then -- for ~/iana_languages (deprecated) | ||
for k, v in pairs ( | for k, v in pairs (source_t.deprecated) do | ||
out[k:lower()] = v[1]; -- ignore multiple names; take first name only | out[k:lower()] = v[1]; -- ignore multiple names; take first name only | ||
end | end | ||
else -- here for all other sources | else -- here for all other sources | ||
for k, v in pairs ( | for k, v in pairs (source_t) do | ||
out[k:lower()] = v[1]; -- ignore multiple names; take first name only | out[k:lower()] = v[1]; -- ignore multiple names; take first name only | ||
end | end | ||
Line 47: | Line 48: | ||
local lang_name_table_t = { | local lang_name_table_t = { | ||
lang = key_to_lower ('Module: | lang = key_to_lower ('Module:Lang/data/iana languages', 'lang'), | ||
lang_dep = key_to_lower ('Module: | lang_dep = key_to_lower ('Module:Lang/data/iana languages', 'lang_dep'), | ||
script = key_to_lower ('Module: | script = key_to_lower ('Module:Lang/data/iana scripts'), -- script keys are capitalized; set to lower | ||
region = key_to_lower ('Module: | region = key_to_lower ('Module:Lang/data/iana regions'), -- region keys are uppercase; set to lower | ||
variant = key_to_lower ('Module: | variant = key_to_lower ('Module:Lang/data/iana variants', 'var_sup'), | ||
suppressed = key_to_lower ('Module: | suppressed = key_to_lower ('Module:Lang/data/iana suppressed scripts', 'var_sup'), -- script keys are capitalized; set to lower | ||
} | } | ||
Line 118: | Line 119: | ||
------------------------------< I S O _ 6 3 9 - 1 >------------------------------------------------------------ | ------------------------------< I S O _ 6 3 9 - 1 >------------------------------------------------------------ | ||
["ab"] = "Abkhaz", -- to match en.wiki article name | |||
["ca-valencia"] = "Valencian", | ["ca-valencia"] = "Valencian", | ||
["cu"] = "Church Slavonic", -- 2nd IANA name; | ["cu"] = "Church Slavonic", -- 2nd IANA name; | ||
Line 138: | Line 140: | ||
["pt-br"] = "Brazilian Portuguese", -- match MediaWiki | ["pt-br"] = "Brazilian Portuguese", -- match MediaWiki | ||
["tw-asante"] = "Asante Twi", | ["tw-asante"] = "Asante Twi", | ||
["ug"] = "Uyghur", -- 2nd IANA name; to match en.wiki article name | |||
-- these ISO 639-1 language-name overrides imported from Module:Language/data/wp_languages | -- these ISO 639-1 language-name overrides imported from Module:Language/data/wp_languages (since deleted) | ||
--<begin do-not-edit except to comment out>-- | --<begin do-not-edit except to comment out>-- | ||
["av"] = "Avar", -- Avaric | ["av"] = "Avar", -- Avaric | ||
Line 175: | Line 178: | ||
["alv"] = "Atlantic–Congo languages", -- to match en.wiki article title (endash) | ["alv"] = "Atlantic–Congo languages", -- to match en.wiki article title (endash) | ||
["arc"] = "Aramaic", | ["arc"] = "Imperial Aramaic (700-300 BCE)", -- Official Aramaic (700-300 BCE), Imperial Aramaic (700-300 BCE); to match en.wiki article title uses ISO639-2 'preferred' name | ||
["art"] = "constructed", -- to match en.wiki article; lowercase for category name | ["art"] = "constructed", -- to match en.wiki article; lowercase for category name | ||
["bhd"] = "Bhadarwahi", -- Bhadrawahi; to match en.wiki article title | ["bhd"] = "Bhadarwahi", -- Bhadrawahi; to match en.wiki article title | ||
Line 194: | Line 197: | ||
["ilo"] = "Ilocano", -- Iloko; to match en.wiki article title | ["ilo"] = "Ilocano", -- Iloko; to match en.wiki article title | ||
["jam"] = "Jamaican Patois", -- Jamaican Creole English | ["jam"] = "Jamaican Patois", -- Jamaican Creole English | ||
["lij-mc"] = "Monégasque", -- Ligurian as spoken in Monaco; also in <article_name> table | |||
["luo"] = "Dholuo", -- IANA (primary) /ISO 639-3: Luo (Kenya and Tanzania); IANA (secondary): Dholuo | ["luo"] = "Dholuo", -- IANA (primary) /ISO 639-3: Luo (Kenya and Tanzania); IANA (secondary): Dholuo | ||
["mhr"] = "Meadow Mari", -- Eastern Mari | ["mhr"] = "Meadow Mari", -- Eastern Mari | ||
Line 218: | Line 222: | ||
["rop"] = "Australian Kriol", -- Kriol; en.wiki article is a dab; point to correct en.wiki article | ["rop"] = "Australian Kriol", -- Kriol; en.wiki article is a dab; point to correct en.wiki article | ||
["sdo"] = "Bukar–Sadong", -- Bukar-Sadung Bidayuh; to match en.wiki article title | ["sdo"] = "Bukar–Sadong", -- Bukar-Sadung Bidayuh; to match en.wiki article title | ||
["smp"] = "Samaritan Hebrew", -- to match en.wiki article title | |||
["stq"] = "Saterland Frisian", -- Saterfriesisch | ["stq"] = "Saterland Frisian", -- Saterfriesisch | ||
["und"] = "undetermined", -- capitalization to match existing category | ["und"] = "undetermined", -- capitalization to match existing category | ||
Line 226: | Line 231: | ||
["zxx"] = "no linguistic content", -- capitalization | ["zxx"] = "no linguistic content", -- capitalization | ||
-- these ISO 639-2, -3 language-name overrides imported from Module:Language/data/wp_languages | -- these ISO 639-2, -3 language-name overrides imported from Module:Language/data/wp_languages (since deleted) | ||
--<begin do-not-edit except to comment out>-- | --<begin do-not-edit except to comment out>-- | ||
["ace"] = "Acehnese", -- Achinese | ["ace"] = "Acehnese", -- Achinese | ||
Line 258: | Line 263: | ||
["kpo"] = "Kposo", -- Ikposo | ["kpo"] = "Kposo", -- Ikposo | ||
["krj"] = "Kinaray-a", -- Kinaray-A | ["krj"] = "Kinaray-a", -- Kinaray-A | ||
-- ["ktz"] = "Juǀ'hoan", -- Juǀʼhoan | |||
["lez"] = "Lezgian", -- Lezghian | ["lez"] = "Lezgian", -- Lezghian | ||
["liv"] = "Livonian", -- Liv | ["liv"] = "Livonian", -- Liv | ||
Line 304: | Line 309: | ||
------------------------------< P R I V A T E _ U S E _ T A G S >---------------------------------------------- | ------------------------------< P R I V A T E _ U S E _ T A G S >---------------------------------------------- | ||
["akk-x-latbabyl"] = "Late Babylonian Akkadian", | |||
["akk-x-midassyr"] = "Middle Assyrian Akkadian", | |||
["akk-x-midbabyl"] = "Middle Babylonian Akkadian", | |||
["akk-x-neoassyr"] = "Neo-Assyrian Akkadian", | |||
["akk-x-neobabyl"] = "Neo-Babylonian Akkadian", | |||
["akk-x-old"] = "Old Akkadian", | |||
["akk-x-oldassyr"] = "Old Assyrian Akkadian", | |||
["akk-x-oldbabyl"] = "Old Babylonian Akkadian", | |||
["alg-x-proto"] = "Proto-Algonquian", -- alg in IANA is Algonquian languages | ["alg-x-proto"] = "Proto-Algonquian", -- alg in IANA is Algonquian languages | ||
["cel-x- | ["ca-x-old"] = "Old Catalan", | ||
["cel-x-combrit"] = "Common Brittonic", -- cel in IANA is Celtic languages | |||
["cel-x-proto"] = "Proto-Celtic", | |||
["egy-x-demotic"] = "Demotic Egyptian", | |||
["egy-x-late"] = "Late Egyptian", | |||
["egy-x-middle"] = "Middle Egyptian", | |||
["egy-x-old"] = "Old Egyptian", | |||
["gem-x-proto"] = "Proto-Germanic", -- gem in IANA is Germanic languages | ["gem-x-proto"] = "Proto-Germanic", -- gem in IANA is Germanic languages | ||
["gmw-x-ecg"] = "East Central German", | ["gmw-x-ecg"] = "East Central German", | ||
Line 321: | Line 340: | ||
["grk-x-proto"] = "Proto-Greek", -- grk in IANA is Greek languages | ["grk-x-proto"] = "Proto-Greek", -- grk in IANA is Greek languages | ||
["iir-x-proto"] = "Proto-Indo-Iranian", -- iir in IANA is Indo-Iranian Languages | ["iir-x-proto"] = "Proto-Indo-Iranian", -- iir in IANA is Indo-Iranian Languages | ||
["inc-x-mitanni"] = "Mitanni-Aryan", -- inc in IANA is Indic languages | |||
["inc-x-proto"] = "Proto-Indo-Aryan", | |||
["ine-x-anatolia"] = "Anatolian languages", | |||
["ine-x-proto"] = "Proto-Indo-European", | ["ine-x-proto"] = "Proto-Indo-European", | ||
["ira-x-proto"] = "Proto-Iranian", -- ira in IANA is Iranian languages | ["ira-x-proto"] = "Proto-Iranian", -- ira in IANA is Iranian languages | ||
Line 326: | Line 348: | ||
["ksh-x-colog"] = "Colognian", -- en.wiki article is Colognian; ksh (Kölsch) redirects there | ["ksh-x-colog"] = "Colognian", -- en.wiki article is Colognian; ksh (Kölsch) redirects there | ||
["la-x-medieval"] = "Medieval Latin", | ["la-x-medieval"] = "Medieval Latin", | ||
["la-x-new"] = "New Latin", | |||
["lmo-x-milanese"] = "Milanese", -- lmo in IANA is Lombard; Milanese is a dialect | |||
["mis-x-ripuar"] = "Ripuarian", -- replaces improper use of ksh in wp_languages | ["mis-x-ripuar"] = "Ripuarian", -- replaces improper use of ksh in wp_languages | ||
["prg-x-old"] = "Old Prussian", | |||
["sem-x-ammonite"] = "Ammonite", | |||
["sem-x-aramaic"] = "Aramaic", | |||
["sem-x-canaan"] = "Canaanite languages", | |||
["sem-x-dumaitic"] = "Dumaitic", | |||
["sem-x-egurage"] = "Eastern Gurage", | |||
["sem-x-hatran"] = "Hatran Aramaic", | |||
["sem-x-oldsoara"] = "Old South Arabian", | |||
["sem-x-palmyren"] = "Palmyrene Aramaic", | |||
["sem-x-proto"] = "Proto-Semitic", | ["sem-x-proto"] = "Proto-Semitic", | ||
["sem-x-taymanit"] = "Taymanitic", | |||
["sla-x-proto"] = "Proto-Slavic", -- sla in IANA is Slavic languages | ["sla-x-proto"] = "Proto-Slavic", -- sla in IANA is Slavic languages | ||
["yuf-x-hav"] = "Havasupai", -- IANA name for these three is Havasupai-Walapai-Yavapai | ["yuf-x-hav"] = "Havasupai", -- IANA name for these three is Havasupai-Walapai-Yavapai | ||
["yuf-x-wal"] = "Walapai", | ["yuf-x-wal"] = "Walapai", | ||
["yuf-x-yav"] = "Yavapai", | ["yuf-x-yav"] = "Yavapai", | ||
["xsc-x-pontic"] = "Pontic Scythian", -- xsc in IANA is Scythian | |||
["xsc-x-saka"] = "Saka", | |||
["xsc-x-sarmat"] = "Sarmatian", | |||
} | } | ||
Line 344: | Line 381: | ||
local article_name = { | local article_name = { | ||
['kue'] = "Kuman language (New Guinea)", -- Kuman (Papua New Guinea); to avoid Kuman dab page | |||
["lij"] = "Ligurian (Romance language)", -- Ligurian; see Template_talk:Lang#Ligurian_dab | ["lij"] = "Ligurian (Romance language)", -- Ligurian; see Template_talk:Lang#Ligurian_dab | ||
["lij-mc"] = "Monégasque language", -- Ligurian as spoken in Monaco | |||
['mbo'] = "Mbo language (Cameroon)", -- Mbo (Cameroon) | |||
['mnh'] = "Mono language (Congo)", -- Mono (Democratic Republic of Congo); see Template_talk:Lang#Mono_languages | ['mnh'] = "Mono language (Congo)", -- Mono (Democratic Republic of Congo); see Template_talk:Lang#Mono_languages | ||
['mnr'] = "Mono language (California)", -- Mono (USA) | ['mnr'] = "Mono language (California)", -- Mono (USA) | ||
['mru'] = "Mono language (Cameroon)", -- Mono (Cameroon) | ['mru'] = "Mono language (Cameroon)", -- Mono (Cameroon) | ||
['qwm'] = "Kuman (Russia)", -- Kuman (Russia); to avoid Kuman dab page | |||
["snq"] = "Sangu language (Gabon)", -- Sangu (Gabon) | |||
["toi"] = "Tonga language (Zambia and Zimbabwe)", -- Tonga (Zambia and Zimbabwe); to avoid Tonga language dab page | |||
["vwa"] = "Awa language (China)", -- Awa (China); to avoid Awa dab page | |||
["xlg"] = "Ligurian (ancient language)", -- see Template_talk:Lang#Ligurian_dab | ["xlg"] = "Ligurian (ancient language)", -- see Template_talk:Lang#Ligurian_dab | ||
["zmw"] = "Mbo language (Congo)", -- Mbo (Democratic Republic of Congo) | |||
} | } | ||
Line 468: | Line 513: | ||
['zh'] = 'ISO 7098 Chinese', | ['zh'] = 'ISO 7098 Chinese', | ||
['chi'] = 'ISO 7098 Chinese', | ['chi'] = 'ISO 7098 Chinese', | ||
[' | ['cmn'] = 'ISO 7098 Chinese', | ||
['zho'] = 'ISO 7098 Chinese', | ['zho'] = 'ISO 7098 Chinese', | ||
-- ['han'] = 'ISO 7098 Chinese', -- unicode alias of Hani? doesn't belong here? should be Hani? | -- ['han'] = 'ISO 7098 Chinese', -- unicode alias of Hani? doesn't belong here? should be Hani? | ||
Line 495: | Line 540: | ||
['gu'] = 'ISO 15919 Indic', | ['gu'] = 'ISO 15919 Indic', | ||
['hi'] = 'ISO 15919 Indic', | ['hi'] = 'ISO 15919 Indic', | ||
['hno'] = 'ISO 15919 Indic', | |||
['inc'] = 'ISO 15919 Indic', | ['inc'] = 'ISO 15919 Indic', | ||
['kn'] = 'ISO 15919 Indic', | ['kn'] = 'ISO 15919 Indic', | ||
Line 507: | Line 553: | ||
['or'] = 'ISO 15919 Indic', | ['or'] = 'ISO 15919 Indic', | ||
['pa'] = 'ISO 15919 Indic', | ['pa'] = 'ISO 15919 Indic', | ||
['pnb'] = 'ISO 15919 Indic', | |||
['raj'] = 'ISO 15919 Indic', | ['raj'] = 'ISO 15919 Indic', | ||
['sa'] = 'ISO 15919 Indic', | ['sa'] = 'ISO 15919 Indic', | ||
Line 512: | Line 559: | ||
['sd'] = 'ISO 15919 Indic', | ['sd'] = 'ISO 15919 Indic', | ||
['si'] = 'ISO 15919 Indic', | ['si'] = 'ISO 15919 Indic', | ||
['skr'] = 'ISO 15919 Indic', | |||
['ta'] = 'ISO 15919 Indic', | ['ta'] = 'ISO 15919 Indic', | ||
['tcy'] = 'ISO 15919 Indic', | ['tcy'] = 'ISO 15919 Indic', | ||
Line 588: | Line 636: | ||
['default'] = 'Hans Wehr transliteration', | ['default'] = 'Hans Wehr transliteration', | ||
}, | }, | ||
}; | ['yaleko'] = { | ||
['default'] = 'Yale romanization of Korean', | |||
} | |||
}; | |||