-- Modul:Language/data
-- Shorthand used throughout this file to turn code points into strings.
local U = mw.ustring.char
-- Combining diacritics, taken from the Combining Diacritical Marks block.
-- Grouped several to a statement; each name maps to exactly one code point.
local grave, acute, circumflex, tilde = U(0x300), U(0x301), U(0x302), U(0x303)
local macron, breve, dot, diaeresis = U(0x304), U(0x306), U(0x307), U(0x308)
local double_acute, caron, double_grave = U(0x30B), U(0x30C), U(0x30F)
local invbreve, dot_below, undertie = U(0x311), U(0x323), U(0x35C)
--[[
This is a table of Wiktionary language codes together with their data.
Name is the "canonical name" used on Wiktionary.
Article is the Wikipedia article.
Script is the ISO 15924 code.

The returned table has two fields:
  languages - per-code settings (name, article, direction, type,
              replacements, Wikipedia_code, Wikipedia_name); every field
              is optional.
  redirects - maps a Wikipedia language code to the equivalent code in
              `languages`.
]]

-- Builds the replacement rules shared by all Arabic varieties below.
-- A new table is created on every call so that each language entry owns an
-- independent copy, exactly as when the literal was repeated per entry.
local function arabic_replacements()
	return {
		-- alif with wasla is replaced with plain alif;
		[U(0x0671)] = U(0x0627),
		-- tatwil, fathatan, dammatan, kasratan,
		-- fathah, dammah, kasrah,
		-- shaddah, sukun, and superscript (dagger) alif are removed.
		["["..U(0x0640)..U(0x064B)..U(0x064C)..U(0x064D)
		..U(0x064E)..U(0x064F)..U(0x0650)
		..U(0x0651)..U(0x0652)..U(0x0670).."]"] = "",
	}
end

local data = {
	["languages"] = {
		["ab"] = {
			["name"] = "Abkhaz",
		},
		["ang"] = {
			["name"] = "Inggeris Kuno",
			-- Plain string, like every other "article" value in this table
			-- (it was previously wrapped in a one-element table).
			["article"] = "Inggeris Kuno",
			-- Remove macrons, acutes, and overdots
			["replacements"] = {
				decompose = true,
				from = { "[" .. macron .. acute .. dot .. "]" },
			},
		},
		["ar"] = {
			["name"] = "Arab",
			["article"] = "bahasa Arab",
			["direction"] = "rtl", -- Should live in the script data module.
			["replacements"] = arabic_replacements(),
		},
		["ara"] = {
			["name"] = "Arab",
			["article"] = "bahasa Arab",
			["direction"] = "rtl", -- Should live in the script data module.
			["replacements"] = arabic_replacements(),
		},
		["arb"] = {
			["name"] = "Arab Baku Moden",
			["article"] = "bahasa Arab Baku Moden",
			["direction"] = "rtl", -- Should live in the script data module.
			["replacements"] = arabic_replacements(),
		},
		["apc"] = {
			["name"] = "Arab Syam Utara",
			["article"] = "bahasa Arab Syam Utara",
			["direction"] = "rtl", -- Should live in the script data module.
			["replacements"] = arabic_replacements(),
		},
		["ajp"] = {
			["name"] = "Arab Syam Selatan",
			["article"] = "bahasa Arab Syam Selatan",
			["direction"] = "rtl", -- Should live in the script data module.
			["replacements"] = arabic_replacements(),
		},
		["arz"] = {
			["name"] = "Arab Mesir",
			["article"] = "bahasa Arab Mesir",
			["direction"] = "rtl", -- Should live in the script data module.
			["replacements"] = arabic_replacements(),
		},
		["av"] = {
			["name"] = "Avar"
		},
		["be"] = {
			["article"] = "bahasa Belarusia",
			["replacements"] = { [acute] = "", },
		},
		["bn"] = {
			["name"] = "Benggali",
			["article"] = "bahasa Benggali",
		},
		["bua"] = {
			["name"] = "Buryat",
		},
		["cel-pro"] = { -- Incorrect tag
			["name"] = "Celtik Purba",
			["Wikipedia_code"] = "cel-x-proto",
		},
		["cel-x-proto"] = {
			["name"] = "Celtik Purba",
		},
		["cel-bry-pro"] = { -- Incorrect tag
			["name"] = "Brythonik Purba",
			["article"] = "Britonik Basahan",
			["type"] = "rekonstruksi",
		},
		["cu"] = {
			["name"] = "Slavonik Gereja Kuno",
			["article"] = "Slavonik Gereja Kuno",
		},
		["de"] = {
			["name"] = "Jerman",
			["article"] = "bahasa Jerman",
		},
		["en"] = {
			["name"] = "Inggeris",
			["article"] = "bahasa Inggeris",
		},
		["es"] = {
			["name"] = "Sepanyol",
			["article"] = "bahasa Sepanyol",
		},
		["egy"] = {
			["name"] = "Mesir",
		},
		["evn"] = {
			["name"] = "Evenki",
			["article"] = "bahasa Evenki",
		},
		["fr"] = {
			["name"] = "Perancis",
			["article"] = "bahasa Perancis",
		},
		["frm"] = {
			["name"] = "Perancis Pertengahan",
			["article"] = "Perancis Pertengahan",
		},
		["frp"] = {
			["name"] = "Franco-Provençal",
		},
		["ff"] = {
			["name"] = "Fula",
		},
		["gem-pro"] = { -- Incorrect tag
			["name"] = "Jermanik Purba",
			["article"] = "bahasa Jermanik Purba",
			["type"] = "rekonstruksi",
			["replacements"] = {},
			["Wikipedia_code"] = "gem-x-proto",
		},
		["gem-x-proto"] = {
			["name"] = "Jermanik Purba",
			["article"] = "bahasa Jermanik Purba",
			["type"] = "rekonstruksi",
			["replacements"] = {},
		},
		["gml"] = {
			["name"] = "Jerman Hilir Pertengahan",
		},
		["gmw-ecg"] = {
			["name"] = "Jerman Tengah Timur",
		},
		["gmw-x-proto"] = {
			["name"] = "Jermanik Barat Purba",
			["article"] = "bahasa Jermanik Barat Purba",
			["type"] = "rekonstruksi",
			["replacements"] = {},
		},
		["gmq-x-gut"] = {
			["name"] = "Gutnis",
			["article"] = "Gutnis",
		},
		["goh"] = {
			["replacements"] = {
				decompose = true,
				from = {
					"[" .. macron .. circumflex .. diaeresis .. "]",
				},
			},
		},
		["got"] = {
			["name"] = "Gothik",
			["article"] = "bahasa Gothik",
			["replacements"] = {
				-- Latin to Gothic, because people do not want to have to
				-- copy and paste Gothic letters
				["[AÁaáĀā]"] = "𐌰",
				["[Bb]"] = "𐌱",
				["[Gg]"] = "𐌲",
				["[Dd]"] = "𐌳",
				["[EeĒē]"] = "𐌴",
				["[Qq]"] = "𐌵",
				["[Zz]"] = "𐌶",
				["[Hh]"] = "𐌷",
				["[Þþ]"] = "𐌸",
				["[IiÍí]"] = "𐌹",
				["[Kk]"] = "𐌺",
				["[Ll]"] = "𐌻",
				["[Mm]"] = "𐌼",
				["[Nn]"] = "𐌽",
				["[Jj]"] = "𐌾",
				["[UuÚúŪū]"] = "𐌿",
				["[Pp]"] = "𐍀",
				["[Rr]"] = "𐍂",
				["[Ss]"] = "𐍃",
				["[Tt]"] = "𐍄",
				["[WwYy]"] = "𐍅",
				["[Ff]"] = "𐍆",
				["[Xx]"] = "𐍇",
				["[Ƕƕ]"] = "𐍈", -- Unsure whether "hw" and "hv" can be substituted as well
				["[OoŌō]"] = "𐍉",
			},
		},
		["gsw"] = {
			["name"] = "Jerman Alemannik",
		},
		["grc"] = {
			["name"] = "Yunani Purba",
			["article"] = "Yunani Purba",
			["replacements"] = {
				decompose = true,
				from = {
					-- Replace variant letter forms with the standard ones.
					"ϐ", "ϵ", "ϑ", "ϰ", "ϱ", "ϲ", "ϕ",
					-- Remove macrons and breves (and the undertie mark).
					-- This pattern has no counterpart in `to`.
					"[" .. macron .. breve .. undertie .. "]"
				},
				to = {
					"β", "ε", "θ", "κ", "ρ", "σ", "φ",
				}
			},
		},
		["grk-pro"] = { -- Incorrect tag
			["name"] = "Hellenik Purba",
			["Wikipedia_name"] = "Proto-Yunani",
			["article"] = "bahasa Proto-Yunani",
			["type"] = "rekonstruksi",
			["replacements"] = {},
			-- Points at the Hellenic entry defined just below; this used to
			-- say "gem-x-proto" (Proto-Germanic), a copy-paste slip.
			["Wikipedia_code"] = "grk-x-proto",
		},
		["grk-x-proto"] = {
			["name"] = "Hellenik Purba",
			["Wikipedia_name"] = "Proto-Yunani",
			["article"] = "bahasa Proto-Yunani",
			["type"] = "rekonstruksi",
			["replacements"] = {},
		},
		["grt"] = {
			["name"] = "Garo",
		},
		["ha"] = {
			["name"] = "Hausa",
			-- remove tilde, grave, acute, macron, circumflex
			["replacements"] = {
				decompose = true,
				from = { "[" .. grave .. circumflex .. macron .. acute .. tilde .. "]" },
			},
		},
		["hi"] = {
			["name"] = "Hindi",
			["article"] = "Hindi",
		},
		["ine-bsl-pro"] = {
			["name"] = "Balto-Slavik Purba",
			["article"] = "bahasa Balto-Slavik Purba",
			["type"] = "rekonstruksi",
		},
		["ine-pro"] = { -- Incorrect tag
			["name"] = "Indo-Eropah Purba",
			["article"] = "bahasa Indo-Eropah Purba",
			["type"] = "rekonstruksi",
			["replacements"] = {},
			["Wikipedia_code"] = "ine-x-proto",
		},
		["ine-x-proto"] = {
			["name"] = "Indo-Eropah Purba",
			["article"] = "bahasa Indo-Eropah Purba",
			["type"] = "rekonstruksi",
			["replacements"] = {},
		},
		["ja"] = {
			["name"] = "Jepun",
			["article"] = "bahasa Jepun",
		},
		["jbo"] = { -- Lojban
			["type"] = "appendix",
		},
		["ksk"] = {
			["name"] = "Kansa",
			["article"] = "bahasa Kansa",
		},
		["la"] = {
			["name"] = "Latin",
			["article"] = "Latin",
			["replacements"] = {
				decompose = true,
				from = { "[" .. macron .. breve .. diaeresis .. "]" },
			},
		},
		["lt"] = {
			["name"] = "Lithuania",
			-- remove acute, tilde, grave
			["replacements"] = {
				decompose = true,
				from = { "[" .. acute .. tilde .. grave .. "]" },
			},
		},
		["moe"] = {
			["name"] = "Cree",
		},
		["mul"] = {
			["name"] = "Translingual",
			["article"] = "",
		},
		["nci"] = {
			["name"] = "Nahuatl Klasik",
			["article"] = "Nahuatl Klasik",
			["replacements"] = {
				decompose = true,
				-- Remove macron, acute, circumflex, grave and saltillo;
				-- see [[Saltillo (linguistics)]].
				from = { "[" .. grave .. acute .. macron .. circumflex .. "Ꞌꞌʻʼ'ʔ]" },
			},
		},
		["nds-de"] = {
			["name"] = "Jerman Hilir Jerman",
		},
		["odt"] = {
			["name"] = "Belanda Kuno",
		},
		["oge"] = {
			["name"] = "Georgia Kuno",
		},
		["oj"] = {
			["name"] = "Ojibwe",
		},
		["orv"] = {
			["name"] = "Slavik Timur Kuno",
			["article"] = "Slavik Timur Kuno",
			["replacements"] = {
				[U(0x484)] = "",
			},
		},
		["osx"] = {
			["name"] = "Saxon Kuno",
		},
		["pt"] = {
			["name"] = "Portugis",
			-- Spelling corrected from "bahasa Portugus" to match the name above.
			["article"] = "bahasa Portugis",
			-- ["scripts"] = { "Latn" },
		},
		["pa"] = {
			["name"] = "Punjab",
			["article"] = "bahasa Punjab",
		},
		["pis"] = {
			["name"] = "Pijin",
			["article"] = "bahasa Pijin",
		},
		["poz-x-poly-proto"] = {
			["name"] = "Nuklear Polinesia Purba",
			["article"] = "bahasa Polinesia Purba",
			["type"] = "rekonstruksi",
		},
		["rap"] = {
			["name"] = "Rapa Nui",
			-- NOTE(review): English-style title, unlike the other entries;
			-- confirm this is the intended target article.
			["article"] = "Rapa Nui language",
		},
		["ru"] = {
			["name"] = "Rusia",
			["article"] = "bahasa Rusia",
			["replacements"] = { [acute] = "", },
		},
		["rw"] = {
			["name"] = "Rwanda-Rundi",
		},
		["se"] = {
			["replacements"] = {
				["([đflmnŋrsšŧv])'%1"] = "%1%1",
			},
		},
		["sem-pro"] = {
			["name"] = "Semitik Purba",
			["article"] = "Semitik Purba",
			["type"] = "rekonstruksi",
		},
		["sh"] = {
			["article"] = "bahasa Serbo-Croatia",
			["replacements"] = {
				decompose = true,
				from = { "([AaEeIiOoUuRrАаЕеИиОоУуРр])[" .. double_grave
					.. grave .. invbreve .. acute .. macron .. tilde .. "]" },
				to = { "%1" },
			},
		},
		["sl"] = {
			["name"] = "Sloven",
			["replacements"] = {
				decompose = true,
				-- remove tonal orthography
				from = {"ł", "[" .. grave .. acute .. macron .. double_grave .. invbreve .. circumflex .. dot_below .. "]"},
				to = {"l"},
			},
		},
		["sla-pro"] = {
			["name"] = "Slavik Purba", -- also Common Slavic
			["type"] = "rekonstruksi",
			["replacements"] = {
				["[ÀÁÃĀȀȂ]"] = "A",
				["[àáãāȁȃ]"] = "a",
				["[ÈÉẼĒȄȆ]"] = "E",
				["[èéẽēȅȇ]"] = "e",
				["[ÌÍĨĪȈȊ]"] = "I",
				["[ìíĩīȉȋ]"] = "i",
				["[ÒÓÕŌȌȎŐ]"] = "O",
				["[òóõōȍȏő]"] = "o",
				["[ÙÚŨŪȔȖŰ]"] = "U",
				["[ùúũūȕȗű]"] = "u",
				["[ỲÝỸȲ]"] = "Y",
				["[ỳýỹȳ]"] = "y",
				["Ǭ"] = "Ǫ",
				["ǭ"] = "ǫ",
				["[" .. grave .. acute .. double_acute .. tilde .. macron .. double_grave .. invbreve .. "]"] = "",
				["ĭ"] = "ь",
				["ŭ"] = "ъ",
			},
		},
		["tts"] = {
			["name"] = "Isan", -- also "Northeastern Thai"
			["article"] = "bahasa Isan",
		},
		["ug"] = {
			["name"] = "Uyghur", -- also, less commonly, spelled "Uighur"
			["article"] = "bahasa Uyghur",
		},
		["uk"] = {
			["article"] = "bahasa Ukraine",
			["replacements"] = { [acute] = "", }
		},
		["ur"] = {
			["name"] = "Urdu",
			["article"] = "Urdu",
		},
		["xcl"] = {
			["name"] = "Armenia Kuno",
			["article"] = "Armenia Klasik",
			["replacements"] = {
				["[՞՜՛՟]"] = "",
				["և"] = "եւ",
			},
		},
		["xgf"] = {
			["name"] = "Tongva", -- not the ISO name ("Gabrielino-Fernandeño")
			["article"] = "bahasa Tongva",
			["replacements"] = {
				["['`ʔ]"] = "ʼ",
			},
		},
		["xlu"] = {
			["name"] = "Luwi", -- not the ISO name ("Cuneiform Luwian")
			["article"] = "Luwi Pepaku"
		},
		["xxt"] = {
			["name"] = "Tambora",
			["article"] = "bahasa Tambora",
		},
		["xvn"] = {
			["name"] = "Vandalik",
			["article"] = "bahasa Vandalik",
		},
		["yua"] = {
			["name"] = "Maya Yucatec",
			["article"] = "bahasa Maya Yucatec",
		},
		["zh"] = {
			["name"] = "Cina",
			["article"] = "bahasa Cina",
			-- ["scripts"] = { "Hani" },
		},
	},
	-- Here, the keys (for example, "gem") are the Wikipedia language codes
	-- used in {{lang}}, and the values (for example, "gem-pro") are the
	-- equivalent Wiktionary codes.
	-- Subtags are not currently supported.
	["redirects"] = {
		["aae"] = "sq",
		["aiq"] = "fa",
		["aln"] = "sq",
		["als"] = "sq",
		["azb"] = "az",
		["azj"] = "az",
		["bgn"] = "bal",
		["bs"] = "sh",
		["bxr"] = "bua",
		["ciw"] = "oj",
		["cnr"] = "sh",
		["fil"] = "tl",
		["fuf"] = "ff",
		["gem"] = "gem-pro", -- Incorrect, but commonly used.
		["hak"] = "zh",
		["hbo"] = "he",
		["hr"] = "sh",
		["ine"] = "ine-pro", -- Incorrect, but probably commonly used.
		["kjv"] = "sh",
		["nan"] = "zh",
		["prs"] = "fa",
		["rn"] = "rw",
		["sli"] = "gmw-ecg",
		["sr"] = "sh",
		["src"] = "sc",
		["sro"] = "sc",
		["tw"] = "ak",
		["wae"] = "gsw",
		["wep"] = "nds-de",
		["yue"] = "zh",
		["xno"] = "fro",
	},
}

return data