Module:Diacritics
Appearance
This module is rated as ready for general use. It has reached a mature form and is thought to be relatively bug-free and ready for use wherever appropriate. It is ready to mention on help pages and other Wikipedia resources as an option for new users to learn. To reduce server load and bad output, it should be improved by sandbox testing rather than repeated trial-and-error editing.
Functions
- convertChar returns the non-diacritic version of the supplied character.
- stripDiacrits replaces words containing diacritical characters with their non-diacritic equivalent.
- isLike tests two words, returning true if they only differ in diacritics, nothing otherwise.
- strip_diacrits is available for export to other modules.
- is_like is available for export to other modules.
Usage
{{#invoke:Diacritics |convertChar | single-character }}
{{#invoke:Diacritics |convertChar |char=single-character}}
{{#invoke:Diacritics |stripDiacrits |word or words }}
{{#invoke:Diacritics |stripDiacrits |word=word or words}}
{{#invoke:Diacritics |isLike | word1 or words1 | word2 or words2 }}
{{#invoke:Diacritics |isLike |word1=word1 or words1 |word2=word2 or words2}}
Examples
{{#invoke: Diacritics |convertChar |char=è }}
→ Script error: The function "convertChar" does not exist.
{{#invoke: Diacritics |convertChar | ß }}
→ Script error: The function "convertChar" does not exist.
{{#invoke: Diacritics |stripDiacrits |word = Fred}}
→ Fred
{{#invoke: Diacritics |stripDiacrits | Fred }}
→ Fred
{{#invoke: Diacritics |stripDiacrits | café }}
→ café
{{#invoke: Diacritics |stripDiacrits | décidé }}
→ décidé
{{#invoke: Diacritics |stripDiacrits | chère }}
→ chère
{{#invoke: Diacritics |stripDiacrits | Übersetzung }}
→ Übersetzung
{{#invoke: Diacritics |stripDiacrits | Álvar Núñez Cabeza de Vaca }}
→ Álvar Núñez Cabeza de Vaca
{{#invoke: Diacritics |isLike | Núñez | Nunez }}
→ Script error: The function "isLike" does not exist.
{{#invoke: Diacritics |isLike | Núñez | Núñez }}
→ Script error: The function "isLike" does not exist.
{{#invoke: Diacritics |isLike | Nunez | Nunez }}
→ Script error: The function "isLike" does not exist.
{{#invoke: Diacritics |isLike | Álvar Núñez | Alvar Nunez }}
→ Script error: The function "isLike" does not exist.
{{#invoke: Diacritics |isLike | Álvar | Núñez }}
→ Script error: The function "isLike" does not exist.
--[[
stripDiacrits replaces accented characters with their simplest equivalent.
strip_diacrits is available for export to other modules.
--]]
local p = {}

-- Replacement text => the diacritic characters that reduce to it.
-- Only the (lowercase) forms listed here are recognised; any other character,
-- including uppercase accented letters, passes through unchanged.
local chars = {
	a = { 'á', 'à', 'â', 'ä', 'ǎ', 'ă', 'ā', 'ã', 'å', 'ą' },
	c = { 'ć', 'ċ', 'ĉ', 'č', 'ç' },
	d = { 'ď', 'đ', 'ḍ', 'ð' },
	e = { 'é', 'è', 'ė', 'ê', 'ë', 'ě', 'ĕ', 'ē', 'ẽ', 'ę', 'ẹ' },
	g = { 'ġ', 'ĝ', 'ğ', 'ģ' },
	h = { 'ĥ', 'ħ', 'ḥ' },
	i = { 'ı', 'í', 'ì', 'î', 'ï', 'ǐ', 'ĭ', 'ī', 'ĩ', 'į' },
	j = { 'ĵ' },
	k = { 'ķ' },
	l = { 'ĺ', 'ŀ', 'ľ', 'ļ', 'ł', 'ḷ', 'ḹ' },
	m = { 'ṃ' },
	n = { 'ń', 'ň', 'ñ', 'ņ', 'ṇ', 'ŋ' },
	o = { 'ó', 'ò', 'ô', 'ö', 'ǒ', 'ŏ', 'ō', 'õ', 'ǫ', 'ọ', 'ő', 'ø' },
	r = { 'ŕ', 'ř', 'ŗ', 'ṛ', 'ṝ' },
	s = { 'ś', 'ŝ', 'š', 'ş', 'ș', 'ṣ' },
	ss = { 'ß' },
	t = { 'ť', 'ţ', 'ț', 'ṭ' },
	u = { 'ú', 'ù', 'û', 'ü', 'ǔ', 'ŭ', 'ū', 'ũ', 'ů', 'ų', 'ụ', 'ű', 'ǘ', 'ǜ', 'ǚ', 'ǖ' },
	w = { 'ŵ' },
	y = { 'ý', 'ŷ', 'ÿ', 'ỹ', 'ȳ' },
	z = { 'ź', 'ż', 'ž' },
}

-- Reverse index: diacritic character => replacement string (the key of
-- `chars` it is listed under), so each character resolves with one lookup.
local char_idx = {}
for base, variants in pairs(chars) do
	for _, variant in ipairs(variants) do
		char_idx[variant] = base
	end
end

-- Lua strings are byte strings, and (with this file saved as UTF-8) every
-- character listed in `chars` occupies more than one byte, so a "." pattern
-- would only ever see fragments of them. This pattern matches one whole
-- multi-byte UTF-8 sequence: a lead byte followed by its continuation bytes.
local MULTIBYTE_CHAR = "[\194-\244][\128-\191]*"

--[[
strip_diacrits returns wrd with every character that appears in `chars`
replaced by its plain equivalent (for example 'é' becomes 'e' and 'ß'
becomes 'ss'). All other characters are left as they are.
Returns "" when wrd is nil or the empty string.
--]]
p.strip_diacrits = function(wrd)
	if not wrd or wrd == "" then return "" end
	-- With a table as the replacement, gsub looks each match up in char_idx
	-- and keeps the original text when there is no entry. The outer
	-- parentheses discard gsub's second result (the substitution count).
	return (wrd:gsub(MULTIBYTE_CHAR, char_idx))
end
--[[
stripDiacrits is the {{#invoke:}} entry point for strip_diacrits.
The text is taken from the named parameter |word= when it is supplied,
otherwise from the first positional parameter with surrounding whitespace
trimmed. When neither parameter is supplied the result is the empty string.
--]]
p.stripDiacrits = function(frame)
	local args = frame.args
	local word = args.word
	if not word and args[1] then
		word = mw.text.trim(args[1])
	end
	-- strip_diacrits returns "" for nil, so a call with no parameters yields
	-- an empty string instead of handing nil to mw.text.trim.
	return p.strip_diacrits(word)
end
-- Export the module table holding strip_diacrits and stripDiacrits.
return p