local data = {}
local U = mw.ustring.char
local macron = U(0x304)
local spacing_macron = U(0xAF)
local modifier_macron = U(0x2C9)
local breve = U(0x306)
local spacing_breve = U(0x2D8)
local rough = U(0x314)
local smooth = U(0x313)
local diaeresis = U(0x308)
local acute = U(0x301)
local grave = U(0x300)
local circum = U(0x342)
local Latin_circum = U(0x302)
local coronis = U(0x343)
local subscript = U(0x345)
data["diacritics"] = {
["macron"] = macron,
["spacing_macron"] = spacing_macron,
["modifier_macron"] = modifier_macron,
["breve"] = breve,
["spacing_breve"] = spacing_breve,
["rough"] = rough,
["smooth"] = smooth,
["diaeresis"] = diaeresis,
["acute"] = acute,
["grave"] = grave,
["circum"] = circum,
["Latin_circum"] = Latin_circum,
["coronis"] = coronis,
["subscript"] = subscript,
}
data.diacritics.all = ""
for name, diacritic in pairs(data.diacritics) do
data.diacritics.all = data.diacritics.all .. diacritic
end
data["named"] = data["diacritics"]
data["diacritic"] = "[" .. data.diacritics.all .. "]"
data["all"] = data["diacritic"]
data["diacritic_groups"] = {
[1] = "[".. macron .. breve .."]",
[2] = "[".. diaeresis .. smooth .. rough .."]",
[3] = "[".. acute .. grave .. circum .. "]",
[4] = subscript,
}
data["groups"] = data["diacritic_groups"]
data["diacritic_groups"]["accents"] = data["groups"][3]
data["diacritical_conversions"] = {
-- Convert spacing to combining diacritics
["[".. spacing_macron .. modifier_macron .."]"] = macron, -- macron
[spacing_breve] = breve, -- breve
["[῾ʽ]"] = rough, -- rough breathing, modifier letter reversed comma
["[᾿ʼ᾽".. coronis .."]"] = smooth, -- smooth breathing, modifier letter apostrophe, coronis, combining coronis
["´"] = acute, -- acute
["`"] = grave, -- grave
["[῀ˆ".. Latin_circum .."]"] = circum, -- Greek circumflex (perispomeni), circumflex, combining circumflex
["῎"] = smooth .. acute, -- smooth and acute
["῍"] = smooth .. grave, -- smooth and grave
["῏"] = smooth .. circum, -- smooth and circumflex
["῞"] = rough .. acute, -- rough and acute
["῝"] = rough .. grave, -- rough and grave
["῟"] = rough .. circum, -- rough and circumflex
["¨"] = diaeresis,
["΅"] = diaeresis .. acute,
["῭"] = diaeresis .. grave,
["῁"] = diaeresis .. circum,
}
data["conversions"] = data["diacritical_conversions"]
data["consonants"] = "βγδζθκλμνξπρσςτφχψ"
data["consonant"] = "[" .. data.consonants .. "]"
return data