local export = {}
local gsub = mw.ustring.gsub
local gsplit = mw.text.gsplit
local match = mw.ustring.match
local initial_ipa = {
["b"] = "p", ["p"] = "pʰ", ["m"] = "m",
["d"] = "t", ["t"] = "tʰ", ["n"] = "n", ["l"] = "l",
["c"] = "t͡s", ["ch"] = "t͡sʰ", ["s"] = "s",
["g"] = "k", ["k"] = "kʰ", ["ng"] = "ŋ", ["h"] = "x",
[""] = "",
}
local final_ipa = {
["i"] = "i", ["u"] = "u", ["ṳ"] = "y",
["a"] = "a", ["ia"] = "ia", ["ua"] = "ua",
["a̤"] = "ɛ", ["ie"] = "iɛ", ["uoi"] = "uɛ", ["ṳe"] = "yɛ",
["o̤"] = "ɔ", ["io̤"] = "iɔ",
["e"] = "e", ["e̤"] = "œ", ["o"] = "o",
["ai"] = "ai", ["uai"] = "uai",
["au"] = "au", ["iau"] = "iau",
["iu"] = "iu",
["ing"] = "iŋ", ["uing"] = "uiŋ", ["ṳing"] = "yiŋ",
["ang"] = "aŋ", ["iang"] = "iaŋ", ["uang"] = "uaŋ",
["o̤ng"] = "ɔŋ", ["ong"] = "ɔŋ", ["io̤ng"] = "iɔŋ", ["iong"] = "iɔŋ", ["uo̤ng"] = "uɔŋ",
["eng"] = "eiŋ", --missing /ieiŋ/
["e̤ng"] = "œyŋ",
["aing"] = "aiŋ", ["uaing"] = "uaiŋ",
}
local tone_marks = "[́̂̌̿̄̆̀]"
local tone_from_mark = {
["́"] = 1, --陰平 (acute)
["̂"] = 3, --陽平 (circumflex)
["̌"] = 2, --上 (caron)
["̿"] = 3, --陰去 (double overline)
["̄"] = 4, --陽去 (macron)
["̆"] = 5, --陰入 (breve)
["̀"] = 6, --陽入 (grave)
}
local tone_value = {
[1] = "⁵⁴", --陰平
[2] = "²¹", --上
[3] = "³³", --陰去
[4] = "⁵⁵", --陽去
[5] = "²⁴", --陰入
[6] = "⁴²", --陽入
}
--[=[
Given a syllable, return tone value of the syllable's tone and the syllable without the tone mark
]=]
local function get_tone_value(syllable)
if match(syllable, "̄̄") then -- check for double macron
local corrected = gsub(syllable, "̄̄", "̿")
error("Please change " .. syllable .. " to " .. corrected .. ".")
end
local tone = match(syllable, tone_marks)
if tone then
return tone_value[tone_from_mark[tone]], gsub(syllable, tone, "")
else
error("No tone detected.")
end
end
function export.rom(text)
text = gsub(text, "/", " / ")
text = gsub(text, ">([^> %-]+)", "<sup>→%1</sup>")
return text
end
function export.ipa(text)
text = mw.ustring.toNFD(mw.ustring.lower(text))
local words_ipa = {}
for word in gsplit(text, "/") do
word = gsub(word, " ", "-")
syllables_ipa = {}
for syllable in gsplit(word, "-") do
syllable = match(syllable, ">(.*)$") or syllable
local initial, final, tone_value
tone_value, syllable = get_tone_value(syllable)
initial, final = match(syllable, "^([bpmdtnlcsk]?[gh]?)([aeioung̤]+)$")
initial, final = mw.ustring.toNFC(initial), mw.ustring.toNFC(final)
initial, final = initial_ipa[initial], final_ipa[final]
table.insert(syllables_ipa, initial..final..tone_value)
end
table.insert(words_ipa, table.concat(syllables_ipa, " "))
end
return "/" .. table.concat(words_ipa, "/, /") .. "/"
end
return export