11,796
edits
TheNightAvl (talk | contribs) mNo edit summary |
TheNightAvl (talk | contribs) No edit summary |
||
(11 intermediate revisions by 2 users not shown) | |||
Line 3: | Line 3: | ||
-- DATA -- | -- DATA -- | ||
--[[change the character you want to use to mark secondary stress in the input→]] local secondary_stress_marker = "_" | |||
local data = { | local data = { | ||
Line 36: | Line 38: | ||
["ž"] = "ʒ", | ["ž"] = "ʒ", | ||
["hl"] = " | ["hl"] = "ɬ", | ||
["hlj"] = "ʎ̥", | ["hlj"] = "ʎ̥", | ||
["hm"] = "m̥", | ["hm"] = "m̥", | ||
Line 43: | Line 45: | ||
["hñ"] = "ŋ̊", | ["hñ"] = "ŋ̊", | ||
["hr"] = "r̥", | ["hr"] = "r̥", | ||
["tl"] = "ɬ", | |||
["dl"] = "ɮ", | |||
["ls"] = "ɬ", | |||
["lz"] = "ɮ", | |||
["lš"] = "ɬɬ", | |||
["lž"] = "ɮɮ", | |||
["tˌl"] = "ˌɬ", | |||
["dˌl"] = "ˌɮ", | |||
["lˌs"] = "ˌɬ", | |||
["lˌz"] = "ˌɮ", | |||
["lˌš"] = "ɬˌɬ", | |||
["lˌž"] = "ɮˌɮ", | |||
["l·s"] = "ɬɬ", | |||
["l·z"] = "ɮɮ", | |||
["llj"] = "ʎʎ", | ["llj"] = "ʎʎ", | ||
["nnj"] = "ɲɲ", | ["nnj"] = "ɲɲ", | ||
["rtl"] = "ɬɬ", | |||
["rdl"] = "ɮɮ", | |||
["ltl"] = "ɬɬ", | |||
["ldl"] = "ɮɮ", | |||
["l·ˌs"] = "ɬˌɬ", | |||
["l·ˌz"] = "ɮˌɮ", | |||
["lˌlj"] = "ʎˌʎ", | |||
["nˌnj"] = "ɲˌɲ", | |||
["rtˌl"] = "ɬˌɬ", | |||
["rdˌl"] = "ɮˌɮ", | |||
["ltˌl"] = "ɬˌɬ", | |||
["ldˌl"] = "ɮˌɮ", | |||
["lhl"] = " | ["lhl"] = "ɬɬ", | ||
["lhlj"] = "ʎʎ", | ["lhlj"] = "ʎʎ", | ||
["mhm"] = "mm", | ["mhm"] = "mm", | ||
["nhm"] = "mm", | |||
["nhn"] = "nn", | ["nhn"] = "nn", | ||
["nhnj"] = "ɲɲ", | ["nhnj"] = "ɲɲ", | ||
["ñhñ"] = "ŋŋ", | ["ñhñ"] = "ŋŋ", | ||
["rhr"] = "rr", | ["rhr"] = "rr", | ||
["nm"] = "mm", | |||
["lˌhl"] = "ɬˌɬ", | |||
["lˌhlj"] = "ʎˌʎ", | |||
["mˌhm"] = "mˌm", | |||
["nˌhm"] = "mˌm", | |||
["nˌhn"] = "nˌn", | |||
["nˌhnj"] = "ɲˌɲ", | |||
["ñˌhñ"] = "ŋˌŋ", | |||
["rˌhr"] = "rˌr", | |||
["nˌm"] = "mˌm", | |||
[" "] = " ", | [" "] = " ", | ||
["."] = "|", | ["."] = "|", | ||
["ˌ"] = "ˌ", | |||
} | } | ||
data[","] = data["."] | data[","] = data["."] | ||
local affixes = mw.loadData("Module:lfv-IPA/affixes") | |||
local prefixes, suffixes = affixes.prefixes, affixes.suffixes | |||
local vowel = { | local vowel = { | ||
Line 73: | Line 119: | ||
["y"] = true, | ["y"] = true, | ||
} | } | ||
local ortho_vowels = "aeêioôøuy" | |||
for v, _ in pairs(vowel) do | |||
vowel["ˈ" .. v] = true | |||
end | |||
local consonant = { | local consonant = { | ||
Line 101: | Line 151: | ||
["z"] = true, | ["z"] = true, | ||
["ʒ"] = true, | ["ʒ"] = true, | ||
["ɬ"] = true, | |||
["ɮ"] = true, | |||
} | } | ||
for c, _ in pairs(consonant) do | |||
consonant["ˈ" .. c] = true | |||
end | |||
local ortho_consonants = "bdðfgǧhjklmnñprsštþvwŵzž" | |||
local ortho_digraphs = {"hlj", "hl", "hm", "hnj", "hn", "hñ", "hr","lj", "ls","lz","nj"} | |||
local boundary = { | local boundary = { | ||
Line 115: | Line 172: | ||
["ŋ̊"] = "ŋŋ", | ["ŋ̊"] = "ŋŋ", | ||
["r̥"] = "rr", | ["r̥"] = "rr", | ||
["ˌʎ̥"] = "ʎˌʎ", | |||
["ˌm̥"] = "mˌm", | |||
["ˌn̥"] = "nˌn", | |||
["ˌɲ̊"] = "ɲˌɲ", | |||
["ˌŋ̊"] = "ŋˌŋ", | |||
["ˌr̥"] = "rˌr", | |||
} | } | ||
Line 127: | Line 191: | ||
["z"] = "z̥", | ["z"] = "z̥", | ||
["ʒ"] = "ʒ̊", | ["ʒ"] = "ʒ̊", | ||
["ɮ"] = "ɮ̊", | |||
} | } | ||
Line 138: | Line 203: | ||
["t"] = true, | ["t"] = true, | ||
["θ"] = true, | ["θ"] = true, | ||
["ɬ"] = true, | |||
} | |||
local velar = { | |||
["ɡ"] = true, | |||
["ɣ"] = true, | |||
["x"] = true, | |||
["k"] = true, | |||
} | } | ||
function generate_IPA(word, phon, col) | function generate_IPA(word, phon, col, nopref, nosuff) | ||
local working_IPA = {} | local working_IPA = {} | ||
local is_affix = false | local is_affix = false | ||
word = word:gsub(secondary_stress_marker, "ˌ") | |||
-- auto secondary stress -- | |||
if phon then | |||
if nopref ~= true then | |||
for _, pref in ipairs(prefixes) do | |||
if mw.ustring.find(word, "^" .. pref) then | |||
word = mw.ustring.gsub(word, "^" .. pref, pref .. "ˌ") | |||
break | |||
end | |||
end | |||
end | |||
if nosuff ~= true then | |||
for _, suff in ipairs(suffixes) do | |||
if mw.ustring.find(word, suff .. "$") then | |||
word = mw.ustring.gsub(word, suff .. "$", "ˌ" .. suff) | |||
break | |||
end | |||
end | |||
end | |||
for _, digraph in ipairs(ortho_digraphs) do | |||
word = mw.ustring.gsub(word, digraph .. "ˌ([" .. ortho_vowels .. "])", "ˌ" .. digraph .. "%1") | |||
end | |||
word = mw.ustring.gsub(word, "([" .. ortho_consonants .. "])ˌ([" .. ortho_vowels .. "])", "ˌ%1%2") | |||
end | |||
-- base generation -- | -- base generation -- | ||
while #word > 0 do | while #word > 0 do | ||
if data[mw.ustring.sub(word, 1, 4)] then | if data[mw.ustring.sub(word, 1, 5)] then | ||
table.insert(working_IPA, data[mw.ustring.sub(word, 1, 5)]) | |||
word = mw.ustring.sub(word, 6) | |||
elseif data[mw.ustring.sub(word, 1, 4)] then | |||
table.insert(working_IPA, data[mw.ustring.sub(word, 1, 4)]) | table.insert(working_IPA, data[mw.ustring.sub(word, 1, 4)]) | ||
word = mw.ustring.sub(word, 5) | word = mw.ustring.sub(word, 5) | ||
Line 173: | Line 275: | ||
end | end | ||
end | end | ||
word = word:gsub("ˌˌ+", "ˌ") | |||
local i = 1 | local i = 1 | ||
Line 217: | Line 321: | ||
end | end | ||
end | end | ||
mw.logObject(working_IPA) | |||
-- intervocalic voicing and gemination of voiceless sonorants -- | -- intervocalic voicing and gemination of voiceless sonorants -- | ||
if vowel[p_prev] and intervocalic_voicing[p_current] ~= nil and vowel[p_next] then | if vowel[p_prev] and intervocalic_voicing[p_current] ~= nil and vowel[p_next] then | ||
p_resolve(intervocalic_voicing[p_current]) | p_resolve(intervocalic_voicing[p_current]) | ||
end | |||
-- account for <CCu/iV> spelling -- | |||
if consonant[p_prev] and working_IPA[i-2] == p_prev and vowel[p_next] then | |||
if p_current == "u" then | |||
p_resolve("w") | |||
elseif p_current == "i" then | |||
p_resolve("j") | |||
end | |||
end | |||
-- n → ŋ -- | |||
if p_current == "n" and velar[p_next] then | |||
p_resolve("ŋ") | |||
end | end | ||
Line 262: | Line 382: | ||
-- phonetic only -- | -- phonetic only -- | ||
if phon then | if phon then | ||
-- terminal devoicing -- | -- terminal devoicing -- | ||
Line 322: | Line 435: | ||
elseif vowel[p_prev] and p_current == "u" then | elseif vowel[p_prev] and p_current == "u" then | ||
p_resolve("u̯") | p_resolve("u̯") | ||
end | |||
-- {i u} V -- | |||
if vowel[p_next] and (p_current == "i" or p_current == "u") then | |||
local desyllabify = false | |||
for checker = 1, i-1 do | |||
if vowel[working_IPA[i - checker]] then | |||
desyllabify = true | |||
break | |||
elseif boundary[working_IPA[i - checker]] or working_IPA[i - checker] == nil then | |||
break | |||
end | |||
end | |||
if desyllabify then | |||
if p_current == "u" then | |||
p_resolve("u̯") | |||
elseif p_current == "i" then | |||
p_resolve("i̯") | |||
end | |||
end | |||
end | end | ||
Line 348: | Line 483: | ||
if phon then | if phon then | ||
-- /xd/ -- | -- /xd/ /xɡ/ -- | ||
if mw.ustring.find(working_IPA, "( | if mw.ustring.find(working_IPA, "(x[dɡ][̥̊])") then | ||
working_IPA = mw.ustring.gsub(working_IPA, "( | working_IPA = mw.ustring.gsub(working_IPA, "(x)([dɡ][̥̊])", "h%2") | ||
elseif mw.ustring.find(working_IPA, "( | elseif mw.ustring.find(working_IPA, "(x[dɡ])") then | ||
working_IPA = mw.ustring.gsub(working_IPA, "( | working_IPA = mw.ustring.gsub(working_IPA, "(x)([dɡ])", "h%2") .. "~" .. mw.ustring.gsub(working_IPA, "(x)([dɡ])", "ɦ%2") | ||
end | end | ||
Line 375: | Line 510: | ||
["nolarge"] = true, | ["nolarge"] = true, | ||
["cite"] = true, | ["cite"] = true, | ||
["nopref"] = true, | |||
["nosuff"] = true, | |||
} | } | ||
local p = 2 | local p = 2 | ||
Line 405: | Line 542: | ||
if parameters["cite"] then | if parameters["cite"] then | ||
local broad = generate_IPA(outputIPA, false, false) | local broad = generate_IPA(outputIPA, false, false, parameters["nopref"] or false, parameters["nosuff"] or false) | ||
local narrow = generate_IPA(outputIPA, true, parameters["colloquial"] or parameters["col"] or false) | local narrow = generate_IPA(outputIPA, true, parameters["colloquial"] or parameters["col"] or false, parameters["nopref"] or false, parameters["nosuff"] or false) | ||
if "ˈ" .. broad ~= narrow then | if "ˈ" .. broad ~= narrow then | ||
Line 415: | Line 552: | ||
else | else | ||
outputIPA = generate_IPA(outputIPA, parameters["phon"] or false, parameters["colloquial"] or parameters["col"] or false) | outputIPA = generate_IPA(outputIPA, parameters["phon"] or false, parameters["colloquial"] or parameters["col"] or false, parameters["nopref"] or false, parameters["nosuff"] or false) | ||
if parameters["phon"] and parameters["format"] then | if parameters["phon"] and parameters["format"] then |