Module:rad-IPA: Difference between revisions
Jump to navigation
Jump to search
TheNightAvl (talk | contribs) mNo edit summary |
TheNightAvl (talk | contribs) (Added u resolution function.) |
||
Line 29: | Line 29: | ||
[false] = "ɛ", | [false] = "ɛ", | ||
}, | }, | ||
["é"] = "eː", | |||
["f"] = "f", | ["f"] = "f", | ||
["g"] = "ɡ", | ["g"] = "ɡ", | ||
Line 57: | Line 58: | ||
[false] = "ɔ", | [false] = "ɔ", | ||
}, | }, | ||
["ó"] = "oː", | |||
["ø"] = { | ["ø"] = { | ||
["a"] = "œa", | ["a"] = "œa", | ||
Line 76: | Line 78: | ||
[false] = "u", | [false] = "u", | ||
}, | }, | ||
["ù"] = "ù", | |||
["û"] = "ɤ", | ["û"] = "ɤ", | ||
["ú"] = "uː", | ["ú"] = "uː", | ||
Line 103: | Line 106: | ||
data["!"] = data["."] | data["!"] = data["."] | ||
data["?"] = data["."] | data["?"] = data["."] | ||
local valid_phone = { | |||
["a"] = true, ["aː"] = true, ["aːː"] = true, ["æː"] = true, ["ai"] = true, ["au"] = true, ["b"] = true, | |||
["ç"] = true, ["d"] = true, ["ð"] = true, ["eː"] = true, ["ei"] = true, ["ɛ"] = true, ["ɤ"] = true, | |||
["ɤi"] = true, ["f"] = true, ["ɡ"] = true, ["ɣ"] = true, ["h"] = true, ["i"] = true, ["iː"] = true, | |||
["iːː"] = true, ["iːe"] = true, ["ia"] = true, ["ie"] = true, ["j"] = true, ["k"] = true, ["l"] = true, | |||
["m"] = true, ["n"] = true, ["ŋ"] = true, ["oː"] = true, ["œ"] = true, ["œa"] = true, ["øi"] = true, | |||
["ɔ"] = true, ["ɔː"] = true, ["ɔa"] = true, ["ɔi"] = true, ["p"] = true, ["r"] = true, ["s"] = true, | |||
["ʃ"] = true, ["t"] = true, ["u"] = true, ["uː"] = true, ["uːː"] = true, ["uːo"] = true, ["ua"] = true, | |||
["uo"] = true, ["v"] = true, ["w"] = true, ["y"] = true, ["z"] = true, ["ʒ"] = true, ["θ"] = true, | |||
} | |||
local consonant = { | |||
["b"] = true, ["ç"] = true, ["d"] = true, ["ð"] = true, ["f"] = true, | |||
["ɡ"] = true, ["ɣ"] = true, ["h"] = true, ["j"] = true, ["k"] = true, | |||
["l"] = true, ["m"] = true, ["n"] = true, ["ŋ"] = true, ["p"] = true, | |||
["r"] = true, ["s"] = true, ["ʃ"] = true, ["t"] = true, ["v"] = true, | |||
["w"] = true, ["y"] = true, ["z"] = true, ["ʒ"] = true, ["θ"] = true, | |||
} | |||
local vowel = { | |||
["a"] = true, ["aː"] = true, ["aːː"] = true, ["æː"] = true, ["ai"] = true, ["au"] = true, | |||
["eː"] = true, ["ei"] = true, ["ɛ"] = true, ["ɤ"] = true, ["ɤi"] = true, ["i"] = true, | |||
["iː"] = true, ["iːː"] = true, ["iːe"] = true, ["ia"] = true, ["ie"] = true, ["oː"] = true, | |||
["œ"] = true, ["œa"] = true, ["øi"] = true, ["ɔ"] = true, ["ɔː"] = true, ["ɔa"] = true, | |||
["ɔi"] = true, ["u"] = true, ["uː"] = true, ["uːː"] = true, ["uːo"] = true, ["ua"] = true, | |||
["uo"] = true, | |||
} | |||
local glide = { | |||
["j"] = true, ["w"] = true, | |||
} | |||
local boundary = { | |||
[" "] = true, ["|"] = true, ["·"] = true, | |||
} | |||
local IPA = {} | local IPA = {} | ||
function append_IPA (working_IPA) | function append_IPA(working_IPA) | ||
local IPA_size = #IPA --This variable needs to be set before the function or it breaks. | local IPA_size = #IPA --This variable needs to be set before the function or it breaks. | ||
-- generate_IPA: mw.log("————— REGISTERING PHONE —————") | -- generate_IPA: mw.log("————— REGISTERING PHONE —————") | ||
Line 128: | Line 167: | ||
split_s[i] = mw.ustring.sub(s, i,i) | split_s[i] = mw.ustring.sub(s, i,i) | ||
end | end | ||
-- generate_IPA: mw.log("————— BEGINNING BASE GENERATION —————") | |||
if s_len == 0 then | if s_len == 0 then | ||
Line 223: | Line 264: | ||
-- generate_IPA: mw.log('————— STRING EXHAUSTED —————') | -- generate_IPA: mw.log('————— STRING EXHAUSTED —————') | ||
mw.log("Base generation result: [" .. table.concat(IPA,"][") .. "]") | |||
return IPA | return IPA | ||
end | |||
function resolve_u(phones) | |||
local working_phones = phones | |||
mw.log("————— BEGINNING U RESOLUTION —————") | |||
for i = 1, #working_phones do | |||
local p_current = working_phones[i] | |||
local p_next = working_phones[i + 1] | |||
local p_next2 = working_phones[i + 2] | |||
local p_next3 = working_phones[i + 3] | |||
local toResolve = false | |||
if p_current == "a" and p_next == "ù" then | |||
mw.log("<aù> recognised in position " .. i .. ". Converting to resolvable [u].") | |||
working_phones[i + 1] = "u" | |||
end | |||
if p_current == "u" then | |||
mw.log("[u] found in position " .. i .. ".") | |||
if consonant[p_next] then | |||
if glide[p_next2] then | |||
if not vowel[p_next3] then | |||
mw.log("ɤCj!V environment identified.") | |||
toResolve = true | |||
end | |||
elseif not vowel[p_next2] and not glide[p_next2] then | |||
mw.log("ɤC!V environment identified.") | |||
toResolve = true | |||
end | |||
end | |||
elseif p_current == "ù" or p_current == "ū" then | |||
mw.log("Fixed [u] found in position " .. i .. ".") | |||
working_phones[i] = "u" | |||
end | |||
if toResolve == true then | |||
working_phones[i] = "ɤ" | |||
mw.log("[u] → [ɤ] in position ".. i .. ".") | |||
end | |||
end | |||
mw.log("[u] resolution result: [" .. table.concat(working_phones,"][") .. "]") | |||
return working_phones | |||
end | end | ||
Line 229: | Line 316: | ||
local args = getArgs(frame) | local args = getArgs(frame) | ||
local baseGen = generate_IPA(args[1]) | local baseGen = generate_IPA(args[1]) | ||
local outputIPA = table.concat( | local outputIPA = resolve_u(baseGen) | ||
outputIPA = table.concat(outputIPA,"][") | |||
return "[" .. outputIPA .. "]" | return "[" .. outputIPA .. "]" |
Revision as of 20:09, 17 August 2023
See {{rad-IPA}}.
local getArgs = require('Module:Arguments').getArgs
local export = {}
-- Grapheme → phone lookup read by generate_IPA, organised as a small trie.
--   * A string value is the phone text emitted for that spelling.
--   * A table value means the character may begin a longer spelling: each
--     string key is the next character of that spelling, and [false] holds
--     the value used when the spelling stops at this point.
-- generate_IPA looks characters up one at a time, so every top-level key must
-- be a single character; longer spellings have to be nested.
local data = {
	["a"] = {
		["i"] = "ai",
		["o"] = {
			["i"] = "ɔi",
			[false] = "ɔː",
		},
		["u"] = "au",
		[false] = "a",
	},
	["á"] = "aː",
	["ả"] = "aːː",
	-- <âi> used to be a separate top-level key ["âi"], which a
	-- character-by-character lookup can never reach; it is nested here so
	-- that <âi> actually yields "ɤi".
	["â"] = {
		["i"] = "ɤi",
		[false] = "ɤ",
	},
	["b"] = "b",
	["c"] = "ts",
	["d"] = {
		["x"] = "dʒ",
		["z"] = "dz",
		[false] = "d",
	},
	["ð"] = "ð",
	["e"] = {
		["a"] = "æː",
		["i"] = "ei",
		[false] = "ɛ",
	},
	["é"] = "eː",
	["f"] = "f",
	["g"] = "ɡ",
	["h"] = "h",
	["ħ"] = "ɣ",
	["i"] = {
		["e"] = {
			["a"] = "ia",
			[false] = "ie",
		},
		[false] = "i",
	},
	["í"] = "iː",
	["ỉ"] = {
		["e"] = "iːe",
		[false] = "iːː",
	},
	["j"] = "j",
	-- NOTE(review): <ĵ> is emitted unchanged and nothing visible in this
	-- module rewrites it afterwards — confirm whether a later step is meant
	-- to resolve it.
	["ĵ"] = "ĵ",
	["k"] = "k",
	["ķ"] = "tʃ",
	["l"] = "l",
	["m"] = "m",
	["n"] = "n",
	["ņ"] = "ŋ",
	["o"] = {
		["a"] = "ɔa",
		[false] = "ɔ",
	},
	["ó"] = "oː",
	["ø"] = {
		["a"] = "œa",
		-- NOTE(review): <øi> yields "ei", the same as <ei>, while the phone
		-- sets declared below list "øi", which no entry here produces —
		-- confirm whether "øi" was intended.
		["i"] = "ei",
		[false] = "œ",
	},
	["p"] = "p",
	["q"] = "k",
	["r"] = "r",
	["s"] = "s",
	["ș"] = "ʃ",
	["t"] = "t",
	["u"] = {
		["i"] = "ɤi",
		["o"] = {
			["a"] = "ua",
			[false] = "uo",
		},
		[false] = "u",
	},
	-- <ù> and <ū> are emitted unchanged as placeholders; resolve_u turns
	-- them into "u".
	["ù"] = "ù",
	["û"] = "ɤ",
	["ú"] = "uː",
	["ủ"] = {
		["o"] = "uːo",
		[false] = "uːː",
	},
	["ū"] = "ū",
	["v"] = "v",
	["w"] = "w",
	["x"] = "ʒ",
	-- NOTE(review): like <ĵ>, <ỳ> is emitted unchanged and is not rewritten
	-- by anything visible here.
	["ỳ"] = "ỳ",
	["z"] = "z",
	["þ"] = "θ",
	["·"] = "·",
	[" "] = " ",
	["."] = "|",
}

-- Alternative spellings share the entry (the very same table or string) of
-- the grapheme they stand for.
data["à"] = data["a"]
data["è"] = data["e"]
data["ì"] = data["i"]
data["ò"] = data["o"]
data["y"] = data["i"]
data["ý"] = data["í"]
data["ỷ"] = data["ỉ"]

-- Other punctuation marks behave like the full stop.
data[","] = data["."]
data["!"] = data["."]
data["?"] = data["."]
-- Turns a list of phones into a set (phone → true) for constant-time
-- membership tests.
local function phone_set(list)
	local set = {}
	for _, phone in ipairs(list) do
		set[phone] = true
	end
	return set
end

-- Inventory of phones: the consonants and vowels listed below, combined.
-- Not read by any function visible in this module.
local valid_phone = phone_set {
	"a", "aː", "aːː", "æː", "ai", "au", "b",
	"ç", "d", "ð", "eː", "ei", "ɛ", "ɤ",
	"ɤi", "f", "ɡ", "ɣ", "h", "i", "iː",
	"iːː", "iːe", "ia", "ie", "j", "k", "l",
	"m", "n", "ŋ", "oː", "œ", "œa", "øi",
	"ɔ", "ɔː", "ɔa", "ɔi", "p", "r", "s",
	"ʃ", "t", "u", "uː", "uːː", "uːo", "ua",
	"uo", "v", "w", "y", "z", "ʒ", "θ",
}

-- Phones that resolve_u treats as consonants.
local consonant = phone_set {
	"b", "ç", "d", "ð", "f",
	"ɡ", "ɣ", "h", "j", "k",
	"l", "m", "n", "ŋ", "p",
	"r", "s", "ʃ", "t", "v",
	"w", "y", "z", "ʒ", "θ",
}

-- Phones that resolve_u treats as vowels (monophthongs and diphthongs).
local vowel = phone_set {
	"a", "aː", "aːː", "æː", "ai", "au",
	"eː", "ei", "ɛ", "ɤ", "ɤi", "i",
	"iː", "iːː", "iːe", "ia", "ie", "oː",
	"œ", "œa", "øi", "ɔ", "ɔː", "ɔa",
	"ɔi", "u", "uː", "uːː", "uːo", "ua",
	"uo",
}

-- Consonants that resolve_u additionally treats as glides.
local glide = phone_set { "j", "w" }

-- Separator symbols. Not read by any function visible in this module.
local boundary = phone_set { " ", "|", "·" }

-- Module-level phone list that append_IPA prepends to.
local IPA = {}
-- Registers a phone at the FRONT of the module-level IPA list.
-- Despite the name this prepends: it serves a scan that walks the word from
-- its end towards its start, where a phone recognised later in the scan sits
-- earlier in the word.
-- @param working_IPA  phone string to register
function append_IPA(working_IPA)
	-- generate_IPA: mw.log("————— REGISTERING PHONE —————")
	-- table.insert with an explicit position shifts the existing entries up
	-- by one, which is what the former hand-written loop did.
	table.insert(IPA, 1, working_IPA)
	-- generate_IPA: mw.log("[" .. working_IPA .. "] registered.")
	-- generate_IPA: mw.log("Current IPA: [" .. table.concat(IPA, "][") .. "]")
end
-- Converts a word into its base list of phones using the `data` trie.
--
-- The word is consumed from its END towards its start. At each step the
-- longest spelling (three characters, then two, then one) that ends at the
-- current position and is a complete entry in `data` is taken, and its phone
-- is placed in front of the phones found so far.
--
-- @param word  the spelling to convert
-- @return      a new sequence of phone strings in reading order
-- Raises "Empty input." for a missing or empty word, and
-- "'<c>' is an invalid character." for a character with no entry in `data`.
function generate_IPA(word)
	-- Module:Arguments drops blank parameters by default, so a missing word
	-- reaches this function as nil rather than "". Both get the same message
	-- instead of a type error from mw.ustring.
	if word == nil or word == "" then
		error("Empty input.")
	end

	local chars = {}
	local remaining = mw.ustring.len(word)
	for i = 1, remaining do
		chars[i] = mw.ustring.sub(word, i, i)
	end
	-- generate_IPA: mw.log("————— BEGINNING BASE GENERATION —————")

	-- Reads chars[first..last] as ONE complete spelling.
	-- Returns its phone, or nil when the window is not a spelling.
	local function match(first, last)
		local node = data[chars[first]]
		if node == nil then
			error("'" .. chars[first] .. "' is an invalid character.")
		end
		for k = first + 1, last do
			if type(node) ~= "table" then
				-- The spelling is already complete but the window is longer.
				return nil
			end
			node = node[chars[k]]
			if node == nil then
				-- No spelling continues with this character.
				return nil
			end
		end
		if type(node) == "table" then
			-- The window ends on a character that could be continued: use
			-- the value for "spelling stops here".
			node = node[false]
			if node == nil then
				if first == last then
					error(chars[last] .. " is an invalid character.")
				end
				error("data[" .. table.concat(chars, "][", first, last) .. "][false] is missing.")
			end
		end
		return node
	end

	-- Phones are collected back to front, then put into reading order.
	local reversed = {}
	while remaining > 0 do
		local phone, length
		for len = math.min(3, remaining), 1, -1 do
			phone = match(remaining - len + 1, remaining)
			if phone then
				length = len
				break
			end
		end
		-- A one-character window always matches or raises, so `phone` and
		-- `length` are set here.
		reversed[#reversed + 1] = phone
		remaining = remaining - length
	end
	-- generate_IPA: mw.log('————— STRING EXHAUSTED —————')

	local phones = {}
	for i = #reversed, 1, -1 do
		phones[#phones + 1] = reversed[i]
	end

	mw.log("Base generation result: [" .. table.concat(phones, "][") .. "]")
	return phones
end
-- Decides, for every [u] in a phone list, whether it stays [u] or becomes [ɤ].
--
-- A resolvable "u" becomes "ɤ" when it is followed by a consonant and that
-- consonant is NOT followed by a vowel, either directly or across one glide:
--   u C (not V)        → ɤ
--   u C glide (not V)  → ɤ
-- The placeholders "ù" and "ū" denote a fixed [u]: they are rewritten to "u"
-- and never become "ɤ", except that "ù" directly after "a" is turned into an
-- ordinary, resolvable "u".
--
-- @param phones  sequence of phone strings; modified in place
-- @return        the same table, after resolution
function resolve_u(phones)
	-- The look-ahead can reach a placeholder before the loop has rewritten it
	-- to "u". It still stands for a vowel, so it must count as one here;
	-- otherwise u + C + ù would wrongly be read as "no vowel follows".
	-- NOTE(review): "ĵ" and "ỳ" are also emitted as placeholders by the base
	-- generation but their phonetic class is not visible here, so they are
	-- left out — confirm.
	local function is_vowel(phone)
		return vowel[phone] or phone == "ù" or phone == "ū"
	end

	mw.log("————— BEGINNING U RESOLUTION —————")
	for i = 1, #phones do
		local current = phones[i]
		local after1, after2, after3 = phones[i + 1], phones[i + 2], phones[i + 3]
		local toResolve = false

		if current == "a" and after1 == "ù" then
			mw.log("<aù> recognised in position " .. i .. ". Converting to resolvable [u].")
			phones[i + 1] = "u"
		end

		if current == "u" then
			mw.log("[u] found in position " .. i .. ".")
			if consonant[after1] then
				if glide[after2] then
					if not is_vowel(after3) then
						mw.log("ɤCj!V environment identified.")
						toResolve = true
					end
				elseif not is_vowel(after2) then
					mw.log("ɤC!V environment identified.")
					toResolve = true
				end
			end
		elseif current == "ù" or current == "ū" then
			mw.log("Fixed [u] found in position " .. i .. ".")
			phones[i] = "u"
		end

		if toResolve then
			phones[i] = "ɤ"
			mw.log("[u] → [ɤ] in position ".. i .. ".")
		end
	end
	mw.log("[u] resolution result: [" .. table.concat(phones,"][") .. "]")
	return phones
end
-- Template entry point: converts the first argument into a bracketed phone
-- string, one pair of brackets per phone, e.g. "[a][b]".
-- @param frame  frame object (or argument table) accepted by getArgs
-- @return       the phones after base generation and [u] resolution
function export.generate(frame)
	local word = getArgs(frame)[1]
	local phones = resolve_u(generate_IPA(word))
	return "[" .. table.concat(phones, "][") .. "]"
end
return export