11,201
edits
TheNightAvl (talk | contribs) (Added syllabification) |
TheNightAvl (talk | contribs) (Added syllable tagging) |
||
Line 101: | Line 101: | ||
[false] = "i", | [false] = "i", | ||
}, | }, | ||
["ỳ"] = " | ["ỳ"] = "y", | ||
["z"] = "z", | ["z"] = "z", | ||
["þ"] = "θ", | ["þ"] = "θ", | ||
Line 196: | Line 196: | ||
["z"] = "z", ["ʒ"] = "ʒ", ["θ"] = "ð", | ["z"] = "z", ["ʒ"] = "ʒ", ["θ"] = "ð", | ||
} | } | ||
local affricate = { | |||
["dz"] = true, ["dʒ"] = true , | |||
["ts"] = true, ["tʃ"] = true, | |||
} | |||
local sibilant = { | local sibilant = { | ||
Line 311: | Line 316: | ||
vowel[temp] = true | vowel[temp] = true | ||
end | end | ||
local long = { | |||
["a"] = false, ["aː"] = true, ["aːː"] = true, ["æː"] = true, ["ai"] = true, ["au"] = true, | |||
["eː"] = true, ["ei"] = true, ["ɛ"] = false, ["ɤ"] = false, ["ɤi"] = true, ["i"] = false, | |||
["iː"] = true, ["iːː"] = true, ["iːe"] = true, ["ia"] = true, ["ie"] = true, ["oː"] = true, | |||
["œ"] = false, ["œa"] = true, ["øi"] = true, ["ɔ"] = false, ["ɔː"] = true, ["ɔa"] = true, | |||
["ɔi"] = true, ["u"] = false, ["uː"] = true, ["uːː"] = true, ["uːo"] = true, ["ua"] = true, | |||
["uo"] = true, ["y"] = false, | |||
} | |||
local weak = { | |||
["a"] = false, ["aː"] = false, ["aːː"] = false, ["æː"] = false, ["ai"] = false, ["au"] = false, | |||
["eː"] = false, ["ei"] = false, ["ɛ"] = false, ["ɤ"] = true, ["ɤi"] = false, ["i"] = true, | |||
["iː"] = false, ["iːː"] = false, ["iːe"] = false, ["ia"] = false, ["ie"] = false, ["oː"] = false, | |||
["œ"] = false, ["œa"] = false, ["øi"] = false, ["ɔ"] = false, ["ɔː"] = false, ["ɔa"] = false, | |||
["ɔi"] = false, ["u"] = false, ["uː"] = false, ["uːː"] = false, ["uːo"] = false, ["ua"] = false, | |||
["uo"] = false, ["y"] = false, | |||
} | |||
-- MISC -- | -- MISC -- | ||
Line 330: | Line 353: | ||
if mw.ustring.match(s, toReplace) then | if mw.ustring.match(s, toReplace) then | ||
s = mw.ustring.gsub(s, toReplace, ReplaceKey) | s = mw.ustring.gsub(s, toReplace, ReplaceKey) | ||
mw.log("Irregular spelling <" .. toReplace .. "> recognised. Treating as <" .. ReplaceKey .. ">.") | -- generate_IPA: mw.log("Irregular spelling <" .. toReplace .. "> recognised. Treating as <" .. ReplaceKey .. ">.") | ||
end | end | ||
end | end | ||
Line 380: | Line 403: | ||
-- generate_IPA: mw.log("Tabular index recognised.") | -- generate_IPA: mw.log("Tabular index recognised.") | ||
for j = 1, 0 - i do | for j = 1, 0 - i do | ||
local currentCombo = "" | local currentCombo = "" | ||
-- for logs only | |||
if i == -2 and j == 2 then | if i == -2 and j == 2 then | ||
currentCombo = split_s[s_len + i + j - 2] .. " + " .. split_s[s_len + i + j - 1] .. " + " .. split_s[s_len + i + j] | currentCombo = split_s[s_len + i + j - 2] .. " + " .. split_s[s_len + i + j - 1] .. " + " .. split_s[s_len + i + j] | ||
Line 387: | Line 410: | ||
currentCombo = split_s[s_len + i + j - 1] .. " + " .. split_s[s_len + i + j] | currentCombo = split_s[s_len + i + j - 1] .. " + " .. split_s[s_len + i + j] | ||
end | end | ||
-- generate_IPA: mw.log("Testing " .. currentCombo) | -- generate_IPA: mw.log("Testing " .. currentCombo) | ||
-- | |||
if getData[split_s[s_len + i + j]] then | if getData[split_s[s_len + i + j]] then | ||
getData = getData[split_s[s_len + i + j]] | getData = getData[split_s[s_len + i + j]] | ||
Line 480: | Line 504: | ||
-- Resolution of [u], [ù] and [ū] -- | -- Resolution of [u], [ù] and [ū] -- | ||
if p_current == "u" then | if p_current == "u" then | ||
mw.log("[u] found in position " .. i .. ".") | mw.log("[u] found in position " .. i .. ". Testing for resolution.") | ||
if consonant[p_next] then | if consonant[p_next] then | ||
if glide[p_next2] then | if glide[p_next2] then | ||
Line 486: | Line 510: | ||
mw.log("ɤCj!V environment identified.") | mw.log("ɤCj!V environment identified.") | ||
p_Resolve("ɤ") | p_Resolve("ɤ") | ||
else | |||
mw.log("No resolution needed.") | |||
end | end | ||
elseif not vowel[p_next2] and not glide[p_next2] then | elseif not vowel[p_next2] and not glide[p_next2] then | ||
mw.log("ɤC!V environment identified.") | mw.log("ɤC!V environment identified.") | ||
p_Resolve("ɤ") | p_Resolve("ɤ") | ||
else | |||
mw.log("No resolution needed.") | |||
end | end | ||
else | |||
mw.log("No resolution needed.") | |||
end | end | ||
elseif p_current == "ù" or p_current == "ū" then | elseif p_current == "ù" or p_current == "ū" then | ||
Line 550: | Line 580: | ||
end | end | ||
end | end | ||
Line 710: | Line 736: | ||
p_RemoveNext() | p_RemoveNext() | ||
mw.log("Geminate [" .. p_current .. "] removed in final position at position " .. i .. ".") | mw.log("Geminate [" .. p_current .. "] removed in final position at position " .. i .. ".") | ||
end | end | ||
Line 755: | Line 777: | ||
end | end | ||
mw.log("————— | mw.log("————— BUILDING SYLLABLES —————") | ||
-- division into syllables -- | -- division into syllables -- | ||
Line 775: | Line 797: | ||
mw.log("Syllable " .. syllable_no .. " registered:") | mw.log("Syllable " .. syllable_no .. " registered:") | ||
logSyllable() | logSyllable() | ||
mw.log("===== | mw.log("====================") | ||
syllable_no = syllable_no + 1 | syllable_no = syllable_no + 1 | ||
working_syllable = { | working_syllable = { | ||
Line 790: | Line 812: | ||
syllables[syllable_no] = p_current | syllables[syllable_no] = p_current | ||
table.remove(working_phones, 1) | table.remove(working_phones, 1) | ||
mw.log("Boundary syllable " .. syllable_no .. " registered: '" .. p_current .. "' | mw.log("Boundary syllable " .. syllable_no .. " registered: '" .. p_current .. "'\n====================") | ||
syllable_no = syllable_no + 1 | syllable_no = syllable_no + 1 | ||
end | end | ||
Line 813: | Line 835: | ||
end | end | ||
table.remove(working_phones, 1) | table.remove(working_phones, 1) | ||
-- mw.log("Current working syllable:") | |||
-- logSyllable() | |||
logSyllable() | |||
if #working_phones == 0 then | if #working_phones == 0 then | ||
Line 822: | Line 843: | ||
end | end | ||
end | end | ||
if consonant[p_current] then | if consonant[p_current] then | ||
Line 875: | Line 893: | ||
end | end | ||
mw.log(" | mw.log("STRING EXHAUSTED\n====================") | ||
return syllables | |||
end | |||
function tag_syllables(syllables) | |||
mw.log("————— TAGGING SYLLABLES —————") | |||
local syl_count = #syllables | |||
for i = 1, syl_count do | |||
local syllable = syllables[i] | |||
local function tag_syllable(tag, value) | |||
syllables[i][tag] = value | |||
mw.log("syllables[" .. i .. "][" .. tag .. "] = " .. tostring(value) ) | |||
end | |||
-- tag checked syllables -- | |||
if type(syllable) == "table" then | |||
if syllable["coda"] == nil then | |||
tag_syllable("checked", false) | |||
else | |||
tag_syllable("checked", true) | |||
end | |||
-- tag long syllables -- | |||
if long[syllable["nucleus"]] then | |||
tag_syllable("long", true) | |||
else | |||
tag_syllable("long", false) | |||
end | |||
-- tag weak syllables (nucleus = [i] [ɤ]) -- | |||
if weak[syllable["nucleus"]] then | |||
tag_syllable("weak", true) | |||
else | |||
tag_syllable("weak", false) | |||
end | |||
-- tag heavy syllables (nucleus is long coda is an obstruent-initial cluster) - | |||
if syllable["coda"] then | |||
if long[syllable["nucleus"]] and affricate[syllable["coda"][1]] then | |||
tag_syllable("heavy", true) | |||
elseif long[syllable["nucleus"]] and obstruent[syllable["coda"][1]] and syllable["coda"][2] then | |||
tag_syllable("heavy", true) | |||
else | |||
tag_syllable("heavy", false) | |||
end | |||
end | |||
mw.log("—————") | |||
end | |||
end | |||
return syllables | return syllables | ||
Line 891: | Line 968: | ||
outputIPA = resolve_consonants(outputIPA, hj) | outputIPA = resolve_consonants(outputIPA, hj) | ||
outputIPA = get_syllables(outputIPA) | outputIPA = get_syllables(outputIPA) | ||
outputIPA = tag_syllables(outputIPA) | |||
-- test output only -- | -- test output only -- | ||
local test_output = "" | |||
for i = 1, #outputIPA do | for i = 1, #outputIPA do | ||
local onset = "" | local onset = "" | ||
Line 907: | Line 987: | ||
end | end | ||
test_output = test_output .. " • " .. onset .. " [ " .. outputIPA[i]["nucleus"] .. " ] " .. coda | |||
else | else | ||
test_output = test_output .. " • " .. outputIPA[i] | |||
end | end | ||
end | end | ||
mw.log(test_output) | |||
-- return outputIPA | -- return outputIPA | ||
end | end |