Module:mg-pron: Difference between revisions

From Linguifex
Jump to navigation Jump to search
No edit summary
No edit summary
Line 26: Line 26:
}
}


local function syllabify(term)
local function syllabify(term, pos)
term = gsub(term, "(" .. consonants .. "*)(" .. vowels .. "*)", "%1%2·")
term = gsub(term, "(" .. consonants .. "*)(" .. vowels .. "*)", "%1%2·")
term = gsub(term, "··", "·"); term = gsub(term, "·$", "")
term = gsub(term, "··", "·"); term = gsub(term, "·$", "")
Line 33: Line 33:
term = gsub(term, "·(" .. consonants .. ")·", "%1·")
term = gsub(term, "·(" .. consonants .. ")·", "%1·")
local syll = split(term, "·")
local monosyll = {["n"] = "ˈ", ["pron"] = "", ["particle"] = "(ˈ)", ["prep"] = "(ˈ)", ["conj"] = "(ˈ)"}
if #syll == 1 then
syll[1] = monosyll[pos] .. syll[1]
if monosyll[pos] == "ˈ" and match(syll[1], "[aá]") then gsub(syll[1], "([aá])", "%1(ː)") end
else
syll[#syll - 1] = "ˈ" .. syll[#syll - 1]
if match(syll[#syll - 1], "[aá]") then gsub(syll[#syll - 1], "([aá])", "%1ː") end
end
return term
return term
end
end

Revision as of 16:55, 25 August 2021



local sub = mw.ustring.sub
local find = mw.ustring.find
local match = mw.ustring.match
local gmatch = mw.ustring.gmatch
local gsub = mw.ustring.gsub
local u = mw.ustring.char
local split = mw.text.split
local gsplit = mw.text.gsplit

-- Combining diacritic built from its code point. In the visible part of this
-- module it is only mentioned inside a commented-out entry of `rules`.
local NASAL = u(0x0303) -- COMBINING TILDE, ̃

-- Character classes written as pattern sets. `consonants` and `vowels` are
-- spliced into the patterns used by syllabify; `velar` is not referenced
-- anywhere in the visible part of this module.
local velar = "[kɡɫ]"
local consonants = "[bkdhjlmnɲprɾstʃθβðɡɣzʧɫʎ]"
-- NOTE(review): syllabify also tests syllables for "á", which this set does
-- not contain — confirm whether accented vowels should be listed here.
local vowels = "[aeiou]"

-- Tell whether two strings start with the same character once both have been
-- put into NFD form (so a letter and its accented variant compare equal).
-- Always returns a boolean.
local function same(foo, bar)
	local head_foo = match(mw.ustring.toNFD(foo), "^.")
	local head_bar = match(mw.ustring.toNFD(bar), "^.")
	return head_foo == head_bar
end

-- Table of public functions; it is what the module returns on its last line.
local export = {}

-- Ordered {pattern, replacement} pairs. export.crux runs them one after the
-- other with gsub on the lower-cased term, before syllabification.
-- Order matters: "ch" has to be rewritten before the bare "c" entry, which
-- would otherwise turn it into "kh".
local prelims = {
	{"r", "ɾ"}, {"ch", "ʧ"}, {"qu", "k"}, {"il", "ʎ"}, {"ñ", "ɲ"}, {"g", "ɡ"}, {"c", "k"},
}

-- Stress prefix given to a one-syllable word, keyed by part of speech.
-- A part of speech that is missing here (or not supplied) gets no mark.
local monosyll_stress = {["n"] = "ˈ", ["pron"] = "", ["particle"] = "(ˈ)", ["prep"] = "(ˈ)", ["conj"] = "(ˈ)"}

--- Split a term into "·"-separated syllables and mark its stress.
-- @param term string that has already been through the `prelims` replacements
-- @param pos  optional part-of-speech key ("n", "pron", "particle", "prep",
--             "conj"); only consulted for one-syllable terms
-- @return the syllabified term: words of two or more syllables carry "ˈ" on
--         the penultimate syllable, one-syllable words carry the prefix
--         selected by `pos` (none when `pos` is nil or unknown)
local function syllabify(term, pos)
	-- Close a syllable after every run of consonants followed by a run of vowels.
	term = gsub(term, "(" .. consonants .. "*)(" .. vowels .. "*)", "%1%2·")
	-- The pass above also fires on empty matches: collapse doubled separators
	-- and drop the trailing one.
	term = gsub(term, "··", "·"); term = gsub(term, "·$", "")
	-- A syllable opening with two consonants hands the first one back to the
	-- preceding syllable.
	term = gsub(term, "·(" .. consonants .. ")(" .. consonants .. ")(" .. vowels .. "*)", "%1·%2%3")
	-- A lone consonant at the end of the word, or stranded between two
	-- separators, is attached to the preceding syllable.
	term = gsub(term, "·(" .. consonants .. ")$", "%1")
	term = gsub(term, "·(" .. consonants .. ")·", "%1·")

	local syll = split(term, "·")

	if #syll == 1 then
		-- Falling back to "" keeps an unlisted or missing part of speech from
		-- raising "attempt to concatenate a nil value".
		local mark = (pos ~= nil and monosyll_stress[pos]) or ""
		syll[1] = mark .. syll[1]
		if mark == "ˈ" then
			-- gsub returns the new string; it has to be stored to take effect.
			syll[1] = gsub(syll[1], "([aá])", "%1(ː)")
		end
	else
		local penult = #syll - 1
		local lengthened = gsub(syll[penult], "([aá])", "%1ː")
		syll[penult] = "ˈ" .. lengthened
	end

	-- Hand back the stress-marked syllables rather than the untouched input.
	return table.concat(syll, "·")
end

-- Ordered {pattern, replacement} pairs applied by export.crux after
-- syllabification.
local rules = {
	-- Two of [ɾs] facing each other across a syllable boundary. The optional
	-- "ˈ" capture lets the rule still fire when the second syllable carries the
	-- stress mark; when there is no mark the capture is "" and the output is
	-- unchanged from the stress-less form of this rule.
	-- NOTE(review): when the two consonants differ the "·" is dropped, exactly
	-- as before — confirm that this is intended.
	{"([ɾs])·(ˈ?)([ɾs])", function(s1, stress, s2)
		return same(s1, s2) and "·" .. stress .. "ʰ" .. s1 or s1 .. stress .. s2
	end},
	-- Replace the very last character when it has an entry in this table.
	{".$", {["a"] = "ɐ", ["e"] = "ɪ", ["o"] = "ʊ", --[[["n"] = NASAL]]}}
}

--- Convert one orthographic word into its phonetic transcription.
-- @param term the word as spelled; it is lower-cased first
-- @param pos  optional part-of-speech key forwarded to syllabify; callers that
--             omit it get the same call as before (syllabify receives nil)
-- @return the transcription after `prelims`, syllabification and `rules`
function export.crux(term, pos)
	term = mw.ustring.lower(term)

	-- Spelling-to-symbol replacements, in table order.
	for _, repl in ipairs(prelims) do
		term = gsub(term, repl[1], repl[2])
	end

	-- syllabify accepts a part of speech, so pass through whatever we were given.
	term = syllabify(term, pos)

	-- Adjustments that depend on syllable boundaries, in table order.
	for _, rule in ipairs(rules) do
		term = gsub(term, rule[1], rule[2])
	end

	return term
end

--- Wrap each pronunciation in a styled <span> and join the results.
-- @param items sequence of tables, each with a string field `pron`
-- @return one string holding the concatenated spans ("" for an empty sequence)
function IPA_span(items)
	local bits = {}
	for _, item in ipairs(items) do
		-- The style attribute has to be closed with a double quote before ">";
		-- leaving it open produces a malformed tag.
		bits[#bits + 1] = "<span style=\"font-size:110%;font-family:'Gentium','DejaVu Sans','Segoe UI',sans-serif\">" .. item.pron .. "</span>"
	end
	return table.concat(bits)
end

-- Put the linked "IPA (key):" label in front of the spans built by IPA_span.
function format_IPA(items)
	local label = "[[w:IPA chart|IPA]]<sup>([[IPA for Modern Gallaecian|key]])</sup>:&#32;"
	return label .. IPA_span(items)
end

-- Bracket a transcription and render it as a single labelled IPA line.
function line_format(pronunciation)
	local bracketed = '[' .. pronunciation .. ']'
	local line = format_IPA({ { pron = bracketed } })
	-- Only one entry is ever produced, so it is the whole result.
	return table.concat({ line })
end

-- Transcribe a phrase word by word: split on single spaces, run each piece
-- through export.crux, and glue the transcriptions back with spaces.
function separate_word(term)
	local transcribed = {}

	for piece in gsplit(term, " ") do
		local ipa = export.crux(piece)
		transcribed[#transcribed + 1] = ipa
	end

	return table.concat(transcribed, " ")
end

-- Template entry point. The term is chosen in this order: the first argument
-- of the #invoke frame; the sample word "gueizuñe" when the current page is in
-- the Template namespace; otherwise the first argument of the parent frame,
-- for which the page title is passed to Module:parameters as the default.
-- Returns a wikitext list item with the formatted pronunciation.
function export.show(frame)
	local title = mw.title.getCurrentTitle()
	local params = {
		[1] = { default = title.text }, -- PAGENAME
	}
	local args = require("Module:parameters").process(frame:getParent().args, params)

	local term = frame.args[1]
	if not term then
		if title.nsText == 'Template' then
			term = "gueizuñe"
		else
			term = args[1]
		end
	end

	return "* " .. line_format(separate_word(term))
end

return export