Module:pollasena-roots: Difference between revisions

From Linguifex
Jump to navigation Jump to search
No edit summary
No edit summary
 
(20 intermediate revisions by the same user not shown)
Line 1: Line 1:
local m_put = require("Module:parse utilities")
local m_put = require("Module:parse utilities")
local m_families = require("Module:families")
local m_families = require("Module:families")
local m_languages = require("Module:languages")
local m_lang = require("Module:languages")
local m_param = require("Module:parameters")
local m_param = require("Module:parameters")
local m_param_utils = require("Module:parameter utilities")
local m_param_utils = require("Module:parameter utilities")
local m_etym = require("Module:etymology")
local m_links = require("Module:links")


local gsub = mw.ustring.gsub
local gsub = mw.ustring.gsub
Line 13: Line 15:
local export = {}
local export = {}


local function getLanguage(code)
local function lang_from_code(...)
return require("Module:languages").getByCode(code)
return m_lang.getByCode(...)
end
end


Line 34: Line 36:
end
end
local data = {term = term, alt = alt or term, lang = lang, to_wikt = natlang}
local data = {term = term, alt = alt or term, lang = lang, to_wikt = natlang}
return require('Module:links').full_link(data, "term")
return m_links.full_link(data, "term")
end
end


Line 113: Line 115:
end
end


local function parse_etym_args(parent_args, base_params)
local function get_single_args(args, index)
local single = {}
for k, v in pairs(args) do
if type(v) == "table" and v.maxindex then
if v[index] ~= nil then
single[k] = v[index]
end
else
single[k] = v
end
end
return single
end
 
local function parse_args(parent_args, dest_code, ancestor_codes, extra_params)
local param_mods = m_param_utils.construct_param_mods({{group = {"link", "q", "l"}}})
local param_mods = m_param_utils.construct_param_mods({{group = {"link", "q", "l"}}})
local params = extra_params or {}
params.nocap = {type = "boolean"}
params.nocat = {type = "boolean"}
local termarg_index = 1
for _, ancestor in ipairs(ancestor_codes) do
local lang_options = ancestor.options or {}
if lang_options.roots then
params[termarg_index] = {
required = not lang_options.optional,
list = true,
allow_holes = true,
}
else
params[termarg_index] = {
required = not lang_options.optional,
}
end
termarg_index = termarg_index + 1
end
m_param_utils.augment_params_with_modifiers(params, param_mods)
local args = m_param.process(parent_args, params)


local terms, args = m_param_utils.parse_term_with_inline_modifiers_and_separate_params({
local dest_lang = m_lang.getByCode(dest_code)
params = base_params,
local etymologies = {}
param_mods = param_mods,
raw_args = parent_args,
termarg_index = 1
termarg = 1,
for _, ancestor in ipairs(ancestor_codes) do
lang = function(args)
local code = ancestor.code
return args[sourcearg][#args[sourcearg]]
local lang_options = ancestor.options or {}
end,
local ancestor_lang = m_lang.getByCode(code)
sc = "sc",
})
local terms
-- If term param 3= is empty, there will be no terms in terms.terms. To facilitate further code and for
local separator = ""
-- compatibility,, insert one. It will display as <small>[Term?]</small>.
 
if not terms.terms[1] then
if lang_options.roots then
terms.terms[1] = {
local items = m_param_utils.parse_list_with_inline_modifiers_and_separate_params({
lang = args[sourcearg][#args[sourcearg]],
processed_args = args,
sc = args.sc,
param_mods = param_mods,
}
termarg = termarg_index,
lang = ancestor_lang,
})
terms = {}
local root_index = 1
for _, item in ipairs(items) do
if item.term == "-" or item.term == "+" then
separator = item.term
elseif item.term then
if root_index > 1 and separator == "-" then -- no asterisk after hyphen
if not item.alt then
item.alt = item.term:gsub("^%*", "")
else
item.alt = item.alt:gsub("^%*", "")
end
item.no_alt_ast = true
end
table.insert(terms, item)
root_index = root_index + 1
end
end
else
local single_args = get_single_args(args, termarg_index)
local parsed = m_param_utils.parse_term_with_inline_modifiers_and_separate_params({
processed_args = single_args,
param_mods = param_mods,
termarg = termarg_index,
lang = ancestor_lang,
})
 
terms = parsed.terms or {}
if not terms[1] then
if parsed.term then
terms[1] = parsed
else
terms[1] = { lang = ancestor_lang }
end
end
end
 
local etymology = m_etym.format_derived({
lang = dest_lang,
sources = { ancestor_lang },
terms = terms,
conj = lang_options.roots and separator or nil,
nocat = args.nocat,
template_name = "derived",
})
 
table.insert(etymologies, etymology)
termarg_index = termarg_index + 1
end
end


return terms.terms, args
return etymologies, args
end
end


local function concat_etymologies(args, etymologies)
local capital = args.nocap and "f" or "F"
return capital .. "rom " .. table.concat(etymologies, ", from ") .. "."
end


local function parse_args(parent_args, dest_code, ancestor_codes)
function export.qsc(frame)
local params = {
local parent_args = frame:getParent().args
[1] = {
required = true,
local ancestor_codes = {
list = true,
{ code = "sekh" },
allow_holes = true,
{ code = "wasc", options = {optional = true, roots = true } }
},
["nocat"] = {type = "boolean"},
}
}
for code, lang_options in ipairs() do
local evolution, args = parse_args(parent_args, "qsc", ancestor_codes)
end
return parse_etym_args(parent_args, params)
return concat_etymologies(args, evolution)
end
end


function export.qsc(frame)
function export.lyti(frame)
local parent_args = frame:getParent().args
local source_code = parent_args.source or "und"
local ancestor_codes = {
local ancestor_codes = {
["sekh"] = {},
{ code = "lyti-mid", options = {optional = not parent_args.mid} },
["wasc"] = {optional = true}
{ code = "lyti-old", options = {optional = not parent_args.old} },
{ code = source_code, options = {} },
}
local extra_params = {
mid = {type = "boolean"},
old = {type = "boolean"},
source = {},
}
}
local parent_args = frame:getParent().args
local evolution, args = parse_args(parent_args, "lyti", ancestor_codes, extra_params)
local terms, args = parse_args(parent_args, "qsc", ancestor_codes)
 
return concat_etymologies(args, evolution)
end
end


return export
return export

Latest revision as of 01:11, 10 April 2026


This module implements the inheritance templates for Pollasena languages: {{qsc-inh}}, {{sekh-inh}}, {{gwax-wasc}}, {{soky-inh}}. It has since been generalized to cover non-Pollasena languages as well: {{guim-inh}}.


local m_put = require("Module:parse utilities")
local m_families = require("Module:families")
local m_lang = require("Module:languages")
local m_param = require("Module:parameters")
local m_param_utils = require("Module:parameter utilities")
local m_etym = require("Module:etymology")
local m_links = require("Module:links")

-- Local aliases for functions of Scribunto's mw.ustring library.
local gsub = mw.ustring.gsub
-- `.text` of the current page title, with every character matching "%s"
-- replaced by "&nbsp;". Only the first return value of gsub is kept.
local PAGENAME = gsub(mw.title.getCurrentTitle().text, "%s", "&nbsp;")
-- `.nsText` of the current page title; ncategories compares it against "Template".
local NAMESPACE = mw.title.getCurrentTitle().nsText
local match = mw.ustring.match
local gmatch = mw.ustring.gmatch

local export = {}

-- Forwards all of its arguments to Module:languages' getByCode and returns
-- whatever that call returns.
local function lang_from_code(...)
	local get_by_code = m_lang.getByCode
	return get_by_code(...)
end

-- Turns a sequence of category names into concatenated "[[Category:...]]"
-- wikitext. Returns the empty string when the current namespace is "Template".
local function ncategories(categories)
	local wrapped = {}
	for _, name in ipairs(categories) do
		wrapped[#wrapped + 1] = "[[Category:" .. name .. "]]"
	end

	if NAMESPACE == "Template" then
		return ""
	end
	return table.concat(wrapped, "")
end

-- Builds a formatted link to `term` in `lang` through Module:links' full_link.
--   lang: language object (getWikidataItem and hasType are called on it)
--   term: the term to link; gets a leading "*" when the language has the
--         "reconstructed" type and the term does not already start with one
--   alt:  optional display text; falls back to the (possibly starred) term
local function link(lang, term, alt)
	-- The language's Wikidata item if it has one, otherwise false; only a
	-- marginal number of conlangs have one.
	local wikidata_item = lang:getWikidataItem() or false

	if lang:hasType("reconstructed") and term:sub(1, 1) ~= "*" then
		term = "*" .. term
	end

	return m_links.full_link({
		term = term,
		alt = alt or term,
		lang = lang,
		to_wikt = wikidata_item,
	}, "term")
end

-- Template entry point: links a run of proto-language roots and categorises
-- the page by them.
--
-- Invocation arguments (frame.args):
--   [1]     family code; its proto-language is the language the roots link to
--   [2]     code of the language used in the category names
--   old     if set, the root list starts at parent parameter 2
--   older   if set, the root list starts at parent parameter 3
--   offset  number of leading parent parameters to skip before the root list
--
-- Each item of the root list is one of:
--   "+"            emits "&nbsp;"
--   "-"            emits a literal hyphen
--   root<a:alt>    links the root with `alt` as display text
--   root<c:cat>    links the root but categorises under `cat`
--   root           plain root, linked and categorised as is
--
-- Returns the concatenated links followed by the category wikitext.
function export.getLink(frame)
	local params = {}
	local a = 0

	if frame.args["offset"] or (frame.args["old"] or frame.args["older"]) then
		local offset = frame.args["old"] and 1 or frame.args["older"] and 2 or tonumber(frame.args["offset"])
		if not offset then
			-- Previously this surfaced as "'for' limit must be a number".
			error("Invalid value for offset=: " .. tostring(frame.args["offset"]))
		end

		for i = 1, offset do
			params[i] = {}
		end
		params[offset + 1] = {list = true}
		a = offset + 1
	else
		params[1] = {list = true}
		a = 1
	end

	-- exceptions
	params["and"], params["see"] = {}, {}

	-- Use the modules already loaded at the top of the file.
	local args = m_param.process(frame:getParent().args, params)

	local fam, lang = m_families.getByCode(frame.args[1]), m_lang.getByCode(frame.args[2])
	local proto = fam:getProtoLanguage()

	local links, categories, alts = {}, {}, {}

	-- Category name for a root. Kept as a closure so the language names are
	-- looked up only when a category is actually emitted.
	local function root_category(root)
		return lang:getCanonicalName() .. " terms from " .. proto:getCanonicalName() .. " *" .. root
	end

	-- WIP
	for i, item in ipairs(args[a]) do
		if item == "+" then
			table.insert(links, "&nbsp;")
		elseif item == "-" then
			table.insert(links, item)
		elseif item:find("<") and not item:find("^[^<]*<[a-z]*[^a-z:]") then
			local run = m_put.parse_balanced_segment_run(item, "<", ">")
			local term = run[1]:gsub("%*", "")
			-- More than one modifier on the same item (e.g. root<a:x><c:y>):
			-- each modifier then contributes only its own part.
			local chained = item:match("><")

			-- Even positions of `run` hold the "<...>" modifier segments.
			for j = 2, #run - 1, 2 do
				local modtext = run[j]:match("^<(.*)>$")
				local prefix, arg = modtext:match("^([a-z]+):(.*)$")

				if chained then
					if prefix == "a" then
						table.insert(links, link(proto, term, arg))
						table.insert(alts, arg)
					elseif prefix == "c" then
						table.insert(categories, root_category(arg))
						table.insert(alts, term)
					end
				elseif prefix == "a" then
					table.insert(links, link(proto, term, arg))
					table.insert(categories, root_category(term))
					table.insert(alts, arg)
				elseif prefix == "c" then
					table.insert(links, link(proto, term))
					table.insert(categories, root_category(arg))
					table.insert(alts, term)
				end
			end
		else
			table.insert(links, link(proto, item))
			table.insert(categories, root_category(item))
			table.insert(alts, item)
		end

		-- An item may add no link at all (unknown modifier prefix, or only
		-- <c:...> modifiers in a chained item), so links[i] can be nil here.
		local current = links[i]
		if i ~= 1 and links[i - 1] == "-" and current then
			alts[i] = current:gsub("^%*", "")
		end
		--if i~=1 and links[i-1] ~= "&nbsp;" then links[i] = links[i]:gsub("(%|?)%*%-","%1-") end
		--if i~=1 and alts[i-1]:match("%-$") then links[i] = links[i]:gsub("%|%*","|") end
	end

	return table.concat(links) .. ncategories(categories)
end

-- Projects a processed-arguments table onto one list position.
--   args:  table of argument values
--   index: the list position to extract
-- Values that are tables with a truthy `maxindex` field are replaced by their
-- element at `index` (and dropped when that element is nil); every other value
-- is copied through unchanged. Returns a new table; `args` is not modified.
local function get_single_args(args, index)
	local picked = {}
	for name, value in pairs(args) do
		local is_list = type(value) == "table" and value.maxindex
		if not is_list then
			picked[name] = value
		else
			local entry = value[index]
			if entry ~= nil then
				picked[name] = entry
			end
		end
	end
	return picked
end

-- Builds the Module:parameters spec: a copy of `extra_params`, plus nocap and
-- nocat, plus one positional parameter per ancestor. The caller's
-- `extra_params` table is left untouched.
local function build_term_params(ancestor_codes, extra_params)
	local params = {}
	for name, spec in pairs(extra_params or {}) do
		params[name] = spec
	end
	params.nocap = {type = "boolean"}
	params.nocat = {type = "boolean"}

	for termarg_index, ancestor in ipairs(ancestor_codes) do
		local lang_options = ancestor.options or {}
		local spec = {required = not lang_options.optional}
		if lang_options.roots then
			-- A root list takes this parameter and the ones after it.
			spec.list = true
			spec.allow_holes = true
		end
		params[termarg_index] = spec
	end

	return params
end

-- Parses a list-type ("roots") parameter. Returns the term objects and the
-- last "-" / "+" separator item seen ("" if there was none).
local function collect_root_terms(args, param_mods, termarg_index, ancestor_lang)
	local items = m_param_utils.parse_list_with_inline_modifiers_and_separate_params({
		processed_args = args,
		param_mods = param_mods,
		termarg = termarg_index,
		lang = ancestor_lang,
	})

	local terms = {}
	local separator = ""
	for _, item in ipairs(items) do
		if item.term == "-" or item.term == "+" then
			separator = item.term
		elseif item.term then
			if #terms > 0 and separator == "-" then -- no asterisk after hyphen
				item.alt = ((item.alt or item.term):gsub("^%*", ""))
				item.no_alt_ast = true
			end
			table.insert(terms, item)
		end
	end

	return terms, separator
end

-- Parses a single-term parameter. Always returns a list with at least one
-- entry; when no term was given the entry carries only the language.
local function collect_single_term(args, param_mods, termarg_index, ancestor_lang)
	local parsed = m_param_utils.parse_term_with_inline_modifiers_and_separate_params({
		processed_args = get_single_args(args, termarg_index),
		param_mods = param_mods,
		termarg = termarg_index,
		lang = ancestor_lang,
	})

	local terms = parsed.terms or {}
	if not terms[1] then
		terms[1] = parsed.term and parsed or { lang = ancestor_lang }
	end
	return terms
end

-- Processes the template arguments and formats one "derived" etymology
-- fragment per ancestor.
--   parent_args:    raw template arguments
--   dest_code:      code of the language the entry is in
--   ancestor_codes: sequence of { code = <language code>, options = { optional
--                   = <bool>, roots = <bool> } }; the n-th ancestor reads
--                   positional parameter n, and `roots` makes it a list
--   extra_params:   optional additional Module:parameters specs (not modified)
-- Returns the list of formatted fragments and the processed arguments.
local function parse_args(parent_args, dest_code, ancestor_codes, extra_params)
	local param_mods = m_param_utils.construct_param_mods({{group = {"link", "q", "l"}}})

	local params = build_term_params(ancestor_codes, extra_params)
	m_param_utils.augment_params_with_modifiers(params, param_mods)

	local args = m_param.process(parent_args, params)

	local dest_lang = m_lang.getByCode(dest_code)
	local etymologies = {}

	for termarg_index, ancestor in ipairs(ancestor_codes) do
		local lang_options = ancestor.options or {}
		local ancestor_lang = m_lang.getByCode(ancestor.code)

		-- `conj` stays nil for single-term ancestors.
		local terms, conj
		if lang_options.roots then
			terms, conj = collect_root_terms(args, param_mods, termarg_index, ancestor_lang)
		else
			terms = collect_single_term(args, param_mods, termarg_index, ancestor_lang)
		end

		local etymology = m_etym.format_derived({
			lang = dest_lang,
			sources = { ancestor_lang },
			terms = terms,
			conj = conj,
			nocat = args.nocat,
			template_name = "derived",
		})

		table.insert(etymologies, etymology)
	end

	return etymologies, args
end

-- Joins etymology fragments into one sentence: "From A, from B."
--   args:        table; a truthy `nocap` field makes the first word lowercase
--   etymologies: sequence of already formatted fragments
local function concat_etymologies(args, etymologies)
	local first_letter
	if args.nocap then
		first_letter = "f"
	else
		first_letter = "F"
	end

	local chain = table.concat(etymologies, ", from ")
	return first_letter .. "rom " .. chain .. "."
end

-- Template entry point for "qsc": a required "sekh" term (parameter 1)
-- followed by an optional list of "wasc" roots (parameter 2 onwards).
function export.qsc(frame)
	local chain = {
		{ code = "sekh" },
		{ code = "wasc", options = { optional = true, roots = true } },
	}

	local etymologies, args = parse_args(frame:getParent().args, "qsc", chain)
	return concat_etymologies(args, etymologies)
end

-- Template entry point for "lyti". Positional parameters 1, 2 and 3 are the
-- "lyti-mid" term, the "lyti-old" term and the source-language term.
--   mid=     makes parameter 1 required
--   old=     makes parameter 2 required
--   source=  language code of the ultimate source; defaults to "und"
function export.lyti(frame)
	local parent_args = frame:getParent().args

	-- Scribunto passes `|name=` as the empty string, which is truthy in Lua.
	-- Treat it as "not given" so an empty source= falls back to "und" and an
	-- empty mid= / old= does not make a term required.
	-- NOTE(review): values such as "0" or "no" still count as given here,
	-- although the boolean params below may read them as false; confirm.
	local function given(name)
		local value = parent_args[name]
		if value == nil or value == "" then
			return nil
		end
		return value
	end

	local source_code = given("source") or "und"

	local ancestor_codes = {
		{ code = "lyti-mid", options = {optional = not given("mid")} },
		{ code = "lyti-old", options = {optional = not given("old")} },
		{ code = source_code, options = {} },
	}

	local extra_params = {
		mid = {type = "boolean"},
		old = {type = "boolean"},
		source = {},
	}

	local evolution, args = parse_args(parent_args, "lyti", ancestor_codes, extra_params)

	return concat_etymologies(args, evolution)
end

return export