Module:pollasena-roots: Difference between revisions

No edit summary
Tag: Reverted
No edit summary
 
(50 intermediate revisions by the same user not shown)
Line 4: Line 4:
local m_param = require("Module:parameters")
local m_param = require("Module:parameters")
local m_param_utils = require("Module:parameter utilities")
local m_param_utils = require("Module:parameter utilities")
local m_param_utils = require("Module:parameter utilities")
local m_utils = require("Module:utilities")
local m_etym = require("Module:etymology")
local m_etym = require("Module:etymology")
local m_etym_specialized = require("Module:etymology/specialized")
local m_links = require("Module:links")
local m_links = require("Module:links")
local m_table = require("Module:table")


local gsub = mw.ustring.gsub
local gsub = mw.ustring.gsub
local PAGENAME = gsub(mw.title.getCurrentTitle().text, "%s", " ")
local NAMESPACE = mw.title.getCurrentTitle().nsText
local match = mw.ustring.match
local match = mw.ustring.match
local gmatch = mw.ustring.gmatch


local export = {}
local export = {}


local function ncategories(categories)
local wasc_suffixes = m_table.listToSet {
local out_categories = {}
"-ati", "-cosc", "-e", "-ekan", "-i", "-ila", "-kan",
for key, cat in ipairs(categories) do
"-la", "-osc", "-otl", "-que", "-scati", "-si", "-tl",
out_categories[key] = "[[Category:" .. cat .. "]]"
}
 
local function get_single_args(args, index)
local single = {}
for k, v in pairs(args) do
if type(v) == "table" and v.maxindex then
if v[index] ~= nil then
single[k] = v[index]
end
else
single[k] = v
end
end
end
 
return single
return NAMESPACE == "Template" and "" or table.concat(out_categories, "")
end
end


local function link(lang, term, alt)
function export.parse_args(parent_args, dest_code, ancestor_codes, extra_params)
local natlang = lang:getWikidataItem() or false
local param_mods = m_param_utils.construct_param_mods({{group = {"link", "q", "l"}}})
-- true if the language declaration has a wikidata item, a marginal amount of conlangs have it
local params = extra_params or {}
params.nocap = {type = "boolean"} -- no capital letter
params.nocat = {type = "boolean"} -- no categories
params.p = {} -- borrowing process
if lang:hasType("reconstructed") and not term:match("^%*") then
local termarg_index
term = "*" .. term
if parent_args.borrowing then
termarg_index = 2
params[1] = {
type = "language",
required = true,
}
else
termarg_index = 1
end
end
local data = {term = term, alt = alt or term, lang = lang, to_wikt = natlang}
return m_links.full_link(data, "term")
end
function export.getLink(frame)
local params = {}
local a = 0
if frame.args["offset"] or (frame.args["old"] or frame.args["older"]) then
for _, ancestor in ipairs(ancestor_codes) do
local offset = frame.args["old"] and 1 or frame.args["older"] and 2 or tonumber(frame.args["offset"])
local lang_options = ancestor.options or {}
for i=1,offset do
if lang_options.roots then
params[i] = {}
params[termarg_index] = {
required = not lang_options.optional,
list = true,
}
params["c"] = {
list = true,
allow_holes = true,
}
else
params[termarg_index] = {
required = not lang_options.optional,
}
if lang_options.annotated then
params["parts"] = {
sublist = true,
}
end
end
end
params[offset+1] = {list = true}
a = offset + 1
termarg_index = termarg_index + 1
else
params[1] = {list = true}
a = 1
end
end
-- exceptions
m_param_utils.augment_params_with_modifiers(params, param_mods)
params["and"], params["see"] = {}, {}
local args = require("Module:parameters").process(frame:getParent().args, params)
local args = m_param.process(parent_args, params)
 
local dest_lang = m_lang.getByCode(dest_code)
local etymologies = {}
local fam, lang = m_families.getByCode(frame.args[1]), require("Module:languages").getByCode(frame.args[2])
termarg_index = parent_args.borrowing and 2 or 1
local proto = fam:getProtoLanguage()
local cats = {}
for _, ancestor in ipairs(ancestor_codes) do
local code = ancestor.code
local lang_options = ancestor.options or {}
local ancestor_lang = m_lang.getByCode(code)
local raw_val = parent_args[termarg_index] or parent_args[tostring(termarg_index)]
if lang_options.optional and (raw_val == nil or raw_val == "") then
termarg_index = termarg_index + 1
else
local terms
local separator = ""
if lang_options.roots then
local items = m_param_utils.parse_list_with_inline_modifiers_and_separate_params({
processed_args = args,
param_mods = param_mods,
termarg = termarg_index,
lang = ancestor_lang,
})
terms = {}
local root_index = 1
local last_term = ""
for _, item in ipairs(items) do
if item.alt and not match(item.alt, "^%*") and ancestor_lang:hasType("reconstructed") then
item.alt = "*" .. item.alt
end
if item.term == "-" or item.term == "+" then
separator = item.term
elseif item.term then
if root_index > 1 and last_term ~= "+" then -- only subsequent asterisks afer space
item.alt = gsub(item.alt or item.term, "^%*", "")
end
table.insert(terms, item)
local function one_asterisk(str)
return "*" .. gsub(str, "^*+", "")
end
local cat_term = one_asterisk(args.c[root_index] or item.term)
if code == "wasc" then -- Wascotl root and suffix handling
local suffix = match(cat_term, "^*[%w']+(%-[%w']+)$")
if wasc_suffixes[suffix] then
cat_term = gsub(cat_term, suffix, "-")
end
end
table.insert(cats, dest_lang:getCanonicalName() .. " terms derived from the " .. ancestor_lang:getCanonicalName() .. " root " .. cat_term)
root_index = root_index + 1
end
last_term = item.term
end
if not terms[1] then
terms[1] = { lang = ancestor_lang }
end
else
local single_args = get_single_args(args, termarg_index)
local parsed = m_param_utils.parse_term_with_inline_modifiers_and_separate_params({
processed_args = single_args,
param_mods = param_mods,
termarg = termarg_index,
lang = ancestor_lang,
})


local links = {}; local categories = {}; local alts = {};
terms = parsed.terms or {}
-- WIP
if not terms[1] then
for i, item in ipairs(args[a]) do
if parsed.term then
if item == "+" then
terms[1] = parsed
table.insert(links," ")
else
elseif item == "-" then
terms[1] = { lang = ancestor_lang }
table.insert(links, item)
end
elseif item:find("<") and not item:find("^[^<]*<[a-z]*[^a-z:]") then
end
local run = m_put.parse_balanced_segment_run(item, "<", ">")
local orig_param = a + i - 1
local function parse_err(msg)
error(msg .. ": " .. orig_param .. "= " .. table.concat(run))
end
end
local term = run[1]:gsub("%*","")
 
local etymology
for j = 2, #run - 1, 2 do
if lang_options.borrowed then
local modtext = run[j]:match("^<(.*)>$")
etymology = m_etym_specialized.specialized_borrowing{
local prefix, arg = modtext:match("^([a-z]+):(.*)$")
bortype = args.p or "b",
lang = dest_lang,
sources = {ancestor_lang},
terms = terms,
sort_key = args.sort,
nocat = args.nocat,
conj = lang_options.roots and separator or nil,
nocap = args.mid or args.old or args.nocap,
}
else
etymology = m_etym.format_inherited{
lang = dest_lang,
terms = terms,
sort_key = args.sort,
nocat = args.nocat,
conj = lang_options.roots and separator or nil,
}
etymology = "from " .. etymology
end
if lang_options.annotated and args.parts then
local referrals = {}
for _, part in ipairs(args.parts) do
local referral = m_links.full_link({
lang = ancestor_lang,
term = part,
}, "term")
table.insert(referrals, referral)
end
if item:match("><") then
etymology = etymology .. " (see " .. m_table.serialCommaJoin(referrals) .. ")"
if prefix == "a" then
table.insert(links, link(proto, term, arg))
table.insert(alts, arg)
elseif prefix == "c" then
table.insert(categories, lang:getCanonicalName() .. " terms from " .. proto:getCanonicalName() .. " *" .. arg)
table.insert(alts, term)
end
elseif prefix == "a" then
table.insert(links, link(proto, term, arg))
table.insert(categories, lang:getCanonicalName() .. " terms from " .. proto:getCanonicalName() .. " *" .. term)
table.insert(alts, arg)
elseif prefix == "c" then
table.insert(links, link(proto, term))
table.insert(categories, lang:getCanonicalName() .. " terms from " .. proto:getCanonicalName() .. " *" .. arg)
table.insert(alts, term)
end
end
end
else
table.insert(links, link(proto, args[a][i]))
table.insert(etymologies, etymology)
table.insert(categories, lang:getCanonicalName() .. " terms from " .. proto:getCanonicalName() .. " *" .. args[a][i])
termarg_index = termarg_index + 1
table.insert(alts, args[a][i])
end
end
if i~=1 and links[i-1] == "-" then alts[i] = links[i]:gsub("^%*","") end
--if i~=1 and links[i-1] ~= "&nbsp;" then links[i] = links[i]:gsub("(%|?)%*%-","%1-") end
--if i~=1 and alts[i-1]:match("%-$") then links[i] = links[i]:gsub("%|%*","|") end
end
end
return table.concat(links) .. ncategories(categories)
local categories = m_utils.format_categories(cats, dest_lang)
end
 
--- Parse one positional template argument per ancestor language.
-- The i-th entry of `ancestor_specs` is matched with the raw value
-- `parent_args[i]`, which is passed to the parameter-utilities parser as its
-- local parameter 1.
-- @param parent_args raw template arguments (indexed positionally and by name)
-- @param ancestor_specs sequence of tables; the fields read here are `code`,
--   `optional` and `roots`
-- @return a sequence with one `{lang = ..., terms = ...}` table per spec, and
--   a table holding the raw `nocat` / `nocap` argument values
local function parse_args(parent_args, ancestor_specs)
	local modifier_spec = m_param_utils.construct_param_mods({
		{ group = {"link", "q", "l"} },
	})

	local per_ancestor = {}
	local shared_opts = {}
	shared_opts.nocat = parent_args.nocat
	shared_opts.nocap = parent_args.nocap

	for position, ancestor in ipairs(ancestor_specs) do
		local ancestor_lang = m_lang.getByCode(ancestor.code)

		-- Parameter spec for the single term slot of this ancestor.
		local term_param = {}
		term_param.required = not ancestor.optional
		term_param.list = ancestor.roots and "term"
		term_param.allow_holes = ancestor.roots or nil

		local parse_result = m_param_utils.parse_term_with_inline_modifiers_and_separate_params({
			params = { [1] = term_param },
			param_mods = modifier_spec,
			-- Re-key positional argument `position` as local argument 1.
			raw_args = { [1] = parent_args[position] },
			termarg = 1,
			lang = ancestor_lang,
			sc = "sc.default",
		})

		local term_list = parse_result.terms
		if not term_list[1] then
			-- No term was given: insert a placeholder that carries only the language.
			term_list[1] = { lang = ancestor_lang }
		end

		per_ancestor[position] = { lang = ancestor_lang, terms = term_list }
	end

	return per_ancestor, shared_opts
end
 
--- Build the etymology sentence from the parsed ancestor entries.
-- Every entry that has at least one term is formatted with
-- `m_etym.format_derived`; the pieces are then chained as
-- "From A, from B." (or "from A, from B." when `opts.nocap` is set).
-- @param parsed sequence of tables with `lang` and `terms` fields
-- @param opts table; `nocat` is forwarded to the formatter, and a truthy
--   `nocap` selects a lowercase initial "from"
-- @param dest_lang language object passed to the formatter as `lang`
-- @return the assembled sentence, always terminated with "."
local function concat_etymologies(parsed, opts, dest_lang)
	local chunks = {}

	for _, item in ipairs(parsed) do
		-- Entries without any term are skipped.
		if item.terms and item.terms[1] then
			table.insert(chunks, m_etym.format_derived({
				lang = dest_lang,
				sources = { item.lang },
				terms = item.terms,
				nocat = opts.nocat,
				template_name = "der",
			}))
		end
	end

	-- A stray mid-block `return etymologies, args, ...` used to sit here. It
	-- referenced names that do not exist in this function, and a `return`
	-- that is not the last statement of its block is a Lua syntax error.
	local capital = opts.nocap and "f" or "F"
	local text = capital .. "rom " .. table.concat(chunks, ", from ")
	return text .. "."
end
 
--- Template entry point that builds the etymology text for language code "qsc".
-- Positional argument 1 is the required "sekh" term; positional argument 2 is
-- the optional "wasc" slot, which is flagged as a root list.
-- @param frame Scribunto frame; the arguments are read from its parent frame
-- @return the string produced by `concat_etymologies`
function export.qsc(frame)
	local template_args = frame:getParent().args
	local target_lang = m_lang.getByCode("qsc")

	local sekh_spec = { code = "sekh", optional = false }
	local wasc_spec = { code = "wasc", optional = true, roots = true }

	local parsed, opts = parse_args(template_args, { sekh_spec, wasc_spec })
	return concat_etymologies(parsed, opts, target_lang)
end
 
--- Template entry point that builds the etymology text for language code "lyti".
-- The ancestors are, in positional order, "lyti-mid", "lyti-old" and the
-- language named by the `source` argument. The first two are optional unless
-- the `mid` / `old` arguments are supplied.
--
-- The previous body called `parse_args(parent_args, "lyti", ancestor_codes)`
-- and `concat_etymologies(parent_args, etymologies)`, which match neither
-- helper's signature: `parse_args` would have received the string "lyti" as
-- its spec list. It also nested the flags under `options`, while `parse_args`
-- reads `optional` directly from each spec. The calls now mirror `export.qsc`.
-- NOTE(review): "lyti" is taken as the destination language code because it
-- was the second argument of the old call; confirm this is the intended code.
-- @param frame Scribunto frame; the arguments are read from its parent frame
-- @return the string produced by `concat_etymologies`
function export.lyti(frame)
	local parent_args = frame:getParent().args
	local dest_lang = m_lang.getByCode("lyti")

	-- Flat spec shape, as read by parse_args (`code`, `optional`, `roots`).
	local ancestor_specs = {
		{ code = "lyti-mid", optional = not parent_args.mid },
		{ code = "lyti-old", optional = not parent_args.old },
		{ code = parent_args.source, optional = false },
	}

	local parsed, opts = parse_args(parent_args, ancestor_specs)
	return concat_etymologies(parsed, opts, dest_lang)
end


return export
return export