48,403
edits
No edit summary |
No edit summary |
||
| (4 intermediate revisions by the same user not shown) | |||
| Line 10: | Line 10: | ||
[[Module:scripts]] | [[Module:scripts]] | ||
[[Module:languages]] and its submodules | [[Module:languages]] and its submodules | ||
[[Module: | [[Module:gender and number]] | ||
]=] | ]=] | ||
| Line 158: | Line 158: | ||
umatch = require(string_utilities_module).match | umatch = require(string_utilities_module).match | ||
return umatch(...) | return umatch(...) | ||
end | |||
local m_headword_data | |||
local function get_headword_data() | |||
m_headword_data = load_data("Module:headword/data") | |||
return m_headword_data | |||
end | end | ||
| Line 294: | Line 300: | ||
end | end | ||
--[==[ | --[==[ | ||
Given a link target as passed to `full_link()`, get the actual page that the target refers to. This removes | Given a link target as passed to `full_link()`, get the actual page that the target refers to. This removes | ||
bold, italics, strip markets and HTML; calls `makeEntryName()` for the language in question; converts targets | bold, italics, strip markets and HTML; calls `makeEntryName()` for the language in question; converts targets | ||
beginning with `*` to the Reconstruction namespace; and converts appendix-constructed languages to the Appendix | beginning with `*` to the Reconstruction namespace; and converts appendix-constructed languages to the Appendix | ||
namespace. Returns up to three values: the page, the original target minus any anti-asterisk !! | namespace. Returns up to three values: | ||
value `true` if the target had a backslash-escaped * in it. | # the actual page to link to, or {nil} to not link to anything; | ||
# how the target should be displayed as, if the user didn't explicitly specify any display text; generally the | |||
same as the original target, but minus any anti-asterisk !!; | |||
# the value `true` if the target had a backslash-escaped * in it (FIXME: explain this more clearly). | |||
]==] | ]==] | ||
function export.get_link_page_with_auto_display(target, lang, sc, plain) | function export.get_link_page_with_auto_display(target, lang, sc, plain) | ||
| Line 363: | Line 371: | ||
-- If the link contains unexpanded template parameters, then don't create a link. | -- If the link contains unexpanded template parameters, then don't create a link. | ||
if target:match("{{{.-}}}") then | if target:match("{{{.-}}}") then | ||
-- FIXME: Should we return the original target as the default display value (second return value)? | |||
return nil | return nil | ||
end | end | ||
-- Link to appendix for reconstructed terms and terms in appendix-only languages. Plain links interpret * literally, however. | -- Link to appendix for reconstructed terms and terms in appendix-only languages. Plain links interpret * | ||
-- literally, however. | |||
if reconstructed == 1 then | if reconstructed == 1 then | ||
if lang:getFullCode() == "und" then | if lang:getFullCode() == "und" then | ||
return nil | -- Return the original target as default display value. If we don't do this, we wrongly get | ||
-- [Term?] displayed instead. | |||
return nil, orig_target | |||
end | end | ||
if not lang:hasType("conlang") then | if not lang:hasType("conlang") then | ||
target = " | target = "Reconstruction:" .. lang:getFullName() .. "/" .. target | ||
end | end | ||
-- Reconstructed languages and substrates require an initial *. | -- Reconstructed languages and substrates require an initial *. | ||
| Line 380: | Line 392: | ||
.. " is unattested, while the given term does not begin with '*' to indicate that it is reconstructed.") | .. " is unattested, while the given term does not begin with '*' to indicate that it is reconstructed.") | ||
elseif lang:hasType("appendix-constructed") then | elseif lang:hasType("appendix-constructed") then | ||
target = " | target = "Appendix:" .. lang:getFullName() .. "/" .. target | ||
else | else | ||
target = target | target = target | ||
end | end | ||
target = (lang:hasType("conlang") and "Contionary:" or "wikt:") .. target | |||
return target, orig_target, escaped > 0 | return target, orig_target, escaped > 0 | ||
| Line 417: | Line 427: | ||
-- If the target is "" then it's a link like [[#English]], which refers to the current page. | -- If the target is "" then it's a link like [[#English]], which refers to the current page. | ||
if auto_display == "" then | if auto_display == "" then | ||
auto_display = | auto_display = (m_headword_data or get_headword_data()).pagename | ||
end | end | ||
| Line 435: | Line 445: | ||
-- If `no_alt_ast` is true, use pcall to catch the error which will be thrown if this is a reconstructed lang and the alt text doesn't have *. | -- If `no_alt_ast` is true, use pcall to catch the error which will be thrown if this is a reconstructed lang and the alt text doesn't have *. | ||
if link.display == auto_display then | if link.display == auto_display then | ||
else | else | ||
local ok, check | local ok, check | ||
| Line 443: | Line 452: | ||
ok = true | ok = true | ||
check = export.get_link_page(orig_display, lang, sc, plain) | check = export.get_link_page(orig_display, lang, sc, plain) | ||
end | end | ||
end | end | ||
| Line 654: | Line 660: | ||
end | end | ||
term, alt = new_term, new_alt | term, alt = new_term, new_alt | ||
end | end | ||
end | end | ||
| Line 686: | Line 687: | ||
term = selective_trim(term) | term = selective_trim(term) | ||
end | end | ||
-- If not, make a link using the parameters. | -- If not, make a link using the parameters. | ||
return make_link({ | return make_link({ | ||
| Line 806: | Line 807: | ||
elseif item_type == "pos" then | elseif item_type == "pos" then | ||
tag = { '<span class="ann-pos">', '</span>' } | tag = { '<span class="ann-pos">', '</span>' } | ||
elseif item_type == "non-gloss" then | |||
tag = { '<span class="ann-non-gloss">', '</span>' } | |||
elseif item_type == "annotations" then | elseif item_type == "annotations" then | ||
tag = { '<span class="mention-gloss-paren annotation-paren">(</span>', | tag = { '<span class="mention-gloss-paren annotation-paren">(</span>', | ||
| Line 817: | Line 820: | ||
end | end | ||
end | end | ||
local pos_tags | |||
--[==[Formats the annotations that are displayed with a link created by {{code|lua|full_link}}. Annotations are the extra bits of information that are displayed following the linked term, and include things such as gender, transliteration, gloss and so on. | --[==[Formats the annotations that are displayed with a link created by {{code|lua|full_link}}. Annotations are the extra bits of information that are displayed following the linked term, and include things such as gender, transliteration, gloss and so on. | ||
| Line 827: | Line 832: | ||
*:: Gloss that translates the term in the link, or gives some other descriptive information. | *:: Gloss that translates the term in the link, or gives some other descriptive information. | ||
*:; <code class="n">pos</code> | *:; <code class="n">pos</code> | ||
*:: Part of speech of the linked term. If the given argument matches one of the | *:: Part of speech of the linked term. If the given argument matches one of the aliases in `pos_aliases` in [[Module:headword/data]], or consists of a part of speech or alias followed by `f` (for a non-lemma form), expand it appropriately. Otherwise, just show the given text as it is. | ||
*:; <code class="n">ng</code> | |||
*:: Arbitrary non-gloss descriptive text for the link. This should be used in preference to putting descriptive text in `gloss` or `pos`. | |||
*:; <code class="n">lit</code> | *:; <code class="n">lit</code> | ||
*:: Literal meaning of the term, if the usual meaning is figurative or idiomatic. | *:: Literal meaning of the term, if the usual meaning is figurative or idiomatic. | ||
| Line 888: | Line 895: | ||
end | end | ||
pos_tags = pos_tags or | -- Canonicalize part of speech aliases as well as non-lemma aliases like 'nf' or 'nounf' for "noun form". | ||
insert(annotations, export.mark( | pos_tags = pos_tags or (m_headword_data or get_headword_data()).pos_aliases | ||
local pos = pos_tags[data.pos] | |||
if not pos and data.pos:find("f$") then | |||
local pos_form = data.pos:sub(1, -2) | |||
-- We only expand something ending in 'f' if the result is a recognized non-lemma POS. | |||
pos_form = (pos_tags[pos_form] or pos_form) .. " form" | |||
if (m_headword_data or get_headword_data()).nonlemmas[pos_form .. "s"] then | |||
pos = pos_form | |||
end | |||
end | |||
insert(annotations, export.mark(pos or data.pos, "pos")) | |||
end | |||
-- Non-gloss text | |||
if data.ng then | |||
insert(annotations, export.mark(data.ng, "non-gloss")) | |||
end | end | ||
| Line 895: | Line 917: | ||
if data.lit then | if data.lit then | ||
insert(annotations, "literally " .. export.mark(data.lit, "gloss")) | insert(annotations, "literally " .. export.mark(data.lit, "gloss")) | ||
end | |||
-- Provide a hook to insert additional annotations such as nested inflections. | |||
if data.postprocess_annotations then | |||
data.postprocess_annotations { | |||
data = data, | |||
annotations = annotations | |||
} | |||
end | end | ||
| Line 1,017: | Line 1,047: | ||
track_sc = boolean, | track_sc = boolean, | ||
no_nonstandard_sc_cat = boolean, | no_nonstandard_sc_cat = boolean, | ||
fragment = link_fragment | fragment = link_fragment, | ||
id = sense_id, | id = sense_id, | ||
genders = { "gender1", "gender2", ... }, | genders = { "gender1", "gender2", ... }, | ||
| Line 1,024: | Line 1,054: | ||
gloss = gloss, | gloss = gloss, | ||
pos = part_of_speech_tag, | pos = part_of_speech_tag, | ||
ng = non-gloss text, | |||
lit = literal_translation, | lit = literal_translation, | ||
no_alt_ast = boolean, | no_alt_ast = boolean, | ||
accel = {accelerated_creation_tags}, | accel = {accelerated_creation_tags}, | ||
interwiki = interwiki, | interwiki = interwiki, | ||
pretext = "text_at_beginning" or nil, | |||
posttext = "text_at_end" or nil, | |||
q = { "left_qualifier1", "left_qualifier2", ...} or "left_qualifier", | q = { "left_qualifier1", "left_qualifier2", ...} or "left_qualifier", | ||
qq = { "right_qualifier1", "right_qualifier2", ...} or "right_qualifier", | qq = { "right_qualifier1", "right_qualifier2", ...} or "right_qualifier", | ||
l = { "left_label1", "left_label2", ...}, | |||
ll = { "right_label1", "right_label2", ...}, | |||
a = { "left_accent_qualifier1", "left_accent_qualifier2", ...}, | |||
aa = { "right_accent_qualifier1", "right_accent_qualifier2", ...}, | |||
refs = { "formatted_ref1", "formatted_ref2", ...} or { {text = "text", name = "name", group = "group"}, ... }, | refs = { "formatted_ref1", "formatted_ref2", ...} or { {text = "text", name = "name", group = "group"}, ... }, | ||
show_qualifiers = boolean, | |||
} } | } } | ||
Any one of the items in the <code class="n">data</code> table may be {{code|lua|nil}}, but an error will be shown if neither <code class="n">term</code> nor <code class="n">alt</code> nor <code class="n">tr</code> is present. | Any one of the items in the <code class="n">data</code> table may be {{code|lua|nil}}, but an error will be shown if neither <code class="n">term</code> nor <code class="n">alt</code> nor <code class="n">tr</code> is present. | ||
| Line 1,039: | Line 1,077: | ||
* Call <code class="n">[[Module:script utilities#tag_text]]</code> to add the appropriate language and script tags to the term, and to italicize terms written in the Latin script if necessary. Accelerated creation tags, as used by [[WT:ACCEL]], are included. | * Call <code class="n">[[Module:script utilities#tag_text]]</code> to add the appropriate language and script tags to the term, and to italicize terms written in the Latin script if necessary. Accelerated creation tags, as used by [[WT:ACCEL]], are included. | ||
* Generate a transliteration, based on the alt or term arguments, if the script is not Latin and no transliteration was provided. | * Generate a transliteration, based on the alt or term arguments, if the script is not Latin and no transliteration was provided. | ||
* Add the annotations (transliteration, gender, gloss etc.) after the link. | * Add the annotations (transliteration, gender, gloss, etc.) after the link. | ||
* If <code class="n">no_alt_ast</code> is specified, then the alt text does not need to contain an asterisk if the language is reconstructed. This should only be used by modules which really need to allow links to reconstructions that don't display asterisks (e.g. number boxes). | * If <code class="n">no_alt_ast</code> is specified, then the alt text does not need to contain an asterisk if the language is reconstructed. This should only be used by modules which really need to allow links to reconstructions that don't display asterisks (e.g. number boxes). | ||
* If <code class="n">show_qualifiers</code> is specified, left and right qualifiers and references will be displayed. (This is | * If <code class="n">pretext</code> or <code class="n">posttext</code> is specified, this is text to (respectively) prepend or append to the output, directly before processing qualifiers, labels and references. This can be used to add arbitrary extra text inside of the qualifiers, labels and references. | ||
* If <code class="n">show_qualifiers</code> is specified or the `show_qualifiers` field is set, left and right qualifiers, accent qualifiers, labels and references will be displayed, otherwise they will be ignored. (This is because a fair amount of code stores qualifiers, labels and/or references in these fields and displays them itself, rather than expecting {{code|lua|full_link()}} to display them.)]==] | |||
function export.full_link(data, face, allow_self_link, show_qualifiers) | function export.full_link(data, face, allow_self_link, show_qualifiers) | ||
-- Prevent data from being destructively modified. | -- Prevent data from being destructively modified. | ||
| Line 1,104: | Line 1,143: | ||
if not data.sc[i] then | if not data.sc[i] then | ||
data.sc[i] = best | data.sc[i] = best | ||
end | end | ||
| Line 1,173: | Line 1,205: | ||
elseif (data.term[1] or data.alt[1]) and data.sc[1]:isTransliterated() then | elseif (data.term[1] or data.alt[1]) and data.sc[1]:isTransliterated() then | ||
-- Track whenever there is manual translit. The categories below like 'terms with redundant transliterations' | |||
-- aren't sufficient because they only work with reference to automatic translit and won't operate at all in | |||
-- languages without any automatic translit, like Persian and Hebrew. | |||
if data.tr[1] then | |||
local full_code = lang:getFullCode() | |||
end | |||
if not nevercalltr then | if not nevercalltr then | ||
| Line 1,186: | Line 1,224: | ||
if automated_tr or data.tr_fail then | if automated_tr or data.tr_fail then | ||
local manual_tr = data.tr[1] | local manual_tr = data.tr[1] | ||
if (not manual_tr) or lang:overrideManualTranslit(data.sc[1]) then | if (not manual_tr) or lang:overrideManualTranslit(data.sc[1]) then | ||
| Line 1,230: | Line 1,257: | ||
insert(output, export.format_link_annotations(data, face)) | insert(output, export.format_link_annotations(data, face)) | ||
local categories = | if data.pretext then | ||
insert(output, 1, data.pretext) | |||
end | |||
if data.posttext then | |||
insert(output, data.posttext) | |||
end | |||
local categories = cats[1] and format_categories(cats, lang, "-", nil, nil, data.sc) or "" | |||
output = concat(output) | output = concat(output) | ||
if show_qualifiers then | if show_qualifiers or data.show_qualifiers then | ||
output = add_qualifiers_and_refs_to_term(data, output) | output = add_qualifiers_and_refs_to_term(data, output) | ||
end | end | ||