Modul:ru-headword
Ezt a sablont számos orosz címszósablon használja: {{ru-noun}}
, {{ru-proper noun}}
, {{ru-proper noun+}}
, {{ru-adj}}
, {{ru-verb}}
, {{ru-verb-cform}}
, {{ru-adv}}
.
--[=[
This module implements the headword templates {{ru-noun}}, {{ru-adj}},
{{ru-adv}}, {{ru-noun+}}, etc. The main entry point is show(), which is
meant to be called from one of the above templates. However, {{ru-noun+}}
uses the entry point noun_plus(), and {{ru-noun-m}} (not currently used)
uses the entry point noun_multi(). When calling show(), the first parameter
of the #invoke call is the part of speech. Other parameters are taken from
the parent template call.
The implementations for different types of headwords (different parts of
speech) are set in pos_functions[POS] for a given POS (part of speech).
The value is a 2-argument function of (ARGS, DATA):
-- ARGS on entry is initialized to the parent template call's arguments,
with blank arguments converted to nil.
-- DATA on entry is initialized to a table, with entries like this:
local data = {lang = lang, pos_category = poscat, categories = {}, heads = {}, translits = {}, genders = {}, inflections = {}}
where:
-- LANG is an object describing the language.
-- POS_CATEGORY is the (plural) part of speech, e.g. "nouns" or "verbs".
-- CATEGORIES on entry is a list of categories. As currently written, show()
passes it in empty: the code that would add
[[Category:Requests for accents in Russian entries]] and
[[Category:Russian terms with irregular pronunciations]] is commented out,
and the category corresponding to the part of speech
(e.g. [[Category:Russian adverbs]]) is not added by this module (presumably
[[Module:headword]] derives it from POS_CATEGORY). On exit
it may contain additional categories to place the page in.
-- HEADS on entry is a list of the headwords, taken directly from arguments
'head', 'head2', 'head3', ...
-- TRANSLITS on entry is a list of translits, matching one-to-one with
heads in HEADS. These come either from 'tr', 'tr2', etc. or from
auto-transliterating the corresponding head (i.e. the translits will
always be non-empty whether or not the user explicitly specified the
translit).
-- GENDERS on entry is an empty list. On exit it should be the appropriate
gender settings, and will be passed directly to full_headword() in
[[Module:headword]]. See the documentation for that module for info on
the format of this setting.
-- INFLECTIONS on entry is an empty list. On exit it should be the
appropriate inflections to be displayed in the headword, and will be
passed directly to full_headword() in [[Module:headword]]. See the
documentation for that module for info on the format of this setting.
]=]--
local m_common = require("Module:ru-common")
local m_links = require("Module:links")
local m_headword = require("Module:headword")
local m_utilities = require("Module:utilities")
local ut = require("Module:utils")
local m_table_tools = require("Module:table tools")
local m_debug = require("Module:debug")
local m_ru_translit = require("Module:ru-translit")
local export = {}
local pos_functions = {}
local lang = require("Module:languages").getByCode("ru")
-- Marker found in the notes of a form to flag it as irregular; it is stripped
-- from the notes before they are displayed.
local IRREGMARKER = "△"
-- Marker flagging a hypothetical form; add_forms() in do_noun() strips it and
-- sets hypothetical=true on the corresponding inflection entry.
local HYPMARKER = "⟐"
-- Character class used by show() to detect Latin-script text in a (lowercased)
-- headword.
local latin_text_class = "[a-zščžěáéíóúýàèìòùỳâêîôûŷạẹịọụỵȧėȯẏ]"
-- Forward references
local do_noun
-- Short aliases for the mw.ustring / mw.text functions used throughout.
local u = mw.ustring.char
local rfind = mw.ustring.find
local rsubn = mw.ustring.gsub
local rmatch = mw.ustring.match
local rsplit = mw.text.split
local ulower = mw.ustring.lower
local AC = u(0x0301) -- combining acute accent (U+0301)
-- "If not empty": maps the empty string to false and returns every other
-- value (including nil) unchanged.
local function ine(x)
	if x == "" then
		return false
	end
	return x
end
-- Wrapper around rsubn() that yields only the substituted string; the
-- substitution count is dropped.
local function rsub(term, foo, bar)
	-- the extra parentheses truncate the call to its first return value
	return (rsubn(term, foo, bar))
end
-- Wrapper around rsubn() whose second return value is a boolean telling
-- whether at least one substitution took place.
local function rsubb(term, foo, bar)
	local result, count = rsubn(term, foo, bar)
	local changed = count > 0
	return result, changed
end
-- Record a tracking page named "ru-headword/" followed by PAGE through
-- m_debug.track(). Always returns true.
local function track(page)
	local key = "ru-headword/" .. page
	m_debug.track(key)
	return true
end
-- Copy the arguments of FRAME's parent into a fresh table, leaving out any
-- argument whose value is the empty string (so it reads back as nil).
local function clone_args(frame)
	local cloned = {}
	local parent_args = frame:getParent().args
	for name, value in pairs(parent_args) do
		if value ~= "" then
			cloned[name] = value
		end
	end
	return cloned
end
-- Collect a chain of parameters from ARGS: first ARGS[FIRST], then
-- ARGS[PREF .. 2], ARGS[PREF .. 3], ... stopping at the first missing value.
-- Values are appended to LIST (a new table is created when LIST is omitted),
-- and LIST is returned.
local function process_arg_chain(args, first, pref, list)
	list = list or {}
	local index = 2
	local current = args[first]
	while current do
		table.insert(list, current)
		current = args[pref .. index]
		index = index + 1
	end
	return list
end
-- Wrap TEXT in the span markup of a parenthesized qualifier: an opening
-- bracket span, the content span, and a closing bracket span.
local function make_qualifier_text(text)
	local open_paren = '<span class="ib-brac"><span class="qualifier-brac">(</span></span>'
	local close_paren = '<span class="ib-brac"><span class="qualifier-brac">)</span></span>'
	local content = '<span class="ib-content"><span class="qualifier-content">' .. text ..
		'</span></span>'
	return open_paren .. content .. close_paren
end
-- The main entry point, meant to be called via #invoke from a headword
-- template. FRAME.args[1] (the #invoke argument) is the part of speech; all
-- other parameters are read from the parent template call, with blank values
-- converted to nil.
-- Collects the heads (1=, head2=, head3=, ...) and one transliteration per
-- head (tr=, tr2=, ... or automatic), records tracking pages/categories for
-- suspicious input, runs pos_functions[POS] if one is defined, and returns
-- the formatted headword followed by data.extra_text (if set) and the
-- formatted tracking categories.
-- Raises an error if the part of speech is missing or blank.
function export.show(frame)
local args = clone_args(frame)
local PAGENAME = mw.title.getCurrentTitle().text
local NAMESPACE = mw.title.getCurrentTitle().nsText
local poscat = ine(frame.args[1]) or error("Part of speech has not been specified. Please pass parameter 1 to the module invocation.")
local data = {lang = lang, pos_category = poscat, categories = {}, heads = {},
translits = {}, genders = {}, inflections = {}, noposcat = args.noposcat}
-- Tracking categories are kept apart from data.categories and are formatted
-- separately in the return statement.
local tracking_categories = {}
-- Get the head parameters
-- First get the 1st parameter. The remainder is named head2=, head3= etc.
local head = args[1] or PAGENAME
local i = 2
while head do
-- catch errors in arguments where headword doesn't match page title,
-- but only in the main namespace; for the moment, do only with tracking;
-- FIXME, duplicates tracking down below a bit, clean that stuff up
local head_no_links = m_links.remove_links(head)
local head_noaccent = m_common.remove_accents(head_no_links)
if NAMESPACE == "" and head_noaccent ~= PAGENAME then
track("bad-headword")
--error("Headword " .. head .. " doesn't match pagename " ..
-- PAGENAME)
end
if rfind(head_no_links, " ") then
--ut.insert_if_not(data.categories, "orosz multiword terms")
track("space-in-headword/" .. poscat)
elseif rfind(head_no_links, ".%-.") then
-- The following is for bot scripts
-- We only look for hyphens between characters so we don't
-- get tripped up by prefixes and suffixes
track("hyphen-no-space-in-headword/" .. poscat)
end
-- NOTE(review): this check currently has no effect because the category
-- insertion inside it is commented out.
if m_common.needs_accents(head_no_links) then
if not args.noacccat then
--table.insert(data.categories, "Requests for accents in Russian entries")
end
end
if rfind(ulower(head_no_links), latin_text_class) then
track("latin-text-in-headword")
end
if rfind(head_no_links, "ьо") then
track("ьо")
end
table.insert(data.heads, head)
head = args["head" .. i]
i = i + 1
end
-- Get transliteration(s)
-- This `i` shadows the one above and counts heads from 1 so that the first
-- head reads tr= and the N-th head reads trN=.
local i = 0
for _, head in ipairs(data.heads) do
head = m_links.remove_links(head)
-- "\204\129" is the UTF-8 encoding of U+0301 (combining acute accent)
local head_noaccents = rsub(head, "\204\129", "")
local tr_gen = mw.ustring.toNFC(lang:transliterate(head, nil))
local tr_gen_noaccents = mw.ustring.toNFC(lang:transliterate(head_noaccents, nil))
i = i + 1
local tr
if i == 1 then
tr = args.tr
else
tr = args["tr" .. i]
end
if tr then
-- Manual transliteration given: classify it for tracking purposes.
if not args.notrcat then
--table.insert(data.categories, "orosz terms with irregular pronunciations")
end
-- NOTE(review): tr_fixed is only referenced by the commented-out
-- "with manual adjustment" branch below, so it is currently unused.
local tr_fixed = tr
tr_fixed = rsub(tr_fixed, "ɛ", "e")
tr_fixed = rsub(tr_fixed, "([eoéó])v([oó])$", "%1g%2")
tr_fixed = rsub(tr_fixed, "([eoéó])v([oó][- ])", "%1g%2")
tr_fixed = mw.ustring.toNFC(tr_fixed)
if tr == tr_gen or tr == tr_gen_noaccents then
table.insert(tracking_categories, "ru headword with tr/redundant")
--elseif tr_fixed == tr_gen then
-- table.insert(tracking_categories, "ru headword with tr/with manual adjustment")
elseif rfind(tr, ",") then
table.insert(tracking_categories, "ru headword with tr/comma")
elseif head_noaccents == PAGENAME then
if not args.notrcat then
table.insert(tracking_categories, "ru headword with tr/headword is pagename")
end
else
table.insert(tracking_categories, "ru headword with tr/headword not pagename")
end
else
-- No manual transliteration: fall back to the automatic one.
-- NOTE(review): the result of apply_tr_fixes() is compared but nothing is
-- done with the outcome, because the category insertion is commented out.
local orighead, transformed_head = m_ru_translit.apply_tr_fixes(head)
if orighead ~= transformed_head and not args.notrcat then
--table.insert(data.categories, "orosz terms with irregular pronunciations")
end
tr = tr_gen
end
table.insert(data.translits, tr)
end
-- Let the part-of-speech handler (if any) fill in genders, inflections and
-- categories.
if pos_functions[poscat] then
pos_functions[poscat](args, data)
end
return m_headword.full_headword(data) .. (data.extra_text or "") ..
m_utilities.format_categories(tracking_categories, lang, nil)
end
-- Shared implementation of {{ru-noun+}} (MULTI false) and {{ru-noun-m}}
-- (MULTI true).
-- FRAME.args[1] is the part of speech; FRAME.args.old and FRAME.args.ndef are
-- optional #invoke arguments; all other parameters come from the parent
-- template call. The declined forms are obtained from [[Module:ru-noun]]
-- (do_generate_forms_multi() or do_generate_forms()), turned into heads,
-- genitives, plurals and genitive plurals, and handed to do_noun().
-- Returns the formatted headword, followed by data.extra_text (if set) and
-- the notes= qualifiers (shown only when some form carried a footnote symbol).
-- Raises an error if the part of speech is missing, or if g2=/g3=/g4= is
-- given without g=.
local function noun_plus_or_multi(frame, multi)
	local args = clone_args(frame)
	local poscat = ine(frame.args[1]) or error("Part of speech has not been specified. Please pass parameter 1 to the module invocation.")
	local old = ine(frame.args.old)
	-- default value of n=, used in ru-proper noun+ where ndef=sg is set
	local ndef = ine(frame.args.ndef)
	args.ndef = args.ndef or ndef
	local m_noun = require("Module:ru-noun")
	-- From here on ARGS is the table returned by the noun module, not the
	-- template arguments themselves.
	if multi then
		args = m_noun.do_generate_forms_multi(args, old)
	else
		args = m_noun.do_generate_forms(args, old)
	end
	local data = {lang = lang, pos_category = poscat, categories = {}, heads = {},
		translits = {}, genders = {}, inflections = {}}
	-- do explicit genders using g=, g2=, etc.
	data.genders = process_arg_chain(args, "g", "g", data.genders)
	-- if none, do inferred or explicit genders taken from declension;
	-- clone because will get destructively modified by do_noun()
	if #data.genders == 0 then
		if args["g2"] or args["g3"] or args["g4"] then
			error("Cannot specify g2=, g3= or g4= without g=")
		end
		data.genders = mw.clone(args.genders)
	end
	-- Set by prepare_entry() when any form carries a non-empty footnote symbol.
	local saw_note = false

	-- Given a list of {RU, TR} pairs, where TR may be nil, separate off the
	-- footnote symbols from RU and TR, link the remainder if it's not already
	-- linked, and remove monosyllabic accents (but not from multiword
	-- expressions). An empty or missing LIST yields {{"-"}}.
	local function prepare_entry(list, ishead)
		if not list or #list == 0 then
			return {{"-"}}
		end
		local newlist = {}
		for _, x in ipairs(list) do
			local ru, tr = x[1], x[2]
			-- separate_notes() just returns the note, but get_notes() adds
			-- <sup>...</sup>. We want the former for checking whether the
			-- note is nonempty after removing IRREGMARKER (if we use the
			-- latter we'll get <sup></sup> in the case of just IRREGMARKER),
			-- but the latter when generating the inflectional form.
			if not ishead and (rfind(ru, "[%[|%]]") or tr and rfind(tr, "[%[|%]]")) then
				track("form-with-link")
			end
			local ruentry, runotes = m_table_tools.separate_notes(ru)
			local sawhyp
			runotes = rsub(runotes, IRREGMARKER, "") -- remove note of irregularity
			runotes, sawhyp = rsubb(runotes, HYPMARKER, "")
			if runotes ~= "" then
				saw_note = true
			end
			runotes = m_table_tools.superscript_notes(runotes)
			local trentry, trnotes
			if tr then
				trentry, trnotes = m_table_tools.separate_notes(tr)
				trnotes = rsub(trnotes, IRREGMARKER, "") -- remove note of irregularity
				trnotes = m_table_tools.superscript_notes(trnotes)
			end
			if m_common.is_monosyllabic(ruentry) then
				ruentry = m_common.remove_accents(ruentry)
				if trentry then
					trentry = m_common.remove_accents(trentry)
				end
			end
			if sawhyp then
				-- Hypothetical forms stay unlinked and keep HYPMARKER at the
				-- end so that add_forms() in do_noun() can recognize them.
				table.insert(newlist, {ruentry .. runotes .. HYPMARKER,
					trentry and trentry .. trnotes .. HYPMARKER})
			elseif ishead then
				table.insert(newlist, {ruentry .. runotes, trentry and trentry .. trnotes})
			else
				local ruspan, trspan
				if ruentry == "-" then
					ruspan = "-"
				elseif rfind(ruentry, "[%[|%]]") then
					-- don't add links around a form that's already linked
					ruspan = ruentry .. runotes
				elseif old then
					-- With old= set, link to the result of remove_jo() while
					-- displaying the form unchanged.
					ruspan = "[[" .. m_common.remove_jo(ruentry) .. "|" .. ruentry .. "]]" .. runotes
				else
					ruspan = "[[" .. ruentry .. "]]" .. runotes
				end
				if trentry then
					trspan = trentry .. trnotes
				end
				table.insert(newlist, {ruspan, trspan})
			end
		end
		return newlist
	end

	-- Reduce a list of {RU, TR} pairs to a list of just the RU members.
	local function remove_tr(list)
		local newlist = {}
		for _, x in ipairs(list) do
			table.insert(newlist, x[1])
		end
		return newlist
	end

	-- Eliminate transliteration from a list of {RU, TR} pairs and remove
	-- duplicates (which may occur when there are two translits for a form).
	local function remove_tr_and_dups(list)
		local deduped = {}
		for _, form in ipairs(remove_tr(list)) do
			ut.insert_if_not(deduped, form)
		end
		return deduped
	end

	local argsn = args.n or args.ndef
	local genitives, plurals, genpls
	if argsn == "p" then
		-- plural-only: the nominative plural is the head
		data.heads = prepare_entry(args.nom_pl_linked, "ishead")
		genitives = prepare_entry(args.gen_pl)
		plurals = {{"-"}}
		genpls = {{"-"}}
	else
		data.heads = prepare_entry(args.nom_sg_linked, "ishead")
		genitives = prepare_entry(args.gen_sg)
		plurals = argsn == "s" and {{"-"}} or prepare_entry(args.nom_pl)
		genpls = argsn == "s" and {{"-"}} or prepare_entry(args.gen_pl)
	end
	local feminines = process_arg_chain(args, "f", "f") -- do feminines
	local masculines = process_arg_chain(args, "m", "m") -- do masculines
	local irregtr = false
	for _, head in ipairs(data.heads) do
		local ru, tr = head[1], head[2]
		if rfind(ru, " ") then
			--ut.insert_if_not(data.categories, "orosz multiword terms")
			track("space-in-headword/" .. poscat)
		elseif rfind(ru, ".%-.") then
			-- The following are for bot scripts
			-- We only look for hyphens between characters so we don't
			-- get tripped up by prefixes and suffixes
			track("hyphen-no-space-in-headword/" .. poscat)
		end
		if not tr then
			tr = lang:transliterate(m_links.remove_links(ru))
		else
			irregtr = true
		end
		table.insert(data.translits, tr)
	end
	if irregtr and not args.notrcat then
		--table.insert(data.categories, "orosz terms with irregular pronunciations")
	end
	-- Combine adjacent heads by their transliteration (which should always
	-- be different, as identical heads including translit have previously
	-- been removed)
	data.heads = remove_tr(data.heads)
	local i = 1
	while i < #data.heads do
		if data.heads[i] == data.heads[i+1] then
			data.translits[i] = data.translits[i] .. ", " .. data.translits[i+1]
			table.remove(data.heads, i+1)
			table.remove(data.translits, i+1)
		else
			i = i + 1
		end
	end
	genitives = remove_tr_and_dups(genitives)
	plurals = remove_tr_and_dups(plurals)
	genpls = remove_tr_and_dups(genpls)
	do_noun(data, args, argsn == "s",
		genitives, plurals, genpls, feminines, masculines, poscat == "tulajdonnevek")
	local notes = process_arg_chain(args, "notes", "notes")
	local notes_segments = {}
	-- Only show the notes when at least one form referenced a footnote symbol.
	if saw_note then
		for _, note in ipairs(notes) do
			table.insert(notes_segments, " " .. make_qualifier_text(note))
		end
	end
	local notes_text = table.concat(notes_segments, "")
	return m_headword.full_headword(data) .. (data.extra_text or "") .. notes_text
end
-- External entry point; implementation of {{ru-noun+}}.
-- Delegates to noun_plus_or_multi() with MULTI set to false and returns its
-- result.
function export.noun_plus(frame)
return noun_plus_or_multi(frame, false)
end
-- External entry point; implementation of {{ru-noun-m}}.
-- Delegates to noun_plus_or_multi() with MULTI set to true and returns its
-- result.
function export.noun_multi(frame)
return noun_plus_or_multi(frame, true)
end
-- Handler for "tulajdonnevek" (Hungarian for "proper nouns"): reuses the
-- "főnevek" (nouns) handler with its PROPER argument set to true. The noun
-- handler is looked up when this function runs, so it may be defined later
-- in the file.
pos_functions["tulajdonnevek"] = function(args, data)
pos_functions["főnevek"](args, data, true)
end
-- Handler for "névmások" (Hungarian for "pronouns"): reuses the "főnevek"
-- (nouns) handler, leaving its PROPER argument unset.
pos_functions["névmások"] = function(args, data)
pos_functions["főnevek"](args, data)
end
-- Handler for "főnevek" (nouns): gathers the manually specified gender,
-- genitive, plural, genitive plural, feminine and masculine chains and passes
-- them to do_noun(). PROPER is forwarded both as the no-plural flag and as
-- the proper-noun flag.
-- In the main namespace the template is rejected with an error unless the
-- noun is marked indeclinable (3= is "-") or one of altyo=, manual= or the
-- unknown_* parameters is present.
pos_functions["főnevek"] = function(args, data, proper)
	-- genders are appended in place to data.genders
	process_arg_chain(args, 2, "g", data.genders)
	local genitives = process_arg_chain(args, 3, "gen")
	local plurals = process_arg_chain(args, 4, "pl")
	local genpls = process_arg_chain(args, 5, "genpl")
	local feminines = process_arg_chain(args, "f", "f")
	local masculines = process_arg_chain(args, "m", "m")
	local exempt = args.altyo or args.manual or args[3] == "-" or
		mw.title.getCurrentTitle().nsText ~= "" or
		args.unknown_decl or args.unknown_stress or
		args.unknown_pattern or args.unknown_gender or
		args.unknown_animacy
	if not exempt then
		error("[[Template:ru-noun]] can now only be used with indeclinable and manually-declined nouns; use [[Template:ru-noun+]] instead")
	end
	do_noun(data, args, proper,
		genitives, plurals, genpls, feminines, masculines, proper)
end
-- Fill in the gender, category and inflection parts of a noun headword.
-- DATA is the headword data table; its genders, categories, inflections and
-- (possibly) extra_text fields are modified in place.
-- ARGS is consulted for the unknown_decl / unknown_stress / unknown_pattern /
-- unknown_gender / unknown_animacy flags.
-- NO_PLURAL, when true, keeps a bare "f" gender from being rewritten to "f-?".
-- GENITIVES, PLURALS, GENPLS, FEMININES and MASCULINES are lists of forms; a
-- first element of "-" in GENITIVES means indeclinable, in PLURALS means no
-- plural, and in GENPLS means the genitive plural is missing.
-- PROPER, when true, suppresses the "uncountable" label and category.
-- Raises an error if no gender is given outside the "Sablon" namespace, or if
-- a gender is not recognized.
do_noun = function(data, args, no_plural,
genitives, plurals, genpls, feminines, masculines, proper)
if #data.genders == 0 then
-- "Sablon" is the Hungarian name of the Template namespace; the error text
-- is Hungarian for "the gender must be specified".
if mw.title.getCurrentTitle().nsText ~= "Sablon" then
error("A nemet meg kell adni")
else
table.insert(data.genders, "?")
end
end
-- Process the genders
local singular_genders = {
["m"] = true,
["m-?"] = true,
["m-an"] = true,
["m-in"] = true,
["f"] = true,
["f-?"] = true,
["f-an"] = true,
["f-in"] = true,
["n"] = true,
["n-an"] = true,
["n-in"] = true}
local plural_genders = {
["p"] = true, -- This is needed because some invariant plural only words have no gender to speak of
["?-p"] = true,
["an-p"] = true,
["in-p"] = true,
["m-p"] = true,
["m-?-p"] = true,
["m-an-p"] = true,
["m-in-p"] = true,
["f-p"] = true,
["f-?-p"] = true,
["f-an-p"] = true,
["f-in-p"] = true,
["n-p"] = true,
["n-?-p"] = true,
["n-an-p"] = true,
["n-in-p"] = true }
-- Distinct grammatical genders (m/f/n) seen, used for the multiple-genders
-- category below.
local real_genders = {}
for i, g in ipairs(data.genders) do
-- Normalize genders given without animacy by inserting "?" for the
-- unknown animacy.
if g == "m" then
g = "m-?"
elseif g == "m-p" then
g = "m-?-p"
elseif g == "f" and plurals[1] ~= "-" and not no_plural then
g = "f-?"
elseif g == "f-p" then
g = "f-?-p"
elseif g == "p" then
g = "?-p"
end
if not singular_genders[g] and not plural_genders[g] and g ~= "?" and g ~= "?-in" and g ~= "?-an" then
error("Unrecognized gender: " .. g)
end
data.genders[i] = g
local first_letter = g:sub(1,1)
-- Categorize by gender
if first_letter == "m" then
ut.insert_if_not(real_genders, "m")
table.insert(data.categories, "orosz hímnemű főnevek")
elseif first_letter == "f" then
ut.insert_if_not(real_genders, "f")
table.insert(data.categories, "orosz nőnemű főnevek")
elseif first_letter == "n" then
ut.insert_if_not(real_genders, "n")
table.insert(data.categories, "orosz semlegesnemű főnevek")
end
-- Categorize by animacy
if rfind(g, "an") then
table.insert(data.categories, "orosz élő főnevek")
elseif rfind(g, "in") then
table.insert(data.categories, "orosz élettelen főnevek")
end
-- Categorize by number
if plural_genders[g] then
table.insert(data.categories, "orosz pluralia tantum")
if g == "?-p" or g == "an-p" or g == "in-p" then
table.insert(data.categories, "orosz pluralia tantum with incomplete gender")
end
end
end
if #real_genders > 1 then
table.insert(data.categories, "orosz nouns with multiple genders")
end
-- Append FORMS to the INFLECTION table. A form containing HYPMARKER has the
-- marker removed and is inserted as {term=..., hypothetical=true}; any form
-- that needs accents adds a request-for-accents category.
local function add_forms(inflection, forms)
for i, form in ipairs(forms) do
if rfind(form, HYPMARKER) then
form = rsub(form, HYPMARKER, "")
table.insert(inflection, {term=form, hypothetical=true})
else
table.insert(inflection, form)
end
if m_common.needs_accents(form) then
table.insert(data.categories, "Requests for accents in Russian noun entries")
end
end
end
-- Add the genitive forms
if genitives[1] == "-" then
table.insert(data.inflections, {label = "[[Appendix:Glossary#indeclinable|nem ragozható]]"})
--table.insert(data.categories, "orosz indeclinable nouns")
elseif #genitives > 0 then
local gen_parts = {label = "birtokos"}
add_forms(gen_parts, genitives)
table.insert(data.inflections, gen_parts)
end
-- Add the plural forms
-- If the noun is plural only, then ignore the 4th parameter altogether
if genitives[1] == "-" then
-- do nothing
elseif plural_genders[data.genders[1]] then
table.insert(data.inflections, {label = "[[Appendix:Glossary#plural only|csak többes szám]]"})
elseif plurals[1] == "-" then
if not proper then
table.insert(data.inflections, {label = "[[megszámlálhatatlan]]"})
table.insert(data.categories, "orosz megszámlálhatatlan főnevek")
end
elseif #plurals > 0 then
local pl_parts = {label = "alanyeset tsz."}
add_forms(pl_parts, plurals)
--This can't work currently because the forms in plurals are already
--linked with spans around them, superscripted notes, etc.
--for _, form in ipairs(plurals) do
-- if not rfind(form, HYPMARKER) and not mw.title.new(form).exists then
-- table.insert(categories, "orosz nouns with missing plurals")
-- end
--end
table.insert(data.inflections, pl_parts)
end
-- Add the genitive plural forms
if genitives[1] == "-" or plural_genders[data.genders[1]] or plurals[1] == "-" then
-- indeclinable, plural only or uncountable; do nothing
elseif genpls[1] == "-" then
table.insert(data.inflections, {label = "genitive plural missing"})
elseif #genpls > 0 then
local genpl_parts = {label = "birtokos tsz."}
add_forms(genpl_parts, genpls)
table.insert(data.inflections, genpl_parts)
end
-- Add the feminine forms
if #feminines > 0 then
local f_parts = {label = "nőnemű"}
add_forms(f_parts, feminines)
table.insert(data.inflections, f_parts)
end
-- Add the masculine forms
if #masculines > 0 then
local m_parts = {label = "hímnemű"}
add_forms(m_parts, masculines)
table.insert(data.inflections, m_parts)
end
-- Each unknown_* flag is tracked and contributes one entry to a qualifier
-- shown after the headword via data.extra_text.
local extra_notes = {}
if args.unknown_decl then
track("unknown-decl")
table.insert(extra_notes, "unknown declension")
end
if args.unknown_stress then
track("unknown-stress")
table.insert(extra_notes, "unknown stress")
end
if args.unknown_pattern then
track("unknown-pattern")
table.insert(extra_notes, "unknown accent pattern")
end
if args.unknown_gender then
track("unknown-gender")
table.insert(extra_notes, "unknown gender")
end
if args.unknown_animacy then
track("unknown-animacy")
table.insert(extra_notes, "unknown animacy")
end
if #extra_notes > 0 then
data.extra_text = " " .. make_qualifier_text(table.concat(extra_notes, ", "))
end
end
-- Derive the informal variant of a comparative: when COMP ends in е preceded
-- by an optionally accented е, the final е is replaced with й. Returns nil
-- for any other ending.
local function generate_informal_comp(comp)
	if not rfind(comp, "е́?е$") then
		return nil
	end
	return rsub(comp, "(е́?)е$", "%1й")
end
-- Build the display form of a comparative. A comparative ending in е, or in
-- an optionally accented е followed by й, becomes two adjacent links: "(по)"
-- pointing at the по-prefixed form, then the comparative itself. Anything
-- else is returned unchanged.
local function generate_po_variant(comp)
	local takes_po = rfind(comp, "е$") or rfind(comp, "е́?й$")
	if not takes_po then
		return comp
	end
	return "[[по" .. comp .. "|(по)]][[" .. comp .. "]]"
end
-- Endings that generate_comparative() strips from a head, each paired with
-- the ending expected on the (decomposed) transliteration.
local allowed_endings = {
{"ый", "yj"},
{"ий", "ij"},
{"о́й", "o" .. AC .. "j"},
-- last two for adverbs
{"о", "o"},
{"о́", "o" .. AC}
}
-- Cyrillic velar consonant -> the Latin letter expected at the same position
-- in the transliteration.
local velar_to_translit = {
["к"] = "k",
["г"] = "g",
["х"] = "x"
}
-- Velar consonant -> the consonant that replaces it in the comparative, for
-- both Cyrillic and transliterated stems.
local velar_to_palatal = {
["к"] = "ч",
["г"] = "ж",
["х"] = "ш",
["k"] = "č",
["g"] = "ž",
["x"] = "š"
}
-- Generate the comparative(s) given the positive(s). Note that this is written
-- to take in and generate comparative(s) for transliteration(s) as well as
-- Russian. This isn't currently used by {{ru-adjective}} but will be used by
-- a bot that generates entries for comparatives.
--
-- HEADS is a list of positive forms and TRS the matching list of
-- transliterations. COMPSPEC is "+" optionally followed by a short stress
-- pattern (a, b or c, plus any number of primes), e.g. "+" or "+c''".
-- Returns a list of {COMP, COMPTR} pairs with duplicates removed.
-- Raises an error when COMPSPEC is malformed, when a head lacks one of the
-- allowed endings, or when a transliteration does not agree with its head.
local function generate_comparative(heads, trs, compspec)
	local comps = {}
	if not rfind(compspec, "^%+") then
		error("Compspec '" .. compspec .. "' must begin with + in this function")
	end
	if compspec ~= "+" and not rfind(compspec, "^%+[abc]'*$") then
		error("Compsec '" .. compspec .. "' has illegal format, should be e.g. + or +c''")
	end
	compspec = rsub(compspec, "^%+", "")
	for i, head in ipairs(heads) do
		local tr = m_common.decompose(trs[i])
		head = m_links.remove_links(head)
		-- Strip the adjective/adverb ending from both head and translit.
		local removed_ending = false
		for _, endingpair in ipairs(allowed_endings) do
			if rfind(head, endingpair[1] .. "$") then
				if not rfind(tr, endingpair[2] .. "$") then
					error("Translit '" .. tr .. "' doesn't end with expected '"
						.. endingpair[2] .. "', corresponding to head '" .. head .. "'")
				end
				if endingpair[1] == "о́й" then
					if compspec == "a" then
						error("Short stress pattern a not allowed with ending-stressed adjectives")
					elseif compspec == "" then
						-- NOTE(review): this default also applies to every
						-- later head, since COMPSPEC is shared by the loop.
						compspec = "b"
					end
				end
				head = rsub(head, endingpair[1] .. "$", "")
				tr = rsub(tr, endingpair[2] .. "$", "")
				removed_ending = true
				break
			end
		end
		if not removed_ending then
			error("Head '" .. head .. "' doesn't end with expected ending")
		end
		local comp, comptr
		if rfind(head, "[кгх]$") then
			-- Velar stem: replace the final velar as given by
			-- velar_to_palatal and add a single е. These captures are
			-- declared local so they do not leak into the global environment.
			local stemhead, lastheadchar = rmatch(head, "^(.*)(.)$")
			local stemtr, lasttrchar = rmatch(tr, "^(.*)(.)$")
			if velar_to_translit[lastheadchar] ~= lasttrchar then
				error("Translit '" .. tr .. "' doesn't end with transliterated equivalent of last char '" ..
					lastheadchar .. "' of head '" .. head .. "'")
			end
			comp, comptr = m_common.make_ending_stressed(stemhead, stemtr)
			comp = comp .. velar_to_palatal[lastheadchar] .. "е" -- Cyrillic е
			comptr = comptr .. velar_to_palatal[lasttrchar] .. "e" -- Latin e
		elseif compspec == "" or compspec == "a" then
			comp = head .. "ее" -- Cyrillic ее
			comptr = tr .. "ee" -- Latin ee
		else -- end-stressed comparative, including pattern a'
			comp, comptr = m_common.make_unstressed_once(head, tr)
			comp = comp .. "е́е" -- Cyrillic е́е
			comptr = comptr .. "e" .. AC .. "e" -- Latin decomposed ée
		end
		ut.insert_if_not(comps, {comp, comptr})
	end
	return comps
end
-- Meant to be called from a bot.
-- FRAME.args[1] is a comma-separated list of items, each either HEAD or
-- HEAD//TR; a missing TR is filled in by automatic transliteration.
-- FRAME.args[2] is the optional comparative spec (defaults to "").
-- Returns the generated comparatives as a comma-separated list of COMP//TR
-- items, passed through m_common.recompose().
-- Raises an error if parameter 1 is missing or an item has more than one "//".
function export.generate_comparative(frame)
	local spec = ine(frame.args[1]) or error("Must specify comparative(s) in parameter 1")
	local compspec = ine(frame.args[2]) or ""
	local heads, trs = {}, {}
	for _, item in ipairs(rsplit(spec, ",")) do
		local parts = rsplit(item, "//")
		if #parts > 2 then
			error("HEAD or HEAD//TR expected: " .. item)
		end
		table.insert(heads, parts[1])
		table.insert(trs, #parts == 1 and lang:transliterate(parts[1], nil) or parts[2])
	end
	local pieces = {}
	for _, pair in ipairs(generate_comparative(heads, trs, compspec)) do
		table.insert(pieces, pair[1] .. "//" .. pair[2])
	end
	local joined = table.concat(pieces, ",")
	return m_common.recompose(joined)
end
-- Add comparative inflections to DATA.
-- COMPS is the list of comparative specs. A lone "-" means "no comparative".
-- Otherwise each spec is one of:
--   "peri"       -> periphrastic comparative ("[[бо́лее]] " plus each head);
--   "+..."       -> comparative(s) generated from the heads by
--                   generate_comparative();
--   anything else is taken as the comparative form itself.
-- A spec may be prefixed with "rare-", "dated-" or "awkward-" to file it under
-- the corresponding label instead of the normal one.
-- CATPOS is the part-of-speech word used in the request-for-accents category
-- name. NOINF, when set, suppresses the informal variants. ACCEL is stored in
-- the `accel` field of the normal comparative entry only.
local function handle_comparatives(data, comps, catpos, noinf, accel)
	if #comps == 1 and comps[1] == "-" then
		table.insert(data.inflections, {label = "no comparative"})
		track("nocomp")
	elseif #comps > 0 then
		local normal_comp_parts = {label = "középfok", accel = accel}
		-- Skip accelerators for these three
		local rare_comp_parts = {label = "rare comparative"}
		local dated_comp_parts = {label = "dated comparative"}
		local awkward_comp_parts = {label = "rare/awkward comparative"}

		-- Insert COMP (and, unless NOINF, its informal variant) into the
		-- inflection entry selected by COMPTYPE.
		local function insert_comp(comp, comptype)
			local comp_parts = comptype == "rare" and rare_comp_parts or
				comptype == "dated" and dated_comp_parts or
				comptype == "awkward" and awkward_comp_parts or
				normal_comp_parts
			ut.insert_if_not(comp_parts, generate_po_variant(comp))
			if not noinf then
				local informal = generate_informal_comp(comp)
				if informal then
					ut.insert_if_not(comp_parts, generate_po_variant(informal))
				end
			end
			if m_common.needs_accents(comp) then
				table.insert(data.categories, "Requests for accents in Russian " .. catpos .. " entries")
			end
		end

		for _, comp in ipairs(comps) do
			if comp == "peri" then
				for _, head in ipairs(data.heads) do
					ut.insert_if_not(normal_comp_parts, "[[бо́лее]] " .. head)
				end
				track("pericomp")
			else
				local comptype = "normal"
				if rfind(comp, "^rare%-") then
					comptype = "rare"
					comp = rsub(comp, "^rare%-", "")
				elseif rfind(comp, "^dated%-") then
					comptype = "dated"
					comp = rsub(comp, "^dated%-", "")
				elseif rfind(comp, "^awkward%-") then
					comptype = "awkward"
					comp = rsub(comp, "^awkward%-", "")
				end
				-- "+" is a magic pattern character, so it is escaped to match
				-- a literal leading plus sign.
				if rfind(comp, "^%+") then
					local autocomps = generate_comparative(data.heads, data.translits, comp)
					for _, autocomp in ipairs(autocomps) do
						insert_comp(autocomp[1], comptype)
					end
				else
					insert_comp(comp, comptype)
				end
			end
		end
		-- Only emit the entries that actually received forms.
		if #normal_comp_parts > 0 then
			table.insert(data.inflections, normal_comp_parts)
		end
		if #rare_comp_parts > 0 then
			table.insert(data.inflections, rare_comp_parts)
		end
		if #dated_comp_parts > 0 then
			table.insert(data.inflections, dated_comp_parts)
		end
		if #awkward_comp_parts > 0 then
			table.insert(data.inflections, awkward_comp_parts)
		end
	end
end
-- Handler for "melléknevek" (adjectives): adds the comparatives (2=, comp2=,
-- ...), the superlatives (3=, sup2=, ...) and, when indecl= is set, the
-- indeclinable label and category. A superlative of "peri" expands to
-- "[[са́мый]] " followed by each head.
pos_functions["melléknevek"] = function(args, data)
	local comparatives = process_arg_chain(args, 2, "comp")
	local superlatives = process_arg_chain(args, 3, "sup")
	handle_comparatives(data, comparatives, "adjective", args["noinf"], nil)
	if #superlatives > 0 then
		local sup_parts = {label = "felsőfok"}
		for _, sup in ipairs(superlatives) do
			if sup ~= "peri" then
				table.insert(sup_parts, sup)
				if m_common.needs_accents(sup) then
					table.insert(data.categories, "Requests for accents in Russian adjective entries")
				end
			else
				for _, head in ipairs(data.heads) do
					table.insert(sup_parts, "[[са́мый]] " .. head)
				end
			end
		end
		table.insert(data.inflections, sup_parts)
	end
	if not args.indecl then
		return
	end
	table.insert(data.inflections, {label = "nem ragozható"})
	table.insert(data.categories, "orosz nem ragozható melléknevek")
end
-- Handler for "határozószók" (adverbs): adds the comparatives (2=, comp2=,
-- ...), passing accelerator data whose lemma is the first head (or nil when
-- that head is the empty string).
pos_functions["határozószók"] = function(args, data)
	local lemma = data.heads[1]
	if lemma == "" then
		lemma = nil
	end
	local accel = {form = "középfok", lemma = lemma}
	local comparatives = process_arg_chain(args, 2, "comp")
	handle_comparatives(data, comparatives, "adverb", args["noinf"], accel)
end
-- Display additional inflection information for a verb and verbal combining form.
-- ARGS[2] is the aspect: "impf", "pf", "both" or "?" (a missing aspect
-- defaults to "?" in the "Sablon" namespace only). The aspect is stored in
-- DATA.genders and the matching categories are added to DATA.categories.
-- impf=, impf2=, ... and pf=, pf2=, ... list the aspectual counterparts, which
-- are added to DATA.inflections.
-- POS is "verbs" or "verbal combining forms"; the latter adds the general
-- verb category plus a combining-form category keyed on the first head with
-- a leading hyphen removed.
-- Raises an error on a missing or invalid aspect, or when counterparts of the
-- verb's own aspect are given.
local function do_verb(args, data, pos)
	local cform = pos == "verbal combining forms"
	if cform then
		table.insert(data.categories, "orosz igék")
	end
	-- Aspect
	local aspect = args[2] or mw.title.getCurrentTitle().nsText == "Sablon" and "?"
	if aspect == "impf" then
		table.insert(data.genders, "impf")
		table.insert(data.categories, "orosz folyamatos igék")
	elseif aspect == "pf" then
		table.insert(data.genders, "pf")
		table.insert(data.categories, "orosz befejezett igék")
	elseif aspect == "both" then
		table.insert(data.genders, "impf")
		table.insert(data.genders, "pf")
		table.insert(data.categories, "orosz folyamatos igék")
		table.insert(data.categories, "orosz befejezett igék")
		table.insert(data.categories, "orosz kétaspektusú igék")
	elseif aspect == "?" then
		table.insert(data.genders, "?")
		table.insert(data.categories, "Requests for aspect in Russian entries")
	elseif not aspect then
		error("Missing Russian verb aspect, should be 'pf', 'impf', 'both' or '?'")
	else
		error("Invalid Russian verb aspect '" .. aspect .. "', should be 'pf', 'impf', 'both' or '?'")
	end
	if cform then
		table.insert(data.categories, "orosz verbal combining forms|" .. rsub(data.heads[1], "^%-", ""))
	end
	-- Get the imperfective parameters: impf=, then impf2=, impf3= etc.
	local imperfectives = process_arg_chain(args, "impf", "impf")
	-- Get the perfective parameters: pf=, then pf2=, pf3= etc.
	local perfectives = process_arg_chain(args, "pf", "pf")
	-- Add the imperfective forms
	if #imperfectives > 0 then
		if aspect == "impf" then
			error("Can't specify imperfective counterparts for an imperfective verb")
		end
		local impf_parts = {label = "folyamatos"}
		for _, form in ipairs(imperfectives) do
			table.insert(impf_parts, form)
			if m_common.needs_accents(form) then
				table.insert(data.categories, "Requests for accents in Russian verb entries")
			end
		end
		table.insert(data.inflections, impf_parts)
	end
	-- Add the perfective forms
	if #perfectives > 0 then
		if aspect == "pf" then
			error("Can't specify perfective counterparts for a perfective verb")
		end
		local pf_parts = {label = "befejezett"}
		for _, form in ipairs(perfectives) do
			table.insert(pf_parts, form)
			if m_common.needs_accents(form) then
				table.insert(data.categories, "Requests for accents in Russian verb entries")
			end
		end
		table.insert(data.inflections, pf_parts)
	end
end
-- Handler for "igék" (Hungarian for "verbs"): runs do_verb() with POS set to
-- "verbs".
pos_functions["igék"] = function(args, data)
do_verb(args, data, "verbs")
end
-- Handler for verbal combining forms: runs do_verb() with POS set to
-- "verbal combining forms", which makes it add the extra combining-form
-- categories.
pos_functions["verbal combining forms"] = function(args, data)
do_verb(args, data, "verbal combining forms")
end
return export
-- For Vim, so we get 4-space tabs
-- vim: set ts=4 sw=4 noet: