This module handles generating the descriptions and categorization for Belarusian category pages of the format "Belarusian LABEL" where LABEL can be any text. Examples are Category:Bulgarian conjugation 2.1 verbs and Category:Russian velar-stem neuter-form nouns. This module is part of the poscatboiler system, which is a general framework for generating the descriptions and categorization of category pages.
For more information, see Module:category tree/poscatboiler/data/lang-specific/documentation.
NOTE: If you add a new language-specific module, you must add the language code to the list at the top of Module:category tree/poscatboiler/data/lang-specific in order for the module to be recognized.
local labels = {}
local handlers = {}
local rfind = mw.ustring.find
local rmatch = mw.ustring.match
local rsubn = mw.ustring.gsub
-- version of rsubn() that discards all but the first return value
local function rsub(term, foo, bar)
local retval = rsubn(term, foo, bar)
return retval
end
--------------------------------- Verbs --------------------------------
labels = {
description = "Belarusian verbs categorized by class.",
parents = {{name = "verbs by inflection type", sort = "class"}},
}
labels = {
description = "Belarusian verbs categorized by class and accent pattern.",
parents = {{name = "verbs by inflection type", sort = "class and accent pattern"}},
}
table.insert(handlers, function(data)
local cls, variant, pattern = rmatch(data.label, "^class (*)(°?)(?) verbs")
if cls then
if pattern == "" then
return {
description = "Belarusian class " .. cls .. " verbs.",
breadcrumb = cls,
parents = {{name = "verbs by class", sort = cls .. variant}},
}
else
return {
description = "Belarusian class " .. cls .. " verbs of " ..
"accent pattern " .. pattern .. (
variant == "" and "" or " and variant " .. variant) .. ". " .. (
pattern == "a" and "With this pattern, all forms are stem-stressed."
or pattern == "b" and "With this pattern, all forms are ending-stressed."
or "With this pattern, the first singular present indicative and all forms " ..
"outside of the present indicative are ending-stressed, while the remaining " ..
"forms of the present indicative are stem-stressed.").. (
variant == "" and "" or
cls == "3" and variant == "°" and " The variant code indicates that the -н of the stem " ..
"is missing in most non-present-tense forms." or
cls == "6" and variant == "°" and
" The variant code indicates that the present tense is not " ..
"]. (In most verbs of this class, " ..
"the present tense is iotated, e.g. піса́ць with present tense " ..
"пішу́, пі́шеш, пі́ше, etc.)"
),
breadcrumb = cls .. variant .. pattern,
parents = {
{name = "class " .. cls .. " verbs", sort = pattern},
{name = "verbs by class and accent pattern", sort = cls .. pattern},
},
}
end
end
end)
--------------------------------- Adjectives --------------------------------
labels = {
description = "Belarusian adjectives categorized by stem type and stress. " ..
"Unlike for nouns, adjectives are consistently either stem-stressed or ending-stressed.",
parents = {{name = "adjectives by inflection type", sort = "stem type and stress"}},
}
local adj_stem_expl = {
= "a soft consonant",
= "a hard consonant other than a velar",
= "a velar consonant",
= "-ов, -ев, -ын or -ін",
}
local adj_decl_endings = {
= {"-ы", "-ая", "-ае", "-ыя"},
= {"-ы́", "-а́я", "-о́е", "-ы́я"},
= {"-і", "-ая", "-ае", "-ія"},
= {"-і́", "-а́я", "-о́е", "-і́я"},
= {"-і", "-яя", "-яе", "-ія"},
-- FIXME, not sure the rest are correct
= {"-", "-а", "-а", "-і"},
= {"-", "-а", "(nil)", "-і"},
}
table.insert(handlers, function(data)
local breadcrumb, stem, stress = rmatch(data.label, "^((*) (*)-stressed) adjectives")
if not breadcrumb then
breadcrumb, stem = rmatch(data.label, "^((*)) adjectives")
stress = ""
end
if breadcrumb and adj_stem_expl and adj_decl_endings then
local m, f, n, p = unpack(adj_decl_endings)
local stresstext = stress == "stem" and
"The adjectives in this category have stress on the stem." or
stress == "ending" and
"The adjectives in this category have stress on the endings." or
"All adjectives of this type have stress on the stem."
local endingtext = "ending in the nominative in masculine singular " .. m ..
", feminine singular " .. f .. ", neuter singular " .. p .. " and plural " ..
p .. "."
local stemtext = " The stem ends in " .. adj_stem_expl .. "."
return {
description = "Belarusian " .. stem .. " adjectives, " .. endingtext .. stemtext .. " " .. stresstext,
breadcrumb = breadcrumb,
parents = {"adjectives by stem type and stress"},
}
end
end)
--------------------------------- Nouns/Pronouns/Numerals --------------------------------
for _, pos in ipairs({"nouns", "pronouns", "numerals"}) do
local sgpos = pos:gsub("s$", "")
labels = {
description = "Belarusian " .. pos .. " categorized by stem type and typical gender. " ..
"Note that \"typical gender\" means the gender that is typical for the " .. sgpos .. "'s ending (e.g. most " ..
pos .. " in ''-я'' with accusative in ''-ю'' are feminine, and hence all such " .. pos .. " are considered " ..
"to be \"typically feminine'\"; but some are in fact masculine). See ] for further " ..
"information on accent patterns.",
parents = {{name = pos .. " by inflection type", sort = "stem type and gender"}},
}
labels = {
description = "Belarusian " .. pos .. " categorized by stem type, typical gender and accent pattern. " ..
"Note that \"typical gender\" means the gender that is typical for the " .. sgpos .. "'s ending (e.g. most " ..
pos .. " in ''-я'' with accusative in ''-ю'' are feminine, and hence all such " .. pos .. " are considered " ..
"to be \"typically feminine'\"; but some are in fact masculine). See ] for further " ..
"information on accent patterns.",
parents = {{name = pos .. " by inflection type", sort = "stem type, gender and accent pattern"}},
}
labels = {
description = "Belarusian " .. pos .. " categorized according to their (unpredictable) vowel alternation pattern (e.g. ''а'' vs. ''о'').",
parents = {{name = pos, sort = "vowel alternation"}},
}
labels = {
description = "Belarusian " .. pos .. " categorized according to their accent pattern (see ]).",
parents = {{name = pos .. " by inflection type", sort = "accent pattern"}},
}
labels = {
description = "Belarusian " .. pos .. " with a reducible stem, where an extra vowel is inserted " ..
"before the last stem consonant in the nominative singular and/or genitive plural.",
parents = {{name = pos .. " by inflection type", sort = "reducible stem"}},
}
labels = {
description = "Belarusian " .. pos .. " with multiple stems.",
parents = {{name = pos .. " by inflection type", sort = "multiple stems"}},
}
labels = {
description = "Belarusian " .. pos .. " with multiple accent patterns. See ].",
parents = {{name = pos .. " by inflection type", sort = "multiple accent patterns"}},
}
labels = {
description = "Belarusian " .. pos .. " with adjectival endings.",
parents = {pos},
}
labels = {
description = "Belarusian " .. pos .. " with an irregular stem, which occurs in all cases except the nominative singular and maybe the accusative singular.",
parents = {{name = "irregular " .. pos, sort = "stem"}},
}
labels = {
description = "Belarusian " .. pos .. " with an irregular plural stem, which occurs in all cases.",
parents = {{name = "irregular " .. pos, sort = "plural stem"}},
}
end
local noun_stem_expl = {
= "a hard consonant",
= "a velar (-к, -г or -х)",
= "a soft consonant",
= "-м (with -ен- or -ён- in some forms)",
= "-я or -а (with -т- or -ц- in most forms)",
= "-ов, -ав, -ев, -ёв, -ін or -ын",
= "-ов, -ав, -ев, -ёв, -ін or -ын",
}
local noun_stem_to_declension = {
= "third",
= "third",
= "fourth",
= "fourth",
= "fourth",
}
local noun_stem_gender_endings = {
masculine = {
= {"a hard consonant", "-ы"},
= {"a velar", "-і"},
= {"-ь", "-і"},
},
feminine = {
= {"-а", "-ы"},
= {"a velar", "-і"},
= {"-я", "-і"},
= {"-р or a hushing consonant", "-ы"},
= {"-ь or -ў", "-і"},
},
neuter = {
= {"-а or -о", "-ы"},
= {"-а or -о", "-і"},
= {"-е or -ё", "-і"},
= {"-я", "-і"},
= {"-я or -а", "-ты"},
= {"-я", "-ёны"},
},
}
local noun_vowel_alternation_expl = {
= "unstressed -а- in the lemma and stressed -э- in some remaining forms, or unstressed -я- in the lemma and stressed or unstressed -е- in some remaining forms",
= "unstressed -а- in the lemma and stressed -о- in some remaining forms, or unstressed -я- in the lemma and stressed -ё- in some remaining forms",
= "unstressed (usually word-initial) а- in the lemma and stressed во- in some remaining forms",
= "stressed (usually word-initial) во- in the lemma and unstressed а- in some remaining forms",
= "stressed -о- in the lemma and unstressed -ы- in some remaining forms",
= "unstressed -ы- in the lemma and stressed -о- in some remaining forms",
}
table.insert(handlers, function(data)
local function escape_accent(accent)
return rsub(accent, "'", "'")
end
local function get_stem_gender_text(stem, genderspec, pos)
local gender = genderspec
gender = rsub(gender, " in %-$", "")
if not noun_stem_gender_endings then
return nil
end
local endings = noun_stem_gender_endings
if not endings then
return nil
end
local sgending, plending = endings, endings
local stemtext = noun_stem_expl and " The stem ends in " .. noun_stem_expl .. "." or ""
local decltext =
rfind(stem, "declension") and "" or
" This is traditionally considered to belong to the " .. (
noun_stem_to_declension or gender == "feminine" and "first" or "second"
) .. " declension."
local genderdesc
if rfind(genderspec, "in %-$") then
genderdesc = rsub(genderspec, "in (%-)$", pos .. "s ending in %1")
else
genderdesc = "usually " .. gender .. " " .. pos .. "s"
end
return stem .. ", " .. genderdesc .. ", normally ending in " .. sgending .. " in the nominative singular " ..
" and " .. plending .. " in the nominative plural." .. stemtext .. decltext
end
local stem, gender, accent, pos = rmatch(data.label, "^(.*) (.-) adjectival accent%-(.-) (.*)s$")
if not stem then
stem, gender, pos = rmatch(data.label, "^(.*) (.-) adjectival (.*)s$")
end
if stem and noun_stem_expl then
local stemspec
if stem == "hard" then
stemspec = accent == "a" and "hard stem-stressed" or "hard ending-stressed"
else
stemspec = stem
end
local endings = adj_decl_endings
if endings then
local stemtext = " The stem ends in " .. noun_stem_expl .. "."
local accentdesc = accent == "a" and
"This " .. pos .. " is stressed according to accent pattern a (stress on the stem)." or
accent == "b" and
"This " .. pos .. " is stressed according to accent pattern b (stress on the ending)." or
"All " .. pos .. "s of this class are stressed according to accent pattern a (stress on the stem)."
local accenttext = accent and " accent-" .. accent or ""
local m, f, n, pl = unpack(endings)
local sg =
gender == "masculine" and m or
gender == "feminine" and f or
gender == "neuter" and n or
nil
return {
description = "Belarusian " .. stem .. " " .. gender .. " " .. pos ..
"s, with adjectival endings, ending in " .. (sg and sg .. " in the nominative singular and " or "") ..
pl .. " in the nominative plural." .. stemtext .. " " .. accentdesc,
breadcrumb = stem .. " " .. gender .. accenttext,
parents = {
{name = "adjectival " .. pos .. "s", sort = stem .. " " .. gender .. accenttext},
pos .. "s by stem type, gender and accent pattern",
}
}
end
end
-- First group is .* to capture e.g. "hard third-declension".
local part1, stem, gender, accent, part2, pos = rmatch(data.label, "^((.*) (.-)%-form) accent%-(.-)( (.*)s)$")
local ending
if not stem then
-- check for e.g. 'Belarusian hard masculine accent-a nouns in -а'
part1, stem, gender, accent, part2, pos, ending = rmatch(data.label, "^((.-) (+ine)) accent%-(.-)( (.*)s in %-())$")
if stem then
gender = gender .. " in -" .. ending
end
end
if stem then
local stem_gender_text = get_stem_gender_text(stem, gender, pos)
if stem_gender_text then
local accent_text = " This " .. pos .. " is stressed according to accent pattern " ..
escape_accent(accent) .. " (see ])."
return {
description = "Belarusian " .. stem_gender_text .. accent_text,
breadcrumb = "Accent-" .. escape_accent(accent),
parents = {
{name = part1 .. part2, sort = accent},
pos .. "s by stem type, gender and accent pattern",
}
}
end
end
-- First group is .* to capture e.g. "hard third-declension".
local stem, gender, pos = rmatch(data.label, "^(.*) (.-)%-form (.*)s$")
if not stem then
-- check for e.g. 'Belarusian hard masculine nouns in -а'
stem, gender, pos, ending = rmatch(data.label, "^(.-) (+ine) (.*)s in %-()$")
if stem then
gender = gender .. " in -" .. ending
end
end
if stem then
local stem_gender_text = get_stem_gender_text(stem, gender, pos)
if stem_gender_text then
return {
description = "Belarusian " .. stem_gender_text,
breadcrumb = ending and stem .. " " .. gender or stem .. " " .. gender .. "-form",
parents = {pos .. "s by stem type and gender"},
}
end
end
local pos, accent = rmatch(data.label, "^(.*)s with accent pattern (.*)$")
if accent then
return {
description = "Belarusian " .. pos .. "s with accent pattern " .. escape_accent(accent) ..
" (see ]).",
breadcrumb = {name = escape_accent(accent), nocap = true},
parents = {{name = pos .. "s by accent pattern", sort = accent}},
}
end
local pos, alternation = rmatch(data.label, "^(.*)s with (.*%-.*) alternation$")
if alternation then
return {
description = "Belarusian " .. pos .. "s with vowel alternation between " ..
noun_vowel_alternation_expl .. ".",
breadcrumb = {name = alternation, nocap = true},
parents = {{name = pos .. "s by vowel alternation", sort = alternation}},
}
end
end)
return {LABELS = labels, HANDLERS = handlers}