မဝ်ဂျူ:auto cat
Documentation for this module may be created at မဝ်ဂျူ:auto cat/doc
local export = {}
-- Used in multiple places; create a variable for ease in testing.
local poscatboiler_submodule = "poscatboiler"
local labelPatterns = {
"ဝေါဟာ.-", "ဂၞန်သင်္ချာ", "နဲကဲဗီုပြၚ်အပြံၚ်အလှာဲကြိယာ.-", "Participle.-", "အရာမစဵုဒၞာ", "အရီုအဗၚ်", "မှဝ်", "မဝ်ဖဳယျာ.-",
"သၚ်္ကေတမထပိုတ်ကုတ်ဝါကျ", "ဗျဥ်မအက္ခဝ်လိက်", "ဂၞန်သင်္ချာ", "အၚ်္ဂသွက်သ္ဂောံပ္တိတ်ရမျာၚ်မအခဝ်", "သင်္ကေတ", "ဇၟန်လိက်", "ဝါကျ",
"ဗီုရုပ်မုက်လိက်", "ဗီုမရပ်စကာဂလာန်မလိက်", "Chengyu", "palindrome", "ယၟု.-",
"ပွမချဳဒရာၚ်.-", "အဆက်လက္ကရဴ", "မဝ်ဂျူ.-", "ထာမ်ပလိက်.-",
}
local function splitLabelLang(titleObject)
local getByCanonicalName = require("Module:languages").getByCanonicalName
local canonicalName
local label, lang
local pattern
--[=[
-- Progressively add another word to the potential canonical name until it
-- matches an actual canonical name.
local words = mw.text.split(titleObject.text, " ")
for i = #words - 1, 1, -1 do
canonicalName = table.concat(words, " ", 1, i)
lang = getByCanonicalName(canonicalName)
if lang then
break
end
end
local label = lang and titleObject.text:sub(#canonicalName + 2)
or titleObject.text
--]=]
if titleObject.text:find("^ဝေါဟာ") and not titleObject.text:find("^ဝေါဟာမနွံဒၞာဲ") then
-- ဗက်ကဆံၚ် "တၞဟ်ခြာ" တိုန်ကၠာဟိုတ်နူမနွံကဏ္ဍ "တာလျိုၚ်"
canonicalName, label = titleObject.text:match("^ဝေါဟာ(ဗက်အလိုက်အရေဝ်ဘာသာ)(တၞဟ်ခြာ.+)$")
if not canonicalName then
canonicalName, label = titleObject.text:match("^ဝေါဟာ(ဗက်အလိုက်အရေဝ်ဘာသာ)(ပ္ဍဲ.+)$")
end
if not canonicalName then
canonicalName, label = titleObject.text:match("^မအရေဝ်ဝေါဟာ(.+)(တၞဟ်ခြာ.+)$")
end
if not canonicalName then
canonicalName, label = titleObject.text:match("^မအရေဝ်ဝေါဟာ(.+)(ပ္ဍဲ.+)$")
end
if canonicalName then
label = "ဝေါဟာ" .. label
lang = getByCanonicalName(canonicalName)
end
else
for _,pattern in ipairs(labelPatterns) do
label, canonicalName = titleObject.text:match("^(" .. pattern .. ")(ဗက်အလိုက်အရေဝ်ဘာသာ)$")
if not canonicalName then
label, canonicalName = titleObject.text:match("^(" .. pattern .. ")ဘာသာ(.+)$")
end
if canonicalName then
lang = getByCanonicalName(canonicalName)
break
end
end
end
return label, lang
end
-- Add the arguments in `source` to those in `receiver`, offsetting numeric arguments by `offset`.
local function add_args(receiver, source, offset)
for k, v in pairs(source) do
if type(k) == "number" then
receiver[k + offset] = v
else
receiver[k] = v
end
end
return receiver
end
-- List of handler functions that try to match the page name.
-- A handler should return a table of template title plus arguments
-- that is passed to frame:expandTemplate.
-- If a handler does not recognise the page name, it should return nil.
-- Note that the order of functions matters!
local handlers = {}
local function add_handler(func)
table.insert(handlers, func)
end
-- Topical categories
add_handler(function(titleObject)
--[[
if not titleObject.text:find("^[a-z-]+:.") then
return nil
end
local code, label = titleObject.text:match("^([a-z-]+):(.+)$")
--]]
-- ချူတၟိ
if not titleObject.text:find("^ဗက်အလိုက်အရေဝ်ဘာသာ:.") and not titleObject.text:find("^ဘာသာ.+:.") then
return nil
end
local langName, label = titleObject.text:match("^(ဗက်အလိုက်အရေဝ်ဘာသာ):(.+)$")
local code = (langName and "mul" or nil)
if code == nil then
langName, label = titleObject.text:match("^ဘာသာ(.+):(.+)$")
code = (langName and require("Module:languages").getByCanonicalName(langName):getCode() or nil)
end
return {title = "topic cat", args = {code, label}}
end)
-- Letter names
add_handler(function(titleObject)
if not titleObject.text:find("letter names$") then
return nil
end
local langCode = titleObject.text:match("^([^:]+):")
local lang, cat
if langCode then
lang = require("Module:languages").getByCode(langCode) or error('The language code "' .. langCode .. '" is not valid.')
cat = titleObject.text:match(":(.+)$")
else
cat = titleObject.text
end
return {title = "topic cat", args = {lang and lang:getCode() or nil, cat}}
end)
-- letter cat
add_handler(function(titleObject)
-- Only recognize cases consisting of an uppercase letter followed by the
-- corresponding lowercase letter, either as the entire category name or
-- followed by a colon (for cases like [[Category:Gg: ⠛]]). Cases that
-- don't fit this profile (e.g. for Turkish [[Category:İi]] and
-- [[Category:Iı]]) need to call {{letter cat}} directly. Formerly this
-- handler was much less restrictive and would fire on categories named
-- [[Category:zh:]], [[Category:RFQ]], etc.
local upper, lower = mw.ustring.match(titleObject.text, "^(%u)(%l)%f[:%z]")
if not upper or mw.ustring.upper(lower) ~= upper then
return nil
end
return {title = "letter cat"}
end)
-- poscatboiler lang-specific
add_handler(function(titleObject, args)
local label, lang = splitLabelLang(titleObject)
if lang then
local baseLabel, script = label:match("(.+)နကဵုမအခဝ်(.-)$")
if script and baseLabel ~= "ဝေါဟာ" then
local scriptObj = require("Module:scripts").getByCanonicalName(script)
if scriptObj then
return {title = poscatboiler_submodule, args = add_args({lang:getCode(), baseLabel, scriptObj:getCode()}, args, 3)}, true
end
end
return {title = poscatboiler_submodule, args = add_args({lang:getCode(), label}, args, 3)}, true
end
end)
-- poscatboiler umbrella category
add_handler(function(titleObject, args)
local label = titleObject.text:match("(.+)ဗက်အလိုက်အရေဝ်ဘာသာ$")
if label then
return {
title = poscatboiler_submodule,
args = add_args({nil, mw.getContentLanguage():lcfirst(label)}, args, 3)
}, true
end
end)
-- topic cat
add_handler(function(titleObject)
return {title = "topic cat", args = {nil, titleObject.text}}
end)
-- poscatboiler raw handlers
add_handler(function(titleObject, args)
local args = add_args({nil, titleObject.text}, args, 3)
args.raw = true
return {
title = poscatboiler_submodule,
args = args,
}, true
end)
-- poscatboiler umbrella handlers without 'by language'
add_handler(function(titleObject, args)
local args = add_args({nil, mw.getContentLanguage():lcfirst(titleObject.text)}, args, 3)
return {
title = poscatboiler_submodule,
args = args,
}, true
end)
function export.show(frame)
local args = frame:getParent().args
local titleObject = mw.title.getCurrentTitle()
if titleObject.nsText == "ထာမ်ပလိက်" then
return "(This template should be used on pages in the Category: namespace.)"
elseif titleObject.nsText ~= "ကဏ္ဍ" then
error("This template/module can only be used on pages in the Category: namespace.")
end
local function extra_args_error(templateObject)
local numargstext = {}
local argstext = {}
local maxargnum = 0
for k, v in pairs(templateObject.args) do
if type(v) == "number" and v > maxargnum then
maxargnum = v
else
table.insert(numargstext, "|" .. k .. "=" .. v)
end
end
for i = 1, maxargnum do
local v = templateObject.args[i]
if v == nil then
v = "(nil)"
elseif v == true then
v = "(true)"
elseif v == false then
v = "(false)"
end
table.insert(argstext, "|" .. v)
end
error("Extra arguments to {{auto cat}} not allowed for this category (recognized as {{[[Template:" ..
templateObject.title .. "|" .. templateObject.title .. "]]" .. numargstext .. argstext .. "}}")
end
local first_error_templateObject, first_error_args_handled, first_error_cattext
-- Go through each handler in turn. If a handler doesn't recognize the format of the
-- category, it will return nil, and we will consider the next handler. Otherwise,
-- it returns a template name and arguments to call it with, but even then, that template
-- might return an error, and we need to consider the next handler. This happens,
-- for example, with the category "CAT:Mato Grosso, Brazil", where "Mato" is the name of
-- a language, so the handler for {{poscatboiler}} fires and tries to find a label
-- "Grosso, Brazil". This throws an error, and previously, this blocked fruther handler
-- consideration, but now we check for the error and continue checking handlers;
-- eventually, {{topic cat}} will fire and correctly handle the category.
for _, handler in ipairs(handlers) do
local templateObject, args_handled = handler(titleObject, args)
if templateObject then
require("Module:debug").track("auto cat/" .. templateObject.title)
local cattext = frame:expandTemplate(templateObject)
-- FIXME! We check for specific text found in most or all error messages generated
-- by category tree templates (in particular, the second piece of text below should be
-- in all error messages generated when a given module doesn't recognize a category name).
-- If this text ever changes in the source modules (e.g. [[Module:category tree]],
-- it needs to be changed here as well.)
if cattext:find("Category:Categories with invalid label") or
cattext:find("The automatically%-generated contents of this category has errors") then
if not first_error_cattext then
first_error_templateObject = templateObject
first_error_args_handled = args_handled
first_error_cattext = cattext
end
else
if not args_handled and next(args) then
extra_args_error(templateObject)
end
return cattext
end
end
end
if first_error_cattext then
if not first_error_args_handled and next(args) then
extra_args_error(first_error_templateObject)
end
return first_error_cattext
end
error("{{auto cat}} couldn't recognize format of category name")
end
-- test function for injecting title string
function export.test(title)
if type(title) == "table" then
title = title:getParent().args[1]
end
local titleObject = {}
titleObject.text = title
for _, handler in ipairs(handlers) do
local t = handler(titleObject)
if t then
return t.title
end
end
end
return export