Модуль:script utilities/tracking
Көрүнүш
Көзөмөлгө алынган шарттардын тизмеси
[түзөтүү]Ар бир тил үчүн көз салынган бардык үлгүлөр, аларга көз салып турган Wiktionary:Tracking/script субшаблону үчүн "Бул жерде кандай шилтемелер бар" барагына шилтеме. Диакритика окууну жеңилдетүү үчүн чекиттүү тегеректе (э.) көрсөтүлөт.
Ар бир тил үчүн көзөмөлдөнүүчү бардык үлгүлөр, аларга көз салган Wiktionary:Tracking/script субшаблонунун "Бул жерде кандай шилтемелер бар" барагына шилтеме менен. Диакритика окууга жеңил болушу үчүн чекиттүү тегеректин (◌) үстүндө көрсөтүлөт.
- Tibetan: [་།]$, [་།]%]%]$ (Tibetan/trailing-punctuation),
- Thai: เเ (Thai/broken-ae), ํ[◌่◌้◌๊◌๋]?า (Thai/broken-am), [ฤฦ]า (Thai/wrong-rue-lue),
- Белгисиз: ϑ (Greek/wrong-theta), ϰ (Greek/wrong-kappa), ϱ (Greek/wrong-rho), ϕ (Greek/wrong-phi),
- Russian: ◌̀ (Russian/grave-accent),
- Lao: ເເ (Lao/broken-ae), ໍ[◌່◌້◌໊◌໋]?າ (Lao/broken-am), ຫນ (Lao/possible-broken-ho-no), ຫມ (Lao/possible-broken-ho-mo), ຫລ (Lao/possible-broken-ho-lo),
- Old English: ◌́ (/ang/acute),
- Ancient Greek: ᾽ (Ancient Greek/spacing-coronis), ᾿ (Ancient Greek/spacing-smooth-breathing), [᾽᾿] (Ancient Greek/wrong-apostrophe),
- Lü: ᦵᦵ (Lü/broken-ae), [ᦀ-ᦫ][ᦵᦶᦷᦺ] (Lü/possible-wrong-sequence)
local export = {}
local U = mw.ustring.char
--[[
-- redirect_to: tracking conditions to redirect to (allows multiple languages
to use the same conditions)
-- path: added to Wiktionary:Tracking; default is language code (or code under
tracking conditions are listed)
-- Wiktionary:Tracking/Greek
-- Wiktionary:Tracking/ang
-- code: added after path
-- Wiktionary:Tracking/Greek/spacing-coronis
-- Wiktionary:Tracking/ang/acute
-- chars: what to search for in the text; can be a table containing multiple
patterns
]]
export.allTrackingConditions = {
["ang"] = {
{ chars = U(0x301), code = "acute", decompose = true },
},
["grc"] = {
{ redirect_to = "Greek" },
path = "Ancient Greek",
{ chars = U(0x1FBD), code = "spacing-coronis" },
{ chars = U(0x1FBF), code = "spacing-smooth-breathing" },
{ chars = "[" .. U(0x1FBD) .. U(0x1FBF) .. "]", code = "wrong-apostrophe" },
},
["el"] = {
{ redirect_to = "Greek" },
},
["Greek"] = {
{ chars = "ϑ", code = "wrong-theta" },
{ chars = "ϰ", code = "wrong-kappa" },
{ chars = "ϱ", code = "wrong-rho" },
{ chars = "ϕ", code = "wrong-phi" },
},
["ru"] = {
path = "Russian",
{ chars = U(0x300), code = "grave-accent", decompose = true },
},
["bo"] = {
path = "Tibetan",
{ chars = { "[་།]$", "[་།]%]%]$" }, code = "trailing-punctuation" },
},
["th"] = {
path = "Thai",
{ chars = "เ".."เ", code = "broken-ae" },
{ chars = "ํ[่้๊๋]?า", code = "broken-am" },
{ chars = "[ฤฦ]า", code = "wrong-rue-lue" },
},
["lo"] = {
path = "Lao",
{ chars = "ເ".."ເ", code = "broken-ae" },
{ chars = "ໍ[່້໊໋]?າ", code = "broken-am" },
{ chars = "ຫນ", code = "possible-broken-ho-no" },
{ chars = "ຫມ", code = "possible-broken-ho-mo" },
{ chars = "ຫລ", code = "possible-broken-ho-lo" },
},
["khb"] = {
path = "Lü",
{ chars = "ᦵ".."ᦵ", code = "broken-ae" },
{ chars = "[ᦀ-ᦫ][ᦵᦶᦷᦺ]", code = "possible-wrong-sequence" },
},
}
local function interpretCondition(condition, text, path)
-- Ignore conditions that don't have "chars" or "code".
local required = { "chars", "code" }
for i, param in pairs(required) do
if not condition[param] then
return nil
end
end
if type(condition.chars) ~= "table" then
condition.chars = { condition.chars }
end
for i, char in pairs(condition.chars) do
local text = condition.decompose and mw.ustring.toNFD(text) or text
if type(char) == "string" and mw.ustring.find(text, char) then
require("Module:debug").track("script/" .. path .. "/" .. condition.code)
end
end
end
local function interpretConditions(text, code)
if not text then
return nil
end
local trackingConditions = export.allTrackingConditions[code]
if trackingConditions then
local path = trackingConditions.path or code
for i, condition in ipairs(trackingConditions) do
local target = condition.redirect_to
if target then
interpretConditions(text, target)
else
local path = condition.path or path
interpretCondition(condition, text, path)
end
end
end
end
function export.track(text, lang)
local langCode = lang:getCode()
interpretConditions(text, langCode)
end
return export