Zum Inhalt springen

Modul:chm-translit

Vun Wiktionary

This module transliterates Mari (Eastern and Western) text per WT:CHM TR. Call its exported function tr.


-- This is a module to transliterate Mari (Eastern/Meadow (standard) and Western/Hill) Cyrillic words to Latin
 
local export = {}
 
-- Cyrillic-to-Latin letter map. export.tr applies it one character at a time
-- after its "е" -> "je" rules have run; characters without an entry are left
-- unchanged. It is declared local (and therefore before export.tr) so that the
-- function always sees this table rather than whatever a global named `tab`
-- happens to hold at call time.
local tab = {
    ["А"]="A", ["Б"]="B", ["В"]="V", ["Г"]="G", ["Д"]="D", ["Е"]="E", ["Ё"]="Jo", ["Ж"]="Ž", ["З"]="Z", ["И"]="I", ["Й"]="J",
    ["К"]="K", ["Л"]="L", ["М"]="M", ["Н"]="N", ["Ҥ"]="Ŋ", ["О"]="O", ["Ӧ"]="Ö", ["П"]="P", ["Р"]="R", ["С"]="S", ["Т"]="T",
    ["У"]="U", ["Ӱ"]="Ü", ["Ф"]="F", ["Х"]="X", ["Ц"]="C", ["Ч"]="Č", ["Ш"]="Š", ["Щ"]="Šč", ["Ъ"]="ʺ", ["Ы"]="Y", ["Ь"]="ʹ",
    ["Э"]="E", ["Ю"]="Ju", ["Я"]="Ja",
    ['а']='a', ['б']='b', ['в']='v', ['г']='g', ['д']='d', ['е']='e', ['ё']='jo', ['ж']='ž', ['з']='z', ['и']='i', ['й']='j',
    ['к']='k', ['л']='l', ['м']='m', ['н']='n', ['ҥ']='ŋ', ['о']='o', ['ӧ']='ö', ['п']='p', ['р']='r', ['с']='s', ['т']='t',
    ['у']='u', ['ӱ']='ü', ['ф']='f',
    ['х']='x', ['ц']='c', ['ч']='č', ['ш']='š', ['щ']='šč', ['ъ']='ʺ', ['ы']='y', ['ь']='ʹ', ['э']='e', ['ю']='ju', ['я']='ja',
    -- Hill (Western) Mari only, doesn't use Ҥ, ҥ
    ["Ӓ"]="Ä", ["Ӹ"]="Ÿ", ['ӓ']='ä', ['ӹ']='ÿ',
}

--- Transliterate Mari (Meadow/Eastern and Hill/Western) Cyrillic text to Latin.
-- @param word  the text to transliterate, or a table with an `args` field
--              (as passed when invoked from a template), in which case
--              `args[1]` is used as the text
-- @return the transliterated string
function export.tr(word)
    local gsub = mw.ustring.gsub

    if type(word) == 'table' then -- called directly from a template
        word = word.args[1]
    end

    -- Compose a decomposed Ё/ё (base letter + combining diaeresis U+0308) into
    -- the single code point the lookup table is keyed on. The combining mark is
    -- written as its UTF-8 bytes (\204\136) so this line keeps working even if
    -- the module text itself is Unicode-normalised.
    word = word:gsub("е\204\136", "ё"):gsub("Е\204\136", "Ё")

    -- е after a vowel, after ъ/ь, after any non-letter, or at the beginning of
    -- a word becomes je. The preceding character may carry a combining acute
    -- (U+0301 = \204\129) or grave (U+0300 = \204\128) stress mark.
    local before_je = "АӒОӦУӰЫӸЭЯЁЮИЕЪЬаӓоӧуӱыӹэяёюиеъь%A"
    local stress_marks = "\204\129\204\128"
    word = gsub(word, "([" .. before_je .. "][" .. stress_marks .. "]?)е", "%1je")
    word = gsub(word, "^Е", "Je")
    word = gsub(word, "^е", "je")
    -- Also treat Е/е that follows any character outside the Cyrillic block
    -- U+0400–U+04FF as word-initial.
    word = gsub(word, "([^Ѐ-ӿ])Е", "%1Je")
    word = gsub(word, "([^Ѐ-ӿ])е", "%1je")

    -- Map the remaining characters one by one; the parentheses drop gsub's
    -- second return value (the substitution count).
    return (gsub(word, '.', tab))
end
 
return export