Module:Pinyin
Appearance
This module is rated as beta and is ready for widespread use. It is still new and should be used with some caution to ensure the results are as expected.
This module converts Hanyu Pinyin input from the "lazy" numbered form (e.g. Han4yu3 pin1yin1) to the proper form with tone marks placed on the correct vowels (e.g. Hànyǔ pīnyīn). It implements {{Pinyin}}.
Additionally, the module converts the convenient shorthand v to ü, as in most Chinese pinyin IMEs, and corrects the erroneous nue and lue to nüe and lüe, respectively. Otherwise, the module does not check whether the input pinyin is valid.
It also supports placing the tone mark on esoteric pinyin syllables such as m, ng, and ê (e.g. ng3 gives ňg).
Usage
{{#invoke:Pinyin|pinyin|input}}
- input - The text to convert to proper pinyin form. The pinyin for each character must be written as untoned pinyin followed immediately by its tone number, with no space between them (e.g. ma1); there is no limit on how many words the input contains, and spaces between individual characters are optional.
-- Module table: the public entry point p.pinyin is attached to it, and the
-- table itself is returned at the end of the file.
local p = {}
-- Tone-marked forms of every letter that can carry a pinyin tone mark,
-- keyed by the bare letter and then by tone number (1-4).
-- `base` is the form returned when the tone number has no entry; letters
-- without a `base` field are returned unchanged in that case.
-- Not every letter has all four tones: n/N have no tone 1 entry and m/M only
-- have tones 2 and 4, so the missing tones fall back to the bare letter.
local TONE_MARKS = {
    ["a"] = { "ā", "á", "ǎ", "à" },
    ["A"] = { "Ā", "Á", "Ǎ", "À" },
    ["e"] = { "ē", "é", "ě", "è" },
    ["E"] = { "Ē", "É", "Ě", "È" },
    ["i"] = { "ī", "í", "ǐ", "ì" },
    ["I"] = { "Ī", "Í", "Ǐ", "Ì" },
    ["o"] = { "ō", "ó", "ǒ", "ò" },
    -- Tone 3 is the caron form (U+01D1), consistent with every other
    -- third-tone entry; the breve form (U+014E) is not a pinyin letter.
    ["O"] = { "Ō", "Ó", "Ǒ", "Ò" },
    ["u"] = { "ū", "ú", "ǔ", "ù" },
    ["U"] = { "Ū", "Ú", "Ǔ", "Ù" },
    -- "v" is accepted as shorthand for "ü"; even without a tone it is
    -- normalised to "ü".
    ["v"] = { base = "ü", "ǖ", "ǘ", "ǚ", "ǜ" },
    ["ü"] = { base = "ü", "ǖ", "ǘ", "ǚ", "ǜ" },
    ["V"] = { base = "Ü", "Ǖ", "Ǘ", "Ǚ", "Ǜ" },
    ["Ü"] = { base = "Ü", "Ǖ", "Ǘ", "Ǚ", "Ǜ" },
    ["Ê"] = { "Ê̄", "Ế", "Ê̌", "Ề" },
    ["ê"] = { "ê̄", "ế", "ê̌", "ề" },
    ["N"] = { [2] = "Ń", [3] = "Ň", [4] = "Ǹ" },
    ["n"] = { [2] = "ń", [3] = "ň", [4] = "ǹ" },
    ["M"] = { [2] = "Ḿ", [4] = "M̀" },
    ["m"] = { [2] = "ḿ", [4] = "m̀" },
}

-- Return letter `a` carrying the tone mark for tone `n`.
--   a: a single letter (string), e.g. "a", "ü", "N".
--   n: the tone, as a number or a numeric string; it is passed through
--      tonumber() before the lookup.
-- Returns the marked letter when one is defined for that letter and tone.
-- Otherwise returns the letter's toneless form: "ü"/"Ü" for the v/ü family,
-- and `a` itself for everything else (including letters not in the table).
-- NOTE(review): this is declared as a global function; it is left global here
-- so the name stays visible to whatever currently calls it.
function attachTone(a, n)
    local marks = TONE_MARKS[a]
    if not marks then
        return a
    end
    return marks[tonumber(n)] or marks.base or a
end
-- Letters (or letter pairs) that may receive the tone mark, in priority
-- order: the first entry found anywhere in the chunk is the one that is marked.
-- a and e always win, then o; "iu" is listed before "i" because in that final
-- the mark belongs on the u. O/o must come before i so that finals such as
-- "iong" are marked on the o ("xiong2" -> "xióng", not "xíong").
-- The syllabic nasals n and m are only reached when no vowel is present.
local TONE_CARRIER_ORDER = {
    "A", "a", "E", "e", "Ê", "ê", "O", "o",
    "iu", "i", "u", "v", "ü", "N", "n", "M", "m",
}

-- Put the tone mark for tone `n` on the appropriate letter of `chara`.
--   chara: a run of letters preceding a tone digit (string), or nil.
--   n:     the tone digit, forwarded unchanged to attachTone.
-- Returns the result of string.gsub on `chara` (the rewritten string followed
-- by the replacement count), with the tone digit thereby dropped by the caller.
-- Every occurrence of the selected letter in the chunk is replaced.
-- Returns nothing when `chara` is nil or contains none of the listed letters;
-- when used as a gsub replacement callback this leaves the original text,
-- digit included, untouched.
-- NOTE(review): declared as a global function; kept global so existing
-- references to the name keep working.
function selectVowel(chara, n)
    if not chara then
        return
    end
    for _, key in ipairs(TONE_CARRIER_ORDER) do
        -- Plain-text search: the keys are literal letters, not patterns.
        if chara:find(key, 1, true) then
            local marked
            if key == "iu" then
                marked = "i" .. attachTone("u", n)
            else
                marked = attachTone(key, n)
            end
            return chara:gsub(key, marked)
        end
    end
end
-- Entry point: convert numbered pinyin in the first argument to tone-marked
-- pinyin.
--   frame: the invocation frame; only frame.args[1] is read.
-- Returns the converted string, or nothing when no first argument was given.
function p.pinyin(frame)
    local input = frame.args[1]
    if not input then
        return
    end
    -- Rewrite the common misspellings "nue"/"lue" to the "v" shorthand so they
    -- end up as "nüe"/"lüe". The initial is matched in either case so that
    -- capitalised syllables such as "Lue4" are corrected as well.
    local normalized = input:gsub("([NnLl])ue", "%1ve")
    -- Each run of letters followed by a single digit is handed to selectVowel
    -- as (letters, digit). Lua patterns work on bytes, so the non-ASCII
    -- letters in the class are matched through their individual UTF-8 bytes.
    local converted = normalized:gsub("([%aüÊê]+)(%d)", selectVowel)
    -- Any remaining "v" shorthand becomes "ü"; the parentheses drop gsub's
    -- second return value (the replacement count).
    return (converted:gsub("v", "ü"))
end
-- Export the module table.
return p