Module:Pinyin
| This module is rated as beta. It is considered ready for widespread use, but as it is still relatively new, it should be applied with some caution to ensure results are as expected. |
This module converts Hanyu Pinyin input from the "lazy" numbered form (e.g. Han4yu3 pin1yin1) to the proper form with tone marks placed on the correct vowels (e.g. Hànyǔ pīnyīn). It implements {{Pinyin}}.
Additionally, the module converts the convenient shorthand v to ü, as most Chinese pinyin IMEs do, and corrects the invalid spellings nue and lue to nüe and lüe respectively. Otherwise, the module does not check whether the input pinyin is valid.
It also supports placing tone marks on less common pinyin letters such as m, n (as in ng), and ê (e.g. ng3 gives ňg).
Usage
{{#invoke:Pinyin|pinyin|input}}
- input - The values to convert to proper pinyin form. The pinyin for each individual character must be written as untoned pinyin immediately followed by its tone number, with no space between them (e.g. ma1). There is no limit on how many words the input may contain, and spaces between individual characters are optional.
-- Module table: the public entry points are attached to it and it is returned
-- at the end of the module.
local p = {}
--- Strip wiki/HTML markup from a string, keeping only its visible text.
-- Removes bold/italic quote markup, HTML tags (line breaks are kept and
-- normalised to "<br>"), wikilink brackets (a piped link keeps only its
-- label) and parser strip markers.
-- @param text string to clean
-- @return the cleaned string
local function remove_links_and_markup(text)
    -- Every pattern below is plain ASCII, so the byte-based string library
    -- is sufficient. The original called a bare `gsub`, which is not defined
    -- anywhere in this module and would fail as soon as it was called.
    local gsub = string.gsub

    -- these either are unnecessary or interfere with assimilation
    -- remove bold/italic
    -- it is not impossible to allow bold/italic when it does not interfere
    -- with assimilation, but determining when to allow or disallow that adds
    -- complication for little practical gain
    text = gsub(text, "'''", "")
    text = gsub(text, "''", "")

    -- remove HTML tags (except br)
    -- Each tag is inspected individually instead of swapping <br> for a
    -- placeholder character first: a placeholder that can also occur in
    -- ordinary text (such as a space) would turn that text into <br> too.
    text = gsub(text, "</?[A-Za-z][^>]->", function(tag)
        if tag:find("^<[Bb][Rr] */?>$") then
            return "<br>"
        end
        return ""
    end)

    -- remove wikilinks
    -- The link target may not contain brackets, so the match cannot run from
    -- an unpiped link into the pipe of a later link and swallow the text
    -- between them.
    text = gsub(text, "%[%[[^%[%]|]+|(..-)%]%]", "%1")
    text = gsub(text, "%[%[", "")
    text = gsub(text, "%]%]", "")

    text = mw.text.killMarkers(text)
    return text
end
-- Tone-marked forms of "ü"; also used for its keyboard shorthand "v".
-- `plain` is what is returned when no tone mark applies, so that a bare "v"
-- still comes out as "ü".
local umlautMarks = { "ǖ", "ǘ", "ǚ", "ǜ", plain = "ü" }

-- Tone-marked forms of every letter that can carry a pinyin tone mark,
-- indexed by tone number. Tones missing from an entry have no marked form
-- here and leave the letter unchanged.
local toneMarks = {
    ["a"] = { "ā", "á", "ǎ", "à" },
    ["A"] = { "Ā", "Á", "Ǎ", "À" },
    ["e"] = { "ē", "é", "ě", "è" },
    ["E"] = { "Ē", "É", "Ě", "È" },
    ["i"] = { "ī", "í", "ǐ", "ì" },
    ["I"] = { "Ī", "Í", "Ǐ", "Ì" },
    ["o"] = { "ō", "ó", "ǒ", "ò" },
    -- Third tone is O with caron (U+01D1), matching the other letters; the
    -- look-alike O with breve (U+014E) is not a pinyin letter.
    ["O"] = { "Ō", "Ó", "Ǒ", "Ò" },
    ["u"] = { "ū", "ú", "ǔ", "ù" },
    ["U"] = { "Ū", "Ú", "Ǔ", "Ù" },
    ["v"] = umlautMarks,
    ["ü"] = umlautMarks,
    ["Ü"] = { "Ǖ", "Ǘ", "Ǚ", "Ǜ" },
    ["Ê"] = { "Ê̄", "Ế", "Ê̌", "Ề" },
    ["ê"] = { "ê̄", "ế", "ê̌", "ề" },
    ["N"] = { [2] = "Ń", [3] = "Ň", [4] = "Ǹ" },
    ["n"] = { [2] = "ń", [3] = "ň", [4] = "ǹ" },
    ["M"] = { [2] = "Ḿ", [4] = "M̀" },
    ["m"] = { [2] = "ḿ", [4] = "m̀" },
}

--- Return a letter with the diacritic for the given tone attached.
-- @param a the letter to mark (a single pinyin letter, or "v" as shorthand
--          for "ü")
-- @param n tone number, as a number or numeric string (converted with
--          tonumber)
-- @return the tone-marked letter; the letter unchanged when it cannot carry
--         a mark or has no form for that tone (including any tone outside
--         1-4), except that "v" then still becomes "ü"
function attachTone(a, n)
    local marks = toneMarks[a]
    if not marks then
        return a
    end
    -- tonumber may yield nil or a non-integer; indexing with either simply
    -- finds nothing and falls through to the unmarked form.
    return marks[tonumber(n)] or marks.plain or a
end
-- Letters that may carry the tone mark, in order of precedence. Each rule is
-- { cluster, carrier, prefix }: if `cluster` occurs in the syllable, the mark
-- goes on `carrier` and `prefix` is the unmarked part of the cluster kept in
-- front of it (only "iu" needs one).
-- "o" must rank above "i": in "iong" syllables (xiong, jiong, qiong) the mark
-- belongs on the "o", not on the medial "i".
local tonePriority = {
    { "A", "A", "" },
    { "a", "a", "" },
    { "E", "E", "" },
    { "e", "e", "" },
    { "Ê", "Ê", "" },
    { "ê", "ê", "" },
    { "O", "O", "" },
    { "o", "o", "" },
    { "iu", "u", "i" }, -- in "iu" the mark goes on the final "u"
    { "i", "i", "" },   -- also covers "ui", where the mark goes on the "i"
    { "u", "u", "" },
    { "v", "v", "" },
    { "ü", "ü", "" },
    { "N", "N", "" },
    { "n", "n", "" },
    { "M", "M", "" },
    { "m", "m", "" },
}

--- Put the tone mark for tone `n` on the appropriate letter of a syllable.
-- Used as the replacement callback of string.gsub in p.pinyin, which passes
-- the letters and the tone digit captured from the input.
-- @param chara the untoned syllable (letters only); may be nil
-- @param n tone number, passed through to attachTone
-- @return the syllable with the chosen letter replaced by its toned form,
--         followed by string.gsub's substitution count; nothing when `chara`
--         is nil or contains no letter that can carry a mark (string.gsub
--         then keeps the original text, tone digit included)
function selectVowel(chara, n)
    if not chara then
        return
    end
    for _, rule in ipairs(tonePriority) do
        local cluster, carrier, prefix = rule[1], rule[2], rule[3]
        -- Plain find: the clusters are literal text, not patterns.
        if chara:find(cluster, 1, true) then
            return chara:gsub(cluster, prefix .. attachTone(carrier, n))
        end
    end
end
--- Convert numbered pinyin (e.g. "Han4yu3") to pinyin with tone marks.
-- @param frame frame object; the text to convert is read from frame.args[1]
-- @return the converted text, or nothing when no input was given
function p.pinyin(frame)
    local input = frame.args[1]
    if not input then
        return
    end
    -- "nue"/"lue" are misspellings of "nüe"/"lüe". Rewrite them with the "v"
    -- shorthand, which the last step turns into "ü". The initial is captured
    -- so that capitalised syllables ("Nue4", "Lue4") are corrected as well.
    local normalized = input:gsub("([NnLl])ue", "%1ve")
    -- Each run of letters directly followed by a tone digit is handed to
    -- selectVowel; when it returns nothing the run is left as it was.
    local toned = normalized:gsub("([%aüÊê]+)(%d)", selectVowel)
    -- Any "v" still present carried no tone mark; parentheses drop gsub's
    -- substitution count so only the text is returned.
    return (toned:gsub("v", "ü"))
end
-- Hand the module table, with its public functions, to whoever loaded the module.
return p
Content Disclaimer
Informasi ini disarikan dari Wikipedia dan disajikan kembali untuk tujuan edukasi. Konten tersedia di bawah lisensi CC BY-SA 3.0. Kami tidak bertanggung jawab atas ketidakakuratan data yang bersumber dari kontribusi publik tersebut.
- The information displayed on this website is sourced in part or in whole from Wikipedia and has been adapted for the purpose of restating it. We strive to provide accurate and relevant information, however:
- There is no guarantee of absolute accuracy. Wikipedia is an open, collaborative project that can be edited by anyone, so information is subject to change.
- It is not intended to constitute professional advice. The content displayed is for informational and educational purposes only. For important decisions (e.g., medical, legal, or financial), please consult a professional.
- Content copyright. Wikipedia is licensed under the Creative Commons Attribution-ShareAlike License (CC BY-SA). This means that content may be reused with appropriate attribution and shared under a similar license.
- Responsible use. Any risk arising from the use of information from this website is entirely the responsibility of the user.