Module:Pinyin

Neet di̱ Wikipedia

This module converts Hanyu Pinyin input from the "lazy" numbered form (e.g. Han4yu3 pin1yin1) to the proper form with tone marks placed on the correct vowels (e.g. Hànyǔ pīnyīn). It implements {{Pinyin}}.

Additionally, the module converts the convenient shorthand v to ü, as most Chinese pinyin IMEs do, and corrects the invalid spellings nue and lue to nüe and lüe respectively. Otherwise, the module does not check whether the input pinyin is valid.

It also supports placing tone marks on less common syllabic forms such as m, ng, and ê (e.g. ng3 gives ňg).

Usage[jhyuk a̱tyin ka]

{{#invoke:Pinyin|pinyin|input}}
  • input - The text to convert to proper pinyin form. Each syllable must be written as untoned pinyin immediately followed by its tone number, with no space between them (e.g. ma1). There is no limit on the number of words, and spaces between syllables are optional.



-- Export table for this module; the public entry point is attached to it
-- below and the table is returned at the end of the file.
local p = {}

-- Tone-marked forms of every letter that can carry a pinyin tone mark,
-- indexed by tone number (1-4). A tone without an entry (for example tone 1
-- on n/m, or tone 3 on m) leaves the letter unmarked.
local TONE_MARKS = {
	["a"] = { "ā", "á", "ǎ", "à" },
	["A"] = { "Ā", "Á", "Ǎ", "À" },
	["e"] = { "ē", "é", "ě", "è" },
	["E"] = { "Ē", "É", "Ě", "È" },
	["i"] = { "ī", "í", "ǐ", "ì" },
	-- Tone 3 is written with a caron (Ǒ, U+01D1), not a breve (Ŏ, U+014E).
	["O"] = { "Ō", "Ó", "Ǒ", "Ò" },
	["o"] = { "ō", "ó", "ǒ", "ò" },
	["u"] = { "ū", "ú", "ǔ", "ù" },
	["v"] = { "ǖ", "ǘ", "ǚ", "ǜ" },
	["ü"] = { "ǖ", "ǘ", "ǚ", "ǜ" },
	["Ê"] = { "Ê̄", "Ế", "Ê̌", "Ề" },
	["ê"] = { "ê̄", "ế", "ê̌", "ề" },
	["N"] = { [2] = "Ń", [3] = "Ň", [4] = "Ǹ" },
	["n"] = { [2] = "ń", [3] = "ň", [4] = "ǹ" },
	["M"] = { [2] = "Ḿ", [4] = "M̀" },
	["m"] = { [2] = "ḿ", [4] = "m̀" },
}

-- Return letter `a` carrying the mark for tone `n`.
--   a: a single letter as a string ("a", "E", "ü", "v", "n", ...).
--   n: the tone, as a number or a numeric string ("3"); anything that is not
--      a tone with a marked form for `a` yields the unmarked letter.
-- The shorthand "v" is always returned as a form of "ü", marked or not.
-- Letters with no entry in TONE_MARKS are returned unchanged.
function attachTone(a, n)
	local tone = tonumber(n)
	local forms = TONE_MARKS[a]
	if forms then
		local marked = forms[tone]
		if marked then
			return marked
		end
		if a == "v" then
			return "ü"
		end
	end
	return a
end


-- Letters (and the "iu" final) that can receive the tone mark, in the order
-- they are tried. "a" and "e" always win; "o" is tried before "i" so that
-- finals such as "iong" and "ou" are marked on the "o"; "iu" is marked on the
-- "u"; the remaining entries are used only when nothing earlier is present.
local TONE_CARRIER_PRIORITY = {
	"A", "a", "E", "e", "Ê", "ê",
	"O", "o",
	"iu", "i", "u", "v", "ü",
	"N", "n", "M", "m",
}

-- Place the mark for tone `n` on the appropriate letter of `chara`.
--   chara: the letters that preceded a tone digit in the input.
--   n:     the tone digit (number or numeric string), passed on to attachTone.
-- Returns the marked text as a single value, or nothing when `chara` is nil
-- or contains none of the letters in TONE_CARRIER_PRIORITY. When used as a
-- string.gsub callback, returning nothing leaves the matched text untouched.
-- Every occurrence of the chosen letter in `chara` is replaced.
function selectVowel(chara, n)
	if not chara then
		return
	end

	for _, target in ipairs(TONE_CARRIER_PRIORITY) do
		-- Plain (non-pattern) search: only substring presence matters here.
		if chara:find(target, 1, true) then
			local marked
			if target == "iu" then
				marked = "i" .. attachTone("u", n)
			else
				marked = attachTone(target, n)
			end
			-- Parentheses drop gsub's replacement count.
			return (chara:gsub(target, marked))
		end
	end
end

-- Entry point: convert numbered pinyin in the first argument to tone-marked
-- pinyin.
--   frame: object whose `args[1]` holds the text to convert.
-- Returns the converted string, or nothing when no first argument was given.
function p.pinyin(frame)
	local input = frame.args[1]
	if not input then
		return
	end
	-- "nue"/"lue" are rewritten with the "v" shorthand so they come out as
	-- nüe/lüe. The initial is captured so that capitalised input ("Nue4",
	-- "Lue4") is corrected as well as lowercase.
	local ve = input:gsub("([NnLl])ue", "%1ve")
	-- Each run of letters followed by a tone digit is handed to selectVowel,
	-- which returns the marked text without the digit.
	local out = ve:gsub("([%aüÊê]+)(%d)", selectVowel)
	-- Any "v" that did not receive a tone mark still becomes "ü".
	return (out:gsub("v", "ü"))
end

 
-- Hand the export table back to whatever loaded this module.
return p