Module:zh

Documentation for this module may be created at Module:zh/doc
local M = {}

local m_skeys = nil
local len = mw.ustring.len
local gsub = mw.ustring.gsub
local cmn_pron = nil

local tones = '[̄́̌̀]'

local pos_aliases_title = {
	["n"] = "Noun", 
	["pn"] = "Proper noun", 
	["propn"] = "Proper noun", 
	["pron"] = "Pronoun", 
	["v"] = "Verb", 
	["a"] = "Adjective", 
	["adj"] = "Adjective", 
	["adv"] = "Adverb", 
	["prep"] = "Preposition", 
	["postp"] = "Postposition", 
	["conj"] = "Conjunction", 
	["part"] = "Particle", 
	["suf"] = "Suffix", 
	["prov"] = "Proverb", 
	["id"] = "Idiom", 
	["ch"] = "Idiom", 
	["cy"] = "Idiom", 
	["ph"] = "Phrase", 
	["intj"] = "Interjection", 
	["cl"] = "Classifier", 
	["num"] = "Numeral", 
	["abb"] = "Abbreviation", 
	["deter"] = "Determiner",
}

local pos_aliases_head = {
	["n"] = "noun", 
	["pn"] = "proper noun", 
	["propn"] = "proper noun", 
	["v"] = "verb", 
	["a"] = "adj",
	["postp"] = "post", 
	["conj"] = "con", 
	["part"] = "particle", 
	["pron"] = "pronoun", 
	["prov"] = "proverb", 
	["id"] = "idiom", 
	["ch"] = "idiom", 
	["cy"] = "idiom", 
	["ph"] = "phrase", 
	["intj"] = "interj", 
	["abb"] = "abbr", 
	["cl"] = "cls", 
	["deter"] = "det",
}

local function replace_chars(s, tab)
	local output = {}
	for cp in mw.ustring.gcodepoint(s) do
		local ch = mw.ustring.char(cp)
		table.insert(output, tab[ch] or ch)
	end
	return table.concat(output)
end

function M.sortkey_conv(f)
	local m_sort_data = mw.loadData("Module:zh/data/sortkey")
	local rs = type(f) == 'table' and f.args[1] or f
	local ch = mw.ustring.sub(rs,1,1)
	ch = m_sort_data.sortkeys[ch] or ch
	return ch .. mw.ustring.sub(rs, 2, len(rs))
end

function M.py_detone(f)
	local text = type(f) == 'table' and f.args[1] or f
	return mw.ustring.toNFC(gsub(mw.ustring.toNFD(text), tones, ''))
end

function M.py_transf(f)
	local text = type(f) == 'table' and f.args[1] or f
	return M.py_detone(text) .. M.tone_determ(text)
end

function M.tone_determ(f)
	local text = type(f) == 'table' and f.args[1] or f
	text = mw.ustring.toNFD(text)
	local tone_num = { ['̄'] = '1', ['́'] = '2', ['̌'] = '3', ['̀'] = '4' }
	return tone_num[mw.ustring.match(text, tones)] or '5'
end

function M.ts_determ(f)
	local m_ts_data = mw.loadData("Module:zh/data/ts")
	local m_st_data = mw.loadData("Module:zh/data/st")
	local text = type(f) == 'table' and f.args[1] or f
	local i = 0
	for cp in mw.ustring.gcodepoint(text) do
		local ch = mw.ustring.char(cp)
		if m_ts_data.ts[ch] then return 'trad' end
		if m_st_data.st[ch] then if i > 1 then return 'simp' else i = i + 1 end end
	end
	return (i > 0 and 'simp' or 'both')
end

function M.ts(f)
	local m_ts_data = mw.loadData("Module:zh/data/ts")
	local text = type(f) == 'table' and f.args[1] or f
	text = replace_chars(text, m_ts_data.ts)
	return text
end

function M.st(f)
	local m_st_data = mw.loadData("Module:zh/data/st")
	local text = type(f) == 'table' and f.args[1] or f
	text = replace_chars(text, m_st_data.st)
	return text
end

function M.py(text,comp,pos,p,is_erhua)
	local m_cmn_pron = mw.loadData("Module:zh/data/cmn-pron")
	if not is_erhua then is_erhua = false end
	if type(text) == 'table' then text,comp,pos,p,is_erhua = text.args[1],text.args[2],text.args[3],text.args[4],text.args[5] end
	comp = comp or ''
	local q = {}
	local sum = 0
	length = len(text)
	if is_erhua then length = length - 1 end
	textconv = text
	text = ''
	if comp ~= '' and comp ~= '12' and comp ~= '21' and not ((pos == 'cy' or pos == 'Idiom' or pos == 'idiom') and length == 4) and not is_erhua then
		for i = 1, len(comp) do
			sum = sum + tonumber(mw.ustring.sub(comp,i,i))
			q[sum] = 'y'
		end
	end
	if not p then p={} end
	local initial = true
	for i = 1, length do
		if p[i] and p[i] ~= '' then --pronunciation supplied
			text = text .. p[i]
		else
			local char = mw.ustring.sub(textconv,i,i)
			char = m_cmn_pron.py[char] or m_cmn_pron.py[M.ts(char)] or char
			if is_erhua or initial or not mw.ustring.find(char,'^[aoeāōēáóéǎǒěàòè]') then
				text = text .. char
			else
				text = text .. "&#39;" .. char
			end
			
			if char ~= mw.ustring.sub(textconv,i,i) then
				initial = false
			else
				initial = true
			end
		end
		if q[i] == 'y' and i ~= length and not is_erhua then text = text .. ' ' end
	end
	if is_erhua == true then text = text .. 'r' end
	if pos == 'pn' or pos == 'propn' then
		characters = mw.text.split(text,' ')
		for i=1,#characters do
			characters[i] = mw.language.getContentLanguage():ucfirst(characters[i])
		end
		text = table.concat(characters,' ')
	end
	return text
end

function M.py_er(text,comp,pos,p)
	return M.py(text,comp,pos,p,true)
end

function M.pytemp(text,comp,pos,p,is_erhua)
	local m_cmn_pron = mw.loadData("Module:zh/data/cmn-pron")
	if not is_erhua then is_erhua = false end
	if type(text) == 'table' then text,comp,pos = text.args[1],text.args[2],text.args[3] or 'n' end
	comp = comp or ''
	local q = {}
	local sum = 0
	textconv = M.ts(text)
	length = len(text)
	if is_erhua == true then
		length = length - 1
		textconv = mw.ustring.sub(textconv, 1, length)
	end
	text = ''
	if comp ~= '' and comp ~= '12' and comp ~= '21' and not is_erhua then
		for i = 1, len(comp) do
			sum = sum + tonumber(mw.ustring.sub(comp,i,i))
			q[sum] = 'y'
		end
	end
	if not p then p={} end
	for i = 1, length do
		if p[i] and p[i] ~= '' then --pronunciation supplied
			text = text .. p[i]
		else
			local char = mw.ustring.sub(textconv,i,i)
			if mw.ustring.find(char,'[一不期績绩蹟跡迹嵌框微突帆藩擊击夾夹鞠拈夕汐矽昔惜息危椰濤涛叔寂馴驯築筑質质播究菌矻識识穴膜餾馏企辱署偽伪蹈諷讽斂敛坊樸朴儲储剖檔档髮轍辙賜赐堤壑酵括懾慑蝸蜗淆攜携崖癌暫暂蟄蛰驟骤液血酪嘌覲幀蕁曳室癬癣亞亚穹褐貯贮淑場场踮]') then
				text = text .. char
			else
				char = m_cmn_pron.py[char] or char
				if i ~= 1 and mw.ustring.find(char,'^[aoeāōēáóéǎǒěàòè]') then
					char = "'" .. char
				end
				text = text .. char
			end
		end
		if q[i] == 'y' and i ~= length and not is_erhua then text = text .. ' ' end
	end
	text = gsub(text," '"," ")
	if pos == 'pn' or pos == 'propn' then
		characters = mw.text.split(text,' ')
		for i=1,#characters do
			characters[i] = mw.language.getContentLanguage():ucfirst(characters[i])
		end
		text = table.concat(characters,' ')
	end
	return text
end

function M.pytemp_er(text,comp,pos,p)
	return M.pytemp(text,comp,pos,p,true)
end

function M.pywordconv(text,p)
	local m_cmn_pron = mw.loadData("Module:zh/data/cmn-pron")
	if type(text) == 'table' then text = text.args[1] end
	textconv = M.ts(text)
	length = len(text)
	text = ''
	if not p then p = {} for i = 1, 20 do p[i] = '' end end
	for i = 1, length do
		if p[i] ~= '' then
			text = text .. M.py_transf(p[i])
		else
			char = mw.ustring.sub(textconv,i,i)
			cpy = m_cmn_pron.py[char] or char
			text = text .. M.py_transf(cpy)
		end
	end
	return text
end

function M.pywordconv_er(text,p)
	local m_cmn_pron = mw.loadData("Module:zh/data/cmn-pron")
	if type(text) == 'table' then text = text.args[1] end
	length = len(text) - 1
	textconv = mw.ustring.sub(M.ts(text),1,length)
	text = ''
	if not p then p={} for i=1,20 do p[i]='' end end
	for i = 1,length do
		if p[i] ~= '' then
			if i == length then p[i] = p[i] .. 'r' end
			text = text .. M.py_transf(p[i])
		else
			char = mw.ustring.sub(textconv,i,i)
			cpy = m_cmn_pron.py[char] or char
			if i == length then cpy = cpy .. 'r' end
			text = text .. M.py_transf(cpy)
		end
	end
	return text
end

function M.decomp(text,comp)
	if type(text) == 'table' then text,comp = text.args[1],text.args[2] or '' end
	comp = comp or tostring(len(text))
	local num = tonumber(comp)
	char = mw.ustring.sub(text,num,num)
	return char
end

function M.compdecomp(title,comp)
	if type(title) == 'table' then title,comp = title.args[1],title.args[2] end
	comp = comp or ''
	local start = 1
	local finish = 1
	local sum = 0
	local text = ''
	local p={}
	textlen = len(title)
	if comp == '' then
		for i = 1,textlen do
			comp = comp .. '1'
		end
	end
	for i = 1, len(comp) do
		p[i] = tonumber(mw.ustring.sub(comp,i,i))
		sum = sum + p[i]
	end
	if sum ~= textlen then
		comp = ''
		for j = 1,textlen do
			p[j] = tonumber(1)
			comp = comp .. '1'
		end
	end
	for i = 1, len(comp) do
		if i ~= 1 then start = start + p[i-1] end
		finish = start + p[i] - 1
		text = (text .. '[[' .. mw.ustring.sub(title,start,finish) .. ']]')
	end
	return text
end

function M.compdecompetym(title,comp)
	if type(title) == 'table' then title,comp = title.args[1],title.args[2] end
	comp = comp or ''
	local start = 1
	local finish = 1
	local sum = 0
	local text = ''
	local p={}
	textlen = len(title)
	if comp == '' then
		for i = 1,textlen do
			comp = (comp .. '1')
		end
	end
	for i = 1, len(comp) do
		p[i] = tonumber(mw.ustring.sub(comp,i,i))
		sum = sum + p[i]
	end
	if sum ~= textlen then
		comp = ''
		for j = 1,textlen do
			p[j] = tonumber(1)
			comp = (comp .. '1')
		end
	end
	for i = 1, len(comp) do
		if i ~= 1 then start = start + p[i-1] end
		finish = start + p[i] - 1
		if i ~= 1 then text = (text .. '|') end
		text = (text .. mw.ustring.sub(title,start,finish))
	end
	return text
end

function M.hzbox(title,comp,e,alt)
	if type(title) == 'table' then title,comp = title.args[1],title.args[2] end
	local id = M.ts_determ(title)
	local text = '{{zh-forms'
	if e and e ~= "" then text = text .. '|' .. e end
	if id == 'simp' then
		text = text .. '|t=' .. M.st(title)
	elseif id == 'trad' then
		text = text .. '|s=' .. M.ts(title)
	end
	text = text .. ((comp and comp ~= "") and ('|type=' .. comp) or '')
	text = text .. ((alt and alt ~= "") and '|alt=' .. alt or '')
	return text .. '}}'
end

function M.hzbox_er(title)
	if type(title) == 'table' then title = title.args[1] end
	length = len(title)
	if mw.ustring.sub(title, length, length) == '兒' then id = 'trad' else id = 'simp' end
	title = mw.ustring.sub(title, 1, length-1)
	text = '{{zh-hanzi-box|'
	if id == 'simp' then
		text = (text .. '[[' .. title .. ']][[儿]]|[[' .. M.st(title) .. '兒]]}}')
	else
		text = (text .. '[[' .. M.ts(title) .. '儿]]|[[' .. title .. ']][[兒]]}}')
	end
	return text
end

function M.sort(title)
	local m_cmn_pron = mw.loadData("Module:zh/data/cmn-pron")
	if type(title) == 'table' then title = title.args[1] end
	local text = ''
	length = len(title)
	title = M.ts(title)
	for i = 1,length do
		charpy = mw.ustring.sub(title,i,i)
		charpy = m_cmn_pron.py[charpy] or charpy
		text = text .. M.py_transf(charpy)
	end
	return text
end

function M.postitle(pos)
	pos = pos or ''
	if pos == '' then pos = 'n' end
	return pos_aliases_title[pos] or pos
end

function M.poshead(pos)
	pos = pos or ''
	if pos == '' then pos = 'n' end
	return pos_aliases_head[pos] or pos
end

function M.skeys(title)
	if m_skeys == nil then m_skeys = mw.loadData('Module:zh/data/skeys') end
	
	if type(title) == 'table' then title = title.args[1] end
	text = mw.ustring.sub(title,1,1)
	text = m_skeys.skeys[text] or text
	return text
end

function M.chardecomp(title)
	if type(title) == 'table' then title = title.args[1] end
	text = mw.text.split(title,"")
	return table.concat(text,"|")
end

function M.semantics(text,name,sem)
	if sem[1] and sem[1] ~= '' then
		text = (text .. '\n\n====' .. name .. '====')
		if name == 'Derived terms' then
			text = text .. '\n{{zh-der'
			for i = 1, #sem do
				text = text .. '|' .. sem[i]
			end
			text = text .. '}}'
		else
			for i = 1, #sem do
				text = text .. '\n* {{zh-l|' .. sem[i] .. '}}'
			end
		end
	end
	return text
end

function M.create_er(f)
	return M.create(f,true)
end

local function checkpos(pos)
	for poscode,posname in pairs(pos_aliases_head) do
		if pos == posname then
			return poscode
		end
	end
	for poscode,posname in pairs(pos_aliases_title) do
		if pos == posname then
			return poscode
		end
	end
	return pos
end

function M.headword(title,comp,pos,is_erhua)
	if not is_erhua then is_erhua = false end
	is_table = (type(title) == 'table')
	p = {}
	for i=4,23 do table.insert(p,(is_table and title.args[i] or '')) end
	if type(title) == 'table' then title,comp,pos = title.args[1],title.args[2],title.args[3] end
	text = '{{zh-' .. M.poshead(pos) .. '|'
	id = M.ts_determ(title)
	if id == 'both' then text = text .. 'ts' elseif id == 'simp' then text = text .. 's' else text = text .. 't' end
	if is_erhua then
		text = text .. '|pin=' .. M.py_er(title,comp,pos,p) .. '|pint=' .. M.pywordconv_er(title,p)
		if id == 'simp' then
			text = text .. '|tra=' .. M.st(title) .. '|sim=' .. title
		else
			text = text .. '|tra=' .. title .. '|sim=' .. M.ts(title)
		end
		text = text .. '}}\n\n# {{erhua form'
		if def ~= '' then text = text .. '|' .. def end
	else
		text = text .. '|pin=' .. M.py(title,comp,pos,p) .. '|pint=' .. M.pywordconv(title,p)
		if id == 'simp' then
			text = text .. '|tra=' .. M.st(title) .. '|sim=' .. title
		elseif id == 'trad' then
			text = text .. '|tra=' .. title .. '|sim=' .. M.ts(title)
		end
	end
	return text .. '}}'
end

function M.link(frame, mention, args, pagename, no_transcript)
	args = args or frame:getParent().args
	pagename = pagename or mw.title.getCurrentTitle().text
	if args[2] and mw.ustring.match(args[2], '[一-龯㐀-䶵]') then
		gloss = args[4] or ''
		tr = args[3] or ''
		text = args[1] .. '/' .. args[2]
	else
		text = args[1] or ''
		if not args['gloss'] or args['gloss'] == '' then
			if args[3] or (args[2] and (mw.ustring.match(args[2], '[āōēīūǖáóéíúǘǎǒěǐǔǚàòèìùǜâêîôû̍ⁿ]') or mw.ustring.match(args[2], '[bcdfghjklmnpqrstwz]h?y?[aeiou][aeiou]?[iumnptk]?g?[1-9]'))) then
				tr = args[2] or ''
				gloss = args[3] or ''
			else
				tr = ''
				gloss = args[2] or ''
			end
		else
			tr = args[2] or ''
			gloss = args['gloss']
		end
	end
	if args['tr'] and args['tr'] ~= '' then
		tr = args['tr']
		gloss = gloss or args[2] or ''
	end
	if text ~= '' and not text:match('[%[%]]') then
		word = mw.text.split(text,"/",true)
		if #word == 1 and M.ts_determ(word[1]) == 'trad' and not mw.ustring.match(word[1], '%*') then
			table.insert(word, M.ts(word[1]))
		end
		if tr == '' and not no_transcript and word[1] and text ~= pagename and mw.title.new(word[1]).exists then
			content = mw.title.new(word[1]):getContent()
			content = gsub(content, ",([^ ])", ";%1")
			template = mw.ustring.match(content, "{{zh%-pron[^}]*|m=([^};|\n]+)")
			if template and template ~= "" then
				if cmn_pron == nil then
				   cmn_pron = require("Module:cmn-pron")
				end
				tr = cmn_pron.str_analysis(template, 'link')
			end
		end
		for i = 1,#word do
			word[i] = gsub(word[i], '%*', '')
			if mention then
				word[i] = '<i class="Hani mention" lang="zh">[[' .. word[i] .. '#Chinese|' .. word[i] .. ']]</i>'
--[[ (disabled to allow links to, for example, a link to 冥王星#Chinese from 冥王星#Japanese. 18 May, 2016)
			elseif word[i] == pagename then
				word[i] = '<span class="Hani" lang="zh"><b>' .. word[i] .. '</b></span>'
]]
			else
				word[i] = '<span class="Hani" lang="zh">[[' .. word[i] .. '#Chinese|' .. word[i] .. ']]</span>'
			end
		end
		text = table.concat(word,"／")
	elseif text:match('[%[%]]') or text == pagename then
		if mention then
			text = '<i class="Hani mention" lang="zh">' .. mw.ustring.gsub(text, "%*", "") .. '</i>'
		else
			text = '<span class="Hani" lang="zh">' .. mw.ustring.gsub(text, "%*", "") .. '</span>'
		end
	end
	if tr == '-' or no_transcript then
		tr = '' -- allow translit to be disabled: remove translit if it is "-", just like normal {{l}}
	end
	notes = mention and args['note'] or ''
	if tr ~= '' or gloss ~= '' or notes ~= '' then
		text = text .. ' ('
		if tr ~= '' then
			text = text .. '<span class="tr"><i>' .. tr .. '</i></span>'
			if gloss ~= '' or notes ~= '' then
				text = text .. ', '
			end
		end
		if gloss ~= '' then
			text = text .. '“' .. gloss .. '”'
			if notes ~= '' then
				text = text .. ', '
			end
		end
		if notes ~= '' then
			text = text .. notes
		end
		text = text .. ')'
	end
	return text
end

function M.mention(frame)
	return M.link(frame,true)
end

function M.check_pron(text, variety, length, entry_creation)
	if type(text) == 'table' then text, variety = text.args[1], text.args[2] end
	if not text then
		return
	end
	startpoint, address = { ['yue'] = 51, ['hak'] = 19968, ['nan'] = 19968 }, { ['yue'] = 'Jyutping_word/%03d', ['hak'] = 'hak-pron/%02d', ['nan'] = 'nan-pron/%03d' }
	unit = 1000
	first_char = mw.ustring.sub(text, 1, 1)
	codepoints = { ['simp'] = mw.ustring.codepoint(first_char), ['trad'] = mw.ustring.codepoint(M.st(first_char)) }
	texts = { ['simp'] = text, ['trad'] = M.st(text) }
	local result = false
	for identity, codepoint in pairs(codepoints) do
		if length == 1 and variety == "yue" then
			success, data = pcall(mw.loadData, 'Module:zh/data/Jyutping character')
		else
			page_index = math.floor((codepoint - startpoint[variety]) / unit)
			success, data = pcall(mw.loadData,
				('Module:zh/data/' .. address[variety]):format(page_index)
			)
		end
		if success then
			result = data[texts[identity]] or false
		else
			result = false
		end
		if result then
			if variety == "nan" and entry_creation then
				result = gsub(result, "%-á%-", "-仔-")
				result = gsub(result, "%-á/", "-仔/")
				result = gsub(result, "%-á$", "-仔")
				result = gsub(result, "^(.+)%-%1%-%1$", "(%1)")
				result = gsub(result, "^(.+)%-%1%-%1([%-%/])", "(%1)%2")
				result = gsub(result, "([%-%/])(.+)%-%1%-%1$", "%1(%2)")
				result = gsub(result, "([%-%/])(.+)%-%1%-%1([%-%/])", "%1(%2)%3")
			end
			return result
		end
	end
	return result
end

function M.nan_for_bot()
	text = mw.title.getCurrentTitle().text
	result = M.check_pron(text, 'nan')
	if result then
		return '\n|mn=' .. result
	else
		return
	end
end

function M.der(frame)
	local m_columns = require("Module:columns")
	local args = frame:getParent().args
	local pagename = mw.title.getCurrentTitle().subpageText
	local result = {}
	
	fold = args["fold"] and true or false
	title = args["title"] and " (<i>" .. args["title"] .. "</i>)" or ""
	no_transcript = args["hide_pron"] and true or false
	
	for i, word in ipairs(args) do
		table.insert(result, M.link(frame, nil, mw.text.split(word, ":"), pagename, no_transcript))
	end
	
	return 
		m_columns.create_table(
			(len(pagename) > 1 and 2 or 3), 
			result, 
			1, 
			"#F5F5FF",
			((#result > 72 or fold) and 1 or 0), 
			"Derived terms",
			"Derived terms from <span lang=\"zh\" class=\"Hani\">" .. pagename .. "</span>" .. title, 
			math.floor(80 / (len(pagename) > 1 and 2 or 3)), 
			"* ", 
			nil
		)
end

local lang_abbrev = {
	['m'] = 'Mandarin',
	['c'] = 'Cantonese', ['g'] = 'Gan', ['h'] = 'Hakka', ['j'] = 'Jin',
	['md'] = 'Min Dong', ['mn'] = 'Min Nan', ['mn-t'] = 'Teochew',
	['w'] = 'Wu', ['x'] = 'Xiang',
}

function M.cls(frame)
	local args = frame:getParent().args
	local result, categories = {}, {}
	local m_zh_cat = require("Module:zh-cat")
	for i, combination in ipairs(args) do
		local part = mw.text.split(combination, ":")
		if #part == 2 then
			local dialect = { "" }
			local function annotate(main_text, annotation)
				return "<span style=\"border-bottom: 1px dotted #000; cursor:help\" " ..
					"title=\"" .. annotation .. "\"><i>" .. main_text .. "</i></span>"
			end
			for variety in mw.text.gsplit(part[1], ",") do
				table.insert(dialect, annotate(variety, lang_abbrev[variety]))
			end
			note = table.concat(dialect, " ")
		else
			note = false
		end
		table.insert(result, M.link(frame, nil, { part[2] or part[1], tr = "-" }, pagename) ..
			(note or ""))
		table.insert(categories, m_zh_cat.categorize("Classifier:" .. (part[2] or part[1])))
	end
	return "&nbsp;&nbsp;<small><span style=\"background:#EDFFFF\">(Classifier: " ..
		table.concat(result, "; ") .. ")</span></small>" .. 
		(mw.title.getCurrentTitle().nsText == "" and table.concat(categories) or "")
end

function M.newDer(frame)
	local title = mw.title.getCurrentTitle().subpageText
	local prefix = "Module:zh/data/wordlist/"
	local args = frame:getParent().args
	
	local limit = args["limit"] and tonumber(args["limit"]) or false
	local char_pronunciation = args["p"] or false
	local fold = args["fold"] or false
	local hide_pron = args["hide_pron"] or false
	
	local result = {}
	for _, arg in ipairs(args) do
		table.insert(result, arg)
	end
	
	i = 1
	while i < 4 do
		local wordlist = require(prefix .. tostring(i))
		for word, pronunciation in pairs(wordlist) do
			if mw.ustring.match(word, title) and word ~= title and not (len(title) == 1 and len(word) > (limit or 4)) then
				if char_pronunciation then
					if mw.text.split(pronunciation, " ")[mw.ustring.find(word, title)] == char_pronunciation then
						table.insert(result, word)
					end
				else
					table.insert(result, word)
				end
			end
		end
		i = i + 1
	end
	local hash, res = {}, {}
	for _, element in ipairs(result) do
		local section = mw.text.split(element, ":")[1]
		if not hash[section] then
			res[#res + 1] = element
			hash[section] = true
		end
	end
	return "{{zh-der|" .. (hide_pron and "hide_pron=1|" or "") .. (fold and "fold=1|" or "") .. table.concat(res, "|") .. "}}"
end

function M.create(f,is_erhua)
	if not is_erhua then is_erhua = false end
	local title = mw.title.getCurrentTitle().text
	local params = {
		["type"] = {}, ["comp"] = {alias_of = "type"},
		[1] = {list = true, allow_holes = true},
		["pos"] = {list = true, allow_holes = true},
		["def"] = {list = true, allow_holes = true},
		["e1"] = {list = "e", allow_holes=true}, ["etym1"] = {list = "etym", allow_holes=true}, ["etymology1"] = {list = "etymology", allow_holes=true}, ["meaning"] = {list = true, allow_holes=true}, ["gloss"] = {list = true, allow_holes=true},
		["k"] = {}, ["ko"] = {alias_of = "k"}, ["korean"] = {alias_of = "k"},
		["kt"] = {}, ["tr"] = {alias_of = "kt"}, ["transcription"] = {alias_of = "kt"}, ["ktr"] = {alias_of = "kt"}, ["kotr"] = {alias_of = "kt"}, ["koreantr"] = {alias_of = "kt"}, ["ktrans"] = {alias_of = "kt"}, ["kotrans"] = {alias_of = "kt"},
		["ke"] = {}, ["kodef"] = {alias_of = "ke"}, ["kodefinition"] = {alias_of = "ke"}, ["koreandef"] = {alias_of = "ke"},
		["v"] = {}, ["vi"] = {alias_of = "v"}, ["vietnam"] = {alias_of = "v"},
		["ve"] = {}, ["videf"] = {alias_of = "ve"}, ["videfinition"] = {alias_of = "ve"}, ["vietnamdef"] = {alias_of = "ve"}, ["vietnamdefinition"] = {alias_of = "ve"},
		["p"] = {list = true, allow_holes=true}, ["pron"] = {list = true, allow_holes=true}, ["pronunciation"] = {list = true, allow_holes=true},
		["e"] = {}, ["etym"] = {alias_of = "e"}, ["etymology"] = {alias_of = "e"}, ["origin"] = {alias_of = "e"}, ["ori"] = {alias_of = "e"}, ["o"] = {alias_of = "e"},
		["syn"] = {list = true}, ["synonym"] = {list = true},
		["ant"] = {list = true}, ["antonym"] = {list = true},
		["der"] = {list = true}, ["deriv"] = {list = true}, ["derived"] = {list = true}, ["derivedterm"] = {list = true},
		["also"] = {list = true}, ["see"] = {list = true}, ["seealso"] = {list = true}, ["alsosee"] = {list = true},
		["wp"] = {}, ["wiki"] = {alias_of = "wp"}, ["wikipedia"] = {alias_of = "wp"},
		["cat"] = {list = true}, ["category"] = {list = true}, ["categories"] = {list = true}, ["categorize"] = {list = true}, ["categorise"] = {list = true}, ["categorization"] = {list = true}, ["categorisation"] = {list = true},
		["pic"] = {}, ["file"] = {alias_of = "pic"}, ["image"] = {alias_of = "pic"}, ["picture"] = {alias_of = "pic"},
		["piccap"] = {}, ["caption"] = {alias_of = "piccap"}, ["description"] = {alias_of = "piccap"}, ["desc"] = {alias_of = "piccap"},
		["er"] = {}, ["erhua"] = {alias_of = "er"},
		["tl"] = {}, ["toneless"] = {alias_of = "tl"}, ["tonelessvariant"] = {alias_of = "tl"}, ["variant"] = {alias_of = "tl"}, ["variation"] = {alias_of = "tl"}, ["tonelessvariation"] = {alias_of = "tl"},
		["a"] = {}, ["audio"] = {alias_of = "a"}, ["listen"] = {alias_of = "a"}, ["sound"] = {alias_of = "a"}, ["pronounced"] = {alias_of = "a"},
		["alt"] = {}, ["alter"] = {alias_of = "alt"}, ["altern"] = {alias_of = "alt"}, ["alternate"] = {alias_of = "alt"}, ["alternative"] = {alias_of = "alt"},
		["c"] = {}, ["cant"] = {alias_of = "c"}, ["cantonese"] = {alias_of = "c"},
		["mn"] = {}, ["nan"] = {alias_of = "mn"}, ["minnan"] = {alias_of = "mn"},
		["w"] = {}, ["wu"] = {alias_of = "w"}, ["shanghai"] = {alias_of = "w"},
		["m"] = {},
		["c-t"] = {},
		["g"] = {},
		["h"] = {},
		["j"] = {},
		["md"] = {},
		["mn-t"] = {},
		["x"] = {},
		["mc"] = {},
		["oc"] = {},
		["ts"] = {},
	}
	local args = require("Module:parameters").process(f:getParent().args, params)
	local comp = args["type"] or ""
	local pos = {}
	local def = {}
	for i=1,math.max(args[1].maxindex/2, args["pos"].maxindex, args["def"].maxindex) do
		table.insert(pos, args[1][2*i-1] or args["pos"][i] or "")
		table.insert(def, args[1][2*i] or args["def"][i] or "")
	end
	
	local function length(array)
		return array.maxindex or #array
	end
	
	local function expand(arg)
		local result = {}
		local maximum = 0
		for i=1,#arg do if length(arg[i]) > maximum then maximum = length(arg[i]) end end
		local current = nil
		for i=1,maximum do
			current = nil
			for j=1,#arg do
				if current then
					break
				else
					current = arg[j][i]
				end
			end
			current = current or ""
			table.insert(result, current)
		end
		return result
	end
	
	local function fetch_all(arg)
		local result = {}
		for i=1,#arg do
			for j=1,#arg[i] do
				table.insert(result,arg[i][j])
			end
		end
		return result
	end
	
	local etyms = expand({args["e1"], args["etym1"], args["etymology1"], args["gloss"], args["meaning"]})
	local ko = args["k"] or ""
	local kotrans = args["kt"] or ""
	local kodef = args["ke"] or def[1] or ""
	local vi = args["v"] or ""
	local videf = args["ve"] or def[1] or ""
	local p = expand({args["p"], args["pron"], args["pronunciation"]})
	local etym = args["e"] or ""
	local syn = expand({args["syn"], args["synonym"]})
	local ant = expand({args["ant"], args["antonym"]})
	local der = expand({args["der"], args["deriv"], args["derived"], args["derivedterm"]})
	local also = expand({args["also"], args["see"], args["alsosee"], args["seealso"]})
	local wp = args["wp"] or ""
	local cat = fetch_all({args["cat"], args["category"], args["categories"], args["categorize"], args["categorise"], args["categorization"], args["categorisation"]})
	local pic = args["pic"] or ""
	local piccap = args["piccap"] or ""
	local er = args["er"] or ""
	local tl = args["tl"] or ""
	local audio = args["a"] or ""
	local alt = args["alt"] or ""
	local c = args["c"] or ""
	local c_t = args["c-t"] or ""
	local mn = args["mn"] or ""
	local mn_t = args["mn-t"] or ""
	local w = args["w"] or ""
	local m = args["m"] or ""
	local h = args["h"] or ""
	local g = args["g"] or ""
	local j = args["j"] or ""
	local x = args["x"] or ""
	local md = args["md"] or ""
	local mc = args["mc"] or ""
	local oc = args["oc"] or ""
	local ts = args["ts"] or ""
	text = ''
	if not pos[1] or pos[1] == '' then pos[1] = 'n' end
	for i=1,#pos do pos[i] = checkpos(pos[i]) end
	text = (text .. '==Chinese==\n')
	if M.ts_determ(title) == 'simp' and ts ~= "trad" then
		return text .. '{{zh-see|' .. M.st(title) .. ('}}\n\n[[zh:%s]]'):format(mw.title.getCurrentTitle().text)
	end
	length = len(title)
	noerhua = mw.ustring.sub(title,1,length-1)
	erhua = mw.ustring.sub(title,length,length)
	text = text .. (is_erhua and M.hzbox_er(title) or M.hzbox(title,comp,table.concat(etyms,'|'),alt))
	if wp ~= '' then text = (text .. '\n{{zh-wp}}') end
	if pic ~= '' then text = (text .. '\n[[File:' .. pic .. '|thumb|250px') if piccap ~= '' then text = (text .. '|' .. piccap) end text = (text .. ']]')	end
	if is_erhua then
		text = (text .. '===Pronunciation===\n{{zh-pron\n\|m=' .. M.pytemp_er(title,comp,pos[1],p) .. 'r\n|cat=' .. table.concat(pos[1],',') .. '\n}}\n\n')
	else
		text = (text .. '\n\n')
		if etym ~= '' then text = (text .. '===Etymology===\n' .. etym .. '\n\n') end
		if #etyms > 0 then
			text = (text .. '===Etymology===\n')
			text = (text .. '{{zh-compound|' .. M.compdecompetym(title,comp) .. '|' .. table.concat(etyms,'|') .. '}}\n\n')
		end
		text = (text .. '===Pronunciation===\n{{zh-pron')
		if m ~= '-' then
			if m ~= '' then
				m_pron = m
				text = (text .. '\n|m=' .. m_pron)
			else
				m_pron = gsub(M.pytemp(title,comp,pos[1],p), '，', ', ')
				text = (text .. '\n|m=' .. m_pron)
				if er ~= '' then text = (text .. ',er=' .. er) end
				if tl ~= '' then text = (text .. ',tl=y') end
			end
		end
		if c == '' then c = M.check_pron(title, 'yue', length) or '' end
		if length == 1 or (c ~= '' and c ~= '-') then text = (text .. '\n|c=' .. (c or "")) end
		if length == 1 or c_t ~= '' then text = (text .. '\n|c-t=' .. (c_t or "")) end
		if length == 1 or g ~= '' then text = (text .. '\n|g=' .. (g or "")) end
		if h == '' then h = M.check_pron(title, 'hak') or '' end
		if length == 1 or (h ~= '' and h ~= '-') then text = (text .. '\n|h=' .. (h and ("pfs=" .. h) or "")) end
		if length == 1 or j ~= '' then text = (text .. '\n|j=' .. (j or "")) end
		if length == 1 or md ~= '' then text = (text .. '\n|md=' .. (md or "")) end
		if mn == '' then mn = M.check_pron(title, 'nan', nil, true) or '' end
		if length == 1 or (mn ~= '' and mn ~= '-') then text = (text .. '\n|mn=' .. (mn or "")) end
		if length == 1 or mn_t ~= '' then text = (text .. '\n|mn-t=' .. (mn_t or "")) end
		if length == 1 or w ~= '' then text = (text .. '\n|w=' .. (w or "")) end
		if length == 1 or x ~= '' then text = (text .. '\n|x=' .. (x or "")) end
		if audio ~= '' then text = (text .. '\n|ma=') if audio ~= 'y' then text = (text .. audio) else text = (text .. 'y') end end
		if length == 1 or mc ~= '' then text = (text .. '\n|mc=' .. (mc ~= "" and mc or 'y')) end
		if length == 1 or oc ~= '' then text = (text .. '\n|oc=' .. (oc ~= "" and oc or 'y')) end
		text = (text .. '\n|cat=' .. table.concat(pos,',') .. '\n}}\n\n')
	end
	text = (text .. '===' .. (length == 1 and "Definitions" or M.postitle(pos[1])) .. '===\n')
	text = (text .. '{{zh-' .. (length == 1 and "hanzi" or M.poshead(pos[1])) .. '}}\n\n')
	if is_erhua then
		text = text .. '# {{context|Mandarin|lang=zh}} {{erhua form'
		if def[1] and def[1] ~= '' then text = text .. '|' .. def[1] end
		text = text .. '}}'
	else
		text = (text .. '# ' .. ((def[1] and def[1] ~= "") and def[1] or "{{rfdef|lang=zh}}"))
	end
	if syn[1] then
		if mw.ustring.match(syn[1], "^dial") then
			text = text .. "\n\n====Synonyms====\n{{zh-" .. syn[1] .. "}}"
		else
			text = M.semantics(text,'Synonyms',syn)
		end
	end
	text = M.semantics(text,'Antonyms',ant)
	text = M.semantics(text,'Derived terms',der)
	for i=2,#pos do
		text = text .. '\n\n===' .. M.postitle(pos[i]) .. '===\n'
		text = text .. '{{zh-' .. M.poshead(pos[i]) .. '}}\n\n'
		if is_erhua then
			text = text .. '# {{context|Mandarin|lang=zh}} {{erhua form'
			if def[i] ~= '' then text = text .. '|' .. def[i] end
			text = text .. '}}'
		else
			text = text .. '# ' .. def[i]
		end
	end
	if #also > 0 then
		text = (text .. '\n\n===See also===')
		for i=1,#also do
			text = (text .. '\n* {{zh-l|' .. also[i] .. '}}')
		end
	end
	if #cat > 0 then text = (text .. '\n\n{{zh-cat|' .. table.concat(cat,'|') .. '}}') end
	if ko ~= '' then
		text = text .. '\n\n----\n\n==Korean==\n{{ko-hanjatab}}\n\n===Noun===\n{{ko-noun|hj|hangeul=' .. ko .. '}}\n\n# {{hanja form of|' .. ko .. '|' .. kodef .. '}}'
	end
	if vi ~= '' then
		text = text .. '\n\n----\n\n==Vietnamese==\n{{vi-hantutab}}\n\n===' .. M.postitle(pos[1]) .. '===\n{{vi-hantu}}\n\n# {{han tu form of|' .. vi .. '|' .. videf .. '}}'
	end
	return text
end

function M.wikipedia(frame)
	local args = frame:getParent().args
	local title = mw.title.getCurrentTitle().text
	local wp_data = {
		["zh"] = { "Written Standard Chinese<sup>[[w:Written vernacular Chinese|?]]</sup>", "Hani", "zh" },
		["cdo"] = { "Min Dong", "Latn", "cdo" },
		["cl"] = { "Classical", "Hani", "zh" },
		["gan"] = { "Gan", "Hani", "zh" },
		["hak"] = { "Hakka", "Latn", "hak" },
		["nan"] = { "Min Nan", "Latn", "nan" },
		["wuu"] = { "Wu", "Hani", "zh" },
		["yue"] = { "Cantonese", "Hani", "zh" },
		["en"] = { "English", "Latn", "en" },
	}
	
	args = args[1] and args or { "zh" }
	result = { '<div class="sister-wikipedia sister-project noprint floatright" style="border: 1px solid #aaa; font-size: 90%; background: #f9f9f9; width: 250px; padding: 4px; text-align: left;"><div style="float: left;">[[File:Wikipedia-logo.png|32px|none|link=|alt=]]</div><div style="margin-left: 40px;">[[Wikipedia]] has ' ..
		(args[2] and "articles" or "an article") .. ' on:' }

	for _, arg in ipairs(args) do
		local part = mw.text.split(arg, ":")
		local lang_data = wp_data[part[1]] or { nil, "Hani", "zh" }
		local annotation = lang_data[1] or false
		if part[1] == "zh" and not args[2] then
			annotation = false
		elseif annotation then
			annotation = " <span style=\"font-size\:80%\">(" .. annotation .. ")</span>"
		end
		table.insert(result, '<div style="margin-left: 10px;">• <b class="' .. (gsub(lang_data[2], "Latn", (len(part[2] or title) < 15 and "Latn\" style=\"font-size:120%" or "Latn"))) .. '" lang="' .. lang_data[3] .. '">[[w&#x3a;' .. part[1] .. '&#x3a;' .. (part[2] or title) .. '|' .. (part[2] or title) .. ']]</b>' .. (annotation or "") .. '</div>')
	end
	
	table.insert(result, '</div></div>')
	
	return table.concat(result)
end

return M