-- Module:shi-headword


-- Language object for the code "shi", fetched once when the module loads; it
-- is stored in the headword data and used to build category names.
local lang = require("Module:languages").getByCode("shi")

-- Table returned at the end of the file; public entry points hang off it.
local export = {}
-- Part-of-speech handlers, keyed by the category name passed as the first
-- invocation argument. Each entry provides a `func(args, data)` field.
local pos_functions = {}

-----------------------
-- Utility functions --
-----------------------

-- "If Not Empty": turns the empty string into nil so that callers can use
-- plain truthiness tests. Every other value, nil included, passes through.
local function ine(arg)
	if arg ~= "" then
		return arg
	end
	return nil
end

-- Converts the sequence `list` into a lookup table whose keys are the list's
-- elements, each mapped to `true`.
local function list_to_set(list)
	local lookup = {}
	for _, member in ipairs(list) do
		lookup[member] = true
	end
	return lookup
end

-- Version of mw.ustring.gsub() that discards all but the first return value
-- (gsub additionally returns a match count, which would otherwise leak into
-- argument lists or table constructors).
--
-- Declared `local` so that loading this module does not define a global
-- named `rsub`.
--
-- term: string to operate on
-- foo:  pattern handed to mw.ustring.gsub
-- bar:  replacement handed to mw.ustring.gsub
-- Returns the substituted string only.
local function rsub(term, foo, bar)
	-- The extra parentheses truncate the call to exactly one result.
	return (mw.ustring.gsub(term, foo, bar))
end

-- Short alias for mw.ustring.find. Nothing in the visible source calls it.
local rfind = mw.ustring.find

-- Adds the category "<canonical language name> <pos>" to data.categories.
local function append_cat(data, pos)
	local category = lang:getCanonicalName() .. " " .. pos
	table.insert(data.categories, category)
end

-- Strips wiki-link markup from `text`, keeping what would be displayed:
-- "[[target|shown]]" becomes "shown" and "[[target]]" becomes "target".
--
-- Declared `local` so that loading this module does not define a global
-- named `remove_links`.
-- NOTE(review): nothing in the visible source calls this helper.
local function remove_links(text)
	-- Remove the "[[target|" prefix of piped links first; afterwards only bare
	-- "[[" and "]]" delimiters remain to be stripped.
	text = rsub(text, "%[%[[^|%]]*|", "")
	text = rsub(text, "%[%[", "")
	text = rsub(text, "%]%]", "")
	return text
end

-- Wraps `t` in a proxy that remembers which keys have been looked up.
-- Returns two values:
--   1. the proxy table; reads and writes on it are forwarded to `t`;
--   2. the result of Module:table's listToSet(keysToList(t)) (presumably a
--      set of t's keys), from which a key is removed whenever it is read
--      through the proxy.
local function make_unused_key_tracker(t)
	local m_table = require("Module:table")
	local pending = m_table.listToSet(m_table.keysToList(t))

	local tracker = {}

	function tracker.__index(_, key)
		-- A nil key cannot be assigned to, so skip the bookkeeping for it.
		if key ~= nil then
			pending[key] = nil
		end
		return t[key]
	end

	function tracker.__newindex(_, key, value)
		t[key] = value
	end

	return setmetatable({}, tracker), pending
end

-- The main entry point.
-- Takes the part-of-speech category from invocation argument 1 and the
-- template's own arguments from the parent frame. It builds the headword data
-- table, lets the matching pos_functions entry (if any) add genders and
-- inflections, raises an error listing every template argument that nothing
-- read, and otherwise returns the result of Module:headword's full_headword().
function export.show(frame)
	local PAGENAME = mw.title.getCurrentTitle().text

	local poscat = frame.args[1] or error("Part of speech has not been specified. Please pass parameter 1 to the module invocation.")

	-- All reads go through a proxy so that arguments nobody looked at can be
	-- reported at the end.
	local args, unused_keys = make_unused_key_tracker(frame:getParent().args)

	-- Gather parameters
	local data = {
		lang = lang,
		pos_category = poscat,
		categories = {},
		heads = {},
		translits = {},
		genders = {},
		inflections = {enable_auto_translit = true}
	}

	-- The first head comes from |head= (falling back to the page title); more
	-- are read from |head2=, |head3=, ... up to the first missing or empty one.
	local head = args["head"] or PAGENAME or ""
	local translit = ine(args["tr"])
	local i = 1

	while head do
		table.insert(data.heads, head)
		-- Indexed by head position so each transliteration stays paired with
		-- its head even when some heads have none.
		data.translits[#data.heads] = translit
		i = i + 1
		head = ine(args["head" .. i])
		translit = ine(args["tr" .. i])
	end

	if pos_functions[poscat] then pos_functions[poscat].func(args, data) end

	local unused_key_list = require("Module:table").keysToList(unused_keys)
	if #unused_key_list > 0 then
		local unused_key_string = require("Module:array")(unused_key_list):map(
			function(key)
				return "|" .. key .. "=" .. args[key]
			end):concat("\n")
		error("Unused arguments: " .. unused_key_string)
	end

	return require("Module:headword").full_headword(data)
end

-- Collects a numbered series of forms from the template arguments.
--
-- args:      argument table (read with string and, optionally, numeric keys)
-- argpref:   parameter prefix, e.g. "pl" reads |pl=, |pl2=, |pl3=, ...
-- defgender: gender used for a form that specifies none (may be nil)
-- position:  optional positional index that takes precedence over |<argpref>=
--            for the first form
--
-- For form N the companions |<argpref>Ntr=, |<argpref>Ng= and |<argpref>Ng2=
-- are read (without the number for the first form). Collection stops at the
-- first missing or empty form.
--
-- Returns a sequence of {term = ..., translit = ..., gender = ...} tables,
-- where `gender` is a hole-free list of gender codes or nil.
local function getargs(args, argpref, defgender, position)
	local forms = {}

	-- Only consult the positional slot when one was requested.
	local form = (position ~= nil and ine(args[position])) or ine(args[argpref])
	local translit = ine(args[argpref .. "tr"])
	local gender = ine(args[argpref .. "g"])
	local gender2 = ine(args[argpref .. "g2"])

	local i = 1

	while form do
		-- Append only the genders that were actually given. Writing
		-- {gender, gender2} directly would leave a nil at index 1 when only the
		-- second gender is present, making `#` and ipairs unreliable.
		local genderlist
		if gender or gender2 then
			genderlist = {}
			if gender then table.insert(genderlist, gender) end
			if gender2 then table.insert(genderlist, gender2) end
		elseif defgender then
			genderlist = {defgender}
		end

		table.insert(forms,
					 {term = form, translit = translit, gender = genderlist})

		i = i + 1
		form = ine(args[argpref .. i])
		translit = ine(args[argpref .. i .. "tr"])
		gender = ine(args[argpref .. i .. "g"])
		gender2 = ine(args[argpref .. i .. "g2"])
	end

	return forms
end

-- Collects the forms for `argpref` with getargs() and, when at least one was
-- given, appends them to data.inflections as a group labelled `label`.
local function handle_infl(args, data, argpref, label, defgender, position)
	local group = getargs(args, argpref, defgender, position)
	if #group == 0 then
		return
	end
	group.label = label
	table.insert(data.inflections, group)
end

-- Handles an inflection together with its construct-state counterpart.
-- The base form (|<argpref>=, labelled `label`) is processed unless `nobase`
-- is truthy or `argpref` is empty. The construct state is always read from
-- |<argpref>cons= and labelled "<label> construct state", or just
-- "construct state" when `label` is empty.
local function handle_all_infl(args, data, argpref, label, nobase, position)
	local want_base = not nobase and argpref ~= ""
	if want_base then
		handle_infl(args, data, argpref, label, nil, position)
	end

	local cons_label
	if label == "" then
		cons_label = "construct state"
	else
		cons_label = label .. " " .. "construct state"
	end
	handle_infl(args, data, argpref .. "cons", cons_label)
end

-- Processes the plural of a noun. |pl=- marks the noun as usually
-- uncountable (an inflection label plus a category); any other value is
-- treated as a regular list of plural forms.
local function handle_noun_plural(args, data)
	if args["pl"] ~= "-" then
		handle_infl(args, data, "pl", "plural")
		return
	end

	local uncountable_note = {
		label = "usually [[Appendix:Glossary#uncountable|uncountable]]"
	}
	table.insert(data.inflections, uncountable_note)
	append_cat(data, "uncountable nouns")
end

-- Set of gender codes accepted by handle_gender(); any other code makes it
-- raise an "Unrecognized gender" error.
local valid_genders = list_to_set({"m", "f", "m-p", "f-p", "p"})

-- True exactly when `g` is the gender code "m".
local function is_masc_sg(g)
	return g == "m"
end
-- True exactly when `g` is the gender code "f".
local function is_fem_sg(g)
	return g == "f"
end

-- Reads the gender from positional argument 1 (falling back to `default`)
-- and an optional second gender from |g2=, validates both against
-- valid_genders and appends them to data.genders. A missing first gender is
-- recorded as "?". Unless `nonlemma` is truthy, terms with two genders are
-- also put into the "terms with multiple genders" category.
-- Raises an error for a gender code that is not in valid_genders.
local function handle_gender(args, data, default, nonlemma)
	local first = ine(args[1]) or default
	local second = ine(args["g2"])

	local function record(code)
		if code and not valid_genders[code] then
			error("Unrecognized gender: " .. code)
		end
		-- An absent gender is shown as unknown.
		table.insert(data.genders, code or "?")
	end

	record(first)
	if second then
		record(second)
	end

	if not nonlemma and first and second then
		append_cat(data, "terms with multiple genders")
	end
end

-- Part-of-speech functions

-- Adjectives: feminine, masculine plural and feminine plural forms, each
-- with its construct-state counterpart, in that order.
pos_functions["adjectives"] = {
	func = function(args, data)
		local specs = {
			{"f", "feminine"},
			{"pl", "masculine plural"},
			{"fpl", "feminine plural"},
		}
		for _, spec in ipairs(specs) do
			handle_all_infl(args, data, spec[1], spec[2])
		end
	end
}

-- Adds the inflections shared by noun-like parts of speech: the construct
-- state of the lemma, the plural and its construct state (skipped when
-- `singonly` is truthy), and feminine and masculine equivalents.
--
-- Declared `local` so that loading this module does not define a global
-- named `handle_noun_infls`.
local function handle_noun_infls(args, data, singonly)
	-- With an empty prefix no base form is read; only |cons= is handled.
	handle_all_infl(args, data, "", "")

	if not singonly then
		handle_noun_plural(args, data)
		-- The plain plural was handled just above, so request only the plural
		-- construct state here.
		handle_all_infl(args, data, "pl", "plural", "nobase")
	end

	handle_all_infl(args, data, "f", "feminine")
	handle_all_infl(args, data, "m", "masculine")
end

-- Nouns: gender, optional collective/singulative handling (triggered by the
-- presence of |sing=), then the common noun inflections.
pos_functions["nouns"] = {
	func = function(args, data)
		handle_gender(args, data)

		local has_singulative = args["sing"] ~= nil
		if has_singulative then
			append_cat(data, "collective nouns")
			table.insert(data.inflections, {label = "collective"})
			handle_all_infl(args, data, "sing", "singulative")
		end

		handle_noun_infls(args, data)
	end
}

-- Verbs: the imperfective is read from positional argument 1 or |imperf=,
-- the perfective from positional argument 2 or |perf=.
pos_functions["verbs"] = {
	func = function(args, data)
		data.pos_category = "verbs"

		local aspects = {
			{"imperf", "imperfective"},
			{"perf", "perfective"},
		}
		for position, aspect in ipairs(aspects) do
			handle_infl(args, data, aspect[1], aspect[2], nil, position)
		end
	end
}

-- Numerals: categorised as cardinal numbers, then treated like nouns
-- (gender plus the common noun inflections).
pos_functions["numerals"] = {
	func = function(args, data)
		local extra_category = "cardinal numbers"
		append_cat(data, extra_category)

		handle_gender(args, data)
		handle_noun_infls(args, data)
	end
}

-- Proper nouns: gender plus the noun inflections, without any plural.
pos_functions["proper nouns"] = {
	func = function(args, data)
		handle_gender(args, data)

		-- Any truthy value suppresses plural handling; the string documents why.
		local singonly = "singular only"
		handle_noun_infls(args, data, singonly)
	end
}

-- Pronouns: gender plus the subject affix read from |sa=.
-- NOTE(review): the `params` field is not consulted anywhere in the visible
-- source; confirm whether it is still needed.
pos_functions["pronouns"] = {
	params = {g = {}},
	func = function(args, data)
		handle_gender(args, data)

		local prefix, label = "sa", "subject affix"
		handle_infl(args, data, prefix, label)
	end
}

return export