Documentation for this module may be created at မော်ဂျူး:fr-headword/doc

local export = {}
local pos_functions = {}
local rfind = mw.ustring.find
local rmatch = mw.ustring.match
local rsubn = mw.ustring.gsub
local rsplit = mw.text.split

local lang = require("Module:languages").getByCode("fr")
		
local suffix_categories = {
	["နာမဝိသေသနများ"] = true,
	["ကြိယာဝိသေသနများ"] = true,
	["နာမ်များ"] = true,
	["ကြိယာများ"] = true,
	["prepositional phrases"] = true,
}

-- version of rsubn() that discards all but the first return value
local function rsub(term, foo, bar)
	local retval = rsubn(term, foo, bar)
	return retval
end

local function track(page)
	require("Module:debug").track("fr-headword/" .. page)
	return true
end

-- mw.title.new() returns nil if there are weird chars in
-- the pagename.
local function exists(pagename)
	local title = mw.title.new(pagename)
	return title and title.exists
end

local function add_suffix(list, suffix)
	local newlist = {}
	for _, item in ipairs(list) do
		local form
		if suffix == "s" then
			if rfind(item, "[sx]$") then
				form = item
			elseif rfind(item, "al$") then
				form = rsub(item, "al$", "aux")
			else
				form = item .. suffix
			end
		elseif suffix == "e" then
			if rfind(item, "e$") then
				form = item
			elseif rfind(item, "en$") then
				form = item .. "ne"
			elseif rfind(item, "er$") then
				form = rsub(item, "er$", "ère")
			elseif rfind(item, "el$") then
				form = item .. "le"
			elseif rfind(item, "et$") then
				form = item .. "te"
			elseif rfind(item, "on$") then
				form = item .. "ne"
			elseif rfind(item, "ieur$") then
				form = item .. "e"
			elseif rfind(item, "teur$") then
				form = rsub(item, "teur$", "trice")
			elseif rfind(item, "eu[rx]$") then
				form = rsub(item, "eu[rx]$", "euse")
			elseif rfind(item, "if$") then
				form = rsub(item, "if$", "ive")
			elseif rfind(item, "c$") then
				form = rsub(item, "c$", "que")
			else
				form = item .. suffix
			end
		else
			form = item .. suffix
		end
		table.insert(newlist, form)
	end
	return newlist
end

local no_split_words = {
	["c'est"] = true,
	["quelqu'un"] = true,
	["aujourd'hui"] = true,
}

-- Auto-add links to a “space word” (after splitting on spaces). We split off
-- final punctuation, and then split on hyphens if split_dash is given, and
-- also split on apostrophes, including the apostrophe in the link to its left
-- (so we auto-split “l’eau” as “[[l']][[eau]]”).
local function add_space_word_links(space_word, split_dash)
	local space_word_no_punct, punct = rmatch(space_word, "^(.*)([,;:?!])$")
	space_word_no_punct = space_word_no_punct or space_word
	punct = punct or ""
	local words
	-- don’t split prefixes and suffixes
	if not split_dash or rfind(space_word_no_punct, "^%-") or rfind(space_word_no_punct, "%-$") then
		words = {space_word_no_punct}
	else
		words = rsplit(space_word_no_punct, "%-")
	end
	local linked_words = {}
	for _, word in ipairs(words) do
		if not no_split_words[word] and rfind(word, "'") then
			word = rsub(word, "([^']+')", "[[%1]]")
			word = rsub(word, "%]([^%[%]]*)$", "][[%1]]")
		else
			word = "[[" .. word .. "]]"
		end
		table.insert(linked_words, word)
	end
	return table.concat(linked_words, "-") .. punct
end

-- Auto-add links to a lemma. We split on spaces, and also on hyphens
-- if split_dash is given or the word has no spaces. In addition, we split
-- on apostrophes, including the apostrophe in the link to its left
-- (so we auto-split "de l’eau" as "[[de]] [[l']][[eau]]"). We don’t always
-- split on hyphens because of cases like “boire du petit-lait” where
-- “petit-lait” should be linked as a whole, but provide the option to do it
-- for cases like “croyez-le ou non”. If there’s no space, however, then
-- it makes sense to split on hyphens by default (e.g. for “avant-avant-hier”).
-- Cases where only some of the hyphens should be split can always be handled
-- by explicitly specifying the head (e.g. “Nord-Pas-de-Calais”).
local function add_lemma_links(lemma, split_dash)
	if not rfind(lemma, " ") then
		split_dash = true
	end
	local words = rsplit(lemma, " ")
	local linked_words = {}
	for _, word in ipairs(words) do
		table.insert(linked_words, add_space_word_links(word, split_dash))
	end
	local retval = table.concat(linked_words, " ")
	-- If we ended up with a single link consisting of the entire lemma,
	-- remove the link.
	local unlinked_retval = rmatch(retval, "^%[%[([^%[%]]*)%]%]$")
	return unlinked_retval or retval
end

-- The main entry point.
-- This is the only function that can be invoked from a template.
function export.show(frame)
	local PAGENAME = mw.title.getCurrentTitle().text
	
	local poscat = frame.args[1] or error("Part of speech has not been specified. Please pass parameter 1 to the module invocation.")
	
	local params = {
		["head"] = {list = true},
		["suff"] = {type = "boolean"},
		["splitdash"] = {type = "boolean"},
	}

	if rfind(PAGENAME, " ") then
		track("space")
	end

	if pos_functions[poscat] then
		for key, val in pairs(pos_functions[poscat].params) do
			params[key] = val
		end
	end

	local parargs = frame:getParent().args
	local args = require("Module:parameters").process(parargs, params)

	local heads = args["head"]
	if pos_functions[poscat] and pos_functions[poscat].param1_is_head and args[1] then
		-- FIXME! REMOVE ME! Hack to correspond to previous template code in {{fr-adv}}.
		if args[1] == "-" then
			track("arg1dash")
		else
			table.insert(heads, 1, args[1])
		end
	end
	local auto_linked_head = add_lemma_links(PAGENAME, args["splitdash"])
	if #heads == 0 then
		heads = {auto_linked_head}
	else
		for _, head in ipairs(heads) do
			if head == auto_linked_head then
				track("redundant-head")
			end
		end
	end
		
	local data = {lang = lang, pos_category = poscat, categories = {}, heads = heads, genders = {}, inflections = {}, categories = {}}
	
	if args["suff"] then
		data.pos_category = "နောက်ဆက်များ"
		
		if suffix_categories[poscat] then
			local singular_poscat = poscat:gsub("s$", "")
			table.insert(data.categories, lang:getCanonicalName() .. " " .. singular_poscat .. "-forming suffixes")
		else
			error("No category exists for suffixes forming " .. poscat .. ".")
		end
	end
	
	if pos_functions[poscat] then
		pos_functions[poscat].func(args, data)
	end
	
	return require("Module:headword").full_headword(data)
end

local allowed_genders = {
	["m"] = true,
	["f"] = true,
	["m-p"] = true,
	["f-p"] = true,
	["m-s"] = true,
	["f-s"] = true,
}

local function get_noun_pos(is_proper)
	return {
		params = {
			[1] = {},
			["g"] = {list = true},
			[2] = {list = true},
			["f"] = {list = true},
			["m"] = {list = true},
			["dim"] = {list = true},
			},
		func = function(args, data)
			local PAGENAME = mw.title.getCurrentTitle().text
			
			local function default_plural()
				if rfind(PAGENAME, 'x$') then
					track("default-x")
				end
				if rfind(PAGENAME, 'z$') then
					track("default-z")
				end
				if rfind(PAGENAME, '[sxz]$') then
					return PAGENAME
				elseif rfind(PAGENAME, '[ae]u$') then
					return "x"
				elseif rfind(PAGENAME, 'al$') then
					return mw.ustring.sub(PAGENAME, 1, -3) .. 'aux'
				else
					return "s"
				end
			end

			-- Gather genders
			local function insert_gender(g)
				if g == "mf" then
					table.insert(data.genders, "m")
					table.insert(data.genders, "f")
				else
					table.insert(data.genders, g)
				end
			end
			insert_gender(args[1])
			for _, g in ipairs(args.g) do
				insert_gender(g)
			end

			-- Gather all the plural parameters from the numbered parameters.
			local plurals = args[2]
			plurals.label = "ဗဟုဝုစ်"
			plurals.accel = {form = "p"}
			plurals.request = true
			
			-- Gather all the feminine parameters
			local feminines = args["f"]
			feminines.label = "ဣတ္ထိလိင်"
			
			-- Gather all the masculine parameters
			local masculines = args["m"]
			masculines.label = "ပုလ္လိင်"
			
			-- Add categories for genders
			if #data.genders == 0 then
				table.insert(data.genders, "?")
			end
			
			local mode = nil
			
			for _, g in ipairs(data.genders) do
				if g == "m-p" or g == "f-p" then
					mode = "p"
				end

				if g == "?" and (is_proper or mw.title.getCurrentTitle().nsText == "တမ်းပလိတ်") then
					-- allow unknown gender in template example and proper nouns,
					-- since there are currently so many proper nouns with
					-- unspecified gender
				elseif g and g ~= "" and not allowed_genders[g] then
					error("Unrecognized French gender: " .. g)
				end

				if g == "m" or g == "m-p" or g == "m-s" then
					table.insert(data.categories, "ပြင်သစ် ပုလ္လိင် နာမ်များ")
				elseif g == "f" or g == "f-p" or g == "f-s" then
					table.insert(data.categories, "ပြင်သစ် ဣတ္ထိလိင် နာမ်များ")
				end
			end
			
			-- Decide how to show the plurals
			mode = mode or plurals[1]
			
			-- Plural is not attested
			if mode == "!" then
				table.insert(data.inflections, {label = "plural not attested"})
				table.insert(data.categories, "French nouns with unattested plurals")
			-- Plural-only noun, doesn't have a plural
			elseif mode == "p" then
				table.insert(data.inflections, {label = "plural only"})
				table.insert(data.categories, "French pluralia tantum")
			else
				-- Plural is unknown
				if mode == "?" then
					table.remove(plurals, 1)  -- Remove the mode parameter
				-- Uncountable noun; may occasionally have a plural
				elseif mode == "-" then
					table.remove(plurals, 1)  -- Remove the mode parameter
					table.insert(data.categories, "ပြင်သစ် ရေတွက်မရ နာမ်များ")
				
					-- If plural forms were given explicitly, then show "usually"
					if #plurals > 0 then
						track("count-uncount")
						table.insert(data.inflections, {label = "များသောအားဖြင့် [[နောက်ဆက်တွဲ:ခက်ဆစ်#uncountable|ရေတွက်မရ]]"})
						table.insert(data.categories, "ပြင်သစ် ရေတွက်ရ နာမ်များ")
					else
						table.insert(data.inflections, {label = "[[နောက်ဆက်တွဲ:ခက်ဆစ်#uncountable|ရေတွက်မရ]]"})
					end
				-- Mixed countable/uncountable noun, always has a plural
				elseif mode == "~" then
					table.remove(plurals, 1)  -- Remove the mode parameter
					table.insert(data.inflections, {label = "[[နောက်ဆက်တွဲ:ခက်ဆစ်#countable|ရေတွက်ရ]] နှင့် [[နောက်ဆက်တွဲ:ခက်ဆစ်#uncountable|ရေတွက်မရ]]"})
					table.insert(data.categories, "ပြင်သစ် ရေတွက်မရ နာမ်များ")
					table.insert(data.categories, "ပြင်သစ် ရေတွက်ရ နာမ်များ")
				
					-- If no plural was given, add a default one now
					if #plurals == 0 then
						table.insert(plurals, default_plural())
					end
				-- Default proper noun; uncountable unless plural(s) specified
				elseif is_proper then
					if #plurals > 0 then
						table.insert(data.categories, "ပြင်သစ် ရေတွက်ရ နာမ်များ")
					else
						table.insert(data.categories, "ပြင်သစ် ရေတွက်မရ နာမ်များ")
					end
				-- The default, always has a plural
				else
					table.insert(data.categories, "ပြင်သစ် ရေတွက်ရ နာမ်များ")
					
					-- If no plural was given, add a default one now
					if #plurals == 0 then
						table.insert(plurals, default_plural())
					end
				end
				
				-- Process the plural forms
				for i, pl in ipairs(plurals) do
					if pl == "*" then
						pl = PAGENAME
					elseif pl == "s" then
						pl = PAGENAME .. "s"
					elseif pl == "x" then
						pl = PAGENAME .. "x"
					end

					if not exists(pl) then
						table.insert(data.categories, "French nouns with red links in their headword lines")
					end
					
					plurals[i] = pl
				end
		
				-- Add the plural forms; do this in some cases even if no plurals
				-- specified so we get a "please provide plural" message.
				if mode ~= "-" and (not is_proper or mode) or #plurals > 0 then
					table.insert(data.inflections, plurals)
				end
			end
			
			-- Add the feminine forms
			if #feminines > 0 then
				table.insert(data.inflections, feminines)
				
				for _, f in ipairs(feminines) do
					if not exists(f) then
						table.insert(data.categories, "French nouns with red links in their headword lines")
					end
				end
			end
			
			-- Add the masculine forms
			if #masculines > 0 then
				table.insert(data.inflections, masculines)
				
				for _, m in ipairs(masculines) do
					if not exists(m) then
						table.insert(data.categories, "French nouns with red links in their headword lines")
					end
				end
			end

			-- Handle diminutives
			if #args.dim > 0 then
				local dims_infl = mw.clone(args.dim)
				dims_infl.label = "diminutive"
				dims_infl.accel = {form = "diminutive"}
				table.insert(data.inflections, dims_infl)
			end
		end
	}
end

pos_functions["နာမ်များ"] = get_noun_pos(false)

pos_functions["တစ်ဦးဆိုင်နာမ်များ"] = get_noun_pos(true)

pos_functions["နာမ်စားများ"] = {
	params = {
		["head"] = {list = true},
		[1] = {alias_of = "g"},
		["g"] = {list = true},
		["f"] = {list = true},
		["fqual"] = {list = true, allow_holes = true},
		["m"] = {list = true},
		["mqual"] = {list = true, allow_holes = true},
		["fp"] = {list = true},
		["fpqual"] = {list = true, allow_holes = true},
		["mp"] = {list = true},
		["mpqual"] = {list = true, allow_holes = true},
		["p"] = {list = true},
		["pqual"] = {list = true, allow_holes = true},
		},
	func = function(args, data)
		local PAGENAME = mw.title.getCurrentTitle().text
		
		-- Gather genders
		local function insert_gender(g)
			if g == "mf" then
				table.insert(data.genders, "m")
				table.insert(data.genders, "f")
			else
				table.insert(data.genders, g)
			end
		end
		for _, g in ipairs(args.g) do
			insert_gender(g)
		end

		local function process_inflection(label, infls, quals)
			infls.label = label
			for i, infl in ipairs(infls) do
				if quals[i] then
					infls[i] = {term = infl, qualifiers = {quals[i]}}
				end
			end
		end

		-- Gather all inflections.
		process_inflection("masculine", args["m"], args["mqual"])			
		process_inflection("feminine", args["f"], args["fqual"])			
		process_inflection("masculine plural", args["mp"], args["mpqual"])			
		process_inflection("feminine plural", args["fp"], args["fpqual"])			
		process_inflection("plural", args["p"], args["pqual"])			

		-- Add categories for genders
		if #data.genders == 0 then
			table.insert(data.genders, "?")
		end

		-- Validate/canonicalize genders			
		for i, g in ipairs(data.genders) do
			if g == "m." then
				data.genders[i] = "m"
			elseif g == "f." then
				data.genders[i] = "f"
			elseif g == "?" and mw.title.getCurrentTitle().nsText == "တမ်းပလိတ်" then
				-- allow unknown gender in template example
			elseif g == "?" then
				-- FIXME, remove this branch once we’ve added the required genders
				track("missing-pron-gender")
			elseif g and g ~= "" and not allowed_genders[g] then
				error("Unrecognized French gender: " .. g)
			end
		end

		-- Add the inflections
		if #args["m"] > 0 then
			table.insert(data.inflections, args["m"])
		end
		if #args["f"] > 0 then
			table.insert(data.inflections, args["f"])
		end
		if #args["mp"] > 0 then
			table.insert(data.inflections, args["mp"])
		end
		if #args["fp"] > 0 then
			table.insert(data.inflections, args["fp"])
		end
		if #args["p"] > 0 then
			table.insert(data.inflections, args["p"])
		end
	end
}


local function get_misc_pos()
	return {
		param1_is_head = true,
		params = {
			[1] = {},
		},
		func = function(args, data)
		end
	}
end

pos_functions["ကြိယာဝိသေသနများ"] = get_misc_pos()
	
pos_functions["ဝိဘတ်များ"] = get_misc_pos()

pos_functions["phrases"] = get_misc_pos()

pos_functions["prepositional phrases"] = get_misc_pos()

pos_functions["စကားပုံများ"] = get_misc_pos()

pos_functions["ပုဒ်ဖြတ်ပုဒ်ရပ်သင်္ကေတများ"] = get_misc_pos()

pos_functions["diacritical marks"] = get_misc_pos()

pos_functions["အာမေဋိတ်များ"] = get_misc_pos()

pos_functions["ရှေ့ဆက်များ"] = get_misc_pos()

pos_functions["အတိုချုံ့များ"] = get_misc_pos()

pos_functions["နာမဝိသေသနများ"] = {
	params = {
		[1] = {},
		["inv"] = {},
		["m2"] = {},
		["onlyg"] = {},
		["f"] = {list = true},
		["mp"] = {list = true},
		["fp"] = {list = true},
		["p"] = {list = true},
		["current"] = {list = true},
		["comp"] = {list = true},
		["sup"] = {list = true},
		},
	func = function(args, data)
		local PAGENAME = mw.title.getCurrentTitle().text
		if args.onlyg == "p" or args.onlyg == "m-p" or args.onlyg == "f-p" then
			table.insert(data.categories, "French pluralia tantum")
		end
		if args.onlyg == "s" or args.onlyg == "f-s" or args.onlyg == "f-s" then
			table.insert(data.categories, "French singularia tantum")
		end
		if args.onlyg then
			table.insert(data.categories, "French defective adjectives")
		end
		if args.onlyg == "p" then
			table.insert(data.inflections, {label = "ဗဟုဝုစ်သာ"})
			if args[1] ~= "mf" then
				-- Handle feminine plurals
				if #args.fp > 0 then
					local fplurals_infl = mw.clone(args.fp)
					fplurals_infl.label = "ဣတ္ထိလိင် ဗဟုဝုစ်"
					fplurals_infl.accel = {form = "f|p"}
					table.insert(data.inflections, fplurals_infl)
				end
			end
		elseif args.onlyg == "s" then
			table.insert(data.inflections, {label = "ဧကဝုစ်သာ"})
			if not (args[1] == "mf" or #args.f == 0 and rfind(PAGENAME, "e$")) then
				-- Handle feminines
				local feminines = #args.f > 0 and args.f or add_suffix(#args.current > 0 and args.current or {PAGENAME}, "e")
				local feminines_infl = mw.clone(feminines)
				feminines_infl.label = "ဣတ္ထိလိင် ဧကဝုစ်"
				feminines_infl.accel = {form = "f|s"}
				table.insert(data.inflections, feminines_infl)
			end
		elseif args.onlyg == "m" then
			table.insert(data.genders, "m")
			table.insert(data.inflections, {label = "ပုလ္လိင်သာ"})
			-- Handle masculine plurals
			local mplurals = #args.mp > 0 and args.mp or add_suffix(#args.current > 0 and args.current or {PAGENAME}, "s")
			local mplurals_infl = mw.clone(mplurals)
			mplurals_infl.label = "ပုလ္လိင် ဗဟုဝုစ်"
			mplurals_infl.accel = {form = "m|p"}
			table.insert(data.inflections, mplurals_infl)
		elseif args.onlyg == "f" then
			table.insert(data.genders, "f")
			table.insert(data.inflections, {label = "ဣတ္ထိလိင်သာ"})
			-- Handle feminine plurals
			local fplurals = #args.fp > 0 and args.fp or add_suffix(#args.current > 0 and args.current or {PAGENAME}, "s")
			local fplurals_infl = mw.clone(fplurals)
			fplurals_infl.label = "ဣတ္ထိလိင် ဗဟုဝုစ်"
			fplurals_infl.accel = {form = "f|p"}
			table.insert(data.inflections, fplurals_infl)
		elseif args.onlyg then
			table.insert(data.genders, args.onlyg)
			table.insert(data.inflections, {label = "defective"})
		else
			-- Gather genders
			local gender = args[1]
			-- Default to mf if base form ends in -e and no feminine,
			-- feminine plural or gender specified
			if not gender and #args.f == 0 and #args.fp == 0 and rfind(PAGENAME, "e$") then
				gender = "mf"
			end
			
			if #args.current > 0 then
				track("adj-current")
			end
			
			if args.inv then
				table.insert(data.inflections, {label = "invariable"})
			end
			
			-- Handle plurals of mf adjectives
			local plurals = #args.p > 0 and args.p or {PAGENAME .. "s"}
			if not args.inv and gender == "mf" then
				local plurals_infl = mw.clone(plurals)
				plurals_infl.label = "ဗဟုဝုစ်"
				plurals_infl.accel = {form = "p"}
				table.insert(data.inflections, plurals_infl)
			end
			
			if not args.inv and gender ~= "mf" then
				-- Handle case of special masculine singular before vowel
				if args.m2 then
					local masc_before_vowel = {args.m2}
					masc_before_vowel.label = "masculine singular before vowel"
					masc_before_vowel.accel = {form = "m|s"}
					table.insert(data.inflections, masc_before_vowel)
				end
				
				-- Handle feminines
				local feminines = #args.f > 0 and args.f or add_suffix(#args.current > 0 and args.current or {PAGENAME}, "e")
				local feminines_infl = mw.clone(feminines)
				feminines_infl.label = "ဣတ္ထိလိင် ဧကဝုစ်"
				feminines_infl.accel = {form = "f|s"}
				table.insert(data.inflections, feminines_infl)
				
				-- Handle masculine plurals
				local mplurals = #args.mp > 0 and args.mp or add_suffix(#args.current > 0 and args.current or {PAGENAME}, "s")
				local mplurals_infl = mw.clone(mplurals)
				mplurals_infl.label = "ပုလ္လိင် ဗဟုဝုစ်"
				mplurals_infl.accel = {form = "m|p"}
				table.insert(data.inflections, mplurals_infl)
				
				-- Handle feminine plurals
				local fplurals = #args.fp > 0 and args.fp or add_suffix(feminines, "s")
				local fplurals_infl = mw.clone(fplurals)
				fplurals_infl.label = "ဣတ္ထိလိင် ဗဟုဝုစ်"
				fplurals_infl.accel = {form = "f|p"}
				table.insert(data.inflections, fplurals_infl)
			end
		end
		
		-- Handle comparatives
		if #args.comp > 0 then
			local comps_infl = mw.clone(args.comp)
			comps_infl.label = "နှိုင်းယှဉ်ရ"
			comps_infl.accel = {form = "comparative"}
			table.insert(data.inflections, comps_infl)
		end
		
		-- Handle superlatives
		if #args.sup > 0 then
			local sups_infl = mw.clone(args.sup)
			sups_infl.label = "အသာလွန်ဆုံး"
			sups_infl.accel = {form = "superlative"}
			table.insert(data.inflections, sups_infl)
		end
		
		-- Check existence
		for key, val in pairs(data.inflections) do
			for i, form in ipairs(val) do
				if not exists(form) then
					table.insert(data.categories, "French adjectives with red links in their headword lines")
					return
				end
			end
		end
	end
}

pos_functions["verbs"] = {
	param1_is_head = true,
	params = {
		[1] = {},
		["type"] = {list = true},
	},
	func = function(args, data)
		local PAGENAME = mw.title.getCurrentTitle().text
		for _, ty in ipairs(args.type) do
			local category, label
			if ty == "auxiliary" then
				category = "auxiliary verbs"
			elseif ty == "defective" then
				category = "defective verbs"
				label = "[[defective]]"
			elseif ty == "impersonal" then
				category = "impersonal verbs"
				label = "[[impersonal]]"
			elseif ty == "modal" then
				category = "modal verbs"
			elseif ty == "reflexive" then
				category = "reflexive verbs"
			elseif ty == "transitive" then
				label = "[[transitive]]"
			elseif ty == "intransitive" then
				label = "[[intransitive]]"
			elseif ty == "ambitransitive" or ty == "ambi" then
				label = "[[transitive]] and [[intransitive]]"
			end
			if category then
				table.insert(data.categories, "ပြင်သစ် " .. category)
			end
			if label then
				table.insert(data.inflections, {label = label})
			end
		end
	end
}

return export

-- For Vim, so we get 4-space tabs
-- vim: set ts=4 sw=4 noet: