Module:ybi-IPA

From Wiktionary, the free dictionary
Jump to navigation Jump to search

Yamphu IPA pronunciation module. See {{ybi-IPA}}.


local export = {}

local lang = require("Module:languages").getByCode("ybi")
local m_IPA = require("Module:IPA")

local gsub = mw.ustring.gsub
local gmatch = mw.ustring.gmatch
local find = mw.ustring.find
local toNFC = mw.ustring.toNFC

-- Lookup table from a single transliteration character to its IPA value.
-- export.toIPA passes it to gsub with the pattern ".", so it is consulted once
-- per character; characters that have no entry here are left as they are.
local correspondences = {
	-- Consonants, length marks and nasalisation.
	[":"] = "ː",
	["ṅ"] = "ŋ",
	["g"] = "ɡ",
	["k"] = "k",
	["p"] = "p",
	["b"] = "b",
	["c"] = "t͡s",
	["j"] = "d͡z",
	["ñ"] = "ɲ",
	["ṭ"] = "ʈ",
	["ḍ"] = "ɖ",
	["t"] = "t",
	["d"] = "d",
	["y"] = "j",
	["w"] = "w",
	["l"] = "l",
	["s"] = "s",
	["ś"] = "ʃ",
	["ṣ"] = "s",
	["h"] = "h",
	["n"] = "n",
	["ṃ"] = "̃", -- becomes a combining tilde on the preceding character
	["’"] = "ʔ",
	["r"] = "r",
	["ṇ"] = "ɳ",
	["'"] = "ʔ",
	-- The next two keys are invisible zero-width characters (presumably
	-- ZWJ and ZWNJ -- verify); both are deleted from the output.
	["‍"] = "",
	["‌"] = "",

	-- Plain vowels.
	["a"] = "ʌ",
	["i"] = "i",
	["u"] = "u",
	["e"] = "e",
	["o"] = "o",
	["ê"] = "ɛ",
	["ô"] = "ɔ",

	-- Vowels written with a macron; all but "ā" receive a length mark.
	["ā"] = "a",
	["ī"] = "iː",
	["ū"] = "uː",
	["ē"] = "eː",
	["ō"] = "oː",

	["ḥ"] = "ː",

	-- Separators are kept; a free-standing combining macron becomes a length mark.
	[" "] = " ",
	[","] = ",",
	['̄'] = 'ː',
}

-- Characters treated as vowels (including length marks) when the
-- syllabification patterns are assembled.
local vowels = "aiueoôêɔɛaːāīūēōô̄ê̄ˑ"
-- Consonants after which a following "h" is rewritten as "ʱ" in export.toIPA.
local weak_h_c = "gjdṇḍbvrṟwy"
-- NOTE(review): the two stress marks below are not referenced anywhere in the
-- visible part of this module.
local primary_stress = "ˈ"
local secondary_stress = "ˌ"
-- Pattern: one of the weak_h_c consonants (captured) immediately followed by "h".
local weak_h = "([" .. weak_h_c .. "])h"
-- Pattern: the consonants after which "h" is rewritten as "ʰ" (captured).
local aspirate = "([kcṭtp])"
-- Pattern with three captures: a vowel with an optional combining tilde, a
-- non-empty run of characters that are neither vowels nor "." nor "-", and a
-- second vowel with an optional combining tilde.
local syllabify_pattern = "([" .. vowels .. "]̃?)([^" .. vowels .. "%.%-]+)([" .. vowels .. "]̃?)"

-- Cuts `text` into a list of chunks. A chunk keeps growing only while it is
-- still a single listed consonant or one of the listed consonants followed by
-- "h"; any other character closes the chunk and starts a new one.
-- Concatenating the returned list gives `text` back. The first entry is the
-- empty string when `text` does not begin with a listed consonant.
local function find_consonants(text)
	local single_consonant = "^[kgṅcjñṭḍṇɽtdnpbmɽ̃yrlɳwvɾj’'wśṣshqxġzžḻṛṟfθðṉ]$"
	local consonant_plus_h = "^[kgcjṭḍṇtɽdɽ̃pbṛṟ]h$"

	local pieces = {}
	local pending = ""
	-- The appended space never matches either pattern, so it forces the last
	-- real chunk to be stored; the space itself is never added to the list.
	for codepoint in mw.ustring.gcodepoint(text .. " ") do
		local ch = mw.ustring.char(codepoint)
		local candidate = pending .. ch
		if find(candidate, single_consonant) or find(candidate, consonant_plus_h) then
			pending = candidate
		else
			pieces[#pieces + 1] = pending
			pending = ch
		end
	end
	return pieces
end

-- Runs the syllabification passes over `text` and returns the result.
--
-- For every vowel + consonant run + vowel match, the consonant run is split
-- with find_consonants and a separator is inserted after the first chunk (or
-- before it when there is only one chunk). The separator used here is the
-- empty string, so this step adds no visible boundary mark.
--
-- NOTE(review): the three vowel patterns below are built as "(" .. vowels .. ")"
-- without square brackets, and the first one contains a regex-style "(?=",
-- which Lua patterns do not treat as a lookahead. As written they can only
-- match the literal `vowels` string, not an individual vowel. They are kept
-- byte-for-byte so the module's output does not change; confirm whether vowel
-- hiatus was meant to receive a "." before correcting them.
local function syllabify(text)
	-- Each stage is applied twice; presumably so that matches overlapping a
	-- previous match are picked up on the second pass.
	for _ = 1, 2 do
		text = gsub(text, syllabify_pattern, function(a, b, c)
			-- Must be local: the original assigned a global here.
			local b_set = find_consonants(b)
			table.insert(b_set, #b_set > 1 and 2 or 1, "")
			return a .. table.concat(b_set) .. c
		end)
		text = gsub(text, "(" .. vowels .. ")(?=" .. vowels .. ")", "%1.")
	end
	for _ = 1, 2 do
		text = gsub(text, "(" .. vowels .. ")(" .. vowels .. ")", "%1.%2")
	end
	return text
end

-- Every character of `identical` is registered in `correspondences` as
-- mapping to itself.
local identical = "knlsfzθð"
for letter in gmatch(identical, ".") do
	correspondences[letter] = letter
end

-- Passes `term`, together with this module's language object, to full_link
-- from Module:links and returns whatever that call returns.
function export.link(term)
	local m_links = require("Module:links")
	return m_links.full_link({ term = term, lang = lang })
end

--- Converts a term to an IPA string.
-- @param text      the term; it is first run through lang:transliterate
-- @param phonetic  when truthy, doubled affricates (cc, jj and their
--                  h-marked forms) are rewritten with a first element that
--                  carries the "̚" diacritic
-- @return the NFC-normalised IPA string, without surrounding slashes or brackets
-- Raises an error when the term cannot be transliterated.
function export.toIPA(text, phonetic)
	local translit = lang:transliterate(text)

	if not translit then
		error('The term "' .. text .. '" could not be transliterated.')
	end

	if phonetic then
		-- The h-marked sequences are handled before the plain ones so that
		-- the plain rules cannot consume part of them.
		translit = gsub(translit, 'c(h?)c(h)', 't̚t͡sʰ')
		translit = gsub(translit, 'cc', 't̚t͡s')
		translit = gsub(translit, 'j(h?)j(h)', 'd̚d͡zʱ')
		translit = gsub(translit, 'jj', 'd̚d͡z')
	end

	-- Asterisks are dropped ("*" is escaped because it is a pattern quantifier).
	translit = gsub(translit, "%*", "")
	translit = gsub(translit, "͠", "̃")
	-- NOTE(review): pattern and replacement render identically here; they may
	-- be distinct code points -- verify before simplifying this line.
	translit = gsub(translit, "̃", "̃")
	translit = gsub(translit, '̄', 'ː')
	translit = gsub(translit, "%-", " ")
	translit = syllabify(translit)

	-- aspiration rules
	translit = gsub(translit, aspirate .. "h", '%1ʰ')
	translit = gsub(translit, weak_h, '%1ʱ')
	-- When a "." separates the consonant from its "h", the "." is moved in
	-- front of the consonant.
	translit = gsub(translit, '([' .. weak_h_c .. '])%.h', '.%1ʱ')
	translit = gsub(translit, aspirate .. '%.h', '.%1ʰ')
	translit = gsub(translit, "%.ː", "ː.")

	-- Character-by-character lookup; characters without an entry are kept.
	translit = gsub(translit, ".", correspondences)

	-- formatting
	-- Put the combining tilde before the length mark.
	translit = gsub(translit, "ː̃", "̃ː")
	-- Same reordering across a literal "." separator. The dot must be escaped:
	-- unescaped it matches any character, which would then be replaced by "."
	-- and lost (e.g. the second vowel of "iːʌ̃").
	translit = gsub(translit, "ː%.̃", "̃ː.")
	translit = gsub(translit, "%.$", " ")
	translit = gsub(translit, "%.?%-", ".")
	translit = gsub(translit, ":", "ː")

	return toNFC(translit)
end

--- Template entry point: builds the formatted pronunciation output.
-- Reads the positional arguments of the parent frame; when the first one is
-- absent, the current page title is used as the only term. Empty arguments
-- are skipped. Each term yields a /phonemic/ entry and, when it differs, an
-- additional [phonetic] entry.
-- @param frame  the frame object passed by the invoking template
-- @return the result of m_IPA.format_IPA_full for the collected entries
function export.make(frame)
	local args = frame:getParent().args
	local pagetitle = mw.title.getCurrentTitle().text

	local p, results = {}, {}

	if args[1] then
		for _, item in ipairs(args) do
			if item ~= "" then
				table.insert(p, item)
			end
		end
	else
		p = { pagetitle }
	end

	for _, term in ipairs(p) do
		-- Each conversion is computed once and reused below.
		local phonemic = export.toIPA(term)
		local phonetic = export.toIPA(term, true)

		table.insert(results, { pron = "/" .. phonemic .. "/" })
		if phonetic ~= phonemic then
			table.insert(results, { pron = "[" .. phonetic .. "]" })
		end
	end

	-- Writes the collected entries to the Scribunto debug log.
	mw.logObject(results)

	return m_IPA.format_IPA_full { lang = lang, items = results }
end

return export