Module:grc-accent/testcases

The following documentation is located at Module:grc-accent/testcases/documentation. ^[edit]

Useful links: root page • root page’s subpages • links • transclusions • tested module • sandbox

All tests passed. (refresh)

test_add_accent:
Text	Expected	Actual
κρεως (1, noun)	κρέως	κρέως
Τρως (1, noun)	Τρώς	Τρώς
πολεως (1, noun)	πόλεως	πόλεως
πολεων (1, noun)	πόλεων	πόλεων
Πειριθοι (2, noun)	Πειρίθοι	Πειρίθοι
Ᾰ̓θηναιοιν (-2, noun)	Ᾰ̓θηναίοιν	Ᾰ̓θηναίοιν
Ᾰ̓θηναιοις (-2, noun)	Ᾰ̓θηναίοις	Ᾰ̓θηναίοις
βᾰρειαι (-2, noun)	βᾰρεῖαι	βᾰρεῖαι
ᾰ̓ληθειαι (-3, noun)	ᾰ̓λήθειαι	ᾰ̓λήθειαι
Ᾰ̓θηναιοι (3, noun)	Ᾰ̓θηναῖοι	Ᾰ̓θηναῖοι
βᾰρειαι (2, noun)	βᾰρεῖαι	βᾰρεῖαι
ᾰ̓ληθειαι (2, noun)	ᾰ̓λήθειαι	ᾰ̓λήθειαι
αἱμᾰ (1, noun)	αἷμᾰ	αἷμᾰ
λογος (-2)	λόγος	λόγος
προτερᾱ (-3)	προτέρᾱ	προτέρᾱ
Αἰθιοπων (2)	Αἰθιόπων	Αἰθιόπων
χωρῶν (1)	χωρῶν	χωρῶν
δημος (1)	δῆμος	δῆμος
τοιουτος (2)	τοιοῦτος	τοιοῦτος
χωρᾱ (1)	χώρᾱ	χώρᾱ
μοιρᾰ (1)	μοῖρᾰ	μοῖρᾰ
προτερᾱ (1)	προτέρᾱ	προτέρᾱ
ἐγενετο (1)	ἐγένετο	ἐγένετο
φως (1, circumflex)	φῶς	φῶς
μοιρα (1)	μοίρα	μοίρα
μοιρα (1, circumflex)	μοῖρα	μοῖρα
ἐγενετο (1, circumflex)	ἐγένετο	ἐγένετο
λογος (1)	λόγος	λόγος
λογος (1, circumflex)	λόγος	λόγος

test_detect_accent:
Text	Expected	Actual
ἐγένετο	2, acute	2, acute
ἐγένετο (from end)	3, acute	3, acute
τοιοῦτος	2, circumflex	2, circumflex
τοιοῦτος (from end)	2, circumflex	2, circumflex
φῶς	1, circumflex	1, circumflex
φῶς (from end)	1, circumflex	1, circumflex

test_find_ambig:
Text	Expected	Actual
Διονύσια	ι, ύ, ι	ι, ύ, ι
πᾶς
οἵᾳ
μίᾰ
ἐᾱ́ν

test_get_accent_term:
Text	Expected	Actual
πολὺς	barytone	barytone
πολύς	oxytone	oxytone
λέγω	paroxytone	paroxytone
γίγνομαι	proparoxytone	proparoxytone
φῶς	perispomenon	perispomenon
οἷος	properispomenon	properispomenon

test_get_length:
	Text	Expected	Actual
ambiguous vowels
	αἷμᾰ	long, short	long, short
	μοῖρα	long, either	long, either
	πάθος	either, short	either, short
	πᾰ́θος	short, short	short, short
	ἆρᾰ	long, short	long, short
capital letters
	ᾍδης	long, long	long, long
	Αἰσχύλος	long, either, short	long, either, short
	Ἠλέκτρᾱ	long, short, long	long, short, long
	Ἑλλάς	short, either	short, either
short final diphthongs
	ᾰ̓λήθειαι	short, long, long, short	short, long, long, short
	Ᾰ̓θηναιοι	short, long, long, short	short, long, long, short
	Ᾰ̓θηναίοιν	short, long, long, long	short, long, long, long
	Ᾰ̓θηναίοις	short, long, long, long	short, long, long, long

test_get_weight:
Text	Expected	Actual
ὀρθ (1)	heavy	heavy
ὀρθ	heavy	heavy
μικρ (1)	heavy	heavy
μικρ	heavy	heavy
ἰδι (1)	(nil)	(nil)
ἰδι	(nil)	(nil)
ῐ̓δῐ (1)	light	light
ῐ̓δῐ	light	light
φῐλ (1)	light	light
φῐλ	light	light

test_harmonize_length:
	Text	Expected	Actual
	ᾰ̓́λοξ, ἄλοκος	ᾰ̓́λοξ, ᾰ̓́λοκος	ᾰ̓́λοξ, ᾰ̓́λοκος
	ἄλοκος, ᾰ̓́λοξ	ᾰ̓́λοκος, ᾰ̓́λοξ	ᾰ̓́λοκος, ᾰ̓́λοξ
	ἄλοξ, ἄλοκος	ᾰ̓́λοξ, ᾰ̓́λοκος	ᾰ̓́λοξ, ᾰ̓́λοκος
	Αἰθίοψ, Αἰθίοπος	Αἰθῐ́οψ, Αἰθῐ́οπος	Αἰθῐ́οψ, Αἰθῐ́οπος
transfer length only if both vowels have the same breathing mark
	ἄξιος, ᾱ	ἄξιος, ᾱ	ἄξιος, ᾱ

test_length_at:
Text	Expected	Actual
μοῖρα (2 syllables from end)	long	long
πάθους (2 syllables from end)	either	either
πᾰ́θος (2 syllables from end)	short	short

test_mark_implied_length:
Text	Expected	Actual
μοῖρα	μοῖρᾰ	μοῖρᾰ
χώρα	χώρᾱ	χώρᾱ
πάθος	πᾰ́θος	πᾰ́θος
ἀλήθεια	ἀλήθειᾰ	ἀλήθειᾰ

test_strip_accent:
	Text	Expected	Actual
	ᾰ̓́νθρωπος	ανθρωπος	ανθρωπος
	Πηληῐ̈ᾰ́δης	Πηληιαδης	Πηληιαδης

test_strip_tone:
	Text	Expected	Actual
	Πηληῐ̈ᾰ́δης	Πηληῐ̈ᾰδης	Πηληῐ̈ᾰδης
	Ᾱ̔́ͅδης	Ᾱ̔ͅδης	Ᾱ̔ͅδης
	μολὼν λαβέ	μολων λαβε	μολων λαβε
circumflex → macron
	πᾶς	πᾱς	πᾱς
circumflexes on diphthongs should not be replaced with macrons
	οἷαι	οἱαι	οἱαι
	γᾰλεοῦ	γᾰλεου	γᾰλεου

local tests = require("Module:UnitTests")
local m_accent = require("Module:grc-accent")

local m_utilities = require("Module:grc-utilities")
local m_table = require("Module:table")

local concat = table.concat
local insert = table.insert
local reverse_ipairs = m_table.reverseIpairs
local sparse_concat = m_table.sparseConcat
local table_reverse = m_table.reverse
local tag = m_utilities.tag
local toNFC = mw.ustring.toNFC

function tests:check_mark_implied_length(example, expected)
	self:equals(
		tag(example),
		toNFC(m_accent.mark_implied_length(example)),
		toNFC(expected),
		{ display = tag }
	)
end

local function display_find_ambig(word)
	local vowel_list = m_accent.find_ambig(word, true)
	return toNFC(concat(vowel_list, ", "))
end

function tests:check_find_ambig(example, expected)
	self:equals(
		tag(example),
		display_find_ambig(example),
		expected,
		{ display = tag }
	)
end

function tests:check_length_at(example, position, expected)
	self:equals(
		tag(example) .. " (" .. position .. " syllables from end)",
		m_accent.length_at(example, position),
		expected
	)
end

function tests:check_get_length(example, expected, is_noun)
	local lengths = {}
	local get_length = m_accent.get_length
	local tokens = m_utilities.tokenize(example)
	local token_count = #tokens
	local short_diphthong = is_noun
	for i, token in reverse_ipairs(tokens) do
		if m_accent.contains_vowel(token) then
			if i ~= token_count then
				short_diphthong = false
			end
			insert(lengths, get_length(token, short_diphthong))
		end
	end
	lengths = concat(table_reverse(lengths), ", ")
	
	self:equals(
		tag(example),
		lengths,
		expected
	)
end

function tests:check_harmonize_length(word1, word2, expected)
	self:equals(
		tag(word1 .. ", " .. word2),
		toNFC(concat({ m_accent.harmonize_length(word1, word2) }, ", ")),
		toNFC(expected),
		{ display = tag }
	)
end

function tests:check_strip_accent(example, expected)
	self:equals(
		tag(example),
		toNFC(m_accent.strip_accent(example)),
		toNFC(expected),
		{ display = tag }
	)
end

function tests:check_strip_tone(example, expected)
	self:equals(
		tag(example),
		toNFC(m_accent.strip_tone(example)),
		toNFC(expected),
		{ display = tag }
	)
end

function tests:check_get_weight(example, expected, position)
	self:equals(
		tag(example) .. " (" .. position .. ")",
		m_accent.get_weight(example, position),
		expected
	)
	self:equals(
		tag(example),
		m_accent.get_weight(example),
		expected
	)
end

function tests:check_add_accent(example, position, expected, circumflex, is_noun)
	self:equals(
		tag(example) .. " (" .. sparse_concat({ position, circumflex and "circumflex" or nil, is_noun and "noun" or nil }, ", ") .. ")",
		toNFC(m_accent.add_accent(example, position, { short_diphthong = is_noun, synaeresis = is_noun, circumflex = circumflex })),
		toNFC(expected),
		{ display = tag }
	)
end

local function display_detect_accent(syllable, accent_name)
	return syllable .. ", " .. accent_name
end

function tests:check_detect_accent(example, expected, from_end)
	self:equals(
		tag(example) .. (from_end and " (from end)" or ""),
		display_detect_accent(m_accent.detect_accent(example, from_end)),
		expected
	)
end

function tests:check_get_accent_term(example, expected)
	self:equals(
		tag(example),
		m_accent.get_accent_term(example),
		expected
	)
end

function tests:test_mark_implied_length()
	local examples = {
		{ "μοῖρα", "μοῖρᾰ" },
		{ "χώρα", "χώρᾱ" },
		{ "πάθος", "πᾰ́θος" },
		{ "ἀλήθεια", "ἀλήθειᾰ" },
	}
	
	tests:iterate(examples, "check_mark_implied_length")
end

function tests:test_find_ambig()
	local examples = {
		{ "Διονύσια", "ι, ύ, ι" },
		{ "πᾶς", "" },
		{ "οἵᾳ", "" },
		{ "μίᾰ", "" },
		{ "ἐᾱ́ν", "" },
	}
	
	tests:iterate(examples, "check_find_ambig")
end

function tests:test_length_at()
	local examples = {
		{ "μοῖρα", 2, "long" },
		{ "πάθους", 2, "either" },
		{ "πᾰ́θος", 2, "short" },
	}
	
	tests:iterate(examples, "check_length_at")
end

function tests:test_get_length()
	local examples = {
		"ambiguous vowels",
		{ "αἷμᾰ", "long, short", true },
		{ "μοῖρα", "long, either" },
		{ "πάθος", "either, short" },
		{ "πᾰ́θος", "short, short" },
		{ "ἆρᾰ", "long, short" },
		"capital letters",
		{ "ᾍδης", "long, long" },
		{ "Αἰσχύλος", "long, either, short" },
		{ "Ἠλέκτρᾱ", "long, short, long" },
		{ "Ἑλλάς", "short, either" },
		"short final diphthongs",
		{ "ᾰ̓λήθειαι", "short, long, long, short", true },
		{ "Ᾰ̓θηναιοι", "short, long, long, short", true },
		{ "Ᾰ̓θηναίοιν", "short, long, long, long", true },
		{ "Ᾰ̓θηναίοις", "short, long, long, long", true },
	}
	
	tests:iterate(examples, "check_get_length")
end

function tests:test_harmonize_length()
	local examples = {
		{ "ᾰ̓́λοξ", "ἄλοκος", "ᾰ̓́λοξ, ᾰ̓́λοκος" },
		{ "ἄλοκος", "ᾰ̓́λοξ", "ᾰ̓́λοκος, ᾰ̓́λοξ" },
		{ "ἄλοξ", "ἄλοκος", "ᾰ̓́λοξ, ᾰ̓́λοκος" },
		{ "Αἰθίοψ", "Αἰθίοπος", "Αἰθῐ́οψ, Αἰθῐ́οπος" },
		"transfer length only if both vowels have the same breathing mark",
		{ "ἄξιος", "ᾱ", "ἄξιος, ᾱ" },
	}
	
	tests:iterate(examples, "check_harmonize_length")
end

function tests:test_strip_accent()
	local examples = {
		{ "ᾰ̓́νθρωπος", "ανθρωπος" },
		{ "Πηληῐ̈ᾰ́δης", "Πηληιαδης" },
		-- { },
	}
	
	tests:iterate(examples, "check_strip_accent")
end

function tests:test_strip_tone()
	local examples = {
		{ "Πηληῐ̈ᾰ́δης", "Πηληῐ̈ᾰδης" },
		{ "Ᾱ̔́ͅδης", "Ᾱ̔ͅδης" }, -- pleonastic
		{ "μολὼν λαβέ", "μολων λαβε" },
		"circumflex &rarr; macron",
		{ "πᾶς", "πᾱς" },
		"circumflexes on diphthongs should not<br>be replaced with macrons",
		{ "οἷαι", "οἱαι" }, -- οῑαι if tokenization yields ο-ῑαι
		{ "γᾰλεοῦ", "γᾰλεου" }, -- γᾰλεοῡ if tokenization yields γᾰλεο-ῦ
	}
	
	tests:iterate(examples, "check_strip_tone")
end

function tests:test_get_weight()
	local examples = {
		{ "ὀρθ", "heavy", 1 },
		{ "μικρ", "heavy", 1 },
		{ "ἰδι", nil, 1 },
		{ "ῐ̓δῐ", "light", 1 },
		{ "φῐλ", "light", 1 },
	}
	
	tests:iterate(examples, "check_get_weight")
end

function tests:test_add_accent()
	local examples = {
		{ "κρεως", 1, "κρέως", nil, true},
		{ "Τρως", 1, "Τρώς", nil, true },
		{ "πολεως", 1, "πόλεως", nil, true },
		{ "πολεων", 1, "πόλεων", nil, true },
		{ "Πειριθοι", 2, "Πειρίθοι", nil, true },
		{ "Ᾰ̓θηναιοιν", -2, "Ᾰ̓θηναίοιν", nil, true },
		{ "Ᾰ̓θηναιοις", -2, "Ᾰ̓θηναίοις", nil, true },
		{ "βᾰρειαι", -2, "βᾰρεῖαι", nil, true },
		{ "ᾰ̓ληθειαι", -3, "ᾰ̓λήθειαι", nil, true },
		{ "Ᾰ̓θηναιοι", 3, "Ᾰ̓θηναῖοι", nil, true },
		{ "βᾰρειαι", 2, "βᾰρεῖαι", nil, true },
		{ "ᾰ̓ληθειαι", 2, "ᾰ̓λήθειαι", nil, true },
		{ "αἱμᾰ", 1, "αἷμᾰ", nil, true },
		{ "λογος", -2, "λόγος" },
		{ "προτερᾱ", -3, "προτέρᾱ" },
		{ "Αἰθιοπων", 2, "Αἰθιόπων"}, -- position 2 because the nominative is Αἰθίοψ
		{ "χωρῶν", 1, "χωρῶν"}, -- don't modify existing accent
		{ "δημος", 1, "δῆμος" },
		{ "τοιουτος", 2, "τοιοῦτος" },
		{ "χωρᾱ", 1, "χώρᾱ" },
		{ "μοιρᾰ", 1, "μοῖρᾰ" },
		{ "προτερᾱ", 1, "προτέρᾱ" },
		{ "ἐγενετο", 1, "ἐγένετο" },
		{ "φως", 1, "φῶς", true },
		{ "μοιρα", 1, "μοίρα" },
		{ "μοιρα", 1, "μοῖρα", true },
		{ "ἐγενετο", 1, "ἐγένετο", true },
		{ "λογος", 1, "λόγος" },
		{ "λογος", 1, "λόγος", true },
	}
	
	tests:iterate(examples, "check_add_accent")
end

function tests:test_detect_accent()
	local examples = {
		{ "ἐγένετο",	"2, acute" },
		{ "ἐγένετο",	"3, acute", true },
		{ "τοιοῦτος",	"2, circumflex" },
		{ "τοιοῦτος",	"2, circumflex", true },
		{ "φῶς",		"1, circumflex" },
		{ "φῶς",		"1, circumflex", true },
	}
	
	tests:iterate(examples, "check_detect_accent")
end

function tests:test_get_accent_term()
	local examples = {
		{ "πολὺς", "barytone" },
		{ "πολύς", "oxytone" },
		{ "λέγω", "paroxytone" },
		{ "γίγνομαι", "proparoxytone" },
		{ "φῶς", "perispomenon" },
		{ "οἷος", "properispomenon" },
	}
	
	tests:iterate(examples, "check_get_accent_term")
end

return tests