Module:de-IPA/testcases
Appearance
- The following documentation is located at Module:de-IPA/testcases/documentation. [edit] Categories were auto-generated by Module:module categorization. [edit]
- Useful links: root page • root page’s subpages • links • transclusions • tested module • sandbox
80 of 88 tests failed. (refresh)
Text | Expected | Actual | Differs at | |
---|---|---|---|---|
Vater | ˈfaːtɐ | fɐtər | 1 | |
Anna | ˈana | ɐnɐ | 1 | |
Saal | zaːl | zaːl | ||
Qual | kʋaːl | kʋɐl | 3 | |
lokal, orig=rom | loˈkaːl | lɔkɐl | 2 | |
Sarg | zaɐ̯k | zɐrk | 2 | |
hart | haɐ̯t | hɐrt | 2 | |
Waise | ˈʋaɪ̯zə | ʋaɪ̯zə | 1 | |
Schlächter | ˈʃlɛçtɐ | ʃlɛçtər | 1 | |
gäbe | ˈgɛːbə | ɡɛbə | 1 | |
Käse | ˈkɛːzə | kɛzə | 1 | |
Auswahl | ˈaʊ̯sʋaːl | aʊ̯sʋaːl | 1 | |
Zahlen | ˈtsaːlən | t͡saːlən | 1 | |
wählen | ˈʋɛːlən | ʋɛːlən | 1 | |
brauchen | ˈbraʊ̯xən | braʊ̯χən | 1 | |
gleichen | ˈglaɪ̯çən | ɡlaɪ̯çən | 1 | |
Archen | ˈaɐ̯çən | ɐrçən | 1 | |
Aachen | ˈaːχən | aːχən | 1 | |
solch | zɔlç | zɔlç | ||
Wacht | ʋaχt | ʋɐχt | 2 | |
doch | dɔχ | dɔχ | ||
Stadt | ʃtat | ʃtɐt | 3 | |
Dschungel | ˈdʒʊŋəl | t͡ʃʊŋəl | 1 | |
lesen | ˈleːzən | ləzən | 1 | |
lecker | ˈlɛkɐ | ləkər | 1 | |
Erde (respelled Ērde) | ˈeːɐ̯də | eːrdə | 1 | |
werden | ˈʋɛɐ̯dən | ʋərdən | 1 | |
abendlich | ˈabəntlɪç | ɐbəndlɪç | 1 | |
Reichstag (respelled Reichs/tag) | ˈraɪ̯çstaːk | raɪ̯kstɐk | 1 | |
Eiche | ˈaɪ̯çə | aɪ̯çə | 1 | |
oder | ˈoːdɐ | ɔdər | 1 | |
Hund | hʊnt | hʊnt | ||
sehen | zeːn | zeːhən | 4 | |
nah | naː | naː | ||
Nische (respelled Nīsche), orig=rom | ˈniːʃə | niːʃə | 1 | |
mische | ˈmɪʃə | mɪʃə | 1 | |
spielen | ˈʃpiːlən | ʃpiːlən | 1 | |
Tier | tiːɐ̯ | tiːr | 4 | |
Österreich (respelled Ȫster/reich) | ˈøːstɐraɪ̯ç | œːʃtərraɪ̯ç | 1 | |
köstlich | ˈkœstlɪç | kœʃtlɪç | 1 | |
öffnen | ˈœfnən | œffnən | 1 | |
höre | ˈhøːrə | hœrə | 1 | |
hört | hœɐ̯t | hœrt | 3 | |
Plörre | ˈplœrə | plœrrə | 1 | |
Quatsch | kʋatʃ | kʋɐt͡ʃ | 3 | |
aßen | ˈaːsən | ɐən | 1 | |
Haus | haʊ̯s | haʊ̯s | ||
Hause | ˈhaʊ̯zə | haʊ̯zə | 1 | |
lasen | ˈlaːzən | lɐzən | 1 | |
massig | ˈmasɪç | mɐszɪk | 1 | |
Tisch | tɪʃ | tɪʃ | ||
scheußlich | ˈʃɔʏ̯slɪç | ʃɔʏ̯lɪç | 1 | |
Asche | ˈaʃə | ɐʃə | 1 | |
Quatsch | kʋatʃ | kʋɐt͡ʃ | 3 | |
Buch | buːx | bʊχ | 2 | |
Kusses | ˈkʊsəs | kʊszəs | 1 | |
Furcht | fʊɐ̯çt | fʊrçt | 3 | |
Uhr | uːɐ̯ | uːr | 3 | |
Bücher | ˈbyːçɐ | bʏçər | 1 | |
Brücke | ˈbrʏkə | brʏkə | 1 | |
Tür | tyːɐ̯ | tʏr | 2 | |
Vogel | ˈfoːgəl | fɔɡəl | 1 | |
Vase, orig=rom | ˈʋaːzə | fɐzə | 1 | |
administrativ, orig=rom | ˌatmɪnɪstraˈtif | ɐtmɪnɪʃtrɐtɪf | 1 | |
selektiv, orig=rom | zeˌlɛkˈtif | zələktɪf | 2 | |
Möwe | ˈmøːʋə | mœʋə | 1 | |
was | ʋas | ʋɐs | 2 | |
geglichen | gəˈglɪçən | ɡəɡlɪçən | 1 | |
angeglichen | ˈangəˌglɪçən | ɐŋəɡlɪçən | 1 | |
aufgeben | ˈaʊ̯fˌɡeːbən | aʊ̯fɡəbən | 1 | |
aufgegeben | ˈaʊ̯fɡəˌɡeːbən | aʊ̯fɡəɡəbən | 1 | |
Mächtigkeit | ˈmɛçtɪçˌkaɪ̯t | mɛçtɪkaɪ̯t | 1 | |
eventuell (respelled evéntuèll), orig=rom | eˈʋɛntuˌɛll | əfˈəntˌʏll | 1 | |
Enklave, orig=rom | ɛnˈklaːʋə | əŋklɐfə | 1 | |
Phonem, orig=rom | foˈneːm | fɔnəm | 2 | |
Chemie, orig=rom | çeˈmiː | çəmiː | 2 | |
Information, orig=rom | ˌɪnfoɐ̯maˈtsi̯oːn | ɪnfɔrmɐtɪɔn | 1 | |
Platin (respelled Plátin), orig=rom | ˈplaːtin | plˈaːtɪn | 1 | |
Qualität, orig=rom | ˌkʋaliˈtɛːt | kʋɐlɪtɛt | 1 | |
Rasur, orig=rom | raˈzuːɐ̯ | rɐzʊr | 2 | |
rasieren, orig=rom | raˈziːrən | rɐziːrən | 2 | |
programmieren, orig=rom | ˌprograˈmiːrən | prɔɡrɐmmiːrən | 1 | |
Buchstabe (respelled Buch/stabe) | ˈbuːxʃtaːbə | bʊχʃtɐbə | 1 | |
Urheberrecht (respelled Ur/heber/rècht) | ˈuːɐ̯heːbɐˌrɛçt | ʊrhəbərrˌəçt | 1 | |
Standartenführer (respelled Standárten/führer) | ʃtanˈdartənˌfyːrɐ | ʃtɐndˈɐrtənfyːrər | 3 | |
Aufenthaltsgenehmigung (respelled Aufenthalts/genehmigung) | ˈaʊ̯fɛnthaltsɡəˌneːmiɡʊŋ | aʊ̯fənthɐltsɡəneːmɪɡʊŋk | 1 | |
doof | doːf | doːf | ||
doofes (respelled doowes) | ˈdoːʋəs | doːʋəs | 1 |
local tests = require('Module:UnitTests')
local m_de_IPA = require('Module:de-IPA')
local m_links = require('Module:links')
local lang = require('Module:languages').getByCode('de')
-- Wrap a transcription in a <span class="IPA"> element.
-- Passed as the `display` option to self:equals in tests:check_pron.
-- @param IPA transcription text to wrap
-- @return the wrapped markup string
local function tag_IPA(IPA)
	local opening, closing = '<span class="IPA">', '</span>'
	return opening .. IPA .. closing
end
-- Run one pronunciation test case.
-- @param De          German headword; rendered as a link in the test label
-- @param IPA         expected transcription
-- @param respelling  optional respelling; when given it is converted instead
--                    of De and is shown in the label
-- @param orig        optional origin flag (e.g. "rom"); forwarded to toIPA
--                    and shown in the label
function tests:check_pron(De, IPA, respelling, orig)
	-- Build the label shown in the "Text" column of the results.
	local label = m_links.full_link({term = De, lang = lang}, nil, true)
	if respelling then
		label = label .. " (respelled " .. respelling .. ")"
	end
	if orig then
		label = label .. ", orig=" .. orig
	end

	-- A nil/false result from the converter is reported as the text "NULL".
	local actual = m_de_IPA.toIPA(respelling or De, orig) or "NULL"

	self:equals(label, actual, IPA, { nowiki=true, display = tag_IPA })
end
-- Entries in the examples table of tests:test_pron usually look like
--   { "GERMAN", "PRONUNCIATION" }
--
-- but can also be
--   { "GERMAN", "PRONUNCIATION", "RESPELLED-GERMAN" }
--
-- e.g.
--   { "Erde", "ˈeːɐ̯də", "Ērde" }
--   { "Reichstag", "ˈraɪ̯çstaːk", "Reichs/tag" }
--
-- Each entry lists, in order, the arguments of
--   tests:check_pron(De, IPA, respelling, orig)
--
-- A fourth element can be specified to indicate Romance origin, which
-- causes certain changes like ultimate or penultimate stress and
-- interpreting ⟨v⟩ as /v/ (transcribed ʋ in the examples) instead of /f/:
--   { "GERMAN", "PRONUNCIATION", nil, "rom" }
--   { "GERMAN", "PRONUNCIATION", "RESPELLED-GERMAN", "rom" }
--
-- e.g.
--   { "Phonem", "foˈneːm", nil, "rom" }
--   { "Enklave", "ɛnˈklaːʋə", nil, "rom" }
--
-- Note: Broad transcription transcribes ⟨r⟩ as /r/, although /ʁ/ is the most common actual pronunciation.
-- Table-driven pronunciation tests.
--
-- Each row is { German, expected IPA [, respelling [, origin]] } and is handed
-- to tests:check_pron through self:iterate (presumably unpacked into its
-- arguments -- confirm against Module:UnitTests).
--
-- Expected strings spell the voiced velar plosive with IPA "ɡ" (U+0261),
-- never ASCII "g": the module emits U+0261, so an ASCII "g" in an expected
-- value could never match.
function tests:test_pron()
	local examples = {
		-- A:
		{ "Vater", "ˈfaːtɐ" },
		{ "Anna", "ˈana" },
		{ "Saal", "zaːl" },
		{ "Qual", "kʋaːl" },
		{ "lokal", "loˈkaːl", nil, "rom" },
		{ "Sarg", "zaɐ̯k" },
		{ "hart", "haɐ̯t" },
		{ "Waise", "ˈʋaɪ̯zə" },
		-- Ä
		{ "Schlächter", "ˈʃlɛçtɐ" },
		{ "gäbe", "ˈɡɛːbə" },
		{ "Käse", "ˈkɛːzə" }, -- Possibly must be /eː/. Native status of ɛː is debated. I think most professional readers speak as written, but my understanding is that the spelling does not reflect any actual spoken language consistently. /ɛː/ is so absent here that my brain parses [ɛː] as [eː]
		-- AH
		{ "Auswahl", "ˈaʊ̯sʋaːl" },
		{ "Zahlen", "ˈtsaːlən" },
		-- ÄH
		{ "wählen", "ˈʋɛːlən" }, -- Could be /veːlən/, see Käse
		-- AU:
		{ "brauchen", "ˈbraʊ̯xən" },
		--CH
		{ "gleichen", "ˈɡlaɪ̯çən" },
		{ "Archen", "ˈaɐ̯çən" },
		{ "Aachen", "ˈaːχən" },
		{ "solch", "zɔlç" },
		{ "Wacht", "ʋaχt" },
		{ "doch", "dɔχ" },
		-- D
		{ "Stadt", "ʃtat" },
		-- DSCH
		{ "Dschungel", "ˈdʒʊŋəl" },
		-- E:
		{ "lesen", "ˈleːzən" },
		{ "lecker", "ˈlɛkɐ" },
		{ "Erde", "ˈeːɐ̯də", "Ērde" },
		{ "werden", "ˈʋɛɐ̯dən" },
		{ "abendlich", "ˈabəntlɪç" },
		-- EI:
		{ "Reichstag", "ˈraɪ̯çstaːk", "Reichs/tag" },
		{ "Eiche", "ˈaɪ̯çə" },
		-- ER:
		{ "oder", "ˈoːdɐ" },
		-- H
		{ "Hund", "hʊnt" },
		{ "sehen", "zeːn" }, -- You often see /zeːən/, which is hypercorrect spelling-pron., might be standard anyway.
		{ "nah", "naː" },
		-- I
		{ "Nische", "ˈniːʃə", "Nīsche", "rom" }, -- Borrowing
		{ "mische", "ˈmɪʃə" }, -- native
		-- IE:
		{ "spielen", "ˈʃpiːlən" },
		{ "Tier", "tiːɐ̯" }, -- This pronunciation is pretty wrong and would be understood as 'Tia', but I think it's the expected transcription. The actual level of the r-vowel raises with the preceding vowel.
		-- Ö:
		{ "Österreich", "ˈøːstɐraɪ̯ç", "Ȫster/reich" },
		{ "köstlich", "ˈkœstlɪç" },
		{ "öffnen", "ˈœfnən" },
		{ "höre", "ˈhøːrə" },
		{ "hört", "hœɐ̯t" },
		{ "Plörre", "ˈplœrə" },
		-- QU:
		{ "Quatsch", "kʋatʃ" }, -- Must be [kfatʃ] if /v/ is used instead of /ʋ/
		-- S/ß:
		{ "aßen", "ˈaːsən" },
		{ "Haus", "haʊ̯s" },
		{ "Hause", "ˈhaʊ̯zə" },
		{ "lasen", "ˈlaːzən" },
		{ "massig", "ˈmasɪç" },
		-- SCH:
		{ "Tisch", "tɪʃ" },
		{ "scheußlich", "ˈʃɔʏ̯slɪç" },
		{ "Asche", "ˈaʃə" },
		-- TSCH:
		{ "Quatsch", "kʋatʃ" },
		-- U
		{ "Buch", "buːx" },
		{ "Kusses", "ˈkʊsəs" },
		{ "Furcht", "fʊɐ̯çt" },
		-- UH:
		{ "Uhr", "uːɐ̯" },
		-- Ü
		{ "Bücher", "ˈbyːçɐ" },
		{ "Brücke", "ˈbrʏkə" },
		{ "Tür", "tyːɐ̯" },
		-- ÜH
		-- V
		{ "Vogel", "ˈfoːɡəl" },
		{ "Vase", "ˈʋaːzə", nil, "rom" }, -- Borrowing, should this have [v]?
		{ "administrativ", "ˌatmɪnɪstraˈtif", nil, "rom" }, -- Might have a long /i/; I can't tell since northern speech has no length distinction
		{ "selektiv", "zeˌlɛkˈtif", nil, "rom" },
		-- W
		{ "Möwe", "ˈmøːʋə" },
		{ "was", "ʋas" },
		-- Affixes (Stress)
		{ "geglichen", "ɡəˈɡlɪçən" },
		{ "angeglichen", "ˈanɡəˌɡlɪçən" },
		{ "aufgeben", "ˈaʊ̯fˌɡeːbən" }, -- should be smart enough not to interpret -ge- here as a prefix (because followed by -en)
		{ "aufgegeben", "ˈaʊ̯fɡəˌɡeːbən" },
		{ "Mächtigkeit", "ˈmɛçtɪçˌkaɪ̯t" },
		-- Borrowed words with unexpected stress:
		{ "eventuell", "eˈʋɛntuˌɛll", "evéntuèll", "rom" }, -- Borrowing, should this have [v]?
		{ "Enklave", "ɛnˈklaːʋə", nil, "rom" }, -- Borrowing, should this have [v]?
		{ "Phonem", "foˈneːm", nil, "rom" },
		{ "Chemie", "çeˈmiː", nil, "rom" },
		{ "Information", "ˌɪnfoɐ̯maˈtsi̯oːn", nil, "rom" }, -- Notice how this Roman word uses /ɪ/
		{ "Platin", "ˈplaːtin", "Plátin", "rom" }, -- And this one doesn't.
		{ "Qualität", "ˌkʋaliˈtɛːt", nil, "rom" }, -- See Käse
		{ "Rasur", "raˈzuːɐ̯", nil, "rom" },
		{ "rasieren", "raˈziːrən", nil, "rom" },
		{ "programmieren", "ˌproɡraˈmiːrən", nil, "rom" },
		-- Slash separating compounds:
		{ "Buchstabe", "ˈbuːxʃtaːbə", "Buch/stabe" },
		{ "Urheberrecht", "ˈuːɐ̯heːbɐˌrɛçt", "Ur/heber/rècht" },
		{ "Standartenführer", "ʃtanˈdartənˌfyːrɐ", "Standárten/führer" },
		{ "Aufenthaltsgenehmigung", "ˈaʊ̯fɛnthaltsɡəˌneːmiɡʊŋ", "Aufenthalts/genehmigung" },
		-- Irregular borrowings:
		{ "doof", "doːf" },
		{ "doofes", "ˈdoːʋəs", "doowes" }, -- Borrowing, should this have [v]?
	}
	self:iterate(examples, "check_pron")
end
-- Module result: the test-suite table obtained from Module:UnitTests, now
-- carrying the check_pron and test_pron methods defined in this file.
return tests
-- For Vim, so we get 4-space tabs
-- vim: set ts=4 sw=4 noet: