Module:sk-IPA

Hello, you have come here looking for the meaning of the word Module:sk-IPA. In DICTIOUS you will not only get to know all the dictionary meanings for the word Module:sk-IPA, but we will also tell you about its etymology, its characteristics and you will know how to say Module:sk-IPA in singular and plural. Everything you need to know about the word Module:sk-IPA you have here. The definition of the word Module:sk-IPA will help you to be more precise and correct when speaking or writing your texts. Knowing the definition ofModule:sk-IPA, as well as those of other words, enriches your vocabulary and provides you with more and better linguistic resources.

This module generates IPA transcriptions of Slovak terms.

Testcases

9 of 19 tests failed. (refresh)

TextExpectedActual
test_all:
Passedmäsoˈmɛɐ̯sɔˈmɛɐ̯sɔ
Passedďakovaťˈɟakɔvacˈɟakɔvac
Passedchliebxʎi̯epxʎi̯ep
Passedštvrťʃtvr̩cʃtvr̩c
Passedvĺčaˈvl̩ːt͡ʃaˈvl̩ːt͡ʃa
Passedvŕbaˈvr̩ːbaˈvr̩ːba
Passedkôňku̯oɲku̯oɲ
Failedčlnt͡ʃl̩nt͡ʃln
Failedšmrncʃmr̩nt͡sʃmrn̩t͡s
Faileddetstvoˈɟet͡stvɔˈɟetstvɔ
Passedletoˈʎetɔˈʎetɔ
Passedneboˈɲebɔˈɲebɔ
Passeddetiˈɟeciˈɟeci
Faileddabingˈdabiŋkˈdabink
Failedhlohɦlɔxxlɔx
Failedvodopádvɔdɔpaːtˈvɔtɔpaːt
FailedformalDehydˈfɔrmaldeɦitˈfɔrmalteɦit
Failedskibobˈskibɔpˈskipɔp
Failedzárezˈzaːresˈsaːres

local export = {}

local m_params = require("Module:parameters")
local m_IPA = require("Module:IPA")
local m_syllables = require("Module:syllables")
local m_links = require("Module:links")
local m_script_utils = require("Module:script utilities")

local lang = require("Module:languages").getByCode("sk")
local sc = require("Module:scripts").getByCode("Latn")

local sub = mw.ustring.sub
local gsub = mw.ustring.gsub
local find = mw.ustring.find
local match = mw.ustring.match
local gmatch = mw.ustring.gmatch

local U = require("Module:string/char")
local long = "ː"
local nonsyllabic = U(0x32F)	-- inverted breve below
local syllabic = U(0x0329)
local tie = U(0x361)			-- combining double inverted breve
local primary_stress = "ˈ"
local secondary_stress = "ˌ"

local data = {
	 = "a" .. long,
	 = "ɛɐ" .. nonsyllabic,
	 = "t" .. tie .. "s",
	 = "t" .. tie .. "ʃ",
	 = "ɟ",
	 = "d" .. tie .. "z",
	 = "d" .. tie .. "ʒ",
	 = "e" .. long,
	 = "ɡ",
	 = "ɦ",
	 = "x",
	 = "i" .. long,
	 = "l" .. syllabic .. long,
	 = "ʎ",
	 = "ɲ",
	 = "ɔ",
	 = "o" .. long,
	 = "u" .. nonsyllabic .. "o",
	 = "œ",
	 = "kv",
	 = "r" .. syllabic .. long,
	 = "ʃ",
	 = "c",
	 = "u" .. long,
	 = "y",
	 = "ʋ",	-- most common IPA representation as in "kov"
	 = "ks",
	 = "i",
	 = "i" .. long,
	 = "ʒ",
	 = "i" .. nonsyllabic .. "a",
	 = "i" .. nonsyllabic .. "e",
	 = "i" .. nonsyllabic .. "u",
	 = primary_stress,
	 = secondary_stress,
	 = syllabic,	-- a respelling to force syllabic
}

-- Add data = "a", data = "b", etc.
for character in gmatch("abdefijklmnprstuvz ", ".") do
	data = character
end

--Define alveolars, front vowels, and palatalized consonants
local alveolars_ortho = { "t", "d", "n", "l"}
local front_vowels_ortho = { "e", "é", "i", "í", "ie", "ia"}

local palatalized_ortho = {
     = "ť",
     = "ď",
     = "ň",
     = "ľ",
}

-- ==]

--[[
This is used to replace multiple-character sounds
with numbers, which makes it easier to process them.	]]

local multiple_char = {
	"t" .. tie .. "s",	"t" .. tie .. "ʃ", "d" .. tie .. "z",	"d" .. tie .. "ʒ",
}

local singlechar = {}
for number, character in pairs(multiple_char) do
	singlechar = tostring(number)
end

local voiceless	= { "p", "t", "c", "k", "f", "s", "ʃ", "x", "1", "2", }
local voiced	= { "b", "d", "ɟ", "ɡ", "v", "z", "ʒ", "ɦ", "3", "4", }
local sonorants = { "m", "n", "ɲ", "r", "l", "ʎ", "j", }

local features = {}
local indices = {}
for i, consonant in pairs(voiceless) do
	if not features then
		features = {}
	end
	features = false
	indices = i
end

for i, consonant in pairs (voiced) do
	if not features then
		features = {}
	end
	features = true
	indices = i
end

local function palatalize_orthography(term)
    for _, alv in ipairs(alveolars_ortho) do
        for _, vow in ipairs(front_vowels_ortho) do
            local pattern = alv .. vow
            local replacement = palatalized_ortho .. vow
            term = gsub(term, pattern, replacement)
        end
    end
    return term
end

local function devoice_finally(IPA)
	local voiced_obstruent = ""
	
	local final_voiced_obstruent = match(IPA, voiced_obstruent .. "+$") or match(IPA, voiced_obstruent .. "+%s")
	
	if final_voiced_obstruent then
		local replacement = {}
		
		local length = mw.ustring.len(final_voiced_obstruent)
		
		for i = 1, length do
			local consonant = sub(final_voiced_obstruent, i, i)
			local index = indices
			local devoiced = voiceless
			
			table.insert(replacement, devoiced)
		end
		
		replacement = table.concat(replacement)
		-- This will cause problems if the same consonant cluster occurs elsewhere in the term.
		IPA = gsub(IPA, final_voiced_obstruent, replacement)
	end
	
	return IPA
end

local function syllabicize_sonorants(IPA)
	local sonorant = gsub("", "", "") -- all except ɲ and ʎ and j
	local obstruent = ""
	local consonant = "]", "") .. "]"
	
	-- between a consonant and an obstruent
	IPA = gsub(IPA, "(" .. consonant .. sonorant .. ")(" .. obstruent .. ")", "%1" .. syllabic .. "%2")
	-- at the beginning of a word before an obstruent
	IPA = gsub(IPA, "^(" .. sonorant .. ")(" .. obstruent .. ")", "%1" .. syllabic .. "%2")
	-- at the end of a word after an obstruent
	IPA = gsub(IPA, "(" .. obstruent .. sonorant .. ")$", "%1" .. syllabic)
	
	return IPA
end

local function add_stress(IPA)
	local syllable_count = m_syllables.getVowels(IPA, lang)
	
	if not syllable_count then
		-- words like “čln” or “v” contain no designated vowels, yet they are
		-- valid Slovak words
		-- error("Could not count syllables of " .. IPA)
		syllable_count = 1
	end
	
	if syllable_count > 1 and not find(IPA, " ") then
		IPA = primary_stress .. IPA
	end
	
	return IPA
end

local function apply_rules(IPA)
	-- Replace multiple-character units with numbers.
	for sound, character in pairs(singlechar) do
		IPA = gsub(IPA, sound, character)
	end
	
	IPA = devoice_finally(IPA)
	IPA = syllabicize_sonorants(IPA)
	IPA = add_stress(IPA)
	
	-- Change double to single consonants.
	local consonant = ""
	IPA = gsub(IPA, "(" .. consonant .. ")%1", "%1")
	
	-- Replace numbers with multiple-character units.
	for sound, character in pairs(singlechar) do
		IPA = gsub(IPA, character, sound)
	end
	
	return IPA
end

function export.toIPA(term)
	term = palatalize_orthography(term)
	local IPA = {}
	local transcription = mw.ustring.lower(term)
	
	local working_string = transcription
	
	while mw.ustring.len(working_string) > 0 do
		local IPA_letter
		
		local letter = sub(working_string, 1, 1)
		local twoletters = sub(working_string, 1, 2) or ""
		
		if data then
			IPA_letter = data
			working_string = sub(working_string, 3)
		else
			IPA_letter = data or error('The letter "' .. tostring(letter) .. '" is not a member of the Slovak alphabet.')
			working_string = sub(working_string, 2)
		end
		
		table.insert(IPA, IPA_letter)
	end
	
	IPA = table.concat(IPA)
	IPA = apply_rules(IPA)
	
	return IPA, transcription
end

function export.show(frame)
	local params = {
		 = {}
	}
	
	local title = mw.title.getCurrentTitle()
	
	local args = m_params.process(frame:getParent().args, params)
	local term = args or title.nsText == "Template" and "príklad" or title.text
	
	local IPA = export.toIPA(term)
	
	IPA = ""
	IPA = m_IPA.format_IPA_full { lang = lang, items = {{ pron = IPA }} }
	
	return IPA
end

function export.example(frame)
	local params = {
		 = { required = true },
		 = {}
	}
	
	local args = m_params.process(frame.args, params)
	local term = args or args
	local transcribable = args
	
	local IPA, transcribable = export.toIPA(transcribable)
	
	IPA = ""
	IPA = m_IPA.format_IPA_full { lang = lang, items = {{ pron = IPA }} }
	
	link = m_links.full_link( { term = term, lang = lang, sc = sc }, "term" )
	
	return link .. ( term ~= transcribable and ( " (" .. m_script_utils.tag_text(transcribable, lang, nil, "term") .. ") — " ) or " — " ) .. IPA
end

return export