-- Module:sandbox/hi-IPA/testcases:
-- Lua error: bad argument #1 to 'gsub' (string expected, got nil)
local export = {}
local lang = require("Module:languages").getByCode("hi")
local sc = require("Module:scripts").getByCode("Deva")
local m_IPA = require("Module:IPA")
local m_a = require("Module:accent qualifier")
local gsub = mw.ustring.gsub
local gmatch = mw.ustring.gmatch
local find = mw.ustring.find
-- Lookup table passed as the replacement argument to gsub in export.toIPA:
-- every single character of the processed transliteration is looked up here
-- and replaced by the IPA string stored under it.
--
-- NOTE(review): every entry below has lost its key (`= "ŋ"` instead of
-- `["…"] = "ŋ"`), which is not valid Lua. The keys look like they were
-- stripped when this text was extracted; restore them from the upstream
-- module before using this table.
local correspondences = {
= "ŋ", = "ɡ",
= "t͡ʃ", = "d͡ʒ",
= "ʈ", = "ɖ", = "ɳ",
= "t̪", = "d̪",
= "j", = "ɾ", = "ʋ", = "l̪",
= "ʃ", = "ʂ", = "ɦ",
= "ɽ", = "ʒ", = "ɭ", = "ɣ", = "q", = "x", = "n", = "r",
= "ə", = "ɑː", = "ɪ",
= "iː", = "oː", = "eː",
= "ʊ", = "uː", = "ɔ", = "æ",
= "ẽː", = "ʊ̃", = "õː", = "ə̃", = "ɑ̃ː", = "ɪ̃", = "ĩː",
= "oːm", = "(ɦ)", = "(ʔ)",
}
-- Style-specific substitution tables. export.toIPA passes one of them to gsub
-- as the replacement table, depending on its `style` argument.
--
-- NOTE(review): as in `correspondences`, every `= value` entry in the tables
-- below has lost its key and is not valid Lua as written; restore the keys
-- from the upstream module.

-- Used when style == "nonpersianized".
local perso_arabic = {
= "kh", = "g", = "k", = "z", = "j", = "ph", = "",
}
-- Used when style == "desanskritanize".
local urdu = {
= "ʃ", = "n",
-- NOTE(review): the four gsub calls below are evaluated while this table is
-- being constructed, i.e. when the module loads. They read `result`, which the
-- visible source only declares as a local inside export.toIPA, so at this
-- point it would be nil. That is consistent with the reported error
-- "bad argument #1 to 'gsub' (string expected, got nil)". They look like
-- post-processing steps that were meant to run inside export.toIPA for this
-- style — confirm the intent and move them there.
gsub(result, "(...)ɑ(ː)$", "%1ᵊ"),
gsub(result, "(...)ɑ(ː) ", "%1ᵊ "),
gsub(result, "(...)ɑ(ː)%.?%-", "%1ᵊ-"),
gsub(result, "%.?%-", "."),
}
-- Used when style == "dakhini".
local deccani = {
= "x",
}
-- Not referenced anywhere else in the visible source.
local lengthen = {
= "ā", = "ī", = "ū",
}
-- Pattern fragments shared by syllabify and export.toIPA.
--
-- NOTE(review): several of these look truncated — `vowel` matches only an
-- optional length mark, and `weak_h` / `aspirate` contain an empty `()`, which
-- in a Lua pattern is a position capture rather than a character match.
-- Presumably bracketed character classes were lost in extraction; confirm
-- against the upstream module.

-- Not referenced anywhere else in the visible source.
local vowels = "aāiīuūoŏĕʊɪɔɔ̃ɛeæãā̃ẽĩī̃õũū̃ː"
-- Used by syllabify to build its vowel-sequence patterns.
local vowel = "ː?"
-- Used by export.toIPA; the match is replaced with capture 1 followed by "ʱ".
local weak_h = "()h"
-- Used by export.toIPA as `aspirate .. "h"`; replaced with capture 1 followed by "ʰ".
local aspirate = "()"
-- Used by syllabify: three captures, the middle one is handed to find_consonants.
local syllabify_pattern = "(̃?)(+)(̃?)"
--- Split `text` into a list of pieces, walking it one code point at a time.
-- A code point is appended to the piece being built when the extended piece
-- matches "^$" or "^h$"; otherwise the piece built so far is stored and a new
-- piece starts with that code point. A trailing space is appended to `text`
-- so that the last real piece is flushed; the space itself is never stored.
--
-- NOTE(review): "^$" can never match a non-empty string, so the patterns look
-- like they lost a character class in extraction — confirm upstream.
--
-- @param text string to split
-- @return array of string pieces, in order
local function find_consonants(text)
	local pieces = {}
	local pending = ""
	for codepoint in mw.ustring.gcodepoint(text .. " ") do
		local char = mw.ustring.char(codepoint)
		local candidate = pending .. char
		if not (find(candidate, "^$") or find(candidate, "^h$")) then
			-- The new code point does not extend the current piece: flush it.
			pieces[#pieces + 1] = pending
			pending = char
		else
			pending = candidate
		end
	end
	return pieces
end
--- Insert "." syllable separators into a transliterated string.
-- @param text transliterated string
-- @return the string with "." inserted
local function syllabify(text)
	-- Each substitution is applied twice; presumably because one gsub pass
	-- cannot rewrite matches that overlap — confirm.
	for _ = 1, 2 do
		text = gsub(text, syllabify_pattern, function(a, b, c)
			-- `local` matters here: without it every call leaked/overwrote a
			-- global named b_set.
			local b_set = find_consonants(b)
			-- Put the separator after the first piece when there is more
			-- than one piece, otherwise before the only piece.
			table.insert(b_set, #b_set > 1 and 2 or 1, ".")
			return a .. table.concat(b_set) .. c
		end)
		-- NOTE(review): Lua patterns have no lookahead; "(?=" opens an
		-- ordinary capture that starts with the literal characters "?=", so
		-- this substitution only fires on text that actually contains "?=".
		-- The loop below performs the vowel-vowel split without lookahead.
		-- Kept as-is to preserve behavior; consider removing.
		text = gsub(text, "(" .. vowel .. ")(?=" .. vowel .. ")", "%1.")
	end
	for _ = 1, 2 do
		-- Separate two adjacent vowel matches with ".".
		text = gsub(text, "(" .. vowel .. ")(" .. vowel .. ")", "%1.%2")
	end
	return text
end
-- Characters whose IPA symbol is the same as the character itself: register
-- each one in `correspondences` as an identity mapping. Assigning to the
-- variable itself (rather than to an index) would replace the whole lookup
-- table with a one-character string.
local identical = "knlsfzθ"
for character in gmatch(identical, ".") do
	correspondences[character] = character
end
-- Transliterate `text` by delegating to the module-level language object
-- `lang`; whatever lang:transliterate returns is passed straight back to the
-- caller (export.toIPA treats a falsy result as a failure).
local function transliterate(text)
return lang:transliterate(text)
end
--- Produce a link for `term` via Module:links' full_link, using the
-- module-level language and script objects.
-- @param term the term to link
-- @return whatever full_link returns for that term
function export.link(term)
	local m_links = require("Module:links")
	local link_data = { term = term, lang = lang, sc = sc }
	return m_links.full_link(link_data)
end
-- Derive a narrower (phonetic) transcription from a phonemic IPA string by
-- applying the substitutions below in order; each step operates on the output
-- of the previous one, so the order matters. Returns the rewritten string.
--
-- NOTE(review): many patterns below contain an empty `()`. In a Lua pattern
-- that is a position capture, not a character match, so as written these
-- steps do not target any particular sound. Presumably bracketed character
-- classes were lost in extraction (three of the "syllable boundary" lines are
-- now identical) — restore them from the upstream module.
function export.narrow_IPA(ipa)
-- what /ɑ/ really is
ipa = gsub(ipa, 'ɑ', 'ä')
-- dentals
ipa = gsub(ipa, '()', '%1̪')
-- nasals induce nasalization
ipa = gsub(ipa, '()(ː?)()', '%1̃%2%3')
-- cc, jj
-- (the first of two identical affricates across an optional "." becomes an
-- unreleased stop)
ipa = gsub(ipa, 't͡ʃ(%.?)t͡ʃ', 't̚%1t͡ʃ')
ipa = gsub(ipa, 'd͡ʒ(%.?)d͡ʒ', 'd̚%1d͡ʒ')
-- syllable boundary consonants
ipa = gsub(ipa, '()%.()', '%1̚.%2')
ipa = gsub(ipa, '()%.()', '%1̚.%2')
ipa = gsub(ipa, '(̪?)%.()', '%1̚.%2')
ipa = gsub(ipa, '()%.()', '%1̚.%2')
-- aspiration rules
ipa = gsub(ipa, 'əɦ%.()', 'ɛɦ.%1')
ipa = gsub(ipa, 'ʊɦ%.()', 'ɔɦ.%1')
ipa = gsub(ipa, 'ə%.ɦə', 'ɛ.ɦɛ')
ipa = gsub(ipa, 'ʊ%.ɦə', 'ɔ.ɦɔ')
ipa = gsub(ipa, 'ə%.ɦʊ', 'ɔ.ɦɔ')
-- v/w
ipa = gsub(ipa, '(̪?%.?)ʋ', '%1w')
-- retroflex s rules
-- NOTE(review): as written the first rule rewrites every ʂ, which leaves the
-- word-final rule two lines below with nothing to match — likely another
-- stripped character class.
ipa = gsub(ipa, 'ʂ(%.?)', 'ʃ%1')
ipa = gsub(ipa, '()%.()', 'ɴ.%2')
ipa = gsub(ipa, 'ʂ$', 'ʃ')
-- ɪ before a syllable-initial j becomes i
ipa = gsub(ipa, "ɪ%.j", "i.j")
return ipa
end
--- Convert a term to a phonemic IPA string.
-- The term is transliterated with the module-level language object,
-- optionally passed through a style-specific substitution table, normalized,
-- syllabified, and finally mapped character by character through
-- `correspondences`, followed by a few clean-up substitutions.
-- @param text  the term to convert
-- @param style optional; "nonpersianized", "desanskritanize" or "dakhini"
--              selects an extra substitution table, any other value none
-- @return the IPA string (without enclosing slashes)
-- Raises an error when the term cannot be transliterated.
function export.toIPA(text, style)
	-- Transliterate a copy with '॰' replaced by '-'; `text` itself is left
	-- untouched so the error message can quote the term as given. The extra
	-- parentheses drop gsub's second return value (the match count).
	local translit = transliterate((gsub(text, '॰', '-')))
	if not translit then
		-- Quote the input term. The message previously concatenated an
		-- undefined global, which raised a concatenation error instead.
		error('The term "' .. text .. '" could not be transliterated.')
	end

	-- NOTE(review): the empty pattern in the three calls below looks like a
	-- stripped character class; with "" no key of the table can ever match.
	-- Restore the patterns from the upstream module.
	if style == "nonpersianized" then
		translit = gsub(translit, "", perso_arabic)
	end
	if style == "desanskritanize" then
		translit = gsub(translit, "", urdu)
	end
	if style == "dakhini" then
		translit = gsub(translit, "", deccani)
	end

	-- force final schwa
	translit = gsub(translit, "a~$", "ə")

	-- vowels
	translit = gsub(translit, "͠", "̃")
	translit = gsub(translit, 'a(̃?)i', 'ɛ%1ː')
	translit = gsub(translit, 'a(̃?)u', 'ɔ%1ː')

	-- strip a leading/trailing hyphen, normalize ŕ, drop commas
	translit = gsub(translit, "%-$", "")
	translit = gsub(translit, "^%-", "")
	translit = gsub(translit, "ŕ$", "r")
	translit = gsub(translit, "ŕ", "ri")
	translit = gsub(translit, ",", "")
	-- a space becomes "..", which is turned into "‿" further down
	translit = gsub(translit, " ", "..")

	translit = syllabify(translit)

	-- keep length marks and nasalization attached to the preceding vowel
	translit = gsub(translit, "%.ː", "ː.")
	translit = gsub(translit, "%.̃", "̃")

	-- gy
	translit = gsub(translit, 'jñ', 'gy')

	-- aspiration / breathy voice marks
	translit = gsub(translit, aspirate .. "h", '%1ʰ')
	translit = gsub(translit, weak_h, '%1ʱ')

	-- map every character through the correspondence table
	local result = gsub(translit, ".", correspondences)

	-- remove final schwa (Pandey, 2014)
	-- actually weaken
	result = gsub(result, "(...)ə$", "%1ᵊ")
	result = gsub(result, "(...)ə ", "%1ᵊ ")
	result = gsub(result, "(...)ə%.?%-", "%1ᵊ-")
	result = gsub(result, "%.?%-", ".")
	result = gsub(result, "%.%.", "‿")

	-- formatting
	result = gsub(result, "ː̃", "̃ː")
	result = gsub(result, "ː%.̃", "̃ː.")
	result = gsub(result, "%.$", "")

	-- ñ
	result = gsub(result, "ñ", "n")

	-- i and u lengthening
	result = gsub(result, "ʊ(̃?)(ʱ?)$", "u%1ː%2")
	result = gsub(result, "ɪ(̃?)(ʱ?)$", "i%1ː%2")

	-- ɛː before j and ɔː before ʋ become diphthongs; %1 re-inserts the
	-- optional "." that stood between the vowel and the glide
	result = gsub(result, "ɛː(%.?)j", "ə̯i%1j")
	result = gsub(result, "ɔː(%.?)ʋ", "ə̯u%1ʋ")

	return result
end
--- Template entry point: build the formatted pronunciation line for Hindi.
-- Reads the positional arguments of the parent frame; when none are given the
-- current page title is used as the only term. For each term the phonemic
-- transcription is listed in slashes, followed by the narrow transcription in
-- square brackets when it differs; the same pair is added for the
-- "nonpersianized" style when that differs from the "persianized" one.
-- @param frame the Scribunto frame object
-- @return the qualifier text, a space, and the formatted IPA items
function export.make(frame)
	local args = frame:getParent().args
	local pagetitle = mw.title.getCurrentTitle().text

	local terms, results = {}, {}

	-- `args` is always a table, so testing it directly made the page-title
	-- fallback unreachable; test for the first positional argument instead.
	if args[1] then
		for _, item in ipairs(args) do
			-- empty arguments are skipped
			if item ~= "" then
				terms[#terms + 1] = item
			end
		end
	else
		terms = { pagetitle }
	end

	-- Append /phonemic/ and, when it differs, [narrow] to the result list.
	local function add_pronunciations(phonemic)
		results[#results + 1] = { pron = "/" .. phonemic .. "/" }
		local narrow = export.narrow_IPA(phonemic)
		if narrow ~= phonemic then
			-- The narrow form was previously computed but an empty string
			-- was inserted; square brackets are assumed as the notation for
			-- the narrow transcription — TODO confirm against upstream.
			results[#results + 1] = { pron = "[" .. narrow .. "]" }
		end
	end

	for _, Hindi in ipairs(terms) do
		local persianized = export.toIPA(Hindi, "persianized")
		local nonpersianized = export.toIPA(Hindi, "nonpersianized")

		add_pronunciations(persianized)
		if persianized ~= nonpersianized then
			add_pronunciations(nonpersianized)
		end
	end

	return m_a.format_qualifiers(lang, {'Delhi'}) .. ' ' .. m_IPA.format_IPA_full { lang = lang, items = results }
end
--- Template entry point: build the formatted pronunciation line for Urdu.
-- Every non-empty positional argument of the parent frame is converted with
-- export.toIPA in the "desanskritanize" style and listed in slashes.
-- @param frame the Scribunto frame object
-- @return the qualifier text, a space, and the formatted IPA items
-- Raises "No transliterations given." when there is no first positional
-- argument.
function export.make_ur(frame)
	local args = frame:getParent().args
	-- Urdu language object; deliberately shadows the module-level Hindi one.
	local lang = require("Module:languages").getByCode("ur")

	-- `args` is always a table, so testing it directly made this error
	-- unreachable; test for the first positional argument instead.
	if not args[1] then
		error("No transliterations given.")
	end

	local results = {}
	for _, Urdu in ipairs(args) do
		-- empty arguments are skipped
		if Urdu ~= "" then
			local desanskritanize = export.toIPA(Urdu, "desanskritanize")
			results[#results + 1] = { pron = "/" .. desanskritanize .. "/" }
		end
	end

	-- NOTE(review): export.make calls m_a.format_qualifiers here while this
	-- function calls m_a.show — confirm both exist in Module:accent qualifier
	-- and that the difference is intended.
	return m_a.show(lang, {'urd'}) .. ' ' .. m_IPA.format_IPA_full { lang = lang, items = results }
end
return export