Module:Wikt-lang explained

require('strict')local m_data = mw.loadData("Module:Wikt-lang/data")local langData = m_data.languages or m_data

local p =

local function ifNotEmpty(value) if value

"" then return nil else return value endend

local function makeEntryName(word, languageCode) local data = langData[languageCode] local ugsub = mw.ustring.gsub word = tostring(word) if word

nil then error("The function makeEntryName requires a string argument") elseif word

"" then return "" else -- Remove bold and italics, so that words that contain bolding or emphasis can be linked without piping. word = word:gsub("\'\'\'", "") word = word:gsub("\'\'", "") if data

nil then return word else local replacements = data and data["replacements"] if replacements

nil then return word else -- Decompose so that the diacritics of characters such -- as รก can be removed in one go. -- No need to compose at the end, because the MediaWiki software -- will handle that. if replacements.decompose then word = mw.ustring.toNFD(word) for i, from in ipairs(replacements.from) do word = ugsub(word, from, replacements.to and replacements.to[i] or "") end else for regex, replacement in pairs(replacements) do word = ugsub(word, regex, replacement) end end return word end end endend

local function fixScriptCode(firstLetter, threeLetters) return string.upper(firstLetter) .. string.lower(threeLetters)end

local function getCodes(codes, text) local languageCode, scriptCode, invalidCode local errorText if codes

nil or codes

"" then errorText = 'no language or script code provided' elseif codes:find("^%a%a%a?$") or codes:find("^%a%a%a?%-%a%a%a%a$") then -- A three- or two-letter lowercase sequence at beginning of first parameter languageCode = codes:find("^%a%a%a?") and (codes:match("^(%l%l%l?)") or codes:match("^(%a%a%a?)") :gsub("(%a%a%a?)", string.lower, 1) ) -- One uppercase and three lowercase letters at the end of the first parameter scriptCode = codes:find("%a%a%a%a$") and (codes:match("(%u%l%l%l)$") or gsub(codes:match("(%a%a%a%a)$"), "(%a)(%a%a%a)", fixScriptCode, 1 ) ) elseif codes:find("^%a%a%a?%-%a%a%a?$") or codes:find("^%a%a%a%-%a%a%a%-%a%a%a$") then languageCode = codes -- Private-use subtag: x followed by one or more sequences of 1-8 lowercase -- letters separated by hyphens. This only allows for one sequence, as it is -- needed for proto-languages such as ine-x-proto (Proto-Indo-European). elseif codes:find("^%a%a%a?%-x%-%a%a?%a?%a?%a?%a?%a?%a?$") then languageCode, scriptCode = codes:match("^(%a%a%a%-x%-%a%a?%a?%a?%a?%a?%a?%a?)%-?(.*)$") if not languageCode then errorText = ''..codes..' is not a valid language or script code.' elseif scriptCode ~= "" and not scriptCode:find("%a%a%a%a") then errorText = ''..scriptCode..' is not a valid script code.' else scriptCode = scriptCode:gsub("(%a)(%a%a%a)", fixScriptCode, 1 ) end elseif codes:find("^%a%a%a?") then languageCode, invalidCode = codes:match("^(%a%a%a?)%-?(.*)") languageCode = string.lower(languageCode) errorText = ''..invalidCode..' is not a valid script code.' elseif codes:find("%-?%a%a%a%a$") then invalidCode, scriptCode = codes:match("(.*)%-?(%a%a%a%a)$") scriptCode = gsub(scriptCode, "(%a)(%a%a%a)", fixScriptCode ) errorText = ''..invalidCode..' is not a valid language code.' else errorText = ''..codes..' is not a valid language or script code.' end if not scriptCode or scriptCode

"" then scriptCode = require("Module:Unicode data").is_Latin(text) and "Latn" or "unknown" end if errorText then errorText = '

[' .. errorText .. ']' else errorText = "" end languageCode = m_data.redirects[languageCode] or languageCode return languageCode, scriptCode, errorTextend

local function tag(text, languageCode, script, italics) local data = langData[languageCode] -- Use Wikipedia code if it has been given: for instance, -- Proto-Indo-European has the Wiktionary code "ine-pro" but the Wikipedia -- code "ine-x-proto". languageCode = data and data.Wikipedia_code or languageCode local italicize = script

"Latn" and italics if not text then text = "[text?]" end local textDirectionMarkers = if data and data["direction"]

"rtl" then textDirectionMarkers = end local out = if italicize then table.insert(out, "" .. text .. "") else table.insert(out, "

" .. text .. "") end table.insert(out, textDirectionMarkers[3]) return table.concat(out)end

local function linkToWiktionary(entry, linkText, languageCode) local data = langData[languageCode] local name if languageCode then if data and data.name then name = data.name else -- On other languages' wikis, use mw.getContentLanguage:getCode, -- or replace 'en' with that wiki's language code. name = mw.language.fetchLanguageName(languageCode, 'en') if name

"" then error("Name for the language code " .. ("%q"):format(languageCode or nil) .. " could not be retrieved with mw.language.fetchLanguageName, " .. "so it should be added to ") end end if entry:sub(1, 1)

"*" then if name ~= "" then entry = "Reconstruction:" .. name .. "/" .. entry:sub(2) else error("Language name is empty") end elseif data and data.type

"reconstructed" then mw.log("Reconstructed language without asterisk:", languageCode, name, entry) local frame = mw.getCurrentFrame -- Track reconstructed entries with no asterisk by transcluding -- a nonexistent template. This technique is used in Wiktionary: -- see . -- pcall(frame.expandTemplate, frame, ) if name ~= "" then entry = "Reconstruction:" .. name .. "/" .. entry else error("Language name is empty") end elseif data and data.type

"appendix" then if name ~= "" then entry = "Appendix:" .. name .. "/" .. entry else error("Language name is empty") end end if entry and linkText then return "" .. linkText .. "" else error("linkToWiktionary needs a Wiktionary entry or link text, or both") end else return "" .. linkText .. "" endend

function p.wiktlang(frame) local parent = frame:getParent local args = parent.args[1] and parent.args or frame.args local codes = args[1] and mw.text.trim(args[1]) local word1 = ifNotEmpty(args[2]) local word2 = ifNotEmpty(args[3]) if not args[2] or

args[2] then return '

[text?] Parameter 2 is required'; end local languageCode, scriptCode, errorText = getCodes(codes, word2 or word1) local italics = args.italics or args.i or args.italic italics = not (italics

"n" or italics

"-" or italics

"no") local entry, linkText if word2 and word1 then entry = makeEntryName(word1, languageCode) linkText = word2 elseif word1 then entry = makeEntryName(word1, languageCode) linkText = word1 end local out if languageCode and entry and linkText then out = tag(linkToWiktionary(entry, linkText, languageCode), languageCode, scriptCode, italics) elseif entry and linkText then out = linkToWiktionary(entry, linkText) else out = '

[text?]' end if out and errorText then return out .. errorText else return errorText or error("The function wiktlang generated nothing") endend

return p