Article snapshot taken from Wikipedia under the Creative Commons Attribution-ShareAlike license.
Give it a read and then ask your questions in the chat.
We can research this topic together.
This module is rated as beta, and is ready for widespread use. It is still new and should be used with some caution to ensure the results are as expected.
This module is used by {{Wikt-lang}}. It is inspired by the templates {{m}} and {{l}} and their associated modules on Wiktionary. It has a Wiktionary link function that links to the correct section of the Wiktionary entry, and applies correct language formatting and italics. The language-tagging function does most of what {{Lang}} does, except that italics can't be customized and categories aren't added.
The module uses Module:Wikt-lang/data to retrieve the language name for a language code, and to perform the necessary entry-name replacements (for instance, removing macrons from Latin entry names). These are unfortunately not automatically retrieved from Wiktionary's Wikt-lang data modules. For language codes that do not have a name value in this module, the language name is fetched with mw.language.fetchLanguageName. When mw.language.fetchLanguageName does not fetch the correct language name (or any language name at all), please add it to Module:Wikt-lang/data; similarly, when the correct entry name is not generated, please add the entry-name replacements to that data module.
-- Load the 'strict' module.
-- NOTE(review): on Scribunto this presumably turns reads/writes of undeclared
-- globals into errors -- confirm against the Scribunto manual.
require('strict')
-- Language data for this module, loaded from Module:Wikt-lang/data.
local m_data = mw.loadData("Module:Wikt-lang/data")
-- Per-language records: the `languages` subtable when the data module has one,
-- otherwise the data table itself.
local langData = m_data.languages or m_data
-- Export table; returned at the end of the module.
local p = {}
-- Error messages raised by this module, keyed by a short identifier.
--
-- The keys `makeEntryName`, `empty_language_name`, `no_text` and `no_result`
-- are the ones the functions in this module look up.
-- NOTE(review): `language_name_not_found` is not referenced anywhere in the
-- visible code, so its key name is a reconstruction -- confirm against the
-- upstream module before relying on it. "$1" in that message is a placeholder
-- for the language code.
local error_mesages = {
	makeEntryName = "The function makeEntryName requires a string argument",
	language_name_not_found = "Name for the language code $1 could not be retrieved with mw.language.fetchLanguageName, so it should be added to [[Module:Wikt-lang/data]]",
	empty_language_name = "Language name is empty",
	no_text = "linkToWiktionary needs a Wiktionary entry or link text, or both",
	no_result = "The function wiktlang generated nothing",
}
-- Module-wide configuration: every wiki-specific string lives here so the
-- module can be adapted to another wiki by editing a single table.
local cfg = {
	-- Values of a language record's `type` field that select a special
	-- Wiktionary namespace for the entry.
	types = {
		reconstructed = "reconstructed",
		appendix = "appendix",
	},

	-- Page-title patterns for those namespaces.
	-- NOTE(review): "$1"/"$2" look like language-name/entry placeholders, but
	-- these two patterns are not referenced in the visible code -- confirm.
	reconstruction = "Reconstruction:$1/$2",
	appendix = "Appendix:$1/$2",

	-- Pieces of the error span shown to the reader, and the text appended
	-- after it.
	error = "Error",
	template = "Wikt-lang",
	category = "Category:Wikt-lang template errors",

	-- Language in which mw.language.fetchLanguageName returns language names.
	wiki_language = "en",
}
-- Normalise an "empty" template argument.
-- Returns `value` unchanged unless it is the empty string, in which case
-- nil is returned so that callers can test the result for truthiness.
local function ifNotEmpty(value)
	if value ~= "" then
		return value
	end
	return nil
end
-- Turn a displayed word into the title of its Wiktionary entry.
--
-- Wiki bold/italic markup is removed, then the entry-name replacements that
-- the data module lists for `languageCode` (if any) are applied.
--
-- @param word          the word to convert; converted with tostring()
-- @param languageCode  key into the language data; may be nil or unknown,
--                      in which case only the markup is removed
-- @return the entry name ("" when `word` is the empty string)
-- Raises error_mesages.makeEntryName when `word` is nil.
local function makeEntryName(word, languageCode)
	-- The nil test has to come before tostring(): tostring(nil) is the
	-- string "nil", which would otherwise be treated as a real word.
	if word == nil then
		error(error_mesages.makeEntryName)
	end
	word = tostring(word)
	if word == "" then
		return ""
	end

	-- Remove bold and italics, so that words that contain bolding or
	-- emphasis can be linked without piping. Bold (''') goes first so its
	-- apostrophes are not consumed as an italic marker.
	word = word:gsub("'''", "")
	word = word:gsub("''", "")

	-- NOTE(review): the per-language lookup and the "replacements" key are
	-- reconstructed (the bracketed parts were lost from the published
	-- source) -- confirm against Module:Wikt-lang/data.
	local data = langData[languageCode]
	local replacements = data and data["replacements"]
	if not replacements then
		return word
	end

	local ugsub = mw.ustring.gsub
	if replacements.decompose then
		-- Decompose so that the diacritics of characters such as á can be
		-- removed in one go. No need to compose at the end, because the
		-- MediaWiki software will handle that.
		word = mw.ustring.toNFD(word)
		local to = replacements.to
		for i, from in ipairs(replacements.from) do
			-- A pattern with no matching `to` entry is simply deleted.
			word = ugsub(word, from, to and to[i] or "")
		end
	else
		-- Plain map of pattern -> replacement.
		for regex, replacement in pairs(replacements) do
			word = ugsub(word, regex, replacement)
		end
	end
	return word
end
-- Wrap `text` in an HTML element carrying the language code.
--
-- @param text          wikitext to wrap; nil/false is treated as ""
-- @param languageCode  language code used for the lookup and the lang attribute
-- @param script        script code; only "Latn" text can be italicised
-- @param italics       truthy to italicise Latin-script text
-- @return `<i lang="…">…</i>` when italicised, otherwise
--         `<span lang="…">…</span>`; right-to-left languages additionally get
--         a dir="rtl" attribute and are wrapped in direction marks.
local function tag(text, languageCode, script, italics)
	local data = langData[languageCode]

	-- Use Wikipedia code if it has been given: for instance,
	-- Proto-Indo-European has the Wiktionary code "ine-pro" but the Wikipedia
	-- code "ine-x-proto".
	languageCode = data and data.Wikipedia_code or languageCode

	local element = (script == "Latn" and italics) and "i" or "span"
	text = text or ""

	local dir_attribute, before, after = "", "", ""
	-- NOTE(review): the field name "direction" is reconstructed (the key was
	-- lost from the published source) -- confirm against Module:Wikt-lang/data.
	if data and data["direction"] == "rtl" then
		dir_attribute = ' dir="rtl"'
		before = "\226\128\143" -- U+200F RIGHT-TO-LEFT MARK, UTF-8 encoded
		after = "\226\128\142"  -- U+200E LEFT-TO-RIGHT MARK, UTF-8 encoded
	end

	return before
		.. "<" .. element .. ' lang="' .. languageCode .. '"' .. dir_attribute .. ">"
		.. text
		.. "</" .. element .. ">"
		.. after
end
-- Build a wikilink to a Wiktionary entry.
--
-- @param entry         Wiktionary page title; a leading "*" marks a
--                      reconstructed form
-- @param link_text     text displayed for the link
-- @param languageCode  optional; when given, the link targets the section
--                      named after the language, and reconstructed/appendix
--                      languages are sent to the matching namespace
-- @return the wikilink as a string
-- Raises an error when `entry` or `link_text` is missing, when no language
-- name can be found for `languageCode`, or when a namespaced title is needed
-- but the language name is empty.
--
-- NOTE(review): the "[[wikt:…]]" link strings below are reconstructed (the
-- bracketed parts were lost from the published source) -- confirm the exact
-- interwiki prefix against the upstream module.
local function linkToWiktionary(entry, link_text, languageCode)
	if not entry or not link_text then
		error(error_mesages.no_text)
	end

	if not languageCode then
		return "[[wikt:" .. entry .. "|" .. link_text .. "]]"
	end

	local data = langData[languageCode]
	local name
	if data and data.name then
		name = data.name
	else
		-- On other languages' wikis, use mw.getContentLanguage():getCode(),
		-- or replace cfg.wiki_language with that wiki's language code.
		name = mw.language.fetchLanguageName(languageCode, cfg.wiki_language)
		if name == "" then
			error("Name for the language code " .. ("%q"):format(languageCode)
				.. " could not be retrieved with mw.language.fetchLanguageName, "
				.. "so it should be added to [[Module:Wikt-lang/data]]")
		end
	end

	-- Decide whether the entry lives in a special namespace.
	local namespace
	local page = entry
	if entry:sub(1, 1) == "*" then
		namespace = "Reconstruction:"
		page = entry:sub(2) -- the asterisk is not part of the page title
	elseif data and data.type == cfg.types.reconstructed then
		mw.log("Reconstructed language without asterisk:", languageCode, name, entry)
		local frame = mw.getCurrentFrame()
		-- Track reconstructed entries with no asterisk by transcluding
		-- a nonexistent template (a technique borrowed from Wiktionary).
		-- The uses can then be listed at
		-- Special:WhatLinksHere/Template:tracking/wikt-lang/reconstructed with no asterisk.
		-- pcall: tracking is best-effort and must never break the output.
		pcall(frame.expandTemplate, frame,
			{ title = 'tracking/wikt-lang/reconstructed with no asterisk' })
		namespace = "Reconstruction:"
	elseif data and data.type == cfg.types.appendix then
		namespace = "Appendix:"
	end

	if namespace then
		-- data.name can be an empty string; a title cannot be built from it.
		if name == "" then
			error(error_mesages.empty_language_name)
		end
		entry = namespace .. name .. "/" .. page
	end

	return "[[wikt:" .. entry .. "#" .. name .. "|" .. link_text .. "]]"
end
--[[--------------------------< M A K E _ E R R O R _ S P A N >--------------------------------------------------

Formats an error message for display: a red <span> containing cfg.error,
': ', cfg.template and then msg. msg is appended directly after the template
name, so callers supply their own leading space.

]]
local function maker_error_span (msg)
	local opening = '<span style="color: #d33;">'
	local label = cfg.error .. ': ' .. cfg.template
	return opening .. label .. msg .. '</span>'
end
--[[--------------------------< W I K T L A N G >--------------------------------------------------------------------

Entry point for {{Wikt-lang}}.

Parameters are received from the template's frame (parent frame); when the
parent frame has no first positional parameter, the #invoke frame's own
arguments are used instead.

	1 - language codes
	2 - link text: the word whose Wiktionary entry is linked (required)
	3 - display text: shown instead of parameter 2 when given
	italic - no to disable
	         NOTE(review): this function never reads args.italic itself;
	         the italic setting comes back from the Lang module call below.

Returns the language-tagged Wiktionary link, or an error message.

]]
function p.wiktlang(frame)
	local parent = frame:getParent()
	-- NOTE(review): the "[1]" test is reconstructed (the index was lost from
	-- the published source) -- confirm against the upstream module.
	local args = (parent and parent.args[1]) and parent.args or frame.args

	local entry_word = args[2]
	if not entry_word or entry_word == '' then
		-- NOTE(review): cfg.category is appended as plain text here; if it is
		-- meant to categorise the page it needs to be a [[...]] link -- confirm.
		return maker_error_span(" Parameter 2 is required") .. cfg.category
	end

	local codes = args[1] and mw.text.trim(args[1])
	-- The displayed text falls back to the entry word when parameter 3 is
	-- absent or empty.
	local display_text = ifNotEmpty(args[3]) or entry_word

	-- NOTE(review): this loads a sandbox copy of the Lang module; switching to
	-- the live module needs confirmation that it exposes the same `test` function.
	local langM = require("Module:Lang/sandbox2")
	-- Only the language code, italic setting and error message are used.
	local _formatted_code, languageCode, _language_name, _rtl, italic, msg =
		langM.test({code = codes, text = display_text}, "wikt-lang")
	if msg then
		return msg
	end

	-- Map codes that the data module redirects onto their target code.
	local redirects = m_data.redirects
	if redirects and languageCode and redirects[languageCode] then
		languageCode = redirects[languageCode]
	end

	-- The entry is derived from parameter 2, never from the display text, so
	-- that the third parameter can differ freely from the linked entry.
	local entry = makeEntryName(entry_word, languageCode)

	if languageCode then
		local scriptCode = require("Module:Unicode data").is_Latin(display_text) and "Latn" or "unknown"
		-- tag should also be replaced with the lang.make_text_html function
		return tag(linkToWiktionary(entry, display_text, languageCode), languageCode, scriptCode, italic)
	end
	return linkToWiktionary(entry, display_text)
end
return p