Module: Language
enwiki>MusikBot II m (Changed protection settings for "Module:Language": High-risk template or module: 2500 transclusions (more info) ([Edit=Require extended confirmed access] (indefinite) [Move=Require extended confirmed access] (indefinite))) |
m (1 revision imported) |
||
(No difference)
|
Latest revision as of 18:57, 28 February 2024
This module is rated as beta, and is ready for widespread use. It is still new and should be used with some caution to ensure the results are as expected. |
Language templates |
---|
Language names (ISO 639) |
|
Interwiki links |
Foreign-language text |
|
Other |
This module depends on the following other modules: |
This module is used by {{wikt-lang}}
. It is inspired by the templates {{m}} and {{l}} and their associated modules on Wiktionary. It has a Wiktionary link function that links to the correct section of the Wiktionary entry, and applies correct language formatting and italics. The language-tagging function does most of what {{lang}} does, except that italics can't be customized and categories aren't added.
The module uses Module:Language/data to retrieve the language name for a language code, and to perform the necessary entry-name replacements (for instance, removing macrons from Latin entry names). These are unfortunately not automatically retrieved from Wiktionary's language data modules. For language codes that do not have a name
value in this module, the language name is fetched with mw.language.fetchLanguage
. When mw.language.fetchLanguage
does not fetch the correct language name (or any language name at all), please add it to Module:language/data, and similarly when the correct entry name is not generated, please add the entry name replacements to the module.
Examples
{{#invoke:Language|wikt|en|language}}
-> language{{#invoke:Language|wikt|en|language|languages}}
-> languages{{#invoke:Language|wikt|fr|bourguignon}}
-> bourguignon{{#invoke:Language|wikt|la|homō}}
-> homō{{#invoke:Language|wikt|grc|δημοκρατίᾱ}}
-> δημοκρατίᾱ{{#invoke:Language|wikt|ru|язы́к}}
-> язы́к{{#invoke:Language|wikt|ar|العَرَبِيَّة}}
-> العَرَبِيَّة{{#invoke:Language|wikt|fa|فارسی}}
-> فارسی{{#invoke:Language|wikt|ine-x-proto|*h₂enǵʰ-}}
-> *h₂enǵʰ-
Invalid codes
{{#invoke:Language|wikt|EN|language}}
-> language{{#invoke:Language|wikt|En|language|languages}}
-> languages{{#invoke:Language|wikt|La|homō}}
-> homō{{#invoke:Language|wikt|Grc|δημοκρατίᾱ}}
-> δημοκρατίᾱ{{#invoke:Language|wikt|Ru|язы́к}}
-> язы́к{{#invoke:Language|wikt|Ar|العَرَبِيَّة}}
-> العَرَبِيَّة{{#invoke:Language|wikt|Fa|فارسی}}
-> فارسی
Errors
{{#invoke:Language|wikt|en-Latin|language}}
-> language [Latin
is not a valid script code.]
Tracking categories
- Category:Language module errors (0)
- Category:Language module reconstructed with no asterisk (0)
- Category:Language module using redirect code (0)
require('strict') local m_data = mw.loadData("Module:Language/data") local langData = m_data.languages or m_data local p = {} local function ifNotEmpty(value) if value == "" then return nil else return value end end local function makeLinkedName(languageCode) local data = langData[languageCode] local article = data["article"] local name = data["Wikipedia_name"] or data["name"] return "[[" .. article .. "|" .. name .. "]]: " end local function makeEntryName(word, languageCode) local data = langData[languageCode] local ugsub = mw.ustring.gsub word = tostring(word) if word == nil then error("The function makeEntryName requires a string argument") elseif word == "" then return "" else -- Remove bold and italics, so that words that contain bolding or emphasis can be linked without piping. word = word:gsub("\'\'\'", "") word = word:gsub("\'\'", "") if data == nil then return word else local replacements = data and data["replacements"] if replacements == nil then return word else -- Decompose so that the diacritics of characters such -- as á can be removed in one go. -- No need to compose at the end, because the MediaWiki software -- will handle that. if replacements.decompose then word = mw.ustring.toNFD(word) for i, from in ipairs(replacements.from) do word = ugsub( word, from, replacements.to and replacements.to[i] or "") end else for regex, replacement in pairs(replacements) do word = ugsub(word, regex, replacement) end end return word end end end end p.makeEntryName = makeEntryName local function fixScriptCode(firstLetter, threeLetters) return string.upper(firstLetter) .. string.lower(threeLetters) end local function getCodes(codes, text) local languageCode, scriptCode, invalidCode local errorText if codes == nil or codes == "" then errorText = 'no language or script code provided' elseif codes:find("^%a%a%a?$") or codes:find("^%a%a%a?%-%a%a%a%a$") then -- A three- or two-letter lowercase sequence at beginning of first parameter languageCode = codes:find("^%a%a%a?") and ( codes:match("^(%l%l%l?)") or codes:match("^(%a%a%a?)") :gsub("(%a%a%a?)", string.lower, 1) ) -- One uppercase and three lowercase letters at the end of the first parameter scriptCode = codes:find("%a%a%a%a$") and ( codes:match("(%u%l%l%l)$") or gsub( codes:match("(%a%a%a%a)$"), "(%a)(%a%a%a)", fixScriptCode, 1 ) ) elseif codes:find("^%a%a%a?%-%a%a%a?$") or codes:find("^%a%a%a%-%a%a%a%-%a%a%a$") then languageCode = codes -- Private-use subtag: x followed by one or more sequences of 1-8 lowercase -- letters separated by hyphens. This only allows for one sequence, as it is -- needed for proto-languages such as ine-x-proto (Proto-Indo-European). elseif codes:find("^%a%a%a?%-x%-%a%a?%a?%a?%a?%a?%a?%a?$") then languageCode, scriptCode = codes:match("^(%a%a%a%-x%-%a%a?%a?%a?%a?%a?%a?%a?)%-?(.*)$") if not languageCode then errorText = '<code>'..codes..'</code> is not a valid language or script code.' elseif scriptCode ~= "" and not scriptCode:find("%a%a%a%a") then errorText = '<code>'..scriptCode..'</code> is not a valid script code.' else scriptCode = scriptCode:gsub( "(%a)(%a%a%a)", fixScriptCode, 1 ) end elseif codes:find("^%a%a%a?") then languageCode, invalidCode = codes:match("^(%a%a%a?)%-?(.*)") languageCode = string.lower(languageCode) errorText = '<code>'..invalidCode..'</code> is not a valid script code.' elseif codes:find("%-?%a%a%a%a$") then invalidCode, scriptCode = codes:match("(.*)%-?(%a%a%a%a)$") scriptCode = gsub( scriptCode, "(%a)(%a%a%a)", fixScriptCode ) errorText = '<code>'..invalidCode..'</code> is not a valid language code.' else errorText = '<code>'..codes..'</code> is not a valid language or script code.' end if not scriptCode or scriptCode == "" then scriptCode = require("Module:Unicode data").is_Latin(text) and "Latn" or "unknown" end if errorText then errorText = ' <span style="font-size: smaller">[' .. errorText .. ']</span>' else errorText = "" end languageCode = m_data.redirects[languageCode] or languageCode return languageCode, scriptCode, errorText end local function tag(text, languageCode, script, italics) local data = langData[languageCode] -- Use Wikipedia code if it has been given: for instance, -- Proto-Indo-European has the Wiktionary code "ine-pro" but the Wikipedia -- code "ine-x-proto". languageCode = data and data.Wikipedia_code or languageCode local italicize = script == "Latn" and italics if not text then text = "[text?]" end local textDirectionMarkers = { "", "", "" } if data and data["direction"] == "rtl" then textDirectionMarkers = { ' dir="rtl"', '‏', '‎' } end local out = { textDirectionMarkers[2] } if italicize then table.insert(out, "<i lang=\"" .. languageCode .. "\"" .. textDirectionMarkers[1] .. ">" .. text .. "</i>") else table.insert(out, "<span lang=\"" .. languageCode .. "\"" .. textDirectionMarkers[1] .. ">" .. text .. "</span>") end table.insert(out, textDirectionMarkers[3]) return table.concat(out) end function p.lang(frame) local parent = frame:getParent() local args = parent.args[1] and parent.args or frame.args local codes = args[1] and mw.text.trim(args[1]) local text = args[2] or error("Provide text in the second parameter") local languageCode, scriptCode, errorText = getCodes(codes, text) local italics = args.italics or args.i or args.italic italics = not (italics == "n" or italics == "-" or italics == "no") return tag(text, languageCode, scriptCode, italics) .. errorText end local function linkToWiktionary(entry, linkText, languageCode) local data = langData[languageCode] local name if languageCode then if data and data.name then name = data.name else -- On other languages' wikis, use mw.getContentLanguage():getCode(), -- or replace 'en' with that wiki's language code. name = mw.language.fetchLanguageName(languageCode, 'en') if name == "" then error("Name for the language code " .. ("%q"):format(languageCode or nil) .. " could not be retrieved with mw.language.fetchLanguageName, " .. "so it should be added to [[Module:Language/data]]") end end if entry:sub(1, 1) == "*" then if name ~= "" then entry = "Reconstruction:" .. name .. "/" .. entry:sub(2) else error("Language name is empty") end elseif data and data.type == "reconstructed" then mw.log("Reconstructed language without asterisk:", languageCode, name, entry) local frame = mw.getCurrentFrame() -- Track reconstructed entries with no asterisk by transcluding -- a nonexistent template. This technique is used in Wiktionary: -- see [[wikt:Module:debug]]. -- [[Special:WhatLinksHere/tracking/wikt-lang/reconstructed with no asterisk]] pcall(frame.expandTemplate, frame, { title = 'tracking/wikt-lang/reconstructed with no asterisk' }) if name ~= "" then entry = "Reconstruction:" .. name .. "/" .. entry else error("Language name is empty") end elseif data and data.type == "appendix" then if name ~= "" then entry = "Appendix:" .. name .. "/" .. entry else error("Language name is empty") end end if entry and linkText then return "[[wikt:" .. entry .. "#" .. name .. "|" .. linkText .. "]]" else error("linkToWiktionary needs a Wiktionary entry or link text, or both") end else return "[[wikt:" .. entry .. "|" .. linkText .. "]]" end end function p.wiktlang(frame) local parent = frame:getParent() local args = parent.args[1] and parent.args or frame.args local codes = args[1] and mw.text.trim(args[1]) local word1 = ifNotEmpty(args[2]) local word2 = ifNotEmpty(args[3]) if not args[2] then error("Parameter 2 is required") end local languageCode, scriptCode, errorText = getCodes(codes, word2 or word1) local italics = args.italics or args.i or args.italic italics = not (italics == "n" or italics == "-" or italics == "no") local entry, linkText if word2 and word1 then entry = makeEntryName(word1, languageCode) linkText = word2 elseif word1 then entry = makeEntryName(word1, languageCode) linkText = word1 end local out if languageCode and entry and linkText then out = tag(linkToWiktionary(entry, linkText, languageCode), languageCode, scriptCode, italics) elseif entry and linkText then out = linkToWiktionary(entry, linkText) else out = '<span style="font-size: smaller;">[text?]</span>' end if out and errorText then return out .. errorText else return errorText or error("The function wiktlang generated nothing") end end function p.wikt(frame) local parent = frame:getParent() local args = parent.args[1] and parent.args or frame.args local codes = args[1] and mw.text.trim(args[1]) local word1 = ifNotEmpty(args[2]) local word2 = ifNotEmpty(args[3]) if not word1 then error("Provide a word in parameter 2.") end local languageCode, scriptCode, errorText = getCodes(codes, word1) local entry, linkText if word2 and word1 then entry = makeEntryName(word1, languageCode) linkText = word2 elseif word1 then entry = makeEntryName(word1, languageCode) linkText = word1 end local out if languageCode and entry and linkText then out = linkToWiktionary(entry, linkText, languageCode) elseif entry and linkText then out = linkToWiktionary(entry, linkText) else out = '<span style="font-size: smaller;">[text?]</span>' end if out and errorText then return out and out .. errorText else return errorText or error("The function wikt generated nothing") end end return p