Content deleted Content added
trim code to allow removing "%s*" from patterns |
sync from sandbox: include explicitly given script subtag in language tagging |
||
(22 intermediate revisions by 8 users not shown) | |||
Line 1:
require('
local m_data = mw.loadData("Module:
local langData = m_data.languages or m_data
local p = {}
local function
if value == "" then
return nil
else
return value
end
end
Line 57 ⟶ 54:
end
end
local function fixScriptCode(firstLetter, threeLetters)
Line 64 ⟶ 59:
end
local function getCodes(codes
local languageCode, scriptCode, invalidCode
local errorText
if codes == nil or codes == "" then
errorText = 'no language or script code provided'
elseif codes:find("^%a%a%a?$") or codes:find("^%a%a%a?%-%a%a%a%a$") then
-- A three- or two-letter lowercase sequence at beginning of first parameter
Line 107 ⟶ 83:
)
)
elseif codes:find("^%a%a%a?%-%a%a%a?$")
languageCode = codes
-- Private-use subtag: x followed by one or more sequences of 1-8 lowercase
-- letters separated by hyphens. This only allows for one sequence, as it is
-- needed for proto-languages such as ine-x-proto (Proto-Indo-European).
elseif codes:find("^%a%a%a?%-x%-%a%a?%a?%a?%a?%a?%a?%a?$") then
languageCode, scriptCode =
codes:match("^(%a%a%a%-x%-%a%a?%a?%a?%a?%a?%a?%a?)%-?(.*)$")
if not languageCode then
errorText = '<code>'..codes..'</code> is not a valid language or script code.'
elseif scriptCode ~= "" and not scriptCode:find("%a%a%a%a") then
errorText = '<code>'..scriptCode..'</code> is not a valid script code.'
else
scriptCode = scriptCode:gsub(
"(%a)(%a%a%a)",
fixScriptCode,
1
)
end
elseif codes:find("^%a%a%a?") then
languageCode, invalidCode = codes:match("^(%a%a%a?)%-?(.*)")
Line 124 ⟶ 118:
else
errorText = '<code>'..codes..'</code> is not a valid language or script code.'
end
if errorText then
Line 137 ⟶ 128:
end
local function tag(text, languageCode, script,
local data = langData[languageCode]
-- Use Wikipedia code if it has been given: for instance,
Line 143 ⟶ 134:
-- code "ine-x-proto".
languageCode = data and data.Wikipedia_code or languageCode
if script and script ~= "" then
languageCode = languageCode .. "-" .. script
end
if not text then text = "[text?]" end
Line 155 ⟶ 147:
local out = { textDirectionMarkers[2] }
if italicize then
table.insert(out, "<i lang=\"" .. languageCode
else
table.insert(out, "<span
end
table.insert(out, textDirectionMarkers[3])
return table.concat(out)
end
Line 187 ⟶ 162:
if data and data.name then
name = data.name
else
-- On other languages' wikis, use mw.getContentLanguage():getCode(),
-- or replace 'en' with that wiki's language code.
name = mw.language.fetchLanguageName(languageCode, 'en')
if name == "" then
error("
.. " could not be retrieved with mw.language.fetchLanguageName, "
.. "so it should be added to [[Module:Wikt-lang/data]]")
end
end
if entry:sub(1, 1) == "*" then
Line 235 ⟶ 214:
local codes = args[1] and mw.text.trim(args[1])
local word1 = ifNotEmpty(args[2])
local word2 = ifNotEmpty(args[3])
if not args[2] or '' == args[2] then
end
local languageCode, scriptCode, errorText = getCodes(codes
local italics = args.italics or args.i or args.italic
italics = not (italics == "n" or italics == "-" or italics == "no")
local entry, linkText
if
entry = makeEntryName(word1, languageCode)
linkText = word2
elseif
entry = makeEntryName(word1, languageCode)
linkText = word1
end
local italicize = italics and (scriptCode == "Latn" or require("Module:Unicode data").is_Latin(linkText))
local out
if languageCode and entry and linkText then
out = tag(linkToWiktionary(entry, linkText, languageCode), languageCode, scriptCode,
elseif entry and linkText then
out = linkToWiktionary(entry, linkText)
Line 269 ⟶ 250:
else
return errorText or error("The function wiktlang generated nothing")
end
end
|