Module:ISO 3166/sandbox: Difference between revisions

Content deleted Content added
Properly suppress category
Don't display script warnings if nocat is set to true
 
(26 intermediate revisions by 2 users not shown)
Line 7:
local p = {}
local getArgs = require("Module:Arguments").getArgs
local data = mw.loadData("Module:ISO 3166/data/National/sandbox")
 
--[[----------E R R O R S----------]]-- -- Assign error categories and display warnings
-- Builds the tracking category for an unrecognized name and, when a code is
-- supplied, emits a warning through mw.addWarning.
--   errType : 'country' or 'subdivision' (the only values that produce a warning)
--   args    : argument table; reads args.nocat, args[1] and args[2]
--   code    : (optional) value reported as unrecognized; without it no warning is emitted
--   alpha2  : (optional) country code appended to "ISO 3166-2:" in subdivision warnings;
--             a subdivision warning is only emitted when it is given
-- Returns the category wikitext when the current title is in namespace 0,
-- otherwise an empty string. Returns '' and emits nothing when args.nocat == 'true'.
local function errors(errType, args, code, alpha2)
	-- nocat=true suppresses both the warning and the category.
	if args.nocat == 'true' then
		return ''
	end

	if code then
		-- Every variable part is passed as a format argument, so a stray '%'
		-- in code/errType cannot be misread as a format directive.
		local warningFormat = '%s ("%s") is not a recognized %s in [[ISO 3166-%s]] ([[Module:ISO 3166]]).'
		if errType == 'country' then
			mw.addWarning(string.format(warningFormat, code, args[1] or '', errType, '1'))
		elseif errType == 'subdivision' and alpha2 then
			mw.addWarning(string.format(warningFormat, code, args[2] or '', errType, '2:' .. alpha2))
		end
	end

	if mw.title.getCurrentTitle().namespace ~= 0 then
		return ''
	end
	-- The category is named after the error type alone; the previous code
	-- appended a literal 'subdivision' after errType, producing names such as
	-- "obscure countrysubdivision".
	-- NOTE(review): confirm the exact category titles exist on the wiki.
	return '[[Category:Wikipedia articles with obscure ' .. errType .. ']]'
end
 
--[[----------F I N D N A M E----------]]-- -- Finds the name in the database
Line 54 ⟶ 70:
 
function p.strip(text)
if not text then return nil end
local accents = {["À"]="A",["Á"]="A",["Â"]="A",["Ã"]="A", --accent list (each is two bytes; first byte = 195)
["Ä"]="A",["Å"]="A",["Ç"]="C",["È"]="E",["É"]="E",
["Ê"] local accents ="E", {["ËÀ"]="EA",["ÌÁ"]="IA",["ÍÂ"]="IA",["ÎÃ"]="IA",
["ÏÄ"]="IA",["ÑÅ"]="NA",["ÒÆ"]="OAE",["ÓÇ"]="OC",["ÔÈ"]="OE",
["ÕÉ"]="OE",["ÖÊ"]="OE",["ØË"]="OE",["ÙÌ"]="UI",["ÚÍ"]="UI",
["ÛÎ"]="UI",["ÜÏ"]="UI",["ÝÐ"]="YD",["Ñ"]="N",["Ò"]="O",
["Ó"]="O",["Ô"]="O",["Õ"]="O",["Ö"]="O",["Ø"]="O",
["Ù"]="U",["Ú"]="U",["Û"]="U",["Ü"]="U",["Ý"]="Y",
["Þ"]="TH",
["Ā"]="A",["Ă"]="A",["Ą"]="A",["Ć"]="C",["Č"]="C",
["Ĉ"]="C",["Ċ"]="C",["Ď"]="D",["Đ"]="D",["Ĕ"]="E",
["Ě"]="E",["Ė"]="E",["Ē"]="E",["Ę"]="E",["Ŋ"]="N",
["Ğ"]="G",["Ģ"]="G",["Ĝ"]="G",["Ġ"]="G",["Ĥ"]="H",
["Ħ"]="H",["Ĭ"]="I",["İ"]="I",["Ī"]="I",["Į"]="I",
["Ĩ"]="I",["IJ"]="IJ",["Ĵ"]="J",["Ķ"]="K",["Ĺ"]="L",
["Ľ"]="L",["Ļ"]="L",["Ŀ"]="L",["Ł"]="L",["Ń"]="N",
["Ň"]="N",["Ņ"]="N",["Ŏ"]="O",["Ő"]="O",["Ō"]="O",
["Œ"]="OE",["Ŕ"]="R",["Ř"]="R",["Ŗ"]="R",["Ś"]="S",
["Š"]="S",["Ş"]="S",["Ŝ"]="S",["Ť"]="T",["Ţ"]="T",
["Ŧ"]="T",["Ŭ"]="U",["Ű"]="U",["Ū"]="U",["Ų"]="U",
["Ů"]="U",["Ũ"]="U",["Ŵ"]="W",["Ŷ"]="Y",["Ÿ"]="Y",
["Ź"]="Z",["Ž"]="Z",["Ż"]="Z",
}
local remove = {"NATION OF","COUNTRY OF","TERRITORY OF", -- text to be removed list
"FLAG OF","FLAG","KINGDOM OF","STATE OF"," STATE ",
"PROVINCE OF","PROVINCE","TERRITORY","COUNTY","GOVERNORATE"
}
local patterns = { "(%a)%.(%a)%.",".+:","|.+","%(.-%)", -- patterns to follow (order may matter)
"%.%S.*","^THE ","%_","%-","%d%d?%d?PX"
[".+:"]="",
}
["|.+"]="",
local replacements = {["(%a)%.(%a)%."]="%1%2", -- Replacements for patterns above (order does not matter)
["%(.-%)"]="",
["%.+:"]="",["|.*+"]="",["%(.-%)"]="",
["%.%S.*"]="",["^THE "]="",["%_"]=" ",["%-"]=" ",
["%_"]=" ",
["%d%d?%d?PX"]="",
}
 
text = mw.text.decode(text) -- Decode HTML entities (passed from wikidata?)
text = mw.ustring.upper(text) --case insensitivity
text = mw.text.unstripNoWiki(text) -- Remove <nowiki> tags
 
text = text:gsub('\195mw.',accentsustring.upper(text) --Deaccent Case insensitivity
text = mw.ustring.gsub(text,"[À-Ż]",accents) -- Deaccent
 
for pattern,value in pairs(patterns) do --Follow patterns
for _,pattern in ipairs(patterns) do -- Follow patterns
text = text:gsub(pattern,value)
local value = replacements[pattern]
text = mw.ustring.gsub(text,pattern,value)
end
 
for _,words in pairs(remove) do -- Remove unneeded words
text = text:mw.ustring.gsub(text,words,"")
end
 
text = text:mw.ustring.gsub(text,"[^%w%-]W","") --Only keepRemove ASCIInon alphanumeric and hyphenalpha-numeric
 
return text
end
 
Line 95 ⟶ 129:
 
function p.callstrip(frame)
 
local args = getArgs(frame)
 
return p.strip(args[1]) or ""
 
Line 103 ⟶ 137:
 
--[[----------P . L U A C O D E---------]]-- -- Makes the ISO code of a country
 
-- Returns tuple (code,errorcat,errortext). code is empty string upon error because MW stops at first nil
function p.luacode(args)
localargs[1], catnocountryargs[2] = (args.nocat[1] and args.nocat ==or 'true'), args[2] andor ''
local code1 = p.strip(args[1])
or '[[Category:Wikipedia page with obscure country]]'
local catnosubdivisioncode2 = p.strip(args.nocat and args.nocat == 'true'[2]) and ''
 
or '[[Category:Wikipedia page with obscure subdivision]]'
if args["codetype"]=="3" then args["codetype"]="alpha3" end
local functioneot = luacodeimpl(args).error or ""
if code1 == "" then
local country, subdivision = args[1], args[2]
if not (args.nocat and args.nocat == 'true') then
mw.addWarning((args[1] ~= "" and ('Invalid parameter "' .. args[1] .. '"') or 'No parameter') ..
if args["codetype"]=="3" then
' for the country given ([[Module:ISO 3166]]).')
args["codetype"]="alpha3"
end
return errors('country', args), '<span style="font-size:100%" class="error">"No parameter for the country given"</span>'
end
if notcode2 subdivision== "" then --3166-1 code
for alpha2,cdata in pairs(data) do
if findname(alpha2,cdata,countrycode1) then
if args["codetype"]=="numeric" or args["codetype"]=="alpha3" then
return cdata[args["codetype"]]
else
return alpha2
end
end
end
end
if mw.title.getCurrentTitle().namespace ~= 0 then catnocountry = '' end
if string.find(args[1],"%-") then
return '',catnocountry
args[1], args[2] = string.match(args[1],"^([^%-]*)%-(.*)$")
else --3166-2 code
if args[2] then return p.luacode(args) end
for alpha2,cdata in pairs(data) do
end
if findname(alpha2,cdata,country) then
return errors('country', args, code1)
if alpha2:sub(1,2) == "GB" then --Treat all UK countries as the UK
else --3166-2 code
alpha2 = "GB"
for alpha2,cdata in pairs(data) do
end
if findname(alpha2,cdata,code1) then
local sdata = mw.loadData("Module:ISO 3166/data/"..alpha2)
if mw.ustring.match(alpha2,"GB") then -- For England, Wales etc.
local empty = true
alpha2 = "GB"
for scode,scdata in pairs(sdata) do
end
if type(scdata) == "table" then
local sdata = mw.loadData("Module:ISO 3166/data/"..alpha2)
empty = false
local empty = true
if findname(scode,scdata,subdivision) then
for scode,scdata in pairs(sdata) do
return alpha2.."-"..scode
if type(scdata)=="table" then
end
empty = false
if findname(scode,scdata,code2) then
return alpha2.."-"..scode
end
end
if mw.title.getCurrentTitle().namespace ~= 0 then catnosubdivision = '' end
return '',catnosubdivision
end
if string.find(args[2] or '',"%-") then
code1, args[2] = string.match(args[2] or '',"^([^%-]*)%-(.*)$")
args[1] = args[1].."-"..code1
return p.luacode(args)
end
return errors('subdivision', args, code2, alpha2)
end
if mw.title.getCurrentTitle().namespace ~= 0 then catnocountry = '' end
return '',catnocountry
end
if string.find(args[1],"%-") then
args[1] = string.match(args[1],"^([^%-]*)%-(.*)$")
end
return p.luacode(args)
 
if args[1] then args[1] = p.strip(args[1]) end
if args[2] then args[2] = p.strip(args[2]) end
 
local a1,a2 = args[1],args[2]
 
if not a1 or a1 == '' then
if mw.title.getCurrentTitle().namespace ~= 0 then catnocountry = '' end
return '',catnocountry,'<span class="error">ISO 3166: name not specified</span>'
end
 
if a2 ~= nil and a2 ~= '' then --explicit subdivision, no splitting
return luacodeimpl(args)
end
 
-- Which hyphen to split on, for cases in order of likelihood:
-- none | <country>
-- first | <country>-<subdivision>
-- first | <country>-<hyphenated-subdivision>
-- none | <hyphenated-country>
-- later | <hyphenated-country>-<subdivision>
-- later | <hyphenated-country>-<hyphenated-subdivision>
-- Therefore, first try splitting on first, then on none, then other left-to-right.
 
local hyphenPos = a1:find('-',1,true)
 
if not hyphenPos then --no hyphen
return luacodeimpl(args)
end
 
args[1] = a1:sub(1, hyphenPos-1) --Split on first
args[2] = a1:sub(hyphenPos+1)
local result = luacodeimpl(args)
if result ~= '' then
return result
end
 
-- (a2 is known to be blank by this point)
args[1],args[2] = a1,a2 --Don't split
local result = luacodeimpl(args)
if result ~= '' then
return result
end
 
while true do --Split on rest
hyphenPos = a1:find('-', hyphenPos+1, true)
if not hyphenPos then break end
 
args[1] = a1:sub(1, hyphenPos-1)
args[2] = a1:sub(hyphenPos+1)
result = luacodeimpl(args)
if result ~= '' then
return result
end
return errors('country', args, code1)
end
return errors('country', args, code1)
end
 
--[[----------P . C O D E---------]]-- -- Calls P.Luacode but using Module:Arguments
if mw.title.getCurrentTitle().namespace ~= 0 then
return ''
else
return '', catnocountry..catnosubdivision
end
 
function p.code(frame)
end
 
return p.luacode(getArgs(frame)) or ""
--[[----------P . C O D E---------]]-- -- Calls P.luacode but using Module:Arguments
 
function p.code(frame)
	-- Normalise the frame through Module:Arguments, then hand the resulting
	-- table to p.luacode; the tail call forwards every value it returns.
	local args = getArgs(frame)
	return p.luacode(args)
end
 
--[[----------P . N U M E R I C---------]]-- -- Calls p.luacode but using Module:Arguments and setting it to output a numeric value
 
function p.numeric(frame)
	-- Collect the arguments via Module:Arguments and force the code type to
	-- "numeric" before delegating to p.luacode.
	local params = getArgs(frame)
	params.codetype = "numeric"

	-- Only the first value from p.luacode is kept; a nil/false result
	-- becomes an empty string.
	local result = p.luacode(params)
	if result then
		return result
	end
	return ""
end
 
--[[----------P . L U A N A M E---------]]-- -- Makes the ISO/common name of a country
-- Returns tuple (name,errorcat,errortext). name is empty string upon error because MW stops at first nil
function p.luaname(args)
 
local code1 = p.luacode(args)
local code2 = ''
if string.find(code1,"%-") then
code1, code2 = string.match(code1,"^([^%-]*)%-(.*)$")
end
if string.find(code1 == '',"^%u%u$") then
if code2=="" then --3166-1 alpha-2 code
return '','','<span class="error">No such country or subdivision</span>'
if data[code1] then
end
return (args.isoname or args.lang) and isoname(data,code1,args.lang)
 
or (data[code1]["displayname"] or data[code1]["name"])
local hyphenPos = code1:find("-",1,true)
else
if hyphenPos then --3166-2 code
return errors('country', args)
local code2 = code1:sub(hyphenPos+1)
end
code1 = code1:sub(1, hyphenPos-1)
else --3166-2 code
 
local sdata
local catnodata = '[[Category:Wikipedia page with obscure country]]'
if data[code1] then
 
sdata = mw.loadData("Module:ISO 3166/data/"..code1)
local sdata
else
if data[code1] then
return errors('country', args)
sdata = mw.loadData("Module:ISO 3166/data/"..code1)
else end
if sdata[code2] then
return '',catnodata
return (args.isoname or args.lang) and isoname(sdata,code2,args.lang)
end
if or (sdata[code2]["displayname"] thenor sdata[code2]["name"])
else
return (args.isoname or args.lang) and isoname(sdata,code2,args.lang)
return errors('country', args)
or (sdata[code2]["displayname"] or sdata[code2]["name"])
else end
return '',catnodata
end
 
else --3166-1 alpha-2 code
if data[code1] then
return (args.isoname or args.lang) and isoname(data,code1,args.lang)
or (data[code1]["displayname"] or data[code1]["name"])
else
return '[[Category:Wikipedia page with obscure country]]'
end
end
 
end
 
Line 282 ⟶ 264:
function p.name(frame)
	-- Delegate to p.luaname with arguments gathered by Module:Arguments.
	-- Only the first returned value is used; nil/false becomes "".
	local name = p.luaname(getArgs(frame))
	if not name then
		return ""
	end
	return name
end
 
--[[----------P . G E O C O O R D I N S E R T---------]]-- -- Wrapper for Module:Coordinates.coordinsert
function p.geocoordinsert(frame)
Line 294 ⟶ 276:
local args = frame.args
local subdivisionqueried = false
local catnocountry = (args.nocat and args.nocat == 'true') and ''
or '[[Category:Wikipedia page with obscure country]]'
local catnosubdivision = (args.nocat and args.nocat == 'true') and ''
or '[[Category:Wikipedia page with obscure subdivision]]' or ''
local tracking = ''
local targs = {}
targs[1] = args[1] or ''
for i, v in pairs(args) do
if i == 'country' and not stringmw.ustring.find(targs[1], 'region:', 1, true) then
local country = v
local k, region = 1, ''
-- look for a valid subdivision
while region == '' and k < 3 do
Line 317 ⟶ 295:
if region == '' then
region = p.luacode({country, nocat = 'true'})
if mw.title.getCurrentTitle().namespace ~= 0 then catnocountry,catnosubdivision = '','' end
if region == '' then
tracking = tracking .. catnocountryerrors('country', args)
elseif subdivisionqueried == true then
tracking = tracking .. catnosubdivisionerrors('subdivision', args)
end
end
Line 328 ⟶ 305:
targs[#targs + 1] = 'region:' .. region
end
elseif i == 'type' or i == 'scale' or i == 'dim'
or i == 'source' or i == 'globe' then
targs[#targs + 1] = i .. ':' .. v