Module:ISO 3166/sandbox: Difference between revisions

Content deleted Content added
No edit summary
Don't display script warnings if nocat is set to true
 
(42 intermediate revisions by 4 users not shown)
Line 1:
-- to enable us to replicate the current functioning of Country extract, we need to deal with:
-- 2 {{<name>}} DONE!
-- 3 [[<name>]] DONE!
-- 4 [[<name>|<junk>]] DONE!
-- 5 [[image:flag of <country>.[svg|gif|png|jpg]|\d+px]] DONE!
 
local p = {}
local datagetArgs = mw.loadDatarequire("Module:ISO 3166/data/NationalArguments").getArgs
local data = mw.loadData("Module:ISO 3166/data/National/sandbox")
local catnocountry = '[[Category:Wikipedia page with obscure country]]'
 
local catnosubdivision = '[[Category:Wikipedia page with obscure subdivision]]'
--[[----------SE TR R IO PR S----------]]-- -- Assign error categories and display warnings
local function errors(errType, args, code, alpha2)
-- Remove unnecessary text
if not (args.nocat and args.nocat == 'true') then
local function strip(text)
if code then
local accents = {
local warningText = code .. ' ("%s") is not a recognized ' .. errType .. ' in [[ISO 3166-%s]] ([[Module:ISO 3166]]).'
["À"]="A", ["Á"]="A", ["Â"]="A", ["Ã"]="A", ["Ä"]="A", ["Å"]="A",
if errType == 'country' then
["Ç"]="C",
mw.addWarning(string.format(warningText, args[1], '1'))
["È"]="E", ["É"]="E", ["Ê"]="E", ["Ë"]="E",
elseif errType == 'subdivision' and alpha2 then
["Ì"]="I", ["Í"]="I", ["Î"]="I", ["Ï"]="I",
mw.addWarning(string.format(warningText, args[2], '2:' .. alpha2))
["Ñ"]="N",
end
["Ò"]="O", ["Ó"]="O", ["Ô"]="O", ["Õ"]="O", ["Ö"]="O", ["Ø"]="O",
end
["Ù"]="U", ["Ú"]="U", ["Û"]="U", ["Ü"]="U",
return mw.title.getCurrentTitle().namespace == 0 and ('[[Category:Wikipedia articles with obscure ' .. errType .. 'subdivision]]') or ''
["Ý"]="Y"
}
local patterns = {
["%_"]=" ",
["%-"]=" "
}
local remove = {
"%d+PX",
"<.*>",
".+:",
"|.+",
"%(.-%)",
"%..*",
"^THE",
",.*$",
"%W",
"^[0]+",
"KINGDOMOF",
"OF",
"^STATE",
"STATE$",
"REPUBLIC$",
"NATION",
"COUNTRY",
"TERRITORY",
"FLAG",
"PROVINCE"
}
text = mw.ustring.upper(text)
if mw.ustring.match(text,"[À-Ý]") then
text = mw.ustring.gsub(text,"[À-Ý]",accents)
end
text = mw.text.unstrip(text)
for find, replace in pairs(patterns) do
text = mw.ustring.gsub(text,find,replace)
end
return ''
for _, find in ipairs(remove) do
text = mw.ustring.gsub(text,find,"")
end
return text
end
 
--[[----------F I N D C O D E----------]]--
--[[----------F I N D N A M E----------]]-- -- Finds the name in the database
-- Check to find the code or name
 
local function findcode(code,cdata,qry)
local sqryfunction = stripfindname(code,cdata,qry)
if local sqry == codep.strip(qry)
or if sqrycdata["name"] and sqry== p.strip(cdata["alpha3name"])
or cdata["numericisoname"] and sqry == mwp.ustring.gsubstrip(cdata["numericisoname"], '^[0]+','')
or sqry ==not strip(cdata["isonamenocode"] orand '')sqry==code
or sqry == strip(cdata["namealpha3"] or '')sqry==cdata["numeric"]
then
return true
end
for _,tname in pairs(cdata["isonames"] or {}) do
if sqry == p.strip(tname) then
return true
end
end
for _,tname in pairs(cdata["altnames"] or {}) do
if sqry == p.strip(tname) then
return true
end
Line 79 ⟶ 48:
return false
end
 
--[[----------N A M E O R C O D E---------]]--
--[[----------I S O N A M E----------]]-- -- Find the ISO name of a country/region
--Determine what name or alpha2 code to return
 
local function nameorcode(args,data,ldata,alpha2,dash2)
local function isoname(data,code,lang)
if args.type == "name" then
if args.isoname or args.langdata[code]["isonames"] then
local langname = args.lang or ldatadata[code]["defaultlangisodisplaynames"] orand data["defaultlang"code] or ["enisodisplaynames"][lang]
return ldataor data["isonames"code] and ldata["isonames"][lang] or ldata["isoname"] or ''
or data[code]["isodisplaynames"] and data[code]["isodisplaynames"][data[code]["defaultlang"] or data["defaultlang"]]
end
or data[code]["isonames"][data[code]["defaultlang"] or data["defaultlang"]]
return ldata["name"]
or data[code]["isodisplaynames"] and data[code]["isodisplaynames"]["en"]
elseif dash2 then
or data[code]["isonames"]["en"]
return alpha2.."-"..dash2
if name then return name end
for _,iname in pairs(data[code]["isonames"]) do return iname end
return data[code]["isodisplayname"] or data[code]["isoname"]
else
return data[code]["isodisplayname"] or data[code]["isoname"]
return alpha2
end
end
 
--[[----------G E T C O D E---------]]--
--[[----------S T R I P----------]]-- -- Removes junk from the input
-- Return the code or name
 
local function getcode(args)
function p.strip(text)
catnocountry = args.nocat == 'true' and '' or catnocountry
if not text then return nil end
catnosubdivision = args.nocat == 'true' and '' or catnosubdivision
if not args[1] then return catnocountry end
local accents = {["À"]="A",["Á"]="A",["Â"]="A",["Ã"]="A",
if string.find(args[1], "^%s*(%w%w?%w?)%-(%w%w?%w?)") then
["Ä"]="A",["Å"]="A",["Æ"]="AE",["Ç"]="C",["È"]="E",
args[1], args[2] = string.match(args[1],"^%s*(%w%w?%w?)%-(%w%w?%w?)")
["É"]="E",["Ê"]="E",["Ë"]="E",["Ì"]="I",["Í"]="I",
["Î"]="I",["Ï"]="I",["Ð"]="D",["Ñ"]="N",["Ò"]="O",
["Ó"]="O",["Ô"]="O",["Õ"]="O",["Ö"]="O",["Ø"]="O",
["Ù"]="U",["Ú"]="U",["Û"]="U",["Ü"]="U",["Ý"]="Y",
["Þ"]="TH",
["Ā"]="A",["Ă"]="A",["Ą"]="A",["Ć"]="C",["Č"]="C",
["Ĉ"]="C",["Ċ"]="C",["Ď"]="D",["Đ"]="D",["Ĕ"]="E",
["Ě"]="E",["Ė"]="E",["Ē"]="E",["Ę"]="E",["Ŋ"]="N",
["Ğ"]="G",["Ģ"]="G",["Ĝ"]="G",["Ġ"]="G",["Ĥ"]="H",
["Ħ"]="H",["Ĭ"]="I",["İ"]="I",["Ī"]="I",["Į"]="I",
["Ĩ"]="I",["IJ"]="IJ",["Ĵ"]="J",["Ķ"]="K",["Ĺ"]="L",
["Ľ"]="L",["Ļ"]="L",["Ŀ"]="L",["Ł"]="L",["Ń"]="N",
["Ň"]="N",["Ņ"]="N",["Ŏ"]="O",["Ő"]="O",["Ō"]="O",
["Œ"]="OE",["Ŕ"]="R",["Ř"]="R",["Ŗ"]="R",["Ś"]="S",
["Š"]="S",["Ş"]="S",["Ŝ"]="S",["Ť"]="T",["Ţ"]="T",
["Ŧ"]="T",["Ŭ"]="U",["Ű"]="U",["Ū"]="U",["Ų"]="U",
["Ů"]="U",["Ũ"]="U",["Ŵ"]="W",["Ŷ"]="Y",["Ÿ"]="Y",
["Ź"]="Z",["Ž"]="Z",["Ż"]="Z",
}
local remove = {"NATION OF","COUNTRY OF","TERRITORY OF", -- text to be removed list
"FLAG OF","FLAG","KINGDOM OF","STATE OF"," STATE ",
"PROVINCE OF","PROVINCE","TERRITORY","COUNTY","GOVERNORATE"
}
local patterns = {"(%a)%.(%a)%.",".+:","|.+","%(.-%)", -- patterns to follow (order may matter)
"%.%S.*","^THE ","%_","%-","%d%d?%d?PX"
}
local replacements = {["(%a)%.(%a)%."]="%1%2", -- Replacements for patterns above (order does not matter)
[".+:"]="",["|.+"]="",["%(.-%)"]="",
["%.%S.*"]="",["^THE "]="",["%_"]=" ",["%-"]=" ",
["%d%d?%d?PX"]="",
}
text = mw.text.decode(text) -- Decode HTML entities (passed from wikidata?)
text = mw.text.unstripNoWiki(text) -- Remove <nowiki> tags
text = mw.ustring.upper(text) -- Case insensitivity
text = mw.ustring.gsub(text,"[À-Ż]",accents) -- Deaccent
for _,pattern in ipairs(patterns) do -- Follow patterns
local value = replacements[pattern]
text = mw.ustring.gsub(text,pattern,value)
end
if args[1] then args[1] = strip(args[1]) end
for _,words in pairs(remove) do -- Remove unneeded words
if args[2] then args[2] = strip(args[2]) end
text = mw.ustring.gsub(text,words,"")
if args["codetype"] == "3" then args["codetype"] = "alpha3" end
end
for alpha2,cdata in pairs(data) do
if findcode(alpha2,cdata,args[1]) then
text = mw.ustring.gsub(text,"%W","") -- Remove non alpha-numeric
if args.type == "numeric" or args.type == "alpha3" then
return cdata[args.type]
return text
else
local scode = nil
end
if args[2] then
 
local scdata = mw.loadData("Module:ISO 3166/data/"..alpha2)
--[[----------P . C A L L S T R I P ---------]]-- -- Calls P.strip but using Module:Arguments
for scode,sdata in pairs(scdata) do
 
if findcode(scode,sdata,args[2]) then
function p.callstrip(frame)
return nameorcode(args,scdata,sdata,alpha2,scode)
local args = getArgs(frame)
return p.strip(args[1]) or ""
 
end
 
--[[----------P . L U A C O D E---------]]-- -- Makes the ISO code of a country
 
function p.luacode(args)
args[1], args[2] = args[1] or '', args[2] or ''
local code1 = p.strip(args[1])
local code2 = p.strip(args[2])
 
if args["codetype"]=="3" then args["codetype"]="alpha3" end
local eot = args.error or ""
if code1 == "" then
if not (args.nocat and args.nocat == 'true') then
mw.addWarning((args[1] ~= "" and ('Invalid parameter "' .. args[1] .. '"') or 'No parameter') ..
' for the country given ([[Module:ISO 3166]]).')
end
return errors('country', args), '<span style="font-size:100%" class="error">"No parameter for the country given"</span>'
end
if code2 == "" then --3166-1 code
for alpha2,cdata in pairs(data) do
if findname(alpha2,cdata,code1) then
if args["codetype"]=="numeric" or args["codetype"]=="alpha3" then
return cdata[args["codetype"]]
else
return alpha2
end
end
end
if string.find(args[1],"%-") then
args[1], args[2] = string.match(args[1],"^([^%-]*)%-(.*)$")
if args[2] then return p.luacode(args) end
end
return errors('country', args, code1)
else --3166-2 code
for alpha2,cdata in pairs(data) do
if findname(alpha2,cdata,code1) then
if mw.ustring.match(alpha2,"GB") then -- For England, Wales etc.
alpha2 = "GB"
end
local sdata = mw.loadData("Module:ISO 3166/data/"..alpha2)
local empty = true
for scode,scdata in pairs(sdata) do
if type(scdata)=="table" then
empty = false
if findname(scode,scdata,code2) then
return alpha2.."-"..scode
end
end
return catnosubdivision
else
return nameorcode(args,data,cdata,alpha2)
end
if string.find(args[2] or '',"%-") then
code1, args[2] = string.match(args[2] or '',"^([^%-]*)%-(.*)$")
args[1] = args[1].."-"..code1
return p.luacode(args)
end
return errors('subdivision', args, code2, alpha2)
end
end
if string.find(args[1],"%-") then
args[1] = string.match(args[1],"^([^%-]*)%-(.*)$")
return p.luacode(args)
end
return errors('country', args, code1)
end
return catnocountryerrors('country', args, code1)
end
 
--[[----------M A K E F U N C---------]]--
--[[----------P . C O D E---------]]-- -- Calls P.Luacode but using Module:Arguments
-- Make a function for the p table
 
local function makefunc(params)
function p.code(frame)
params = params or {}
 
return function(frame)
return p.luacode(getArgs(frame)) or ""
local args = {}
 
if type(frame.args) == 'table' then
end
args = frame.args
 
elseif type(frame) == 'table' then
--[[----------P . N U M E R I C---------]]-- -- Calls P.Luacode but using Module:Arguments and setting it to output a numeric value
args = frame
 
end
function p.numeric(frame)
if params.type then
 
args.type = params.type
local args = getArgs(frame)
end
if params.func == 'strip' then
args["codetype"]="numeric"
return strip(args[1] or args.text) or ''
else
return getcodep.luacode(args) or ''""
end
--[[----------P . L U A N A M E---------]]-- -- Makes the ISO/common name of a country
-- Look up the name of a country (ISO 3166-1) or subdivision (ISO 3166-2).
-- The arguments are first resolved to a code by p.luacode. A result of the
-- form "XX" is looked up in the national data table; a result of the form
-- "XX-YYY" is looked up in the data page "Module:ISO 3166/data/XX".
-- @param args  table of arguments, passed unchanged to p.luacode. When
--              args.isoname or args.lang is set, the ISO name from isoname()
--              is preferred over the "displayname"/"name" fields.
-- @return the name string; the result of errors('country', args) when the
--         resolved code is absent from the data; or nothing when p.luacode
--         did not yield a code whose first part is exactly two upper-case
--         letters.
function p.luaname(args)
	local code1 = p.luacode(args)

	-- p.luacode may return the raw value of a data field, which can be absent;
	-- string.find would raise a script error on anything but a string.
	if type(code1) ~= "string" then
		return
	end

	-- Split "XX-YYY" at the first hyphen into country and subdivision parts.
	local code2 = ''
	if string.find(code1,"%-") then
		code1, code2 = string.match(code1,"^([^%-]*)%-(.*)$")
	end

	-- Anything that is not a bare alpha-2 code (for instance a tracking
	-- category returned by p.luacode) yields no name.
	if not string.find(code1,"^%u%u$") then
		return
	end

	if not data[code1] then
		return errors('country', args)
	end

	local wantiso = args.isoname or args.lang

	if code2 == "" then													--3166-1 alpha-2 code
		return wantiso and isoname(data,code1,args.lang)
			or (data[code1]["displayname"] or data[code1]["name"])
	end

	--3166-2 code: subdivision data lives on a per-country data page
	local sdata = mw.loadData("Module:ISO 3166/data/"..code1)
	if sdata[code2] then
		return wantiso and isoname(sdata,code2,args.lang)
			or (sdata[code2]["displayname"] or sdata[code2]["name"])
	end
	return errors('country', args)
end
 
--[[----------P . N A M E---------]]-- -- Calls P.Luaname but using Module:Arguments
 
-- Template-facing entry point: collects the invocation arguments with getArgs
-- and returns the result of p.luaname, or an empty string when p.luaname
-- yields nothing.
function p.name(frame)
	local args = getArgs(frame)
	local found = p.luaname(args)
	if found then
		return found
	end
	return ""
end
--[[----------E X P O R T E D F U N C T I O N S---------]]--
--[[----------P . G E O C O O R D I N S E R T---------]]-- -- Wrapper for Module:Coordinates.coordinsert
-- Functions in the p table
p.strip = makefunc({func='strip'})
p.code = makefunc()
p['alpha2'] = makefunc()
p['alpha3'] = makefunc({type='alpha3'})
p.numeric = makefunc({type='numeric'})
p.name = makefunc({type='name'})
--[[----------P . G E O C O O R D I N S E R T---------]]--
-- Wrapper for Module:Coordinates.coordinsert
function p.geocoordinsert(frame)
-- {{#invoke:ISO 3166|geocoordinsert|{{coord|...}}
Line 166 ⟶ 276:
local args = frame.args
local subdivisionqueried = false
catnocountry = args.nocat == 'true' and '' or catnocountry
catnosubdivision = args.nocat == 'true' and '' or catnosubdivision
local tracking = ''
local targs = {}
Line 188 ⟶ 296:
region = p.luacode({country, nocat = 'true'})
if region == '' then
tracking = tracking .. catnocountryerrors('country', args)
elseif subdivisionqueried == true then
tracking = tracking .. catnosubdivisionerrors('subdivision', args)
end
end
Line 210 ⟶ 318:
return targs[1] .. tracking
end
 
return p