User:Ohconfucius/script/Sources.js: Difference between revisions

Browse history interactively

← Previous edit

Content deleted Content added

Revision as of 14:55, 17 June 2020 view source Ohconfucius (talk \| contribs) Autopatrolled, Extended confirmed users, Pending changes reviewers 332,930 edits align to test script ← Previous edit		Latest revision as of 18:45, 23 June 2025 view source Ohconfucius (talk \| contribs) Autopatrolled, Extended confirmed users, Pending changes reviewers 332,930 edits line spacing
(28 intermediate revisions by 4 users not shown)
Line 1: // <nowiki> // ******************************************************************************************* Line 6 ⟶ 7: // ******************************************************************************************* if (typeof importScriptURI !== 'undefined') { // not available on mobile. mw.loader.load('//meta.wikimedia.org/w/index.php?title=User:Pathoschild/Scripts/Regex_menu_framework.js&action=raw&ctype=text/javascript'); importScript("User:Ohconfucius/script/MOSNUM_utils.js"); //needed for "'Accessed' -> importScript("User:Ohconfucius/test/Sources_subscript1.js"); //convert ___domain names into article names ~~importScriptURI('//meta.wikimedia.org/w/index.php?title=User:Pathoschild/Scripts/Regex_menu_framework.js&action=raw&ctype=text/javascript');~~ importScript("User:Ohconfucius/~~script~~test/~~MOSNUM_utils~~Sources_subscript2.js"); //~~needed~~Correctly ~~for~~casing ~~"'Accessed'~~titles and apply or ->rem italicisation importScript("User:Ohconfucius/test/Sources_subscript3.js"); //link-fixing, dabbing etc // importScript("User:Ohconfucius/~~test~~script/~~Sources_subscript1~~foreigndates.js"); //~~convert ___domain names into~~link-fixing, ~~article~~dabbing ~~names~~etc } ~~importScript("User:Ohconfucius/test/Sources_subscript2.js"); //Correctly casing titles and apply or rem italicisation~~ ~~importScript("User:Ohconfucius/test/Sources_subscript3.js"); //link-fixing, dabbing etc~~ ~~importScript("User:Ohconfucius/script/foreigndates.js"); //link-fixing, dabbing etc~~ function Ohc_add_ref_tags() { Line 26 ⟶ 28: //test regex(/\s?(<ref>(?:[^<>]\\|\surl\s=\|\[?)https?:\/\/((?:\w+\.)\w+(?:\.(?:com?\|org\|net\|gov\|ac\|)(?:\.[a-z]{2}\|)))\/[^<>{}]+\\|publisher=)(?=}}<\/ref>)/gi, "$1$2"); //capture ___domain name to add to publisher regex(/(\\|\s?(?:publisher\|website)\s\=\s)w{3}\.(\w+\.(?:com?\|org\|net\|gov\|ac\|)(?:\.[a-z]{2}\|))(?=\s[\|}])/gi, '$1$2'); regex(/(\\|\s?publisher=)\s?\\|\s?via\s\=\s(\w+)(?=\s[\|}])/gi, '$1$2'); // regex(/\\|\s?via\s\=\s/gi, '\|work='); regex(/\s?[-–]\s?(?:The \|)(\w+\.(?:com?\|org\|net\|gov\|ac\|)(?:\.[a-z]{2}\|))\s?(\\|\s?publisher\s\=\s)\1(?=}})/gi, '$2$1'); regex(/\s?[-–]\s?([^\|]+)\s?(\\|\s?publisher\s\=\s)(The )\1(?=}})/gi, '$2$3$1'); regex(/\\|\s?first\s\=[^\|]\\|\s?last\s\=(?:Editor\|Group\|Staff\|Reporter\|Writer)\s(?=\\|)/gi, ''); regex(/({{Navbox deaths}})(\n)/gi, '==References==$2{{Reflist}}$2$1$2'); Line 36 ⟶ 38: } function Ohc_remove_urls() { var txt=document.editform.wpTextbox1; // warning-tagging template:Primary source inline regex(/(<ref[^<>]>[^<>]\\|[ ]url ?= ?https?:\/\/(?:(?:www\.\|mobile\.\|)(?:blogger\|blogspot\|facebook\|sites\.google\|instagram\|tiktok\|twitter\|wordpress\|x)\.com\|www\.formspring\.me)\/[^<>{]<\/ref>)(?:\{\{Primary source inline\}\}\|)/gi, '$1{{Primary source inline}}'); regex(/(<ref[^<>]>[^<>]\\|[ ]url ?= ?https?:\/\/(?:(?:www\.\|)(?:myspace\|findagrave)\.com)\/[^<>{]<\/ref>)(?:\{\{Primary source inline\}\}\|)/gi, '$1{{Primary source inline}}'); regex(/(<ref>\shttps?:\/\/(?:(?:www\.\|)(?:blogger\|blogspot\|facebook\|sites\.google\|findagrave\|instagram\|myspace\|tiktok\|twitter\|wordpress\|x)\.com)\/[^\s\]<]<\/ref>)(?:\{\{Primary source inline\}\}\|)/gi, '$1{{Primary source inline}}'); regex(/(<ref>\s\[https?:\/\/(?:(?:www\.\|)(?:blogger\|blogspot\|facebook\|sites\.google\|findagrave\|instagram\|myspace\|tiktok\|twitter\|wordpress\|x)\.com)\/[^\s\]][ ]+[\w\d][^\]]\]<\/ref>)(?:\{\{Primary source inline\}\}\|)/gi, '$1{{Primary source inline}}'); // removing http links within publisher/journal/work fields // // regex(/(\\|\s(?:author\|publisher\|work) = )(?:https?:~~\|ftp:)~~\/{2}\|)(?:\w{~~2,4~~3}\.\|)(\w+)(?:\.(?:com?\|net\|org\|gov\|\w{2})\|)(?:\.\w{2}\|))(?:\/[^\|}]\|)(?=\s[\]\|}])/gi, '$1$2'); //returns ___domain name regex(/(\\|\s~~?(?:author(?:link\d?\|)\|chapter\|journal\|magazine\|newspaper\|publisher\|~~title~~\|work\|via)~~\s\=)\s~~)(?:~~https?:\/{2}(?:w{3}\/.\|)~~www~~\w+\.com(?=\w)s?(?:[=\|{]\|\/?}\}))/gi, '$1$2 '); ~~//leave only ___domain name~~ regex(/(~~>{{cit[^}]+~~\\|\s~~?website~~title\s\=)\s~~)(?:~~https?:\/\/{2}[^\|~~)www~~\~~.(\w[^}<~~s]+)(?=\s?(?:[=\|{]\|\}\}<))/gi, '$1$2 '); ~~//leave only ___domain name~~ // regex(/(\\|\s~~?(?:chapter\|journal\|magazine\|newspaper\|publisher\|~~title~~\|work\|via)~~\s\=)\s)Archived copy(?=\[s?~~https~~(?:~~\/\/~~[~~^\s\~~=\|{]]\|\~~s([~~}\w][^\]]}))~~\]?~~/gi, '$1$2 '); ~~//leave~~rem as ~~only~~creating ~~linked~~CS1 ~~text~~errors regex(/\s?<!--ACTUAL ARTICLE TITLE BELONGS HERE!(?: original text:\|)[^>]-->/gi, ' '); //rem error introduced by earlier version of this script; entirely strip title field regex(/(\\|\s(?:author(?:link\d?\|)\|chapter\|journal\|magazine\|newspaper\|publisher\|title\|work\|via)\s\=\s)https?:\/{2}(?:w{3}\.\|)(?=\w)/gi, '$1'); //removes http:// and optionally www. regex(/(\\|\s(?:author(?:link\d?\|)\|chapter\|journal\|magazine\|newspaper\|publisher\|title\|work\|via)\s\=\s)(?:w{3}\.)(?=\w)/gi, '$1'); //removes www. regex(/(\\|\s(?:author(?:link\d?\|)\|chapter\|journal\|magazine\|newspaper\|publisher\|title\|work\|via)\s\=\s)(\w+(?:\.(?:com?\|net\|org\|gov\|\w{2}))(?:\.\w{2}\|))(?:\/[^\|}]\|)(?=\s[\]\|}])/gi, '$1$2'); //returns ___domain name regex(/(>{{cit[^}]+\\|\s?website\s\=\s)https?:\/{2}(?:w{3}\.\|)(?=\w)/gi, '$1'); //leave only ___domain name regex(/(>{{cit[^}]+\\|\s?website\s\=\s)(?:w{3}\.)(?=\w)/gi, '$1'); //leave only ___domain name // removing hyperlinks within publisher/journal/website/work fields ~~regex(/(\\|\s?author(?:link\d?\|)\s\=\s)\[https?:\/\/[^\s\]]\s([\w][^\]])\]/gi, '$1$2');~~ regex(/(\\|\s~~?author~~(?:~~link\d?~~chapter\|journal\|magazine\|newspaper\|publisher\|title\|work\|via)\s\=\s)~~(?:~~\[https?:\/\/~~\|)www~~[^\.s\]]\s([\w][^\|}\](?=[\|}])\]/gi, '$1$2'); //~~rem~~leave ~~outright~~only ~~(not~~linked ~~a WL)~~text regex(/({{cit[^}]+\\|\s?website\s\=\s)\[https?:\/\/[^\s\]]\s([\w][^\]])\]/gi, '$1$2'); //citation templates: rem url whilst leaving only linked text within \|website= regex(/(\\|\stitle\s=\s)(?:\w+(?:\.(?:com?\|net\|org\|gov\|\w{2}))(?:\.\w{2}\|))(?:\/[^\|}]+)(?:\/[^\|}]+)(?:\/[^\|}]+)(?:\/[^\|}]+)\/([^\|}]+)\/?(?=\s[\]\|}])/gi, '$1$2'); //returns terminal part of url regex(/(\\|\stitle\s=\s)(?:\w+(?:\.(?:com?\|net\|org\|gov\|\w{2}))(?:\.\w{2}\|))(?:\/[^\|}]+)(?:\/[^\|}]+)(?:\/[^\|}]+)\/([^\|}]+)\/?(?=\s[\]\|}])/gi, '$1$2'); //returns terminal part of url regex(/(\\|\stitle\s=\s)(?:\w+(?:\.(?:com?\|net\|org\|gov\|\w{2}))(?:\.\w{2}\|))(?:\/[^\|}]+)(?:\/[^\|}]+)\/([^\|}]+)\/?(?=\s[\]\|}])/gi, '$1$2'); //returns terminal part of url regex(/(\\|\stitle\s=\s)(?:\w+(?:\.(?:com?\|net\|org\|gov\|\w{2}))(?:\.\w{2}\|))(?:\/[^\|}]+)\/([^\|}]+)\/?(?=\s[\]\|}])/gi, '$1$2'); //returns terminal part of url regex(/(\\|\stitle\s=\s)(?:\w+(?:\.(?:com?\|net\|org\|gov\|\w{2}))(?:\.\w{2}\|))\/([^\|}]+)\/?(?=\s[\]\|}])/gi, '$1$2'); //returns terminal part of url regex(/(\\|\sauthor(?:link\d?\|)\s\=\s)\[https?:\/\/[^\s\]]\s([\w][^\]])\]/gi, '$1$2'); regex(/(\\|\sauthor(?:link\d?\|)\s\=\s)(?:https?:\/\/\|)www\.[\w][^\|}](?=[\|}])/gi, '$1'); //rem outright (not a WL) // removing references to other WP articles and 'external' WP links regex(/<ref[^<>]>[^<>]\\|[ ]url ?= ?https?:\/\/\w{2}\.wikipedia\.org\/w[^<>]<\/ref>/gi, '{{cn}}<!-- WP:RS needed; removed link to WP-->'); regex(/<ref>\shttps?:\/\/\w{2}\.wikipedia\.org\/wiki\/[^\s\]<]<\/ref>/gi, '{{cn}}<!-- WP:RS needed; removed link to WP-->'); regex(/<ref>\s\[https?:\/\/\w{2}\.wikipedia\.org\/w[^\s\]][ ]+[\w\d][^\]]\]<\/ref>/gi, '{{cn}}<!-- WP:RS needed; removed link to WP-->'); regex(/<ref(?: name=[^<>]\|)>[^<>]\\|\surl[ ]=[ ]https?:\/\/\w{2}\.wikipedia\.org\/w[^\s\\|\{\}<][^<>]<\/ref>/gi, '{{cn}}<!-- WP:RS needed; removed link to WP-->'); regex(/\[https?:\/\/\w{2}\.wikipedia\.org\/w[^\s\]][ ]+([\w][^\]])\]/gi, ' [[$1]]'); ~~regex(/(<ref[^<>]>[^<>]\\|[ ]url ?=https?:\/\/(?:(?:www\.\|)(?:facebook\|twitter)\.com)\/[^<>{])(<\/ref>)/gi, '$1{{Primary source inline}}$2');~~ ~~regex(/(<ref[^<>]>[^<>]\\|[ ]url ?=https?:\/\/(?:(?:www\.\|)(?:myspace\|findagrave)\.com)\/[^<>{])(<\/ref>)/gi, '$1{{Primary source inline}}$2');~~ ~~regex(/(<ref>\shttps?:\/\/(?:(?:www\.\|)(?:facebook\|myspace\|twitter\|mailonline\|findagrave)\.com\|dailymail\.co\.uk)\/[^\s\]<])(<\/ref>)/gi, '$1{{Primary source inline}}$2');~~ ~~regex(/(<ref>\s\[https?:\/\/(?:(?:www\.\|)(?:facebook\|myspace\|twitter\|mailonline\|findagrave)\.com\|dailymail\.co\.uk)\/[^\s\]][ ]+[\w\d][^\]]\])(<\/ref>)/gi, '$1{{Primary source inline}}$2');~~ //deprecated sources regex(/<ref[^<>]>[^<>]\\|[ ]url ?= ?https?:\/\/(?:(?:\w+\.\|)((?:the\|)epochtimes\|ntdtv)\.com)\/[^<>{]<\/ref>/gi, '<!--rem deprecated source \($1\)-->'); regex(/<ref[^<>]>[^<>]\\|[ ]url ?= ?https?:\/\/(?:(?:\w+\.\|)(thesun\|dailymail)\.co\.uk)\/[^<>{]<\/ref>/gi, '<!--rem deprecated source \($1\)-->'); ~~regex(/(\\|\s?url\s\=\s\|\[)(https?:[^\|{}#\s]+)#[A-Za-z0-9\.]{12,13}(?=[\s\[\]\|{}<>])/gi, '$1$2'); //rem link tracking~~ ~~regex(/(\\|\s?url\s\=\s)(https?:[^\|{}#\s]+\.html?)\?[^\|}]{1,5}(?=[\s\[\]\|{}<>])/gi, '$1$2'); //rem link tracking~~ ~~regex(/(\\|\s?url\s\=\s\|\[)(https?:\/\/books\.google\.[^\/]+\/books\?id=\w{12}&pg=PA\d{1,3})&dq[^\s\|}]+(?=\s?[\|}])/gi, '$1$2'); //rem browser optimisation~~ regex(/(\\|\surl\s\=\s\|\[)(https?:[^\|{}#\s]+)(?:#[A-Za-z0-9\.]{12,13}\|\?CMP=fb_gu)(?=[\s\[\]\|{}<>])/gi, '$1$2'); //rem link tracking regex(/(\\|\surl\s\=\s)(https?:[^\|{}#\s]+\.html?)\?[^\|}]{1,5}(?=[\s\[\]\|{}<>])/gi, '$1$2'); //rem link tracking regex(/(\\|\surl\s\=\s\|\[)(https?:\/\/books\.google\.[^\/]+\/books\?id=\w{12}&pg=PA\d{1,3})&dq[^\s\|}]+(?=\s?[\|}])/gi, '$1$2'); //rem browser optimisation } Line 78 ⟶ 95: // removing artefacts within fields regex(/(\\|\s?author\s\=\s)(?:by \|)(?:[^\|]+staff\|(?:staff \|)(?:reporter\|writer)s?\|)[\s\n](?=[\|}])/gi, ''); regex(/(\\|\s?author\s\=\s)([A-Z][a-z](?: [A-Z][a-z])) (?:(?:wire \|)staff\|(?:staff \|)(?:reporter\|writer)s?)[\s\n](?=[\|}])/gi, '$1$2'); regex(/\\|[ ]last=(Reporter\|staff)[ ]\\|[ ]first=[^\|\{\}](?=[\\|{}])/gi, ''); regex(/\\|[ ](?:first\|last)=(?:staff \|)(?:reporter\|writer)[ ](?=[\\|{}])/gi, ''); regex(/\\|[ ]first= ?staff ?\\|[ ]last=(?:reporter\|writer)[ ](?=[\\|{}])/gi, ''); regex(/\\|[ ]first= ?The ?\\|[ ]last=[^\\|{}](?=[\\|{}])/gi, ''); regex(/(\\|\s?access-?date\s\=\s)(?:accessed\|retrieved)(?: by\| on\|):?[ ](\d)/gi, '$1$2'); regex(/(\\|\s?access-?date\s\=\s\d{4}\s?)(?=[\|}])/gi, ''); regex(/(\\|\s?work\s\=\s)(?:article\|interview\|review) ?(?=[\|}])/gi, '$1'); regex(/(\\|\s?volume\s\=\s)vol(?:ume\|\.?)[ ](\d)/gi, '$1$2'); regex(/(\\|\s?pages?\s\=\s)(?:pages?\|p[gp]?\.?)[ ](\d)/gi, '$1$2'); regex(/ [-–] (?:每日明報 daily news\|東方日報)/gi, ''); regex(/(\.\.\. \|)\{\{!\}\} 立場(報道\|新聞)/gi, ''); regex(/(\\|\s?title\s\=\s)Login ?(?=[\|}])/gi, '$1'); //creating deliberate error (blank title) per Trappist ~~regex(/(\\|\s?)(?:publisher\|website\|work)=You ?tube(?:\.com\|)(?=\s[\|}])/gi, '$1via=YouTube');~~ regex(/(\\|\s?)(?:publisher\|website\|work)=(~~Amazon)(?:~~Newspapers\.com\|Twitter\|Vimeo\|Youtube)(?:\.~~\w{2}~~com\|)(?=\s[\|}])/gi, '$1via=$2'); regex(/(\\|\s?)(?:publisher\|website\|work)=(~~Vimeo~~Amazon)(?:\.com\|)(?:\.\w{2}\|)(?=\s[\|}])/gi, '$1via=$2'); regex(/(\\|\s?)(?:publisher\|website\|work)=(~~Newspapers~~\~~.com~~[\[Twitter\\|𝕏\]\])(?: \(Formerly (?:Twitter\|\[\[Twitter\]\]\)) \|)(?=\s[\|}])/gi, '$1via=$2'); regex(/(\\|\s?publisher=)\\|\s?via\s\=\s(\w+)(?=\s[\|}])/gi, '$1$2'); regex(/(?:-[ ]Google Books[ ](?:\\|[^}]\|)\|)\\|\s?publisher\s\=\s(Google Books)(?=[\s\.][\|}])/g, '\|via=$1'); ~~// regex(/(\\|\s?)(?:publisher\|website\|work)=books\.google(?:\.com?\|.co\.uk\|)(?=\s[\|}])/gi, '\|via=Google Books');~~ ~~// regex(/\\|\s?(?:publisher\|website\|work)=(British Newspaper Archive\|Google Books\|Project Gutenberg\|Proquest\|Scribd\|web(?:\.archive\\|citation)(?:\.org\|))(?=\s[\|}])/gi, '\|via=$1');~~ //Remove COinS corrupting templates from CS1 citations regex(/(\\|\s?(?:authors?\|first\d?\|last\d?\|publisher\|work)\s\=\s(?:[^{}\|]\|)){{(?:Sm\|Aut\|SC\|Small[- ]caps\|Sm?caps)\\|([^{}\|])}}(?=(?:[^{}\|]\|)[\|}])/gi, '$1'); regex(/(\\|\s?)\w+\=(url\s\=\shttps?:\/\/)(?=[\|}])/gi, '$1$2'); //common cs1 error regex(/(\\|\s?url\s\=)(www\.)(?=[\|}])/gi, '$1http//$2'); //common cs1 error regex(/(\\|\sdate\s=\s)(?:not? \|non-\|un)date[ds]?\s(?=[\|}])/gi, '$1n.d.'); //common cs1 error regex(/(\\|\s?dead-?url=no?)(?=\s[\|}])/gi, '\|url-status=dead'); //common cs1 error (deprecated parameter) ~~regex(/\{\{wikinews ?(\|2\|cat(?:egory)?\|has\|par2?\|portal\|table\|-inline)(\\|[^\}]+\|)\}\}\s/gi, '');~~ regex(/(\[ ]\|)\[\[n:[^\]\\|]\]\][\r\n]/gi, ''); ~~// regex(/\[ ]\{\{(?:Facebook\|Find a Grave\|Myspace)\\|([^}])\}\}[\n\r\s]/gi, ''); //disabled 19 Sept 2015 per Batty's request~~ //citation template fixes // regex(/(\\|\s?)published\s?=/gi, '$1publisher='); //disabled 12/5/21 – false positive in book infobox // rem copyright assertion regex(/(\\|\s?publisher\s\=\s)(?:\[\[copyright(?:\\|©\|)\]\])\s?/gi, '$1'); regex(/(\\|\s?publisher\s\=\s)(?:©\|copyright)\s?/gi, '$1'); regex(/(\\|\s?title\s\=\s[^\|}]+?)[-‒–—―]\s+([^\|}]+?)(\\|\s?(?:publisher\|work)\s\=\s\2)/gi, '$1$3'); regex(/(\\|\s?title\s\=\s([^\|}]+?))[-‒–—―]\s+([^\|}]+?\\|\s?(?:publisher\|work)\s\=\s\2)/gi, '$1$3'); // misused 'date' parameter Line 125 ⟶ 138: // rem toggles and redundant quote marks regex(/(\\|\s?(?:agency\|author\|newspaper\|work\|journal\|publisher\|title)\s\=\s)\'\'([^\|}]+)\'\'(?=\s[\}\\|])/gi, '$1$2'); //without link regex(/(\\|\s?(?:agency\|author\|newspaper\|work\|journal\|publisher\|title)\s\=\s)\'\'(\[\[(?:[^\\|]+\\|\|)[^\\|\]]+\]\])\'\'(?=\s[\}\\|])/gi, '$1$2'); //with link regex(/(\\|\s?title\s\=\s)\''([^\\|\{\}]+)\''/gi, '$1$2'); //rem ' in titles regex(/(\\|\s?publisher\s\=\s)\(([^\\|\{\}]+)\)/gi, '$1$2'); //rem parenthetical publishers regex(/(\\|\spublisher\s\=\s)\"([^\\|\{\}]+)\"/gi, '$1$2'); //rem quote marks around publishers // reordering 'work' and 'publisher' (first run - see second run in cleanup function) regex(/(\\|\s?publisher\s\=\s(?:\[\[[^<{}\]]\]\]\|[^{}\\|\}<>]))(\s?\\|[^}<>]\|)(\\|\s?(?: journal\|newspaper\|magazine\|periodical\|website\|work)\s\=\s(?:\[\[[^<{}\]]\]\]\|[^{}\\|\}<>]))(?=[\s\.][\|}])/g, '$3$1$2'); regex(/(\\|\s?website\s\=\s(?:\[\[[^<{}\]]\]\]\|[^{}\\|\}<>]))(\s?\\|[^}<>]\|)(\\|\s?(?: journal\|newspaper\|magazine\|periodical\|work)\s\=\s(?:\[\[[^<{}\]]\]\]\|[^{}\\|\}<>]))(?=[\s\.][\|}])/g, '$3$1$2'); /// removing identical/similar entries in 'work' and 'publisher', and in 'work' and 'website' (different default vs [post] cleanup rules) Line 141 ⟶ 155: regex(/\\|\s?publisher\s\=\s([^=\|}\[<>])(\\|[^}<>]\|)\\|\s?publisher\s\=\s(?:\1\|\[\[\1\]\])\.?(?=\s[\|}])/g, '\|publisher=$1$2'); //unlinked work regex(/\\|\s?publisher\s\=\s\[\[([^<\|\]])\]\](\\|[^}<>]\|)\\|\s?publisher\s\=\s(?:\1\|\[\[\1\]\])\.?(?=\s[\|}])/g, '\|publisher=$1$2'); //unpiped work regex(/\\|\s?publisher\s\=\s(\[\[(?:[^<\|\]])\\|([^}<>])\]\])(\\|[^}<>]\|)\\|\s?publisher\s\=\s(\1\|\2)\.?(?=\s[\|}])/g, '\|publisher=$1$32'); //piped work // remove redundant parentheses and templates from dm and md dates (equivalents also exists in Mosnum script) Line 147 ⟶ 161: // rem corporate designation regex(/(\\|\s?(?:author\|publisher\|work)\s\=\s[^\[\|}]{1,40}),? (?:Inc\|LL[CP]\|Ltd\|Limited\|PLC\|SA\|(?:Snd\. \|)Berhad)\.?(?=[ ]\\|\})/gi, '$1'); // correcting yahoo! corporate designation regex(/(\\|\s?(?:publisher\|work)\s\=\sYahoo)(?: \|)(Finance\|Green\|Kids\|Music\|News\|)(?=[ ]\\|\})/gi, '$1! $2'); // rem unnecessary quote marks regex(/(\\|\s?title\s\=\s)["“]([^\\|]+)["”](?=\s?[\|}])/gi, '$1$2'); regex(/(\\|\s?title\s\=\s)['‘]([^\\|'’]+)['’](?=\s?[\|}])/gi, '$1$2'); // repl double 'in-title' quote marks with single quotes regex(/(\\|\s?title\s\=\s[\w ]* )["“]((?:\w[\w]* )+(?:\w[\w]))["”]([^\\|]+\|)(?=\s?[\|}])/gi, '$1\'$2\'$3'); // adjust for possibly incorrectly input title regex(/(\\|\s?title\s\=\s)([^\\|\}<>])(\s?\\|[^}<>]\|)\\|\s?(publisher\|work)\s\=\s(?:\1\|\[\[\1\]\])(?=\s[\|}])/g, '$1 \|$4=$2$3'); //creating deliberate error (blank title) per Trappist ~~regex(/(\\|\s?title\s\=\s)(\w+\.com)(?=\s?[=\|{}])/gi, '$1<!--ACTUAL ARTICLE TITLE BELONGS HERE!--> \|publisher=$2');~~ // rem misplaced punctuation Line 167 ⟶ 180: // removing blank or redundant parameters regex(/(?:\\|[ ](?:agency\|arxiv\|asin\|at\|author(-?link\|-mask\|-name-separator\|-separator\|\d\|\d-link\|link\d?\|)\|bibcode\|chapter\|chapter-url\|coauthors?\|contribution(?:-url\|)\|date\|deadurl\|display-authors\|doi\|doi-inactive\|doibroken\|edition\|(?:editor\|translator)(?:-first\|-last\|-link\|\d\|\d-first\|\d-last\|\d-link)\|(?:first\|last)\d?\|format\|id\|is[bs]n\|issue\|jfm\|journal\|jstor\|language\|lay(?:date\|source\|summary)\|lccn\|___location\|magazine\|day\|month\|mr\|newspaper\|nopp\|oclc\|ol\|origyear\|osti\|others\|pages?\|periodical\|place\|pm[cd]\|pmid\|postscript\|publisher\|quote\|ref\|rfc\|separator\|series\|ssrn\|trans_title\|type\|url\|volume\|via\|work\|year\|zbl)[ ]=[\s])(?=[}\|])/gi, ''); // regex(/(?:\\|[ ](began\|ended)[ ]=[^}\|])(?=[}\|])/gi, ''); //disabled 18/06/20: false positive removal of associated (Start date) templates regex(/(\\|\s?work\s?\=\s?)\[\[iTunes\]\] Archive\s/gi, '\|publisher=[[iTunes ~~Store~~]]'); //rem underlining within certain fields regex(/(\\|\s?(?:journal\|newspaper\|periodical\|publisher\|work)\s\=\s)<u>([^\|}]+)<\/u>/gi, '$1$2'); //rem redundant top-level domains (.com, .net, .org), strip "www" regex(/(\\|\s?(?:journal\|newspaper\|periodical\|publisher\|work)\s\=\s)(\[\[[^\[\]\}]\]\])\.(?:biz\|com\|net\|org\|co\.uk\|(?:com\.\|)[a-z]{2})(?=\s[\|}])/gi, '$1$2'); //rem duplicated publishers in separate fields (pre) regex(/(?:[‒–—―]+\|\|)\s(?:The \|)([^\\|\}&]{3,})(?:\.com\|)\s(\\|\s?(?:agency\|publisher\|work)\s\=\s)\1(?=\s[\|}])/gi, '$2$1'); regex(/(?:[‒–—―]+\|\|)\s([^\\|\}&]{3,})(?:\.com\|)\s(\\|\s?(?:agency\|publisher\|work)\s\=\s)(The \|)\1(?=\s[\|}])/gi, '$2$3$1'); //'work' and its alias (pre) Line 191 ⟶ 204: // removing english language parameters regex(/[ ]?\{\{en[- ]icon\}\}/gi, ""); // regex(/\\|[ ]?language[ ]?=[ ]?en(?:-\w{2}\|glish\|)(?=\s[}\|])/gi, ""); // regex(/(\\|[ ]?language[ ]?=[ ]?)\{\{(\w{2})(?:[- ](?:icon\|UK\|GB\|US)\|)\}\}/gi, ""); // removing icon template from within "\|language=" parameter // eliminating time of day Line 240 ⟶ 253: //linked publishing houses // removing publishers less well-known than their titles regex(/(\\|\s?publisher\s?\=MTV\\|\s?)publisher\s\=\s(?:MTV Networks(?: \(Viacom\)\|)\|Viacom)/gi, '$1='); regex(/(?:\\|publisher=Turner Sports Interactive, Inc)\.? ?\\|publisher=(NBA)(?= ?\\|)/gi, '$1'); Line 250 ⟶ 263: regex(/(?:\\|\s?(newspaper\|work\|publisher)\s\=\s(ACP Magazines\|The Herald and Weekly Times\|John Fairfax (and Sons Ltd\.?\|Holdings)\|Fairfax(?: Media(?: Limited\|)\| Digital\| newspapers\|)))(?=[\s\.][\|}])/gi, ''); regex(/(?:\\|\s?(newspaper\|work\|publisher)\s\=\s\[\[(ACP Magazines\|The Herald and Weekly Times\|John Fairfax (and Sons Ltd\.?\|Holdings)\|Fairfax(?: Media(?: Limited\|)\| Digital\| newspapers))\]\])(?=[\s\.][\|}])/gi, ''); regex(/\\| ?publisher ?= ?(?:Fandango Media\|\[\[Fandango Media\]\]) ?/gi, ''); regex(/(?:\\|\s?publisher\s\=\s(Alexander Lebedev\|American Media\|Associated Newspapers\|Bauer (?:Consumer Media\|Media Group)\|Cond[eé] Nast(?: Publications\|)\|Daily Mail and General Trust\|Devin Laz[ae]rine\|Dow Jones & Company\|Future plc\|(Guardian\|Telegraph) Media Group\|(?:Guardian\|Independent) News (?:and\|&) Media (?:Limited\|Ltd\.\|)\|Hachette Filipacchi Médias\|Hearst (?:Corporation\|Magazines(?: UK\|))\|Herald Media\|IGN Entertainment\|Imdb Inc\.?\|InterMedia Partners\|IDG\|IPC Media\|Lee Enterprises\|Media ?News Group\|Mortimer Zuckerman\|MTV Networks\|News (?:Corporation\|International\|Limited)\|Prometheus Global Media\|Reed Business Information\|Rovi Corporation\|Trinity Mirror\|Times Newspapers\|Nielsen (?: Media Research\|Business Media)\|Viacom\|Time(?: Warner ?\|)))(,? Inc\| LL[CP]\| Ltd\|Limited\|)[\s\.](?=[\|}])/gi, ''); regex(/(?:\\|\s?publisher\s\=\s(Alexander Lebedev\|American Media\|Associated Newspapers\|Bauer (?:Consumer Media\|Media Group)\|Cond[eé] Nast(?: Publications\|)\|Daily Mail and General Trust\|Devin Laz[ae]rine\|Dow Jones & Company\|Future plc\|(Guardian\|Telegraph) Media Group\|(?:Guardian\|Independent) News (?:and\|&) Media(?: Limited\| Ltd\.\|)\|Hachette Filipacchi Médias\|Hearst (?:Corporation\|Magazines(?: UK\|))\|Herald Media\|IGN Entertainment\|Imdb Inc\.?\|InterMedia Partners\|IDG\|IPC Media\|Lee Enterprises\|Media ?News Group\|Mediacorp\|Mortimer Zuckerman\|MTV Networks\|News (?:Corporation\|International\|Limited)\|Postmedia Network Inc\.?\|Prometheus Global Media\|Reed Business Information\|Rovi Corporation\|Trinity Mirror\|Times Newspapers\|Nielsen (?: Media Research\|Business Media)\|Viacom\|Time(?: Warner ?\|)))(,? Inc\| LL[CP]\| Ltd\|Limited\|)[\s\.](?=[\|}])/gi, ''); regex(/\\|\s?publisher\s\=\s(?:The \|)(?:Deseret News Publishing\|Dispatch Printing\|E\. W\. Scripps\|Evening Post Publishing\|Forbes(?: Publishing\|, Inc\.)\|Gannett?\|Independent News & Media\|Irish Times Trust\|(?:Jann Wenner\|Wenner Media)\|Johnson Publishing\|Journal Communications\|Mac Publishing\|Media24\|McClatchy\|Nash holdings LLC\|New York Times\|Seattle Times\|Star Tribune\|Thomp?son(?:[- ]?Reuters)?(?: Corporation\| Plc.?\|)\|Torstar\|Time Inc\.\|Times (?:Group\|Publishing)\|Tribune\|Vox Media\|Washington Post\|World Publishing\|Ziff Davis Media)(?: Co(?:mpany\|\.)?)?(?=[\s\.][\|}])/g, ''); regex(/\\|\s?publisher\s\=\s(?:The \|)(?:Deseret News Publishing\|Dispatch Printing\|E\. W\. Scripps\|Evening Post Publishing\|Forbes(?: Publishing\|, Inc\.)\|Gannett?\|Independent News & Media\|Irish Times Trust\|(?:Jann Wenner\|Wenner Media)\|Johnson Publishing\|Journal Communications\|Mac Publishing\|Media24\|McClatchy\|Nash holdings LLC\|New York Times\|Seattle Times\|Star Tribune\|Thomp?son(?:[- ]?Reuters)?(?: Corporation\| Plc.?\|)\|Singapore Press Holdings\|Torstar\|Time Inc\.\|Times (?:Group\|Publishing)\|Tribune\|Vox Media\|Washington Post\|World Publishing\|Ziff Davis Media)(?: Co(?:mpany\|\.)?)?(?=[\s\.][\|}])/g, ''); ~~regex(/\\|\s?publisher\s\=\s(?:Cox\|Halifax\|North Jersey\|Sun-Times\|Tampa\|Herald\|Stephens\|WEHCO\|\w+) Media(?: Group(?:,? Inc\.)?\| Berhad)?(?=[\s\.][\|}])/g, '');~~ regex(/\\|\s?publisher\s\=\s(?:Cox\|Halifax\|North Jersey\|Sun-Times\|Tampa\|Herald\|Stephens\|WEHCO) Media(?: Group(?:,? Inc\.)?\| Berhad)?(?=[\s\.][\|}])/g, ''); // regex(/\\|\s?publisher\s\=\s(?:\w+ )+(?:Media\|Publishing\|Publications)(?: Group(?:,? Inc\.)?\| Berhad)(?=[\s\.][\|}])/g, ''); //rem "Communications" - false positive for "Ministry of Economic Affairs and Communications" reported 28 May 2014 //duplicate above with links //("Corporation" excluded - false positive with Australian Broadcasting Corporation) regex(/(?:\\|\s?publisher\s\=\s\[\[(Alexander Lebedev\|American Media\|Associated Newspapers\|Bauer (?:Consumer Media\|Media Group)\|Cond[eé] Nast(?: Publications\|)\|Daily Mail and General Trust\|Devin Laz[ae]rine\|Dow Jones & Company\|Future plc\|(Guardian\|Telegraph) Media Group\|(?:Guardian\|Independent) News (?:and\|&) Media (?: Limited\| Ltd\.\|)\|Hachette Filipacchi Médias\|Hearst (?:Corporation\|Magazines(?: UK\|))\|Herald Media\|IGN Entertainment\|Imdb Inc\.?\|InterMedia Partners\|IDG\|IPC Media\|Lee Enterprises\|Media ?News Group\|Mediacorp\|Mortimer Zuckerman\|MTV Networks\|News (?:Corporation\|International\|Limited)\|Postmedia Network Inc\.?\|Prometheus Global Media\|Reed Business Information\|Rovi Corporation\|Trinity Mirror\|Times Newspapers\|Nielsen (?: Media Research\|Business Media)\|Viacom\|Time(?: Warner ?\|)))(,? Inc\| LL[CP]\| Ltd\|Limited\|)(?:\\|[^\]\}]\|)\]\][\s\.](?=[\|}])/gi, ''); regex(/\\|\s?publisher\s\=\s\[\[(?:The \|)(?:Deseret News Publishing\|Dispatch Printing\|E\. W\. Scripps\|Evening Post Publishing\|Forbes(?: Publishing\|, Inc\.)\|Gannett?\|Independent News & Media\|Irish Times Trust\|(?:Jann Wenner\|Wenner Media)\|Johnson Publishing\|Journal Communications\|Mac Publishing\|McClatchy\|Nash holdings LLC\|New York Times\|Seattle Times\|Star Tribune\|Thomp?son(?:[- ]?Reuters)?(?: Corporation\| Plc.?\|)\|Singapore Press Holdings\|Torstar\|Time Inc\.\|Times Publishing\|Tribune\|Vox Media\|Washington Post\|World Publishing\|Ziff Davis Media)(?: Co(?:mpany\|\.)?)?\]\](?=[\s\.][\|}])/g, ''); regex(/\\|\s?publisher\s\=\s\[\[(?:Cox\|Halifax\|North Jersey\|Sun-Times\|Tampa\|Herald\|Stephens\|WEHCO~~\|\w+~~) Media(?: Group(?:,? Inc\.)?\| Berhad)?\]\](?=[\s\.][\|}])/g, ''); // regex(/\\|\s?publisher\s\=\s\[\[(?:\w+ )+(?:Media\|Publishing\|Publications)(?: Group(?:,? Inc\.)?\| Berhad)\]\](?=[\s\.][\|}])/g, ''); regex(/\\| ?publisher ?= ?Star Publications \(Malaysia\)\|\[\[Star Publications \(Malaysia\)\]\] ?/gi, ''); regex(/\\| ?publisher ?= ?(?:New Straits Times Press\|\[\[New Straits Times Press\]\]) ?/gi, ''); regex(/(\\|\s?publisher\s?\=\s?MTV\s?)\\|\s\=\s\(\w+\)/gi, '$1='); //palliative - correction for unsuppoeted parameters } Line 269 ⟶ 283: var txt=document.editform.wpTextbox1; // The following regexes for dab-links are in sets of four. If changing, please ensure all sets are changed )note (unique regex line for Empire film magazineadded 20/6/2021) regex(/(=[ ](?:The ?\|)[A-Z]\w(?: [A-Z]\w\|)) \((South Africa)(?:n newspaper\|)\)([ ][\|}])/g, '$1\|___location=$2$3'); regex(/(''(?:The ?\|)[A-Z]\w(?: [A-Z]\w\|)) \((South Africa)(?:n newspaper\|)\)(''[\.,;])/g, '$1$3$2'); Line 279 ⟶ 293: regex(/(\\|)(The Advertiser)(?: \((Adelaide)\))(\]\])/g, '$1$2$4\|___location=$3'); regex(/(\[\[)(The Advertiser)( \((Adelaide)\))(\]\])/g, '$1$2$3\|$2$5\|___location=$4'); regex(/(=[ ])(Apollo\|Billboard\|Brick\|Campaign\|Clash\|Coda\|Ebony\|Esquire\|Essence\|Fanfare\|Fast Company\|Fortune\|Glamour\|Hello!\|Life\|Limelight\|Maxim\|Mojo\|Mother Jones\|New York\|Nuts\|Paste\|People\|Poetry\|Q\|Reason\|Shape\|Slate\|Spin\|Time(?: Out\|)\|Variety\|Wired) \((?:magazine)\)(?=\s[\|}])/g, '$1$2'); //non-standard code regex(/('')(Apollo\|Billboard\|Brick\|Campaign\|Clash\|Coda\|Ebony\|Esquire\|Essence\|Fanfare\|Fast Company\|Fortune\|Glamour\|Hello!\|Life\|Limelight\|Maxim\|Mojo\|Mother Jones\|New York\|Nuts\|Paste\|People\|Poetry\|Q\|Reason\|Shape\|Slate\|Spin\|Time(?: Out\|)\|Variety\|Wired) \(magazine\)(?='')/g, '$1$2'); //non-standard code regex(/(''\[\[(Apollo\|Billboard\|Brick\|Campaign\|Clash\|Coda\|Ebony\|Esquire\|Essence\|Fanfare\|Fast Company\|Fortune\|Glamour\|Hello!\|Life\|Limelight\|Maxim\|Mojo\|Mother Jones\|New York\|Nuts\|Paste\|People\|Poetry\|Q\|Reason\|Shape\|Slate\|Spin\|Time(?: Out\|)\|Variety\|Wired) \(magazine\))(?=\]\]'')/g, '$1\|$2'); //non-standard code - tweaked to insert title per pipe trick regex(/(\\|)(Apollo\|Billboard\|Brick\|Campaign\|Clash\|Coda\|Ebony\|Esquire\|Essence\|Fanfare\|Fast Company\|Fortune\|Glamour\|Hello!\|Life\|Limelight\|Maxim\|Mojo\|Mother Jones\|New York\|Nuts\|Paste\|People\|Poetry\|Q\|Reason\|Shape\|Slate\|Spin\|Time(?: Out\|)\|Variety\|Wired)(?: \(magazine\))(?=\]\])/g, '$1$2'); regex(/(=[ ])(Empire) \((?:film magazine)\)(?=\s[\|}])/g, '$1$2'); //non-standard code regex(/('')(Empire) \(film magazine\)(?='')/g, '$1$2'); //non-standard code regex(/(''\[\[(Empire) \(film magazine\))(?=\]\]'')/g, '$1$2'); //non-standard code regex(/(=[ ]\[\[(Empire) \(film magazine\))(?=\]\][ ]\\|)/g, '$1\|$2'); //non-standard code (unique regex added 20/6/2021) regex(/(\\|)(Empire)(?: \(film magazine\))(?=\]\])/g, '$1$2'); //Journals regex(/(=[ ])(Science\|Nature) \((?:journal)\)(?=\s[\|}])/g, '$1$2'); //non-standard code regex(/('')(Science\|Nature) \(journal\)(?='')/g, '$1$2'); //non-standard code regex(/(''\[\[(Science\|Nature) \(journal\))(?=\]\]'')/g, '$1\|$2'); //non-standard code regex(/(\\|)(Science\|Nature)(?: \(journal\))(?=\]\])/g, '$1$2'); regex(/(=[ ])(Quartz) \((?:publication)\)(?=\s[\|}])/g, '$1$2'); //non-standard code regex(/('')(Quartz) \(publication\)(?='')/g, '$1$2'); //non-standard code regex(/(''\[\[(Quartz) \(publication\))(?=\]\]'')/g, '$1\|$2'); //non-standard code regex(/(\\|)(Quartz)(?: \(publication\))(?=\]\])/g, '$1$2'); regex(/(=[ ])(Salon) \((?:website)\)(?=\s[\|}])/g, '$1$2'); //non-standard code regex(/('')(Salon) \(website\)(?='')/g, '$1$2'); //non-standard code regex(/(''\[\[(Salon) \(website\))(?=\]\]'')/g, '$1\|$2'); //non-standard code regex(/(\\|)(Salon)(?: \(website\))(?=\]\])/g, '$1$2'); regex(/(=[ ])(Stuff) \((?:company)\)(?=\s[\|}])/g, '$1$2'); //non-standard code regex(/('')(Stuff) \(company\)(?='')/g, '$1$2'); //non-standard code regex(/(''\[\[(Stuff) \(company\))(?=\]\]'')/g, '$1\|$2'); //non-standard code regex(/(\\|)(Stuff)(?: \(company\))(?=\]\])/g, '$1$2'); regex(/(=[ ]Daily News) \((New York)\)([ ][\|}])/g, '$1\|___location=$2$3'); Line 310 ⟶ 340: regex(/(''(?:Daily Star)) \((United Kingdom)\)('')/g, '$1$3 ($2)'); regex(/(\\|)(Daily Star)(?: \(United Kingdom\))(\]\])/g, '$1$2$3'); regex(/(=[ ]El Comercio) \((Equador\|Peru\|Spain)\)(\s[\|}])/g, '$1\|___location=$2$3'); regex(/(''El Comercio) \((Equador\|Peru\|Spain)\)('')/g, '$1$3 ($2)'); regex(/(\\|)(El Comercio)(?: \((?:Equador\|Peru\|Spain)\))(\]\])/g, '$1$2$3'); regex(/(=[ ]El Mundo) \((Columbia\|Spain)\)(\s[\|}])/g, '$1\|___location=$2$3'); regex(/(''El Mundo) \((Columbia\|Spain)\)('')/g, '$1$3 ($2)'); Line 322 ⟶ 355: regex(/(''The Herald) \((Glasgow)\)('')/g, '$1$3 ($2)'); regex(/(\\|)(The Herald)(?: \(Glasgow\))(\]\])/g, '$1$2$3'); regex(/(=[ ]The Mercury) \((Hobart)\)(\s[\|}])/g, '$1\|___location=$2$3'); regex(/(''The Mercury) \((Hobart)\)('')/g, '$1$3 ($2)'); regex(/(\\|)(The Mercury)(?: \(Hobart\))(\]\])/g, '$1$2$3'); regex(/(=[ ]Metro) \((British newspaper)\)(\s[\|}])/g, '$1\|___location=UK$3'); regex(/(''Metro) \((British newspaper)\)('')/g, '$1$3 (UK)'); Line 353 ⟶ 389: regex(/(\\|)(Sporting Life)(?: \(British newspaper\))(\]\])/g, '$1$2$3'); regex(/(=[ ]The Standard) \((Hong Kong\|Kenya)\)(\s[\|}])/g, '$1\|___location=$2$3'); regex(/(=[ ]Today) \((Singapore newspaper)\)(\s[\|}])/g, '$1\|___location=Singapore$3'); regex(/(''Today) \((Singapore newspaper)\)('')/g, '$1$3 (Singapore)'); regex(/(\\|)(Today)(?: \(Singapore newspaper\))(\]\])/g, '$1$2$3'); regex(/(''The Standard) \((Hong Kong\|Kenya)\)('')/g, '$1$3 ($2)'); regex(/(\\|)(The Standard)(?: \((?:Hong Kong\|Kenya)\))(\]\])/g, '$1$2$3'); Line 389 ⟶ 428: regex(/(= ?(?:RT)) \((TV network)\)([ ][\|}])/g, '$1\|___location=Russia$3'); regex(/(\\|)(RT)(?: \(TV network\))(\]\])/g, '$1$2$3'); regex(/((?:agency\|author\|journal\|magazine\|newspaper\|periodical\|website\|work)[ ]=[ ]\[\[[\w\s]+\w) ?(\\|language=\w{2} ?(?:\\|___location=(?=Hong Kong\|Taiwan) ?\|))(\]\])[ ](?=[\|}])/g, '$1$3 $2'); //adjust misplaced brackets due to insertion // regex(/(=[ ]\[\[)([^\[\]\(\)\\|:])( \([^\[\]\(\)\\|]\))(\]\])/gi, '$1$2$3\|$2$4'); //adding piping to parentheticals inside parameters //disabled 7/3/2020 false positives (e.g. [[Communist Party of India (Marxist)]]) Line 397 ⟶ 438: regex(/ – (?:Times of India\|Rediff.com [\w])(?=[ ]?\\|)/gi, ''); regex(/(?: +[‒–—―] Times Of India\|)(\]. +''The Times of India''\.)indiatimes\.com/gi, '$1'); regex(/(?: +[‒–—―] ([\w ]+))(\\|\s?(?:publisher\|work)\s\=\s\1)/gi, '$2'); regex(/(\w''\.)indiatimes\.com/gi, '$1'); // regex(/\\|[ ]?language[ ]?\=[ ]?English[ ]?(?=[\|}])/gi, ''); //~~note:~~disabled ~~adjusted~~removal ~~for~~of ~~false~~non-displaying ~~positive in~~language ~~infoboxes~~template ~~books~~parameter regex(/- [\w]\.com[ ]\\|/gi, '\|'); regex(/(.) – Google [^ \]](\][\.,;]) Books\.google\.\w{2,3}(\.\| )/gi, '$1$2Google Books$3'); regex(/(.) at Discogs(\][\.,;]) Discogs\.com(\.\| )/gi, '$1$2Discogs$3'); regex(/(\\|\s?author\s?\=\s?)(?:posted\|publishe[dr]\|written)\s?(?:by\|on):?\s/gi, '$1'); regex(/\\|\s?(?:publisher\|website\|work)(\s?\=MTV)\\|\s?publisher\s\=\s(?:MTV Networks\|Viacom)/gi, '\|publisher$1='); Line 414 ⟶ 455: //rem duplicated publishers in separate fields (post); rem preceding nbsp regex(/\s? \s?(\\|\s?(?:agency\|publisher\|work)\s\=\s)/gi, ' $1'); regex(/(?:[‒–—―]+\|\|)\s(?:The \|)([^\\|\}&]{3,})(?:\.com\|)\s(\\|\s?(?:agency\|publisher\|work)\s\=\s)\1(?=\s[\|}])/gi, '$2$1'); regex(/(?:[‒–—―]+\|\|)\s([^\\|\}&]{3,})(?:\.com\|)\s(\\|\s?(?:agency\|publisher\|work)\s\=\s)(The \|)\1(?=\s[\|}])/gi, '$2$3$1'); //per [[Help:Citation Style 1#Elements not included]] // toggling domains within \|website= parameter // regex(/(\\|\s?(?:work\|website)\s\=\s)(\w+\.(?:com?\|org\|net\|gov\|ac\|)(?:\.[a-z]{2}\|))(?=\s[\|}])/gi, '$1\'\'$2\'\''); // reordering 'work' and 'publisher'; reordering 'work' and 'website' regex(/(\\|\s?publisher\s\=\s(?:\[\[[^<{}\]]\]\]\|[^{}\\|\}<>]))(\s?\\|[^}<>]\|)(\\|\s?(?: journal\|newspaper\|magazine\|periodical\|website\|work)\s\=\s(?:\[\[[^<{}\]]\]\]\|[^{}\\|\}<>]))(?=[\s\.][\|}])/g, '$3$1$2'); regex(/(\\|\s?website\s\=\s(?:\[\[[^<{}\]]\]\]\|[^{}\\|\}<>]))(\s?\\|[^}<>]\|)(\\|\s?work\s\=\s(?:\[\[[^<{}\]]\]\]\|[^{}\\|\}<>]))(?=[\s\.][\|}])/g, '$3$1$2'); /// removing identical/similar entries in 'work' and 'publisher', and in 'work' and 'website' Line 436 ⟶ 477: regex(/\\|\s?publisher\s\=\s(\[\[(?:[^<\|\]])\\|([^}<>])\]\])(\\|[^}<>]\|)\\|\s?publisher\s\=\s(\1\|\2)\.?(?=\s[\|}])/g, '\|publisher=$1$3'); //piped work regex(/(\\|\s?(?:newspaper\|website\|work)\s\=\s(?:[^=\|}\[<>])(?:\\|[^}<>]\|))\\|\s?work\s\=\s(?:[^\|}])(?=\s[\|}])/g, '$1'); //unlinked work regex(/(\\|\s?(?:newspaper\|website\|work)\s\=\s\[\[([^<\|\]])\]\](?:\\|[^}<>]\|))\\|\s?work\s\=\s(?:[^\|}])(?=\s[\|}])/g, '$1'); //linked unpiped work regex(/(\\|\s?(?:newspaper\|website\|work)\s\=\s(?:\[\[(?:[^<\|\]])\\|(?:[^}<>])\]\])(?:\\|[^}<>]\|))\\|\s?work\s\=\s(?:\[\[(?:[^<\|\]])\\|(?:[^}<>])\]\])(?=\s[\|}])/g, '$1'); //piped work x2 regex(/(\\|\s(?:newspaper\|website\|work)\s\=\s(?:\[\[(?:[^<\|\]])\\|(?:[^}<>])\]\])(?:\\|[^}<>]\|))\\|\s?work\s\=\s(?:[^\[\|}])(?=\s[\|}])/g, '$1'); //piped work x1 regex(/\\|\s?___location\s\=\sNew York(?: City\|)\s(\\|[^}<>]\|)\\|\s?___location\s\=\s(New York(?: City\|)\|USA)(?=[\s\.][\|}])/g, '\|___location=New York $1'); regex(/(?:\\|[ ]?___location=[^\\|<\}])([^<}]\|)\\|[ ]?___location=[^\|}])(?=[\|}])+/gi, '$1$2'); regex(/(\\|[ ]?publisher=[^=}])(?:\\|[ ]?publisher=[^=}])(?=[\|}])+/gi, '$1'); // regex(/(\\|[ ]?work=[^=}])(?:\\|[ ]?work=[^=}])(?=[\|}])+/gi, '$1$2'); regex(/(\\|[ ]?agency=[^=}])([^<}]\|)(?:\\|[ ]?agency=[^=}])(?=[\|}])/gi, '$1$2'); //remove redundant parameter ('website' is an alias of 'work') // regex(/\\|\s?(?:newspaper\|website\|work)\s\=\s([^=\|}\[<>])(\\|[^}<>]\|)\\|\s?(?:newspaper\|website\|work)\s\=\s(?:\[\[[^\]]+\]\]\|[\|}]+)(?=\s[\|}])/g, '\|work=$1$2'); //unlinked work // regex(/\\|\s?(?:newspaper\|website\|work)\s\=\s\[\[([^<\|\]])\]\](\\|[^}<>]\|)\\|\s?(?:newspaper\|website\|work)\s\=\s(?:\[\[[^\]]+\]\]\|[\|}]+)(?=\s[\|}])/g, '\|work=$1$2'); //unpiped work // regex(/\\|\s?(?:newspaper\|website\|work)\s\=\s(\[\[(?:[^<\|\]])\\|([^}<>])\]\])(\\|[^}<>]\|)\\|\s?(?:newspaper\|website\|work)\s\=\s(\1\|\2)\.?(?=\s[\|}])/g, '\|work=$1$3'); //piped work regex(/(\\|\s(?:newspaper\|website\|work)\s\=\s[^=}<>](?:\\|[^}<>]\|))\\|\s?(?:newspaper\|website\|work)\s\=\s[^\}\|]+(?=\s[\|}])/g, '$1'); //universal work and aliases ~~//remove duplicated parameter created by conversions ('agency')~~ ~~regex(/\\|\s?agency\s\=\s([^=\|}\[<>])(\\|[^}<>]\|)\\|\s?agency\s\=\s(?:[^\]]+\|[\|}]+)(?=\s[\|}])/g, '\|agency=$1$2'); //unlinked agency~~ ~~regex(/\\|\s?agency\s\=\s\[\[([^<\|\]])\]\](\\|[^}<>]\|)\\|\s?agency\s\=\s(?:\[\[[^\]]+\]\]\|[\|}]+)(?=\s[\|}])/g, '\|agency=$1$2'); //unpiped agency~~ ~~regex(/\\|\s?agency\s\=\s(\[\[(?:[^<\|\]])\\|([^}<>])\]\])(\\|[^}<>]\|)\\|\s?agency\s\=\s(\1\|\2)\.?(?=\s[\|}])/g, '\|agency=$1$3'); //piped agency~~ //unwinding of unnecessary pipes Line 461 ⟶ 501: // removing artefacts (within citation templates) // regex(/(\\|[ ]?author=)(?:(?:Mon\|Tues\|Wednes\|Thurs\|Fri\|Satur\|Sun)day,? ?)(?=[^\]\\|\}]\\|)/gi, '$1'); //redundant/duplicated regex(/(?:\| (?:Daily\|English\|(?:Mail \|)Online\|Music\|News\|Indian Express))(?=\s\\|)+/gi, ''); //\|=: Video Gaming & Real Talk - PS4, Xbox One, Switch, PC, Handheld, Retro regex(/(?:(?:[ ]+\|[ ]+HighBeam Research[ ]+[-–][ ]+FREE trial[ ]+\|)\\|publisher=Highbeam.com)/gi, '\|via=Highbeam'); Line 471 ⟶ 511: regex(/(?:[-–\|]\|\|)[ ](?:Entertainment\|Football\|(?:inter\|)national\|Latest\|local\|Music\|UK\|world\|) News(?=[ ]?[&\\|])/gi, ''); regex(/<!-- Bot generated title -->/gi, ''); regex(/(\\|\s?title\s\=\s[^\|}]+?)[-‒–—―]\s+([^\|}]+?)(\\|\s?(?:publisher\|work)\s\=\s\2)/gi, '$1$3'); regex(/(\\|\s?title\s\=\s([^\|}]+?))[-‒–—―]\s+([^\|}]+?\\|\s?(?:publisher\|work)\s\=\s\2)/gi, '$1$3'); regex(/(\\|\swebsite\s\=\sPlay Legit):\s+[^\|}]+?(?=[\\|}])/gi, '$1'); regex(/(DOC\|PDF)\) \./gi, '$1).'); Line 484 ⟶ 525: // expanding/dating tags // regex(/{{(?:cn\|fact)}}/gi, '{{citation needed\|date=October 2017}}'); //dynamic columns for reflists; remove scroll bar Line 492 ⟶ 533: // regex(/({{reflist)\\|\d(?:\dem\|)(}})/g, '$1$2'); //default } ~~// disambiguating duplicated ref names~~ ~~regex(/(<ref name=[^/>"])><\/ref>/gi, '$1/>');~~ function Ohc_duplicatedcite() { ~~regex(/(<ref name=[^/>"])>([\s\S])\1>([\s\S])\1>/gi, '$1A>$2$1B>$3$1C');~~ var txt=document.editform.wpTextbox1; // disambiguating duplicated ref names //strips down duplicated refs with doubled-up citation templates regex(/(<ref name=[^/>"])>(\{\{[^\}]\}\})([\s\S])\1>\2<\/ref>([\s\S])\1>\2<\/ref>([\s\S])\1>\2<\/ref>/gi, '$1>$2$3$1/>$4$1/>$5$1/>'); regex(/(<ref name=[^/>"])>(\{\{[^\}]\}\})([\s\S])\1>\2<\/ref>([\s\S])\1>\2<\/ref>/gi, '$1>$2$3$1/>$4$1/>'); regex(/(<ref name=[^/>"])>(\{\{[^\}]\}\})([\s\S])\1>\2<\/ref>/gi, '$1>$2$3$1/>'); regex(/(<ref name=[^/>"])><\/ref>/gi, '$1/>'); regex(/(<ref name=[^/>"])>([\s\S])\1>([^\{\}])\1>([^\{\}])/gi, '$1A>$2$1B>$3$1C>$4'); // regex(/(<ref name=[^/>"])>([\s\S])\1>/gi, '$1A>$2$1B>'); // regex(/(<ref name="[^/>])">([\s\S])\1>/gi, '$1A>$2$1B">'); } Line 529 ⟶ 580: // protect the rest (after purging urls inserted in ('website' or )'work' parameters) regex(/((?:[\[=]\s)(?:https?:\|ftp:))([^\]\\|\}])(\s[\]\|}])/gi, protect_function); regex(/(~~\{\{~~(?:harv\wCategory\|~~sfn\w\|cite ?book~~Image\|~~listen~~File)~~\s?\\|~~:)([^\|\}]+])([\|\}]])/gi, protect_function); //protect file names from being changed regex(/(\\|{\s{(?:~~contribution~~FAA-airport\|~~quote~~harv\w\|sfn\w\|cite ?book\|~~title~~listen)\s=?\\|)([^\|\}]+)(\\|}\})/gi, protect_function); regex(/(\\|\s(?:contribution\|quote\|title)\s=)([^\|}]+)([\\|\}])/gi, protect_function); //whitelisting -against changes made by generic regex in Ohc_sourcepub (e.g. Fast Company) } regex(/(\\|\s(?:journal\|newspaper\|periodical\|website\|work)\s=\sFast )(Company\s)([\\|\}])/gi, protect_function); } function ohc_unprotect_urls() Line 569 ⟶ 623: Ohc_remove_urls(); Ohc_duplicatedcite(); ohc_protect_urls(); Ohc_sources_prep(); // ohc_foreign_dates(); Ohc_unpipe(); Ohc_dab_news_sources(); Line 582 ⟶ 637: Ohc_sources_cleanup(); ohc_unprotect_urls(); Ohc_Source_edit_summary(); Line 591 ⟶ 645: // removing references to other WP articles and 'external' WP links regex(/<ref[^<>]>[^<>]\\|[ ]url ?= ?https?:\/\/(?:\w{2}\.wikipedia\.org\/wiki\|(?:www\.\|)(?:blogger\|blogspot\|facebook\|~~myspace~~findagrave\|~~twitter~~instagram\|mailonline\|~~findagrave~~myspace\|twitter\|x)\.com)\/[^<>]<\/ref>/gi, ''); regex(/<ref>https?:\/\/(?:en\.wikipedia\.org\/wiki\|(?:www\.\|)(?:blogger\|blogspot\|facebook\|~~myspace~~findagrave\|~~twitter~~instagram\|mailonline\|~~findagrave~~myspace\|twitter\|x)\.com)\/[^\s\]<]<\/ref>/gi, ''); regex(/<ref>\[https?:\/\/(?:en\.wikipedia\.org\/wiki\|(?:www\.\|)(?:blogger\|blogspot\|facebook\|~~myspace~~findagrave\|~~twitter~~instagram\|mailonline\|~~findagrave~~myspace\|twitter\|x)\.com)\/[^\s\]][ ]+[\w\d][^\]]\]<\/ref>/gi, ''); regex(/\\|[ ]url[ ]=[ ]https?:\/\/(?:\w{2}\.wikipedia\.org\/wiki\|(?:www\.\|)(?:blogger\|blogspot\|facebook\|~~myspace~~findagrave\|~~twitter~~instagram\|mailonline\|~~findagrave~~myspace\|twitter\|x)\.com)[^\s\\|\{\}<](?=[ ][\|}])/gi, ''); regex(/[ ]\[https?:\/\/en\.wikipedia\.org\/wiki\/[^\s\]][ ]+([\w][^\]])\]/gi, ' [[$1]]'); Line 603 ⟶ 656: function ohc_ref_names() { // give names to citations in templates that are without names regex(/<ref>((?:[^<>]\\|w,\surl\~~s=\|[~~.&]+\"?\[~~\s]?~~)https?:\/\/(?:[^\|</]+\.)(\w+)\.(?:(?:com?\|org\|net\|gov\|ac)(?:\.[a-z]{2}\|))\/(?:[^<>\|{}\d]\D\|)(\d{6,12})[^<>])(?=<\/ref>)/gi, "<ref name=$22_$3>$1"); //urls with non-date serial numbers regex(/<ref>((?:[^<>]\\|\surl\s=\|[\[\s]?)https?:\/\/(?:[^\|</]+\.)([-\w]+)\.(?:(?:com?\|org\|net\|gov\|ac)(?:\.[a-z]{2}\|))\/(?:[^<>\|{}\d]\D\|)(\d{6,12})[^<>])(?=<\/ref>)/gi, "<ref name=$22_$3>$1"); //urls with non-date serial numbers regex(/<ref>((?:[^<>]\\|\surl\s=\|[\[\s]?)https?:\/\/(?:[^\|</]+\.)([-\w]+)(?:\.[a-z]{2})\/[^<>\|{}\d](\d{6,12})[^<>])(?=<\/ref>)/gi, "<ref name=$2_$3>$1"); //urls with non-date serial numbers regex(/<ref>((?:[^<>]\\|\surl\s=\|[\[\s]?)https?:\/\/(?:[^\|</]+\.)(reuters)\.com\/[^<>\|{}\d](id\w{11})[^<>])(?=<\/ref>)/gi, "<ref name=$2_$3>$1"); //reuters urls with non-date serial numbers ohc_regex(/<ref>((?:[^<>]\\|\surl\s=\|[\[\s]?)https?:\/\/(?:[^\|</]+\.)([-\w]+)(?:\.[a-z]{2,3})\/[^<>\|{}\d]@YYYY[-\/]@MM[-\/]@DD\/(\w+)[^<>])(?=<\/ref>)/gi, "<ref name=$2_@Year@ZM@~~ZD$2-~~ZD_$3>$1"); //urls with non-date serial numbers ohc_regex(/<ref>((?:[^<>]\\|\surl\s=\|[\[\s]?)https?:\/\/(?:[^\|</]+\.)([-\w]+)(?:\.[a-z]{2,3})\/[^<>\|{}\d]@YYYY[-\/]@~~Month~~Mon[-\/]@DD\/(\w+)[^<>])(?=<\/ref>)/gi, "<ref name=$2_@Year@ZM@~~ZD$2-~~ZD_$3>$1"); //urls with non-date serial numbers ohc_regex(/<ref>([^<>]\\|\surl\s=https?:\/\/(?:[^\|</]+\.)(\w+)\.(?:(?:com?\|org\|net\|gov\|ac\|)(?:\.[a-z]{2}\|))\/[^<>]\\|\sdate\s=\s@Day @Month @YYYY\s[\|}][^<>])(?=<\/ref>)/gi, "<ref name=$2_@Year@ZM@ZD$2>$1"); ohc_regex(/<ref>([^<>]\\|\surl\s=https?:\/\/(?:[^\|</]+\.)(\w+)\.(?:(?:com?\|org\|net\|gov\|ac\|)(?:\.[a-z]{2}\|))\/[^<>]\\|\sdate\s=\s@Month @Day, @YYYY\s[\|}][^<>])(?=<\/ref>)/gi, "<ref name=$2_@Year@ZM@ZD$2>$1"); //this line may cause unwarranted substitution of "$5" by a comma (e.g. in 2019–20 Hong Kong protests) ohc_regex(/<ref>([^<>]\\|\surl\s=https?:\/\/(?:[^\|</]+\.)(\w+)\.(?:(?:com?\|org\|net\|gov\|ac\|)(?:\.[a-z]{2}\|))\/[^<>]\\|\sdate\s=\s=\s@YYYY-@MM-@DD\s[\|}][^<>])(?=<\/ref>)/gi, "<ref name=$2_@Year@MMZM@~~DD$2~~ZD>$1"); ohc_regex(/<ref>((?:[^<>]\\|\surl\s=\|\[?)https?:\/\/(?:[^\|<]+\.)(\w+)\.(?:(?:com?\|org\|net\|gov\|ac\|[a-z]{2})(?:\.[a-z]{2}\|))\/[^<>\|{}]+@YYYY[\/-]?@Month[\/-]?@Day[^<>])(?=<\/ref>)/gi, "<ref name=$2_@~~YYYY~~Year@MMZM@~~DD$2~~ZD>$1"); //urls with embedded dates } function prevDef ( e ) { e.preventDefault(); } function addLinks() { var add = ~~mw.util.addPortletLink;~~function() { return mw.util.addPortletLink.apply(mw.util, arguments); }; $( add('p-tb', '#', 'Add REFTAGS', 's-reftags', 'Insert missing ref tags', '', '') ).click(prevDef).click(Ohc_add_ref_tags); $( add('p-tb', '#', 'CITE name', 's-citename', 'gives names to all citations', '', '') ).click(prevDef).click(ohc_ref_names); Line 647 ⟶ 705: .then( addLinks ); } // </nowiki>