-- Module:Authority control

require('Module:No globals')

--Export table and page context shared by every function in this module.
local p = {}
--getCurrentTitle is a function and must be called; indexing it directly would fail.
local title = mw.title.getCurrentTitle()
local namespace = title.namespace
--true when the current namespace has an entry in mw.site.talkNamespaces
local talkspace = (mw.site.talkNamespaces[namespace] ~= nil)
--true when the subpage name starts with 'testcases'
local testcases = (string.sub(title.subpageText,1,9) == 'testcases')

--========================================================================== --                           Category functions --==========================================================================

--Builds the tracking category wikitext for an identifier type.
--The category name depends on the current namespace: articles (0),
--top-level user pages (2, not a subpage), or everything else.
--@param id identifier/category key, e.g. 'VIAF'
--@return category wikitext followed by whatever p.redCatLink returns for that name
function p.getCatForId( id )
	local catName = ''
	if namespace == 0 then
		catName = 'Wikipedia articles with '..id..' identifiers'
	elseif namespace == 2 and not title.isSubpage then
		catName = 'User pages with '..id..' identifiers'
	else
		catName = 'Miscellaneous pages with '..id..' identifiers'
	end
	--The category link itself had been dropped, leaving only the red-link check;
	--emit the category so the computed name is actually used.
	return '[[Category:'..catName..']]'..p.redCatLink(catName)
end

--Checks whether a tracking category page exists.
--@param catName bare category name, e.g. 'Blah' (not 'Category:Blah')
--@return currently always '' (see note below)
function p.redCatLink( catName )
	if catName and catName ~= '' and testcases == false and mw.title.new(catName, 14).exists == false then
		--NOTE(review): this branch presumably returned a maintenance category for
		--red-linked categories; that wikitext is missing from this copy, so the
		--existence check currently has no visible effect. Restore it from upstream.
		return ''
	end
	return ''
end

--========================================================================== --                     Property formatting functions --==========================================================================

--Validates an IAAF id and formats it for display.
--P1146's format regex: [0-9][0-9]* (e.g. 012)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.iaafLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'IAAF' )
end

--Validates a VIAF id and formats it for display.
--P214's format regex: [1-9]\d(\d{0,7}|\d{17,20}) (e.g. 123456789, 1234567890123456789012)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.viafLink( id )
	if not string.match( id, '^[1-9]%d%d?%d?%d?%d?%d?%d?%d?$' ) and
	   not string.match( id, '^[1-9]%d%d%d%d%d%d%d%d%d%d%d%d%d%d%d%d%d%d%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'VIAF' )
end

--Validates a KulturNav id (UUID shape) and formats it for display.
--P1248's format regex: [0-9a-f]{8}\-[0-9a-f]{4}\-[0-9a-f]{4}\-[0-9a-f]{4}\-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.kulturnavLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'KULTURNAV' ) --no https yet (10/2018)
end

--Validates a SIKART id and formats it for display.
--P781's format regex: \d{7,9} (e.g. 123456789)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.sikartLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'SIKART' ) --no https yet (10/2018)
end

--Validates a TLS id and formats it for display.
--Runs of spaces are replaced by a single underscore before validation.
--P1362's format regex: \p{Lu}[\p{L}\d_',\.\-\(\)\*/–]{3,59} (e.g. Abcd)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.tlsLink( id )
	local id2 = id:gsub(' +', '_')
	local class = "[%a%d_',%.%-%(%)%*/–]"
	--one uppercase letter, 3 mandatory class chars, then up to 56 optional ones
	local regex = "^%u"..string.rep(class, 3)..string.rep(class.."?", 56).."$"
	if not mw.ustring.match( id2, regex ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy
	--(id2 was presumably the link target); restore the formatter URL.
	return id..p.getCatForId( 'TLS' ) --no https yet (10/2018)
end

--Validates a CiNii id and formats it for display.
--P271's format regex: DA\d{7}[\dX] (e.g. DA12345678)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.ciniiLink( id )
	if not string.match( id, '^DA%d%d%d%d%d%d%d[%dX]$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'CINII' )
end

--Validates a DAAO id and formats it for display.
--P1707's format regex: [a-z\-]+\d* (e.g. rolf-harris)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.daaoLink( id )
	if not string.match( id, '^[a-z%-]+%d*$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'DAAO' )
end

--Validates a BNE id and formats it for display.
--P950's format regex: (XX|FF|a)\d{4,7}|(bima|bimo|bica|bis[eo]|bivi|Mise|Mimo|Mima)\d{10} (e.g. XX1234567)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.bneLink( id )
	if not string.match( id, '^[XF][XF]%d%d%d%d%d?%d?%d?$' ) and
	   not string.match( id, '^a%d%d%d%d%d?%d?%d?$' ) and
	   not string.match( id, '^bi[mcsv][aoei]%d%d%d%d%d%d%d%d%d%d$' ) and
	   not string.match( id, '^Mi[sm][eoa]%d%d%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'BNE' ) --no https yet (10/2018)
end

--Validates a US Congress bio id and formats it for display.
--P1157's format regex: [A-Z]00[01]\d{3} (e.g. A000123)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.uscongressLink( id )
	if not string.match( id, '^[A-Z]00[01]%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'USCongress' ) --no https yet (10/2018)
end

--Validates a NARA id and formats it for display.
--P1225's format regex: ^([1-9]\d{0,8})$ (e.g. 123456789)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.naraLink( id )
	if not string.match( id, '^[1-9]%d?%d?%d?%d?%d?%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NARA' )
end

--Validates a botanist author abbreviation and formats it for display.
--P428's format regex: ('t )?(d')?(de )?(la )?(van (der )?)?(Ma?c)?(De)?(Di)?\p{Lu}?C?['\p{Ll}]*([-'. ]*(van )?(y )?(d[ae][nr]?[- ])?(Ma?c)?[\p{Lu}bht]?C?['\p{Ll}]*)*\.? ?f?\.? (e.g. L.)
--not easily/meaningfully implementable in Lua's regex since "(this)?" is not allowed...
--@return id plus tracking category wikitext, or false when the id is malformed
function p.botanistLink( id )
	if not mw.ustring.match( id, "^[%u%l%d%. '-]+$" ) then --better than nothing
		return false
	end
	--spaces percent-encoded; NOTE(review): presumably used as the link target,
	--which appears lost in this copy. Restore the formatter URL.
	local id2 = id:gsub(' +', '%%20')
	return id..p.getCatForId( 'Botanist' )
end

--Validates an MGP id and formats it for display.
--P549's format regex: \d{1,6} (e.g. 123456)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mgpLink( id )
	if not string.match( id, '^%d%d?%d?%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MGP' )
end

--Validates an RSL id and formats it for display.
--P947's format regex: \d{1,9} (e.g. 123456789)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.rslLink( id )
	if not string.match( id, '^%d%d?%d?%d?%d?%d?%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'RSL' ) --no https yet (10/2018)
end

--Validates a Léonore id and formats it for display.
--P640's format regex: LH/\d{1,4}/\d{1,3}|19800035/\d{1,4}/\d{1,5}(Bis)?|C/0/\d{1,2} (e.g. LH/2064/18)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.leonoreLink( id )
	if not id:match( '^LH/%d%d?%d?%d?/%d%d?%d?$' ) and            --IDs from       LH/1/1 to         LH/2794/54 (legionaries)
	   not id:match( '^19800035/%d%d?%d?%d?/%d%d?%d?%d?%d?$' ) and --IDs from 19800035/1/1 to 19800035/385/51670 (legionnaires who died 1954-1977 & some who died < 1954)
	   not id:match( '^C/0/%d%d?$' ) then                         --IDs from        C/0/1 to             C/0/84 (84 famous legionaries)
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'Léonore' ) --no https yet (10/2018)
end

--Validates an SBN (ICCU) id and formats it for display.
--P396's format regex: IT\\ICCU\\(\d{10}|\D\D[\D\d]\D\\\d{6}) (e.g. IT\ICCU\CFIV\000163)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.sbnLink( id )
	if not string.match( id, '^IT\\ICCU\\%d%d%d%d%d%d%d%d%d%d$' ) and
	   not string.match( id, '^IT\\ICCU\\%u%u[%u%d]%u\\%d%d%d%d%d%d$' ) then --legacy: %u used here instead of %D (but the faulty ID cat is empty, out of ~12k uses)
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'SBN' )
end

--Validates an NKC id and formats it for display.
--P691's format regex: [a-z]{2,4}[0-9]{2,14} (e.g. abcd12345678901234)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.nkcLink( id )
	if not string.match( id, '^[a-z][a-z][a-z]?[a-z]?%d%d%d?%d?%d?%d?%d?%d?%d?%d?%d?%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NKC' )
end

--Validates an NCL id and formats it for display.
--P1048's format regex: \d+ (e.g. 1081436)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.nclLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NCL' ) --no https yet (10/2018)
end

--Validates an NDL id and formats it for display.
--P349's format regex: 0?\d{8} (e.g. 012345678)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.ndlLink( id )
	if not string.match( id, '^0?%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NDL' )
end

--Validates an NGV id and formats it for display.
--P2041's format regex: \d+ (e.g. 12354)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.ngvLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NGV' )
end

--Validates a SUDOC id and formats it for display.
--P269's format regex: (\d{8}[\dX]|) (e.g. 026927608)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.sudocLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d[%dxX]$' ) then --legacy: allow lowercase 'x'
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'SUDOC' )
end

--Validates an HDS id and formats it for display.
--P902's format regex: 50\d{3}|[1-4]\d{4}|[1-9]\d{0,3}| (e.g. 50123)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.hdsLink( id )
	if not string.match( id, '^50%d%d%d$' ) and
	   not string.match( id, '^[1-4]%d%d%d%d$' ) and
	   not string.match( id, '^[1-9]%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'HDS' ) --no https yet (10/2018)
end

--Validates a LIR id and formats it for display.
--P886's format regex: \d+ (e.g. 1)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.lirLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'LIR' ) --no https yet (10/2018)
end

--Splits an LCCN into its prefix / year / serial parts.
--Accepts either the compact form (e.g. n78039510) or an already
--slash-separated form (e.g. n/78/039510).
--P244's format regex: (n|nb|nr|no|ns|sh)([4-9][0-9]|00|20[0-1][0-9])[0-9]{6} (e.g. n78039510)
--@return a 3-element table { prefix, year, serial }, or false when the id does not match
function p.splitLccn( id )
	if id:match( '^%l%l?%l?%d%d%d%d%d%d%d%d%d?%d?$' ) then
		--compact form: the last six digits are the serial, the rest is the year
		id = id:gsub( '^(%l+)(%d+)(%d%d%d%d%d%d)$', '%1/%2/%3' )
	end
	if id:match( '^%l%l?%l?/%d%d%d?%d?/%d+$' ) then
		return mw.text.split( id, '/' )
	end
	return false
end

--Left-pads a string until it reaches the requested length.
--@param str string to pad
--@param c padding string prepended on each step (callers here pass a single character)
--@param length minimum length of the result
--@return str with c prepended until its length is at least `length`
function p.append(str, c, length)
	--len must be called; comparing the method itself to a number raises an error
	while str:len() < length do
		str = c .. str
	end
	return str
end

--Validates an LCCN and formats it (normalised, serial zero-padded to 6 digits) for display.
--@param id LCCN, e.g. n78039510
--@return normalised id plus tracking category wikitext, or false when the id is malformed
function p.lccnLink( id )
	local parts = p.splitLccn( id ) --e.g. n78039510
	if not parts then
		return false
	end
	--'sh' prefixes are subject headings, everything else is a name authority.
	--NOTE(review): lccnType was presumably part of the link target, which appears
	--lost in this copy; restore the formatter URL.
	local lccnType = parts[1] ~= 'sh' and 'names' or 'subjects'
	id = parts[1] .. parts[2] .. p.append( parts[3], '0', 6 )
	return id..p.getCatForId( 'LCCN' )
end

--Validates a MusicBrainz artist id (UUID shape) and formats it for display.
--P434's format regex: [0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mbaLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MusicBrainz' ) --special category name
end

--Validates a MusicBrainz area id (UUID shape) and formats it for display.
--P982's format regex: [0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mbareaLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MusicBrainz area' ) --special category name
end

--Validates a MusicBrainz instrument id (UUID shape) and formats it for display.
--P1330's format regex: [0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mbiLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MusicBrainz instrument' ) --special category name
end

--Validates a MusicBrainz label id (UUID shape) and formats it for display.
--P966's format regex: [0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mblLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MusicBrainz label' ) --special category name
end

--Validates a MusicBrainz place id (UUID shape) and formats it for display.
--P1004's format regex: [0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mbpLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MusicBrainz place' ) --special category name
end

--Validates a MusicBrainz release group id (UUID shape) and formats it for display.
--P436's format regex: [0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mbrgLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MusicBrainz release group' ) --special category name
end

--Validates a MusicBrainz series id (UUID shape) and formats it for display.
--P1407's format regex: [0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mbsLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MusicBrainz series' ) --special category name
end

--Validates a MusicBrainz work id (UUID shape) and formats it for display.
--P435's format regex: [0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12} (e.g. 12345678-1234-1234-1234-1234567890AB)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.mbwLink( id )
	if not string.match( id, '^%x%x%x%x%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%-%x%x%x%x%x%x%x%x%x%x%x%x$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'MusicBrainz work' ) --special category name
end

--Returns the ISNI check digit.
--isni must be a string whose first 15 characters are digits, e.g. 0000000066534145
--@return the check character as a string: '0'..'9' or 'X'
function p.getIsniCheckDigit( isni )
	local total = 0
	for i = 1, 15 do
		local digit = isni:byte( i ) - 48 --Get integer value (48 is the byte for '0')
		total = (total + digit) * 2
	end
	local remainder = total % 11
	local result = (12 - remainder) % 11
	if result == 10 then
		return "X"
	end
	return tostring( result )
end

--Validates an ISNI (or ORCID) and returns it as a 16-character string, or false if it is invalid.
--Spaces and hyphens are removed and the result upper-cased before checking.
--See http://support.orcid.org/knowledgebase/articles/116780-structure-of-the-orcid-identifier
--P213 (ISNI) format regex: [0-9]{4} [0-9]{4} [0-9]{4} [0-9]{3}[0-9X] (e.g. 0000-0000-6653-4145)
--P496 (ORCID) format regex: 0000-000(1-[5-9]|2-[0-9]|3-[0-4])\d{3}-\d{3}[\dX] (e.g. 0000-0002-7398-5483)
function p.validateIsni( id )
	--upper must be called; without the parentheses id would not be a string
	id = id:gsub( '[ %-]', '' ):upper()
	if not id:match( '^%d%d%d%d%d%d%d%d%d%d%d%d%d%d%d[%dX]$' ) then
		return false
	end
	--the 16th character must equal the computed check digit
	if p.getIsniCheckDigit( id ) ~= string.char( id:byte( 16 ) ) then
		return false
	end
	return id
end

--Validates an ISNI and formats it as four space-separated groups for display.
--@param id ISNI, e.g. 0000-0000-6653-4145
--@return grouped id plus tracking category wikitext, or false when the id is invalid
function p.isniLink( id )
	id = p.validateIsni( id ) --e.g. 0000-0000-6653-4145
	if not id then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id:sub( 1, 4 )..' '..id:sub( 5, 8 )..' '..id:sub( 9, 12 )..' '..id:sub( 13, 16 )..p.getCatForId( 'ISNI' ) --no https yet (10/2018)
end

--Validates an ORCID and formats it as four hyphen-separated groups for display.
--@param id ORCID, e.g. 0000-0002-7398-5483
--@return hyphenated id plus tracking category wikitext, or false when the id is invalid
function p.orcidLink( id )
	id = p.validateIsni( id ) --e.g. 0000-0002-7398-5483
	if not id then
		return false
	end
	id = id:sub( 1, 4 )..'-'..id:sub( 5, 8 )..'-'..id:sub( 9, 12 )..'-'..id:sub( 13, 16 )
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'ORCID' )
end

--Validates a GND id and formats it for display.
--P227's format regex: (1|1[01])\d{7}[0-9X]|[47]\d{6}-\d|[1-9]\d{0,7}-[0-9X]|3\d{7}[0-9X] (e.g. 4079154-3)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.gndLink( id )
	if not string.match( id, '^1[01]?%d%d%d%d%d%d%d[0-9X]$' ) and
	   not string.match( id, '^[47]%d%d%d%d%d%d%-%d$' ) and
	   not string.match( id, '^[1-9]%d?%d?%d?%d?%d?%d?%d?%-[0-9X]$' ) and
	   not string.match( id, '^3%d%d%d%d%d%d%d[0-9X]$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'GND' )
end

--Validates a SELIBR id and formats it for display.
--P906's format regex: [1-9]\d{4,5} (e.g. 123456)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.selibrLink( id )
	if not string.match( id, '^[1-9]%d%d%d%d%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'SELIBR' )
end

--Validates a BNF id, normalises it to carry the 'cb' prefix, and formats it for display.
--P268's format regex: \d{8}[0-9bcdfghjkmnpqrstvwxz] (e.g. 123456789)
--@return prefixed id, the text ' (data)', and tracking category wikitext; or false when the id is malformed
function p.bnfLink( id )
	if not string.match( id, '^c?b?%d%d%d%d%d%d%d%d[0-9bcdfghjkmnpqrstvwxz]$' ) then
		return false
	end
	--Add cb prefix if it has been removed
	if not string.match( id, '^cb.+$' ) then
		id = 'cb'..id
	end
	--NOTE(review): the id and '(data)' were presumably two separate links whose
	--markup appears lost in this copy; restore the formatter URLs.
	return ''..id..' (data)'..p.getCatForId( 'BNF' )
end

--Validates a BPN id and formats it for display.
--P651's format regex: \d{8} (e.g. 12345678)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.bpnLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'BPN' ) --no https yet (10/2018)
end

--Validates a ResearcherID and formats it for display.
--P1053's format regex: [A-Z]-\d{4}-(19|20)\d\d (e.g. A-1234-1934)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.ridLink( id )
	if not string.match( id, '^[A-Z]%-%d%d%d%d%-19%d%d$' ) and
	   not string.match( id, '^[A-Z]%-%d%d%d%d%-20%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'RID' )
end

--Validates a BIBSYS id and formats it for display.
--P1015's format regex: [1-9]\d* or [1-9](\d{0,8}|\d{12}) (e.g. 1234567890123)
--TODO: follow up @ d:Property talk:P1015 or escalate/investigate
--@return id plus tracking category wikitext, or false when the id is malformed
function p.bibsysLink( id )
	if not string.match( id, '^[1-9]%d?%d?%d?%d?%d?%d?%d?%d?$' ) and
	   not string.match( id, '^[1-9]%d%d%d%d%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'BIBSYS' )
end

--Validates a ULAN id and formats it for display.
--P245's format regex: 500\d{6} (e.g. 500123456)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.ulanLink( id )
	if not string.match( id, '^500%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'ULAN' )
end

--Validates an NLA id and formats it for display.
--P409's format regex: [1-9][0-9]{0,11} (e.g. 123456789012)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.nlaLink( id )
	if not string.match( id, '^[1-9]%d?%d?%d?%d?%d?%d?%d?%d?%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NLA' )
end

--Validates an NLA-person id and formats it for display.
--P1315's format regex: [1-9]\d{5,7} (e.g. 12345678)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.nlapersonLink( id )
	if not string.match( id, '^[1-9]%d%d%d%d%d%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NLA-person' )
end

--Validates an RKDartists id and formats it for display.
--P650's format regex: [1-9]\d{0,5} (e.g. 123456)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.rkdartistsLink( id )
	if not string.match( id, '^[1-9]%d?%d?%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'RKDartists' )
end

--Validates a SNAC id and formats it for display.
--P3430's format regex: \d*[A-Za-z][0-9A-Za-z]* (e.g. A)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.snacLink( id )
	if not string.match( id, '^%d*[A-Za-z][0-9A-Za-z]*$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'SNAC-ID' ) --no https yet (10/2018)
end

--Validates a DBLP id and formats it for display.
--P2456's format regex: \d{2,3} /\d+(-\d+)?|[a-z] /[a-zA-Z][0-9A-Za-z]*(-\d+)? (e.g. 123/123)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.dblpLink( id )
	if not string.match( id, '^%d%d%d?/%d+$' ) and
	   not string.match( id, '^%d%d%d?/%d+%-%d+$' ) and
	   not string.match( id, '^[a-z]/[a-zA-Z][0-9A-Za-z]*$' ) and
	   not string.match( id, '^[a-z]/[a-zA-Z][0-9A-Za-z]*%-%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'DBLP' )
end

--Validates an AAG id and formats it for display.
--P3372's format regex: \d+ (e.g. 1)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.aagLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'AAG' )
end

--Validates an ACM DL id and formats it for display.
--P864's format regex: \d{11} (e.g. 12345678901)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.acmLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'ACM-DL' )
end

--Validates an ADB id and formats it for display.
--P1907's format regex: [a-z][-a-z]+-([1-2]\d|[1-9])\d{0,3} (e.g. barton-sir-edmund-toby-71)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.adbLink( id )
	if not string.match( id, '^[a-z][-a-z]+-[1-2]%d%d?%d?%d?$' ) and
	   not string.match( id, '^[a-z][-a-z]+-[1-9]%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'ADB' )
end

--Validates an AGSA id and formats it for display.
--P6804's format regex: [1-9]\d* (e.g. 3625)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.agsaLink( id )
	if not string.match( id, '^[1-9]%d*$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'AGSA' )
end

--Validates an autores.uy id and formats it for display.
--P2558's format regex: [1-9]\d{0,4} (e.g. 12345)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.autoresuyLink( id )
	if not string.match( id, '^[1-9]%d?%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'autores.uy' )
end

--Validates an AWR id and formats it for display.
--P4186's format regex: (([A-Z]{3}\d{4})|([A-Z]{2}\d{5}))[a-z] (e.g. PR00768b)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.awrLink( id )
	if not string.match( id, '^[A-Z][A-Z][A-Z]%d%d%d%d[a-z]$' ) and
	   not string.match( id, '^[A-Z][A-Z]%d%d%d%d%d[a-z]$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'AWR' )
end

--Validates a PIC id and formats it for display.
--P2750's format regex: [1-9]\d* (e.g. 1)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.picLink( id )
	if not string.match( id, '^[1-9]%d*$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'PIC' )
end

--Validates a Bildindex id and formats it for display.
--P2092's format regex: \d+ (e.g. 1)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.bildLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'Bildindex' )
end

--Validates a Joconde id and formats it for display.
--P347's format regex: [\-0-9A-Za-z]{11} (e.g. 12345678901)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.jocondeLink( id )
	--exactly 11 characters from the allowed class
	local regex = '^'..string.rep('[%-0-9A-Za-z]', 11)..'$'
	if not string.match( id, regex ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'Joconde' ) --no https yet (10/2018)
end

--Validates an RKDimages id and formats it for display.
--P350's format regex: [1-9]\d{0,5} (e.g. 123456)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.rkdidLink( id )
	if not string.match( id, '^[1-9]%d?%d?%d?%d?%d?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'RKDID' )
end

--Validates a BALaT id and formats it for display.
--P3293's format regex: \d+ (e.g. 1)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.balatLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'BALaT' ) --no https yet (10/2018)
end

--Validates an LNB id and formats it for display.
--P1368's format regex: \d{9} (e.g. 123456789)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.lnbLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'LNB' )
end

--Validates an NSK id and formats it for display.
--P1375's format regex: \d{9} (e.g. 123456789)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.nskLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NSK' ) --no https yet (10/2018)
end

--Validates an ICIA id and formats it for display.
--P1736's format regex: \d+ (e.g. 1)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.iciaLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'ICIA' )
end

--Validates a TA98 id and formats it for display.
--P1323's format regex: A\d{2}\.\d\.\d{2}\.\d{3}[FM]? (e.g. A12.3.45.678)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.ta98Link( id )
	if not string.match( id, '^A%d%d%.%d%.%d%d%.%d%d%d[FM]?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'TA98' )
end

--Validates a TE id and formats it for display.
--P1693's format regex: E[1-8]\.\d{1,2}\.\d{1,2}\.\d{1,2}\.\d{1}\.\d{1}\.\d{1,3} (e.g. E1.23.45.67.8.9.0)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.teLink( id )
	local e1, e2 = string.match( id, '^E([1-8])%.(%d%d?)%.%d%d?%.%d%d?%.%d%.%d%.%d%d?%d?$' )
	if not e1 then
		return false
	end
	local TEnum = 'TEe0'..e1 --no formatter URL in WD, probably due to this complexity
	if e1 == '5' or e1 == '7' then
		--sections 5 and 7 additionally carry the zero-padded second component
		if #e2 == 1 then
			e2 = '0'..e2
		end
		TEnum = TEnum..e2
	end
	--NOTE(review): TEnum was presumably part of the link target, which appears
	--lost in this copy; restore the link markup around the id.
	return id..p.getCatForId( 'TE' )
end

--Validates a Te Papa id and formats it for display.
--P3544's format regex: \d+ (e.g. 1)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.tepapaLink( id )
	if not string.match( id, '^%d+$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'TePapa' )
end

--Validates a TH id and formats it for display.
--P1694's format regex: H\d\.\d{2}\.\d{2}\.\d\.\d{5} (e.g. H1.23.45.6.78901)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.thLink( id )
	local h1, h2 = string.match( id, '^H(%d)%.(%d%d)%.%d%d%.%d%.%d%d%d%d%d$' )
	if not h1 then
		return false
	end
	--NOTE(review): THnum was presumably part of the link target, which appears
	--lost in this copy; restore the link markup around the id.
	local THnum = 'THh'..h1..h2 --no formatter URL in WD, probably due to this complexity
	return id..p.getCatForId( 'TH' )
end

--Validates a DSI id and formats it for display.
--P2349's format regex: [1-9]\d* (e.g. 1538)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.dsiLink( id )
	if not string.match( id, '^[1-9]%d*$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'DSI' )
end

--Validates a Semantic Scholar author id and formats it for display.
--P4012's format regex: [1-9]\d* (e.g. 1796130)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.s2authoridLink( id )
	if not string.match( id, '^[1-9]%d*$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'Semantic Scholar author' ) --special category name
end

--Validates an NLI id and formats it for display.
--P949's format regex: \d{9} (e.g. 123456789)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.nliLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NLI' )
end

--Validates an NLP id and formats it for display.
--P1695's format regex: 9810[0-9]\d* or A[0-9]{7}[0-9X] (e.g. 9810123456789012345 or A10414836)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.nlpLink( id )
	if not string.match( id, '^9810%d+$' ) and
	   not string.match( id, '^A%d%d%d%d%d%d%d[%dX]$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NLP' )
end

--Validates a RERO id and formats it for display.
--P3065's format regex: 0[1-2]-[A-Z0-9]{1,10} (e.g. 02-A012345678)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.reroLink( id )
	if not string.match( id, '^0[1-2]%-[A-Z%d][A-Z%d]?[A-Z%d]?[A-Z%d]?[A-Z%d]?[A-Z%d]?[A-Z%d]?[A-Z%d]?[A-Z%d]?[A-Z%d]?$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'RERO' )
end

--Validates an NLR id and formats it for display.
--P1003's format regex: \d{9} (e.g. 123456789)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.nlrLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NLR' )
end

--Validates an NTA id and formats it for display.
--P1006's format regex: \d{8}[\dX] (e.g. 12345678X)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.ntaLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d[%dX]$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'NTA' )
end

--Validates a BNC id and formats it for display.
--P1890's format regex: \d{9} (e.g. 123456789)
--@return id plus tracking category wikitext, or false when the id is malformed
function p.bncLink( id )
	if not string.match( id, '^%d%d%d%d%d%d%d%d%d$' ) then
		return false
	end
	--NOTE(review): the link markup around the id appears lost in this copy; restore the formatter URL.
	return id..p.getCatForId( 'BNC' )
end

--========================================================================== --         Wikidata, navigation bar, and documentation functions --==========================================================================

--Collects the values of an item's best statements for one property.
--Statements whose main snak has no datavalue are skipped.
--@param itemId entity id passed to mw.wikibase.getBestStatements
--@param property property id, e.g. 'P214'
--@return sequence of values (empty when there are no statements)
function p.getIdsFromWikidata( itemId, property )
	local found = {}
	local best = mw.wikibase.getBestStatements( itemId, property )
	if not best then
		return found
	end
	for _, claim in ipairs( best ) do
		local datavalue = claim.mainsnak.datavalue
		if datavalue then
			table.insert( found, datavalue.value )
		end
	end
	return found
end

--Tells whether the item satisfies at least one of the given property-->value requirements.
--@param itemId entity id passed to mw.wikibase.getBestStatements
--@param reqs sequence of { numeric property id, numeric item id } pairs
--@return true as soon as one best statement of a listed property points at the listed item, else false
function p.matchesWikidataRequirements( itemId, reqs )
	for _, requirement in ipairs( reqs ) do
		local wantedQid = requirement[2]
		local best = mw.wikibase.getBestStatements( itemId, 'P'..requirement[1] )
		if best then
			for _, claim in ipairs( best ) do
				local datavalue = claim.mainsnak.datavalue
				if datavalue and datavalue.value['numeric-id'] == wantedQid then
					return true
				end
			end
		end
	end
	return false
end

--Builds one list row of the authority control box.
--@param id parameter name, used in the error text and the faulty-id category
--@param label text shown before the link
--@param rawValue the value as supplied, echoed in the error text
--@param link formatted link text, or false when validation failed
--@param withUid accepted for interface compatibility; see note below
--@param specialCat optional category key used instead of id for the faulty-id category
--@return wikitext for the row, ending in a newline
function p.createRow( id, label, rawValue, link, withUid, specialCat )
	if link then
		--NOTE(review): both withUid branches were identical in this copy, so they
		--are merged; the wrapping markup that presumably distinguished them
		--appears lost. Restore it from upstream if the uid styling is needed.
		return '* '..label..' '..link..' \n'
	end

	--Validation failed: show an error and file the page under the faulty-id category.
	--The category link itself had been dropped, leaving catName used only for the red-link check.
	local catName = 'Wikipedia articles with faulty '..(specialCat or id)..' identifiers'
	return '* The '..id..' id '..rawValue..' is not valid. [[Category:'..catName..']]'..p.redCatLink(catName)..'\n'
end

-- Creates a human-readable standalone wikitable version of p.conf, and tracking
-- categories with page counts, for use in the documentation.
-- @param frame Scribunto frame, used to expand the 'Wikidata property link' template
-- @return wikitext of a sortable table with one row per p.conf entry
function p.docConfTable( frame )
	local rows = {
		'{| class="wikitable sortable"\n'..
		'! rowspan=2 | Parameter\n'..
		'! rowspan=2 | Label\n'..
		'! rowspan=2; data-sort-type=number | Wikidata property\n'..
		'! colspan=4 | Tracking categories and page counts\n'..
		'|-\n'..
		'! Articles\n'..
		'! User pages\n'..
		'! Misc. pages\n'..
		'! Faulty IDs\n'..
		'|-\n'
	}
	--getContentLanguage must be called to obtain the language object
	local lang = mw.getContentLanguage()
	--ipairs keeps the rows in p.conf order
	for _, conf in ipairs( p.conf ) do
		local param, link, pid = conf[1], conf[2], conf[3]
		local category = conf.category or param
		local args = { id = 'f', pid }
		local wpl = frame:expandTemplate{ title = 'Wikidata property link', args = args }
		--cats
		local articleCat = 'Wikipedia articles with '..category..' identifiers'
		local userCat =    'User pages with '..category..' identifiers'
		local miscCat =    'Miscellaneous pages with '..category..' identifiers'
		local faultyCat =  'Wikipedia articles with faulty '..category..' identifiers'
		--counts
		local articleCount = lang:formatNum( mw.site.stats.pagesInCategory(articleCat, 'pages') )
		local userCount =    lang:formatNum( mw.site.stats.pagesInCategory(userCat, 'pages') )
		local miscCount =    lang:formatNum( mw.site.stats.pagesInCategory(miscCat, 'pages') )
		local faultyCount =  lang:formatNum( mw.site.stats.pagesInCategory(faultyCat, 'pages') )
		--concat
		--NOTE(review): the counts were presumably links to their categories; that
		--markup appears lost in this copy, so only the numbers are shown.
		rows[#rows + 1] = '\n'..
			'|-\n'..
			'||'..param..
			'||'..link..
			'||data-sort-value='..pid..'|'..wpl..
			'||style="text-align: right;"|'..articleCount..
			'||style="text-align: right;"|'..userCount..
			'||style="text-align: right;"|'..miscCount..
			'||style="text-align: right;"|'..faultyCount
	end
	rows[#rows + 1] = '\n|}'
	return table.concat( rows )
end

--========================================================================== --                             Configuration --==========================================================================

-- Check that the Wikidata item has this property-->value before adding it.
-- Keyed by parameter name; each value is a list of { property number, item number } pairs.
local reqs = {}

-- Parameter format: { parameter name, label, propertyId # in Wikidata, formatting/validation function }
-- An optional `category` field overrides the parameter name in tracking category names.
p.conf = {
	{ 'AAG', 'AAG', 3372, p.aagLink },
	{ 'ACM-DL', 'ACM DL', 864, p.acmLink },
	{ 'ADB', 'ADB', 1907, p.adbLink },
	{ 'AGSA', 'AGSA', 6804, p.agsaLink },
	{ 'autores.uy', 'autores.uy', 2558, p.autoresuyLink },
	{ 'AWR', 'AWR', 4186, p.awrLink },
	{ 'BALaT', 'BALaT', 3293, p.balatLink },
	{ 'BIBSYS', 'BIBSYS', 1015, p.bibsysLink },
	{ 'Bildindex', 'Bildindex', 2092, p.bildLink },
	{ 'BNC', 'BNC', 1890, p.bncLink }, --initially commented due to excessive WD ID errors (many bad IDs since removed)
	{ 'BNE', 'BNE', 950, p.bneLink },
	{ 'BNF', 'BNF', 268, p.bnfLink },
	{ 'Botanist', 'Botanist', 428, p.botanistLink },
	{ 'BPN', 'BPN', 651, p.bpnLink },
	{ 'CINII', 'CiNii', 271, p.ciniiLink },
	{ 'DAAO', 'DAAO', 1707, p.daaoLink },
	{ 'DBLP', 'DBLP', 2456, p.dblpLink },
	{ 'DSI', 'DSI', 2349, p.dsiLink },
	{ 'GND', 'GND', 227, p.gndLink },
	{ 'HDS', 'HDS', 902, p.hdsLink },
	{ 'IAAF', 'IAAF', 1146, p.iaafLink },
	{ 'ICIA', 'ICIA', 1736, p.iciaLink },
	{ 'ISNI', 'ISNI', 213, p.isniLink },
	{ 'Joconde', 'Joconde', 347, p.jocondeLink },
	{ 'KULTURNAV', 'KulturNav', 1248, p.kulturnavLink },
	{ 'LCCN', 'LCCN', 244, p.lccnLink },
	{ 'LIR', 'LIR', 886, p.lirLink },
	{ 'LNB', 'LNB', 1368, p.lnbLink },
	{ 'Léonore', 'Léonore', 640, p.leonoreLink },
	{ 'MBA', 'MusicBrainz', 434, p.mbaLink, category = 'MusicBrainz' }, --special category name
	{ 'MBAREA', 'MusicBrainz', 982, p.mbareaLink, category = 'MusicBrainz area' }, --special category name
	{ 'MBI', 'MusicBrainz', 1330, p.mbiLink, category = 'MusicBrainz instrument' }, --special category name
	{ 'MBL', 'MusicBrainz', 966, p.mblLink, category = 'MusicBrainz label' }, --special category name
	{ 'MBP', 'MusicBrainz', 1004, p.mbpLink, category = 'MusicBrainz place' }, --special category name
	{ 'MBRG', 'MusicBrainz release group', 436, p.mbrgLink, category = 'MusicBrainz release group' }, --special category name
	{ 'MBS', 'MusicBrainz', 1407, p.mbsLink, category = 'MusicBrainz series' }, --special category name
	{ 'MBW', 'MusicBrainz work', 435, p.mbwLink, category = 'MusicBrainz work' }, --special category name
	{ 'MGP', 'MGP', 549, p.mgpLink },
	{ 'NARA', 'NARA', 1225, p.naraLink },
	{ 'NCL', 'NCL', 1048, p.nclLink },
	{ 'NDL', 'NDL', 349, p.ndlLink },
	{ 'NGV', 'NGV', 2041, p.ngvLink },
	{ 'NKC', 'NKC', 691, p.nkcLink },
	{ 'NLA', 'NLA', 409, p.nlaLink },
	{ 'NLA-person', 'NLA-person', 1315, p.nlapersonLink },
	{ 'NLI', 'NLI', 949, p.nliLink },
	{ 'NLP', 'NLP', 1695, p.nlpLink },
	{ 'NLR', 'NLR', 1003, p.nlrLink }, --initially commented due to excessive WD ID errors (conflated with National Library of Russia IDs)
	{ 'NSK', 'NSK', 1375, p.nskLink },
	{ 'NTA', 'NTA', 1006, p.ntaLink },
	{ 'ORCID', 'ORCID', 496, p.orcidLink },
	{ 'PIC', 'PIC', 2750, p.picLink },
	{ 'RID', 'ResearcherID', 1053, p.ridLink },
	{ 'RERO', 'RERO', 3065, p.reroLink }, --initially commented due to excessive WD ID errors (regex fixed/relaxed)
	{ 'RKDartists', 'RKD', 650, p.rkdartistsLink },
	{ 'RKDID', 'RKDimages ID', 350, p.rkdidLink },
	{ 'RSL', 'RSL', 947, p.rslLink },
	{ 'SBN', 'ICCU', 396, p.sbnLink },
	{ 'SELIBR', 'SELIBR', 906, p.selibrLink },
	{ 'SIKART', 'SIKART', 781, p.sikartLink },
	{ 'SNAC-ID', 'SNAC', 3430, p.snacLink },
	{ 'SUDOC', 'SUDOC', 269, p.sudocLink },
	{ 'S2AuthorId', 'S2AuthorId', 4012, p.s2authoridLink, category = 'Semantic Scholar author' }, --special category name
	{ 'TA98', 'TA98', 1323, p.ta98Link },
	{ 'TE', 'TE', 1693, p.teLink },
	{ 'TePapa', 'TePapa', 3544, p.tepapaLink },
	{ 'TH', 'TH', 1694, p.thLink },
	{ 'TLS', 'TLS', 1362, p.tlsLink },
	{ 'ULAN', 'ULAN', 245, p.ulanLink },
	{ 'USCongress', 'US Congress', 1157, p.uscongressLink },
	{ 'VIAF', 'VIAF', 214, p.viafLink },
}

-- Legitimate aliases to p.conf, for convenience
-- Format: { alias, parameter name in p.conf }
p.aliases = {
	{ 'RLS', 'RSL' },
	{ 'MusicBrainz', 'MBA' },
	{ 'MusicBrainz artist', 'MBA' },
	{ 'MusicBrainz label', 'MBL' },
	{ 'MusicBrainz release group', 'MBRG' },
	{ 'MusicBrainz work', 'MBW' },
	{ 'Leonore', 'Léonore' },
}

-- Deprecated aliases to p.conf, which also get assigned to a tracking cat
-- Format: { deprecated parameter name, replacement parameter name in p.conf }
p.deprecated = {
	{ 'GKD', 'GND' },
	{ 'PND', 'GND' },
	{ 'SWD', 'GND' },
	{ 'NARA-organization', 'NARA' },
	{ 'NARA-person', 'NARA' },
}

--========================================================================== --                                  Main --==========================================================================

--Main entry point: renders the authority control navbox for the current page.
--Reads the parent frame's arguments, resolves aliases and deprecated names,
--optionally fills missing identifiers from Wikidata, builds one row per valid
--configured identifier plus a WorldCat row, and appends tracking categories.
--@param frame Scribunto frame of the invoking template
--@return wikitext of the navbox plus categories, or '' when there are no rows
--NOTE(review): several tracking-category literals below are empty strings in this
--copy (worldcatCat, suppressedIdCat, deprecatedIdCat); the category wikitext
--appears lost and should be restored from upstream.
function p.authorityControl( frame )
	local resolveEntity = require( "Module:ResolveEntityId" )
	--getParent must be called to obtain the parent frame
	local parentArgs = frame:getParent().args
	local elements = {} --create/insert rows later
	local worldcatCat = ''
	local suppressedIdCat = ''
	local deprecatedIdCat = ''

	--Redirect aliases to proper parameter names
	for _, a in pairs( p.aliases ) do
		local alias, param = a[1], a[2]
		if (parentArgs[param] == nil or parentArgs[param] == '') and parentArgs[alias] then
			parentArgs[param] = parentArgs[alias]
		end
	end

	--Redirect deprecated parameters to proper parameter names, and assign tracking cat
	for _, d in pairs( p.deprecated ) do
		local dep, param = d[1], d[2]
		if (parentArgs[param] == nil or parentArgs[param] == '') and parentArgs[dep] then
			parentArgs[param] = parentArgs[dep]
			if namespace == 0 then
				deprecatedIdCat = '' --NOTE(review): category wikitext missing
			end
		end
	end

	--Use QID= parameter for testing/example purposes only
	local itemId = nil
	if namespace ~= 0 then
		local qid = parentArgs['qid'] or parentArgs['QID']
		if qid then
			itemId = 'Q'..mw.ustring.gsub(qid, '^[Qq]', '')
			itemId = resolveEntity._id(itemId) --nil if unresolvable
		end
	else
		itemId = mw.wikibase.getEntityIdForCurrentPage()
	end

	--Wikidata fallback if requested
	if itemId then
		for _, params in ipairs( p.conf ) do
			if params[3] > 0 then
				local val = parentArgs[params[1]]
				if val == nil or val == '' then
					local canUseWikidata = nil
					if reqs[params[1]] then
						canUseWikidata = p.matchesWikidataRequirements( itemId, reqs[params[1]] )
					else
						canUseWikidata = true
					end
					if canUseWikidata then
						local wikidataIds = p.getIdsFromWikidata( itemId, 'P'..params[3] )
						if wikidataIds[1] then
							--an explicitly empty parameter suppresses the Wikidata value
							if val == '' and (namespace == 0 or testcases) then
								suppressedIdCat = '' --NOTE(review): category wikitext missing
							else
								parentArgs[params[1]] = wikidataIds[1]
							end
						end
					end
				end
			end
		end
	end

	--Configured rows
	local rct = 0
	for _, params in ipairs( p.conf ) do
		local val = parentArgs[params[1]]
		if val and val ~= '' then
			table.insert( elements, p.createRow( params[1], params[2]..':', val, params[4]( val ), true, params.category ) )
			rct = rct + 1
		end
	end

	--WorldCat
	--NOTE(review): the WorldCat rows presumably carried external links; only the
	--visible text survives in this copy. The empty label argument is restored as ''.
	local worldcatId = parentArgs['WORLDCATID']
	if worldcatId and worldcatId ~= '' then --if present & unsuppressed
		table.insert( elements, p.createRow( 'WORLDCATID', '', worldcatId, 'WorldCat Identities: '..worldcatId, false ) ) --Validation?
		worldcatCat = '' --NOTE(review): category wikitext missing
	elseif worldcatId == nil then --if absent & unsuppressed
		local viafId = parentArgs['VIAF']
		local lccnId = parentArgs['LCCN']
		if viafId and viafId ~= '' and p.viafLink( viafId ) then --VIAF must be present, unsuppressed, & validated
			table.insert( elements, p.createRow( 'VIAF', '', viafId, 'WorldCat Identities (via VIAF): '..viafId, false ) )
			if namespace == 0 then
				worldcatCat = '' --NOTE(review): category wikitext missing
			end
		elseif lccnId and lccnId ~= '' and p.lccnLink( lccnId ) then --LCCN must be present, unsuppressed, & validated
			local lccnParts = p.splitLccn( lccnId )
			if lccnParts and lccnParts[1] ~= 'sh' then
				local lccnIdFmtd = lccnParts[1]..lccnParts[2]..'-'..lccnParts[3]
				table.insert( elements, p.createRow( 'LCCN', '', lccnId, 'WorldCat Identities (via LCCN): '..lccnIdFmtd, false ) )
				if namespace == 0 then
					worldcatCat = '' --NOTE(review): category wikitext missing
				end
			end
		end
	elseif worldcatId == '' then --if suppressed
		suppressedIdCat = '' --NOTE(review): category wikitext missing
	end

	local Navbox = require('Module:Navbox')
	local elementsCat = ''
	if rct >= 20 then
		local catName = 'AC with '..rct..' elements'
		--NOTE(review): the category link for catName appears lost in this copy;
		--only the red-link check remains.
		elementsCat = ''..p.redCatLink(catName)
	end

	local outString = ''
	if #elements > 0 then
		local args = {}
		if testcases and itemId then args = { qid = itemId } end --expensive
		local pencil = frame:expandTemplate{ title = 'EditAtWikidata', args = args}
		outString = Navbox._navbox( {
			name = 'Authority control',
			navboxclass = 'authority-control',
			bodyclass = 'hlist',
			group1 = 'Authority control'..pencil,
			list1 = table.concat( elements )
			} )
		local auxCats = worldcatCat .. elementsCat .. suppressedIdCat .. deprecatedIdCat
		if testcases then
			auxCats = mw.ustring.gsub(auxCats, '(%[%[)(Category)', '%1:%2') --for easier checking
		end
		outString = outString .. auxCats
		if namespace ~= 0 then
			--outside article space, article-only categories become plain links
			outString = mw.ustring.gsub(outString, '(%[%[)(Category:Wikipedia articles)', '%1:%2') --by definition
		end
	end
	return outString
end

return p