Изменения

Модуль:Citation/CS1 (посмотреть исходный код)

Версия от 18:09, 24 декабря 2023

93 023 байта добавлено , 1 год назад

update from enwiki

Строка 1: Строка 1: +

require ('strict');

−

~~local z = {~~

+

--[[--------------------------< F O R W A R D D E C L A R A T I O N S >--------------------------------------

−

~~error_categories = {};~~ -- ~~for categorizing citations that contain errors~~

+

−

~~error_ids = {};~~

+

each of these counts against the Lua upvalue limit

−

~~message_tail = {};~~

−

~~maintenance_cats = {};~~ -- ~~for categorizing citations that aren't erroneous per se, but could use a little work~~

−

~~properties_cats = {};~~ -- ~~for categorizing citations based on certain properties, language~~ of ~~source for instance~~

−

}

−

~~--[[--------------------------< F O R W A R D D E C L A R A T I O N S >--------------------------------------~~

]]

−

~~local dates, year_date_check -- functions in Module:Citation/CS1/Date_validation~~

−

local ~~cfg = {}~~; -- ~~table of configuration tables that are defined~~ in Module:Citation/CS1/~~Configuration~~

+

local validation; -- functions in Module:Citation/CS1/Date_validation

−

~~local whitelist = {}; -- talbe of tables listing valid template parameter names; defined in Module:Citation/CS1/Whitelist~~

−

--~~[[------------------------------------------------------------------------------------------~~--

+

local utilities; -- functions in Module:Citation/CS1/Utilities

+

local z = {}; -- table of tables in Module:Citation/CS1/Utilities

−

~~Returns true if argument is set~~; ~~false otherwise. Argument is 'set' when it exists (~~not ~~nil) or when it is not an empty string.~~

+

local identifiers; -- functions and tables in Module:Citation/CS1/Identifiers

−

~~This function is global because it is called from both this module~~ and ~~from Date validation~~

+

local metadata; -- functions in Module:Citation/CS1/COinS

+

local cfg = {}; -- table of configuration tables that are defined in Module:Citation/CS1/Configuration

+

local whitelist = {}; -- table of tables listing valid template parameter names; defined in Module:Citation/CS1/Whitelist

+

--[[---------------------------------

+

declare variables here that have page-wide scope that are not brought in from

+

other modules; that are created here and used here

]]

−

~~function is_set( var )~~

+

−

~~return not (var == nil or var ==~~ '');

+

local added_deprecated_cat; -- Boolean flag so that the category is added only once

−

~~end~~

+

local added_vanc_errs; -- Boolean flag so we only emit one Vancouver error / category

+

local added_generic_name_errs; -- Boolean flag so we only emit one generic name error / category and stop testing names once an error is encountered

+

local added_numeric_name_errs; -- Boolean flag so we only emit one numeric name error / category and stop testing names once an error is encountered

+

local added_numeric_name_maint; -- Boolean flag so we only emit one numeric name maint category and stop testing names once a category has been emitted

+

local Frame; -- holds the module's frame table

+

local is_preview_mode; -- true when article is in preview mode; false when using 'Preview page with this template' (previewing the module)

+

local is_sandbox; -- true when using sandbox modules to render citation

+

--[[--------------------------< F I R S T _ S E T >------------------------------------------------------------

−

~~First~~ set ~~variable~~ or nil if none

+

Locates and returns the first set value in a table of values where the order established in the table,

+

left-to-right (or top-to-bottom), is the order in which the values are evaluated. Returns nil if none are set.

+

This version replaces the original 'for _, val in pairs do' and a similar version that used ipairs. With the pairs

+

version the order of evaluation could not be guaranteed. With the ipairs version, a nil value would terminate

+

the for-loop before it reached the actual end of the list.

]]

−

local function first_set(~~...~~)

+

local function first_set (list, count)

−

local ~~list~~ = ~~{...}~~;

+

local i = 1;

−

~~for _, var~~ in ~~pairs(~~list~~) do~~

+

while i <= count do -- loop through all items in list

−

if is_set( ~~var~~ ) then

+

if utilities.is_set( list[i] ) then

−

return ~~var~~;

+

return list[i]; -- return the first set list member

end

+

i = i + 1; -- point to next

end

−

~~--[[----------------------------------------------------------------------------------------~~

−

~~Whether needle~~ is in ~~haystack~~

+

--[[--------------------------< A D D _ V A N C _ E R R O R >----------------------------------------------------

+

Adds a single Vancouver system error message to the template's output regardless of how many error actually exist.

+

To prevent duplication, added_vanc_errs is nil until an error message is emitted.

+

added_vanc_errs is a Boolean declared in page scope variables above

]]

−

local function ~~in_array~~( ~~needle~~, ~~haystack~~ )

+

local function add_vanc_error (source, position)

−

if ~~needle == nil~~ then

+

if added_vanc_errs then return end

−

~~return false;~~

+

−

~~end~~

+

added_vanc_errs = true; -- note that we've added this category

−

~~for n~~,~~v in ipairs( haystack~~ ) do

+

utilities.set_message ('err_vancouver', {source, position});

−

~~if v == needle then~~

−

~~return n;~~

−

~~end~~

−

~~end~~

−

~~return false~~;

end

−

~~--[[--------------------------< S U B S T I T U T E >----------------------------------------------------------~~

−

~~Populates numbered arguments~~ in a ~~message string using an argument table~~.

+

--[[--------------------------------------------------------------------------------------

+

does this thing that purports to be a URI scheme seem to be a valid scheme? The scheme is checked to see if it

+

is in agreement with http://tools.ietf.org/html/std66#section-3.1 which says:

+

Scheme names consist of a sequence of characters beginning with a

+

letter and followed by any combination of letters, digits, plus

+

("+"), period ("."), or hyphen ("-").

+

returns true if it does, else false

]]

−

local function ~~substitute~~( ~~msg, args~~ )

+

local function is_scheme (scheme)

−

return ~~args~~ and ~~mw.message~~.~~newRawMessage( msg, args )~~:~~plain(~~) ~~or msg~~;

+

return scheme and scheme:match ('^%a[%a%d%+%.%-]*:'); -- true if scheme is set and matches the pattern

end

−

~~--[[--------------------------< E R R O R _ C O M M E N T >----------------------------------------------------~~

−

~~Wraps error messages with css markup according~~ to the ~~state~~ of ~~hidden~~.

+

--[=[---------------------------------------------------------------------------

+

Does this thing that purports to be a domain name seem to be a valid domain name?

+

Syntax defined here: http://tools.ietf.org/html/rfc1034#section-3.5

+

BNF defined here: https://tools.ietf.org/html/rfc4234

+

Single character names are generally reserved; see https://tools.ietf.org/html/draft-ietf-dnsind-iana-dns-01#page-15;

+

see also [[Single-letter second-level domain]]

+

list of TLDs: https://www.iana.org/domains/root/db

+

RFC 952 (modified by RFC 1123) requires the first and last character of a hostname to be a letter or a digit. Between

+

the first and last characters the name may use letters, digits, and the hyphen.

−

]]

+

Also allowed are IPv4 addresses. IPv6 not supported

−

~~local function error_comment( content, hidden )~~

−

~~return substitute( hidden and cfg~~.~~presentation['hidden-error'] or cfg.presentation['visible-error'], content );~~

−

~~end~~

−

~~--[[--------------------------< S E T _ E R R O R >--------------------------------------------------------------~~

+

domain is expected to be stripped of any path so that the last character in the last character of the TLD. tld

+

is two or more alpha characters. Any preceding '//' (from splitting a URL with a scheme) will be stripped

+

here. Perhaps not necessary but retained in case it is necessary for IPv4 dot decimal.

−

~~Sets an error condition~~ and ~~returns~~ the ~~appropriate error message~~. ~~The actual placement of~~ the ~~error message~~ in the ~~output~~ is

+

There are several tests:

−

the ~~responsibility of~~ the ~~calling function.~~

+

the first character of the whole domain name including subdomains must be a letter or a digit

+

internationalized domain name (ASCII characters with .xn-- ASCII Compatible Encoding (ACE) prefix xn-- in the TLD) see https://tools.ietf.org/html/rfc3490

+

single-letter/digit second-level domains in the .org, .cash, and .today TLDs

+

q, x, and z SL domains in the .com TLD

+

i and q SL domains in the .net TLD

+

single-letter SL domains in the ccTLDs (where the ccTLD is two letters)

+

two-character SL domains in gTLDs (where the gTLD is two or more letters)

+

three-plus-character SL domains in gTLDs (where the gTLD is two or more letters)

+

IPv4 dot-decimal address format; TLD not allowed

−

]]

+

returns true if domain appears to be a proper name and TLD or IPv4 address, else false

−

local function ~~set_error~~( ~~error_id, arguments, raw, prefix, suffix~~ )

+

−

~~local error_state = cfg.error_conditions[ error_id ];~~

+

]=]

−

+

−

~~prefix = prefix or "";~~

+

local function is_domain_name (domain)

−

~~suffix = suffix or "";~~

+

if not domain then

−

+

return false; -- if not set, abandon

−

if ~~error_state == nil~~ then

−

~~error( cfg.messages['undefined_error'] )~~;

−

~~elseif is_set( error_state.category ) then~~

−

~~table.insert( z.error_categories~~, ~~error_state.category );~~

end

−

~~local message~~ = ~~substitute~~( ~~error_state.message~~, ~~arguments~~ );

+

domain = domain:gsub ('^//', ''); -- strip '//' from domain name if present; done here so we only have to do it once

−

~~message = message .. "~~ (~~[[" .. cfg.messages['help page link'] ..~~

+

if not domain:match ('^[%w]') then -- first character must be letter or digit

−

~~"#" .. error_state.anchor .. "|" ..~~

+

return false;

−

~~cfg.messages['help page label~~'~~] .. "]])";~~

−

~~z.error_ids~~[ ~~error_id~~ ] ~~= true;~~

−

~~if in_array( error_id, { 'bare_url_missing_title', 'trans_missing_title~~' } )

−

~~and z.error_ids['citation_missing_title']~~ then

−

return ~~'',~~ false;

end

−

~~message = table.concat({ prefix, message, suffix });~~

−

~~if raw == true then~~

−

~~return message, error_state.hidden;~~

−

~~end~~

−

~~return error_comment( message, error_state.hidden );~~

−

~~end~~

−

--~~[[--------------------------< A D D _ M A I N T _ C A T >------------------------------------------------------~~

+

if domain:match ('^%a+:') then -- hack to detect things that look like s:Page:Title where Page: is namespace at Wikisource

+

return false;

+

end

−

~~Adds~~ a ~~category to z~~.~~maintenance_cats using names from the configuration file~~ with ~~additional text if any~~.

+

local patterns = { -- patterns that look like URLs

+

'%f[%w][%w][%w%-]+[%w]%.%a%a+$', -- three or more character hostname.hostname or hostname.tld

+

'%f[%w][%w][%w%-]+[%w]%.xn%-%-[%w]+$', -- internationalized domain name with ACE prefix

+

'%f[%a][qxz]%.com$', -- assigned one character .com hostname (x.com times out 2015-12-10)

+

'%f[%a][iq]%.net$', -- assigned one character .net hostname (q.net registered but not active 2015-12-10)

+

'%f[%w][%w]%.%a%a$', -- one character hostname and ccTLD (2 chars)

+

'%f[%w][%w][%w]%.%a%a+$', -- two character hostname and TLD

+

'^%d%d?%d?%.%d%d?%d?%.%d%d?%d?%.%d%d?%d?', -- IPv4 address

+

}

−

]]

+

for _, pattern in ipairs (patterns) do -- loop through the patterns list

+

if domain:match (pattern) then

+

return true; -- if a match then we think that this thing that purports to be a URL is a URL

+

end

+

end

−

~~local function add_maint_cat (key, arguments)~~

+

for _, d in ipairs (cfg.single_letter_2nd_lvl_domains_t) do -- look for single letter second level domain names for these top level domains

−

~~table.insert( z.maintenance_cats~~, ~~substitute~~ (cfg.~~maint_cats~~ [~~key~~]~~, arguments)~~); -- ~~make name then add to table~~

+

if domain:match ('%f[%w][%w]%.' .. d) then

+

return true

+

end

+

end

+

return false; -- no matches, we don't know what this thing is

end

−

~~--[[--------------------------< A D D _ P R O P _ C A T >--------------------------------------------------------~~

−

~~Adds~~ a ~~category~~ to z.~~properties_cats using names from~~ the ~~configuration file with additional text if any~~.

+

--[[--------------------------------------------------------------------------------------------

+

returns true if the scheme and domain parts of a URL appear to be a valid URL; else false.

+

This function is the last step in the validation process. This function is separate because there are cases that

+

are not covered by split_url(), for example is_parameter_ext_wikilink() which is looking for bracketted external

+

wikilinks.

]]

−

local function ~~add_prop_cat~~ (~~key~~, ~~arguments~~)

+

local function is_url (scheme, domain)

−

~~table~~.~~insert~~( ~~z.properties_cats, substitute~~ (~~cfg.prop_cats [key], arguments~~)); -- ~~make name then add to table~~

+

if utilities.is_set (scheme) then -- if scheme is set check it and domain

+

return is_scheme (scheme) and is_domain_name (domain);

+

else

+

return is_domain_name (domain); -- scheme not set when URL is protocol-relative

+

end

−

~~--[[--------------------------< C H E C K _ U R L >------------------------------------------------------------~~

−

~~Determines whether a URL string is valid.~~

+

--[[--------------------------< S P L I T _ U R L >------------------------------------------------------------

−

~~At present the only check is whether the string appears to be prefixed with~~ a ~~URI scheme. It is not determined whether~~

+

Split a URL into a scheme, authority indicator, and domain.

−

~~the URI~~ scheme ~~is valid or whether the URL is otherwise well formed~~.

−

]]

+

First remove Fully Qualified Domain Name terminator (a dot following TLD) (if any) and any path(/), query(?) or fragment(#).

−

~~local function check_url( url_str )~~

+

If protocol-relative URL, return nil scheme and domain else return nil for both scheme and domain.

−

~~return url_str:sub(1,2) == "//" or url_str:match( "^[^/]*:" ) ~= nil; -- Protocol~~-relative or URL scheme

−

~~end~~

−

-~~-[[--------------------------< S A F E _ F O R _ I T A L I C S >----------------------------------------------~~

+

When not protocol-relative, get scheme, authority indicator, and domain. If there is an authority indicator (one

+

or more '/' characters immediately following the scheme's colon), make sure that there are only 2.

−

~~Protects a string~~ that ~~will be wrapped in wiki italic markup ''~~ .~~.. '~~'

+

Any URL that does not have news: scheme must have authority indicator (//). TODO: are there other common schemes

+

like news: that don't use authority indicator?

−

~~Note: We cannot use for italics, as the expected behavior for italics specified by ''...'' in the title is that~~

+

Strip off any port and path;

−

~~they will be inverted (i.e. unitalicized) in the resulting references. In addition, ~~ and ~~'' tend to interact~~

−

~~poorly under Mediawiki's HTML tidy.~~

]]

−

local function ~~safe_for_italics~~( ~~str~~ )

+

local function split_url (url_str)

−

if ~~not is_set~~(~~str~~) then

+

local scheme, authority, domain;

−

~~return str;~~

+

−

~~else~~

+

url_str = url_str:gsub ('([%a%d])%.?[/%?#].*$', '%1'); -- strip FQDN terminator and path(/), query(?), fragment (#) (the capture prevents false replacement of '//')

−

if ~~str~~:~~sub~~(1,1) ~~== "~~'~~" then str = "<span~~ /~~>" .. str~~; ~~end~~

+

−

if ~~str:sub~~(-1,-1) ~~== "'"~~ then ~~str = str .. ""~~; end

+

if url_str:match ('^//%S*') then -- if there is what appears to be a protocol-relative URL

−

+

domain = url_str:match ('^//(%S*)')

−

-- ~~Remove newlines as they break italics~~.

+

elseif url_str:match ('%S-:/*%S+') then -- if there is what appears to be a scheme, optional authority indicator, and domain name

−

~~return str~~:gsub( '\n', ' ' );

+

scheme, authority, domain = url_str:match ('(%S-:)(/*)(%S+)'); -- extract the scheme, authority indicator, and domain portions

+

if utilities.is_set (authority) then

+

authority = authority:gsub ('//', '', 1); -- replace place 1 pair of '/' with nothing;

+

if utilities.is_set(authority) then -- if anything left (1 or 3+ '/' where authority should be) then

+

return scheme; -- return scheme only making domain nil which will cause an error message

+

end

+

else

+

if not scheme:match ('^news:') then -- except for news:..., MediaWiki won't link URLs that do not have authority indicator; TODO: a better way to do this test?

+

return scheme; -- return scheme only making domain nil which will cause an error message

+

end

+

end

+

domain = domain:gsub ('(%a):%d+', '%1'); -- strip port number if present

end

+

return scheme, domain;

end

−

~~--[[--------------------------< S A F E _ F O R _ U R L >------------------------------------------------------~~

−

~~Escape sequences for content that will be used for URL descriptions~~

+

--[[--------------------------< L I N K _ P A R A M _ O K >---------------------------------------------------

−

]]

+

checks the content of |title-link=, |series-link=, |author-link=, etc. for properly formatted content: no wikilinks, no URLs

−

~~local function safe_for_url( str )~~

+

Link parameters are to hold the title of a Wikipedia article, so none of the WP:TITLESPECIALCHARACTERS are allowed:

−

~~if str:match( "%~~[~~%[.-%~~]~~%]" ) ~= nil then~~

+

# < > [ ] | { } _

−

~~table.insert( z.message_tail, { set_error( 'wikilink_in_url',~~ {}~~, true ) } );~~

+

except the underscore which is used as a space in wiki URLs and # which is used for section links

−

~~end~~

−

~~return str:gsub( '[%[%]\n]', {~~

−

~~['['] = '[',~~

−

~~[']'] = '&~~#~~93;',~~

−

~~['\n'] = ' ' } );~~

−

~~end~~

−

~~--[[--------------------------< W R A P _ S T Y L E >----------------------------------------------------------~~

+

returns false when the value contains any of these characters.

−

~~Applies styling~~ to ~~various parameters. Supplied string is wrapped using~~ a ~~message_list configuration taking one~~

+

When there are no illegal characters, this function returns TRUE if value DOES NOT appear to be a valid URL (the

−

~~argument; protects italic styled parameters. Additional text taken from citation_config.presentation~~ - ~~the reason~~

+

|<param>-link= parameter is ok); else false when value appears to be a valid URL (the |<param>-link= parameter is NOT ok).

−

~~this function~~ is ~~similar~~ to ~~but separate from wrap_msg~~().

]]

−

local function ~~wrap_style~~ (~~key, str~~)

+

local function link_param_ok (value)

−

~~if not is_set( str ) then~~

+

local scheme, domain;

−

~~return ""~~;

+

if value:find ('[<>%[%]|{}]') then -- if any prohibited characters

−

~~elseif in_array~~( ~~key,~~ { '~~italic~~-~~title', 'trans~~-~~italic-title' } ) then~~

+

return false;

−

~~str = safe_for_italics( str )~~;

end

−

return ~~substitute~~( ~~cfg.presentation[key]~~, ~~{str}~~ );

+

scheme, domain = split_url (value); -- get scheme or nil and domain or nil from URL;

+

return not is_url (scheme, domain); -- return true if value DOES NOT appear to be a valid URL

end

−

~~--[[--------------------------< E X T E R N A L _ L I N K >----------------------------------------------------~~

−

~~Format~~ an ~~external~~ link with ~~error checking~~

+

--[[--------------------------< L I N K _ T I T L E _ O K >---------------------------------------------------

+

Use link_param_ok() to validate |<param>-link= value and its matching |<title>= value.

+

|<title>= may be wiki-linked but not when |<param>-link= has a value. This function emits an error message when

+

that condition exists

+

check <link> for inter-language interwiki-link prefix. prefix must be a MediaWiki-recognized language

+

code and must begin with a colon.

]]

−

local function ~~external_link~~( ~~URL~~, ~~label~~, ~~source~~ )

+

local function link_title_ok (link, lorig, title, torig)

−

local ~~error_str = ""~~;

+

local orig;

−

if ~~not~~ is_set( ~~label~~ ) then

+

if utilities.is_set (link) then -- don't bother if <param>-link doesn't have a value

−

~~label~~ = ~~URL~~;

+

if not link_param_ok (link) then -- check |<param>-link= markup

−

~~if is_set~~( ~~source~~ ) then

+

orig = lorig; -- identify the failing link parameter

−

~~error_str~~ = ~~set_error~~( '~~bare_url_missing_title~~'~~, { wrap_style~~ ('~~parameter~~'~~, source~~) ~~}, false, " "~~ );

+

elseif title:find ('%[%[') then -- check |title= for wikilink markup

−

~~else~~

+

orig = torig; -- identify the failing |title= parameter

−

~~error(~~ cfg.~~messages~~[~~"bare_url_no_origin"~~] );

+

elseif link:match ('^%a+:') then -- if the link is what looks like an interwiki

−

end

+

local prefix = link:match ('^(%a+):'):lower(); -- get the interwiki prefix

+

if cfg.inter_wiki_map[prefix] then -- if prefix is in the map, must have preceding colon

+

orig = lorig; -- flag as error

+

end

+

end

−

if ~~not check_url~~( ~~URL~~ ) then

+

−

~~error_str~~ = ~~set_error~~( '~~bad_url~~', ~~{}, false, " "~~ ) ~~.. error_str~~;

+

if utilities.is_set (orig) then

+

link = ''; -- unset

+

utilities.set_message ('err_bad_paramlink', orig); -- URL or wikilink in |title= with |title-link=;

end

−

return ~~table.concat({ "[", URL, " ", safe_for_url( label )~~, ~~"]", error_str });~~

+

return link; -- link if ok, empty string else

end

−

~~--[[--------------------------< E X T E R N A L _ L I N K _ I D >----------------------------------------------~~

−

~~Formats~~ a ~~wiki style~~ external ~~link~~

+

--[[--------------------------< C H E C K _ U R L >------------------------------------------------------------

+

Determines whether a URL string appears to be valid.

+

First we test for space characters. If any are found, return false. Then split the URL into scheme and domain

+

portions, or for protocol-relative (//example.com) URLs, just the domain. Use is_url() to validate the two

+

portions of the URL. If both are valid, or for protocol-relative if domain is valid, return true, else false.

+

Because it is different from a standard URL, and because this module used external_link() to make external links

+

that work for standard and news: links, we validate newsgroup names here. The specification for a newsgroup name

+

is at https://tools.ietf.org/html/rfc5536#section-3.1.4

]]

−

local function ~~external_link_id~~(~~options~~)

+

local function check_url( url_str )

−

~~local url_string = options.id;~~

+

if nil == url_str:match ("^%S+$") then -- if there are any spaces in |url=value it can't be a proper URL

−

if ~~options.encode~~ == ~~true or options.encode =~~= ~~nil then~~

+

return false;

−

~~url_string = mw.uri.encode( url_string )~~;

end

−

~~return mw.ustring.format( '[[%s|%s]]%s[%s%s%s %s]'~~,

+

local scheme, domain;

−

~~options.link, options.label, options.separator or " ",~~

−

~~options.prefix, url_string, options.suffix or "",~~

−

~~mw.text.nowiki(options.id)~~

−

);

−

~~end~~

−

--[[

+

scheme, domain = split_url (url_str); -- get scheme or nil and domain or nil from URL;

−

~~Categorize~~ and ~~emit an error message when the citation contains one~~ or ~~more deprecated parameters. Because deprecated parameters (currently |month=,~~

+

−

~~|coauthor=, and |coauthors=) aren't related to each other and because these parameters may be concatenated into the variables used by |date= and |author#= (and aliases)~~

+

if 'news:' == scheme then -- special case for newsgroups

−

~~details of which parameter caused the error message are not provided. Only one error message is emitted regardless of the number of deprecated parameters in the citation.~~

+

return domain:match('^[%a%d%+%-_]+%.[%a%d%+%-_%.]*[%a%d%+%-_]$');

−

]]

−

~~local function deprecated_parameter(name)~~

−

if ~~true ~~~= ~~Page_in_deprecated_cat~~ then -- ~~if we haven~~'~~t been here before then set~~ a

−

~~Page_in_deprecated_cat=true;~~ -- ~~sticky flag so that if there are more than one deprecated parameter the category is added only once~~

−

~~table~~.~~insert( z.message_tail, { set_error(~~ '~~deprecated_params', {name}, true ) }~~ ); ~~-- add error message~~

end

+

return is_url (scheme, domain); -- return true if value appears to be a valid URL

end

−

~~--[[--------------------------< K E R N _ Q U O T E S >--------------------------------------------------------~~

−

~~Apply kerning to open~~ the space ~~between~~ the ~~quote mark provided by the Module and~~ a ~~leading or trailing quote mark contained in~~ a |title= or |chapter= ~~parameter's value.~~

+

--[=[-----------------------------------------------------

−

~~This function will positive kern either single~~ or ~~double quotes:~~

+

−

"'~~Unkerned~~ title ~~with leading and trailing single quote marks'"~~

+

Return true if a parameter value has a string that begins and ends with square brackets [ and ] and the first

−

~~" 'Kerned title with leading and trailing single quote marks' " (in real life the kerning isn't~~ as ~~wide as this example)~~

+

non-space characters following the opening bracket appear to be a URL. The test will also find external wikilinks

−

~~Double single quotes (italic or bold wikimarkup) are not kerned~~.

+

that use protocol-relative URLs. Also finds bare URLs.

+

The frontier pattern prevents a match on interwiki-links which are similar to scheme:path URLs. The tests that

+

find bracketed URLs are required because the parameters that call this test (currently |title=, |chapter=, |work=,

+

and |publisher=) may have wikilinks and there are articles or redirects like '//Hus' so, while uncommon, |title=[[//Hus]]

+

is possible as might be [[en://Hus]].

−

~~Call this function for chapter titles, for website titles, etc; not for book titles.~~

+

]=]

−

]]

+

local function is_parameter_ext_wikilink (value)

+

local scheme, domain;

−

~~local function kern_quotes~~ (~~str~~)

+

if value:match ('%f[%[]%[%a%S*:%S+.*%]') then -- if ext. wikilink with scheme and domain: [xxxx://yyyyy.zzz]

−

~~local cap~~='';

+

scheme, domain = split_url (value:match ('%f[%[]%[(%a%S*:%S+).*%]'));

−

~~local cap2=~~'';

+

elseif value:match ('%f[%[]%[//%S+.*%]') then -- if protocol-relative ext. wikilink: [//yyyyy.zzz]

−

+

scheme, domain = split_url (value:match ('%f[%[]%[(//%S+).*%]'));

−

~~cap~~, ~~cap2~~ = ~~str~~:match ("^(~~[\"\~~'])(~~[^\~~'].+)~~");~~ -- ~~match~~ leading ~~double~~ or ~~single quote but not double single quotes~~

+

elseif value:match ('%a%S*:%S+') then -- if bare URL with scheme; may have leading or trailing plain text

−

~~if is_set~~ (~~cap~~) then

+

scheme, domain = split_url (value:match ('(%a%S*:%S+)'));

−

~~str~~ = ~~substitute~~ (~~cfg.presentation[~~'~~kern~~-left'~~], {cap, cap2});~~

+

elseif value:match ('//%S+') then -- if protocol-relative bare URL: //yyyyy.zzz; may have leading or trailing plain text

+

scheme, domain = split_url (value:match ('(//%S+)')); -- what is left should be the domain

+

else

+

return false; -- didn't find anything that is obviously a URL

end

−

~~cap, cap2 = str:match~~ (~~"^(.+[^\'])([\"\'])$")~~

+

return is_url (scheme, domain); -- return true if value appears to be a valid URL

−

~~if is_set (cap) then~~

−

~~str = substitute (cfg.presentation['kern-right'], {cap~~, ~~cap2}~~);

−

~~end~~

−

return ~~str;~~

end

−

~~--[[--------------------------< F O R M A T _ S C R I P T _ V A L U E >----------------------------------------~~

−

~~|script-title= holds title parameters that are not written in Latin based scripts: Chinese, Japanese, Arabic, Hebrew, etc. These scripts should~~

−

~~not be italicized and may be written right-to-left. The value supplied by |script-title= is concatenated onto Title after Title has been wrapped~~

−

~~in italic markup.~~

−

~~Regardless of language, all values provided by |script-title= are wrapped in <bdi>...</bdi> tags to isolate rtl languages from the English left to right.~~

−

~~|script-title= provides a unique feature. The value in |script-title= may be prefixed with a two-character ISO639-1 language code and a colon:~~

−

~~|script-title=ja:*** *** (where * represents a Japanese character)~~

−

~~Spaces between the two-character code and the colon and the colon and the first script character are allowed:~~

−

|script-title=ja : *** ***

−

|script-title=ja: *** ***

−

|script-title=ja :*** ***

−

Spaces preceding the prefix are allowed: |script-title = ja:*** ***

−

~~The prefix is checked for validity. If it is a valid ISO639~~-~~1 language code, the lang attribute (lang="ja") is added to the~~ <~~bdi~~> ~~tag so that browsers can~~

+

--[[-------------------------< C H E C K _ F O R _ U R L >-----------------------------------------------------

−

~~know the language the tag contains. This may help the browser render the script more correctly. If the prefix is invalid, the lang attribute~~

−

~~is not added. At this time there is no error message for this condition.~~

−

~~At this writing, only |script-title= is supported~~. ~~It is anticipated that additional parameters will be created to use this function~~.

+

loop through a list of parameters and their values. Look at the value and if it has an external link, emit an error message.

−

~~TODO: error messages when prefix is invalid ISO639-1 code; when script_value has prefix but no script;~~

]]

−

local function ~~format_script_value~~ (~~script_value~~)

+

local function check_for_url (parameter_list, error_list)

−

~~local lang=''; -- initialize to empty string~~

+

for k, v in pairs (parameter_list) do -- for each parameter in the list

−

~~local name;~~

+

if is_parameter_ext_wikilink (v) then -- look at the value; if there is a URL add an error message

−

~~if script_value:match~~(~~'^%l%l%s*:'~~) ~~then~~ -- ~~if first 3 non-space characters are script language prefix~~

+

table.insert (error_list, utilities.wrap_style ('parameter', k));

−

~~lang = script_value:match('^(%l%l)%s*:%s*%S.*'); -- get~~ the ~~language prefix or nil if there is no script~~

−

if ~~not is_set~~ (~~lang~~) then

−

~~return '';~~ -- ~~script_value was just~~ the ~~prefix so return empty string~~

−

~~end~~

−

~~-- if we get this far we have prefix and script~~

−

~~name = mw.language.fetchLanguageName( lang, "en" )~~; ~~-- get language name so that we can use it to categorize~~

−

if ~~is_set (name) then --~~ is ~~prefix~~ a ~~proper ISO 639-1 language code?~~

−

~~script_value = script_value:gsub~~ (~~'^%l%l%s*:%s*'~~, ~~''); -- strip prefix from script~~

−

~~-- is prefix one of these language codes?~~

−

~~if in_array (lang, {'ar', 'bg', 'bs', 'dv', 'el', 'fa', 'hy', 'ja', 'ka', 'ko', 'ku', 'he', 'ps', 'ru', 'sd', 'sr', 'th', 'uk', 'ug', 'yi', 'zh'}) then~~

−

~~add_prop_cat~~ ('~~script_with_name~~', ~~{name, lang}~~)

−

~~else~~

−

~~add_prop_cat ('script'~~)

−

~~end~~

−

~~lang = ' lang="' .. lang .. '" '; -- convert prefix into a lang attribute~~

−

~~else~~

−

~~lang = ''~~; ~~-- invalid so set lang to empty string~~

end

−

~~script_value = substitute (cfg.presentation['bdi'], {lang, script_value}); -- isolate in case script is rtl~~

−

~~return script_value;~~

end

−

~~--[[--------------------------< S C R I P T _ C O N C A T E N A T E >------------------------------------------~~

−

~~Initially for |title= and |script~~-~~title=, this function concatenates those two parameter values after the script value has been~~

+

--[[--------------------------< S A F E _ F O R _ U R L >------------------------------------------------------

−

~~wrapped in~~ <~~bdi~~> ~~tags.~~

+

Escape sequences for content that will be used for URL descriptions

+

]]

−

local function ~~script_concatenate~~ (~~title, script~~)

+

local function safe_for_url( str )

−

if ~~is_set~~ (~~script~~) then

+

if str:match( "%[%[.-%]%]" ) ~= nil then

−

~~script = format_script_value~~ (~~script); -- <bdi> tags, lang atribute, categorization~~, ~~etc; returns empty string on error~~

+

utilities.set_message ('err_wikilink_in_url', {});

−

~~if is_set (script~~) ~~then~~

−

~~title = title .. ' ' .. script~~; ~~-- concatenate title and script title~~

−

~~end~~

end

−

return ~~title~~;

+

return str:gsub( '[%[%]\n]', {

+

['['] = '[',

+

[']'] = ']',

+

['\n'] = ' ' } );

end

−

--[[--------------------------< W R A P _ ~~M S G~~ >~~----------~~----------------------------------------------------

+

--[[--------------------------< E X T E R N A L _ L I N K >----------------------------------------------------

−

~~Applies additional message text to various parameter values. Supplied string is wrapped using a message_list~~

+

Format an external link with error checking

−

~~configuration taking one argument. Supports lower case text for {{citation}} templates. Additional text taken~~

−

~~from citation_config.messages - the reason this function is similar to but separate from wrap_style().~~

]]

−

local function ~~wrap_msg~~ (~~key~~, ~~str~~, ~~lower~~)

+

local function external_link (URL, label, source, access)

−

if not is_set( ~~str~~ ) then

+

local err_msg = '';

−

~~return~~ "";

+

local domain;

+

local path;

+

local base_url;

+

if not utilities.is_set (label) then

+

label = URL;

+

if utilities.is_set (source) then

+

utilities.set_message ('err_bare_url_missing_title', {utilities.wrap_style ('parameter', source)});

+

else

+

error (cfg.messages["bare_url_no_origin"]); -- programmer error; valid parameter name does not have matching meta-parameter

+

end

+

end

+

if not check_url (URL) then

+

utilities.set_message ('err_bad_url', {utilities.wrap_style ('parameter', source)});

end

−

if ~~true == lower~~ then

+

−

~~local msg~~;

+

domain, path = URL:match ('^([/%.%-%+:%a%d]+)([/%?#].*)$'); -- split the URL into scheme plus domain and path

−

~~msg~~ = ~~cfg~~.~~messages[key]:lower~~(); -- ~~set the message to lower case before~~

+

if path then -- if there is a path portion

−

~~str~~ = ~~substitute~~( ~~msg~~, ~~{str~~} ); -- ~~including template text~~

+

path = path:gsub ('[%[%]]', {['['] = '%5b', [']'] = '%5d'}); -- replace '[' and ']' with their percent-encoded values

−

~~return str;~~

+

URL = table.concat ({domain, path}); -- and reassemble

−

~~else~~

+

end

−

~~return~~ substitute( cfg.~~messages~~[~~key~~], {~~str~~} );

+

−

end

+

base_url = table.concat ({ "[", URL, " ", safe_for_url (label), "]" }); -- assemble a wiki-markup URL

+

if utilities.is_set (access) then -- access level (subscription, registration, limited)

+

base_url = utilities.substitute (cfg.presentation['ext-link-access-signal'], {cfg.presentation[access].class, cfg.presentation[access].title, base_url}); -- add the appropriate icon

+

end

+

return base_url;

end

−

~~--[[--------------------------< S E L E C T _ O N E >----------------------------------------------------------~~

−

~~Chooses~~ one ~~matching~~ parameter ~~from a list of parameters~~ to ~~consider~~

+

--[[--------------------------< D E P R E C A T E D _ P A R A M E T E R >--------------------------------------

−

~~Generates an~~ error ~~if more than~~ one ~~match~~ is ~~present~~.

+

Categorize and emit an error message when the citation contains one or more deprecated parameters. The function includes the

+

offending parameter name to the error message. Only one error message is emitted regardless of the number of deprecated

+

parameters in the citation.

+

added_deprecated_cat is a Boolean declared in page scope variables above

]]

−

local function ~~select_one~~( ~~args, possible, error_condition, index~~ )

+

local function deprecated_parameter(name)

−

~~local value = nil;~~

+

if not added_deprecated_cat then

−

~~local selected = '';~~

+

added_deprecated_cat = true; -- note that we've added this category

−

~~local error_list = {};~~

+

utilities.set_message ('err_deprecated_params', {name}); -- add error message

−

if ~~index ~= nil~~ then ~~index~~ = ~~tostring(index)~~; ~~end~~

−

-- ~~Handle special case of "#" replaced by empty string~~

−

~~if index ==~~ '~~1' then~~

−

~~for _, v in ipairs( possible ) do~~

−

~~v = v:gsub( "#", "" );~~

−

~~if is_set(args[v]) then~~

−

~~if value ~= nil and selected ~= v then~~

−

~~table~~.~~insert~~( ~~error_list~~, v );

−

~~else~~

−

~~value = args[v];~~

−

~~selected = v;~~

−

~~end~~

−

~~end~~

−

~~end~~

end

−

+

end

−

~~for _, v in ipairs( possible ) do~~

+

−

~~if index ~= nil then~~

+

−

v = ~~v:gsub( "#", index );~~

+

--[=[-------------------------< K E R N _ Q U O T E S >--------------------------------------------------------

−

~~end~~

+

−

~~if is_set(args[v]) then~~

+

Apply kerning to open the space between the quote mark provided by the module and a leading or trailing quote

−

~~if value ~~~= ~~nil and selected ~~~= ~~v then~~

+

mark contained in a |title= or |chapter= parameter's value.

−

~~table~~.~~insert( error_list, v );~~

+

−

~~else~~

+

This function will positive kern either single or double quotes:

−

~~value = args[v];~~

+

"'Unkerned title with leading and trailing single quote marks'"

−

~~selected = v;~~

+

" 'Kerned title with leading and trailing single quote marks' " (in real life the kerning isn't as wide as this example)

−

~~end~~

+

Double single quotes (italic or bold wiki-markup) are not kerned.

−

~~end~~

+

−

~~end~~

+

Replaces Unicode quote marks in plain text or in the label portion of a [[L|D]] style wikilink with typewriter

−

+

quote marks regardless of the need for kerning. Unicode quote marks are not replaced in simple [[D]] wikilinks.

−

~~if #error_list > 0 then~~

−

~~local error_str =~~ "";

−

~~for _, k in ipairs( error_list ) do~~

−

~~if error_str ~=~~ "~~" then error_str = error_str .. cfg.messages[~~'~~parameter-separator~~'~~] end~~

−

~~error_str = error_str .. wrap_style~~ ('~~parameter', k~~);

−

~~end~~

−

~~if #error_list > 1 then~~

−

~~error_str = error_str .. cfg.messages~~[~~'parameter-final-separator'~~];

−

~~else~~

−

~~error_str = error_str~~ .~~. cfg.messages~~[~~'parameter-pair-separator'~~];

−

~~end~~

−

~~error_str = error_str .. wrap_style ('parameter', selected);~~

−

~~table.insert( z~~.~~message_tail, { set_error( error_condition, {error_str}, true ) } );~~

−

~~end~~

−

~~return value, selected;~~

−

~~end~~

−

~~--[[--------------------------< F O R M A T _ C H A P T E R _ T I T L E >--------------------------------------~~

+

Call this function for chapter titles, for website titles, etc.; not for book titles.

−

~~Format the three chapter parameters: |chapter~~=~~, |trans-chapter=, and |chapter-url= into a single Chapter meta-~~

+

]=]

−

~~parameter (chapter_url_source used for error messages).~~

−

]]

+

local function kern_quotes (str)

+

local cap = '';

+

local wl_type, label, link;

−

~~local function format_chapter_title (chapter~~, ~~transchapter~~, ~~chapterurl~~, ~~chapter_url_source~~)

+

wl_type, label, link = utilities.is_wikilink (str); -- wl_type is: 0, no wl (text in label variable); 1, [[D]]; 2, [[L|D]]

−

~~local chapter_error = ''~~;

−

if ~~not is_set~~ (~~chapter~~) then

+

if 1 == wl_type then -- [[D]] simple wikilink with or without quote marks

−

~~chapter~~ = ''; -~~- just to be safe for concatenation~~

+

if mw.ustring.match (str, '%[%[[\"“”\'‘’].+[\"“”\'‘’]%]%]') then -- leading and trailing quote marks

−

~~if is_set~~ (~~transchapter~~) then

+

str = utilities.substitute (cfg.presentation['kern-left'], str);

−

~~chapter~~ = ~~wrap_style~~ ('~~trans~~-~~quoted-title~~', ~~transchapter~~);

+

str = utilities.substitute (cfg.presentation['kern-right'], str);

−

~~chapter_error~~ = ~~" "~~ .. ~~set_error (~~'~~trans_missing_chapter~~');

+

elseif mw.ustring.match (str, '%[%[[\"“”\'‘’].+%]%]') then -- leading quote marks

+

str = utilities.substitute (cfg.presentation['kern-left'], str);

+

elseif mw.ustring.match (str, '%[%[.+[\"“”\'‘’]%]%]') then -- trailing quote marks

+

str = utilities.substitute (cfg.presentation['kern-right'], str);

end

−

if is_set (~~chapterurl~~) then

+

−

~~chapter~~ = ~~external_link~~ (~~chapterurl, chapter~~, ~~chapter_url_source~~); ~~-- adds bare_url_missing_title error if appropriate~~

+

else -- plain text or [[L|D]]; text in label variable

+

label = mw.ustring.gsub (label, '[“”]', '\"'); -- replace “” (U+201C & U+201D) with " (typewriter double quote mark)

+

label = mw.ustring.gsub (label, '[‘’]', '\''); -- replace ‘’ (U+2018 & U+2019) with ' (typewriter single quote mark)

+

cap = mw.ustring.match (label, "^([\"\'][^\'].+)"); -- match leading double or single quote but not doubled single quotes (italic markup)

+

if utilities.is_set (cap) then

+

label = utilities.substitute (cfg.presentation['kern-left'], cap);

end

−

~~return chapter .. chapter_error;~~

+

−

~~else -- here when chapter is set~~

+

cap = mw.ustring.match (label, "^(.+[^\'][\"\'])$") -- match trailing double or single quote but not doubled single quotes (italic markup)

−

~~chapter~~ = ~~kern_quotes~~ (~~chapter~~); -- ~~if necessary, separate chapter title's leading and~~ trailing quote ~~marks from Module provided quote marks~~

+

if utilities.is_set (cap) then

−

~~chapter = wrap_style~~ (~~'quoted-title', chapter~~);

+

label = utilities.substitute (cfg.presentation['kern-right'], cap);

−

if is_set (~~transchapter~~) then

−

~~transchapter~~ = ~~wrap_style~~ ('~~trans~~-~~quoted-title~~', ~~transchapter~~);

−

~~chapter = chapter .. ' ' .. transchapter~~;

end

−

if ~~is_set (chapterurl)~~ then

+

−

~~chapter~~ = ~~external_link~~ (~~chapterurl~~, ~~chapter~~); -- ~~adds bare_url_missing_title error if appropriate~~

+

if 2 == wl_type then

+

str = utilities.make_wikilink (link, label); -- reassemble the wikilink

+

else

+

str = label;

end

−

return ~~chapter~~;

+

return str;

end

−

~~--[[~~

−

~~Argument wrapper. This function provides support for argument~~

−

~~mapping defined in the configuration file so that multiple names~~

−

~~can be transparently aliased to single internal variable.~~

−

]]

−

local function ~~argument_wrapper~~( ~~args~~ )

+

--[[--------------------------< F O R M A T _ S C R I P T _ V A L U E >----------------------------------------

−

local ~~origin~~ = {};

+

−

+

|script-title= holds title parameters that are not written in Latin-based scripts: Chinese, Japanese, Arabic, Hebrew, etc. These scripts should

−

~~return setmetatable~~({

+

not be italicized and may be written right-to-left. The value supplied by |script-title= is concatenated onto Title after Title has been wrapped

−

~~ORIGIN~~ = ~~function~~( ~~self, k~~ )

+

in italic markup.

−

~~local dummy = self~~[k]; --~~force the variable to be loaded.~~

+

−

return ~~origin[k]~~;

+

Regardless of language, all values provided by |script-title= are wrapped in <bdi>...</bdi> tags to isolate RTL languages from the English left to right.

+

|script-title= provides a unique feature. The value in |script-title= may be prefixed with a two-character ISO 639-1 language code and a colon:

+

|script-title=ja:*** *** (where * represents a Japanese character)

+

Spaces between the two-character code and the colon and the colon and the first script character are allowed:

+

|script-title=ja : *** ***

+

|script-title=ja: *** ***

+

|script-title=ja :*** ***

+

Spaces preceding the prefix are allowed: |script-title = ja:*** ***

+

The prefix is checked for validity. If it is a valid ISO 639-1 language code, the lang attribute (lang="ja") is added to the <bdi> tag so that browsers can

+

know the language the tag contains. This may help the browser render the script more correctly. If the prefix is invalid, the lang attribute

+

is not added. At this time there is no error message for this condition.

+

Supports |script-title=, |script-chapter=, |script-<periodical>=

+

]]

+

local function format_script_value (script_value, script_param)

+

local lang=''; -- initialize to empty string

+

local name;

+

if script_value:match('^%l%l%l?%s*:') then -- if first 3 or 4 non-space characters are script language prefix

+

lang = script_value:match('^(%l%l%l?)%s*:%s*%S.*'); -- get the language prefix or nil if there is no script

+

if not utilities.is_set (lang) then

+

utilities.set_message ('err_script_parameter', {script_param, cfg.err_msg_supl['missing title part']}); -- prefix without 'title'; add error message

+

return ''; -- script_value was just the prefix so return empty string

end

−

},

+

-- if we get this far we have prefix and script

−

{

+

name = cfg.lang_tag_remap[lang] or mw.language.fetchLanguageName( lang, cfg.this_wiki_code ); -- get language name so that we can use it to categorize

−

~~__index~~ = ~~function~~ ( ~~tbl~~, k )

+

if utilities.is_set (name) then -- is prefix a proper ISO 639-1 language code?

−

if ~~origin[k] ~= nil~~ then

+

script_value = script_value:gsub ('^%l+%s*:%s*', ''); -- strip prefix from script

−

~~return nil~~;

+

-- is prefix one of these language codes?

+

if utilities.in_array (lang, cfg.script_lang_codes) then

+

utilities.add_prop_cat ('script', {name, lang})

+

else

+

utilities.set_message ('err_script_parameter', {script_param, cfg.err_msg_supl['unknown language code']}); -- unknown script-language; add error message

end

−

+

lang = ' lang="' .. lang .. '" '; -- convert prefix into a lang attribute

−

~~local args, list, v~~ = ~~args, cfg~~.~~aliases[k]~~;

+

else

−

+

utilities.set_message ('err_script_parameter', {script_param, cfg.err_msg_supl['invalid language code']}); -- invalid language code; add error message

−

~~if type~~( ~~list ) ==~~ '~~table~~' ~~then~~

+

lang = ''; -- invalid so set lang to empty string

−

v, ~~origin~~[~~k] = select_one( args, list,~~ '~~redundant_parameters~~' );

+

end

−

~~if origin[k] == nil then~~

+

else

−

~~origin[k]~~ = ''; -- ~~Empty~~ string~~, not nil~~

+

utilities.set_message ('err_script_parameter', {script_param, cfg.err_msg_supl['missing prefix']}); -- no language code prefix; add error message

−

end

+

end

−

~~elseif list ~= nil then~~

+

script_value = utilities.substitute (cfg.presentation['bdi'], {lang, script_value}); -- isolate in case script is RTL

−

~~v, origin[k] = args[list], list;~~

+

−

else

+

return script_value;

−

~~-- maybe let through instead of raising an error?~~

+

end

−

~~-- v~~, ~~origin[k] = args[k]~~, k;

+

−

~~error(~~ cfg.~~messages~~['~~unknown_argument_map~~'] ~~.. ': cfg.aliases = ' .. mw.dumpObject( cfg.aliases ) .. ', k = ' .. mw.dumpObject( k )~~ );

+

−

~~end~~

+

--[[--------------------------< S C R I P T _ C O N C A T E N A T E >------------------------------------------

−

+

−

-- ~~Empty strings, not nil~~;

+

Initially for |title= and |script-title=, this function concatenates those two parameter values after the script

−

~~if v == nil then~~

+

value has been wrapped in <bdi> tags.

−

v = cfg.~~defaults~~[~~k] or~~ '';

−

~~origin[k~~] ~~= '';~~

−

~~end~~

−

~~tbl = rawset( tbl~~, k, v );

−

return v;

−

end,

−

~~});~~

−

~~end~~

−

~~--[[~~

−

~~Looks for a parameter's name in the whitelist.~~

−

~~Parameters in the whitelist can have three values:~~

−

~~true - active, supported parameters~~

−

~~false - deprecated, supported parameters~~

−

~~nil - unsupported parameters~~

]]

−

local function ~~validate~~( ~~name~~ )

+

local function script_concatenate (title, script, script_param)

−

~~local name = tostring~~( ~~name~~ );

+

if utilities.is_set (script) then

−

~~local state~~ = ~~whitelist.basic_arguments[ name ]~~;

+

script = format_script_value (script, script_param); -- <bdi> tags, lang attribute, categorization, etc.; returns empty string on error

−

+

if utilities.is_set (script) then

−

-- ~~Normal arguments~~

+

title = title .. ' ' .. script; -- concatenate title and script title

−

if ~~true == state~~ then ~~return true; end -- valid actively supported parameter~~

+

end

−

~~if false~~ =~~= state then~~

−

~~deprecated_parameter (name)~~; -- ~~parameter is deprecated but still supported~~

−

~~return true;~~

end

−

+

return title;

−

~~-- Arguments with numbers in them~~

−

~~name = name:gsub( "%d+", "#" ); -- replace digit(s) with # (last25 becomes last#~~

−

~~state = whitelist.numbered_arguments[ name ];~~

−

~~if true == state then return true; end -- valid actively supported parameter~~

−

~~if false == state then~~

−

~~deprecated_parameter (name); -- parameter is deprecated but still supported~~

−

~~return true;~~

−

~~end~~

−

return ~~false~~; ~~-- Not supported because not found or name is set to nil~~

end

−

-- ~~Formats a wiki style internal link~~

+

--[[--------------------------< W R A P _ M S G >--------------------------------------------------------------

−

~~local function internal_link_id(options)~~

−

~~return mw.ustring.format( '~~[[~~%s|%s]]%s[[%s%s%s|%s]]',~~

−

~~options.link, options.label, options.separator or " ",~~

−

~~options.prefix, options.id, options.suffix or "",~~

−

~~mw.text.nowiki(options.id)~~

−

);

−

~~end~~

−

+

Applies additional message text to various parameter values. Supplied string is wrapped using a message_list

−

~~--[[--------------------------< N O W R A P _ D A T E >--------------------------------------------------------~~

+

configuration taking one argument. Supports lower case text for {{citation}} templates. Additional text taken

−

+

from citation_config.messages - the reason this function is similar to but separate from wrap_style().

−

~~When date is YYYY-MM-DD format wrap in nowrap span: <span~~ .~~..>YYYY-MM-DD~~. ~~When date is DD MMMM YYYY or is~~

−

~~MMMM DD, YYYY then wrap in nowrap span: <span~~ .~~..>DD MMMM YYYY or MMMM DD, YYYY~~

−

~~DOES NOT yet support MMMM YYYY or any of~~ the ~~date ranges~~.

]]

−

local function ~~nowrap_date~~ (~~date~~)

+

local function wrap_msg (key, str, lower)

−

~~local cap='';~~

+

if not utilities.is_set ( str ) then

−

~~local cap2='';~~

+

return "";

−

if ~~date:match("^%d%d%d%d%-%d%d%-%d%d$") then~~

−

~~date = substitute (cfg~~.~~presentation['nowrap1'], date);~~

−

~~elseif date:match~~(~~"^%a+%s*%d%d?,%s*%d%d%d%d$") or date:match ("^%d%d?%s*%a+%s*%d%d%d%d$"~~) then

−

~~cap, cap2 = string.match (date,~~ "~~^(.*)%s+(%d%d%d%d)$~~");

−

~~date = substitute (cfg.presentation['nowrap2'], {cap, cap2})~~;

end

−

+

if true == lower then

−

return ~~date~~;

+

local msg;

+

msg = cfg.messages[key]:lower(); -- set the message to lower case before

+

return utilities.substitute ( msg, str ); -- including template text

+

else

+

return utilities.substitute ( cfg.messages[key], str );

+

end

−

~~--[[--------------------------< IS _ V A L I D _ I S X N >-----------------------------------------------------~~

−

~~ISBN~~-10 and ~~ISSN validator code calculates checksum across all isbn/issn digits including the check digit~~. ~~ISBN-13~~ is ~~checked in check_isbn~~().

+

--[[----------------< W I K I S O U R C E _ U R L _ M A K E >-------------------

−

~~If the number is valid the result will be 0. Before calling this function, issbn/issn must be checked for length and stripped of dashes,~~

+

−

~~spaces and other non~~-~~isxn characters.~~

+

Makes a Wikisource URL from Wikisource interwiki-link. Returns the URL and appropriate

+

label; nil else.

+

str is the value assigned to |chapter= (or aliases) or |title= or |title-link=

]]

−

local function ~~is_valid_isxn~~ (~~isxn_str~~, ~~len)~~

+

local function wikisource_url_make (str)

−

local ~~temp = 0~~;

+

local wl_type, D, L;

−

~~isxn_str~~ = { ~~isxn_str~~:~~byte~~(1, ~~len~~) }; -- ~~make~~ a ~~table of byte values~~ '~~0' → 0x30 .~~. '9' ~~→ 0x39,~~ '~~X' → 0x58~~

+

local ws_url, ws_label;

−

~~len~~ = ~~len+1;~~ -- ~~adjust to be~~ a ~~loop counter~~

+

local wikisource_prefix = table.concat ({'https://', cfg.this_wiki_code, '.wikisource.org/wiki/'});

−

~~for i~~, ~~v in ipairs( isxn_str~~ ) do -- ~~loop through all of the bytes and calculate~~ the ~~checksum~~

+

−

~~if v~~ == ~~string~~.~~byte~~( ~~"X"~~ ) ~~then~~ -- if ~~checkdigit is X~~ (~~compares the byte value of 'X' which is 0x58~~)

+

wl_type, D, L = utilities.is_wikilink (str); -- wl_type is 0 (not a wikilink), 1 (simple wikilink), 2 (complex wikilink)

−

~~temp~~ = temp + 10*( ~~len~~ - i ); -- ~~it represents 10 decimal~~

+

−

~~else~~

+

if 0 == wl_type then -- not a wikilink; might be from |title-link=

−

~~temp~~ = ~~temp~~ + ~~tonumber~~( ~~string~~.~~char~~(v) )*(~~len~~-i);

+

str = D:match ('^[Ww]ikisource:(.+)') or D:match ('^[Ss]:(.+)'); -- article title from interwiki link with long-form or short-form namespace

+

if utilities.is_set (str) then

+

ws_url = table.concat ({ -- build a Wikisource URL

+

wikisource_prefix, -- prefix

+

str, -- article title

+

});

+

ws_label = str; -- label for the URL

+

end

+

elseif 1 == wl_type then -- simple wikilink: [[Wikisource:ws article]]

+

str = D:match ('^[Ww]ikisource:(.+)') or D:match ('^[Ss]:(.+)'); -- article title from interwiki link with long-form or short-form namespace

+

if utilities.is_set (str) then

+

ws_url = table.concat ({ -- build a Wikisource URL

+

wikisource_prefix, -- prefix

+

str, -- article title

+

});

+

ws_label = str; -- label for the URL

+

end

+

elseif 2 == wl_type then -- non-so-simple wikilink: [[Wikisource:ws article|displayed text]] ([[L|D]])

+

str = L:match ('^[Ww]ikisource:(.+)') or L:match ('^[Ss]:(.+)'); -- article title from interwiki link with long-form or short-form namespace

+

if utilities.is_set (str) then

+

ws_label = D; -- get ws article name from display portion of interwiki link

+

ws_url = table.concat ({ -- build a Wikisource URL

+

wikisource_prefix, -- prefix

+

str, -- article title without namespace from link portion of wikilink

+

});

end

−

~~return temp % 11 == 0; -- returns true if calculation result is zero~~

−

~~end~~

+

if ws_url then

+

ws_url = mw.uri.encode (ws_url, 'WIKI'); -- make a usable URL

+

ws_url = ws_url:gsub ('%%23', '#'); -- undo percent-encoding of fragment marker

+

end

−

--[[~~----------~~----------------< ~~C H~~ E C ~~K _ I S B N~~ >~~-------------------------------------~~-----------------------

+

return ws_url, ws_label, L or D; -- return proper URL or nil and a label or nil

+

end

+

--[[----------------< F O R M A T _ P E R I O D I C A L >-----------------------

−

~~Determines whether an ISBN string is valid~~

+

Format the three periodical parameters: |script-<periodical>=, |<periodical>=,

+

and |trans-<periodical>= into a single Periodical meta-parameter.

]]

−

local function ~~check_isbn~~( ~~isbn_str~~ )

+

local function format_periodical (script_periodical, script_periodical_source, periodical, trans_periodical)

−

if ~~nil ~= isbn_str:match~~(~~"[^%s-0-9X]"~~) then ~~return false~~; ~~end~~ -- ~~fail if isbn_str contains anything but digits, hyphens, or the uppercase X~~

+

−

~~isbn_str~~ = ~~isbn_str:gsub~~( "-~~", "" ):gsub( " "~~, "" ); -- ~~remove hyphens and spaces~~

+

if not utilities.is_set (periodical) then

−

~~local len = isbn_str:len();~~

+

periodical = ''; -- to be safe for concatenation

−

+

else

−

~~if len ~= 10 and len ~= 13 then~~

+

periodical = utilities.wrap_style ('italic-title', periodical); -- style

−

~~return false;~~

end

−

~~if len~~ =~~= 10 then~~

+

periodical = script_concatenate (periodical, script_periodical, script_periodical_source); -- <bdi> tags, lang attribute, categorization, etc.; must be done after title is wrapped

−

if ~~isbn_str:match~~( ~~"^%d*X?$"~~ ) ~~== nil~~ then ~~return false; end~~

+

−

~~return is_valid_isxn~~(~~isbn_str~~, 10);

+

if utilities.is_set (trans_periodical) then

−

~~else~~

+

trans_periodical = utilities.wrap_style ('trans-italic-title', trans_periodical);

−

~~local temp = 0~~;

+

if utilities.is_set (periodical) then

−

if ~~isbn_str:match~~( ~~"^97[89]%d*$"~~ ) =~~= nil then return false~~; ~~end~~ -- ~~isbn13 begins with 978~~ or ~~979~~

+

periodical = periodical .. ' ' .. trans_periodical;

−

~~isbn_str~~ = ~~{ isbn_str:byte(1, len) }~~;

+

else -- here when trans-periodical without periodical or script-periodical

−

~~for i, v in ipairs( isbn_str ) do~~

+

periodical = trans_periodical;

−

~~temp = temp + (3 - 2*(i % 2)) * tonumber( string~~.~~char~~(v) );

+

utilities.set_message ('err_trans_missing_title', {'periodical'});

end

−

~~return temp % 10 == 0;~~

end

+

return periodical;

end

−

~~--[[------------------------------------------------------------------------------------------------~~

−

~~Validate and format an issn. This code fixes the case where an editor has included an ISSN in the citation but has separated the two groups of four~~

+

--[[------------------< F O R M A T _ C H A P T E R _ T I T L E >---------------

−

~~digits with a space. When that condition occurred, the resulting link looked like this:~~

−

|~~issn~~=~~0819 4327 gives: [http://www.worldcat.org/issn/0819 4327 0819 4327]~~ -~~- can't have spaces in an external link~~

+

Format the four chapter parameters: |script-chapter=, |chapter=, |trans-chapter=,

−

+

and |chapter-url= into a single chapter meta- parameter (chapter_url_source used

−

~~This code now prevents that by inserting a hyphen at the issn midpoint. It also validates the issn for length~~ and ~~makes sure that the checkdigit agrees~~

+

for error messages).

−

~~with the calculated value. Incorrect length (8 digits), characters other than 0~~-~~9 and X, or checkdigit / calculated value mismatch will all cause~~ a ~~check issn~~

−

error ~~message. The issn is always displayed with a hyphen, even if the issn was given as a single group of 8 digits~~.

]]

−

local function ~~issn~~(id)

+

local function format_chapter_title (script_chapter, script_chapter_source, chapter, chapter_source, trans_chapter, trans_chapter_source, chapter_url, chapter_url_source, no_quotes, access)

−

local ~~issn_copy~~ = id; -- ~~save a copy of unadulterated issn~~; ~~use this version for display~~ if ~~issn does~~ not ~~validate~~

+

local ws_url, ws_label, L = wikisource_url_make (chapter); -- make a wikisource URL and label from a wikisource interwiki link

−

~~local handler~~ = ~~cfg.id_handlers[~~'~~ISSN~~'];

+

if ws_url then

−

~~local text~~;

+

ws_label = ws_label:gsub ('_', ' '); -- replace underscore separators with space characters

−

~~local valid_issn~~ = ~~true~~;

+

chapter = ws_label;

+

end

+

if not utilities.is_set (chapter) then

+

chapter = ''; -- to be safe for concatenation

+

else

+

if false == no_quotes then

+

chapter = kern_quotes (chapter); -- if necessary, separate chapter title's leading and trailing quote marks from module provided quote marks

+

chapter = utilities.wrap_style ('quoted-title', chapter);

+

end

+

end

−

id=~~id:gsub~~( ~~"[%s-–]"~~, "" ); -- ~~strip spaces~~, ~~hyphens~~, ~~and endashes from the issn~~

+

chapter = script_concatenate (chapter, script_chapter, script_chapter_source); -- <bdi> tags, lang attribute, categorization, etc.; must be done after title is wrapped

−

if ~~8 ~= id:len~~() ~~or nil =~~= ~~id:match~~( ~~"^%d*X?$"~~ ) ~~then~~ -- ~~validate the issn: 8 digits long, containing only 0-9 or X in the last position~~

+

if utilities.is_set (chapter_url) then

−

~~valid_issn~~=~~false~~; -- ~~wrong length or improper character~~

+

chapter = external_link (chapter_url, chapter, chapter_url_source, access); -- adds bare_url_missing_title error if appropriate

−

~~else~~

+

elseif ws_url then

−

~~valid_issn~~=~~is_valid_isxn~~(id, 8); ~~-- validate issn~~

+

chapter = external_link (ws_url, chapter .. ' ', 'ws link in chapter'); -- adds bare_url_missing_title error if appropriate; space char to move icon away from chap text; TODO: better way to do this?

+

chapter = utilities.substitute (cfg.presentation['interwiki-icon'], {cfg.presentation['class-wikisource'], L, chapter});

end

−

if ~~true == valid_issn~~ then

+

if utilities.is_set (trans_chapter) then

−

id = ~~string~~.~~sub~~( id, ~~1, 4~~ ) .. ~~"-"~~ .. ~~string~~.~~sub( id, 5 )~~; -- ~~if valid, display correctly formatted version~~

+

trans_chapter = utilities.wrap_style ('trans-quoted-title', trans_chapter);

−

~~else~~

+

if utilities.is_set (chapter) then

−

id = ~~issn_copy~~; -- ~~if not valid~~, ~~use the show the invalid issn with error message~~

+

chapter = chapter .. ' ' .. trans_chapter;

+

else -- here when trans_chapter without chapter or script-chapter

+

chapter = trans_chapter;

+

chapter_source = trans_chapter_source:match ('trans%-?(.+)'); -- when no chapter, get matching name from trans-<param>

+

utilities.set_message ('err_trans_missing_title', {chapter_source});

+

end

−

+

−

~~text = external_link_id({link = handler.link, label = handler.label,~~

+

return chapter;

−

~~prefix=handler.prefix,id=id,separator=handler.separator, encode=handler.encode})~~

−

~~if false == valid_issn then~~

−

~~text = text .. ' ' .. set_error( 'bad_issn' ) -- add an error message if the issn is invalid~~

−

~~end~~

−

return ~~text~~

end

−

~~--[[--------------------------< A M A Z O N >------------------------------------------------------------------~~

−

~~Formats a link to Amazon. Do simple error checking: asin must be mix of 10 numeric or uppercase alpha~~

+

--[[----------------< H A S _ I N V I S I B L E _ C H A R S >-------------------

−

~~characters. If a mix, first character must be uppercase alpha; if all numeric, asins must be 10~~-~~digit~~

−

~~isbn. If 10~~-~~digit isbn, add a maintenance category so a bot or awb script can replace |asin= with |isbn=.~~

−

~~Error message if not 10 characters, if not isbn10, if mixed and first character is a digit.~~

−

]]

+

This function searches a parameter's value for non-printable or invisible characters.

+

The search stops at the first match.

+

This function will detect the visible replacement character when it is part of the Wikisource.

−

~~local function amazon~~(id, ~~domain~~)

+

Detects but ignores nowiki and math stripmarkers. Also detects other named stripmarkers

−

~~local err_cat = ""~~

+

(gallery, math, pre, ref) and identifies them with a slightly different error message.

+

See also coins_cleanup().

−

~~if not id:match("^[%d%u][%d%u][%d%u][%d%u][%d%u][%d%u][%d%u][%d%u][%d%u][%d%u]$") then~~

+

Output of this function is an error message that identifies the character or the

−

~~err_cat = ' ' .. set_error ('bad_asin'); -- asin~~ is ~~not a mix of 10 uppercase alpha and numeric characters~~

+

Unicode group, or the stripmarker that was detected along with its position (or,

−

~~else~~

+

for multi-byte characters, the position of its first byte) in the parameter value.

−

~~if id:match("^%d%d%d%d%d%d%d%d%d[%dX]$") then -- if 10-digit numeric (~~or ~~9 digits~~ with ~~terminal X)~~

−

~~if check_isbn~~( ~~id ) then -- see if asin value is isbn10~~

−

~~add_maint_cat ('ASIN');~~

−

~~elseif not is_set (err_cat) then~~

−

~~err_cat = ' ' .. set_error ('bad_asin'); -- asin is not isbn10~~

−

~~end~~

−

~~elseif not id:match("^%u[%d%u]+$") then~~

−

~~err_cat = ' ' .. set_error ('bad_asin'); -- asin doesn't begin with uppercase alpha~~

−

~~end~~

−

~~end~~

−

~~if not is_set(domain) then~~

−

~~domain = "com";~~

−

~~elseif in_array (domain, {'jp'~~, ~~'uk'}) then -- Japan, United Kingdom~~

−

~~domain = "co." .. domain;~~

−

~~elseif in_array (domain, {'au', 'br', 'mx'}) then~~ -~~- Australia~~, ~~Brazil, Mexico~~

−

~~domain = "com." .. domain;~~

−

~~end~~

−

~~local handler = cfg.id_handlers['ASIN'];~~

−

~~return external_link_id({link = handler.link,~~

−

~~label=handler.label , prefix="//www.amazon."..domain.."/dp/",id=id,~~

−

~~encode=handler.encode, separator = handler.separator}~~) .~~. err_cat;~~

−

~~end~~

−

~~--[[--------------------------< A R X I V >--------------------------------------------------------------------~~

+

]]

−

~~See: http://arxiv.org/help/arxiv_identifier~~

+

local function has_invisible_chars (param, v)

+

local position = ''; -- position of invisible char or starting position of stripmarker

+

local capture; -- used by stripmarker detection to hold name of the stripmarker

+

local stripmarker; -- boolean set true when a stripmarker is found

−

~~format and error check arXiv identifier~~. ~~There are three valid forms of the identifier:~~

+

capture = string.match (v, '[%w%p ]*'); -- test for values that are simple ASCII text and bypass other tests if true

−

~~the first form~~, ~~valid only between date codes 9108 and 0703 is:~~

+

if capture == v then -- if same there are no Unicode characters

−

~~arXiv:<archive>.<class>/<date code><number><version>~~

+

return;

−

~~where:~~

+

end

−

~~<archive> is a string of alpha characters - may be hyphenated~~; ~~no other punctuation~~

−

~~<class> is a string of alpha characters~~ - ~~may be hyphenated; no other punctuation~~

−

~~<date code> is four digits in the form YYMM where YY is the last two digits of the four~~-~~digit year and MM is the month number January = 01~~

−

~~first digit of YY~~ for ~~this form can only 9~~ and 0

−

~~<number> is a three~~-~~digit number~~

−

~~<version> is a 1 or more digit number preceded with a lowercase v~~; ~~no spaces (undocumented)~~

−

~~the second form, valid from April 2007 through December 2014 is:~~

−

~~arXiv:<date code>.<number><version>~~

−

~~where:~~

−

~~<date code> is four digits in the form YYMM where YY is the last two digits of the four-digit year and MM is the month number January = 01~~

−

~~<number> is a four-digit number~~

−

~~<version> is a 1 or more digit number preceded with a lowercase v; no spaces~~

−

the ~~third form~~, ~~valid from January 2015~~ is:

+

for _, invisible_char in ipairs (cfg.invisible_chars) do

−

~~arXiv:<date code>~~.~~<number><version>~~

+

local char_name = invisible_char[1]; -- the character or group name

−

~~where:~~

+

local pattern = invisible_char[2]; -- the pattern used to find it

−

~~<date code>~~ and ~~<version> are as defined for 0704~~-~~1412~~

+

position, _, capture = mw.ustring.find (v, pattern); -- see if the parameter value contains characters that match the pattern

−

~~<number> is a five~~-~~digit number~~

+

−

]]

+

if position and (cfg.invisible_defs.zwj == capture) then -- if we found a zero-width joiner character

+

if mw.ustring.find (v, cfg.indic_script) then -- it's ok if one of the Indic scripts

+

position = nil; -- unset position

+

elseif cfg.emoji_t[mw.ustring.codepoint (v, position+1)] then -- is zwj followed by a character listed in emoji{}?

+

position = nil; -- unset position

+

end

+

end

+

if position then

+

if 'nowiki' == capture or 'math' == capture or -- nowiki and math stripmarkers (not an error condition)

+

('templatestyles' == capture and utilities.in_array (param, {'id', 'quote'})) then -- templatestyles stripmarker allowed in these parameters

+

stripmarker = true; -- set a flag

+

elseif true == stripmarker and cfg.invisible_defs.del == capture then -- because stripmakers begin and end with the delete char, assume that we've found one end of a stripmarker

+

position = nil; -- unset

+

else

+

local err_msg;

+

if capture and not (cfg.invisible_defs.del == capture or cfg.invisible_defs.zwj == capture) then

+

err_msg = capture .. ' ' .. char_name;

+

else

+

err_msg = char_name .. ' ' .. 'character';

+

end

−

~~local function arxiv~~ (~~id, class)~~

+

utilities.set_message ('err_invisible_char', {err_msg, utilities.wrap_style ('parameter', param), position}); -- add error message

−

~~local handler = cfg.id_handlers[~~'~~ARXIV~~'];

+

return; -- and done with this parameter

−

~~local year~~, ~~month, version;~~

+

end

−

~~local err_cat = '';~~

−

~~local text;~~

−

~~if id:match("^%a[%a%.%-]+/[90]%d[01]%d%d%d%d$") or id:match("^%a[%a%.%-]+/[90]%d[01]%d%d%d%dv%d+$") then -- test for the 9108-0703 format w/ & w/o version~~

−

~~year, month = id:match("^%a[%a%.%-]+/([90]%d)([01]%d)%d%d%d[v%d]*$");~~

−

~~year = tonumber(year);~~

−

~~month = tonumber(month);~~

−

~~if ((not (90 < year or 8 > year)) or (1 > month or 12 < month)) or -- if invalid year or invalid month~~

−

~~((91 == year and 7 > month) or (7 == year and 3 < month)) then -- if years ok~~, ~~are starting and ending months ok?~~

−

~~err_cat = ' '~~ .~~. set_error~~( '~~bad_arxiv~~' ~~); -- set error message~~

−

~~end~~

−

~~elseif id:match("^%d%d[01]%d%.%d%d%d%d$") or id:match("^%d%d[01]%d%.%d%d%d%dv%d+$") then -- test for the 0704-1412 w/ & w/o version~~

−

~~year~~, ~~month = id:match("^(%d%d)([01]%d~~)~~%.%d%d%d%d[v%d]*$");~~

−

~~year = tonumber(year);~~

−

~~month = tonumber(month);~~

−

~~if ((7 > year) or (14 < year) or (1 > month or 12 < month)) or -- is year invalid or is month invalid? (doesn't test for future years)~~

−

~~((7 == year) and (4 > month)) then --or -- when year is 07~~, ~~is month invalid (before April)?~~

−

~~err_cat = ' ' .. set_error( 'bad_arxiv'~~ ); -- ~~set~~ error message

−

~~end~~

−

~~elseif id:match("^%d%d[01]%d%.%d%d%d%d%d$") or id:match("^%d%d[01]%d%.%d%d%d%d%dv%d+$") then -- test for the 1501- format w/ & w/o version~~

−

~~year, month = id:match("^(%d%d)([01]%d)%.%d%d%d%d%d[v%d]*$");~~

−

~~year = tonumber(year);~~

−

~~month = tonumber(month)~~;

−

~~if ((15 > year) or (1 > month or 12 < month)) then~~ -- ~~is year invalid or is month invalid? (doesn't test for future years)~~

−

~~err_cat = ' ' .. set_error( 'bad_arxiv' ); -- set error message~~

end

−

~~else~~

−

~~err_cat = ' ' .. set_error( 'bad_arxiv' ); -- arXiv id doesn't match any format~~

end

+

end

−

~~text = external_link_id({link = handler.link, label = handler.label,~~

−

~~prefix=handler.prefix,id=id,separator=handler.separator, encode=handler.encode}) .. err_cat;~~

−

~~if is_set (class) then~~

+

--[[-------------------< A R G U M E N T _ W R A P P E R >----------------------

−

~~class = '~~ [[~~' .. '//arxiv.org/archive/' .. class .. ' ' .. class .. ']]';~~ -- ~~external link within square brackets, not wikilink~~

−

~~else~~

−

~~class = '';~~ -- ~~empty string for concatenation~~

−

~~end~~

−

~~return text .. class;~~

−

~~end~~

−

~~--[[~~

+

Argument wrapper. This function provides support for argument mapping defined

−

~~lccn normalization (http://www.loc.gov/marc/lccn-namespace.html#normalization)~~

+

in the configuration file so that multiple names can be transparently aliased to

−

~~1. Remove all blanks~~.

+

single internal variable.

−

~~2. If there is a forward slash (/)~~ in the ~~string, remove it, and remove all characters to the right of the forward slash.~~

−

~~3. If there is a hyphen in the string:~~

−

~~a. Remove it.~~

−

~~b. Inspect the substring following (to the right of) the (removed) hyphen. Then (and assuming~~ that ~~steps 1 and 2 have been carried out):~~

−

~~1. All these characters should~~ be ~~digits, and there should be six or less. (not done in this function)~~

−

~~2. If the length of the substring is less than 6, left-fill the substring with zeroes until the length is six~~.

−

~~Returns a normalized lccn for lccn() to validate. There is no error checking (step 3.b.1) performed in this function.~~

]]

−

local function ~~normalize_lccn~~ (~~lccn~~)

+

local function argument_wrapper ( args )

−

~~lccn = lccn:gsub ("%s", ""); -- 1. strip whitespace~~

+

local origin = {};

−

~~if nil ~= string.find (lccn,'/') then~~

−

~~lccn = lccn:match ("(.-)/"); -- 2. remove forward slash and all character to the right of it~~

−

~~end~~

−

local ~~prefix~~

−

~~local suffix~~

−

~~prefix, suffix = lccn:match ("(.+)%-(.+)"); -- 3.a remove hyphen by splitting the string into prefix and suffix~~

−

~~if nil ~= suffix then -- if there was a hyphen~~

−

~~suffix=string.rep("0", 6-string.len (suffix)) .. suffix; -- 3.b.2 left fill the suffix with 0s if suffix length less than 6~~

−

~~lccn~~=~~prefix..suffix~~; ~~-- reassemble the lccn~~

−

~~end~~

−

return ~~lccn;~~

+

return setmetatable({

−

~~end~~

+

ORIGIN = function ( self, k )

−

+

local dummy = self[k]; -- force the variable to be loaded.

−

~~--[[~~

+

return origin[k];

−

~~Format LCCN link and do simple error checking. LCCN is a character string 8-12 characters long. The length of the LCCN dictates the character type of the first 1-3 characters; the~~

−

~~rightmost eight are always digits. http://info-uri.info/registry/OAIHandler?verb~~=~~GetRecord&metadataPrefix=reg&identifier=info:lccn/~~

−

~~length = 8 then all digits~~

−

~~length = 9 then lccn[1] is lower case alpha~~

−

~~length = 10 then lccn[1] and lccn[2] are both lower case alpha or both digits~~

−

~~length = 11 then lccn[1] is lower case alpha, lccn[2] and lccn[3] are both lower case alpha or both digits~~

−

~~length = 12 then lccn[1] and lccn[2] are both lower case alpha~~

−

]]

−

~~local~~ function ~~lccn~~(~~lccn~~)

−

local ~~handler~~ = ~~cfg.id_handlers~~[~~'LCCN'~~];

−

~~local err_cat = '';~~ -- ~~presume that LCCN is valid~~

−

~~local id = lccn; -- local copy of~~ the ~~lccn~~

−

~~id = normalize_lccn (id); -- get canonical form (no whitespace, hyphens, forward slashes)~~

−

~~local len = id:len(); -- get the length of the lccn~~

−

~~if 8 == len then~~

−

~~if id:match("~~[~~^%d~~]~~") then -- if LCCN has anything but digits (nil if only digits)~~

−

~~err_cat = ' ' .. set_error( 'bad_lccn' )~~; ~~-- set an error message~~

end

−

~~elseif 9 == len then -- LCCN should be adddddddd~~

+

},

−

~~if nil =~~= ~~id:match~~(~~"%l%d%d%d%d%d%d%d%d"~~) ~~then -- does it match our pattern?~~

+

{

−

~~err_cat = ' ' .. set_error( 'bad_lccn' ); -- set an error message~~

+

__index = function ( tbl, k )

−

~~end~~

+

if origin[k] ~= nil then

−

~~elseif 10 == len then -- LCCN should be aadddddddd or dddddddddd~~

+

return nil;

−

if ~~id:match("~~[~~^%d~~]~~") then -- if LCCN has anything but digits (~~nil ~~if only digits) ...~~

−

~~if nil == id:match("^%l%l%d%d%d%d%d%d%d%d")~~ then ~~-- ... see if it matches our pattern~~

−

~~err_cat = ' ' .. set_error( 'bad_lccn' )~~; ~~-- no match, set an error message~~

end

−

~~end~~

+

−

~~elseif 11~~ =~~= len then -- LCCN should be aaadddddddd or adddddddddd~~

+

local args, list, v = args, cfg.aliases[k];

−

if ~~not~~ (~~id:match("^%l%l%l%d%d%d%d%d%d%d%d") or id:match("^%l%d%d%d%d%d%d%d%d%d%d")~~) then ~~-- see if it matches one of our patterns~~

+

−

~~err_cat~~ = ~~' '~~ .~~. set_error~~( '~~bad_lccn~~' ); -- ~~no match~~, ~~set an error message~~

+

if type( list ) == 'table' then

−

end

+

v, origin[k] = utilities.select_one ( args, list, 'err_redundant_parameters' );

−

elseif 12 == ~~len then~~ -- ~~LCCN should be aadddddddddd~~

+

if origin[k] == nil then

−

~~if not id:match("^%l%l%d%d%d%d%d%d%d%d%d%d") then~~ -- ~~see if it matches our pattern~~

+

origin[k] = ''; -- Empty string, not nil

−

~~err_cat =~~ ' ' .. ~~set_error(~~ '~~bad_lccn~~' ); -- ~~no match~~, ~~set an error message~~

+

end

−

~~end~~

+

elseif list ~= nil then

−

~~else~~

+

v, origin[k] = args[list], list;

−

~~err_cat~~ = ' ' ~~.. set_error~~( ~~'bad_lccn'~~ ); ~~-- wrong length~~, ~~set an error message~~

+

else

−

end

+

-- maybe let through instead of raising an error?

+

-- v, origin[k] = args[k], k;

+

error( cfg.messages['unknown_argument_map'] .. ': ' .. k);

+

end

+

-- Empty strings, not nil;

+

if v == nil then

+

v = '';

+

origin[k] = '';

+

end

+

tbl = rawset( tbl, k, v );

+

return v;

+

end,

+

});

+

end

+

--[[--------------------------< N O W R A P _ D A T E >-------------------------

−

~~if not is_set (err_cat) and nil ~= lccn~~:~~find ('%s') then~~

+

When date is YYYY-MM-DD format wrap in nowrap span: YYYY-MM-DD.

−

~~err_cat = ' '~~ .. ~~set_error( 'bad_lccn' );~~ -- ~~lccn contains a space~~, ~~set an error message~~

+

When date is DD MMMM YYYY or is MMMM DD, YYYY then wrap in nowrap span:

−

~~end~~

+

DD MMMM YYYY or MMMM DD, YYYY

−

~~return external_link_id({link = handler~~.~~link, label = handler.label,~~

+

DOES NOT yet support MMMM YYYY or any of the date ranges.

−

~~prefix=handler.prefix,id=lccn,separator=handler.separator, encode=handler.encode}) .. err_cat;~~

−

~~end~~

−

~~--[[~~

−

~~Format PMID and do simple error checking. PMIDs are sequential numbers beginning at 1 and counting up. This code checks the PMID to see that it~~

−

~~contains only digits and is less than test_limit; the value in local variable test_limit will need to be updated periodically as more PMIDs are issued.~~

]]

−

local function ~~pmid~~(id)

+

local function nowrap_date (date)

−

local ~~test_limit~~ = ~~30000000; -- update this value as PMIDs approach~~

+

local cap = '';

−

~~local handler = cfg.id_handlers[~~'~~PMID~~'];

+

local cap2 = '';

−

local ~~err_cat~~ = ''; ~~-- presume that PMID is valid~~

+

−

+

if date:match("^%d%d%d%d%-%d%d%-%d%d$") then

−

if id:match("[^%d]") then ~~-- if PMID has anything but digits~~

+

date = utilities.substitute (cfg.presentation['nowrap1'], date);

−

~~err_cat~~ = ~~' '~~ .. ~~set_error(~~ '~~bad_pmid~~' ); ~~-- set an error message~~

+

−

~~else -- PMID is only digits~~

+

elseif date:match("^%a+%s*%d%d?,%s+%d%d%d%d$") or date:match ("^%d%d?%s*%a+%s+%d%d%d%d$") then

−

~~local id_num~~ = ~~tonumber~~(id); ~~-- convert id to a number for range testing~~

+

cap, cap2 = string.match (date, "^(.*)%s+(%d%d%d%d)$");

−

~~if 1 > id_num or test_limit < id_num then -- if PMID is outside test limit boundaries~~

+

date = utilities.substitute (cfg.presentation['nowrap2'], {cap, cap2});

−

~~err_cat~~ = ~~' '~~ .. ~~set_error(~~ '~~bad_pmid~~' ); ~~-- set an error message~~

−

~~end~~

end

−

return ~~external_link_id({link = handler.link, label = handler.label,~~

+

return date;

−

~~prefix=handler.prefix,id=id,separator=handler.separator, encode=handler.encode}) .. err_cat~~;

end

−

~~--[[--------------------------------------------------------------------------------~~

−

~~Determines if a PMC identifier's online version is embargoed. Compares~~ the ~~date in~~ |~~embargo~~= ~~against today's date~~. ~~If embargo date~~ is

+

--[[--------------------------< S E T _ T I T L E T Y P E >---------------------

−

in the ~~future, returns the content of |embargo=; otherwise, returns and empty string because~~ the ~~embargo has expired or because~~

+

−

|~~embargo~~= ~~was not set in this cite~~.

+

This function sets default title types (equivalent to the citation including

+

|type=<default value>) for those templates that have defaults. Also handles the

+

special case where it is desirable to omit the title type from the rendered citation

+

(|type=none).

]]

−

local function ~~is_embargoed~~ (~~embargo~~)

+

local function set_titletype (cite_class, title_type)

−

if is_set (~~embargo~~) then

+

if utilities.is_set (title_type) then

−

~~local lang~~ = ~~mw.getContentLanguage();~~

+

if 'none' == cfg.keywords_xlate[title_type] then

−

~~local good1, embargo_date, good2, todays_date;~~

+

title_type = ''; -- if |type=none then type parameter not displayed

−

~~good1, embargo_date~~ = ~~pcall( lang~~.~~formatDate, lang, 'U', embargo );~~

−

~~good2, todays_date~~ = ~~pcall( lang.formatDate, lang,~~ 'U' );

−

~~if good1 and good2 then~~ -- if ~~embargo date and today's date are good dates~~

−

~~if tonumber( embargo_date ) >~~= ~~tonumber( todays_date )~~ then ~~-- is embargo date is in the future?~~

−

~~return embargo; -- still embargoed~~

−

~~else~~

−

~~add_maint_cat ('embargo')~~

−

~~return ''; -- unset because embargo has expired~~

−

~~end~~

end

+

return title_type; -- if |type= has been set to any other value use that value

end

−

return ''; -- ~~|embargo= not~~ set ~~return~~ empty string

+

return cfg.title_types [cite_class] or ''; -- set template's default title type; else empty string for concatenation

end

−

~~--[[--------------------------------------------------------------------------------------------------~~

−

~~Format a PMC, do simple error checking, and check for embargoed articles.~~

+

--[[--------------------------< S A F E _ J O I N >-----------------------------

−

~~The embargo parameter takes~~ a ~~date~~ for ~~a value. If the embargo date is in the future the PMC identifier will not~~

+

Joins a sequence of strings together while checking for duplicate separation characters.

−

~~be linked to the article. If the embargo date is today or in the past, or if it is empty or omitted, then the~~

−

~~PMC identifier is linked to the article through the link at cfg.id_handlers['PMC'].prefix.~~

−

~~PMC embargo date testing is done in function is_embargoed () which is called earlier because when the citation~~

−

~~has |pmc=<value> but does not have a |url= then |title= is linked with the PMC link. Function is_embargoed ()~~

−

~~returns the embargo date if the PMC article is still embargoed, otherwise it returns an empty string.~~

−

~~PMCs are sequential numbers beginning at 1 and counting up. This code checks the PMC to see that it contains only digits and is less~~

−

~~than test_limit; the value in local variable test_limit will need to be updated periodically as more PMCs are issued~~.

]]

−

local function ~~pmc~~(id, ~~embargo~~)

+

local function safe_join( tbl, duplicate_char )

−

local ~~test_limit~~ = ~~5000000~~; -- ~~update this value as PMCs approach~~

+

local f = {}; -- create a function table appropriate to type of 'duplicate character'

−

~~local handler = cfg.id_handlers[~~'~~PMC~~'];

+

if 1 == #duplicate_char then -- for single byte ASCII characters use the string library functions

−

~~local err_cat~~ = ~~'';~~ -- ~~presume that PMC is valid~~

+

f.gsub = string.gsub

−

+

f.match = string.match

−

~~local text;~~

+

f.sub = string.sub

−

+

else -- for multi-byte characters use the ustring library functions

−

~~if id:~~match~~("[^%d]") then -- if PMC has anything but digits~~

+

f.gsub = mw.ustring.gsub

−

~~err_cat~~ = ~~' '~~ .~~. set_error( 'bad_pmc' );~~ -- ~~set an error message~~

+

f.match = mw.ustring.match

−

~~else -~~- ~~PMC is only digits~~

+

f.sub = mw.ustring.sub

−

~~local id_num~~ = ~~tonumber(id); -- convert id to a number for range testing~~

−

~~if 1 > id_num or test_limit < id_num then -- if PMC is outside test limit boundaries~~

−

~~err_cat~~ = ~~' '~~ .. ~~set_error( 'bad_pmc' ); -- set an error message~~

end

−

~~end~~

−

~~if is_set (embargo) then -- is PMC is still embargoed?~~

−

~~text="[[" .. handler.link .. "|" .. handler.label .. "]]:" .. handler.separator .. id .. err_cat; -- still embargoed so no external link~~

−

~~else~~

−

~~text = external_link_id({link = handler.link, label = handler.label, -- no embargo date or embargo has expired, ok to link to article~~

−

~~prefix=handler.prefix,id=id,separator=handler.separator, encode=handler.encode}) .. err_cat;~~

−

~~end~~

−

~~return text;~~

−

~~end~~

−

-- ~~Formats a DOI~~ and ~~checks~~ for ~~DOI errors~~.

+

local str = ''; -- the output string

−

+

local comp = ''; -- what does 'comp' mean?

−

-- ~~DOI names contain two parts: prefix and suffix separated by a forward slash~~.

+

local end_chr = '';

−

-- ~~Prefix: directory indicator~~ '10.' ~~followed by a registrant code~~

+

local trim;

−

-- ~~Suffix: character~~ string of ~~any length chosen by the registrant~~

+

for _, value in ipairs( tbl ) do

+

if value == nil then value = ''; end

+

if str == '' then -- if output string is empty

+

str = value; -- assign value to it (first time through the loop)

+

elseif value ~= '' then

+

if value:sub(1, 1) == '<' then -- special case of values enclosed in spans and other markup.

+

comp = value:gsub( "%b<>", "" ); -- remove HTML markup (string -> string)

+

else

+

comp = value;

+

end

+

-- typically duplicate_char is sepc

+

if f.sub(comp, 1, 1) == duplicate_char then -- is first character same as duplicate_char? why test first character?

+

-- Because individual string segments often (always?) begin with terminal punct for the

+

-- preceding segment: 'First element' .. 'sepc next element' .. etc.?

+

trim = false;

+

end_chr = f.sub(str, -1, -1); -- get the last character of the output string

+

-- str = str .. "<HERE(enchr=" .. end_chr .. ")" -- debug stuff?

+

if end_chr == duplicate_char then -- if same as separator

+

str = f.sub(str, 1, -2); -- remove it

+

elseif end_chr == "'" then -- if it might be wiki-markup

+

if f.sub(str, -3, -1) == duplicate_char .. "''" then -- if last three chars of str are sepc''

+

str = f.sub(str, 1, -4) .. "''"; -- remove them and add back ''

+

elseif f.sub(str, -5, -1) == duplicate_char .. "]]''" then -- if last five chars of str are sepc]]''

+

trim = true; -- why? why do this and next differently from previous?

+

elseif f.sub(str, -4, -1) == duplicate_char .. "]''" then -- if last four chars of str are sepc]''

+

trim = true; -- same question

+

end

+

elseif end_chr == "]" then -- if it might be wiki-markup

+

if f.sub(str, -3, -1) == duplicate_char .. "]]" then -- if last three chars of str are sepc]] wikilink

+

trim = true;

+

elseif f.sub(str, -3, -1) == duplicate_char .. '"]' then -- if last three chars of str are sepc"] quoted external link

+

trim = true;

+

elseif f.sub(str, -2, -1) == duplicate_char .. "]" then -- if last two chars of str are sepc] external link

+

trim = true;

+

elseif f.sub(str, -4, -1) == duplicate_char .. "'']" then -- normal case when |url=something & |title=Title.

+

trim = true;

+

end

+

elseif end_chr == " " then -- if last char of output string is a space

+

if f.sub(str, -2, -1) == duplicate_char .. " " then -- if last two chars of str are <sepc><space>

+

str = f.sub(str, 1, -3); -- remove them both

+

end

+

end

−

~~-- This function checks a DOI name for: prefix/suffix. If the doi name contains spaces or endashes,~~

+

if trim then

−

~~-- or,~~ if ~~it ends with a period or a comma, this function will emit a bad_doi error message.~~

+

if value ~= comp then -- value does not equal comp when value contains HTML markup

−

+

local dup2 = duplicate_char;

−

~~-- DOI names are case-insensitive and can incorporate any printable Unicode characters so the test for spaces, endash,~~

+

if f.match(dup2, "%A" ) then dup2 = "%" .. dup2; end -- if duplicate_char not a letter then escape it

−

-- ~~and terminal punctuation may~~ not ~~be technically correct but it appears, that in practice these characters are rarely if ever used in doi names.~~

+

−

+

value = f.gsub(value, "(%b<>)" .. dup2, "%1", 1 ) -- remove duplicate_char if it follows HTML markup

−

local ~~function doi(id, inactive)~~

+

else

−

~~local cat = ""~~

+

value = f.sub(value, 2, -1 ); -- remove duplicate_char when it is first character

−

~~local handler~~ = ~~cfg.id_handlers['DOI']~~;

+

end

−

+

end

−

~~local text;~~

+

end

−

if ~~is_set~~(~~inactive~~) then

+

str = str .. value; -- add it to the output string

−

~~local inactive_year~~ = ~~inactive:match(~~"%~~d%d%d%d~~"~~) or ''~~; -- ~~try to get the year portion from the inactive date~~

−

~~text~~ = ~~"[[" .. handler.link .~~. "|" .. ~~handler.label ..~~ "~~]]:~~" ~~.. id;~~

−

~~if is_set(inactive_year) then~~

−

~~table~~.~~insert~~( ~~z.error_categories~~, ~~"Pages with DOIs inactive since " .. inactive_year~~ );

−

~~else~~

−

~~table~~.~~insert( z~~.~~error_categories, "Pages with inactive DOIs" )~~; -- ~~when inactive doesn't contain a recognizable year~~

end

−

~~inactive = " (" .. cfg.messages['inactive'] .. " " .. inactive .. ")"~~

−

~~else~~

−

~~text = external_link_id({link = handler.link, label = handler.label,~~

−

~~prefix=handler.prefix,id=id,separator=handler.separator, encode=handler.encode})~~

−

~~inactive = ""~~

end

−

+

return str;

−

~~if nil == id:match("^10%.[^%s–]-/[^%s–]-[^%.,]$") then -- doi must begin with '10.', must contain a fwd slash, must not contain spaces or endashes, and must not end with period or comma~~

−

~~cat = ' ' .. set_error( 'bad_doi' )~~;

−

~~end~~

−

~~return text .. inactive .. cat~~

end

−

~~-- Formats an OpenLibrary link, and checks for associated errors.~~

−

~~local function openlibrary(id)~~

−

~~local code = id:match("^%d+([AMW])$"); -- only digits followed by 'A', 'M', or 'W'~~

−

~~local handler = cfg.id_handlers['OL'];~~

−

~~if ( code == "A" ) then~~

−

~~return external_link_id({link=handler.link, label=handler.label,~~

−

~~prefix="http://openlibrary.org/authors/OL",id=id, separator=handler.separator,~~

−

~~encode = handler.encode})~~

−

~~elseif ( code == "M" ) then~~

−

~~return external_link_id({link=handler.link, label=handler.label,~~

−

~~prefix="http://openlibrary.org/books/OL",id=id, separator=handler.separator,~~

−

~~encode = handler.encode})~~

−

~~elseif ( code == "W" ) then~~

−

~~return external_link_id({link=handler.link, label=handler.label,~~

−

~~prefix= "http://openlibrary.org/works/OL",id=id, separator=handler.separator,~~

−

~~encode = handler.encode})~~

−

~~else~~

−

~~return external_link_id({link=handler.link, label=handler.label,~~

−

~~prefix= "http://openlibrary.org/OL",id=id, separator=handler.separator,~~

−

~~encode = handler.encode}) ..~~

−

~~' ' .. set_error( 'bad_ol' );~~

−

~~end~~

−

~~end~~

+

--[[-------------------------------------------------------

−

~~--[[--------------------------< M E S S A G E _ I D >----------------------------------------------------------~~

+

returns true if suffix is properly formed Jr, Sr, or ordinal in the range 1–9.

−

+

Puncutation not allowed.

−

~~Validate and format a usenet message id. Simple error checking~~, ~~looks for 'id-left@id-right' not enclosed~~ in

−

~~'<' and/or '>' angle brackets~~.

]]

−

local function ~~message_id~~ (id)

+

local function is_suffix (suffix)

−

~~local handler = cfg~~.~~id_handlers[~~'~~USENETID~~'];

+

if utilities.in_array (suffix, {'Jr', 'Sr', 'Jnr', 'Snr', '1st', '2nd', '3rd'}) or suffix:match ('^%dth$') then

−

+

return true;

−

~~text = external_link_id({link = handler.link~~, ~~label = handler.label~~,

+

end

−

~~prefix=handler.prefix~~,~~id=id~~,~~separator=handler.separator~~, ~~encode=handler.encode})~~

+

return false;

−

~~if not id:match(~~'~~^.+@.+$~~') or ~~not id~~:match('^~~[^<].*[^>]~~$')then ~~-- doesn't have '@' or has one or first or last character is '< or '>'~~

−

~~text = text .. ' ' .. set_error( 'bad_message_id' ) -- add an error message if the message id is invalid~~

−

end

−

return ~~text~~

end

−

~~--[[--------------------------< S E T _ T I T L E T Y P E >----------------------------------------------------~~

−

~~This function sets default title types (equivalent to the citation including |type=~~<~~default value~~>~~) for those templates that have defaults.~~

+

--[[---------------------------------------

−

~~Also handles the special case where it is desirable to omit the title type from the rendered citation (|type=none).~~

−

]]

+

For Vancouver style, author/editor names are supposed to be rendered in Latin

+

(read ASCII) characters. When a name uses characters that contain diacritical

+

marks, those characters are to be converted to the corresponding Latin

+

character. When a name is written using a non-Latin alphabet or logogram, that

+

name is to be transliterated into Latin characters. The module doesn't do this

+

so editors may/must.

−

~~local function set_titletype (cite_class, title_type)~~

+

This test allows |first= and |last= names to contain any of the letters defined

−

~~if is_set(title_type) then~~

+

in the four Unicode Latin character sets

−

~~if "none"~~ == ~~title_type then~~

+

[http://www.unicode.org/charts/PDF/U0000.pdf C0 Controls and Basic Latin] 0041–005A, 0061–007A

−

~~title_type = ""; -- if |type=none then type parameter not displayed~~

+

[http://www.unicode.org/charts/PDF/U0080.pdf C1 Controls and Latin-1 Supplement] 00C0–00D6, 00D8–00F6, 00F8–00FF

−

~~end~~

+

[http://www.unicode.org/charts/PDF/U0100.pdf Latin Extended-A] 0100–017F

−

~~return title_type;~~ -- ~~if |type= has been set to any other value use that value~~

+

[http://www.unicode.org/charts/PDF/U0180.pdf Latin Extended-B] 0180–01BF, 01C4–024F

−

~~end~~

−

~~return cfg~~.~~title_types [cite_class] or ''; -- set template's default title type; else empty string for concatenation~~

+

|lastn= also allowed to contain hyphens, spaces, and apostrophes.

−

~~end~~

+

(http://www.ncbi.nlm.nih.gov/books/NBK7271/box/A35029/)

+

|firstn= also allowed to contain hyphens, spaces, apostrophes, and periods

−

~~--[~~[-------~~-------------------< C L E~~ A ~~N _ I S B N >--------------------------------------------------~~--------

+

This original test:

+

if nil == mw.ustring.find (last, "^[A-Za-zÀ-ÖØ-öø-ƿǄ-ɏ%-%s%']*$")

+

or nil == mw.ustring.find (first, "^[A-Za-zÀ-ÖØ-öø-ƿǄ-ɏ%-%s%'%.]+[2-6%a]*$") then

+

was written outside of the code editor and pasted here because the code editor

+

gets confused between character insertion point and cursor position. The test has

+

been rewritten to use decimal character escape sequence for the individual bytes

+

of the Unicode characters so that it is not necessary to use an external editor

+

to maintain this code.

−

~~Removes irrelevant text and dashes from ISBN number~~

+

\195\128-\195\150 – À-Ö (U+00C0–U+00D6 – C0 controls)

−

~~Similar to that used for Special:BookSources~~

+

\195\152-\195\182 – Ø-ö (U+00D8-U+00F6 – C0 controls)

+

\195\184-\198\191 – ø-ƿ (U+00F8-U+01BF – C0 controls, Latin extended A & B)

+

\199\132-\201\143 – Ǆ-ɏ (U+01C4-U+024F – Latin extended B)

]]

−

local function ~~clean_isbn~~( ~~isbn_str~~ )

+

local function is_good_vanc_name (last, first, suffix, position)

−

return ~~isbn_str:gsub~~( "[^-0-9X]", "" );

+

if not suffix then

+

if first:find ('[,%s]') then -- when there is a space or comma, might be first name/initials + generational suffix

+

first = first:match ('(.-)[,%s]+'); -- get name/initials

+

suffix = first:match ('[,%s]+(.+)$'); -- get generational suffix

+

end

+

end

+

if utilities.is_set (suffix) then

+

if not is_suffix (suffix) then

+

add_vanc_error (cfg.err_msg_supl.suffix, position);

+

return false; -- not a name with an appropriate suffix

+

end

+

end

+

if nil == mw.ustring.find (last, "^[A-Za-z\195\128-\195\150\195\152-\195\182\195\184-\198\191\199\132-\201\143%-%s%']*$") or

+

nil == mw.ustring.find (first, "^[A-Za-z\195\128-\195\150\195\152-\195\182\195\184-\198\191\199\132-\201\143%-%s%'%.]*$") then

+

add_vanc_error (cfg.err_msg_supl['non-Latin char'], position);

+

return false; -- not a string of Latin characters; Vancouver requires Romanization

+

end;

+

return true;

end

−

~~--[[--------------------------< E S C A P E _ L U A _ M A G I C _ C H A R S >----------------------------------~~

−

~~Returns a string where all~~ of ~~lua's magic characters have been escaped~~. ~~This is important because functions like~~

+

--[[--------------------------< R E D U C E _ T O _ I N I T I A L S >------------------------------------------

−

~~string.gsub() treat their pattern and replace strings as patterns, not literal strings.~~

+

−

]]

+

Attempts to convert names to initials in support of |name-list-style=vanc.

−

~~local function escape_lua_magic_chars (argument)~~

+

−

~~argument~~ = ~~argument:gsub("%%"~~, ~~"%%%%"); -- replace % with %%~~

+

Names in |firstn= may be separated by spaces or hyphens, or for initials, a period.

−

~~argument = argument~~:~~gsub("([%^%$%(%)%~~.~~%[%]%*%+%-%?])", "%%%1"); -- replace all other lua magic pattern characters~~

+

See http://www.ncbi.nlm.nih.gov/books/NBK7271/box/A35062/.

−

~~return argument;~~

−

~~end~~

−

~~--[[--------------------------< S T R I P _ A P O S T R O P H E _ M A R K U P >--------------------------------~~

+

Vancouver style requires family rank designations (Jr, II, III, etc.) to be rendered

+

as Jr, 2nd, 3rd, etc. See http://www.ncbi.nlm.nih.gov/books/NBK7271/box/A35085/.

+

This code only accepts and understands generational suffix in the Vancouver format

+

because Roman numerals look like, and can be mistaken for, initials.

−

~~Strip wiki italic and bold markup from argument so that it doesn't contaminate COinS metadata.~~

+

This function uses ustring functions because firstname initials may be any of the

−

This function ~~strips common patterns~~ of ~~apostrophe markup. We presume that editors who have taken~~ the ~~time to~~

+

Unicode Latin characters accepted by is_good_vanc_name ().

−

~~markup a title have, as a result, provided valid markup. When they don't, some single apostrophes are left behind~~.

]]

−

local function ~~strip_apostrophe_markup~~ (~~argument~~)

+

local function reduce_to_initials(first, position)

−

~~if not is_set~~ (~~argument~~) ~~then return argument~~; ~~end~~

+

local name, suffix = mw.ustring.match(first, "^(%u+) ([%dJS][%drndth]+)$");

−

~~while true do~~

+

if not name then -- if not initials and a suffix

−

if ~~argument:match ("%'%'%'%'%'")~~ then -- ~~bold italic (5)~~

+

name = mw.ustring.match(first, "^(%u+)$"); -- is it just initials?

−

~~argument~~=~~argument:gsub("%'%'%'%'%'", ""); -- remove all instances of it~~

−

~~elseif argument:~~match (~~"%'%'%'%'") then -- italic start and end without content (4)~~

−

~~argument=argument:gsub("%'%'%'%'"~~, "~~");~~

−

~~elseif argument:match~~ (~~"%'%'~~%~~'") then -- bold (3~~)

−

~~argument=argument:gsub("%'%'%'", "~~");

−

~~elseif argument:match ("%'%'") then~~ -- ~~italic (2)~~

−

~~argument=argument:gsub("%'%'", "");~~

−

~~else~~

−

~~break;~~

−

~~end~~

end

−

~~return argument; -- done~~

−

~~end~~

−

--~~[[--------------------------< M A K E _ C O I N S _ T I T L E~~ >--------------------~~--------------------------~~

+

if name then -- if first is initials with or without suffix

−

+

if 3 > mw.ustring.len (name) then -- if one or two initials

−

~~Makes a title~~ for ~~COinS from Title and / or ScriptTitle (or any other name-script pairs)~~

+

if suffix then -- if there is a suffix

−

+

if is_suffix (suffix) then -- is it legitimate?

−

~~Apostrophe markup~~ (~~bold~~, ~~italics) is stripped from each value so that the COinS metadata isn~~'~~t correupted with strings~~

+

return first; -- one or two initials and a valid suffix so nothing to do

−

of %~~27%27...~~

+

else

−

]]

+

add_vanc_error (cfg.err_msg_supl.suffix, position); -- one or two initials with invalid suffix so error message

+

return first; -- and return first unmolested

+

end

+

else

+

return first; -- one or two initials without suffix; nothing to do

+

end

+

end

+

end -- if here then name has 3 or more uppercase letters so treat them as a word

+

local initials, names = {}, {}; -- tables to hold name parts and initials

+

local i = 1; -- counter for number of initials

+

names = mw.text.split (first, '[%s,]+'); -- split into a table of names and possible suffix

−

~~local function make_coins_title~~ (~~title~~, ~~script~~)

+

while names[i] do -- loop through the table

−

if ~~is_set~~ (~~title~~) then

+

if 1 < i and names[i]:match ('[%dJS][%drndth]+%.?$') then -- if not the first name, and looks like a suffix (may have trailing dot)

−

~~title = strip_apostrophe_markup~~ (~~title~~); -- ~~strip any apostrophe markup~~

+

names[i] = names[i]:gsub ('%.', ''); -- remove terminal dot if present

−

~~else~~

+

if is_suffix (names[i]) then -- if a legitimate suffix

−

~~title~~=''; -- ~~if not set, make sure title is an empty string~~

+

table.insert (initials, ' ' .. names[i]); -- add a separator space, insert at end of initials table

+

break; -- and done because suffix must fall at the end of a name

+

end -- no error message if not a suffix; possibly because of Romanization

+

end

+

if 3 > i then

+

table.insert (initials, mw.ustring.sub(names[i], 1, 1)); -- insert the initial at end of initials table

+

end

+

i = i + 1; -- bump the counter

end

−

~~if is_set (script) then~~

+

−

~~script = script:gsub ('^%l%l%s*:%s*', ''); -- remove language prefix if present~~ (~~script value may now be empty string~~)

+

return table.concat(initials) -- Vancouver format does not include spaces.

−

~~script = strip_apostrophe_markup (script); -- strip any apostrophe markup~~

−

~~else~~

−

~~script='';~~ -- if not ~~set, make sure script is an empty string~~

−

~~end~~

−

~~if is_set (title) and is_set (script) then~~

−

~~script = ' ' .. script; -- add a space before we concatenate~~

−

~~end~~

−

~~return title~~ .~~. script; -- return the concatenation~~

end

−

~~--[[--------------------------< G E T _ C O I N S _ P A G E S >------------------------------------------------~~

−

~~Extract page numbers~~ from ~~external wikilinks in any~~ of the ~~|page=~~, ~~|pages=~~, ~~or |at= parameters for use in COinS~~.

+

--[[------------------------------------------------------------

+

extract interwiki prefixen from <value>. Returns two one or two values:

+

false – no prefixen

+

nil – prefix exists but not recognized

+

project prefix, language prefix – when value has either of:

+

:<project>:<language>:<article>

+

:<language>:<project>:<article>

+

project prefix, nil – when <value> has only a known single-letter prefix

+

nil, language prefix – when <value> has only a known language prefix

+

accepts single-letter project prefixen: 'd' (wikidata), 's' (wikisource), and 'w' (wikipedia) prefixes; at this

+

writing, the other single-letter prefixen (b (wikibook), c (commons), m (meta), n (wikinews), q (wikiquote), and

+

v (wikiversity)) are not supported.

]]

−

local function ~~get_coins_pages~~ (~~pages~~)

+

local function interwiki_prefixen_get (value, is_link)

−

~~local pattern;~~

+

if not value:find (':%l+:') then -- if no prefix

−

if not ~~is_set~~ (~~pages~~) then return ~~pages~~; end -- if ~~no page numbers~~ then ~~we're done~~

+

return false; -- abandon; boolean here to distinguish from nil fail returns later

+

end

+

local prefix_patterns_linked_t = { -- sequence of valid interwiki and inter project prefixen

+

'^%[%[:([dsw]):(%l%l+):', -- wikilinked; project and language prefixes

+

'^%[%[:(%l%l+):([dsw]):', -- wikilinked; language and project prefixes

+

'^%[%[:([dsw]):', -- wikilinked; project prefix

+

'^%[%[:(%l%l+):', -- wikilinked; language prefix

+

}

+

local prefix_patterns_unlinked_t = { -- sequence of valid interwiki and inter project prefixen

+

'^:([dsw]):(%l%l+):', -- project and language prefixes

+

'^:(%l%l+):([dsw]):', -- language and project prefixes

+

'^:([dsw]):', -- project prefix

+

'^:(%l%l+):', -- language prefix

+

}

+

local cap1, cap2;

+

for _, pattern in ipairs ((is_link and prefix_patterns_linked_t) or prefix_patterns_unlinked_t) do

+

cap1, cap2 = value:match (pattern);

+

if cap1 then

+

break; -- found a match so stop looking

+

end

+

end

−

~~while true do~~

+

if cap1 and cap2 then -- when both then :project:language: or :language:project: (both forms allowed)

−

~~pattern~~ = ~~pages~~:match("%[(%w*:~~?//~~[^ ]~~+%s+)~~[~~%w%d~~]~~.*%]");~~ -- ~~pattern~~ is the ~~opening bracket~~, ~~the url~~ and ~~following space~~(s)~~: "[url "~~

+

if 1 == #cap1 then -- length == 1 then :project:language:

−

if nil == ~~pattern~~ then ~~break~~; ~~end~~ -- no more ~~urls~~

+

if cfg.inter_wiki_map[cap2] then -- is language prefix in the interwiki map?

−

~~pattern = escape_lua_magic_chars (pattern);~~ -- ~~pattern~~ is ~~not a literal string; escape lua's magic pattern characters~~

+

return cap1, cap2; -- return interwiki project and interwiki language

−

~~pages = pages:gsub(pattern~~, ~~"")~~; -- ~~remove as many instances of pattern as possible~~

+

end

+

else -- here when :language:project:

+

if cfg.inter_wiki_map[cap1] then -- is language prefix in the interwiki map?

+

return cap2, cap1; -- return interwiki project and interwiki language

+

end

+

end

+

return nil; -- unknown interwiki language

+

elseif not (cap1 or cap2) then -- both are nil?

+

return nil; -- we got something that looks like a project prefix but isn't; return fail

+

elseif 1 == #cap1 then -- here when one capture

+

return cap1, nil; -- length is 1 so return project, nil language

+

else -- here when one capture and its length it more than 1

+

if cfg.inter_wiki_map[cap1] then -- is language prefix in the interwiki map?

+

return nil, cap1; -- return nil project, language

+

end

−

~~pages = pages:gsub("[%[%]]", ""); -- remove the brackets~~

−

~~pages = pages:gsub("–", "-" ); -- replace endashes with hyphens~~

−

~~pages = pages:gsub("&%w+;", "-" ); -- and replace html entities (– etc.) with hyphens; do we need to replace numerical entities like   and the like?~~

−

~~return pages;~~

end

−

~~-- Gets the display text for a wikilink like [[A|B]] or [[B]] gives B~~

−

~~local function remove_wiki_link( str )~~

−

~~return (str:gsub( "%[%[([^%[%]]*)%]%]", function(l)~~

−

~~return l:gsub( "^[^|]*|(.*)$", "%1" ):gsub("^%s*(.-)%s*$", "%1");~~

−

~~end));~~

−

~~end~~

−

-- ~~Converts a hyphen to a dash~~

+

--[[--------------------------< L I S T _ P E O P L E >--------------------------

−

~~local function hyphen_to_dash( str )~~

+

−

~~if not is_set(str) or str:match( "~~[%[~~%]{}~~<>~~]" ) ~= nil then~~

+

Formats a list of people (authors, contributors, editors, interviewers, translators)

−

~~return str;~~

−

~~end~~

−

~~return str:gsub~~( ~~'-'~~, ~~'–'~~ );

−

~~end~~

−

-~~-[[--------------------------~~< ~~S A F E _ J O I N~~ >--~~----------------------------------------------------------~~

+

names in the list will be linked when

+

|<name>-link= has a value

+

|<name>-mask- does NOT have a value; masked names are presumed to have been

+

rendered previously so should have been linked there

−

~~Joins a sequence of strings together while checking for duplicate separation characters.~~

+

when |<name>-mask=0, the associated name is not rendered

]]

−

local function ~~safe_join~~( ~~tbl~~, ~~duplicate_char~~ )

+

local function list_people (control, people, etal)

−

--[[

+

local sep;

−

~~Note: we use string functions here, rather than ustring functions~~.

+

local namesep;

+

local format = control.format;

+

local maximum = control.maximum;

+

local name_list = {};

+

if 'vanc' == format then -- Vancouver-like name styling?

+

sep = cfg.presentation['sep_nl_vanc']; -- name-list separator between names is a comma

+

namesep = cfg.presentation['sep_name_vanc']; -- last/first separator is a space

+

else

+

sep = cfg.presentation['sep_nl']; -- name-list separator between names is a semicolon

+

namesep = cfg.presentation['sep_name']; -- last/first separator is <comma><space>

+

end

−

~~This has considerably faster performance and should work correctly as~~

+

if sep:sub (-1, -1) ~= " " then sep = sep .. " " end

−

~~long as the duplicate_char is strict ASCII~~. ~~The strings~~

+

if utilities.is_set (maximum) and maximum < 1 then return "", 0; end -- returned 0 is for EditorCount; not used for other names

−

~~in tbl may be ASCII or UTF8~~.

−

]]

−

~~local str = ''; -- the output string~~

+

for i, person in ipairs (people) do

−

~~local comp = ''; -- what does 'comp' mean?~~

+

if utilities.is_set (person.last) then

−

~~local end_chr = '';~~

+

local mask = person.mask;

−

~~local trim;~~

+

local one;

−

for _, ~~value~~ in ipairs( ~~tbl~~ ) do

+

local sep_one = sep;

−

if ~~value == nil~~ then ~~value~~ = ''; ~~end~~

+

−

+

if utilities.is_set (maximum) and i > maximum then

−

~~if str == '' then -- if output string is empty~~

+

etal = true;

−

~~str~~ = ~~value~~; ~~-- assign value to it (first time through the loop)~~

+

break;

−

~~elseif value ~= '' then~~

−

if ~~value:sub~~(~~1,1~~) ~~== '<'~~ then ~~-- Special case of values enclosed in spans and other markup.~~

−

~~comp~~ = ~~value:gsub( "%b<>", "" )~~; ~~-- remove html markup (string -> string)~~

−

~~else~~

−

~~comp = value~~;

end

−

~~-- typically duplicate_char is sepc~~

+

−

if ~~comp:sub(1,1) == duplicate_char~~ then ~~-- is first charactier same as duplicate_char? why test first character?~~

+

if mask then

−

~~-- Because individual string segments often (always?) begin with terminal punct for th~~

+

local n = tonumber (mask); -- convert to a number if it can be converted; nil else

−

~~-- preceding segment: 'First element' .. 'sepc next element' .. etc?~~

+

if n then

−

~~trim~~ = ~~false;~~

+

one = 0 ~= n and string.rep("—", n) or nil; -- make a string of (n > 0) mdashes, nil else, to replace name

−

~~end_chr = str:sub~~(~~-1,-1~~); -- ~~get the last character of the output string~~

+

person.link = nil; -- don't create link to name if name is replaces with mdash string or has been set nil

−

~~-- str = str .. "<HERE(enchr=" .. end_chr.. ")" -- debug stuff?~~

+

else

−

if ~~end_chr == duplicate_char~~ then ~~-- if same as separator~~

+

one = mask; -- replace name with mask text (must include name-list separator)

−

~~str~~ = ~~str:sub~~(~~1,-2)~~; ~~-- remove it~~

+

sep_one = " "; -- modify name-list separator

−

~~elseif end_chr == "'~~" ~~then -- if it might be wikimarkup~~

−

~~if str:sub(-3~~,-1) ~~== duplicate_char .. "''" then~~ -- ~~if last three chars~~ of ~~str are sepc''~~

−

~~str = str:sub~~(1, ~~-4) .. "''"; -- remove them and add back ''~~

−

~~elseif str:sub(-5,-1) == duplicate_char~~ .~~. "]]''" then -- if last five chars of str are sepc]]''~~

−

~~trim~~ = ~~true~~; -- ~~why? why do this and next differently from previous?~~

−

~~elseif str:sub(-4,-1) == duplicate_char .. "]~~'~~'" then --~~ if ~~last four chars of str are sepc]''~~

−

~~trim = true; -- same question~~

−

~~end~~

−

~~elseif end_chr == "]" then -- if it might be wikimarkup~~

−

~~if str:sub(-3,-1)~~ =~~= duplicate_char .. "]]" then~~ -- ~~if last three chars of str are sepc]] wikilink~~

−

~~trim = true;~~

−

~~elseif str:sub~~(-~~2,-1~~) ~~== duplicate_char .. "]" then -- if last two chars of str are sepc] external link~~

−

~~trim = true;~~

−

~~elseif str:sub(-4,-1) =~~= ~~duplicate_char ..~~ "~~'']~~" ~~then -- normal case when |url=something & |title=Title.~~

−

~~trim = true~~;

−

~~end~~

−

~~elseif end_chr == " " then~~ -- ~~if last char of output string is a space~~

−

~~if str:sub(~~-~~2,-1) == duplicate_char .. " " then -- if last two chars of str are <sepc><space>~~

−

~~str = str:sub(1,-3); -- remove them both~~

−

~~end~~

end

−

+

else

−

~~if trim then~~

+

one = person.last; -- get surname

−

~~if value ~~~= ~~comp then~~ -- ~~value does not equal comp when value contains html markup~~

+

local first = person.first -- get given name

−

local ~~dup2~~ = ~~duplicate_char;~~

+

if utilities.is_set (first) then

−

if ~~dup2:match~~( "%A" ) then ~~dup2 = "%" .. dup2; end~~ -- if ~~duplicate_char not a letter then escape it~~

+

if ("vanc" == format) then -- if Vancouver format

−

+

one = one:gsub ('%.', ''); -- remove periods from surnames (http://www.ncbi.nlm.nih.gov/books/NBK7271/box/A35029/)

−

~~value~~ = ~~value~~:gsub( "(%~~b<>~~)" .. ~~dup2~~, ~~"%1"~~, 1 ) -- ~~remove duplicate_char if it follows html markup~~

+

if not person.corporate and is_good_vanc_name (one, first, nil, i) then -- and name is all Latin characters; corporate authors not tested

−

~~else~~

+

first = reduce_to_initials (first, i); -- attempt to convert first name(s) to initials

−

~~value~~ = ~~value:sub~~( 2, -1 ); -- ~~remove duplicate_char when it is~~ first ~~character~~

+

end

+

one = one .. namesep .. first;

end

−

~~str~~ = ~~str~~ .. ~~value~~; --~~add it to the output string~~

+

if utilities.is_set (person.link) then

−

~~end~~

+

one = utilities.make_wikilink (person.link, one); -- link author/editor

−

~~end~~

+

end

−

~~return str;~~

−

end

−

--~~[[--------------------------~~< ~~I S _ G O O D _ V A N C _ N A M E~~ >--~~------------------------------------------~~

+

if one then -- if <one> has a value (name, mdash replacement, or mask text replacement)

+

local proj, tag = interwiki_prefixen_get (one, true); -- get the interwiki prefixen if present

−

~~For Vancouver Style, author/editor names are supposed to be rendered in Latin~~ (~~read ASCII) characters~~. ~~When a~~ name

+

if 'w' == proj and ('Wikipedia' == mw.site.namespaces.Project['name']) then

−

~~uses characters that contain diacritical marks, those characters are to converted to the corresponding Latin character.~~

+

proj = nil; -- for stuff like :w:de:<article>, :w is unnecessary TODO: maint cat?

−

~~When a name is written using a non~~-~~Latin alphabet or logogram~~, ~~that name~~ is ~~to be transliterated into Latin characters.~~

+

end

−

~~These things are not currently possible in this module so are left to the editor to do.~~

+

if proj then

−

+

proj = ({['d'] = 'Wikidata', ['s'] = 'Wikisource', ['w'] = 'Wikipedia'})[proj]; -- :w (wikipedia) for linking from a non-wikipedia project

−

~~This test allows |first~~= ~~and |last~~= ~~names to contain any of the letters defined in the four Unicode Latin character sets~~

+

if proj then

−

[~~http://www.unicode.org/charts/PDF/U0000.pdf C0 Controls and Basic Latin~~] ~~0041–005A~~, ~~0061–007A~~

+

one = one .. utilities.wrap_style ('interproj', proj); -- add resized leading space, brackets, static text, language name

−

[~~http~~:~~//www~~.~~unicode~~.~~org/charts/PDF/U0080~~.~~pdf C1 Controls and Latin~~-~~1 Supplement] 00C0–00D6~~, ~~00D8–00F6~~, ~~00F8–00FF~~

+

tag = nil; -- unset; don't do both project and language

−

~~[http~~:~~//www~~.~~unicode~~.~~org/charts/PDF/U0100~~.~~pdf Latin Extended~~-~~A] 0100–017F~~

+

end

−

~~[http://www~~.~~unicode~~.~~org/charts/PDF/U0180~~.~~pdf Latin Extended~~-~~B] 0180–01BF~~, ~~01C4–024F~~

+

end

+

if tag == cfg.this_wiki_code then

+

tag = nil; -- stuff like :en:<article> at en.wiki is pointless TODO: maint cat?

+

end

+

if tag then

+

local lang = cfg.lang_tag_remap[tag] or cfg.mw_languages_by_tag_t[tag];

+

if lang then -- error messaging done in extract_names() where we know parameter names

+

one = one .. utilities.wrap_style ('interwiki', lang); -- add resized leading space, brackets, static text, language name

+

end

+

end

−

~~|lastn= also allowed~~ to ~~contain hyphens, spaces, and apostrophes~~. (~~http://www.ncbi.nlm.nih.gov/books/NBK7271/box/A35029/~~)

+

table.insert (name_list, one); -- add it to the list of names

−

~~|firstn= also allowed to contain hyphens, spaces, apostrophes, and periods~~

+

table.insert (name_list, sep_one); -- add the proper name-list separator

+

end

+

end

+

end

−

~~At the time~~ of ~~this writing, I had to write the~~ 'if ~~nil~~ == mw.~~ustring.find~~ ...' ~~test ouside of the code editor~~ and ~~past it here~~

+

local count = #name_list / 2; -- (number of names + number of separators) divided by 2

−

~~because~~ the ~~code editor gets confused between character insertion point and cursor position.~~

+

if 0 < count then

+

if 1 < count and not etal then

+

if 'amp' == format then

+

name_list[#name_list-2] = " & "; -- replace last separator with ampersand text

+

elseif 'and' == format then

+

if 2 == count then

+

name_list[#name_list-2] = cfg.presentation.sep_nl_and; -- replace last separator with 'and' text

+

else

+

name_list[#name_list-2] = cfg.presentation.sep_nl_end; -- replace last separator with '(sep) and' text

+

end

+

end

+

end

+

name_list[#name_list] = nil; -- erase the last separator

+

end

−

]]

+

local result = table.concat (name_list); -- construct list

−

+

if etal and utilities.is_set (result) then -- etal may be set by |display-authors=etal but we might not have a last-first list

−

local ~~function is_good_vanc_name~~ (~~last, first~~)

+

result = result .. sep .. cfg.messages['et al']; -- we've got a last-first list and etal so add et al.

−

if ~~nil == mw~~.~~ustring.find~~ (~~last, "^[A~~-Za-zÀ-ÖØ-~~öø-ƿǄ-ɏ%-%s%']*$") or nil~~ =~~= mw~~.~~ustring~~.~~find (first, "^~~[~~A-Za-zÀ-ÖØ-öø-ƿǄ-ɏ%-%s%~~'%.]*$") then

+

end

−

~~if true ~= Page_in_vanc_error_cat then~~ -- if we ~~haven~~'~~t been here before then set~~ a ~~sticky flag~~

+

−

~~Page_in_vanc_error_cat=true; -~~- so ~~that if there are more than one error the category is added only once~~

+

return result, count; -- return name-list string and count of number of names (count used for editor names only)

−

~~table.insert( z~~.~~message_tail, { set_error( 'vancouver', {}, true ) } );~~

−

end

−

return ~~false~~; -- ~~not a~~ string of ~~latin characters; Vancouver required Romanization~~

−

~~end;~~

−

~~return true;~~

end

−

~~--[[--------------------------< R E D U C E _ T O _ I N I T I A L S >------------------------------------------~~

−

~~Attempts to convert names to initials in support of |name~~-~~list~~-~~format=vanc.~~

+

--[[--------------------< M A K E _ C I T E R E F _ I D >-----------------------

−

~~Names in |firstn= may be separated by spaces~~ or ~~hyphens, or for initials,~~ a ~~period. See http://www.ncbi.nlm.nih~~.~~gov/books/NBK7271/box/A35062/~~.

+

Generates a CITEREF anchor ID if we have at least one name or a date. Otherwise

+

returns an empty string.

−

~~Vancouver style requires family rank designations (Jr~~, II, ~~III, etc) to be rendered as Jr, 2nd, 3rd, etc~~. ~~This form~~ is ~~not~~

+

namelist is one of the contributor-, author-, or editor-name lists chosen in that

−

~~currently supported by this code so correctly formed names like Smith JL 2nd are converted to Smith J2. See http://www.ncbi.nlm.nih.gov/books/NBK7271/box/A35085/.~~

+

order. year is Year or anchor_year.

−

~~This function uses ustring functions because firstname initials may be any of the unicode Latin characters accepted by is_good_vanc_name ()~~.

]]

−

local function ~~reduce_to_initials~~(~~first)~~

+

local function make_citeref_id (namelist, year)

−

~~if mw.ustring.match(first~~, ~~"^%u%u$"~~) ~~then return first end; -- when first contains just two upper-case letters, nothing to do~~

+

local names={}; -- a table for the one to four names and year

−

local ~~initials~~ = {}

+

for i,v in ipairs (namelist) do -- loop through the list and take up to the first four last names

−

~~local i = 0~~; -- ~~counter~~ for ~~number of initials~~

+

names[i] = v.last

−

for ~~word~~ in ~~mw.ustring.gmatch~~(~~first, "[^%s%.%-]+"~~) do -- names ~~separated by spaces, hyphens, or periods~~

+

if i == 4 then break end -- if four then done

−

table.insert(~~initials~~, mw.~~ustring~~.~~sub~~(~~word,1,1~~)) -- ~~Vancouver format does~~ not ~~include full stops.~~

+

end

−

~~i = i + 1~~; -- ~~bump~~ the ~~counter~~

+

table.insert (names, year); -- add the year at the end

−

~~if 2 <= i then break~~; ~~end~~ -- ~~only two initials allowed~~ in ~~Vancouver system; if 2, quit~~

+

local id = table.concat(names); -- concatenate names and year for CITEREF id

+

if utilities.is_set (id) then -- if concatenation is not an empty string

+

return "CITEREF" .. id; -- add the CITEREF portion

+

else

+

return ''; -- return an empty string; no reason to include CITEREF id in this citation

end

−

~~return table.concat(initials) -- Vancouver format does not include spaces.~~

end

−

~~--[[--------------------------< L I S T _ P E O P L E >-------------------------------------------------------~~

−

~~Formats a list of people (e~~.g. ~~authors / editors)~~

+

--[[--------------------------< C I T E _ C L A S S _A T T R I B U T E _M A K E >------------------------------

+

construct <cite> tag class attribute for this citation.

+

<cite_class> – config.CitationClass from calling template

+

<mode> – value from |mode= parameter

]]

−

local function ~~list_people~~(~~control~~, ~~people, etal~~)

+

local function cite_class_attribute_make (cite_class, mode)

−

local ~~sep;~~

+

local class_t = {};

−

~~local namesep~~;

+

table.insert (class_t, 'citation'); -- required for blue highlight

−

~~local format = control~~.~~format~~

+

if 'citation' ~= cite_class then

−

~~local maximum = control.maximum~~

+

table.insert (class_t, cite_class); -- identify this template for user css

−

~~local lastauthoramp = control.lastauthoramp~~;

+

table.insert (class_t, utilities.is_set (mode) and mode or 'cs1'); -- identify the citation style for user css or javascript

−

~~local text = {}~~

−

if '~~vanc~~' =~~= format~~ then ~~-- Vancouver-like author/editor name styling?~~

−

~~sep = '~~,'; -- ~~name-list separator between authors is a comma~~

−

~~namesep =~~ ' '; -- ~~last/first separator is a space~~

else

−

~~sep =~~ ';~~' -- name-list separator between authors is a semicolon~~

+

table.insert (class_t, utilities.is_set (mode) and mode or 'cs2'); -- identify the citation style for user css or javascript

−

~~namesep = ', '~~ -- ~~last/first separator is <comma><space>~~

end

−

+

for _, prop_key in ipairs (z.prop_keys_t) do

−

~~if sep:sub(-1,-1) ~= " " then sep = sep .. " " end~~

+

table.insert (class_t, prop_key); -- identify various properties for user css or javascript

−

~~if is_set (maximum) and maximum < 1 then return "", 0; end -- returned 0 is for EditorCount; not used~~ for ~~authors~~

−

~~for i~~,~~person~~ in ipairs(~~people~~) do

−

~~if is_set(person~~.~~last) then~~

−

~~local mask = person.mask~~

−

~~local one~~

−

~~local sep_one = sep;~~

−

~~if is_set~~ (~~maximum) and i > maximum then~~

−

~~etal = true;~~

−

~~break;~~

−

~~elseif (mask ~= nil) then~~

−

~~local n = tonumber(mask)~~

−

~~if (n ~= nil) then~~

−

~~one = string.rep("—"~~,n)

−

~~else~~

−

~~one = mask~~;

−

~~sep_one = " ";~~

−

~~end~~

−

~~else~~

−

~~one = person.last~~

−

~~local first = person.first~~

−

~~if is_set(first) then~~

−

~~if ( "vanc" == format ) then~~ -- ~~if vancouver format~~

−

~~one = one:gsub ('%.', ''); -- remove periods from surnames (http://www.ncbi.nlm.nih.gov/books/NBK7271/box/A35029/)~~

−

~~if is_good_vanc_name (one, first) then -- and name is all Latin characters~~

−

~~first = reduce_to_initials(first) -- attempt to convert first name(s) to initials~~

−

~~end~~

−

~~end~~

−

~~one = one .. namesep .. first~~

−

~~end~~

−

~~if is_set(person.link) and person.link ~= control.page_name then~~

−

~~one = "[[" .. person.link .. "|" .. one .. "]]" -- link author/editor if this page is not the author's/editor's page~~

−

~~end~~

−

~~if is_set(person.link) and ((nil ~= person.link:find("//"))~~ or ~~(nil ~= person.link:find("[%[%]]"))) then~~

−

~~one = one .. " " .. set_error( 'bad_authorlink' ) end -- url or wikilink in author link;~~

−

~~end~~

−

~~table.insert( text, one )~~

−

~~table.insert( text, sep_one )~~

−

~~end~~

end

−

~~local count = #text / 2;~~

+

return table.concat (class_t, ' '); -- make a big string and done

−

~~if count > 0 then~~

−

~~if count > 1 and is_set(lastauthoramp) and not etal then~~

−

~~text[#text-2] = " & ";~~

−

~~end~~

−

~~text[#text] = nil;~~

−

~~end~~

−

~~local result =~~ table.concat(~~text~~) -- ~~construct list~~

−

~~if etal then~~

−

~~local etal_text = cfg.messages['et al'];~~

−

~~result = result .. " " .. etal_text;~~

−

~~end~~

−

~~return result, count~~

end

−

~~--[[--------------------------< A N C H O R _ I D >------------------------------------------------------------~~

−

~~Generates a CITEREF anchor ID if we have at least one~~ name ~~or a date~~. ~~Otherwise~~ returns ~~an empty string~~.

+

--[[---------------------< N A M E _ H A S _ E T A L >--------------------------

+

Evaluates the content of name parameters (author, editor, etc.) for variations on

+

the theme of et al. If found, the et al. is removed, a flag is set to true and

+

the function returns the modified name and the flag.

+

This function never sets the flag to false but returns its previous state because

+

it may have been set by previous passes through this function or by the associated

+

|display-<names>=etal parameter

]]

−

local function ~~anchor_id~~( ~~options~~ )

+

local function name_has_etal (name, etal, nocat, param)

−

local id = ~~table~~.~~concat~~( ~~options~~ ); -- ~~concatenate names and year for CITEREF id~~

+

−

if ~~is_set~~ (id) then -- if ~~concatenation~~ is ~~not an empty string~~

+

if utilities.is_set (name) then -- name can be nil in which case just return

−

~~return "CITEREF" .. id~~; -- ~~add the CITEREF portion~~

+

local patterns = cfg.et_al_patterns; -- get patterns from configuration

−

~~else~~

+

−

~~return~~ ''; -- ~~return~~ an ~~empty string; no reason to include CITEREF id in this citation~~

+

for _, pattern in ipairs (patterns) do -- loop through all of the patterns

+

if name:match (pattern) then -- if this 'et al' pattern is found in name

+

name = name:gsub (pattern, ''); -- remove the offending text

+

etal = true; -- set flag (may have been set previously here or by |display-<names>=etal)

+

if not nocat then -- no categorization for |vauthors=

+

utilities.set_message ('err_etal', {param}); -- and set an error if not added

+

end

+

end

+

end

+

return name, etal;

end

−

~~--[[--------------------------< E X T R A C T _ N A M E S >----------------------------------------------------~~

−

~~Gets name list from the input arguments~~

−

~~Searches through args in sequential order to find |lastn=~~ and ~~|firstn= parameters (or their aliases), and their matching link and mask parameters~~.

+

--[[---------------------< N A M E _ I S _ N U M E R I C >----------------------

−

+

−

~~find |last4= and |last5= then the search is done~~.

+

Add an error message and category when <name> parameter value does not contain letters.

+

Add a maintenance category when <name> parameter value has numeric characters mixed with characters that are

+

not numeric characters; could be letters and/or punctuation characters.

−

This function ~~emits an~~ error message ~~when there is a |firstn= without a matching |lastn=~~. ~~When there are 'holes' in~~ the ~~list of last names, |last1= and |last3=~~

+

This function will only emit one error and one maint message for the current template. Does not emit both error

−

~~are present but |last2= is missing, an error message is emitted. |lastn= is not required to have a matching |firstn=~~.

+

and maint messages/categories for the same parameter value.

−

~~When an author or editor parameter contains some form of 'et al.', the 'et al.' is stripped from the parameter and a flag (etal) returned~~

+

returns nothing

−

~~that will cause list_people() to add the static 'et al.' text from Module:Citation/CS1/Configuration. This keeps 'et al.' out of the~~

−

~~template's metadata. When this occurs, the page is added to a maintenance category.~~

]]

−

local function ~~extract_names~~(~~args~~, list_name)

+

local function name_is_numeric (name, name_alias, list_name)

−

local ~~names~~ = {~~}; -- table of names~~

+

local patterns = {

−

~~local last; -- individual name components~~

+

'^%D+%d', -- <name> must have digits preceded by other characters

−

~~local first;~~

+

'^%D*%d+%D+', -- <name> must have digits followed by other characters

−

~~local link;~~

+

}

−

~~local mask;~~

−

~~local i = 1; -- loop counter/indexer~~

−

~~local n = 1; -- output table indexer~~

−

~~local count = 0;~~ ~~-- used to count the number of times we haven~~'~~t found a |last= (or alias for authors~~, ~~|editor~~-~~last or alias for editors)~~

−

~~local etal=false;~~ ~~-- return value set to true when we find some form of et al. in an author parameter~~

−

local pattern = ",? *'*~~[Ee][Tt] *[Aa][Ll][~~%~~.']*$" -- variations on the 'et al' theme~~

−

~~local err_msg_list_name = list_name:match ("(~~%w+~~)List") ..~~ '~~s list';~~ -- ~~modify AuthorList or EditorList for use in error messages if necessary~~

−

~~while true do~~

+

if not added_numeric_name_errs and mw.ustring.match (name, '^[%A]+$') then -- if we have not already set an error message and <name> does not have any alpha characters

−

~~last = select_one~~( ~~args~~, ~~cfg.aliases~~[~~list_name .. '-Last'~~]~~, 'redundant_parameters~~'~~, i~~ ); -- ~~search through args for~~ name ~~components beginning at 1~~

+

utilities.set_message ('err_numeric_names', name_alias); -- add an error message

−

~~first = select_one~~( ~~args, cfg.aliases[list_name ..~~ '~~-First'], 'redundant_parameters~~', i );

+

added_numeric_name_errs = true; -- set the flag so we emit only one error message

−

~~link~~ = ~~select_one( args, cfg.aliases[list_name .. '~~-~~Link'], 'redundant_parameters', i );~~

+

return; -- when here no point in further testing; abandon

−

~~mask = select_one( args, cfg.aliases[list_name .. '~~-~~Mask'], 'redundant_parameters', i )~~;

+

end

−

~~local name = tostring~~(~~last~~);

+

if not added_numeric_name_maint then -- if we have already set a maint message

−

if ~~name:~~match (pattern) then -- ~~varients on et al~~.

+

for _, pattern in ipairs (patterns) do -- spin through list of patterns

−

~~last = name:gsub~~ (~~pattern,~~ ''); -- ~~if found, remove~~

+

if mw.ustring.match (name, pattern) then -- digits preceded or followed by anything but digits; %D+ includes punctuation

−

~~etal~~ = true;

+

utilities.set_message ('maint_numeric_names', cfg.special_case_translation [list_name]); -- add a maint cat for this template

−

~~end~~

+

added_numeric_name_maint = true; -- set the flag so we emit only one maint message

−

~~name = tostring(first);~~

+

return; -- when here no point in further testing; abandon

−

~~if name:match (pattern) then~~ -- ~~varients on et al.~~

+

end

−

~~first = name:gsub (pattern, '')~~; -- ~~if found, remove~~

−

~~etal = true;~~

end

+

end

+

end

+

--[[-----------------< N A M E _ H A S _ M U L T _ N A M E S >------------------

+

Evaluates the content of last/surname (authors etc.) parameters for multiple names.

+

Multiple names are indicated if there is more than one comma or any "unescaped"

+

semicolons. Escaped semicolons are ones used as part of selected HTML entities.

+

If the condition is met, the function adds the multiple name maintenance category.

−

if first ~~and~~ not ~~last then -- if there is~~ a ~~firstn without~~ a ~~matching lastn~~

+

Same test for first except that commas should not appear in given names (MOS:JR says

−

~~table~~.~~insert~~( ~~z.message_tail~~, ~~{ set_error~~( '~~first_missing_last~~', ~~{err_msg_list_name, i}, true ) }~~ ); -- ~~add this error message~~

+

that the generational suffix does not take a separator character). Titles, degrees,

−

~~elseif not first and not last then -- if both firstn and lastn aren~~'~~t found~~, ~~are we done?~~

+

postnominals, affiliations, all normally comma separated don't belong in a citation.

−

~~count = count + 1~~; -- number of ~~times we haven't found last and first~~

+

−

~~if 2 ==~~ count ~~then~~ -- ~~two missing names and we give up~~

+

<name> – name parameter value

−

~~break;~~ -- ~~normal exit or~~ there is ~~a two~~-~~name hole in~~ the ~~list; can't tell which~~

+

<list_name> – AuthorList, EditorList, etc

−

~~end~~

+

<limit> – number of allowed commas; 1 (default) for surnames; 0 for given names

−

~~else~~ -- ~~we have last with or without a first~~

+

−

~~names[n] = {last = last~~, ~~first~~ = ~~first~~, ~~link = link, mask = mask}~~; -- ~~add this name to our names list~~

+

returns nothing

−

~~n = n +~~ 1; -- ~~point~~ to ~~next location in the names table~~

+

−

~~if 1 == count then~~ -- if ~~the previous name was missing~~

+

]]

−

~~table~~.~~insert( z.message_tail, { set_error~~( '~~missing_name~~', ~~{err_msg_list_name, i-1}, true ) }~~ ); -- add ~~this error~~ message

+

−

~~end~~

+

local function name_has_mult_names (name, list_name, limit)

−

~~count = 0; -- reset the counter, we're looking for two consecutive missing names~~

+

local _, commas, semicolons, nbsps;

+

limit = limit and limit or 1;

+

if utilities.is_set (name) then

+

_, commas = name:gsub (',', ''); -- count the number of commas

+

_, semicolons = name:gsub (';', ''); -- count the number of semicolons

+

-- nbsps probably should be its own separate count rather than merged in

+

-- some way with semicolons because Lua patterns do not support the

+

-- grouping operator that regex does, which means there is no way to add

+

-- more entities to escape except by adding more counts with the new

+

-- entities

+

_, nbsps = name:gsub (' ',''); -- count nbsps

+

-- There is exactly 1 semicolon per   entity, so subtract nbsps

+

-- from semicolons to 'escape' them. If additional entities are added,

+

-- they also can be subtracted.

+

if limit < commas or 0 < (semicolons - nbsps) then

+

utilities.set_message ('maint_mult_names', cfg.special_case_translation [list_name]); -- add a maint message

end

−

~~i = i + 1; -- point to next args location~~

−

~~end~~

−

~~if true == etal then~~

−

~~add_maint_cat ('etal');~~

end

−

~~return names, etal; -- all done, return our list of names~~

end

−

~~-- Populates ID table from arguments using configuration settings~~

−

~~local function extract_ids( args )~~

−

~~local id_list = {};~~

−

~~for k, v in pairs( cfg.id_handlers ) do~~

−

~~v = select_one( args, v.parameters, 'redundant_parameters' );~~

−

~~if is_set(v) then id_list[k] = v; end~~

−

~~end~~

−

~~return id_list;~~

−

~~end~~

−

--[[--------------------------< ~~B U~~ I ~~L D~~ _ I ~~D _ L I S T~~ >--------------------------------------------------------

+

--[=[-----------------------------------------------------------------------------------

+

Compares values assigned to various parameters according to the string provided as <item> in the function call.

+

<item> can have on of two values:

+

'generic_names' – for name-holding parameters: |last=, |first=, |editor-last=, etc

+

'generic_titles' – for |title=

+

There are two types of generic tests. The 'accept' tests look for a pattern that should not be rejected by the

+

'reject' test. For example,

+

|author=[[John Smith (author)|Smith, John]]

+

would be rejected by the 'author' reject test. But piped wikilinks with 'author' disambiguation should not be

+

rejected so the 'accept' test prevents that from happening. Accept tests are always performed before reject

+

tests.

+

Each of the 'accept' and 'reject' sequence tables hold tables for en.wiki (['en']) and local.wiki (['local'])

+

that each can hold a test sequence table The sequence table holds, at index [1], a test pattern, and, at index

+

[2], a boolean control value. The control value tells string.find() or mw.ustring.find() to do plain-text search (true)

+

or a pattern search (false). The intent of all this complexity is to make these searches as fast as possible so

+

that we don't run out of processing time on very large articles.

−

~~Takes~~ a ~~table of IDs and turns it into a table of formatted ID outputs.~~

+

Returns

+

true when a reject test finds the pattern or string

+

false when an accept test finds the pattern or string

+

nil else

−

]]

+

]=]

−

local function ~~build_id_list~~( ~~id_list~~, ~~options~~ )

+

local function is_generic (item, value, wiki)

−

local ~~new_list~~, ~~handler~~ = {};

+

local test_val;

+

local str_lower = { -- use string.lower() for en.wiki (['en']) and use mw.ustring.lower() or local.wiki (['local'])

+

['en'] = string.lower,

+

['local'] = mw.ustring.lower,

+

}

+

local str_find = { -- use string.find() for en.wiki (['en']) and use mw.ustring.find() or local.wiki (['local'])

+

['en'] = string.find,

+

['local'] = mw.ustring.find,

+

}

−

function ~~fallback~~(k) ~~return { __index =~~ function(~~t,i~~) ~~return cfg.id_handlers~~[k][i] ~~end } end;~~

+

local function test (val, test_t, wiki) -- local function to do the testing; <wiki> selects lower() and find() functions

−

+

val = test_t[2] and str_lower[wiki](value) or val; -- when <test_t[2]> set to 'true', plaintext search using lowercase value

−

~~for k, v in pairs~~( ~~id_list~~ ) do

+

return str_find[wiki] (val, test_t[1], 1, test_t[2]); -- return nil when not found or matched

−

-- ~~fallback~~ to ~~read-only cfg~~

+

end

−

~~handler = setmetatable~~( { [~~'id'~~] ~~= v }~~, ~~fallback(k)~~ );

−

~~if handler.mode =~~= '~~external~~' ~~then~~

+

local test_types_t = {'accept', 'reject'}; -- test accept patterns first, then reject patterns

−

~~table.insert( new_list~~, ~~{handler.label, external_link_id( handler ) } );~~

+

local wikis_t = {'en', 'local'}; -- do tests for each of these keys; en.wiki first, local.wiki second

−

~~elseif handler.mode ==~~ '~~internal~~' ~~then~~

+

−

~~table.insert( new_list, {handler.label, internal_link_id( handler )~~ } );

+

for _, test_type in ipairs (test_types_t) do -- for each test type

−

~~elseif handler.mode ~= 'manual'~~ then

+

for _, generic_value in pairs (cfg.special_case_translation[item][test_type]) do -- spin through the list of generic value fragments to accept or reject

−

~~error( cfg.messages['unknown_ID_mode'] );~~

+

for _, wiki in ipairs (wikis_t) do

−

~~elseif k =~~= '~~DOI~~' ~~then~~

+

if generic_value[wiki] then

−

~~table.insert( new_list~~, ~~{handler.label, doi( v, options.DoiBroken ) } );~~

+

if test (value, generic_value[wiki], wiki) then -- go do the test

−

~~elseif k ==~~ '~~ARXIV~~' ~~then~~

+

return ('reject' == test_type); -- param value rejected, return true; false else

−

~~table.insert( new_list, {handler.label, arxiv( v, options.Class )~~ } );

+

end

−

~~elseif k == 'ASIN' then~~

+

end

−

~~table.insert( new_list, {handler.label, amazon( v, options.ASINTLD ) } )~~;

+

end

−

~~elseif k == 'LCCN' then~~

−

~~table~~.~~insert( new_list~~, ~~{handler~~.~~label, lccn( v ) } );~~

−

~~elseif k == 'OL' then~~

−

~~table.insert( new_list, {handler.label~~, ~~openlibrary~~( v ) ~~} );~~

−

~~elseif k == 'PMC' then~~

−

~~table.insert( new_list~~, ~~{handler.label, pmc~~( ~~v, options~~.~~Embargo~~ ) ~~} );~~

−

~~elseif k == 'PMID' then~~

−

~~table.insert( new_list, {handler.label~~, ~~pmid~~( v ) ~~} );~~

−

~~elseif k == 'ISSN'~~ then

−

~~table.insert~~( ~~new_list~~, ~~{handler.label~~, ~~issn( v~~ ) ~~} );~~

−

~~elseif k == 'ISBN'~~ then

−

~~local ISBN = internal_link_id( handler );~~

−

~~if not check_isbn( v ) and not is_set(options.IgnoreISBN) then~~

−

~~ISBN = ISBN .. set_error~~( '~~bad_isbn~~'~~, {}, false, " ", ""~~ );

−

~~end~~

−

~~table.insert( new_list~~, ~~{handler.label, ISBN } )~~;

−

~~elseif k == 'USENETID' then~~

−

~~table.insert( new_list, {handler.label, message_id( v ) } );~~

−

~~else~~

−

~~error( cfg.messages['unknown_manual_ID'] );~~

end

−

+

end

−

~~function comp~~( a~~, b ) --~~ used in ~~following table.sort()~~

+

−

~~return a[1~~] ~~< b[1~~];

+

−

~~end~~

+

--[[--------------------------< N A M E _ I S _ G E N E R I C >------------------------------------------------

−

+

−

~~table.sort~~( ~~new_list~~, ~~comp~~ );

+

calls is_generic() to determine if <name> is a 'generic name' listed in cfg.generic_names; <name_alias> is the

−

~~for k~~, ~~v in ipairs( new_list~~ ) do

+

parameter name used in error messaging

−

~~new_list[k]~~ = ~~v[2]~~;

+

]]

+

local function name_is_generic (name, name_alias)

+

if not added_generic_name_errs and is_generic ('generic_names', name) then

+

utilities.set_message ('err_generic_name', name_alias); -- set an error message

+

added_generic_name_errs = true;

end

−

~~return new_list;~~

end

−

-- ~~COinS metadata (see~~ <~~http://ocoins.info/~~>~~) allows automated tools to parse~~

+

−

-- the ~~citation information~~.

+

--[[--------------------------< N A M E _ C H E C K S >--------------------------------------------------------

−

local function ~~COinS~~(~~data~~, ~~class~~)

+

−

if ~~'table' ~~~= ~~type~~(~~data~~) or ~~nil == next~~(~~data~~) ~~then~~

+

This function calls various name checking functions used to validate the content of the various name-holding parameters.

−

~~return '';~~

+

]]

+

local function name_checks (last, first, list_name, last_alias, first_alias)

+

local accept_name;

+

if utilities.is_set (last) then

+

last, accept_name = utilities.has_accept_as_written (last); -- remove accept-this-as-written markup when it wraps all of <last>

+

if not accept_name then -- <last> not wrapped in accept-as-written markup

+

name_has_mult_names (last, list_name); -- check for multiple names in the parameter

+

name_is_numeric (last, last_alias, list_name); -- check for names that have no letters or are a mix of digits and other characters

+

name_is_generic (last, last_alias); -- check for names found in the generic names list

+

end

−

+

−

~~local ctx_ver~~ = ~~"Z39~~.88-~~2004";~~

+

if utilities.is_set (first) then

−

+

first, accept_name = utilities.has_accept_as_written (first); -- remove accept-this-as-written markup when it wraps all of <first>

−

-- ~~treat table strictly~~ as ~~an array with only set values.~~

+

−

~~local OCinSoutput = setmetatable~~( {}, {

+

if not accept_name then -- <first> not wrapped in accept-as-written markup

−

~~__newindex = function~~(~~self~~, ~~key~~, ~~value~~)

+

name_has_mult_names (first, list_name, 0); -- check for multiple names in the parameter; 0 is number of allowed commas in a given name

−

~~if is_set~~(~~value) then~~

+

name_is_numeric (first, first_alias, list_name); -- check for names that have no letters or are a mix of digits and other characters

−

~~rawset( self, #self+1, table.concat{ key, '='~~, ~~mw.uri.encode( remove_wiki_link( value ) ) }~~ );

+

name_is_generic (first, first_alias); -- check for names found in the generic names list

−

~~end~~

end

−

~~});~~

+

local wl_type, D = utilities.is_wikilink (first);

−

+

if 0 ~= wl_type then

−

~~if is_set(data.Chapter) then~~

+

first = D;

−

~~OCinSoutput.rft_val_fmt = "info:ofi/fmt:kev:mtx:book";~~

+

utilities.set_message ('err_bad_paramlink', first_alias);

−

~~OCinSoutput["rft.genre"] = "bookitem";~~

−

~~OCinSoutput["rft.atitle"] = data.Chapter;~~

−

~~OCinSoutput["rft.btitle"]~~ = ~~data~~.~~Title;~~

−

~~elseif is_set~~(~~data.Periodical~~) ~~then~~

−

~~OCinSoutput.rft_val_fmt = "info:ofi/fmt:kev:mtx:journal"~~;

−

if ~~'arxiv' =~~= ~~class~~ then

−

~~OCinSoutput["rft.genre"]~~ = ~~"preprint"~~; ~~-- cite arxiv~~

−

~~else~~

−

~~OCinSoutput["rft~~.~~genre"] = "article"~~;

end

−

~~OCinSoutput["rft.jtitle"] = data.Periodical;~~

−

~~OCinSoutput["rft.atitle"] = data.Title;~~

−

~~else~~

−

~~OCinSoutput.rft_val_fmt = "info:ofi/fmt:kev:mtx:book";~~

−

~~OCinSoutput["rft.genre"] = "book"~~

−

~~OCinSoutput["rft.btitle"] = data.Title;~~

end

−

+

−

~~OCinSoutput["rft.place"] = data.PublicationPlace;~~

+

return last, first; -- done

−

~~OCinSoutput["rft.date"] = data.Date;~~

−

~~OCinSoutput["rft.series"] = data.Series;~~

−

~~OCinSoutput["rft.volume"] = data.Volume;~~

−

~~OCinSoutput["rft.issue"] = data.Issue;~~

−

~~OCinSoutput["rft.pages"] = data.Pages;~~

−

~~OCinSoutput["rft.edition"] = data.Edition;~~

−

~~OCinSoutput["rft.pub"] = data.PublisherName;~~

−

~~for k, v in pairs( data.ID_list ) do~~

−

~~local id, value = cfg.id_handlers[k].COinS;~~

−

~~if k == 'ISBN' then value = clean_isbn( v ); else value = v; end~~

−

~~if string.sub( id or "", 1, 4 ) == 'info' then~~

−

~~OCinSoutput["rft_id"] = table.concat{ id, "/", v };~~

−

~~else~~

−

~~OCinSoutput[ id ] = value;~~

−

~~end~~

−

~~end~~

−

~~local last, first;~~

−

~~for k, v in ipairs( data.Authors ) do~~

−

~~last, first = v.last, v.first;~~

−

~~if k == 1 then~~

−

~~if is_set(~~last~~) then~~

−

~~OCinSoutput["rft.aulast"] = last;~~

−

~~end~~

−

~~if is_set(first) then~~

−

~~OCinSoutput["rft.aufirst"] = first;~~

−

~~end~~

−

~~end~~

−

~~if is_set(last) and is_set(first) then~~

−

~~OCinSoutput["rft.au"] = table.concat{ last, ", ", first };~~

−

~~elseif is_set(last) then~~

−

~~OCinSoutput["rft.au"] = last;~~

−

~~end~~

−

~~end~~

−

~~OCinSoutput.rft_id = data.URL;~~

−

~~OCinSoutput.rfr_id = table.concat{ "info:sid/", mw.site.server:match( "[^/]*$" ), ":"~~, ~~data.RawPage };~~

−

~~OCinSoutput = setmetatable( OCinSoutput, nil );~~

−

~~-- sort with version string always~~ first~~, and combine.~~

−

~~table.sort( OCinSoutput );~~

−

~~table.insert( OCinSoutput, 1, "ctx_ver=" .. ctx_ver )~~; -- ~~such as "Z39.88~~-~~2004"~~

−

~~return table.concat(OCinSoutput, "&");~~

end

−

--[[~~----~~----------------------< G E T _ I S ~~O 6 3 9 _ C O D E~~ >~~-----------------------~~-------------------------

+

--[[----------------------< E X T R A C T _ N A M E S >-------------------------

−

~~Validates language names provided in |language= parameter if not an ISO639-1 code. Handles~~ the ~~special case that is Norwegian where~~

+

Gets name list from the input arguments

−

~~ISO639-1 code 'no' is mapped to language name 'Norwegian Bokmål' by Extention:CLDR.~~

−

~~Returns the language name~~ and ~~associated ISO639-1 code~~. ~~Because case of the source may be incorrect or different from the case that Wikimedia~~

+

Searches through args in sequential order to find |lastn= and |firstn= parameters

−

~~uses, the name comparisons~~ are ~~done~~ in ~~lower case and when a match is~~ found, the ~~Wikimedia version (assumed to be correct) is returned along~~

+

(or their aliases), and their matching link and mask parameters. Stops searching

−

~~with the code. When there~~ is ~~no match, we return the original language name string~~.

+

when both |lastn= and |firstn= are not found in args after two sequential attempts:

+

+

search is done.

−

mw.~~language.fetchLanguageNames() will return a list of languages that aren~~'~~t part of ISO639-1. Names that aren~~'~~t ISO639-1 but that are included~~

+

This function emits an error message when there is a |firstn= without a matching

−

in the list ~~will be found if that name is provided in the~~ |~~language~~= ~~parameter. For example, if~~ |~~language~~=~~Samaritan Aramaic, that name will be~~

+

|lastn=. When there are 'holes' in the list of last names, |last1= and |last3=

−

~~found with the associated code 'sam'~~, ~~not~~ an ~~ISO639-1 code~~. ~~When names are found and the associated code~~ is not ~~two characters, this function~~

+

are present but |last2= is missing, an error message is emitted. |lastn= is not

−

~~returns only the Wikimedia language name~~.

+

required to have a matching |firstn=.

−

~~Adapted~~ from ~~code taken~~ from Module:~~Check ISO 639-1~~.

+

When an author or editor parameter contains some form of 'et al.', the 'et al.'

+

is stripped from the parameter and a flag (etal) returned that will cause list_people()

+

to add the static 'et al.' text from Module:Citation/CS1/Configuration. This keeps

+

'et al.' out of the template's metadata. When this occurs, an error is emitted.

]]

−

local function ~~get_iso639_code~~ (~~lang~~)

+

local function extract_names(args, list_name)

−

if '~~norwegian' =~~= ~~lang:lower~~() ~~then~~ -- ~~special case related~~ to ~~Wikimedia remap~~ of ~~code~~ 'no' at ~~Extension:CLDR~~

+

local names = {}; -- table of names

−

~~return~~ '~~Norwegian~~', 'no'; -- ~~Make sure rendered version is properly capitalized~~

+

local last; -- individual name components

−

~~end~~

+

local first;

+

local link;

+

local mask;

+

local i = 1; -- loop counter/indexer

+

local n = 1; -- output table indexer

+

local count = 0; -- used to count the number of times we haven't found a |last= (or alias for authors, |editor-last or alias for editors)

+

local etal = false; -- return value set to true when we find some form of et al. in an author parameter

+

local last_alias, first_alias, link_alias; -- selected parameter aliases used in error messaging

+

while true do

+

last, last_alias = utilities.select_one ( args, cfg.aliases[list_name .. '-Last'], 'err_redundant_parameters', i ); -- search through args for name components beginning at 1

+

first, first_alias = utilities.select_one ( args, cfg.aliases[list_name .. '-First'], 'err_redundant_parameters', i );

+

link, link_alias = utilities.select_one ( args, cfg.aliases[list_name .. '-Link'], 'err_redundant_parameters', i );

+

mask = utilities.select_one ( args, cfg.aliases[list_name .. '-Mask'], 'err_redundant_parameters', i );

−

~~local languages~~ = ~~mw.~~language.~~fetchLanguageNames~~('en', ~~'all'~~) -- ~~get a list of~~ language ~~names known to Wikimedia~~

+

if last then -- error check |lastn= alias for unknown interwiki link prefix; done here because this is where we have the parameter name

−

-- ('~~all~~' ~~is required for North Ndebele~~, ~~South Ndebele~~, and ~~Ojibwa~~)

+

local project, language = interwiki_prefixen_get (last, true); -- true because we expect interwiki links in |lastn= to be wikilinked

−

local ~~langlc~~ = ~~mw.ustring.lower~~(~~lang~~); -- ~~lower case version for comparisons~~

+

if nil == project and nil == language then -- when both are nil

−

+

utilities.set_message ('err_bad_paramlink', last_alias); -- not known, emit an error message -- TODO: err_bad_interwiki?

−

~~for code~~, name ~~in pairs~~(~~languages~~) do -- ~~scan~~ the list ~~to see if we~~ can ~~find our language~~

+

last = utilities.remove_wiki_link (last); -- remove wikilink markup; show display value only

−

~~if langlc =~~= ~~mw.ustring.lower~~(~~name~~) ~~then~~

+

end

−

if ~~2 ~~~= ~~code:len~~() ~~then~~ -- ~~ISO639~~-~~1 codes~~ only

+

end

−

~~return name~~; -- ~~so return~~ the name ~~but not the code~~

+

if link then -- error check |linkn= alias for unknown interwiki link prefix

+

local project, language = interwiki_prefixen_get (link, false); -- false because wiki links in |author-linkn= is an error

+

if nil == project and nil == language then -- when both are nil

+

utilities.set_message ('err_bad_paramlink', link_alias); -- not known, emit an error message -- TODO: err_bad_interwiki?

+

link = nil; -- unset so we don't link

+

link_alias = nil;

+

end

+

end

+

last, etal = name_has_etal (last, etal, false, last_alias); -- find and remove variations on et al.

+

first, etal = name_has_etal (first, etal, false, first_alias); -- find and remove variations on et al.

+

last, first = name_checks (last, first, list_name, last_alias, first_alias); -- multiple names, extraneous annotation, etc. checks

+

if first and not last then -- if there is a firstn without a matching lastn

+

local alias = first_alias:find ('given', 1, true) and 'given' or 'first'; -- get first or given form of the alias

+

utilities.set_message ('err_first_missing_last', {

+

first_alias, -- param name of alias missing its mate

+

first_alias:gsub (alias, {['first'] = 'last', ['given'] = 'surname'}), -- make param name appropriate to the alias form

+

}); -- add this error message

+

elseif not first and not last then -- if both firstn and lastn aren't found, are we done?

+

count = count + 1; -- number of times we haven't found last and first

+

if 2 <= count then -- two missing names and we give up

+

break; -- normal exit or there is a two-name hole in the list; can't tell which

+

end

+

else -- we have last with or without a first

+

local result;

+

link = link_title_ok (link, link_alias, last, last_alias); -- check for improper wiki-markup

+

if first then

+

link = link_title_ok (link, link_alias, first, first_alias); -- check for improper wiki-markup

+

end

+

names[n] = {last = last, first = first, link = link, mask = mask, corporate = false}; -- add this name to our names list (corporate for |vauthors= only)

+

n = n + 1; -- point to next location in the names table

+

if 1 == count then -- if the previous name was missing

+

utilities.set_message ('err_missing_name', {list_name:match ("(%w+)List"):lower(), i - 1}); -- add this error message

end

−

~~return name, code~~; -- ~~found it~~, ~~return name to ensure proper capitalization and the ISO639-1 code~~

+

count = 0; -- reset the counter, we're looking for two consecutive missing names

end

+

i = i + 1; -- point to next args location

end

−

return ~~lang~~; -- ~~not valid language;~~ return ~~language in original case~~ and ~~nil for ISO639-1 code~~

+

return names, etal; -- all done, return our list of names and the etal flag

end

−

~~--[[--------------------------< L A N G U A G E _ P A R A M E T E R >------------------------------------------~~

−

~~Get language name from ISO639~~-~~1 code value provided. If a code is valid use the returned name; if not, then use the value that was provided with the language parameter.~~

+

--[[--------------------------< N A M E _ T A G _ G E T >------------------------------------------------------

−

~~There is an exception. There are three ISO639-1 codes for Norewegian~~ language ~~variants. There are two official variants: Norwegian Bokmål (code 'nb')~~ and

+

attempt to decode |language=<lang_param> and return language name and matching tag; nil else.

−

~~Norwegian Nynorsk (code 'nn'). The third, code 'no', is defined by ISO639-1 as 'Norwegian' though in Norway this is pretty much meaningless. However, it appears~~

−

~~that on enwiki, editors are for the most part unaware of the nb~~ and ~~nn variants (compare page counts for these variants at Category:Articles with non-English-language external links~~.

−

~~Because Norwegian Bokmål is the most common language variant, Media wiki has been modified to return Norwegian Bokmål~~ for ~~ISO639-1 code 'no'~~. ~~Here we undo that and~~

+

This function looks for:

−

~~return 'Norwegian'~~ when ~~editors use |language=no~~. ~~We presume that editors don't know about~~ the ~~variants or can't descriminate between them~~.

+

<lang_param> as a tag in cfg.lang_tag_remap{}

+

<lang_param> as a name in cfg.lang_name_remap{}

+

<lang_param> as a name in cfg.mw_languages_by_name_t

+

<lang_param> as a tag in cfg.mw_languages_by_tag_t

+

when those fail, presume that <lang_param> is an IETF-like tag that MediaWiki does not recognize. Strip all

+

script, region, variant, whatever subtags from <lang_param> to leave just a two or three character language tag

+

and look for the new <lang_param> in cfg.mw_languages_by_tag_t{}

−

~~See Help talk:Citation Style_1#An ISO 639-1 language~~ name ~~test~~

+

on success, returns name (in properly capitalized form) and matching tag (in lowercase); on failure returns nil

−

~~When |language= contains a valid ISO639-1 code, the page is assigned to the category for that code: Category:Norwegian-language sources (no) if~~

+

]]

−

~~the page is a mainspace page and the ISO639-1 code is not 'en'. Similarly, if the parameter is |language=Norwegian, it will be categorized in the same way.~~

−

~~This~~ function ~~supports multiple languages in the form |language~~=~~nb, French, th where~~ the ~~language names or codes are separated from each other by commas.~~

+

local function name_tag_get (lang_param)

+

local lang_param_lc = mw.ustring.lower (lang_param); -- use lowercase as an index into the various tables

+

local name;

+

local tag;

−

]]

+

name = cfg.lang_tag_remap[lang_param_lc]; -- assume <lang_param_lc> is a tag; attempt to get remapped language name

+

if name then -- when <name>, <lang_param> is a tag for a remapped language name

+

if cfg.lang_name_remap[name:lower()][2] ~= lang_param_lc then

+

utilities.set_message ('maint_unknown_lang'); -- add maint category if not already added

+

return name, cfg.lang_name_remap[name:lower()][2]; -- so return name and tag from lang_name_remap[name]; special case to xlate sr-ec and sr-el to sr-cyrl and sr-latn

+

end

+

return name, lang_param_lc; -- so return <name> from remap and <lang_param_lc>

+

end

−

~~local function language_parameter~~ (~~lang, namespace~~)

+

tag = lang_param_lc:match ('^(%a%a%a?)%-.*'); -- still assuming that <lang_param_lc> is a tag; strip script, region, variant subtags

−

~~local code~~; -- ~~the ISO639-1 two character code~~

+

name = cfg.lang_tag_remap[tag]; -- attempt to get remapped language name with language subtag only

−

~~local~~ name; -- ~~the~~ language name

+

if name then -- when <name>, <tag> is a tag for a remapped language name

−

~~local language_list = {};~~ -- ~~table of~~ language ~~names to be rendered~~

+

return name, tag; -- so return <name> from remap and <tag>

−

~~local names_table = {}~~; -- ~~table made~~ from ~~the value assigned~~ to |language=

+

end

−

~~local unrec_cat~~ = ~~false~~ -- ~~flag so~~ that ~~we only add unrecognized category once~~

+

if cfg.lang_name_remap[lang_param_lc] then -- not a remapped tag, assume <lang_param_lc> is a name; attempt to get remapped language tag

+

return cfg.lang_name_remap[lang_param_lc][1], cfg.lang_name_remap[lang_param_lc][2]; -- for this <lang_param_lc>, return a (possibly) new name and appropriate tag

+

end

+

name = cfg.mw_languages_by_tag_t[lang_param_lc]; -- assume that <lang_param_lc> is a tag; attempt to get its matching language name

−

~~names_table = mw.text.split (lang~~, ~~'%s*,%s*')~~; -- ~~names should be~~ a ~~comma separated list~~

+

if name then

+

return name, lang_param_lc; -- <lang_param_lc> is a tag so return it and <name>

+

end

−

~~for _, lang in ipairs (names_table) do~~ -- ~~reuse lang~~

+

tag = cfg.mw_languages_by_name_t[lang_param_lc]; -- assume that <lang_param_lc> is a language name; attempt to get its matching tag

−

~~if 0 == namespace and (('en' == lang:lower()) or ('english' == lang:lower())) then~~

−

~~add_maint_cat ('english')~~;

−

~~end~~

−

if ~~2 == lang:len()~~ then ~~-- ISO639-1 language code are 2 characters (fetchLanguageName also supports 3 character codes)~~

+

if tag then

−

~~name = mw~~.~~language.fetchLanguageName( lang:lower()~~, ~~"en" )~~; -- ~~get ISO 639-1 language name if Language~~ is a ~~proper code~~

+

return cfg.mw_languages_by_tag_t[tag], tag; -- <lang_param_lc> is a name so return the name from the table and <tag>

−

end

+

end

−

+

−

~~if is_set (name) then -- if Language specified a valid ISO639-1 code~~

+

tag = lang_param_lc:match ('^(%a%a%a?)%-.*'); -- is <lang_param_lc> an IETF-like tag that MediaWiki doesn't recognize? <tag> gets the language subtag; nil else

−

~~code~~ = ~~lang~~:~~lower~~(); -~~- save it~~

+

−

~~else~~

+

if tag then

−

~~name, code = get_iso639_code (lang~~); -- ~~attempt to get code from name (assign name here so~~ that ~~we are sure of proper capitalization)~~

+

name = cfg.mw_languages_by_tag_t[tag]; -- attempt to get a language name using the shortened <tag>

−

~~end~~

+

if name then

−

+

return name, tag; -- <lang_param_lc> is an unrecognized IETF-like tag so return <name> and language subtag

−

if ~~is_set (code)~~ then

−

~~if 'no' == code then~~ name = ~~'Norwegian' end~~; -- ~~override wikimedia when code is 'no'~~

−

~~if 0 == namespace and 'en' ~= code then -- is this page main / article space and English not the~~ language?

−

~~add_prop_cat ('foreign_lang_source', {~~name~~, code})~~

−

~~end~~

−

~~elseif false == unrec_cat~~ then

−

~~unrec_cat = true~~; -- ~~only add this category once~~

−

~~add_maint_cat (unknown_lang);~~

end

−

~~table.insert (language_list, name);~~

−

~~name = ''; -- so we can reuse it~~

−

~~end~~

−

~~code = #language_list -- reuse code as number of languages in the list~~

−

~~if 2 >= code then~~

−

~~name = table.concat (language_list, ' and ') -- insert '<space>and<space>' between two language names~~

−

~~elseif 2 < code then~~

−

~~language_list[code] = 'and ' .. language_list[code]; -- prepend last name with 'and<space>'~~

−

~~name = table.concat (language_list, ', ') -- and concatenate with '<comma><space>' separators~~

end

−

~~return (" " .. wrap_msg ('language', name)); -- wrap with '(in ...)'~~

end

−

~~--[[--------------------------< S E T _ C S 1 _ S T Y L E >----------------------------------------------------~~

−

~~Set style settings for CS1 citation templates. Returns separator and postscript settings~~

+

--[[-------------------< L A N G U A G E _ P A R A M E T E R >------------------

−

]]

+

Gets language name from a provided two- or three-character ISO 639 code. If a code

+

is recognized by MediaWiki, use the returned name; if not, then use the value that

+

was provided with the language parameter.

−

~~local function set_cs1_style~~ (ps)

+

When |language= contains a recognized language (either code or name), the page is

−

~~if not is_set~~ (ps) ~~then~~ -~~- unless explicitely set~~ to ~~something~~

+

assigned to the category for that code: Category:Norwegian-language sources (no).

−

~~ps =~~ '.'~~; -~~- ~~terminate the rendered citation with a period~~

+

For valid three-character code languages, the page is assigned to the single category

−

~~end~~

+

for '639-2' codes: Category:CS1 ISO 639-2 language sources.

−

~~return '~~.~~', ps; -- separator is a full stop~~

−

~~end~~

−

--~~[[--------------------------< S E T _ C S 2 _ S T Y L E >----------------------------------------------------~~

+

Languages that are the same as the local wiki are not categorized. MediaWiki does

+

not recognize three-character equivalents of two-character codes: code 'ar' is

+

recognized but code 'ara' is not.

−

~~Set style settings for CS2 citation templates. Returns separator~~, ~~postscript~~, ~~ref settings~~

+

This function supports multiple languages in the form |language=nb, French, th

+

where the language names or codes are separated from each other by commas with

+

optional space characters.

]]

−

local function ~~set_cs2_style~~ (ps, ~~ref~~)

+

local function language_parameter (lang)

−

if ~~not~~ is_set (ps) then -- if |~~postscript~~= has not ~~been set~~, ~~set cs2 default~~

+

local tag; -- some form of IETF-like language tag; language subtag with optional region, sript, vatiant, etc subtags

−

ps = ''; -- ~~make sure~~ it ~~isn't nil~~

+

local lang_subtag; -- ve populates |language= with mostly unecessary region subtags the MediaWiki does not recognize; this is the base language subtag

−

end

+

local name; -- the language name

−

if ~~not is_set~~ (~~ref~~) then -- if |~~ref~~= ~~is not set~~

+

local language_list = {}; -- table of language names to be rendered

−

~~ref = "harv"~~; -- ~~set default |ref=harv~~

+

local names_t = {}; -- table made from the value assigned to |language=

+

local this_wiki_name = mw.language.fetchLanguageName (cfg.this_wiki_code, cfg.this_wiki_code); -- get this wiki's language name

+

names_t = mw.text.split (lang, '%s*,%s*'); -- names should be a comma separated list

+

for _, lang in ipairs (names_t) do -- reuse lang here because we don't yet know if lang is a language name or a language tag

+

name, tag = name_tag_get (lang); -- attempt to get name/tag pair for <lang>; <name> has proper capitalization; <tag> is lowercase

+

if utilities.is_set (tag) then

+

lang_subtag = tag:gsub ('^(%a%a%a?)%-.*', '%1'); -- for categorization, strip any IETF-like tags from language tag

+

if cfg.this_wiki_code ~= lang_subtag then -- when the language is not the same as this wiki's language

+

if 2 == lang_subtag:len() then -- and is a two-character tag

+

utilities.add_prop_cat ('foreign-lang-source', {name, tag}, lang_subtag); -- categorize it; tag appended to allow for multiple language categorization

+

else -- or is a recognized language (but has a three-character tag)

+

utilities.add_prop_cat ('foreign-lang-source-2', {lang_subtag}, lang_subtag); -- categorize it differently TODO: support multiple three-character tag categories per cs1|2 template?

+

end

+

elseif cfg.local_lang_cat_enable then -- when the language and this wiki's language are the same and categorization is enabled

+

utilities.add_prop_cat ('local-lang-source', {name, lang_subtag}); -- categorize it

+

end

+

else

+

name = lang; -- return whatever <lang> has so that we show something

+

utilities.set_message ('maint_unknown_lang'); -- add maint category if not already added

+

end

+

table.insert (language_list, name);

+

name = ''; -- so we can reuse it

+

end

+

name = utilities.make_sep_list (#language_list, language_list);

+

if (1 == #language_list) and (lang_subtag == cfg.this_wiki_code) then -- when only one language, find lang name in this wiki lang name; for |language=en-us, 'English' in 'American English'

+

return ''; -- if one language and that language is this wiki's return an empty string (no annotation)

end

−

return ',', ~~ps, ref~~; -- ~~separator is a comma~~

+

return (" " .. wrap_msg ('language', name)); -- otherwise wrap with '(in ...)'

+

--[[ TODO: should only return blank or name rather than full list

+

so we can clean up the bunched parenthetical elements Language, Type, Format

+

]]

end

−

~~--[[--------------------------< G E T _ S E T T I N G S _ F R O M _ C I T E _ C L A S S >----------------------~~

−

~~When |~~mode~~= is not set~~ or ~~when its value is invalid~~, ~~use config~~.~~CitationClass~~ and ~~parameter values to establish~~

+

--[[-----------------------< S E T _ C S _ S T Y L E >--------------------------

−

~~rendered style~~.

+

Gets the default CS style configuration for the given mode.

+

Returns default separator and either postscript as passed in or the default.

+

In CS1, the default postscript and separator are '.'.

+

In CS2, the default postscript is the empty string and the default separator is ','.

]]

−

local function ~~get_settings_from_cite_class~~ (ps, ~~ref, cite_class~~)

+

local function set_cs_style (postscript, mode)

−

~~local sep;~~

+

if utilities.is_set(postscript) then

−

if (~~cite_class == "citation"~~) then -- for ~~citation templates (CS2)~~

+

-- emit a maintenance message if user postscript is the default cs1 postscript

−

~~sep, ps, ref~~ = ~~set_cs2_style~~ (~~ps, ref~~);

+

-- we catch the opposite case for cs2 in set_style

−

else ~~-- not a citation template so CS1~~

+

if mode == 'cs1' and postscript == cfg.presentation['ps_' .. mode] then

−

~~sep, ps~~ = ~~set_cs1_style (ps)~~;

+

utilities.set_message ('maint_postscript');

+

end

+

else

+

postscript = cfg.presentation['ps_' .. mode];

end

+

return cfg.presentation['sep_' .. mode], postscript;

+

end

−

~~return sep, ps, ref -- return them all~~

−

~~end~~

−

--[[--------------------------< S E T _ S T Y L E >~~-------------------------------~~-----------------------------

+

--[[--------------------------< S E T _ S T Y L E >-----------------------------

−

~~Establish basic style settings to be used when rendering~~ the ~~citation~~. ~~Uses~~ |mode= ~~if set~~ and ~~valid or uses~~

+

Sets the separator and postscript styles. Checks the |mode= first and the

−

~~config~~.~~CitationClass from~~ the ~~template's #invoke: to establish style~~.

+

#invoke CitationClass second. Removes the postscript if postscript == none.

]]

−

local function set_style (mode, ~~ps, ref~~, cite_class)

+

local function set_style (mode, postscript, cite_class)

local sep;

−

if 'cs2' == mode then ~~-- if this template is to be rendered in CS2 (citation) style~~

+

if 'cs2' == mode then

−

sep, ~~ps, ref~~ = ~~set_cs2_style~~ (ps, ~~ref~~);

+

sep, postscript = set_cs_style (postscript, 'cs2');

−

elseif 'cs1' == mode then ~~-- if this template is to be rendered in CS1~~ (~~cite xxx~~) ~~style~~

+

elseif 'cs1' == mode then

−

sep, ps = ~~set_cs1_style~~ (ps);

+

sep, postscript = set_cs_style (postscript, 'cs1');

−

else -- ~~anything but~~ cs1 ~~or cs2~~

+

elseif 'citation' == cite_class then

−

if ~~is_set (~~mode) then

+

sep, postscript = set_cs_style (postscript, 'cs2');

−

~~table.insert( z~~.~~message_tail, { set_error~~( '~~invalid_param_val', {~~'~~mode', mode}, true ) }~~ ); ~~-- add error message~~

+

else

+

sep, postscript = set_cs_style (postscript, 'cs1');

+

end

+

if cfg.keywords_xlate[postscript:lower()] == 'none' then

+

-- emit a maintenance message if user postscript is the default cs2 postscript

+

-- we catch the opposite case for cs1 in set_cs_style

+

if 'cs2' == mode or 'citation' == cite_class then

+

utilities.set_message ('maint_postscript');

end

−

~~sep, ps, ref = get_settings_from_cite_class (ps, ref, cite_class); -- get settings based on the template's CitationClass~~

+

postscript = '';

−

~~end~~

−

~~if 'none' == ps:lower() then -- if assigned value is 'none' then~~

−

ps = ''; ~~-- set to empty string~~

end

−

return sep, ~~ps, ref~~

+

return sep, postscript

end

−

~~--[=[-------------------------------------------------------------------------------------------~~

−

~~Determines if a url has the file extension is one of the pdf file extensions used by~~ [[~~MediaWiki:Common.css]] when~~

+

--[=[------------------------------------------------------------

−

~~applying the pdf icon to external links.~~

−

returns true if file extension is one of the recognized ~~extension~~, else false

+

Determines if a URL has the file extension that is one of the PDF file extensions

+

used by [[MediaWiki:Common.css]] when applying the PDF icon to external links.

+

returns true if file extension is one of the recognized extensions, else false

]=]

local function is_pdf (url)

−

return url:match ('%.pdf[%?#]?') or url:match ('%.PDF[%?#]?');

+

return url:match ('%.pdf$') or url:match ('%.PDF$') or

+

url:match ('%.pdf[%?#]') or url:match ('%.PDF[%?#]') or

+

url:match ('%.PDF&#035') or url:match ('%.pdf&#035');

end

−

~~--[[--------------------------< S T Y L E _ F O R M A T >------------------------------------------------------~~

−

Applies ~~css~~ style to |format=, |chapter-format=, etc. Also emits an error message if the format parameter does

+

--[[--------------------------< S T Y L E _ F O R M A T >-----------------------

−

not have a matching ~~url~~ parameter. If the format parameter is not set and the ~~url~~ contains a file extension that

+

−

is recognized as a ~~pdf~~ document by MediaWiki's commons.css, this code will set the format parameter to (PDF) with

+

Applies CSS style to |format=, |chapter-format=, etc. Also emits an error message

+

if the format parameter does not have a matching URL parameter. If the format parameter

+

is not set and the URL contains a file extension that is recognized as a PDF document

+

by MediaWiki's commons.css, this code will set the format parameter to (PDF) with

the appropriate styling.

Строка 1851: Строка 1884:

local function style_format (format, url, fmt_param, url_param)

−

if is_set (format) then

+

if utilities.is_set (format) then

−

format = wrap_style ('format', format~~:upper()~~); -- ~~force upper case,~~ add leading space, ~~parenthases~~, resize

+

format = utilities.wrap_style ('format', format); -- add leading space, parentheses, resize

−

if not is_set (url) then

+

if not utilities.is_set (url) then

−

~~format = format .~~. ~~set_error~~( '~~format_missing_url~~', {fmt_param, url_param} ); -- add an error message

+

utilities.set_message ('err_format_missing_url', {fmt_param, url_param}); -- add an error message

end

−

elseif is_pdf (url) then -- format is not set so if ~~url~~ is a ~~pdf~~ file then

+

elseif is_pdf (url) then -- format is not set so if URL is a PDF file then

−

format = wrap_style ('format', 'PDF'); -- set format to ~~pdf~~

+

format = utilities.wrap_style ('format', 'PDF'); -- set format to PDF

else

format = ''; -- empty string for concatenation

Строка 1864: Строка 1897:

end

−

~~--[[--------------------------< G E T _ D I S P L A Y _ A U T H O R S _ E D I T O R S >------------------------~~

−

~~Returns a number that may or may not limit the length of the author or editor name lists.~~

+

--[[---------------------< G E T _ D I S P L A Y _ N A M E S >------------------

−

~~When the value assigned to |display-authors= is~~ a number ~~greater than or equal to zero, return~~ the number and

+

Returns a number that defines the number of names displayed for author and editor

−

~~the previous state of the 'etal'~~ flag ~~(false by default but may have been set~~ to ~~true if~~ the name list ~~contains~~

+

name lists and a Boolean flag to indicate when et al. should be appended to the name list.

−

~~some variant of the text 'et al.')~~.

−

When the value assigned to |display-~~authors~~= is the keyword 'etal', return a number that is one greater than the

+

When the value assigned to |display-xxxxors= is a number greater than or equal to zero,

−

number of authors in the list and set the 'etal' flag true. This will cause the list_people() to display all of

+

return the number and the previous state of the 'etal' flag (false by default

−

the names in the name list followed by 'et al.'

+

but may have been set to true if the name list contains some variant of the text 'et al.').

+

When the value assigned to |display-xxxxors= is the keyword 'etal', return a number

+

that is one greater than the number of authors in the list and set the 'etal' flag true.

+

This will cause the list_people() to display all of the names in the name list followed by 'et al.'

In all other cases, returns nil and the previous state of the 'etal' flag.

+

inputs:

+

max: A['DisplayAuthors'] or A['DisplayEditors'], etc; a number or some flavor of etal

+

count: #a or #e

+

list_name: 'authors' or 'editors'

+

etal: author_etal or editor_etal

+

This function sets an error message when |display-xxxxors= value greater than or equal to number of names but

+

not when <max> comes from {{cs1 config}} global settings. When using global settings, <param> is set to the

+

keyword 'cs1 config' which is used to supress the normal error. Error is suppressed because it is to be expected

+

that some citations in an article will have the same or fewer names that the limit specified in {{cs1 config}}.

]]

−

local function ~~get_display_authors_editors~~ (max, count, list_name, etal)

+

local function get_display_names (max, count, list_name, etal, param)

−

if is_set (max) then

+

if utilities.is_set (max) then

if 'etal' == max:lower():gsub("[ '%.]", '') then -- the :gsub() portion makes 'etal' from a variety of 'et al.' spellings and stylings

max = count + 1; -- number of authors + 1 so display all author name plus et al.

Строка 1887: Строка 1933:

elseif max:match ('^%d+$') then -- if is a string of numbers

max = tonumber (max); -- make it a number

−

if max >= count and '~~authors~~' =~~= list_name~~ then -- ~~AUTHORS ONLY -- if~~ |display-xxxxors= value greater than or equal to number of ~~authors/editors~~

+

if (max >= count) and ('cs1 config' ~= param) then -- error when local |display-xxxxors= value greater than or equal to number of names; not an error when using global setting

−

~~add_maint_cat~~ ('~~disp_auth_ed~~', ~~list_name~~);

+

utilities.set_message ('err_disp_name', {param, max}); -- add error message

+

max = nil;

end

else -- not a valid keyword or number

−

~~table~~.~~insert( z.message_tail, { set_error~~( '~~invalid_param_val~~', {~~'display-' .. list_name~~, max~~}, true )~~ } ); -- add error message

+

utilities.set_message ('err_disp_name', {param, max}); -- add error message

−

max = nil; -- unset

+

max = nil; -- unset; as if |display-xxxxors= had not been set

end

−

~~elseif 'authors' == list_name then -- AUTHORS ONLY need to clear implicit et al category~~

−

~~max = count + 1; -- number of authors + 1~~

end

Строка 1901: Строка 1946:

end

−

~~--[[--------------------------< C I T A T I O N 0 >------------------------------------------------------------~~

−

~~This is~~ the ~~main function doing~~ the ~~majority~~ of ~~the citation~~

+

--[[----------< E X T R A _ T E X T _ I N _ P A G E _ C H E C K >---------------

−

~~formatting~~.

+

Adds error if |page=, |pages=, |quote-page=, |quote-pages= has what appears to be

+

some form of p. or pp. abbreviation in the first characters of the parameter content.

+

check page for extraneous p, p., pp, pp., pg, pg. at start of parameter value:

+

good pattern: '^P[^%.P%l]' matches when page begins PX or P# but not Px

+

where x and X are letters and # is a digit

+

bad pattern: '^[Pp][PpGg]' matches when page begins pp, pP, Pp, PP, pg, pG, Pg, PG

]]

−

local function ~~citation0~~( ~~config~~, ~~args~~)

+

local function extra_text_in_page_check (val, name)

−

--[[

+

if not val:match (cfg.vol_iss_pg_patterns.good_ppattern) then

−

~~Load Input Parameters~~

+

for _, pattern in ipairs (cfg.vol_iss_pg_patterns.bad_ppatterns) do -- spin through the selected sequence table of patterns

−

~~The argument_wrapper facilitates~~ the ~~mapping~~ of ~~multiple~~

+

if val:match (pattern) then -- when a match, error so

−

~~aliases~~ to ~~single internal variable.~~

+

utilities.set_message ('err_extra_text_pages', name); -- add error message

−

]]

+

return; -- and done

−

~~local A = argument_wrapper( args );~~

+

end

+

end

+

end

+

end

+

--[[--------------------------< E X T R A _ T E X T _ I N _ V O L _ I S S _ C H E C K >------------------------

+

Adds error if |volume= or |issue= has what appears to be some form of redundant 'type' indicator.

+

For |volume=:

+

'V.', or 'Vol.' (with or without the dot) abbreviations or 'Volume' in the first characters of the parameter

+

content (all case insensitive). 'V' and 'v' (without the dot) are presumed to be roman numerals so

+

are allowed.

−

~~local i~~

+

For |issue=:

−

~~local PPrefix = A[~~'~~PPrefix~~']

+

'No.', 'I.', 'Iss.' (with or without the dot) abbreviations, or 'Issue' in the first characters of the

−

~~local PPPrefix = A[~~'~~PPPrefix~~']

+

parameter content (all case insensitive).

−

~~if is_set~~( A['~~NoPP~~'] ) ~~then PPPrefix~~ = ~~"" PPrefix = "" end~~

+

Single character values ('v', 'i', 'n') allowed when not followed by separator character ('.', ':', '=', or

+

whitespace character) – param values are trimmed of whitespace by MediaWiki before delivered to the module.

−

~~-- Pick out the relevant fields from the arguments. Different citation templates~~

+

<val> is |volume= or |issue= parameter value

−

~~-- define different field names~~ for ~~the same underlying things.~~

+

<name> is |volume= or |issue= parameter name for error message

−

~~local Authors = A[~~'~~Authors~~'];

+

<selector> is 'v' for |volume=, 'i' for |issue=

−

~~local author_etal;~~

+

−

~~local a, author_etal~~ = ~~extract_names( args~~, '~~AuthorList~~' );

+

sets error message on failure; returns nothing

−

~~local Coauthors = A['Coauthors'~~];

+

]]

−

~~local Others = A['Others'~~];

−

~~local Editors = A['Editors'];~~

−

~~local editor_etal;~~

−

~~local e, editor_etal = extract_names( args, 'EditorList' );~~

−

local ~~NameListFormat = A['NameListFormat']; -- replaces |author-format= and |editor-format=~~

+

local function extra_text_in_vol_iss_check (val, name, selector)

−

if is_set (~~NameListFormat) and ('vanc' ~= NameListFormat~~) then ~~-- only accepted value for this parameter is 'vanc'~~

+

if not utilities.is_set (val) then

−

~~table.insert( z.message_tail, { set_error( 'invalid_param_val', {'name-list-format', NameListFormat}, true ) } ); -- not vanc so add error message~~

+

return;

−

~~NameListFormat = ''~~; ~~-- set to empty string~~

end

+

local patterns = 'v' == selector and cfg.vol_iss_pg_patterns.vpatterns or cfg.vol_iss_pg_patterns.ipatterns;

−

local ~~Year~~ = A['~~Year~~'];

+

local handler = 'v' == selector and 'err_extra_text_volume' or 'err_extra_text_issue';

−

~~local PublicationDate~~ = A['~~PublicationDate~~'];

+

val = val:lower(); -- force parameter value to lower case

−

~~local OrigYear~~ = ~~A['OrigYear']~~;

+

for _, pattern in ipairs (patterns) do -- spin through the selected sequence table of patterns

−

~~local Date = A['Date']~~;

+

if val:match (pattern) then -- when a match, error so

−

~~local LayDate~~ = A[~~'LayDate'];~~

+

utilities.set_message (handler, name); -- add error message

−

------------------------------------------------- ~~Get title data~~

+

return; -- and done

−

~~local Title = A['Title'];~~

+

end

−

~~local ScriptTitle~~ = ~~A['ScriptTitle'];~~

+

end

−

~~local BookTitle~~ = ~~A['BookTitle'];~~

+

end

−

~~local Conference = A['Conference'];~~

+

−

~~local TransTitle = A['TransTitle'];~~

+

−

~~local TitleNote = A['TitleNote'];~~

+

--[=[-------------------------< G E T _ V _ N A M E _ T A B L E >----------------------------------------------

−

~~local TitleLink = A['TitleLink'];~~

+

−

~~local Chapter = A['Chapter']~~;

+

split apart a |vauthors= or |veditors= parameter. This function allows for corporate names, wrapped in doubled

−

~~local ChapterLink = A['ChapterLink']; -- deprecated~~

+

parentheses to also have commas; in the old version of the code, the doubled parentheses were included in the

−

~~local TransChapter = A['TransChapter'];~~

+

rendered citation and in the metadata. Individual author names may be wikilinked

−

~~local TitleType~~ = A[~~'TitleType'];~~

+

−

~~local Degree = A~~[~~'Degree'~~];

+

|vauthors=Jones AB, [[E. B. White|White EB]], ((Black, Brown, and Co.))

−

~~local Docket = A['Docket'~~];

−

~~local ArchiveFormat = A['ArchiveFormat'];~~

−

~~local ArchiveURL = A['ArchiveURL'];~~

−

~~local URL = A['URL']~~

−

~~local URLorigin = A:ORIGIN~~(~~'URL'); -- get name of parameter that holds URL~~

−

~~local ChapterURL = A['ChapterURL'];~~

−

~~local ChapterURLorigin = A:ORIGIN~~(~~'ChapterURL'~~)~~; -- get name of parameter that holds ChapterURL~~

−

~~local ConferenceFormat = A['ConferenceFormat'];~~

−

~~local ConferenceURL = A['ConferenceURL'];~~

−

~~local ConferenceURLorigin = A:ORIGIN('ConferenceURL'~~)~~; -- get name of parameter that holds ConferenceURL~~

−

~~local Periodical = A['Periodical'];~~

−

~~local Series = A['Series'];~~

+

]=]

−

~~local Volume = A['Volume'];~~

−

~~local Issue = A['Issue'];~~

−

~~local Position = '';~~

−

~~local Page = A['Page'];~~

−

~~local Pages = hyphen_to_dash( A['Pages'~~] );

−

~~local At~~ = ~~A['At'~~];

−

local ~~Edition = A['Edition'];~~

+

local function get_v_name_table (vparam, output_table, output_link_table)

−

local ~~PublicationPlace~~ = ~~A['PublicationPlace']~~

+

local name_table = mw.text.split(vparam, "%s*,%s*"); -- names are separated by commas

−

local ~~Place = A['Place']~~;

+

local wl_type, label, link; -- wl_type not used here; just a placeholder

−

local ~~PublisherName~~ = ~~A['PublisherName']~~;

+

local i = 1;

−

~~local RegistrationRequired = A~~[~~'RegistrationRequired'~~];

+

−

~~local SubscriptionRequired = A~~['~~SubscriptionRequired~~'];

+

while name_table[i] do

−

local ~~Via~~ = A[~~'Via'~~];

+

if name_table[i]:match ('^%(%(.*[^%)][^%)]$') then -- first segment of corporate with one or more commas; this segment has the opening doubled parentheses

−

~~local AccessDate~~ = A[~~'AccessDate'~~];

+

local name = name_table[i];

−

~~local ArchiveDate~~ = A['~~ArchiveDate~~'];

+

i = i + 1; -- bump indexer to next segment

−

~~local Agency = A~~['~~Agency~~'];

+

while name_table[i] do

−

~~local DeadURL~~ = A['~~DeadURL~~']

+

name = name .. ', ' .. name_table[i]; -- concatenate with previous segments

−

~~local Language~~ = A[~~'Language'~~];

+

if name_table[i]:match ('^.*%)%)$') then -- if this table member has the closing doubled parentheses

−

~~local Format = A~~[~~'Format'~~];

+

break; -- and done reassembling so

−

~~local ChapterFormat = A~~[~~'ChapterFormat'~~];

+

end

−

~~local DoiBroken~~ = A[~~'DoiBroken'~~];

+

i = i + 1; -- bump indexer

−

~~local ID = A~~[~~'ID'~~];

+

end

−

~~local ASINTLD~~ = ~~A['ASINTLD']~~;

+

table.insert (output_table, name); -- and add corporate name to the output table

−

~~local IgnoreISBN = A['IgnoreISBN'];~~

+

table.insert (output_link_table, ''); -- no wikilink

−

~~local Embargo = A['Embargo']~~;

+

else

−

~~local Class =~~ A~~['Class'];~~ -- ~~arxiv class identifier~~

+

wl_type, label, link = utilities.is_wikilink (name_table[i]); -- wl_type is: 0, no wl (text in label variable); 1, [[D]]; 2, [[L|D]]

+

table.insert (output_table, label); -- add this name

+

if 1 == wl_type then

+

table.insert (output_link_table, label); -- simple wikilink [[D]]

+

else

+

table.insert (output_link_table, link); -- no wikilink or [[L|D]]; add this link if there is one, else empty string

+

end

+

end

+

i = i + 1;

+

end

+

return output_table;

+

end

+

--[[----------------------------------------------------------

−

~~local ID_list~~ = ~~extract_ids~~( ~~args~~ );

+

This function extracts author / editor names from |vauthors= or |veditors= and finds matching |xxxxor-maskn= and

+

|xxxxor-linkn= in args. It then returns a table of assembled names just as extract_names() does.

−

~~local Quote~~ = ~~A['Quote'];~~

+

Author / editor names in |vauthors= or |veditors= must be in Vancouver system style. Corporate or institutional names

+

may sometimes be required and because such names will often fail the is_good_vanc_name() and other format compliance

+

tests, are wrapped in doubled parentheses ((corporate name)) to suppress the format tests.

−

~~local LayFormat = A['LayFormat'];~~

+

Supports generational suffixes Jr, 2nd, 3rd, 4th–6th.

−

~~local LayURL = A['LayURL'];~~

−

~~local LaySource = A['LaySource'];~~

−

~~local Transcript = A['Transcript'];~~

−

~~local TranscriptFormat = A['TranscriptFormat'];~~

−

~~local TranscriptURL = A['TranscriptURL']~~

−

~~local TranscriptURLorigin = A:ORIGIN('TranscriptURL'); -- get name of parameter that holds TranscriptURL~~

−

~~local LastAuthorAmp = A[~~'~~LastAuthorAmp'];~~

+

This function sets the Vancouver error when a required comma is missing and when there is a space between an author's initials.

−

~~local no_tracking_cats = A['NoTracking'];~~

−

~~--these are used by cite interview~~

+

]]

−

~~local Callsign = A['Callsign'~~];

−

~~local City = A['City'~~];

−

~~local Program = A['Program'];~~

−

--local ~~variables that are not cs1 parameters~~

+

local function parse_vauthors_veditors (args, vparam, list_name)

−

local ~~use_lowercase~~; -- ~~controls capitalization~~ of ~~certain static text~~

+

local names = {}; -- table of names assembled from |vauthors=, |author-maskn=, |author-linkn=

−

local ~~this_page~~ = ~~mw.title.getCurrentTitle()~~; -- ~~also used for COinS and for language~~

+

local v_name_table = {};

−

local ~~anchor_year~~; -- ~~used in the CITEREF identifier~~

+

local v_link_table = {}; -- when name is wikilinked, targets go in this table

−

local ~~COinS_date~~; ~~-- used in the COinS metadata~~

+

local etal = false; -- return value set to true when we find some form of et al. vauthors parameter

+

local last, first, link, mask, suffix;

+

local corporate = false;

−

~~-- set default parameter values defined by |mode~~= ~~parameter. If |mode= is empty or omitted~~, ~~use CitationClass to set these values~~

+

vparam, etal = name_has_etal (vparam, etal, true); -- find and remove variations on et al. do not categorize (do it here because et al. might have a period)

−

~~local sepc~~; -- ~~separator between citation elements for CS1~~ a period~~, for CS2, a comma~~

+

v_name_table = get_v_name_table (vparam, v_name_table, v_link_table); -- names are separated by commas

−

~~local PostScript;~~

−

~~local Ref;~~

−

~~sepc, PostScript, Ref~~ = ~~set_style~~ (~~A['Mode']:lower(), A['PostScript']~~, ~~A['Ref']~~, ~~config.CitationClass~~);

−

~~use_lowercase = ( sepc == ',' );~~ -- ~~used to control capitalization for certain static text~~

−

--~~check this page~~ to ~~see if~~ it ~~is in one of the namespaces that cs1 is not supposed to add to the error categories~~

+

for i, v_name in ipairs(v_name_table) do

−

~~if not is_set~~ (~~no_tracking_cats~~) ~~then~~ -- ~~ignore if we are already not going to categorize~~ this ~~page~~

+

first = ''; -- set to empty string for concatenation and because it may have been set for previous author/editor

−

if ~~in_array (this_page.nsText, cfg.uncategorized_namespaces)~~ then

+

local accept_name;

−

~~no_tracking_cats~~ = "true"; -- ~~set no_tracking_cats~~

+

v_name, accept_name = utilities.has_accept_as_written (v_name); -- remove accept-this-as-written markup when it wraps all of <v_name>

−

~~end~~

+

−

~~for _~~,~~v in ipairs (cfg.uncategorized_subpages~~) ~~do -- cycle through page name patterns~~

+

if accept_name then

−

if ~~this_page.text~~:~~match~~ (v) then -- ~~test page name against each pattern~~

+

last = v_name;

−

~~no_tracking_cats = "true"~~; ~~-- set no_tracking_cats~~

+

corporate = true; -- flag used in list_people()

−

~~break~~; ~~-- bail out if one is found~~

+

elseif string.find(v_name, "%s") then

+

if v_name:find('[;%.]') then -- look for commonly occurring punctuation characters;

+

add_vanc_error (cfg.err_msg_supl.punctuation, i);

end

−

~~end~~

+

local lastfirstTable = {}

−

~~end~~

+

lastfirstTable = mw.text.split(v_name, "%s+")

+

first = table.remove(lastfirstTable); -- removes and returns value of last element in table which should be initials or generational suffix

−

-- ~~check for extra |page~~=~~, |pages~~= ~~or |at~~= ~~parameters~~.

+

if not mw.ustring.match (first, '^%u+$') then -- mw.ustring here so that later we will catch non-Latin characters

−

~~if is_set~~(~~Page~~) ~~then~~

+

suffix = first; -- not initials so assume that whatever we got is a generational suffix

−

if is_set(~~Pages) or is_set(At~~) then

+

first = table.remove(lastfirstTable); -- get what should be the initials from the table

−

~~Page~~ = ~~Page~~ .. ~~" "~~ .. ~~set_error~~('~~extra_pages~~'); -- ~~add error message~~

+

end

−

~~Pages =~~ ''; -- ~~unset the others~~

+

last = table.concat(lastfirstTable, ' ') -- returns a string that is the concatenation of all other names that are not initials and generational suffix

−

At = '';

+

if not utilities.is_set (last) then

+

first = ''; -- unset

+

last = v_name; -- last empty because something wrong with first

+

add_vanc_error (cfg.err_msg_supl.name, i);

+

end

+

if mw.ustring.match (last, '%a+%s+%u+%s+%a+') then

+

add_vanc_error (cfg.err_msg_supl['missing comma'], i); -- matches last II last; the case when a comma is missing

+

end

+

if mw.ustring.match (v_name, ' %u %u$') then -- this test is in the wrong place TODO: move or replace with a more appropriate test

+

add_vanc_error (cfg.err_msg_supl.initials, i); -- matches a space between two initials

+

end

+

else

+

last = v_name; -- last name or single corporate name? Doesn't support multiword corporate names? do we need this?

end

−

~~elseif is_set(Pages) then~~

+

−

if is_set(At) then

+

if utilities.is_set (first) then

−

~~Pages = Pages~~ .. " " .. ~~set_error~~('~~extra_pages~~'); -- ~~add error messages~~

+

if not mw.ustring.match (first, "^%u?%u$") then -- first shall contain one or two upper-case letters, nothing else

−

At = ''; -- unset

+

add_vanc_error (cfg.err_msg_supl.initials, i); -- too many initials; mixed case initials (which may be ok Romanization); hyphenated initials

+

end

+

is_good_vanc_name (last, first, suffix, i); -- check first and last before restoring the suffix which may have a non-Latin digit

+

if utilities.is_set (suffix) then

+

first = first .. ' ' .. suffix; -- if there was a suffix concatenate with the initials

+

suffix = ''; -- unset so we don't add this suffix to all subsequent names

+

end

+

else

+

if not corporate then

+

is_good_vanc_name (last, '', nil, i);

+

end

−

~~end~~

−

~~-- both |publication-place= and |place~~= (~~|location=~~) ~~allowed if different~~

+

link = utilities.select_one ( args, cfg.aliases[list_name .. '-Link'], 'err_redundant_parameters', i ) or v_link_table[i];

−

~~if not is_set~~(~~PublicationPlace~~) ~~and is_set(Place) then~~

+

mask = utilities.select_one ( args, cfg.aliases[list_name .. '-Mask'], 'err_redundant_parameters', i );

−

~~PublicationPlace~~ = ~~Place~~; -- ~~promote |place= (|location=)~~ to ~~|publication-place~~

+

names[i] = {last = last, first = first, link = link, mask = mask, corporate = corporate}; -- add this assembled name to our names list

end

−

+

return names, etal; -- all done, return our list of names

−

~~if PublicationPlace == Place then Place = ''~~; ~~end~~ -- ~~don't need both if they are the same~~

+

end

−

+

−

--[[

+

−

~~Parameter remapping for cite encyclopedia:~~

+

--[[--------------------------< S E L E C T _ A U T H O R _ E D I T O R _ S O U R C E >------------------------

−

~~When~~ the ~~citation has~~ these ~~parameters~~:

+

−

+

Select one of |authors=, |authorn= / |lastn / firstn=, or |vauthors= as the source of the author name list or

−

|~~encyclopedia and~~ |~~article then map~~ |~~encyclopedia to~~ |~~title~~

+

select one of |editorn= / editor-lastn= / |editor-firstn= or |veditors= as the source of the editor name list.

−

~~|encyclopedia then map |encyclopedia~~ to ~~|title~~

+

Only one of these appropriate three will be used. The hierarchy is: |authorn= (and aliases) highest and |authors= lowest;

+

|editorn= (and aliases) highest and |veditors= lowest (support for |editors= withdrawn)

+

When looking for |authorn= / |editorn= parameters, test |xxxxor1= and |xxxxor2= (and all of their aliases); stops after the second

+

test which mimicks the test used in extract_names() when looking for a hole in the author name list. There may be a better

+

way to do this, I just haven't discovered what that way is.

+

Emits an error message when more than one xxxxor name source is provided.

−

~~|trans_title maps to |trans_chapter when |title is re-mapped~~

+

In this function, vxxxxors = vauthors or veditors; xxxxors = authors as appropriate.

−

~~|url maps to |chapterurl when |title is remapped~~

−

~~All other combinations of |encyclopedia, |title, and |article are not modified~~

−

~~TODO: script-title to script-chapter if and when we support script-chapter~~

]]

−

local ~~Encyclopedia~~ = A['~~Encyclopedia~~'];

+

local function select_author_editor_source (vxxxxors, xxxxors, args, list_name)

+

local lastfirst = false;

+

if utilities.select_one ( args, cfg.aliases[list_name .. '-Last'], 'none', 1 ) or -- do this twice in case we have a |first1= without a |last1=; this ...

+

utilities.select_one ( args, cfg.aliases[list_name .. '-First'], 'none', 1 ) or -- ... also catches the case where |first= is used with |vauthors=

+

utilities.select_one ( args, cfg.aliases[list_name .. '-Last'], 'none', 2 ) or

+

utilities.select_one ( args, cfg.aliases[list_name .. '-First'], 'none', 2 ) then

+

lastfirst = true;

+

end

−

if ( ~~config~~.~~CitationClass~~ == ~~"encyclopaedia"~~ ) or ( ~~config~~.~~CitationClass == "citation"~~ and is_set (~~Encyclopedia~~)) ~~then -- test code for citation~~

+

if (utilities.is_set (vxxxxors) and true == lastfirst) or -- these are the three error conditions

−

~~if is_set~~(~~Periodical) then -- Periodical is set when |encyclopedia is set~~

+

(utilities.is_set (vxxxxors) and utilities.is_set (xxxxors)) or

−

if is_set(~~Title~~) ~~then~~

+

(true == lastfirst and utilities.is_set (xxxxors)) then

−

~~if not is_set(Chapter~~) then

+

local err_name;

−

+

if 'AuthorList' == list_name then -- figure out which name should be used in error message

−

~~TransChapter = TransTitle~~;

+

err_name = 'author';

−

~~ChapterURL = URL;~~

+

else

−

~~Title = Periodical;~~

+

err_name = 'editor';

−

~~ChapterFormat = Format;~~

−

~~Periodical =~~ ''~~; -- redundant so unset~~

−

~~TransTitle~~ = ~~''; -- redundant so unset~~

−

~~URL~~ = ~~'';~~ -- ~~redundant so unset~~

−

~~Format~~ = ''; ~~-- redundant so unset~~

−

~~end~~

−

else ~~-- |title not set~~

−

~~Title = Periodical; -- |encyclopedia set and |article set or not set so map |encyclopedia to |title~~

−

~~Periodical~~ = ''; ~~-- redundant so unset~~

end

−

~~end~~

+

utilities.set_message ('err_redundant_parameters', err_name .. '-name-list parameters'); -- add error message

end

−

~~-- Special case for cite techreport.~~

+

if true == lastfirst then return 1 end; -- return a number indicating which author name source to use

−

if ~~(config.CitationClass~~ == ~~"techreport")~~ then -- ~~special case for cite techreport~~

+

if utilities.is_set (vxxxxors) then return 2 end;

−

if is_set(~~Issue~~) then ~~-- cite techreport uses 'number', which other citations aliase to 'issue'~~

+

if utilities.is_set (xxxxors) then return 3 end;

−

if ~~not~~ is_set(ID) then ~~-- can we use ID for the "number"?~~

+

return 1; -- no authors so return 1; this allows missing author name test to run in case there is a first without last

−

~~ID = Issue~~; ~~-- yes, use it~~

+

end

−

~~Issue = ""~~; -- ~~unset Issue~~ so ~~that "number" isn't duplicated~~ in ~~the rendered citation or COinS metadata~~

+

−

~~else~~ -- ~~can~~'~~t use ID so emit error message~~

+

−

~~ID = ID~~ .. ~~" "~~ .~~. set_error('redundant_parameters'~~, ~~'<code>|id=</code>~~ and ~~<code>|number=</code>');~~

+

--[[--------------------------------------------------------

−

~~end~~

+

−

~~end~~

+

This function is used to validate a parameter's assigned value for those parameters that have only a limited number

−

~~end~~

+

of allowable values (yes, y, true, live, dead, etc.). When the parameter value has not been assigned a value (missing

+

or empty in the source template) the function returns the value specified by ret_val. If the parameter value is one

+

of the list of allowed values returns the translated value; else, emits an error message and returns the value

+

specified by ret_val.

−

~~-- special case for cite interview~~

+

TODO: explain <invert>

−

~~if (config.CitationClass == "interview") then~~

−

~~if is_set(Program) then~~

−

~~ID = ' ' .. Program;~~

−

~~end~~

−

~~if is_set(Callsign) then~~

−

~~if is_set(ID) then~~

−

~~ID = ID .. sepc .. ' ' .. Callsign;~~

−

~~else~~

−

~~ID = ' ' .. Callsign;~~

−

~~end~~

−

~~end~~

−

~~if is_set(City) then~~

−

~~if is_set(ID) then~~

−

~~ID = ID .. sepc .. ' ' .. City;~~

−

~~else~~

−

~~ID = ' ' .. City;~~

−

~~end~~

−

~~end~~

−

~~if is_set(Others) then~~

+

]]

−

~~if is_set(TitleType) then~~

−

~~Others = ' ' .. TitleType .. ' with ' .. Others;~~

−

~~TitleType = '';~~

−

~~else~~

−

~~Others = ' ' .. 'Interview with ' .. Others;~~

−

~~end~~

−

~~else~~

−

~~Others = '(Interview)';~~

−

~~end~~

−

~~end~~

−

~~-- special case for cite mailing list~~

+

local function is_valid_parameter_value (value, name, possible, ret_val, invert)

−

if (~~config.CitationClass == "mailinglist"~~) then

+

if not utilities.is_set (value) then

−

~~Periodical = A ['MailingList']~~;

+

return ret_val; -- an empty parameter is ok

end

−

~~-- Account for the oddity that is {{cite conference}}, before generation of COinS data.~~

+

if (not invert and utilities.in_array (value, possible)) then -- normal; <value> is in <possible> table

−

if ~~'conference' == config~~.~~CitationClass then~~

+

return cfg.keywords_xlate[value]; -- return translation of parameter keyword

−

~~if is_set~~(~~BookTitle~~) then

+

elseif invert and not utilities.in_array (value, possible) then -- invert; <value> is not in <possible> table

−

~~Chapter = Title~~;

+

return value; -- return <value> as it is

−

-- ~~ChapterLink = TitleLink~~; -- ~~|chapterlink= is deprecated~~

+

else

−

~~ChapterURL = URL~~;

+

utilities.set_message ('err_invalid_param_val', {name, value}); -- not an allowed value so add error message

−

~~ChapterURLorigin = URLorigin;~~

+

return ret_val;

−

~~URLorigin = '';~~

−

~~ChapterFormat = Format~~;

−

~~TransChapter = TransTitle;~~

−

~~Title = BookTitle;~~

−

~~Format = '';~~

−

-- ~~TitleLink = '';~~

−

~~TransTitle = '';~~

−

~~URL = '';~~

−

~~end~~

−

~~elseif 'speech' ~= config~~.~~CitationClass then~~

−

~~Conference =~~ ''; -- not ~~cite conference or cite speech~~ so ~~make sure this is empty string~~

end

+

end

+

--[[--------------------------< T E R M I N A T E _ N A M E _ L I S T >----------------------------------------

+

This function terminates a name list (author, contributor, editor) with a separator character (sepc) and a space

+

when the last character is not a sepc character or when the last three characters are not sepc followed by two

+

closing square brackets (close of a wikilink). When either of these is true, the name_list is terminated with a

+

single space character.

+

]]

−

~~-- cite map oddities~~

+

local function terminate_name_list (name_list, sepc)

−

local ~~Cartography = "";~~

+

if (string.sub (name_list, -3, -1) == sepc .. '. ') then -- if already properly terminated

−

~~local Scale = "";~~

+

return name_list; -- just return the name list

−

~~local Sheet = A['Sheet'] or '';~~

+

elseif (string.sub (name_list, -1, -1) == sepc) or (string.sub (name_list, -3, -1) == sepc .. ']]') then -- if last name in list ends with sepc char

−

~~local Sheets = A['Sheets'] or '';~~

+

return name_list .. " "; -- don't add another

−

if ~~config~~.~~CitationClass~~ == ~~"map" then~~

+

else

−

~~Chapter = A[~~'~~Map~~'];

+

return name_list .. sepc .. ' '; -- otherwise terminate the name list

−

~~ChapterURL = A['MapURL']~~;

+

end

−

~~TransChapter~~ = ~~A['TransMap'];~~

+

end

−

~~ChapterURLorigin~~ = ~~A:ORIGIN~~(~~'MapURL'~~);

−

~~ChapterFormat~~ = ~~A['MapFormat~~'];

−

~~Cartography = A['Cartography~~'];

−

~~if is_set( Cartography~~ ) then

−

~~Cartography = sepc~~ .. " " ~~.. wrap_msg (~~'~~cartography', Cartography, use_lowercase);~~

−

~~end~~

−

~~Scale = A['Scale'];~~

−

~~if is_set( Scale ) then~~

−

~~Scale = sepc~~ .. ~~" "~~ .. ~~Scale~~;

−

end

−

end

−

~~-- Account for the oddities that are {{cite episode}} and {{cite serial}}, before generation of COinS data.~~

−

~~if 'episode' == config.CitationClass or 'serial' == config.CitationClass then~~

−

~~local AirDate = A['AirDate'];~~

−

~~local Began = A['Began']; -- these two are deprecated because the module understands date ranges~~

−

~~local Ended = A['Ended'];~~

−

~~local SeriesLink = A['SeriesLink'];~~

−

~~local Network = A['Network'];~~

−

~~local Station = A['Station'];~~

−

~~local s, n = {}, {};~~

−

-- ~~do common parameters first~~

+

--[[-------------------------< F O R M A T _ V O L U M E _ I S S U E >-----------------------------------------

−

~~if is_set(Network) then table.insert(n, Network); end~~

−

~~if is_set(Station) then table.insert(n, Station); end~~

−

~~ID = table.concat(n, sepc .. ' ');~~

−

~~if not is_set (Date) then~~ -- ~~promote airdate or Began/Ended to date~~

−

~~if is_set (AirDate) then~~

−

~~Date = AirDate;~~

−

~~elseif is_set (Began) then~~ -- ~~deprecated~~

−

~~if Began:match('%s') or Ended:match('%s') then~~ -- ~~so we don't create errors: if either has spaces then~~

−

~~Date = Began .. ' – ' .. Ended;~~ -- ~~use spaced ndash as separator~~

−

~~else~~

−

~~Date = Began .. '–' .. Ended;~~ -- ~~elsewise no spaces~~

−

~~end~~

−

~~end~~

−

~~end~~

−

~~if 'episode' == config.CitationClass then -- handle~~ the ~~oddities that are strictly {{cite episode}}~~

+

returns the concatenation of the formatted volume and issue (or journal article number) parameters as a single

−

~~local Season = A['Season'];~~

+

string; or formatted volume or formatted issue, or an empty string if neither are set.

−

~~local SeriesNumber = A['SeriesNumber']~~;

−

~~if is_set (Season) and is_set (SeriesNumber) then -- these are mutually exclusive so if both are set~~

+

]]

−

~~table.insert( z.message_tail, { set_error( 'redundant_parameters', {wrap_style ('parameter', 'season') .. ' and ' .. wrap_style ('parameter', 'seriesno')}, true ) } );~~ ~~-- add error message~~

+

−

~~SeriesNumber = ''; -- unset; prefer |season= over |seriesno=~~

+

local function format_volume_issue (volume, issue, article, cite_class, origin, sepc, lower)

−

~~end~~

+

if not utilities.is_set (volume) and not utilities.is_set (issue) and not utilities.is_set (article) then

−

~~-- assemble a table of parts concatenated later into Series~~

+

return '';

−

~~if is_set~~(~~Season) then table.insert(s~~, ~~wrap_msg ('season'~~, ~~Season~~, ~~use_lowercase)); end~~

−

~~if is_set(SeriesNumber) then table.insert(s~~, ~~wrap_msg ('series'~~, ~~SeriesNumber~~, ~~use_lowercase)~~)~~; end~~

−

if ~~is_set(Issue) then table.insert(s, wrap_msg ('episode', Issue, use_lowercase)); end~~

−

~~Issue = ''; -- unset because this is~~ not ~~a unique parameter~~

−

~~Chapter = Title; -- promote title parameters to chapter~~

−

~~ChapterLink = TitleLink; -- alias episodelink~~

−

~~TransChapter = TransTitle;~~

−

~~ChapterURL = URL;~~

−

~~ChapterURLorigin = A:ORIGIN('URL');~~

−

~~Title = Series; -- promote series to title~~

−

~~TitleLink = SeriesLink;~~

−

~~Series = table.concat(s, sepc .~~. ~~' '); -- this is concatenation of season, seriesno, episode number~~

−

if is_set (~~ChapterLink~~) and not is_set (~~ChapterURL~~) ~~then -- link but~~ not ~~URL~~

−

~~Chapter = '[[' .. ChapterLink .. '|' .. Chapter .~~. ~~']]'; -- ok to wikilink~~

−

~~elseif~~ is_set (~~ChapterLink) and is_set (ChapterURL~~) then ~~-- if both are set, URL links episode;~~

−

~~Series = '[[' .. ChapterLink .. '|' .. Series .. ']]'; -- series links with ChapterLink (episodelink -> TitleLink -> ChapterLink) ugly~~

−

~~end~~

−

~~URL = ''; -- unset~~

−

~~TransTitle = ''; -- unset~~

−

~~else -- now oddities that are cite serial~~

−

~~Issue = ''; -- unset because this parameter no longer supported by the citation/core version of cite serial~~

−

~~Chapter = A['Episode']; -- TODO: make |episode= available to cite episode someday?~~

−

~~if is_set (Series) and is_set (SeriesLink) then~~

−

~~Series = '[[' .. SeriesLink .. '|' .. Series ..~~ ']]';

−

~~end~~

−

~~Series = wrap_style ('italic-title', Series); -- series is italicized~~

−

~~end~~

end

−

~~-- end of {{cite episode}} stuff~~

−

-- ~~Account for the oddities that are {{cite arxiv}}, before generation of COinS data.~~

+

-- same condition as in format_pages_sheets()

−

if '~~arxiv~~' == ~~config.CitationClass then~~

+

local is_journal = 'journal' == cite_class or (utilities.in_array (cite_class, {'citation', 'map', 'interview'}) and 'journal' == origin);

−

~~if not is_set (ID_list['ARXIV']) then -- |arxiv=~~ or ~~|eprint= required for cite arxiv~~

−

~~table.insert~~( z.~~message_tail, { set_error~~( ~~'arxiv_missing'~~, {~~}, true ) } ); -- add error message~~

−

~~end~~

−

~~if first_set (AccessDate, At, Chapter, Format, Page, Pages, Periodical, PublisherName, URL, -- a crude list of parameters that are not supported by cite arxiv~~

−

~~ID_list[~~'~~ASIN~~'], ~~ID_list[~~'~~BIBCODE~~'], ~~ID_list[~~'~~DOI~~'~~], ID_list['ISBN'], ID_list['ISSN'],~~

−

~~ID_list['JFM'], ID_list['JSTOR'], ID_list['LCCN'], ID_list['MR'], ID_list['OCLC'], ID_list['OL'],~~

−

~~ID_list['OSTI'], ID_list['PMC'], ID_list['PMID'], ID_list['RFC'], ID_list['SSRN'], ID_list['USENETID'], ID_list['ZBL']~~) ~~then~~

−

~~table.insert( z.message_tail, { set_error(~~ '~~arxiv_params_not_supported~~'~~, {}, true ) }~~ ); ~~-- add error message~~

−

~~AccessDate~~= ''~~; -- set these to empty string; not supported in cite arXiv~~

+

local is_numeric_vol = volume and (volume:match ('^[MDCLXVI]+$') or volume:match ('^%d+$')); -- is only uppercase roman numerals or only digits?

−

~~PublisherName =~~ ''; -- ~~(if the article has been published, use cite journal,~~ or ~~other)~~

+

local is_long_vol = volume and (4 < mw.ustring.len(volume)); -- is |volume= value longer than 4 characters?

−

~~Chapter~~ = '';

+

−

~~URL~~ = ~~'';~~

+

if volume and (not is_numeric_vol and is_long_vol) then -- when not all digits or Roman numerals, is |volume= longer than 4 characters?

−

~~Format = '';~~

+

utilities.add_prop_cat ('long-vol'); -- yes, add properties cat

−

~~Page~~ = ~~''; Pages = ''; At = '';~~

−

~~end~~

−

~~Periodical =~~ '~~arXiv~~'; -- ~~set to arXiv for COinS; after that~~, ~~must be set to empty string~~

end

−

-- ~~handle type parameter for those CS1 citations that have default values~~

+

if is_journal then -- journal-style formatting

+

local vol = '';

−

if ~~in_array~~(~~config.CitationClass, {"AV~~-~~media~~-~~notes", "DVD~~-~~notes"~~, ~~"mailinglist"~~, ~~"map", "podcast", "pressrelease", "report", "techreport", "thesis"~~}) then

+

if utilities.is_set (volume) then

−

~~TitleType~~ = ~~set_titletype~~ (~~config~~.~~CitationClass~~, ~~TitleType~~);

+

if is_numeric_vol then -- |volume= value all digits or all uppercase Roman numerals?

−

~~if is_set(Degree) and "Thesis" == TitleType then~~ -- ~~special case for cite thesis~~

+

vol = utilities.substitute (cfg.presentation['vol-bold'], {sepc, volume}); -- render in bold face

−

~~TitleType~~ = ~~Degree~~ .. ~~" thesis"~~;

+

elseif is_long_vol then -- not all digits or Roman numerals; longer than 4 characters?

+

vol = utilities.substitute (cfg.messages['j-vol'], {sepc, utilities.hyphen_to_dash (volume)}); -- not bold

+

else -- four or fewer characters

+

vol = utilities.substitute (cfg.presentation['vol-bold'], {sepc, utilities.hyphen_to_dash (volume)}); -- bold

+

end

+

vol = vol .. (utilities.is_set (issue) and utilities.substitute (cfg.messages['j-issue'], issue) or '')

+

vol = vol .. (utilities.is_set (article) and utilities.substitute (cfg.messages['j-article-num'], article) or '')

+

return vol;

end

−

+

−

if is_set(~~TitleType~~) then -- ~~if type parameter is specified~~

+

if 'podcast' == cite_class and utilities.is_set (issue) then

−

~~TitleType = "~~ (" .. ~~TitleType~~ .~~. "~~)"; -- ~~display it in parentheses~~

+

return wrap_msg ('issue', {sepc, issue}, lower);

+

end

+

if 'conference' == cite_class and utilities.is_set (article) then -- |article-number= supported only in journal and conference cites

+

if utilities.is_set (volume) and utilities.is_set (article) then -- both volume and article number

+

return wrap_msg ('vol-art', {sepc, utilities.hyphen_to_dash (volume), article}, lower);

+

elseif utilities.is_set (article) then -- article number alone; when volume alone, handled below

+

return wrap_msg ('art', {sepc, article}, lower);

+

end

−

-- ~~legacy: promote concatenation~~ of ~~|month=, and |year= to Date if Date not set; or, promote PublicationDate to Date if neither Date nor Year are set.~~

+

-- all other types of citation

−

if ~~not~~ is_set (~~Date~~) then

+

if utilities.is_set (volume) and utilities.is_set (issue) then

−

~~Date = Year;~~ -~~- promote Year to Date~~

+

return wrap_msg ('vol-no', {sepc, utilities.hyphen_to_dash (volume), issue}, lower);

−

~~Year = nil~~; ~~-- make nil so Year as empty string isn't used for CITEREF~~

+

elseif utilities.is_set (volume) then

−

if is_set(~~Date~~) then

+

return wrap_msg ('vol', {sepc, utilities.hyphen_to_dash (volume)}, lower);

−

~~local Month = A[~~'~~Month~~'];

+

else

−

~~if is_set~~(~~Month~~) ~~then~~

+

return wrap_msg ('issue', {sepc, issue}, lower);

−

~~Date = Month .. " " .. Date~~;

−

~~end~~

−

~~elseif is_set~~(~~PublicationDate) then -- use PublicationDate when |date= and |year= are not set~~

−

~~Date = PublicationDate; -- promote PublicationDate to Date~~

−

~~PublicationDate =~~ ''; ~~-- unset, no longer needed~~

−

~~end~~

end

+

end

+

--[[-------------------------< F O R M A T _ P A G E S _ S H E E T S >-----------------------------------------

−

~~if PublicationDate~~ == ~~Date then PublicationDate = ''; end -- if PublicationDate~~ is ~~same as Date~~, ~~don't display in rendered citation~~

+

adds static text to one of |page(s)= or |sheet(s)= values and returns it with all of the others set to empty strings.

+

The return order is:

+

page, pages, sheet, sheets

−

~~--[[~~

+

Singular has priority over plural when both are provided.

−

~~Go test all of the date-holding parameters for valid MOS:DATE format and make sure that dates~~ are ~~real dates. This must be done before we do COinS because here is where~~

−

~~we get the date used in the metadata~~.

−

~~Date validation supporting code is in Module:Citation/CS1/Date_validation~~

]]

−

~~do -- create defined block to contain local variables error_message and mismatch~~

−

~~local error_message = '';~~

−

~~-- AirDate has been promoted to Date so not necessary to check it~~

−

~~anchor_year, COinS_date, error_message = dates({['accessdate']=AccessDate, ['archivedate']=ArchiveDate, ['date']=Date, ['doi_brokendate']=DoiBroken,~~

−

~~['embargo']=Embargo, ['laydate']=LayDate, ['publicationdate']=PublicationDate, ['year']=Year});~~

−

~~if is_set (Year) and is_set (Date) then -- both |date= and |year= not normally needed;~~

+

local function format_pages_sheets (page, pages, sheet, sheets, cite_class, origin, sepc, nopp, lower)

−

local ~~mismatch = year_date_check~~ (~~Year~~, ~~Date~~)

+

if 'map' == cite_class then -- only cite map supports sheet(s) as in-source locators

−

if 0 == ~~mismatch~~ then -- ~~|year= does not match a year~~-~~value in |date=~~

+

if utilities.is_set (sheet) then

−

if is_set (~~error_message~~) then -- if ~~there is already an error message~~

+

if 'journal' == origin then

−

~~error_message = error_message ..~~ ', '; ~~-- tack on this additional message~~

+

return '', '', wrap_msg ('j-sheet', sheet, lower), '';

−

~~end~~

+

else

−

~~error_message = error_message ..~~ '~~|year= / |date= mismatch~~';

+

return '', '', wrap_msg ('sheet', {sepc, sheet}, lower), '';

−

elseif 1 == ~~mismatch~~ then -~~- |year= matches year-value in |date=~~

+

end

−

~~add_maint_cat~~ ('~~date_year~~');

+

elseif utilities.is_set (sheets) then

+

if 'journal' == origin then

+

return '', '', '', wrap_msg ('j-sheets', sheets, lower);

+

else

+

return '', '', '', wrap_msg ('sheets', {sepc, sheets}, lower);

end

+

end

−

if is_set(~~error_message~~) then

+

local is_journal = 'journal' == cite_class or (utilities.in_array (cite_class, {'citation', 'map', 'interview'}) and 'journal' == origin);

−

~~table~~.~~insert~~( z.~~message_tail~~, { ~~set_error~~( '~~bad_date~~', {~~error_message}~~, ~~true )~~ } ); ~~-- add this error message~~

+

if utilities.is_set (page) then

+

if is_journal then

+

return utilities.substitute (cfg.messages['j-page(s)'], page), '', '', '';

+

elseif not nopp then

+

return utilities.substitute (cfg.messages['p-prefix'], {sepc, page}), '', '', '';

+

else

+

return utilities.substitute (cfg.messages['nopp'], {sepc, page}), '', '', '';

end

−

~~end -- end of do~~

+

elseif utilities.is_set (pages) then

−

+

if is_journal then

−

~~-- Account for the oddity that is {{cite journal}} with |pmc= set and |url= not set~~. ~~Do this after date check but before COInS~~.

+

return utilities.substitute (cfg.messages['j-page(s)'], pages), '', '', '';

−

-~~- Here we unset Embargo if PMC not embargoed~~ (~~|embargo= not set in the citation~~) ~~or if the embargo time has expired. Otherwise~~, ~~holds embargo date~~

+

elseif tonumber(pages) ~= nil and not nopp then -- if pages is only digits, assume a single page number

−

~~Embargo = is_embargoed~~ (~~Embargo~~); --

+

return '', utilities.substitute (cfg.messages['p-prefix'], {sepc, pages}), '', '';

−

+

elseif not nopp then

−

~~if config~~.~~CitationClass == "journal" and not is_set~~(~~URL) and is_set(ID_list~~['~~PMC~~']) ~~then~~

+

return '', utilities.substitute (cfg.messages['pp-prefix'], {sepc, pages}), '', '';

−

if not ~~is_set (Embargo)~~ then ~~-- if not embargoed or embargo has expired~~

+

else

−

~~URL=~~cfg.~~id_handlers~~['~~PMC~~']~~.prefix .. ID_list[~~'~~PMC~~']; ~~-- set url to be the same as the PMC external link if not embargoed~~

+

return '', utilities.substitute (cfg.messages['nopp'], {sepc, pages}), '', '';

−

~~URLorigin =~~ cfg.~~id_handlers~~['~~PMC~~']~~.parameters[1]~~; ~~-- set URLorigin to parameter name for use in error message if citation is missing a |title=~~

end

+

return '', '', '', ''; -- return empty strings

+

end

−

~~-- At this point fields may be nil if they weren't specified in the template use. We can use that fact.~~

−

~~-- Test if citation has no title~~

−

~~if not is_set(Title) and~~

−

~~not is_set(TransTitle) and~~

−

~~not is_set(ScriptTitle) then~~

−

~~table.insert( z.message_tail, { set_error( 'citation_missing_title', {}, true ) } );~~

−

~~end~~

−

~~if 'none' == Title and is_set(Periodical) and not (( config.CitationClass == "encyclopaedia" ) or ( config.CitationClass == "citation" and is_set (Encyclopedia))) then -- special case~~

−

~~Title = ''; -- set title to empty string~~

−

~~add_maint_cat ('untitled');~~

−

~~end~~

−

-- ~~COinS metadata (see~~ <~~http://ocoins.info/~~>~~) for automated parsing of citation information.~~

+

--[[------------------------------------------------------------------------

−

-- ~~handle the oddity that is cite encyclopedia and {{citation |encyclopedia=something}}. Here we presume that~~

−

-- ~~when Periodical, Title, and Chapter are all set, then Periodical is the book (encyclopedia) title, Title~~

−

-- ~~is the article title, and Chapter is a section within the article. So, we remap~~

−

~~local coins_chapter = Chapter;~~ -- ~~default assuming that remapping not required~~

−

~~local coins_title = Title;~~ -- ~~et tu~~

−

~~if 'encyclopaedia' == config.CitationClass or ('citation' == config.CitationClass and is_set (Encyclopedia)) then~~

−

~~if is_set (Chapter) and is_set (Title) and is_set (Periodical) then~~ -- ~~if all are used then~~

−

~~coins_chapter = Title;~~ -- ~~remap~~

−

~~coins_title = Periodical;~~

−

~~end~~

−

~~end~~

−

-- ~~this is the function call to COinS()~~

−

~~local OCinSoutput = COinS({~~

−

~~['Periodical'] = Periodical,~~

−

~~['Chapter'] = strip_apostrophe_markup (coins_chapter),~~ -- ~~Chapter stripped of bold / italic wikimarkup~~

−

~~['Title'] = make_coins_title (coins_title, ScriptTitle),~~ -- ~~Title and ScriptTitle stripped of bold / italic wikimarkup~~

−

~~['PublicationPlace'] = PublicationPlace,~~

−

~~['Date'] = first_set(COinS_date, Date),~~ -- ~~COinS_date has correctly formatted date if Date is valid; any reason to keep Date here? Should we be including invalid dates in metadata?~~

−

~~['Series'] = Series,~~

−

~~['Volume'] = Volume,~~

−

~~['Issue'] = Issue,~~

−

~~['Pages'] = get_coins_pages (first_set(Sheet, Sheets, Page, Pages, At)),~~ -- ~~pages stripped of external links~~

−

~~['Edition'] = Edition,~~

−

~~['PublisherName'] = PublisherName,~~

−

~~['URL'] = first_set( URL, ChapterURL ),~~

−

~~['Authors'] = a,~~

−

~~['ID_list'] = ID_list,~~

−

~~['RawPage'] = this_page.prefixedText,~~

−

~~}, config.CitationClass);~~

−

~~-- Account for~~ the ~~oddities that are {{cite arxiv}}, AFTER generation of COinS data.~~

+

returns one of the in-source locators: page, pages, or at.

−

~~if 'arxiv' == config.CitationClass then~~ -~~- we have set rft.jtitle in COinS to arXiv~~, ~~now unset so it isn't displayed~~

−

~~Periodical = ''; -- periodical not allowed in cite arxiv; if article has been published~~, ~~use cite journal~~

−

~~end~~

−

-~~- special case~~ for ~~cite newsgroup~~. ~~Do this after~~ COinS because we ~~are modifying Publishername~~ to ~~include some static text~~

+

If any of these are interwiki links to Wikisource, returns the label portion of the interwiki-link as plain text

−

~~if 'newsgroup' == config.CitationClass then~~

+

for use in COinS. This COinS thing is done because here we convert an interwiki-link to an external link and

−

~~if is_set~~ (~~PublisherName~~) ~~then~~

+

add an icon span around that; get_coins_pages() doesn't know about the span. TODO: should it?

−

~~PublisherName =~~ '~~[[Newsgroup]]: ' .~~. ~~external_link( 'news~~:~~' .. PublisherName, PublisherName );~~

−

~~end~~

−

~~end~~

+

TODO: add support for sheet and sheets?; streamline;

+

TODO: make it so that this function returns only one of the three as the single in-source (the return value assigned

+

to a new name)?

−

~~-- Now perform various field substitutions.~~

+

]]

−

~~-- We also add leading spaces and surrounding markup and punctuation to the~~

−

~~-- various parts of the citation, but only when they are non-nil.~~

−

~~do -- do-block to limit scope of LastFirstAuthors~~

−

~~local LastFirstAuthors;~~

−

~~local Maximum = A['DisplayAuthors'~~];

−

~~Maximum~~ , ~~author_etal = get_display_authors_editors (Maximum~~, #a, ~~'authors'~~, ~~author_etal~~);

+

local function insource_loc_get (page, page_orig, pages, pages_orig, at)

+

local ws_url, ws_label, coins_pages, L; -- for Wikisource interwiki-links; TODO: this corrupts page metadata (span remains in place after cleanup; fix there?)

−

~~local control = {~~

+

if utilities.is_set (page) then

−

~~format~~ = ~~NameListFormat,~~ -- ~~empty string or~~ '~~vanc~~'

+

if utilities.is_set (pages) or utilities.is_set (at) then

−

~~maximum~~ = ~~Maximum~~,

+

pages = ''; -- unset the others

−

~~lastauthoramp~~ = ~~LastAuthorAmp~~,

+

at = '';

−

~~page_name~~ = ~~this_page~~.~~text~~ -- ~~get current~~ page ~~name so that we don't wikilink to it via authorlinkn~~

+

end

−

};

+

extra_text_in_page_check (page, page_orig); -- emit error message when |page= value begins with what looks like p., pp., etc.

−

+

−

~~-- If the coauthor field is also used, prevent ampersand and et al. formatting~~.

+

ws_url, ws_label, L = wikisource_url_make (page); -- make ws URL from |page= interwiki link; link portion L becomes tooltip label

−

if is_set(~~Coauthors~~) then

+

if ws_url then

−

~~control.lastauthoramp~~ = ~~nil;~~

+

page = external_link (ws_url, ws_label .. ' ', 'ws link in page'); -- space char after label to move icon away from in-source text; TODO: a better way to do this?

−

~~control.maximum = #a + 1~~;

+

page = utilities.substitute (cfg.presentation['interwiki-icon'], {cfg.presentation['class-wikisource'], L, page});

+

coins_pages = ws_label;

+

end

+

elseif utilities.is_set (pages) then

+

if utilities.is_set (at) then

+

at = ''; -- unset

end

−

+

extra_text_in_page_check (pages, pages_orig); -- emit error message when |page= value begins with what looks like p., pp., etc.

−

~~LastFirstAuthors = list_people~~(~~control~~, ~~a, author_etal~~);

−

~~if is_set~~ (~~Authors~~) then

+

ws_url, ws_label, L = wikisource_url_make (pages); -- make ws URL from |pages= interwiki link; link portion L becomes tooltip label

−

~~if is_set~~ (~~LastFirstAuthors~~) ~~then~~ -- ~~if both author name styles~~

+

if ws_url then

−

~~table~~.~~insert~~( z.~~message_tail, { set_error(~~ '~~redundant_parameters~~', {~~wrap_style (~~'~~parameter~~', ~~'authors'~~) .~~. ' and '~~ .. ~~wrap_style (~~'~~parameter~~', '~~last~~'~~)}, true ) }~~ ); -- ~~add error message~~

+

pages = external_link (ws_url, ws_label .. ' ', 'ws link in pages'); -- space char after label to move icon away from in-source text; TODO: a better way to do this?

−

~~Authors = LastFirstAuthors~~; -- TODO: is this ~~correct or should we use |authors= instead~~?

+

pages = utilities.substitute (cfg.presentation['interwiki-icon'], {cfg.presentation['class-wikisource'], L, pages});

−

~~end~~

+

coins_pages = ws_label;

−

~~else~~

+

end

−

~~Authors~~ = ~~LastFirstAuthors~~; ~~-- either an author name list or an empty string~~

+

elseif utilities.is_set (at) then

+

ws_url, ws_label, L = wikisource_url_make (at); -- make ws URL from |at= interwiki link; link portion L becomes tooltip label

+

if ws_url then

+

at = external_link (ws_url, ws_label .. ' ', 'ws link in at'); -- space char after label to move icon away from in-source text; TODO: a better way to do this?

+

at = utilities.substitute (cfg.presentation['interwiki-icon'], {cfg.presentation['class-wikisource'], L, at});

+

coins_pages = ws_label;

end

−

~~end -- end of do~~

−

~~if not is_set(Authors) and is_set(Coauthors) then -- coauthors aren't displayed if one of authors=, authorn=, or lastn= isn't specified~~

−

~~table.insert( z.message_tail, { set_error('coauthors_missing_author', {}, true) } ); -- emit error message~~

end

+

return page, pages, at, coins_pages;

+

end

−

~~local EditorCount;~~ -- ~~used only for choosing {ed.) or (eds.) annotation at end of editor name~~-~~list~~

+

--[[--------------------------------------------------------------

−

~~if not is_set(Editors) then~~

−

~~local Maximum =~~ A~~['DisplayEditors'];~~

−

~~Maximum , editor_etal = get_display_authors_editors (Maximum, #e, 'editors', editor_etal);~~

+

add error message when |archive-url= value is same as |url= or chapter-url= (or alias...) value

−

-~~- Preserve old-style implicit et al.~~

−

~~if not is_set(Maximum) and #e~~ == ~~4 then~~

−

~~Maximum~~ = 3;

−

~~table~~.~~insert( z~~.~~message_tail, { set_error('implict_etal_editor', {}, true) }~~ );

−

~~end~~

−

~~local control = {~~

+

]]

−

~~format = NameListFormat, -- empty string or 'vanc'~~

−

~~maximum = Maximum,~~

−

~~lastauthoramp = LastAuthorAmp,~~

−

~~page_name = this_page.text -- get current page name so that we don't wikilink to it via editorlinkn~~

−

};

−

~~Editors~~, ~~EditorCount = list_people(control~~, e, ~~editor_etal~~);

+

local function is_unique_archive_url (archive, url, c_url, source, date)

−

if 1 == ~~EditorCount and (true~~ == ~~editor_etal or 1 < #e~~) ~~then~~ -- ~~only one editor displayed but includes etal then~~

+

if utilities.is_set (archive) then

−

~~EditorCount~~ = 2; -- ~~spoof to display (eds.) annotation~~

+

if archive == url or archive == c_url then

+

utilities.set_message ('err_bad_url', {utilities.wrap_style ('parameter', source)}); -- add error message

+

return '', ''; -- unset |archive-url= and |archive-date= because same as |url= or |chapter-url=

end

−

~~else~~

−

~~EditorCount = 1;~~

end

−

-- ~~apply |~~[xx-~~]format= styling; at the end, these parameters hold correctly styled format annotation,~~

+

return archive, date;

−

-- ~~an error message if the associated url is not set, or an empty string for concatenation~~

+

end

−

~~ArchiveFormat = style_format (ArchiveFormat, ArchiveURL, 'archive~~-~~format', 'archive~~-~~url');~~

+

−

~~ChapterFormat = style_format (ChapterFormat, ChapterURL, 'chapter~~-~~format', 'chapter~~-~~url');~~

+

−

~~ConferenceFormat = style_format (ConferenceFormat, ConferenceURL, 'conference~~-~~format', 'conference~~-~~url');~~

+

--[=[-------------------------< A R C H I V E _ U R L _ C H E C K >--------------------------------------------

−

~~Format = style_format (Format,~~ URL, '~~format', 'url~~');

+

−

~~LayFormat = style_format (LayFormat, LayURL, 'lay-format', 'lay-url');~~

+

Check archive.org URLs to make sure they at least look like they are pointing at valid archives and not to the

−

~~TranscriptFormat = style_format (TranscriptFormat, TranscriptURL, 'transcript-format', 'transcripturl');~~

+

save snapshot URL or to calendar pages. When the archive URL is 'https://web.archive.org/save/' (or http://...)

+

archive.org saves a snapshot of the target page in the URL. That is something that Wikipedia should not allow

+

unwitting readers to do.

−

if ~~not is_set(URL) then~~ --and

+

When the archive.org URL does not have a complete timestamp, archive.org chooses a snapshot according to its own

−

-~~- not is_set(ArchiveURL) then --~~and ~~-- prevents format_missing_url~~ error ~~from registering~~

+

algorithm or provides a calendar 'search' result. [[WP:ELNO]] discourages links to search results.

−

-- ~~not is_set(ConferenceURL) and~~ -~~- TODO: keep this here? conference as part of cite web or cite podcast?~~

+

−

-- not ~~is_set~~(~~TranscriptURL~~) ~~then -- TODO: remove?~~ |~~transcript~~-url= and |~~transcript~~= ~~has separate test~~

+

This function looks at the value assigned to |archive-url= and returns empty strings for |archive-url= and

−

+

|archive-date= and an error message when:

−

-- ~~Test if cite~~ web ~~or cite podcast |url= is missing or empty~~

+

|archive-url= holds an archive.org save command URL

−

~~if in_array(config~~.~~CitationClass, {"~~web~~","podcast", "mailinglist"}) then~~

+

|archive-url= is an archive.org URL that does not have a complete timestamp (YYYYMMDDhhmmss 14 digits) in the

−

~~table~~.~~insert~~( ~~z.message_tail~~, ~~{ set_error(~~ '~~cite_web_url~~', {}, ~~true~~ ) } );

+

correct place

−

~~end~~

+

otherwise returns |archive-url= and |archive-date=

−

+

−

~~-- Test if accessdate~~ is ~~given without giving~~ a URL

+

There are two mostly compatible archive.org URLs:

−

~~if is_set~~(~~AccessDate~~) ~~and~~ not ~~is_set~~(~~ChapterURL~~)~~then~~ -- ~~ChapterURL may be set when~~ the ~~others are not set; TODO: move this to a separate test?~~

+

//web.archive.org/<timestamp>... -- the old form

−

~~table.insert~~( ~~z.message_tail~~, ~~{ set_error(~~ '~~accessdate_missing_url~~', {}, ~~true ) } )~~;

+

//web.archive.org/web/<timestamp>... -- the new form

−

~~AccessDate~~ = '';

+

−

~~end~~

+

The old form does not support or map to the new form when it contains a display flag. There are four identified flags

+

('id_', 'js_', 'cs_', 'im_') but since archive.org ignores others following the same form (two letters and an underscore)

+

we don't check for these specific flags but we do check the form.

+

This function supports a preview mode. When the article is rendered in preview mode, this function may return a modified

+

archive URL:

+

for save command errors, return undated wildcard (/*/)

+

for timestamp errors when the timestamp has a wildcard, return the URL unmodified

+

for timestamp errors when the timestamp does not have a wildcard, return with timestamp limited to six digits plus wildcard (/yyyymm*/)

+

A secondary function is to return an archive-url timestamp from those urls that have them (archive.org and

+

archive.today). The timestamp is used by validation.archive_date_check() to see if the value in |archive-date=

+

matches the timestamp in the archive url.

+

]=]

+

local function archive_url_check (url, date)

+

local err_msg = ''; -- start with the error message empty

+

local path, timestamp, flag; -- portions of the archive.org URL

+

timestamp = url:match ('//archive.today/(%d%d%d%d%d%d%d%d%d%d%d%d%d%d)/'); -- get timestamp from archive.today urls

+

if timestamp then -- if this was an archive.today url ...

+

return url, date, timestamp; -- return ArchiveURL, ArchiveDate, and timestamp from |archive-url=, and done

end

−

+

-- here for archive.org urls

−

~~local OriginalURL, OriginalFormat;~~ -- ~~TODO: swap chapter and title~~ here ~~so that~~ archive ~~applies to most specific if both are set?~~

+

if (not url:match('//web%.archive%.org/')) and (not url:match('//liveweb%.archive%.org/')) then -- also deprecated liveweb Wayback machine URL

−

~~DeadURL = DeadURL:lower(); -- used later when assembling archived text~~

+

return url, date; -- not an archive.org archive, return ArchiveURL and ArchiveDate

−

if ~~is_set~~( ~~ArchiveURL ) then~~

−

~~if is_set~~ (~~URL) then~~

−

~~OriginalURL = URL; -- save copy of original source URL~~

−

~~OriginalFormat = Format; -- and original |format=~~

−

~~if 'no~~' ~~~= DeadURL then -- if URL set then archive-url applies to it~~

−

~~URL = ArchiveURL -- swap-in the~~ archive's url

−

~~URLorigin = A~~:~~ORIGIN~~('~~ArchiveURL~~') ~~-- name of archive url parameter for error messages~~

−

~~Format = ArchiveFormat or ''; -- swap in archive's format~~

−

~~end~~

−

~~elseif is_set (ChapterURL~~) then -- URL ~~not set so if chapter-~~url ~~is set apply archive url to it~~

−

~~OriginalURL = ChapterURL~~; -- ~~save copy of source chapter's url for~~ archive ~~text~~

−

~~OriginalFormat = ChapterFormat; -- and original |format=~~

−

~~if 'no' ~= DeadURL then~~

−

~~ChapterURL = ArchiveURL -- swap-in the~~ archive~~'s url~~

−

~~URLorigin = A:ORIGIN('~~ArchiveURL~~') -- name of archive url parameter for error messages~~

−

~~ChapterFormat = ArchiveFormat or ''; -- swap in archive's format~~

−

~~end~~

−

~~end~~

end

−

if ~~in_array~~(~~config~~.~~CitationClass~~, {"web~~","news","journal","pressrelease","podcast", "newsgroup"~~, '~~arxiv~~'}) or

+

if url:match('//web%.archive%.org/save/') then -- if a save command URL, we don't want to allow saving of the target page

−

('~~citation~~' == ~~config~~.~~CitationClass and is_set~~ (~~Periodical~~) ~~and~~ not ~~is_set~~ (~~Encyclopedia)~~) then

+

err_msg = cfg.err_msg_supl.save;

−

if ~~is_set~~ (~~Chapter~~) or ~~is_set~~ (~~TransChapter~~) or ~~is_set~~ (~~ChapterURL~~)then -- ~~chapter parameters not supported for these citation types~~

+

url = url:gsub ('(//web%.archive%.org)/save/', '%1/*/', 1); -- for preview mode: modify ArchiveURL

−

~~table~~.~~insert( z~~.~~message_tail, { set_error~~( '~~chapter_ignored~~', ~~{}, true~~ ) } ); -- ~~add error message~~

+

elseif url:match('//liveweb%.archive%.org/') then

−

~~Chapter~~ = ''; -- ~~set~~ to ~~empty string to be safe with concatenation~~

+

err_msg = cfg.err_msg_supl.liveweb;

−

~~TransChapter = '';~~

+

else

−

~~ChapterURL = '';~~

+

path, timestamp, flag = url:match('//web%.archive%.org/([^%d]*)(%d+)([^/]*)/'); -- split out some of the URL parts for evaluation

+

if not path then -- malformed in some way; pattern did not match

+

err_msg = cfg.err_msg_supl.timestamp;

+

elseif 14 ~= timestamp:len() then -- path and flag optional, must have 14-digit timestamp here

+

err_msg = cfg.err_msg_supl.timestamp;

+

if '*' ~= flag then

+

local replacement = timestamp:match ('^%d%d%d%d%d%d') or timestamp:match ('^%d%d%d%d'); -- get the first 6 (YYYYMM) or first 4 digits (YYYY)

+

if replacement then -- nil if there aren't at least 4 digits (year)

+

replacement = replacement .. string.rep ('0', 14 - replacement:len()); -- year or yearmo (4 or 6 digits) zero-fill to make 14-digit timestamp

+

url=url:gsub ('(//web%.archive%.org/[^%d]*)%d[^/]*', '%1' .. replacement .. '*', 1) -- for preview, modify ts to 14 digits plus splat for calendar display

+

end

−

~~else~~ -- ~~otherwise, format chapter~~ / ~~article title~~

+

elseif utilities.is_set (path) and 'web/' ~= path then -- older archive URLs do not have the extra 'web/' path element

−

~~Chapter~~ = ~~format_chapter_title (Chapter, TransChapter, ChapterURL, ChapterURLorigin)~~;

+

err_msg = cfg.err_msg_supl.path;

−

if is_set (~~Chapter~~) then

+

elseif utilities.is_set (flag) and not utilities.is_set (path) then -- flag not allowed with the old form URL (without the 'web/' path element)

−

~~if 'map'~~ =~~= config~~.~~CitationClass~~ and ~~is_set~~ (~~TitleType~~) then

+

err_msg = cfg.err_msg_supl.flag;

−

~~Chapter~~ = ~~Chapter .. ' '~~ .. ~~TitleType~~;

+

elseif utilities.is_set (flag) and not flag:match ('%a%a_') then -- flag if present must be two alpha characters and underscore (requires 'web/' path element)

−

~~end~~

+

err_msg = cfg.err_msg_supl.flag;

−

~~Chapter~~ = ~~Chapter .. ChapterFormat .. sepc .. ' ';~~

+

else

+

return url, date, timestamp; -- return ArchiveURL, ArchiveDate, and timestamp from |archive-url=

end

+

-- if here, something not right so

+

utilities.set_message ('err_archive_url', {err_msg}); -- add error message and

−

-- ~~Format main title.~~

+

if is_preview_mode then

−

~~if is_set(TitleLink) and is_set(Title) then~~

+

return url, date, timestamp; -- preview mode so return ArchiveURL, ArchiveDate, and timestamp from |archive-url=

−

~~Title = "[[" .. TitleLink .. "|" .. Title .. "]]"~~

+

else

+

return '', ''; -- return empty strings for ArchiveURL and ArchiveDate

end

+

end

+

--[[----------------------------------------------------------------------------------

−

~~if in_array(config.CitationClass~~, ~~{"web","news","journal","pressrelease","podcast", "newsgroup", "mailinglist"~~, ~~'arxiv'}) or~~

+

check |place=, |publication-place=, |location= to see if these params include digits. This function added because

−

~~('citation'~~ =~~= config~~.~~CitationClass and is_set (Periodical) and not is_set (Encyclopedia)) or~~

+

many editors misuse location to specify the in-source location (|page(s)= and |at= are supposed to do that)

−

~~('map' == config.CitationClass and is_set (Periodical)) then -- special case for cite map when~~ the ~~map is~~ in ~~a periodical treat as an article~~

+

−

~~Title = kern_quotes (Title); -~~- ~~if necessary, separate title's leading and trailing quote marks from Module provided quote marks~~

+

returns the original parameter value without modification; added maint cat when parameter value contains digits

−

~~Title = wrap_style~~ (~~'quoted-title', Title);~~

+

−

+

]]

−

~~Title = script_concatenate~~ (~~Title, ScriptTitle~~)~~; -- <bdi> tags, lang atribute, categorization, etc; must be done after title is wrapped~~

−

~~TransTitle~~= ~~wrap_style ('trans-quoted-title', TransTitle );~~

−

~~elseif 'report' == config.CitationClass then -- no styling for cite report~~

−

~~Title~~ = ~~script_concatenate (Title, ScriptTitle); -- <bdi> tags, lang atribute, categorization, etc; must be done after title is wrapped~~

−

~~TransTitle= wrap_style ('trans-quoted-title', TransTitle~~ )~~; -- for cite report, use this form for trans-title~~

−

~~else~~

−

~~Title = wrap_style ('italic-title', Title)~~;

−

~~Title = script_concatenate (Title, ScriptTitle); -- <bdi> tags, lang atribute, categorization, etc; must be done after title is wrapped~~

−

~~TransTitle = wrap_style ('trans-italic-title', TransTitle);~~

−

~~end~~

−

~~TransError = "";~~

+

local function place_check (param_val)

−

~~if is_set~~(~~TransTitle~~) ~~then~~

+

if not utilities.is_set (param_val) then -- parameter empty or omitted

−

if is_set(~~Title~~) then

+

return param_val; -- return that empty state

−

~~TransTitle = " " .. TransTitle;~~

−

~~else~~

−

~~TransError = " " .. set_error( 'trans_missing_title' )~~;

−

~~end~~

end

−

~~Title = Title~~ .. ~~TransTitle~~;

+

if mw.ustring.find (param_val, '%d') then -- not empty, are there digits in the parameter value

+

utilities.set_message ('maint_location'); -- yep, add maint cat

+

end

−

~~if is_set(Title) then~~

+

return param_val; -- and done

−

~~if not is_set(TitleLink) and is_set(URL) then~~

+

end

−

~~Title~~ = ~~external_link~~( ~~URL, Title~~ ) ~~.. TransError .. Format~~;

+

−

~~URL = "";~~

+

−

~~Format = ""~~;

+

--[[------------------------------------------------------------------------

−

else

+

−

~~Title = Title .. TransError;~~

+

compares |title= to 'Archived copy' (placeholder added by bots that can't find proper title); if matches, return true; nil else

−

~~end~~

−

~~end~~

−

~~if is_set(Place) then~~

+

]]

−

~~Place = " " .. wrap_msg ('written', Place, use_lowercase) .. sepc .. " ";~~

−

~~end~~

−

if ~~is_set~~ (~~Conference~~) then

+

local function is_archived_copy (title)

−

if ~~is_set~~ (~~ConferenceURL~~) then

+

title = mw.ustring.lower(title); -- switch title to lower case

−

~~Conference = external_link( ConferenceURL, Conference )~~;

+

if title:find (cfg.special_case_translation.archived_copy.en) then -- if title is 'Archived copy'

+

return true;

+

elseif cfg.special_case_translation.archived_copy['local'] then

+

if mw.ustring.find (title, cfg.special_case_translation.archived_copy['local']) then -- mw.ustring() because might not be Latin script

+

return true;

end

−

~~Conference = sepc .. " " .. Conference .. ConferenceFormat;~~

−

~~elseif is_set(ConferenceURL) then~~

−

~~Conference = sepc .. " " .. external_link( ConferenceURL, nil, ConferenceURLorigin );~~

end

+

end

−

~~if not is_set(Position) then~~

+

−

local ~~Minutes = A[~~'~~Minutes~~'];

+

--[[--------------------------< D I S P L A Y _ N A M E S _ S E L E C T >--------------------------------------

−

~~if is_set~~(~~Minutes~~) ~~then~~

+

−

~~Position~~ = ~~" " .. Minutes .. " " .. cfg.messages['minutes'];~~

+

for any of the |display-authors=, |display-editors=, etc parameters, select either the local or global setting.

−

~~else~~

+

When both are present, look at <local_display_names> value. When the value is some sort of 'et al.'string,

−

local ~~Time~~ = ~~A['Time'~~];

+

special handling is required.

−

if is_set(~~Time~~) then

+

−

~~local TimeCaption~~ = A['~~TimeCaption~~']

+

When {{cs1 config}} has |display-<namelist>= AND this template has |display-<namelist>=etal AND:

−

~~if not is_set~~(~~TimeCaption~~) ~~then~~

+

the number of names specified by <number_of_names> is:

−

~~TimeCaption~~ = ~~cfg.messages['event']~~;

+

greater than the number specified in the global |display-<namelist>= parameter (<global_display_names>)

−

if ~~sepc ~= '.'~~ then

+

use global |display-<namelist>= parameter value

−

~~TimeCaption = TimeCaption:lower~~();

+

set overridden maint category

−

~~end~~

+

less than or equal to the number specified in the global |display-<namelist>= parameter

−

~~end~~

+

use local |display-<namelist>= parameter value

−

~~Position = " " .. TimeCaption .. " " .. Time~~;

+

The purpose of this function is to prevent categorizing a template that has fewer names than the global setting

+

to keep the etal annotation specified by <local_display_names>.

+

]]

+

local function display_names_select (global_display_names, local_display_names, param_name, number_of_names, test)

+

if global_display_names and utilities.is_set (local_display_names) then -- when both

+

if 'etal' == local_display_names:lower():gsub("[ '%.]", '') then -- the :gsub() portion makes 'etal' from a variety of 'et al.' spellings and stylings

+

number_of_names = tonumber (number_of_names); -- convert these to numbers for comparison

+

local global_display_names_num = tonumber (global_display_names); -- <global_display_names> not set when parameter value is not digits

+

if number_of_names > global_display_names_num then -- template has more names than global config allows to be displayed?

+

utilities.set_message ('maint_overridden_setting'); -- set a maint message because global is overriding local |display-<namelist>=etal

+

return global_display_names, 'cs1 config'; -- return global with spoof parameter name (for get_display_names())

+

else

+

return local_display_names, param_name; -- return local because fewer names so let <local_display_names> control

end

−

~~else~~

+

-- here when <global_display_names> and <local_display_names> both numbers; <global_display_names> controls

−

~~Position = " "~~ .~~. Position~~;

+

utilities.set_message ('maint_overridden_setting'); -- set a maint message

−

~~At =~~ '';

+

return global_display_names, 'cs1 config'; -- return global with spoof parameter name (for get_display_names())

end

−

+

-- here when only one of <global_display_names> or <local_display_names> set

−

if ~~not is_set(Page)~~ then

+

if global_display_names then

−

~~if is_set~~(~~Pages) then~~

+

return global_display_names, 'cs1 config'; -- return global with spoof parameter name (for get_display_names())

−

~~if is_set(Periodical) and~~

−

~~not in_array~~(~~config.CitationClass, {"encyclopaedia","web","book","news","podcast"}~~) ~~then~~

−

~~Pages = ": " .. Pages;~~

−

~~elseif tonumber(Pages~~) ~~~= nil then~~

−

~~Pages = sepc .." " .. PPrefix .. Pages;~~

−

~~else~~

−

~~Pages = sepc .." " .. PPPrefix .. Pages;~~

−

~~end~~

−

~~end~~

else

−

~~if is_set(Periodical) and~~

+

return local_display_names, param_name; -- return local

−

~~not in_array(config.CitationClass~~, ~~{"encyclopaedia","web","book","news","podcast"}) then~~

−

~~Page = ": " .. Page;~~

−

~~else~~

−

~~Page = sepc .." " .. PPrefix .. Page~~;

−

~~end~~

end

+

end

−

~~if 'map' == config.CitationClass then -- cite map oddity done after COinS call (and with other in-source locators)~~

−

~~if is_set (Sheet) or is_set (Sheets) then~~

−

~~local err_msg1 = 'sheet=, |sheets'; -- default error message in case any of page pages or at are set~~

−

~~local err_msg2;~~

−

~~if is_set (Page) or is_set (Pages) or is_set (At) then -- are any set?~~

−

~~err_msg2 = 'page=, |pages=, |at'; -- a generic error message~~

−

~~Page = ''; Pages = ''; At = '';~~

−

~~elseif is_set (Sheet) and is_set (Sheets) then -- if both are set make error message~~

−

~~err_msg1 = 'sheet';~~

−

~~err_msg2 = 'sheets';~~

−

~~end~~

−

~~if is_set (err_msg2) then~~

−

~~table.insert( z.message_tail, { set_error( 'redundant_parameters', {wrap_style ('parameter', err_msg1) .. ' and ' .. wrap_style ('parameter', err_msg2)}, true ) } ); -- add error message~~

−

~~end~~

−

~~if not is_set (Sheet) then -- do sheet static text and formatting; Sheet has priority over Sheets if both provided~~

−

~~if is_set (Sheets) then~~

−

~~if is_set (Periodical) then~~

−

~~Sheet = ": Sheets " .. Sheets; -- because Sheet has priority, no need to support both later on~~

−

~~else~~

−

~~Sheet = sepc .. " Sheets " .. Sheets;~~

−

~~end~~

−

~~end~~

−

~~else~~

−

~~if is_set (Periodical) then~~

−

~~Sheet = ": Sheet " .. Sheet;~~

−

~~else~~

−

~~Sheet = sepc .. " Sheet " .. Sheet;~~

−

~~end~~

−

~~end~~

−

~~end~~

−

~~end~~

−

~~At = is_set(At) and (sepc .. " " .. At) or "";~~

+

--[[--------------------------< C I T A T I O N 0 >------------------------------------------------------------

−

~~Position = is_set(Position) and (sepc .. " " .. Position) or "";~~

−

~~if config.CitationClass == 'map' then~~

−

~~local Section = A~~[~~'Section'];~~

−

~~local Sections = A~~[~~'Sections'];~~

−

~~local Inset =~~ A~~['Inset'];~~

−

~~if is_set( Inset ) then~~

−

~~Inset = sepc .. " " .. wrap_msg ('inset', Inset, use_lowercase);~~

−

~~end~~

−

~~if is_set( Sections ) then~~

−

~~Section = sepc .. " " .. wrap_msg ('sections', Sections, use_lowercase);~~

−

~~elseif is_set( Section ) then~~

−

~~Section = sepc .. " " .. wrap_msg ('section', Section, use_lowercase);~~

−

~~end~~

−

~~At = At .. Inset .. Section;~~

−

~~end~~

−

~~if is_set (Language) then~~

+

This is the main function doing the majority of the citation formatting.

−

~~Language = language_parameter (Language, this_page~~.~~namespace); -- format, categories (article namespace only), name from ISO639-1, etc~~

−

~~else~~

−

~~Language=""; -- language not specified so make sure this is an empty string;~~

−

~~end~~

−

~~Others = is_set(Others) and (sepc .. " " .. Others) or "";~~

+

]]

−

~~TitleNote = is_set~~(~~TitleNote) and (sepc .. " " .. TitleNote~~) ~~or "";~~

+

local function citation0( config, args )

−

~~Edition = is_set(Edition) and (" " .. wrap_msg ('edition', Edition)) or "";~~

+

--[[

−

~~Issue = is_set(Issue) and (" (" .. Issue .. ")") or "";~~

+

Load Input Parameters

−

~~Series = is_set(Series) and (sepc .. " " .~~. ~~Series) or "";~~

+

The argument_wrapper facilitates the mapping of multiple aliases to single internal variable.

−

~~OrigYear = is_set(OrigYear) and (" [" .. OrigYear .. "~~]~~") or "";~~

+

]]

−

~~Agency~~ = ~~is_set(Agency) and~~ (~~sepc .. " " .. Agency~~) ~~or ""~~;

+

local A = argument_wrapper ( args );

+

local i

−

~~if is_set(Volume) then~~

+

-- Pick out the relevant fields from the arguments. Different citation templates

−

if ~~( mw~~.~~ustring.len(Volume) > 4 )~~

+

-- define different field names for the same underlying things.

−

~~then Volume~~ = ~~sepc~~ ..~~" " .. Volume~~;

+

−

else ~~Volume~~ = ~~" " .. hyphen_to_dash~~(~~Volume~~) .~~. ""~~;

+

local author_etal;

+

local a = {}; -- authors list from |lastn= / |firstn= pairs or |vauthors=

+

local Authors;

+

local NameListStyle;

+

if cfg.global_cs1_config_t['NameListStyle'] then -- global setting in {{cs1 config}} overrides local |name-list-style= parameter value; nil when empty or assigned value invalid

+

NameListStyle = is_valid_parameter_value (cfg.global_cs1_config_t['NameListStyle'], 'cs1 config: name-list-style', cfg.keywords_lists['name-list-style'], ''); -- error messaging 'param' here is a hoax

+

else

+

NameListStyle = is_valid_parameter_value (A['NameListStyle'], A:ORIGIN('NameListStyle'), cfg.keywords_lists['name-list-style'], '');

end

−

~~end~~

−

~~------------------------------------ totally unrelated data~~

+

if cfg.global_cs1_config_t['NameListStyle'] and utilities.is_set (A['NameListStyle']) then -- when template has |name-list-style=<something> which global setting has overridden

−

if is_set(~~Via~~) then

+

utilities.set_message ('maint_overridden_setting'); -- set a maint message

−

~~Via = " " .~~. ~~wrap_msg~~ ('~~via~~'~~, Via~~);

+

end

−

end

−

--[[

+

local Collaboration = A['Collaboration'];

−

~~Subscription implies paywall~~; ~~Registration does not. If both are used in a citation, the subscription required link~~

−

~~note is displayed. There are no error messages for this condition.~~

−

]]

+

do -- to limit scope of selected

−

~~if in_array~~(~~SubscriptionRequired:lower(), {~~'~~yes~~', '~~true~~', 'y'}) then

+

local selected = select_author_editor_source (A['Vauthors'], A['Authors'], args, 'AuthorList');

−

~~SubscriptionRequired~~ = ~~sepc .. " " .. cfg.messages[~~'~~subscription~~']; -- ~~subscription required message~~

+

if 1 == selected then

−

elseif ~~in_array(RegistrationRequired:lower(), {~~'~~yes~~', '~~true~~', 'y'}) then

+

−

~~SubscriptionRequired~~ = ~~sepc .. " " .. cfg.messages~~['~~registration~~']; -- ~~registration required message~~

+

elseif 2 == selected then

−

~~else~~

+

NameListStyle = 'vanc'; -- override whatever |name-list-style= might be

−

~~SubscriptionRequired~~ = ''; -- ~~either or both might be set to something other than yes true y~~

+

a, author_etal = parse_vauthors_veditors (args, A['Vauthors'], 'AuthorList'); -- fetch author list from |vauthors=, |author-linkn=, and |author-maskn=

+

elseif 3 == selected then

+

+

end

+

if utilities.is_set (Collaboration) then

+

author_etal = true; -- so that |display-authors=etal not required

+

end

−

~~if is_set(AccessDate) then~~

+

local editor_etal;

−

local ~~retrv_text~~ = ~~" " .. cfg.messages['retrieved']~~

+

local e = {}; -- editors list from |editor-lastn= / |editor-firstn= pairs or |veditors=

−

~~AccessDate~~ = ~~nowrap_date~~ (~~AccessDate~~); -- ~~wrap in nowrap span if date in appropriate format~~

+

do -- to limit scope of selected

−

if ~~(sepc ~~~= ~~".")~~ then ~~retrv_text~~ = ~~retrv_text:lower~~() ~~end~~ -- ~~if 'citation'~~, ~~lower case~~

+

local selected = select_author_editor_source (A['Veditors'], nil, args, 'EditorList'); -- support for |editors= withdrawn

−

~~AccessDate~~ = ~~substitute (retrv_text, AccessDate)~~; -- ~~add retrieved text~~

+

if 1 == selected then

−

-- ~~neither of these work; don't know why; it seems that substitute() isn't being called~~

+

−

~~AccessDate~~ = ~~substitute~~ (~~cfg~~.~~presentation[~~'~~accessdate~~'~~], {sepc, AccessDate}~~); -- ~~allow editors to hide accessdates~~

+

elseif 2 == selected then

+

NameListStyle = 'vanc'; -- override whatever |name-list-style= might be

+

e, editor_etal = parse_vauthors_veditors (args, args.veditors, 'EditorList'); -- fetch editor list from |veditors=, |editor-linkn=, and |editor-maskn=

+

end

+

local Chapter = A['Chapter']; -- done here so that we have access to |contribution= from |chapter= aliases

+

local Chapter_origin = A:ORIGIN ('Chapter');

+

local Contribution; -- because contribution is required for contributor(s)

+

if 'contribution' == Chapter_origin then

+

Contribution = Chapter; -- get the name of the contribution

+

end

+

local c = {}; -- contributors list from |contributor-lastn= / contributor-firstn= pairs

−

if ~~is_set~~(~~ID) then ID = sepc .~~." "~~.. ID; end~~

+

if utilities.in_array (config.CitationClass, {"book", "citation"}) and not utilities.is_set (A['Periodical']) then -- |contributor= and |contribution= only supported in book cites

−

if "~~thesis~~" ~~== config~~.~~CitationClass and~~ is_set(~~Docket~~) then

+

c = extract_names (args, 'ContributorList'); -- fetch contributor list from |contributorn= / |contributor-lastn=, -firstn=, -linkn=, -maskn=

−

ID = ~~sepc~~ ..~~" Docket ".. Docket .. ID~~;

+

−

end

+

if 0 < #c then

−

if ~~"report"~~ == ~~config~~.~~CitationClass and is_set~~(~~Docket~~) ~~then~~ -- ~~for~~ cite ~~report when |docket= is set~~

+

if not utilities.is_set (Contribution) then -- |contributor= requires |contribution=

−

~~ID = sepc~~ .. ' ' .~~. Docket~~; -- ~~overwrite ID even if |id~~= ~~is set~~

+

utilities.set_message ('err_contributor_missing_required_param', 'contribution'); -- add missing contribution error message

+

c = {}; -- blank the contributors' table; it is used as a flag later

+

end

+

if 0 == #a then -- |contributor= requires |author=

+

utilities.set_message ('err_contributor_missing_required_param', 'author'); -- add missing author error message

+

c = {}; -- blank the contributors' table; it is used as a flag later

+

end

+

end

+

else -- if not a book cite

+

if utilities.select_one (args, cfg.aliases['ContributorList-Last'], 'err_redundant_parameters', 1 ) then -- are there contributor name list parameters?

+

utilities.set_message ('err_contributor_ignored'); -- add contributor ignored error message

+

end

+

Contribution = nil; -- unset

end

−

~~ID_list~~ = ~~build_id_list( ID_list, {DoiBroken~~ = ~~DoiBroken, ASINTLD = ASINTLD, IgnoreISBN = IgnoreISBN, Embargo=Embargo, Class = Class} )~~;

+

local Title = A['Title'];

+

local TitleLink = A['TitleLink'];

−

if ~~is_set~~(~~URL~~) ~~then~~

+

local auto_select = ''; -- default is auto

−

~~URL = " " .~~. ~~external_link~~( ~~URL~~, ~~nil~~, ~~URLorigin~~ );

+

local accept_link;

+

TitleLink, accept_link = utilities.has_accept_as_written (TitleLink, true); -- test for accept-this-as-written markup

+

if (not accept_link) and utilities.in_array (TitleLink, {'none', 'pmc', 'doi'}) then -- check for special keywords

+

auto_select = TitleLink; -- remember selection for later

+

TitleLink = ''; -- treat as if |title-link= would have been empty

end

−

~~if is_set~~(~~Quote) then~~

+

TitleLink = link_title_ok (TitleLink, A:ORIGIN ('TitleLink'), Title, 'title'); -- check for wiki-markup in |title-link= or wiki-markup in |title= when |title-link= is set

−

~~if Quote~~:~~sub~~(1,1) == '"' ~~and Quote:sub(~~-1,-1) == '"' then

+

−

~~Quote = Quote:sub(2,-2);~~

+

local Section = ''; -- {{cite map}} only; preset to empty string for concatenation if not used

−

~~end~~

+

if 'map' == config.CitationClass and 'section' == Chapter_origin then

−

~~Quote~~ = ~~sepc .." " .. wrap_style (~~'~~quoted-text~~'~~, Quote )~~; -- ~~wrap~~ in ~~<q>...</q> tags~~

+

Section = A['Chapter']; -- get |section= from |chapter= alias list; |chapter= and the other aliases not supported in {{cite map}}

−

~~PostScript~~ = ""; -- ~~CS1 does not supply terminal punctuation when~~ |~~quote~~= ~~is set~~

+

Chapter = ''; -- unset for now; will be reset later from |map= if present

end

+

local Periodical = A['Periodical'];

+

local Periodical_origin = A:ORIGIN('Periodical');

+

local ScriptPeriodical = A['ScriptPeriodical'];

+

local ScriptPeriodical_origin = A:ORIGIN('ScriptPeriodical');

+

local TransPeriodical = A['TransPeriodical'];

+

local TransPeriodical_origin = A:ORIGIN ('TransPeriodical');

−

local ~~Archived~~

+

if (utilities.in_array (config.CitationClass, {'book', 'encyclopaedia'}) and (utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical) or utilities.is_set (TransPeriodical))) then

−

if is_set(~~ArchiveURL~~) then

+

local param;

−

if not is_set(~~ArchiveDate~~) then

+

if utilities.is_set (Periodical) then -- get a parameter name from one of these periodical related meta-parameters

−

~~ArchiveDate~~ = ~~set_error(~~'~~archive_missing_date~~');

+

Periodical = ''; -- unset because not valid {{cite book}} or {{cite encyclopedia}} parameters

+

param = Periodical_origin -- get parameter name for error messaging

+

elseif utilities.is_set (TransPeriodical) then

+

TransPeriodical = ''; -- unset because not valid {{cite book}} or {{cite encyclopedia}} parameters

+

param = TransPeriodical_origin; -- get parameter name for error messaging

+

elseif utilities.is_set (ScriptPeriodical) then

+

ScriptPeriodical = ''; -- unset because not valid {{cite book}} or {{cite encyclopedia}} parameters

+

param = ScriptPeriodical_origin; -- get parameter name for error messaging

end

−

if ~~"no" == DeadURL then~~

+

−

~~local arch_text = cfg.messages['archived'];~~

+

if utilities.is_set (param) then -- if we found one

−

~~if sepc ~= "." then arch_text = arch_text:lower() end~~

+

utilities.set_message ('err_periodical_ignored', {param}); -- emit an error message

−

~~Archived = sepc .. " " .. substitute( cfg.messages['archived-not-dead'],~~

−

~~{ external_link( ArchiveURL, arch_text ) .. ArchiveFormat, ArchiveDate } );~~

−

~~if not is_set(OriginalURL) then~~

−

~~Archived = Archived .. " " .~~. ~~set_error('archive_missing_url');~~

−

~~end~~

−

~~elseif~~ is_set(~~OriginalURL~~) then

−

~~local arch_text = cfg.messages['archived~~-~~dead'];~~

−

if ~~sepc ~= "." then arch_text = arch_text:lower() end~~

−

~~Archived = sepc .. " " .~~. ~~substitute( arch_text,~~

−

~~{ external_link~~( ~~OriginalURL, cfg.messages[~~'~~original~~'~~] ) .. OriginalFormat~~, ~~ArchiveDate~~ } ); -- ~~format already styled~~

−

~~else~~

−

~~local arch_text = cfg.messages['archived-missing'];~~

−

~~if sepc ~= "." then arch_text = arch_text:lower() end~~

−

~~Archived = sepc .. " " .. substitute( arch_text,~~

−

~~{ set_error('archive_missing_url'), ArchiveDate } );~~

end

−

~~elseif is_set (ArchiveFormat) then~~

−

~~Archived = ArchiveFormat; -- if set and ArchiveURL not set ArchiveFormat has error message~~

−

~~else~~

−

~~Archived = ""~~

end

−

+

−

~~local Lay = '';~~

+

if utilities.is_set (Periodical) then

−

if is_set(~~LayURL~~) then

+

local i;

−

~~if is_set(LayDate) then LayDate~~ = " (~~" .. LayDate .. "~~)~~" end~~

+

Periodical, i = utilities.strip_apostrophe_markup (Periodical); -- strip apostrophe markup so that metadata isn't contaminated

−

if ~~is_set(LaySource)~~ then

+

if i then -- non-zero when markup was stripped so emit an error message

−

~~LaySource = " – ''" .~~. ~~safe_for_italics~~(~~LaySource) .. "~~''";

+

utilities.set_message ('err_apostrophe_markup', {Periodical_origin});

−

~~else~~

−

~~LaySource = ""~~;

end

−

~~if sepc == '.' then~~

−

~~Lay = sepc .. " " .. external_link( LayURL, cfg.messages['lay summary'] ) .. LayFormat .. LaySource .. LayDate~~

−

~~else~~

−

~~Lay = sepc .. " " .. external_link( LayURL, cfg.messages['lay summary']:lower() ) .. LayFormat .. LaySource .. LayDate~~

−

~~end~~

−

~~elseif is_set (LayFormat) then -- Test if |lay-format= is given without giving a |lay-url=~~

−

~~Lay = sepc .. LayFormat; -- if set and LayURL not set, then LayFormat has error message~~

end

−

if ~~is_set(Transcript)~~ then

+

if 'mailinglist' == config.CitationClass then -- special case for {{cite mailing list}}

−

if is_set(~~TranscriptURL~~) then

+

if utilities.is_set (Periodical) and utilities.is_set (A ['MailingList']) then -- both set emit an error TODO: make a function for this and similar?

−

~~Transcript = external_link~~( ~~TranscriptURL~~, ~~Transcript~~ );

+

utilities.set_message ('err_redundant_parameters', {utilities.wrap_style ('parameter', Periodical_origin) .. cfg.presentation['sep_list_pair'] .. utilities.wrap_style ('parameter', 'mailinglist')});

end

−

~~Transcript~~ = ~~sepc ..~~ ' ' ~~.. Transcript .. TranscriptFormat~~;

+

−

~~elseif is_set(TranscriptURL) then~~

+

Periodical = A ['MailingList']; -- error or no, set Periodical to |mailinglist= value because this template is {{cite mailing list}}

−

~~Transcript~~ = ~~external_link~~( ~~TranscriptURL, nil, TranscriptURLorigin~~ );

+

Periodical_origin = A:ORIGIN('MailingList');

end

−

~~local Publisher;~~

+

-- web and news not tested for now because of

−

if is_set(Periodical) ~~and~~

+

-- Wikipedia:Administrators%27_noticeboard#Is_there_a_semi-automated_tool_that_could_fix_these_annoying_"Cite_Web"_errors?

−

~~not in_array(~~config.CitationClass, {~~"encyclopaedia"~~,~~"web","pressrelease","podcast"~~}) then

+

if not (utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical)) then -- 'periodical' templates require periodical parameter

−

if is_set(~~PublisherName~~) then

+

-- local p = {['journal'] = 'journal', ['magazine'] = 'magazine', ['news'] = 'newspaper', ['web'] = 'website'}; -- for error message

−

if ~~is_set~~(~~PublicationPlace~~) then

+

local p = {['journal'] = 'journal', ['magazine'] = 'magazine'}; -- for error message

−

~~Publisher~~ = ~~PublicationPlace .. ": " .. PublisherName;~~

+

if p[config.CitationClass] then

−

~~else~~

+

utilities.set_message ('err_missing_periodical', {config.CitationClass, p[config.CitationClass]});

−

~~Publisher~~ = ~~PublisherName~~;

+

end

+

end

+

local Volume;

+

if 'citation' == config.CitationClass then

+

if utilities.is_set (Periodical) then

+

if not utilities.in_array (Periodical_origin, cfg.citation_no_volume_t) then -- {{citation}} does not render |volume= when these parameters are used

+

Volume = A['Volume']; -- but does for all other 'periodicals'

end

−

elseif is_set(~~PublicationPlace~~) then

+

elseif utilities.is_set (ScriptPeriodical) then

−

~~Publisher~~= ~~PublicationPlace;~~

+

if 'script-website' ~= ScriptPeriodical_origin then -- {{citation}} does not render volume for |script-website=

−

~~else~~

+

Volume = A['Volume']; -- but does for all other 'periodicals'

−

~~Publisher~~ = ~~"";~~

−

~~end~~

−

~~if is_set(PublicationDate) then~~

−

~~if is_set(Publisher) then~~

−

~~Publisher~~ = ~~Publisher .. ", " .. wrap_msg (~~'~~published~~'~~, PublicationDate);~~

−

~~else~~

−

~~Publisher = PublicationDate~~;

end

+

else

+

Volume = A['Volume']; -- and does for non-'periodical' cites

end

−

if is_set(~~Publisher~~) then

+

elseif utilities.in_array (config.CitationClass, cfg.templates_using_volume) then -- render |volume= for cs1 according to the configuration settings

−

~~Publisher~~ = " (~~" .. Publisher .. "~~)";

+

Volume = A['Volume'];

+

end

+

extra_text_in_vol_iss_check (Volume, A:ORIGIN ('Volume'), 'v');

+

local Issue;

+

if 'citation' == config.CitationClass then

+

if utilities.is_set (Periodical) and utilities.in_array (Periodical_origin, cfg.citation_issue_t) then -- {{citation}} may render |issue= when these parameters are used

+

Issue = utilities.hyphen_to_dash (A['Issue']);

end

−

~~else~~

+

elseif utilities.in_array (config.CitationClass, cfg.templates_using_issue) then -- conference & map books do not support issue; {{citation}} listed here because included in settings table

−

~~if is_set~~(~~PublicationDate~~) then

+

if not (utilities.in_array (config.CitationClass, {'conference', 'map', 'citation'}) and not (utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical))) then

−

~~PublicationDate = "~~ (" .. ~~wrap_msg (~~'~~published~~', ~~PublicationDate~~) .~~. ")";~~

+

Issue = utilities.hyphen_to_dash (A['Issue']);

−

~~end~~

−

if is_set(~~PublisherName~~) ~~then~~

−

if is_set(~~PublicationPlace~~) then

−

~~Publisher = sepc .. " " .. PublicationPlace .. ": " .. PublisherName .. PublicationDate;~~

−

~~else~~

−

~~Publisher~~ = ~~sepc~~ .~~. " " .. PublisherName .. PublicationDate;~~

−

~~end~~

−

~~elseif is_set~~(~~PublicationPlace~~) ~~then~~

−

~~Publisher= sepc .. " " .. PublicationPlace .. PublicationDate;~~

−

~~else~~

−

~~Publisher = PublicationDate~~;

end

−

~~-- Several of the above rely upon detecting this as nil, so do it last.~~

+

local ArticleNumber;

−

if is_set(Periodical) then

+

−

~~if is_set~~(~~Title~~) ~~or is_set~~(~~TitleNote~~) then

+

if utilities.in_array (config.CitationClass, {'journal', 'conference'}) or ('citation' == config.CitationClass and utilities.is_set (Periodical) and 'journal' == Periodical_origin) then

−

~~Periodical~~ = ~~sepc .~~. ~~" " .. wrap_style~~ ('~~italic-title~~'~~, Periodical~~)

+

ArticleNumber = A['ArticleNumber'];

−

~~else~~

+

end

−

~~Periodical~~ = ~~wrap_style~~ ('~~italic-title~~'~~, Periodical~~)

+

−

~~end~~

+

extra_text_in_vol_iss_check (Issue, A:ORIGIN ('Issue'), 'i');

+

local Page;

+

local Pages;

+

local At;

+

local QuotePage;

+

local QuotePages;

+

if not utilities.in_array (config.CitationClass, cfg.templates_not_using_page) then -- TODO: rewrite to emit ignored parameter error message?

+

Page = A['Page'];

+

Pages = utilities.hyphen_to_dash (A['Pages']);

+

At = A['At'];

+

QuotePage = A['QuotePage'];

+

QuotePages = utilities.hyphen_to_dash (A['QuotePages']);

end

−

--[[

+

local Edition = A['Edition'];

−

~~Handle the oddity that is cite speech. This code overrides whatever may be the value assigned to TitleNote~~ (~~through |department=~~) ~~and forces it to be " (Speech~~)~~" so that~~

+

local PublicationPlace = place_check (A['PublicationPlace'], A:ORIGIN('PublicationPlace'));

−

~~the annotation directly follows the |title~~= ~~parameter value in the citation rather than the |event~~= ~~parameter value~~ (if ~~provided~~).

+

local Place = place_check (A['Place'], A:ORIGIN('Place'));

−

]]

+

−

~~if "speech"~~ =~~= config.CitationClass then -- cite speech only~~

+

local PublisherName = A['PublisherName'];

−

~~TitleNote~~ = " (~~Speech~~)"; -- ~~annotate the citation~~

+

local PublisherName_origin = A:ORIGIN('PublisherName');

−

if ~~is_set~~ (~~Periodical~~) then -- ~~if Periodical, perhaps because of~~ an ~~included |website= or |journal= parameter~~

+

if utilities.is_set (PublisherName) and (cfg.keywords_xlate['none'] ~= PublisherName) then

−

~~if is_set~~ (~~Conference~~) ~~then -- and if |event= is set~~

+

local i = 0;

−

~~Conference = Conference .. sepc .. " "~~; ~~-- then add appropriate punctuation to the end of the Conference variable before rendering~~

+

PublisherName, i = utilities.strip_apostrophe_markup (PublisherName); -- strip apostrophe markup so that metadata isn't contaminated; publisher is never italicized

−

~~end~~

+

if i and (0 < i) then -- non-zero when markup was stripped so emit an error message

+

utilities.set_message ('err_apostrophe_markup', {PublisherName_origin});

end

+

if ('document' == config.CitationClass) and not utilities.is_set (PublisherName) then

+

utilities.set_message ('err_missing_publisher', {config.CitationClass, 'publisher'});

+

end

+

local Newsgroup = A['Newsgroup']; -- TODO: strip apostrophe markup?

+

local Newsgroup_origin = A:ORIGIN('Newsgroup');

−

~~-- Piece all bits together at last~~. ~~Here, all should be non-nil~~.

+

if 'newsgroup' == config.CitationClass then

−

-- ~~We build things this way because it is more efficient~~ in ~~LUA~~

+

if utilities.is_set (PublisherName) and (cfg.keywords_xlate['none'] ~= PublisherName) then -- general use parameter |publisher= not allowed in cite newsgroup

−

~~-- not to keep reassigning to the same string variable over and over~~.

+

utilities.set_message ('err_parameter_ignored', {PublisherName_origin});

+

end

−

~~local tcommon~~

+

PublisherName = nil; -- ensure that this parameter is unset for the time being; will be used again after COinS

−

~~if in_array(config.CitationClass, {"journal","citation"}) and is_set(Periodical) then~~

+

end

−

~~if is_set(Others) then Others = Others .. sepc .. " "~~ end

+

−

~~tcommon = safe_join( {Others, Title, TitleNote, Conference, Periodical, Format, TitleType, Series,~~

+

local URL = A['URL']; -- TODO: better way to do this for URL, ChapterURL, and MapURL?

−

~~Language, Edition, Publisher, Agency, Volume, Issue}, sepc );~~

+

local UrlAccess = is_valid_parameter_value (A['UrlAccess'], A:ORIGIN('UrlAccess'), cfg.keywords_lists['url-access'], nil);

−

+

−

~~elseif~~ '~~map~~' ~~== config.CitationClass then~~ -- ~~special cases~~ for ~~cite map~~

+

if not utilities.is_set (URL) and utilities.is_set (UrlAccess) then

−

~~if is_set (Chapter) then -- map in a book; TitleType is part of Chapter~~

+

UrlAccess = nil;

−

~~tcommon~~ = ~~safe_join~~( ~~{Title, Format, Edition~~, ~~Scale, Series, Language, Cartography, Others, Publisher, Volume}, sepc );~~

+

utilities.set_message ('err_param_access_requires_param', 'url');

−

~~elseif is_set~~ (~~Periodical~~) ~~then~~ -~~- map in a periodical~~

−

~~tcommon = safe_join( {Title, TitleType, Format, Periodical, Scale, Series, Language, Cartography, Others, Publisher, Volume, Issue}~~, ~~sepc~~ );

−

~~else -- a sheet or stand-alone map~~

−

~~tcommon = safe_join~~( ~~{Title, TitleType, Format, Edition, Scale, Series, Language, Cartography, Others, Publisher}, sepc~~ );

−

~~end~~

−

~~elseif 'episode' == config~~.~~CitationClass~~ then ~~-- special case for cite episode~~

−

~~tcommon~~ = ~~safe_join( {Title, TitleNote, TitleType, Series, Transcript, Language, Edition, Publisher}, sepc )~~;

−

~~else -- all other CS1 templates~~

−

~~tcommon = safe_join~~( ~~{Title~~, ~~TitleNote, Conference, Periodical, Format, TitleType, Series, Language,~~

−

~~Volume, Issue, Others, Edition, Publisher, Agency}, sepc~~ );

end

−

if ~~#ID_list > 0~~ then

+

local ChapterURL = A['ChapterURL'];

−

~~ID_list~~ = ~~safe_join~~( { ~~sepc .. " "~~, ~~table.concat~~( ~~ID_list~~, ~~sepc .. " "~~ ), ~~ID }~~, ~~sepc~~ );

+

local ChapterUrlAccess = is_valid_parameter_value (A['ChapterUrlAccess'], A:ORIGIN('ChapterUrlAccess'), cfg.keywords_lists['url-access'], nil);

−

~~else~~

+

if not utilities.is_set (ChapterURL) and utilities.is_set (ChapterUrlAccess) then

−

~~ID_list~~ = ID;

+

ChapterUrlAccess = nil;

+

utilities.set_message ('err_param_access_requires_param', {A:ORIGIN('ChapterUrlAccess'):gsub ('%-access', '')});

+

end

+

local MapUrlAccess = is_valid_parameter_value (A['MapUrlAccess'], A:ORIGIN('MapUrlAccess'), cfg.keywords_lists['url-access'], nil);

+

if not utilities.is_set (A['MapURL']) and utilities.is_set (MapUrlAccess) then

+

MapUrlAccess = nil;

+

utilities.set_message ('err_param_access_requires_param', {'map-url'});

end

−

+

−

local ~~idcommon~~ = ~~safe_join~~( ~~{ ID_list, URL, Archived, AccessDate, Via, SubscriptionRequired, Lay, Quote }, sepc~~ );

+

local this_page = mw.title.getCurrentTitle(); -- also used for COinS and for language

−

local ~~text;~~

+

local no_tracking_cats = is_valid_parameter_value (A['NoTracking'], A:ORIGIN('NoTracking'), cfg.keywords_lists['yes_true_y'], nil);

−

~~local pgtext~~ = ~~Position~~ .~~. Sheet .. Page .. Pages .. At~~;

+

−

+

-- check this page to see if it is in one of the namespaces that cs1 is not supposed to add to the error categories

−

if is_set(~~Authors~~) then

+

if not utilities.is_set (no_tracking_cats) then -- ignore if we are already not going to categorize this page

−

if ~~is_set(Coauthors)~~ then

+

if cfg.uncategorized_namespaces[this_page.namespace] then -- is this page's namespace id one of the uncategorized namespace ids?

−

~~local sep~~ = ~~'; '~~;

+

no_tracking_cats = "true"; -- set no_tracking_cats

−

if ~~'vanc' == NameListFormat~~ then

+

end

−

~~sep~~ = ~~', '~~;

+

for _, v in ipairs (cfg.uncategorized_subpages) do -- cycle through page name patterns

+

if this_page.text:match (v) then -- test page name against each pattern

+

no_tracking_cats = "true"; -- set no_tracking_cats

+

break; -- bail out if one is found

end

−

~~Authors = Authors .. sep .. Coauthors;~~

−

~~end~~

−

~~if is_set(Date) then~~

−

~~Date = " ("..Date..")" .. OrigYear .. sepc .. " "~~

−

~~elseif string.sub(Authors,-1,-1) == sepc then~~

−

~~Authors = Authors .. " "~~

−

~~else~~

−

~~Authors = Authors .. sepc .. " "~~

−

~~end~~

−

~~if is_set(Editors) then~~

−

~~local in_text = " ";~~

−

~~local post_text = "";~~

−

~~if is_set(Chapter) then~~

−

~~in_text = in_text .. cfg.messages['in'] .. " "~~

−

~~else~~

−

~~if EditorCount <= 1 then~~

−

~~post_text = ", " .. cfg.messages['editor'];~~

−

~~else~~

−

~~post_text = ", " .. cfg.messages['editors'];~~

−

~~end~~

−

~~end~~

−

~~if (sepc ~= '.') then in_text = in_text:lower() end~~

−

~~Editors = in_text .. Editors .. post_text;~~

−

~~if (string.sub(Editors,-1,-1) == sepc) or (string.sub(Editors,-3,-1) == sepc .. ']]') then -- if last editor name ends with sepc char~~

−

~~Editors = Editors .. " "; -- don't add another~~

−

~~else~~

−

~~Editors = Editors .. sepc .. " " -- otherwise terninate the editor list~~

−

~~end~~

−

~~end~~

−

~~text = safe_join( {Authors, Date, Chapter, Place, Editors, tcommon }, sepc );~~

−

~~text = safe_join( {text, pgtext, idcommon}, sepc );~~

−

~~elseif is_set(Editors) then~~

−

~~if is_set(Date) then~~

−

~~if EditorCount <= 1 then~~

−

~~Editors = Editors .. ", " .. cfg.messages['editor'];~~

−

~~else~~

−

~~Editors = Editors .. ", " .. cfg.messages['editors'];~~

−

~~end~~

−

~~Date = " (" .. Date ..")" .. OrigYear .. sepc .. " "~~

−

~~else~~

−

~~if EditorCount <= 1 then~~

−

~~Editors = Editors .. " (" .. cfg.messages['editor'] .. ")" .. sepc .. " "~~

−

~~else~~

−

~~Editors = Editors .. " (" .. cfg.messages['editors'] .. ")" .. sepc .. " "~~

−

~~end~~

−

~~end~~

−

~~text = safe_join( {Editors, Date, Chapter, Place, tcommon}, sepc );~~

−

~~text = safe_join( {text, pgtext, idcommon}, sepc );~~

−

~~else~~

−

~~if is_set(Date) then~~

−

~~if ( string.sub(tcommon,-1,-1) ~= sepc )~~

−

~~then Date = sepc .." " .. Date .. OrigYear~~

−

~~else Date = " " .. Date .. OrigYear~~

−

~~end~~

−

~~end~~

−

~~if config.CitationClass=="journal" and is_set(Periodical) then~~

−

~~text = safe_join( {Chapter, Place, tcommon}, sepc );~~

−

~~text = safe_join( {text, pgtext, Date, idcommon}, sepc );~~

−

~~else~~

−

~~text = safe_join( {Chapter, Place, tcommon, Date}, sepc );~~

−

~~text = safe_join( {text, pgtext, idcommon}, sepc );~~

end

+

-- check for extra |page=, |pages= or |at= parameters. (also sheet and sheets while we're at it)

+

utilities.select_one (args, {'page', 'p', 'pp', 'pages', 'at', 'sheet', 'sheets'}, 'err_redundant_parameters'); -- this is a dummy call simply to get the error message and category

+

local coins_pages;

−

~~if is_set(PostScript) and PostScript ~= sepc then~~

+

Page, Pages, At, coins_pages = insource_loc_get (Page, A:ORIGIN('Page'), Pages, A:ORIGIN('Pages'), At);

−

~~text = safe_join( {text~~, ~~sepc}~~, ~~sepc ); --Deals with italics~~, ~~spaces~~, ~~etc.~~

−

~~text = text~~:~~sub~~(1,~~-sepc~~:~~len~~()~~-1);~~

−

~~end~~

−

~~text = safe_join( {text, PostScript}~~, ~~sepc~~ );

−

~~-- Now enclose the whole thing in a element~~

+

local NoPP = is_valid_parameter_value (A['NoPP'], A:ORIGIN('NoPP'), cfg.keywords_lists['yes_true_y'], nil);

−

local ~~options~~ = ~~{};~~

+

−

+

if utilities.is_set (PublicationPlace) and utilities.is_set (Place) then -- both |publication-place= and |place= (|location=) allowed if different

−

~~if is_set~~(~~config~~.~~CitationClass~~) ~~and config.CitationClass ~= "citation" then~~

+

utilities.add_prop_cat ('location-test'); -- add property cat to evaluate how often PublicationPlace and Place are used together

−

~~options.class = "citation " .. config.CitationClass~~;

+

if PublicationPlace == Place then

−

~~else~~

+

Place = ''; -- unset; don't need both if they are the same

−

~~options.class = "citation";~~

−

~~end~~

−

if is_set(~~Ref~~) and ~~Ref:lower~~() ~= ~~"none" then~~

−

~~local id~~ = ~~Ref~~

−

if ( ~~"harv" =~~= ~~Ref~~ ) ~~then~~

−

~~local names = {} --table of last names & year~~

−

if ~~#a > 0 then~~

−

~~for i,v in ipairs(a) do~~

−

~~names[i] = v~~.~~last~~

−

~~if i == 4 then break end~~

−

~~end~~

−

~~elseif #e > 0 then~~

−

~~for i,v in ipairs~~(e) do

−

~~names[i] = v.last~~

−

if i == 4 then ~~break end~~

−

~~end~~

−

~~end~~

−

~~names[ #names + 1 ]~~ = ~~first_set(Year, anchor_year)~~; -- ~~Year first for legacy citations and for YMD dates that require disambiguation~~

−

~~id = anchor_id(names)~~

end

−

~~options.id~~ = id;

+

elseif not utilities.is_set (PublicationPlace) and utilities.is_set (Place) then -- when only |place= (|location=) is set ...

+

PublicationPlace = Place; -- promote |place= (|location=) to |publication-place

end

+

if PublicationPlace == Place then Place = ''; end -- don't need both if they are the same

+

local URL_origin = A:ORIGIN('URL'); -- get name of parameter that holds URL

+

local ChapterURL_origin = A:ORIGIN('ChapterURL'); -- get name of parameter that holds ChapterURL

+

local ScriptChapter = A['ScriptChapter'];

+

local ScriptChapter_origin = A:ORIGIN ('ScriptChapter');

+

local Format = A['Format'];

+

local ChapterFormat = A['ChapterFormat'];

+

local TransChapter = A['TransChapter'];

+

local TransChapter_origin = A:ORIGIN ('TransChapter');

+

local TransTitle = A['TransTitle'];

+

local ScriptTitle = A['ScriptTitle'];

−

~~if string.len(text:gsub("<span~~[~~^>/]*>.-", "")~~:~~gsub("%b<>","")) <= 2 then~~

+

--[[

−

~~z.error_categories = {};~~

+

Parameter remapping for cite encyclopedia:

−

~~text~~ = ~~set_error('empty_citation');~~

+

When the citation has these parameters:

−

~~z.message_tail~~ = ~~{};~~

+

−

~~end~~

+

|encyclopedia= and |article= then map |encyclopedia= to |title= for rendering

−

~~if is_set(options.id)~~ then

−

~~text~~ = ~~'' .. text .. "";~~

−

~~else~~

−

~~text~~ = ~~'' .. text .. "";~~

−

~~end~~

−

~~local empty_span~~ = ~~' ';~~

+

|trans-title= maps to |trans-chapter= when |title= is re-mapped

+

|url= maps to |chapter-url= when |title= is remapped

−

~~-- Note: Using display: none on then COinS span breaks some clients.~~

+

All other combinations of |encyclopedia=, |title=, and |article= are not modified

−

~~local OCinS~~ = ~~'<span~~ title=~~"' .. OCinSoutput .. '" class~~=~~"Z3988">' .. empty_span .. '';~~

−

~~text = text .. OCinS;~~

−

~~if #z.message_tail ~= 0 then~~

+

]]

−

~~text~~ = ~~text .. " "~~;

+

−

~~for i,v in ipairs( z.message_tail ) do~~

+

local Encyclopedia = A['Encyclopedia']; -- used as a flag by this module and by ~/COinS

−

if is_set(~~v[1]~~) then

+

−

if i == #z.~~message_tail~~ then

+

if utilities.is_set (Encyclopedia) then -- emit error message when Encyclopedia set but template is other than {{cite encyclopedia}} or {{citation}}

−

~~text = text .~~. ~~error_comment~~( ~~v[1]~~, ~~v[2]~~ );

+

if 'encyclopaedia' ~= config.CitationClass and 'citation' ~= config.CitationClass then

−

~~else~~

+

utilities.set_message ('err_parameter_ignored', {A:ORIGIN ('Encyclopedia')});

−

~~text~~ = ~~text .. error_comment( v[1] .. "~~; ~~", v[2] );~~

+

Encyclopedia = nil; -- unset because not supported by this template

−

~~end~~

−

~~end~~

end

−

if ~~#z.maintenance_cats ~~~= ~~0 then~~

+

if ('encyclopaedia' == config.CitationClass) or ('citation' == config.CitationClass and utilities.is_set (Encyclopedia)) then

−

~~text~~ = ~~text .~~. ' ~~';~~

+

if utilities.is_set (Periodical) and utilities.is_set (Encyclopedia) then -- when both parameters set emit an error message; {{citation}} only; Periodical not allowed in {{cite encyclopedia}}

−

~~for _, v in ipairs~~( z.~~maintenance_cats~~ ) do -- ~~append maintenance categories~~

+

utilities.set_message ('err_periodical_ignored', {Periodical_origin});

−

~~text = text .. v .~~. ' (~~[[:Category:~~' ~~.. v ..~~'~~|link]]~~)';

end

−

~~text~~ = ~~text .. ''~~; -- ~~maintenance mesages~~ (~~realy just the names of the categories for now~~)

+

−

~~end~~

+

if utilities.is_set (Encyclopedia) then

−

+

Periodical = Encyclopedia; -- error or no, set Periodical to Encyclopedia for rendering; {{citation}} could (not legitimately) have both; use Encyclopedia

−

~~no_tracking_cats~~ = ~~no_tracking_cats~~:~~lower~~();

+

Periodical_origin = A:ORIGIN ('Encyclopedia');

−

if ~~in_array~~(~~no_tracking_cats, {"", "no", "false", "n"}~~) then

+

−

~~for _, v in ipairs~~( ~~z.error_categories~~ ) do

+

if utilities.is_set (Title) or utilities.is_set (ScriptTitle) then

−

~~text~~ = ~~text ..~~ '~~[[Category:~~' .. v .~~.']]'~~;

+

if not utilities.is_set (Chapter) then

−

end

+

−

~~for _, v in ipairs( z.maintenance_cats ) do~~ -- ~~append maintenance categories~~

+

ScriptChapter = ScriptTitle;

−

~~text~~ = ~~text ..~~ '~~[[Category:~~' ~~.. v ..~~']]';

+

ScriptChapter_origin = A:ORIGIN('ScriptTitle')

−

end

+

TransChapter = TransTitle;

−

~~for _, v in ipairs~~( z.~~properties_cats~~ ) do -- ~~append maintenance categories~~

+

ChapterURL = URL;

−

~~text~~ = ~~text .. '[[Category:' .. v ..~~']]';

+

ChapterURL_origin = URL_origin;

+

ChapterUrlAccess = UrlAccess;

+

if not utilities.is_set (ChapterURL) and utilities.is_set (TitleLink) then

+

Chapter = utilities.make_wikilink (TitleLink, Chapter);

+

end

+

Title = Periodical;

+

ChapterFormat = Format;

+

Periodical = ''; -- redundant so unset

+

TransTitle = '';

+

URL = '';

+

Format = '';

+

TitleLink = '';

+

ScriptTitle = '';

+

end

+

elseif utilities.is_set (Chapter) or utilities.is_set (ScriptChapter) then -- |title= not set

+

Title = Periodical; -- |encyclopedia= set and |article= set so map |encyclopedia= to |title= for rendering

+

Periodical = ''; -- redundant so unset

+

end

−

~~return text~~

−

~~end~~

−

-- ~~This is used by templates such as {{~~cite ~~book}} to create the actual citation text.~~

+

-- special case for cite techreport.

−

~~function z~~.~~citation(frame)~~

+

local ID = A['ID'];

−

local ~~pframe~~ = ~~frame:getParent()~~

+

if (config.CitationClass == "techreport") then -- special case for cite techreport

−

~~local validation~~;

+

if utilities.is_set (A['Number']) then -- cite techreport uses 'number', which other citations alias to 'issue'

−

+

if not utilities.is_set (ID) then -- can we use ID for the "number"?

−

if ~~nil ~~~= ~~string.find (frame:getTitle(), 'sandbox', 1, true~~) then -- ~~did the {{#invoke:}} use sandbox version?~~

+

ID = A['Number']; -- yes, use it

−

~~cfg = mw~~.~~loadData~~ ('~~Module:Citation/CS1/Configuration/sandbox~~'); -- ~~load sandbox versions of Configuration and Whitelist and ...~~

+

else -- ID has a value so emit error message

−

~~whitelist = mw~~.~~loadData~~ (~~'Module:Citation/CS1/Whitelist/sandbox'~~);

+

utilities.set_message ('err_redundant_parameters', {utilities.wrap_style ('parameter', 'id') .. cfg.presentation['sep_list_pair'] .. utilities.wrap_style ('parameter', 'number')});

−

~~validation~~ = ~~require (~~'~~Module:Citation/CS1/Date_validation/sandbox~~'); -- ~~... sandbox version of date validation code~~

+

end

−

+

end

−

else -- ~~otherwise~~

−

~~cfg = mw~~.~~loadData~~ ('~~Module:Citation/CS1/Configuration~~')~~; -- load live versions of Configuration and Whitelist and~~ ...

−

~~whitelist = mw~~.~~loadData~~ ('~~Module:Citation/CS1/Whitelist~~');

−

~~validation = require (~~'~~Module:Citation/CS1/Date_validation~~'); ~~-- ... live version of date validation code~~

end

−

~~dates~~ = ~~validation.dates~~; -- ~~imported functions~~

+

-- Account for the oddity that is {{cite conference}}, before generation of COinS data.

−

~~year_date_check~~ = ~~validation.year_date_check~~;

+

local ChapterLink -- = A['ChapterLink']; -- deprecated as a parameter but still used internally by cite episode

−

+

local Conference = A['Conference'];

−

local ~~args~~ = {};

+

local BookTitle = A['BookTitle'];

−

~~local suggestions~~ = {};

+

local TransTitle_origin = A:ORIGIN ('TransTitle');

−

~~local error_text, error_state~~;

+

if 'conference' == config.CitationClass then

−

+

if utilities.is_set (BookTitle) then

−

~~local~~ config = {};

+

Chapter = Title;

−

~~for k~~, ~~v in pairs( frame~~.~~args~~ ) do

+

Chapter_origin = 'title';

−

~~config~~[k] ~~= v~~;

+

-- ChapterLink = TitleLink; -- |chapter-link= is deprecated

−

~~args~~[k] = v;

+

ChapterURL = URL;

−

end

+

ChapterUrlAccess = UrlAccess;

+

ChapterURL_origin = URL_origin;

+

URL_origin = '';

+

ChapterFormat = Format;

+

TransChapter = TransTitle;

+

TransChapter_origin = TransTitle_origin;

+

Title = BookTitle;

+

Format = '';

+

-- TitleLink = '';

+

TransTitle = '';

+

URL = '';

+

end

+

elseif 'speech' ~= config.CitationClass then

+

Conference = ''; -- not cite conference or cite speech so make sure this is empty string

+

end

+

-- CS1/2 mode

+

local Mode;

+

if cfg.global_cs1_config_t['Mode'] then -- global setting in {{cs1 config}} overrides local |mode= parameter value; nil when empty or assigned value invalid

+

Mode = is_valid_parameter_value (cfg.global_cs1_config_t['Mode'], 'cs1 config: mode', cfg.keywords_lists['mode'], ''); -- error messaging 'param' here is a hoax

+

else

+

Mode = is_valid_parameter_value (A['Mode'], A:ORIGIN('Mode'), cfg.keywords_lists['mode'], '');

+

end

+

if cfg.global_cs1_config_t['Mode'] and utilities.is_set (A['Mode']) then -- when template has |mode=<something> which global setting has overridden

+

utilities.set_message ('maint_overridden_setting'); -- set a maint message

+

end

−

~~for k, v in pairs( pframe.args ) do~~

+

-- separator character and postscript

−

~~if v ~= '' then~~

+

local sepc, PostScript = set_style (Mode:lower(), A['PostScript'], config.CitationClass);

−

~~if not validate( k ) then~~

+

-- controls capitalization of certain static text

−

~~error_text = "";~~

+

local use_lowercase = ( sepc == ',' );

−

~~if type( k ) ~= 'string' then~~

−

-- ~~Exclude empty numbered parameters~~

−

~~if v:match("%S+") ~= nil then~~

−

~~error_text~~, ~~error_state~~ = ~~set_error~~( ~~'text_ignored', {v}, true );~~

−

~~end~~

−

~~elseif validate( k:lower() ) then~~

−

~~error_text, error_state = set_error( 'parameter_ignored_suggest', {k, k~~:lower()}, ~~true );~~

−

~~else~~

−

~~if #suggestions == 0 then~~

−

~~suggestions = mw.loadData( 'Module:Citation/CS1/Suggestions' );~~

−

~~end~~

−

~~if suggestions~~[ ~~k:lower() ] ~= nil then~~

−

~~error_text, error_state = set_error(~~ '~~parameter_ignored_suggest~~'~~, {k, suggestions[ k:lower()~~ ]~~}, true );~~

−

~~else~~

−

~~error_text, error_state = set_error( 'parameter_ignored', {k}~~, ~~true );~~

−

~~end~~

−

~~end~~

−

~~if error_text ~= '' then~~

−

~~table.insert( z~~.~~message_tail, {error_text, error_state}~~ );

−

~~end~~

−

~~end~~

−

~~args[k] = v;~~

−

~~elseif args[k] ~~~= ~~nil or~~ (k == '~~postscript~~') ~~then~~

−

~~args[k] = v~~;

−

~~end~~

−

~~end~~

−

return ~~citation0~~( config, ~~args~~)

+

-- cite map oddities

+

local Cartography = "";

+

local Scale = "";

+

local Sheet = A['Sheet'] or '';

+

local Sheets = A['Sheets'] or '';

+

if config.CitationClass == "map" then

+

if utilities.is_set (Chapter) then --TODO: make a function for this and similar?

+

utilities.set_message ('err_redundant_parameters', {utilities.wrap_style ('parameter', 'map') .. cfg.presentation['sep_list_pair'] .. utilities.wrap_style ('parameter', Chapter_origin)}); -- add error message

+

end

+

Chapter = A['Map'];

+

Chapter_origin = A:ORIGIN('Map');

+

ChapterURL = A['MapURL'];

+

ChapterURL_origin = A:ORIGIN('MapURL');

+

TransChapter = A['TransMap'];

+

ScriptChapter = A['ScriptMap']

+

ScriptChapter_origin = A:ORIGIN('ScriptMap')

+

ChapterUrlAccess = MapUrlAccess;

+

ChapterFormat = A['MapFormat'];

+

Cartography = A['Cartography'];

+

if utilities.is_set ( Cartography ) then

+

Cartography = sepc .. " " .. wrap_msg ('cartography', Cartography, use_lowercase);

+

end

+

Scale = A['Scale'];

+

if utilities.is_set ( Scale ) then

+

Scale = sepc .. " " .. Scale;

+

end

+

end

+

-- Account for the oddities that are {{cite episode}} and {{cite serial}}, before generation of COinS data.

+

local Series = A['Series'];

+

if 'episode' == config.CitationClass or 'serial' == config.CitationClass then

+

local SeriesLink = A['SeriesLink'];

+

SeriesLink = link_title_ok (SeriesLink, A:ORIGIN ('SeriesLink'), Series, 'series'); -- check for wiki-markup in |series-link= or wiki-markup in |series= when |series-link= is set

+

local Network = A['Network'];

+

local Station = A['Station'];

+

local s, n = {}, {};

+

-- do common parameters first

+

if utilities.is_set (Network) then table.insert(n, Network); end

+

if utilities.is_set (Station) then table.insert(n, Station); end

+

ID = table.concat(n, sepc .. ' ');

+

if 'episode' == config.CitationClass then -- handle the oddities that are strictly {{cite episode}}

+

local Season = A['Season'];

+

local SeriesNumber = A['SeriesNumber'];

+

if utilities.is_set (Season) and utilities.is_set (SeriesNumber) then -- these are mutually exclusive so if both are set TODO: make a function for this and similar?

+

utilities.set_message ('err_redundant_parameters', {utilities.wrap_style ('parameter', 'season') .. cfg.presentation['sep_list_pair'] .. utilities.wrap_style ('parameter', 'seriesno')}); -- add error message

+

SeriesNumber = ''; -- unset; prefer |season= over |seriesno=

+

end

+

-- assemble a table of parts concatenated later into Series

+

if utilities.is_set (Season) then table.insert(s, wrap_msg ('season', Season, use_lowercase)); end

+

if utilities.is_set (SeriesNumber) then table.insert(s, wrap_msg ('seriesnum', SeriesNumber, use_lowercase)); end

+

if utilities.is_set (Issue) then table.insert(s, wrap_msg ('episode', Issue, use_lowercase)); end

+

Issue = ''; -- unset because this is not a unique parameter

+

Chapter = Title; -- promote title parameters to chapter

+

ScriptChapter = ScriptTitle;

+

ScriptChapter_origin = A:ORIGIN('ScriptTitle');

+

ChapterLink = TitleLink; -- alias |episode-link=

+

TransChapter = TransTitle;

+

ChapterURL = URL;

+

ChapterUrlAccess = UrlAccess;

+

ChapterURL_origin = URL_origin;

+

ChapterFormat = Format;

+

Title = Series; -- promote series to title

+

TitleLink = SeriesLink;

+

Series = table.concat(s, sepc .. ' '); -- this is concatenation of season, seriesno, episode number

+

if utilities.is_set (ChapterLink) and not utilities.is_set (ChapterURL) then -- link but not URL

+

Chapter = utilities.make_wikilink (ChapterLink, Chapter);

+

elseif utilities.is_set (ChapterLink) and utilities.is_set (ChapterURL) then -- if both are set, URL links episode;

+

Series = utilities.make_wikilink (ChapterLink, Series);

+

end

+

URL = ''; -- unset

+

TransTitle = '';

+

ScriptTitle = '';

+

Format = '';

+

else -- now oddities that are cite serial

+

Issue = ''; -- unset because this parameter no longer supported by the citation/core version of cite serial

+

Chapter = A['Episode']; -- TODO: make |episode= available to cite episode someday?

+

if utilities.is_set (Series) and utilities.is_set (SeriesLink) then

+

Series = utilities.make_wikilink (SeriesLink, Series);

+

end

+

Series = utilities.wrap_style ('italic-title', Series); -- series is italicized

+

end

+

end

+

-- end of {{cite episode}} stuff

+

-- handle type parameter for those CS1 citations that have default values

+

local TitleType = A['TitleType'];

+

local Degree = A['Degree'];

+

if utilities.in_array (config.CitationClass, {'AV-media-notes', 'document', 'interview', 'mailinglist', 'map', 'podcast', 'pressrelease', 'report', 'speech', 'techreport', 'thesis'}) then

+

TitleType = set_titletype (config.CitationClass, TitleType);

+

if utilities.is_set (Degree) and "Thesis" == TitleType then -- special case for cite thesis

+

TitleType = Degree .. ' ' .. cfg.title_types ['thesis']:lower();

+

end

+

end

+

if utilities.is_set (TitleType) then -- if type parameter is specified

+

TitleType = utilities.substitute ( cfg.messages['type'], TitleType); -- display it in parentheses

+

-- TODO: Hack on TitleType to fix bunched parentheses problem

+

end

+

-- legacy: promote PublicationDate to Date if neither Date nor Year are set.

+

local Date = A['Date'];

+

local Date_origin; -- to hold the name of parameter promoted to Date; required for date error messaging

+

local PublicationDate = A['PublicationDate'];

+

local Year = A['Year'];

+

if not utilities.is_set (Date) then

+

Date = Year; -- promote Year to Date

+

Year = nil; -- make nil so Year as empty string isn't used for CITEREF

+

if not utilities.is_set (Date) and utilities.is_set (PublicationDate) then -- use PublicationDate when |date= and |year= are not set

+

Date = PublicationDate; -- promote PublicationDate to Date

+

PublicationDate = ''; -- unset, no longer needed

+

Date_origin = A:ORIGIN('PublicationDate'); -- save the name of the promoted parameter

+

else

+

Date_origin = A:ORIGIN('Year'); -- save the name of the promoted parameter

+

end

+

else

+

Date_origin = A:ORIGIN('Date'); -- not a promotion; name required for error messaging

+

end

+

if PublicationDate == Date then PublicationDate = ''; end -- if PublicationDate is same as Date, don't display in rendered citation

+

--[[

+

Go test all of the date-holding parameters for valid MOS:DATE format and make sure that dates are real dates. This must be done before we do COinS because here is where

+

we get the date used in the metadata.

+

Date validation supporting code is in Module:Citation/CS1/Date_validation

+

]]

+

local DF = is_valid_parameter_value (A['DF'], A:ORIGIN('DF'), cfg.keywords_lists['df'], '');

+

if not utilities.is_set (DF) then

+

DF = cfg.global_df; -- local |df= if present overrides global df set by {{use xxx date}} template

+

end

+

local ArchiveURL;

+

local ArchiveDate;

+

local ArchiveFormat = A['ArchiveFormat'];

+

local archive_url_timestamp; -- timestamp from wayback machine url

+

ArchiveURL, ArchiveDate, archive_url_timestamp = archive_url_check (A['ArchiveURL'], A['ArchiveDate'])

+

ArchiveFormat = style_format (ArchiveFormat, ArchiveURL, 'archive-format', 'archive-url');

+

ArchiveURL, ArchiveDate = is_unique_archive_url (ArchiveURL, URL, ChapterURL, A:ORIGIN('ArchiveURL'), ArchiveDate); -- add error message when URL or ChapterURL == ArchiveURL

+

local AccessDate = A['AccessDate'];

+

local COinS_date = {}; -- holds date info extracted from |date= for the COinS metadata by Module:Date verification

+

local DoiBroken = A['DoiBroken'];

+

local Embargo = A['Embargo'];

+

local anchor_year; -- used in the CITEREF identifier

+

do -- create defined block to contain local variables error_message, date_parameters_list, mismatch

+

local error_message = '';

+

-- AirDate has been promoted to Date so not necessary to check it

+

local date_parameters_list = {

+

['access-date'] = {val = AccessDate, name = A:ORIGIN ('AccessDate')},

+

['archive-date'] = {val = ArchiveDate, name = A:ORIGIN ('ArchiveDate')},

+

['date'] = {val = Date, name = Date_origin},

+

['doi-broken-date'] = {val = DoiBroken, name = A:ORIGIN ('DoiBroken')},

+

['pmc-embargo-date'] = {val = Embargo, name = A:ORIGIN ('Embargo')},

+

['publication-date'] = {val = PublicationDate, name = A:ORIGIN ('PublicationDate')},

+

['year'] = {val = Year, name = A:ORIGIN ('Year')},

+

};

+

local error_list = {};

+

anchor_year, Embargo = validation.dates(date_parameters_list, COinS_date, error_list);

+

-- start temporary Julian / Gregorian calendar uncertainty categorization

+

if COinS_date.inter_cal_cat then

+

utilities.add_prop_cat ('jul-greg-uncertainty');

+

end

+

-- end temporary Julian / Gregorian calendar uncertainty categorization

+

if utilities.is_set (Year) and utilities.is_set (Date) then -- both |date= and |year= not normally needed;

+

validation.year_date_check (Year, A:ORIGIN ('Year'), Date, A:ORIGIN ('Date'), error_list);

+

end

+

if 0 == #error_list then -- error free dates only; 0 when error_list is empty

+

local modified = false; -- flag

+

if utilities.is_set (DF) then -- if we need to reformat dates

+

modified = validation.reformat_dates (date_parameters_list, DF); -- reformat to DF format, use long month names if appropriate

+

end

+

if true == validation.date_hyphen_to_dash (date_parameters_list) then -- convert hyphens to dashes where appropriate

+

modified = true;

+

utilities.set_message ('maint_date_format'); -- hyphens were converted so add maint category

+

end

+

-- for those wikis that can and want to have English date names translated to the local language; not supported at en.wiki

+

if cfg.date_name_auto_xlate_enable and validation.date_name_xlate (date_parameters_list, cfg.date_digit_auto_xlate_enable ) then

+

utilities.set_message ('maint_date_auto_xlated'); -- add maint cat

+

modified = true;

+

end

+

if modified then -- if the date_parameters_list values were modified

+

AccessDate = date_parameters_list['access-date'].val; -- overwrite date holding parameters with modified values

+

ArchiveDate = date_parameters_list['archive-date'].val;

+

Date = date_parameters_list['date'].val;

+

DoiBroken = date_parameters_list['doi-broken-date'].val;

+

PublicationDate = date_parameters_list['publication-date'].val;

+

end

+

if archive_url_timestamp and utilities.is_set (ArchiveDate) then

+

validation.archive_date_check (ArchiveDate, archive_url_timestamp, DF); -- does YYYYMMDD in archive_url_timestamp match date in ArchiveDate

+

end

+

else

+

utilities.set_message ('err_bad_date', {utilities.make_sep_list (#error_list, error_list)}); -- add this error message

+

end

+

end -- end of do

+

if utilities.in_array (config.CitationClass, {'book', 'encyclopaedia'}) or -- {{cite book}}, {{cite encyclopedia}}; TODO: {{cite conference}} and others?

+

('citation' == config.CitationClass and utilities.is_set (Encyclopedia)) or -- {{citation}} as an encylopedia citation

+

('citation' == config.CitationClass and not utilities.is_set (Periodical)) then -- {{citation}} as a book citation

+

if utilities.is_set (PublicationPlace) then

+

if not utilities.is_set (PublisherName) then

+

local date = COinS_date.rftdate and tonumber (COinS_date.rftdate:match ('%d%d%d%d')); -- get year portion of COinS date (because in Arabic numerals); convert string to number

+

if date and (1850 <= date) then -- location has no publisher; if date is 1850 or later

+

utilities.set_message ('maint_location_no_publisher'); -- add maint cat

+

end

+

else -- PublisherName has a value

+

if cfg.keywords_xlate['none'] == PublisherName then -- if that value is 'none' (only for book and encyclopedia citations)

+

PublisherName = ''; -- unset

+

end

+

end

+

end

+

end

+

local ID_list = {}; -- sequence table of rendered identifiers

+

local ID_list_coins = {}; -- table of identifiers and their values from args; key is same as cfg.id_handlers's key

+

local Class = A['Class']; -- arxiv class identifier

+

local ID_support = {

+

{A['ASINTLD'], 'ASIN', 'err_asintld_missing_asin', A:ORIGIN ('ASINTLD')},

+

{DoiBroken, 'DOI', 'err_doibroken_missing_doi', A:ORIGIN ('DoiBroken')},

+

{Embargo, 'PMC', 'err_embargo_missing_pmc', A:ORIGIN ('Embargo')},

+

}

+

ID_list, ID_list_coins = identifiers.identifier_lists_get (args, {DoiBroken = DoiBroken, ASINTLD = A['ASINTLD'], Embargo = Embargo, Class = Class}, ID_support);

+

-- Account for the oddities that are {{cite arxiv}}, {{cite biorxiv}}, {{cite citeseerx}}, {{cite medrxiv}}, {{cite ssrn}}, before generation of COinS data.

+

+

if not (args[cfg.id_handlers[config.CitationClass:upper()].parameters[1]] or -- can't use ID_list_coins k/v table here because invalid parameters omitted

+

args[cfg.id_handlers[config.CitationClass:upper()].parameters[2]]) then -- which causes unexpected parameter missing error message

+

utilities.set_message ('err_' .. config.CitationClass .. '_missing'); -- add error message

+

end

+

Periodical = ({['arxiv'] = 'arXiv', ['biorxiv'] = 'bioRxiv', ['citeseerx'] = 'CiteSeerX', ['medrxiv'] = 'medRxiv', ['ssrn'] = 'Social Science Research Network'})[config.CitationClass];

+

end

+

-- Link the title of the work if no |url= was provided, but we have a |pmc= or a |doi= with |doi-access=free

+

if config.CitationClass == "journal" and not utilities.is_set (URL) and not utilities.is_set (TitleLink) and not utilities.in_array (cfg.keywords_xlate[Title], {'off', 'none'}) then -- TODO: remove 'none' once existing citations have been switched to 'off', so 'none' can be used as token for "no title" instead

+

if 'none' ~= cfg.keywords_xlate[auto_select] then -- if auto-linking not disabled

+

if identifiers.auto_link_urls[auto_select] then -- manual selection

+

URL = identifiers.auto_link_urls[auto_select]; -- set URL to be the same as identifier's external link

+

URL_origin = cfg.id_handlers[auto_select:upper()].parameters[1]; -- set URL_origin to parameter name for use in error message if citation is missing a |title=

+

elseif identifiers.auto_link_urls['pmc'] then -- auto-select PMC

+

URL = identifiers.auto_link_urls['pmc']; -- set URL to be the same as the PMC external link if not embargoed

+

URL_origin = cfg.id_handlers['PMC'].parameters[1]; -- set URL_origin to parameter name for use in error message if citation is missing a |title=

+

elseif identifiers.auto_link_urls['doi'] then -- auto-select DOI

+

URL = identifiers.auto_link_urls['doi'];

+

URL_origin = cfg.id_handlers['DOI'].parameters[1];

+

end

+

end

+

if utilities.is_set (URL) then -- set when using an identifier-created URL

+

if utilities.is_set (AccessDate) then -- |access-date= requires |url=; identifier-created URL is not |url=

+

utilities.set_message ('err_accessdate_missing_url'); -- add an error message

+

AccessDate = ''; -- unset

+

end

+

if utilities.is_set (ArchiveURL) then -- |archive-url= requires |url=; identifier-created URL is not |url=

+

utilities.set_message ('err_archive_missing_url'); -- add an error message

+

ArchiveURL = ''; -- unset

+

end

+

end

+

end

+

-- At this point fields may be nil if they weren't specified in the template use. We can use that fact.

+

-- Test if citation has no title

+

if not utilities.is_set (Title) and not utilities.is_set (TransTitle) and not utilities.is_set (ScriptTitle) then -- has special case for cite episode

+

utilities.set_message ('err_citation_missing_title', {'episode' == config.CitationClass and 'series' or 'title'});

+

end

+

if utilities.in_array (cfg.keywords_xlate[Title], {'off', 'none'}) and

+

utilities.in_array (config.CitationClass, {'journal', 'citation'}) and

+

(utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical)) and

+

('journal' == Periodical_origin or 'script-journal' == ScriptPeriodical_origin) then -- special case for journal cites

+

Title = ''; -- set title to empty string

+

utilities.set_message ('maint_untitled'); -- add maint cat

+

end

+

-- COinS metadata (see <http://ocoins.info/>) for automated parsing of citation information.

+

-- handle the oddity that is cite encyclopedia and {{citation |encyclopedia=something}}. Here we presume that

+

-- when Periodical, Title, and Chapter are all set, then Periodical is the book (encyclopedia) title, Title

+

-- is the article title, and Chapter is a section within the article. So, we remap

+

local coins_chapter = Chapter; -- default assuming that remapping not required

+

local coins_title = Title; -- et tu

+

if 'encyclopaedia' == config.CitationClass or ('citation' == config.CitationClass and utilities.is_set (Encyclopedia)) then

+

if utilities.is_set (Chapter) and utilities.is_set (Title) and utilities.is_set (Periodical) then -- if all are used then

+

coins_chapter = Title; -- remap

+

coins_title = Periodical;

+

end

+

end

+

local coins_author = a; -- default for coins rft.au

+

if 0 < #c then -- but if contributor list

+

coins_author = c; -- use that instead

+

end

+

-- this is the function call to COinS()

+

local OCinSoutput = metadata.COinS({

+

['Periodical'] = utilities.strip_apostrophe_markup (Periodical), -- no markup in the metadata

+

['Encyclopedia'] = Encyclopedia, -- just a flag; content ignored by ~/COinS

+

['Chapter'] = metadata.make_coins_title (coins_chapter, ScriptChapter), -- Chapter and ScriptChapter stripped of bold / italic / accept-as-written markup

+

['Degree'] = Degree; -- cite thesis only

+

['Title'] = metadata.make_coins_title (coins_title, ScriptTitle), -- Title and ScriptTitle stripped of bold / italic / accept-as-written markup

+

['PublicationPlace'] = PublicationPlace,

+

['Date'] = COinS_date.rftdate, -- COinS_date.* has correctly formatted date values if Date is valid;

+

['Season'] = COinS_date.rftssn,

+

['Quarter'] = COinS_date.rftquarter,

+

['Chron'] = COinS_date.rftchron,

+

['Series'] = Series,

+

['Volume'] = Volume,

+

['Issue'] = Issue,

+

['ArticleNumber'] = ArticleNumber,

+

['Pages'] = coins_pages or metadata.get_coins_pages (first_set ({Sheet, Sheets, Page, Pages, At, QuotePage, QuotePages}, 7)), -- pages stripped of external links

+

['Edition'] = Edition,

+

['PublisherName'] = PublisherName or Newsgroup, -- any apostrophe markup already removed from PublisherName

+

['URL'] = first_set ({ChapterURL, URL}, 2),

+

['Authors'] = coins_author,

+

['ID_list'] = ID_list_coins,

+

['RawPage'] = this_page.prefixedText,

+

}, config.CitationClass);

+

-- Account for the oddities that are {{cite arxiv}}, {{cite biorxiv}}, {{cite citeseerx}}, {{cite medrxiv}}, and {{cite ssrn}} AFTER generation of COinS data.

+

if utilities.in_array (config.CitationClass, whitelist.preprint_template_list_t) then -- we have set rft.jtitle in COinS to arXiv, bioRxiv, CiteSeerX, medRxiv, or ssrn now unset so it isn't displayed

+

Periodical = ''; -- periodical not allowed in these templates; if article has been published, use cite journal

+

end

+

-- special case for cite newsgroup. Do this after COinS because we are modifying Publishername to include some static text

+

if 'newsgroup' == config.CitationClass and utilities.is_set (Newsgroup) then

+

PublisherName = utilities.substitute (cfg.messages['newsgroup'], external_link( 'news:' .. Newsgroup, Newsgroup, Newsgroup_origin, nil ));

+

end

+

local Editors;

+

local EditorCount; -- used only for choosing {ed.) or (eds.) annotation at end of editor name-list

+

local Contributors; -- assembled contributors name list

+

local contributor_etal;

+

local Translators; -- assembled translators name list

+

local translator_etal;

+

local t = {}; -- translators list from |translator-lastn= / translator-firstn= pairs

+

t = extract_names (args, 'TranslatorList'); -- fetch translator list from |translatorn= / |translator-lastn=, -firstn=, -linkn=, -maskn=

+

local Interviewers;

+

local interviewers_list = {};

+

interviewers_list = extract_names (args, 'InterviewerList'); -- process preferred interviewers parameters

+

local interviewer_etal;

+

-- Now perform various field substitutions.

+

-- We also add leading spaces and surrounding markup and punctuation to the

+

-- various parts of the citation, but only when they are non-nil.

+

do

+

local last_first_list;

+

local control = {

+

format = NameListStyle, -- empty string, '&', 'amp', 'and', or 'vanc'

+

maximum = nil, -- as if display-authors or display-editors not set

+

mode = Mode

+

};

+

do -- do editor name list first because the now unsupported coauthors used to modify control table

+

local display_names, param = display_names_select (cfg.global_cs1_config_t['DisplayEditors'], A['DisplayEditors'], A:ORIGIN ('DisplayEditors'), #e);

+

control.maximum, editor_etal = get_display_names (display_names, #e, 'editors', editor_etal, param);

+

Editors, EditorCount = list_people (control, e, editor_etal);

+

if 1 == EditorCount and (true == editor_etal or 1 < #e) then -- only one editor displayed but includes etal then

+

EditorCount = 2; -- spoof to display (eds.) annotation

+

end

+

end

+

do -- now do interviewers

+

local display_names, param = display_names_select (cfg.global_cs1_config_t['DisplayInterviewers'], A['DisplayInterviewers'], A:ORIGIN ('DisplayInterviewers'), #interviewers_list);

+

control.maximum, interviewer_etal = get_display_names (display_names, #interviewers_list, 'interviewers', interviewer_etal, param);

+

Interviewers = list_people (control, interviewers_list, interviewer_etal);

+

end

+

do -- now do translators

+

local display_names, param = display_names_select (cfg.global_cs1_config_t['DisplayTranslators'], A['DisplayTranslators'], A:ORIGIN ('DisplayTranslators'), #t);

+

control.maximum, translator_etal = get_display_names (display_names, #t, 'translators', translator_etal, param);

+

Translators = list_people (control, t, translator_etal);

+

end

+

do -- now do contributors

+

local display_names, param = display_names_select (cfg.global_cs1_config_t['DisplayContributors'], A['DisplayContributors'], A:ORIGIN ('DisplayContributors'), #c);

+

control.maximum, contributor_etal = get_display_names (display_names, #c, 'contributors', contributor_etal, param);

+

Contributors = list_people (control, c, contributor_etal);

+

end

+

do -- now do authors

+

local display_names, param = display_names_select (cfg.global_cs1_config_t['DisplayAuthors'], A['DisplayAuthors'], A:ORIGIN ('DisplayAuthors'), #a, author_etal);

+

control.maximum, author_etal = get_display_names (display_names, #a, 'authors', author_etal, param);

+

last_first_list = list_people (control, a, author_etal);

+

if utilities.is_set (Authors) then

+

Authors, author_etal = name_has_etal (Authors, author_etal, false, 'authors'); -- find and remove variations on et al.

+

if author_etal then

+

Authors = Authors .. ' ' .. cfg.messages['et al']; -- add et al. to authors parameter

+

end

+

else

+

Authors = last_first_list; -- either an author name list or an empty string

+

end

+

end -- end of do

+

if utilities.is_set (Authors) and utilities.is_set (Collaboration) then

+

Authors = Authors .. ' (' .. Collaboration .. ')'; -- add collaboration after et al.

+

end

+

end

+

local ConferenceFormat = A['ConferenceFormat'];

+

local ConferenceURL = A['ConferenceURL'];

+

ConferenceFormat = style_format (ConferenceFormat, ConferenceURL, 'conference-format', 'conference-url');

+

Format = style_format (Format, URL, 'format', 'url');

+

-- special case for chapter format so no error message or cat when chapter not supported

+

if not (utilities.in_array (config.CitationClass, {'web', 'news', 'journal', 'magazine', 'pressrelease', 'podcast', 'newsgroup', 'arxiv', 'biorxiv', 'citeseerx', 'medrxiv', 'ssrn'}) or

+

('citation' == config.CitationClass and (utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical)) and not utilities.is_set (Encyclopedia))) then

+

ChapterFormat = style_format (ChapterFormat, ChapterURL, 'chapter-format', 'chapter-url');

+

end

+

if not utilities.is_set (URL) then

+

if utilities.in_array (config.CitationClass, {"web", "podcast", "mailinglist"}) or -- |url= required for cite web, cite podcast, and cite mailinglist

+

('citation' == config.CitationClass and ('website' == Periodical_origin or 'script-website' == ScriptPeriodical_origin)) then -- and required for {{citation}} with |website= or |script-website=

+

utilities.set_message ('err_cite_web_url');

+

end

+

-- do we have |accessdate= without either |url= or |chapter-url=?

+

if utilities.is_set (AccessDate) and not utilities.is_set (ChapterURL) then -- ChapterURL may be set when URL is not set;

+

utilities.set_message ('err_accessdate_missing_url');

+

AccessDate = '';

+

end

+

end

+

local UrlStatus = is_valid_parameter_value (A['UrlStatus'], A:ORIGIN('UrlStatus'), cfg.keywords_lists['url-status'], '');

+

local OriginalURL

+

local OriginalURL_origin

+

local OriginalFormat

+

local OriginalAccess;

+

UrlStatus = UrlStatus:lower(); -- used later when assembling archived text

+

if utilities.is_set ( ArchiveURL ) then

+

if utilities.is_set (ChapterURL) then -- if chapter-url= is set apply archive url to it

+

OriginalURL = ChapterURL; -- save copy of source chapter's url for archive text

+

OriginalURL_origin = ChapterURL_origin; -- name of |chapter-url= parameter for error messages

+

OriginalFormat = ChapterFormat; -- and original |chapter-format=

+

if 'live' ~= UrlStatus then

+

ChapterURL = ArchiveURL -- swap-in the archive's URL

+

ChapterURL_origin = A:ORIGIN('ArchiveURL') -- name of |archive-url= parameter for error messages

+

ChapterFormat = ArchiveFormat or ''; -- swap in archive's format

+

ChapterUrlAccess = nil; -- restricted access levels do not make sense for archived URLs

+

end

+

elseif utilities.is_set (URL) then

+

OriginalURL = URL; -- save copy of original source URL

+

OriginalURL_origin = URL_origin; -- name of URL parameter for error messages

+

OriginalFormat = Format; -- and original |format=

+

OriginalAccess = UrlAccess;

+

if 'live' ~= UrlStatus then -- if URL set then |archive-url= applies to it

+

URL = ArchiveURL -- swap-in the archive's URL

+

URL_origin = A:ORIGIN('ArchiveURL') -- name of archive URL parameter for error messages

+

Format = ArchiveFormat or ''; -- swap in archive's format

+

UrlAccess = nil; -- restricted access levels do not make sense for archived URLs

+

end

+

end

+

elseif utilities.is_set (UrlStatus) then -- if |url-status= is set when |archive-url= is not set

+

utilities.set_message ('maint_url_status'); -- add maint cat

+

end

+

if utilities.in_array (config.CitationClass, {'web', 'news', 'journal', 'magazine', 'pressrelease', 'podcast', 'newsgroup', 'arxiv', 'biorxiv', 'citeseerx', 'medrxiv', 'ssrn'}) or -- if any of the 'periodical' cites except encyclopedia

+

('citation' == config.CitationClass and (utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical)) and not utilities.is_set (Encyclopedia)) then

+

local chap_param;

+

if utilities.is_set (Chapter) then -- get a parameter name from one of these chapter related meta-parameters

+

chap_param = A:ORIGIN ('Chapter')

+

elseif utilities.is_set (TransChapter) then

+

chap_param = A:ORIGIN ('TransChapter')

+

elseif utilities.is_set (ChapterURL) then

+

chap_param = A:ORIGIN ('ChapterURL')

+

elseif utilities.is_set (ScriptChapter) then

+

chap_param = ScriptChapter_origin;

+

else utilities.is_set (ChapterFormat)

+

chap_param = A:ORIGIN ('ChapterFormat')

+

end

+

if utilities.is_set (chap_param) then -- if we found one

+

utilities.set_message ('err_chapter_ignored', {chap_param}); -- add error message

+

Chapter = ''; -- and set them to empty string to be safe with concatenation

+

TransChapter = '';

+

ChapterURL = '';

+

ScriptChapter = '';

+

ChapterFormat = '';

+

end

+

else -- otherwise, format chapter / article title

+

local no_quotes = false; -- default assume that we will be quoting the chapter parameter value

+

if utilities.is_set (Contribution) and 0 < #c then -- if this is a contribution with contributor(s)

+

if utilities.in_array (Contribution:lower(), cfg.keywords_lists.contribution) then -- and a generic contribution title

+

no_quotes = true; -- then render it unquoted

+

end

+

end

+

Chapter = format_chapter_title (ScriptChapter, ScriptChapter_origin, Chapter, Chapter_origin, TransChapter, TransChapter_origin, ChapterURL, ChapterURL_origin, no_quotes, ChapterUrlAccess); -- Contribution is also in Chapter

+

if utilities.is_set (Chapter) then

+

Chapter = Chapter .. ChapterFormat ;

+

if 'map' == config.CitationClass and utilities.is_set (TitleType) then

+

Chapter = Chapter .. ' ' .. TitleType; -- map annotation here; not after title

+

end

+

Chapter = Chapter .. sepc .. ' ';

+

elseif utilities.is_set (ChapterFormat) then -- |chapter= not set but |chapter-format= is so ...

+

Chapter = ChapterFormat .. sepc .. ' '; -- ... ChapterFormat has error message, we want to see it

+

end

+

end

+

-- Format main title

+

local plain_title = false;

+

local accept_title;

+

Title, accept_title = utilities.has_accept_as_written (Title, true); -- remove accept-this-as-written markup when it wraps all of <Title>

+

if accept_title and ('' == Title) then -- only support forced empty for now "(())"

+

Title = cfg.messages['notitle']; -- replace by predefined "No title" message

+

-- TODO: utilities.set_message ( 'err_redundant_parameters', ...); -- issue proper error message instead of muting

+

ScriptTitle = ''; -- just mute for now

+

TransTitle = ''; -- just mute for now

+

plain_title = true; -- suppress text decoration for descriptive title

+

utilities.set_message ('maint_untitled'); -- add maint cat

+

end

+

if not accept_title then -- <Title> not wrapped in accept-as-written markup

+

if '...' == Title:sub (-3) then -- if ellipsis is the last three characters of |title=

+

Title = Title:gsub ('(%.%.%.)%.+$', '%1'); -- limit the number of dots to three

+

elseif not mw.ustring.find (Title, '%.%s*%a%.$') and -- end of title is not a 'dot-(optional space-)letter-dot' initialism ...

+

not mw.ustring.find (Title, '%s+%a%.$') then -- ...and not a 'space-letter-dot' initial (''Allium canadense'' L.)

+

Title = mw.ustring.gsub(Title, '%' .. sepc .. '$', ''); -- remove any trailing separator character; sepc and ms.ustring() here for languages that use multibyte separator characters

+

end

+

if utilities.is_set (ArchiveURL) and is_archived_copy (Title) then

+

utilities.set_message ('maint_archived_copy'); -- add maintenance category before we modify the content of Title

+

end

+

if is_generic ('generic_titles', Title) then

+

utilities.set_message ('err_generic_title'); -- set an error message

+

end

+

end

+

if (not plain_title) and (utilities.in_array (config.CitationClass, {'web', 'news', 'journal', 'magazine', 'document', 'pressrelease', 'podcast', 'newsgroup', 'mailinglist', 'interview', 'arxiv', 'biorxiv', 'citeseerx', 'medrxiv', 'ssrn'}) or

+

('citation' == config.CitationClass and (utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical)) and not utilities.is_set (Encyclopedia)) or

+

('map' == config.CitationClass and (utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical)))) then -- special case for cite map when the map is in a periodical treat as an article

+

Title = kern_quotes (Title); -- if necessary, separate title's leading and trailing quote marks from module provided quote marks

+

Title = utilities.wrap_style ('quoted-title', Title);

+

Title = script_concatenate (Title, ScriptTitle, 'script-title'); -- <bdi> tags, lang attribute, categorization, etc.; must be done after title is wrapped

+

TransTitle = utilities.wrap_style ('trans-quoted-title', TransTitle );

+

elseif plain_title or ('report' == config.CitationClass) then -- no styling for cite report and descriptive titles (otherwise same as above)

+

Title = script_concatenate (Title, ScriptTitle, 'script-title'); -- <bdi> tags, lang attribute, categorization, etc.; must be done after title is wrapped

+

TransTitle = utilities.wrap_style ('trans-quoted-title', TransTitle ); -- for cite report, use this form for trans-title

+

else

+

Title = utilities.wrap_style ('italic-title', Title);

+

Title = script_concatenate (Title, ScriptTitle, 'script-title'); -- <bdi> tags, lang attribute, categorization, etc.; must be done after title is wrapped

+

TransTitle = utilities.wrap_style ('trans-italic-title', TransTitle);

+

end

+

if utilities.is_set (TransTitle) then

+

if utilities.is_set (Title) then

+

TransTitle = " " .. TransTitle;

+

else

+

utilities.set_message ('err_trans_missing_title', {'title'});

+

end

+

end

+

if utilities.is_set (Title) then -- TODO: is this the right place to be making Wikisource URLs?

+

if utilities.is_set (TitleLink) and utilities.is_set (URL) then

+

utilities.set_message ('err_wikilink_in_url'); -- set an error message because we can't have both

+

TitleLink = ''; -- unset

+

end

+

if not utilities.is_set (TitleLink) and utilities.is_set (URL) then

+

Title = external_link (URL, Title, URL_origin, UrlAccess) .. TransTitle .. Format;

+

URL = ''; -- unset these because no longer needed

+

Format = "";

+

elseif utilities.is_set (TitleLink) and not utilities.is_set (URL) then

+

local ws_url;

+

ws_url = wikisource_url_make (TitleLink); -- ignore ws_label return; not used here

+

if ws_url then

+

Title = external_link (ws_url, Title .. ' ', 'ws link in title-link'); -- space char after Title to move icon away from italic text; TODO: a better way to do this?

+

Title = utilities.substitute (cfg.presentation['interwiki-icon'], {cfg.presentation['class-wikisource'], TitleLink, Title});

+

Title = Title .. TransTitle;

+

else

+

Title = utilities.make_wikilink (TitleLink, Title) .. TransTitle;

+

end

+

else

+

local ws_url, ws_label, L; -- Title has italic or quote markup by the time we get here which causes is_wikilink() to return 0 (not a wikilink)

+

ws_url, ws_label, L = wikisource_url_make (Title:gsub('^[\'"]*(.-)[\'"]*$', '%1')); -- make ws URL from |title= interwiki link (strip italic or quote markup); link portion L becomes tooltip label

+

if ws_url then

+

Title = Title:gsub ('%b[]', ws_label); -- replace interwiki link with ws_label to retain markup

+

Title = external_link (ws_url, Title .. ' ', 'ws link in title'); -- space char after Title to move icon away from italic text; TODO: a better way to do this?

+

Title = utilities.substitute (cfg.presentation['interwiki-icon'], {cfg.presentation['class-wikisource'], L, Title});

+

Title = Title .. TransTitle;

+

else

+

Title = Title .. TransTitle;

+

end

+

end

+

else

+

Title = TransTitle;

+

end

+

if utilities.is_set (Place) then

+

Place = " " .. wrap_msg ('written', Place, use_lowercase) .. sepc .. " ";

+

end

+

local ConferenceURL_origin = A:ORIGIN('ConferenceURL'); -- get name of parameter that holds ConferenceURL

+

if utilities.is_set (Conference) then

+

if utilities.is_set (ConferenceURL) then

+

Conference = external_link( ConferenceURL, Conference, ConferenceURL_origin, nil );

+

end

+

Conference = sepc .. " " .. Conference .. ConferenceFormat;

+

elseif utilities.is_set (ConferenceURL) then

+

Conference = sepc .. " " .. external_link( ConferenceURL, nil, ConferenceURL_origin, nil );

+

end

+

local Position = '';

+

if not utilities.is_set (Position) then

+

local Minutes = A['Minutes'];

+

local Time = A['Time'];

+

if utilities.is_set (Minutes) then

+

if utilities.is_set (Time) then --TODO: make a function for this and similar?

+

utilities.set_message ('err_redundant_parameters', {utilities.wrap_style ('parameter', 'minutes') .. cfg.presentation['sep_list_pair'] .. utilities.wrap_style ('parameter', 'time')});

+

end

+

Position = " " .. Minutes .. " " .. cfg.messages['minutes'];

+

else

+

if utilities.is_set (Time) then

+

local TimeCaption = A['TimeCaption']

+

if not utilities.is_set (TimeCaption) then

+

TimeCaption = cfg.messages['event'];

+

if sepc ~= '.' then

+

TimeCaption = TimeCaption:lower();

+

end

+

end

+

Position = " " .. TimeCaption .. " " .. Time;

+

end

+

end

+

else

+

Position = " " .. Position;

+

At = '';

+

end

+

Page, Pages, Sheet, Sheets = format_pages_sheets (Page, Pages, Sheet, Sheets, config.CitationClass, Periodical_origin, sepc, NoPP, use_lowercase);

+

At = utilities.is_set (At) and (sepc .. " " .. At) or "";

+

Position = utilities.is_set (Position) and (sepc .. " " .. Position) or "";

+

if config.CitationClass == 'map' then

+

local Sections = A['Sections']; -- Section (singular) is an alias of Chapter so set earlier

+

local Inset = A['Inset'];

+

if utilities.is_set ( Inset ) then

+

Inset = sepc .. " " .. wrap_msg ('inset', Inset, use_lowercase);

+

end

+

if utilities.is_set ( Sections ) then

+

Section = sepc .. " " .. wrap_msg ('sections', Sections, use_lowercase);

+

elseif utilities.is_set ( Section ) then

+

Section = sepc .. " " .. wrap_msg ('section', Section, use_lowercase);

+

end

+

At = At .. Inset .. Section;

+

end

+

local Others = A['Others'];

+

if utilities.is_set (Others) and 0 == #a and 0 == #e then -- add maint cat when |others= has value and used without |author=, |editor=

+

if config.CitationClass == "AV-media-notes"

+

or config.CitationClass == "audio-visual" then -- special maint for AV/M which has a lot of 'false' positives right now

+

utilities.set_message ('maint_others_avm')

+

else

+

utilities.set_message ('maint_others');

+

end

+

end

+

Others = utilities.is_set (Others) and (sepc .. " " .. Others) or "";

+

if utilities.is_set (Translators) then

+

Others = safe_join ({sepc .. ' ', wrap_msg ('translated', Translators, use_lowercase), Others}, sepc);

+

end

+

if utilities.is_set (Interviewers) then

+

Others = safe_join ({sepc .. ' ', wrap_msg ('interview', Interviewers, use_lowercase), Others}, sepc);

+

end

+

local TitleNote = A['TitleNote'];

+

TitleNote = utilities.is_set (TitleNote) and (sepc .. " " .. TitleNote) or "";

+

if utilities.is_set (Edition) then

+

if Edition:match ('%f[%a][Ee]d%n?%.?$') or Edition:match ('%f[%a][Ee]dition$') then -- Ed, ed, Ed., ed., Edn, edn, Edn., edn.

+

utilities.set_message ('err_extra_text_edition'); -- add error message

+

end

+

Edition = " " .. wrap_msg ('edition', Edition);

+

else

+

Edition = '';

+

end

+

Series = utilities.is_set (Series) and wrap_msg ('series', {sepc, Series}) or ""; -- not the same as SeriesNum

+

local Agency = A['Agency'];

+

Agency = utilities.is_set (Agency) and wrap_msg ('agency', {sepc, Agency}) or "";

+

Volume = format_volume_issue (Volume, Issue, ArticleNumber, config.CitationClass, Periodical_origin, sepc, use_lowercase);

+

if utilities.is_set (AccessDate) then

+

local retrv_text = " " .. cfg.messages['retrieved']

+

AccessDate = nowrap_date (AccessDate); -- wrap in nowrap span if date in appropriate format

+

if (sepc ~= ".") then retrv_text = retrv_text:lower() end -- if mode is cs2, lower case

+

AccessDate = utilities.substitute (retrv_text, AccessDate); -- add retrieved text

+

AccessDate = utilities.substitute (cfg.presentation['accessdate'], {sepc, AccessDate}); -- allow editors to hide accessdates

+

end

+

if utilities.is_set (ID) then ID = sepc .. " " .. ID; end

+

local Docket = A['Docket'];

+

if "thesis" == config.CitationClass and utilities.is_set (Docket) then

+

ID = sepc .. " Docket " .. Docket .. ID;

+

end

+

if "report" == config.CitationClass and utilities.is_set (Docket) then -- for cite report when |docket= is set

+

ID = sepc .. ' ' .. Docket; -- overwrite ID even if |id= is set

+

end

+

if utilities.is_set (URL) then

+

URL = " " .. external_link( URL, nil, URL_origin, UrlAccess );

+

end

+

local Quote = A['Quote'];

+

local TransQuote = A['TransQuote'];

+

local ScriptQuote = A['ScriptQuote'];

+

if utilities.is_set (Quote) or utilities.is_set (TransQuote) or utilities.is_set (ScriptQuote) then

+

if utilities.is_set (Quote) then

+

if Quote:sub(1, 1) == '"' and Quote:sub(-1, -1) == '"' then -- if first and last characters of quote are quote marks

+

Quote = Quote:sub(2, -2); -- strip them off

+

end

+

end

+

Quote = kern_quotes (Quote); -- kern if needed

+

Quote = utilities.wrap_style ('quoted-text', Quote ); -- wrap in <q>...</q> tags

+

if utilities.is_set (ScriptQuote) then

+

Quote = script_concatenate (Quote, ScriptQuote, 'script-quote'); -- <bdi> tags, lang attribute, categorization, etc.; must be done after quote is wrapped

+

end

+

if utilities.is_set (TransQuote) then

+

if TransQuote:sub(1, 1) == '"' and TransQuote:sub(-1, -1) == '"' then -- if first and last characters of |trans-quote are quote marks

+

TransQuote = TransQuote:sub(2, -2); -- strip them off

+

end

+

Quote = Quote .. " " .. utilities.wrap_style ('trans-quoted-title', TransQuote );

+

end

+

if utilities.is_set (QuotePage) or utilities.is_set (QuotePages) then -- add page prefix

+

local quote_prefix = '';

+

if utilities.is_set (QuotePage) then

+

extra_text_in_page_check (QuotePage, 'quote-page'); -- add to maint cat if |quote-page= value begins with what looks like p., pp., etc.

+

if not NoPP then

+

quote_prefix = utilities.substitute (cfg.messages['p-prefix'], {sepc, QuotePage}), '', '', '';

+

else

+

quote_prefix = utilities.substitute (cfg.messages['nopp'], {sepc, QuotePage}), '', '', '';

+

end

+

elseif utilities.is_set (QuotePages) then

+

extra_text_in_page_check (QuotePages, 'quote-pages'); -- add to maint cat if |quote-pages= value begins with what looks like p., pp., etc.

+

if tonumber(QuotePages) ~= nil and not NoPP then -- if only digits, assume single page

+

quote_prefix = utilities.substitute (cfg.messages['p-prefix'], {sepc, QuotePages}), '', '';

+

elseif not NoPP then

+

quote_prefix = utilities.substitute (cfg.messages['pp-prefix'], {sepc, QuotePages}), '', '';

+

else

+

quote_prefix = utilities.substitute (cfg.messages['nopp'], {sepc, QuotePages}), '', '';

+

end

+

end

+

Quote = quote_prefix .. ": " .. Quote;

+

else

+

Quote = sepc .. " " .. Quote;

+

end

+

PostScript = ""; -- cs1|2 does not supply terminal punctuation when |quote= is set

+

end

+

-- We check length of PostScript here because it will have been nuked by

+

-- the quote parameters. We'd otherwise emit a message even if there wasn't

+

-- a displayed postscript.

+

-- TODO: Should the max size (1) be configurable?

+

-- TODO: Should we check a specific pattern?

+

if utilities.is_set(PostScript) and mw.ustring.len(PostScript) > 1 then

+

utilities.set_message ('maint_postscript')

+

end

+

local Archived;

+

if utilities.is_set (ArchiveURL) then

+

if not utilities.is_set (ArchiveDate) then -- ArchiveURL set but ArchiveDate not set

+

utilities.set_message ('err_archive_missing_date'); -- emit an error message

+

ArchiveURL = ''; -- empty string for concatenation

+

ArchiveDate = ''; -- empty string for concatenation

+

end

+

else

+

if utilities.is_set (ArchiveDate) then -- ArchiveURL not set but ArchiveDate is set

+

utilities.set_message ('err_archive_date_missing_url'); -- emit an error message

+

ArchiveURL = ''; -- empty string for concatenation

+

ArchiveDate = ''; -- empty string for concatenation

+

end

+

end

+

if utilities.is_set (ArchiveURL) then

+

local arch_text;

+

if "live" == UrlStatus then

+

arch_text = cfg.messages['archived'];

+

if sepc ~= "." then arch_text = arch_text:lower() end

+

if utilities.is_set (ArchiveDate) then

+

Archived = sepc .. ' ' .. utilities.substitute ( cfg.messages['archived-live'],

+

{external_link( ArchiveURL, arch_text, A:ORIGIN('ArchiveURL'), nil) .. ArchiveFormat, ArchiveDate } );

+

else

+

Archived = '';

+

end

+

if not utilities.is_set (OriginalURL) then

+

utilities.set_message ('err_archive_missing_url');

+

Archived = ''; -- empty string for concatenation

+

end

+

elseif utilities.is_set (OriginalURL) then -- UrlStatus is empty, 'dead', 'unfit', 'usurped', 'bot: unknown'

+

if utilities.in_array (UrlStatus, {'unfit', 'usurped', 'bot: unknown'}) then

+

arch_text = cfg.messages['archived-unfit'];

+

if sepc ~= "." then arch_text = arch_text:lower() end

+

Archived = sepc .. ' ' .. arch_text .. ArchiveDate; -- format already styled

+

if 'bot: unknown' == UrlStatus then

+

utilities.set_message ('maint_bot_unknown'); -- and add a category if not already added

+

else

+

utilities.set_message ('maint_unfit'); -- and add a category if not already added

+

end

+

else -- UrlStatus is empty, 'dead'

+

arch_text = cfg.messages['archived-dead'];

+

if sepc ~= "." then arch_text = arch_text:lower() end

+

if utilities.is_set (ArchiveDate) then

+

Archived = sepc .. " " .. utilities.substitute ( arch_text,

+

{ external_link( OriginalURL, cfg.messages['original'], OriginalURL_origin, OriginalAccess ) .. OriginalFormat, ArchiveDate } ); -- format already styled

+

else

+

Archived = ''; -- unset for concatenation

+

end

+

end

+

else -- OriginalUrl not set

+

utilities.set_message ('err_archive_missing_url');

+

Archived = ''; -- empty string for concatenation

+

end

+

elseif utilities.is_set (ArchiveFormat) then

+

Archived = ArchiveFormat; -- if set and ArchiveURL not set ArchiveFormat has error message

+

else

+

Archived = '';

+

end

+

local TranscriptURL = A['TranscriptURL']

+

local TranscriptFormat = A['TranscriptFormat'];

+

TranscriptFormat = style_format (TranscriptFormat, TranscriptURL, 'transcript-format', 'transcripturl');

+

local Transcript = A['Transcript'];

+

local TranscriptURL_origin = A:ORIGIN('TranscriptURL'); -- get name of parameter that holds TranscriptURL

+

if utilities.is_set (Transcript) then

+

if utilities.is_set (TranscriptURL) then

+

Transcript = external_link( TranscriptURL, Transcript, TranscriptURL_origin, nil );

+

end

+

Transcript = sepc .. ' ' .. Transcript .. TranscriptFormat;

+

elseif utilities.is_set (TranscriptURL) then

+

Transcript = external_link( TranscriptURL, nil, TranscriptURL_origin, nil );

+

end

+

local Publisher;

+

if utilities.is_set (PublicationDate) then

+

PublicationDate = wrap_msg ('published', PublicationDate);

+

end

+

if utilities.is_set (PublisherName) then

+

if utilities.is_set (PublicationPlace) then

+

Publisher = sepc .. " " .. PublicationPlace .. ": " .. PublisherName .. PublicationDate;

+

else

+

Publisher = sepc .. " " .. PublisherName .. PublicationDate;

+

end

+

elseif utilities.is_set (PublicationPlace) then

+

Publisher= sepc .. " " .. PublicationPlace .. PublicationDate;

+

else

+

Publisher = PublicationDate;

+

end

+

-- Several of the above rely upon detecting this as nil, so do it last.

+

if (utilities.is_set (Periodical) or utilities.is_set (ScriptPeriodical) or utilities.is_set (TransPeriodical)) then

+

if utilities.is_set (Title) or utilities.is_set (TitleNote) then

+

Periodical = sepc .. " " .. format_periodical (ScriptPeriodical, ScriptPeriodical_origin, Periodical, TransPeriodical, TransPeriodical_origin);

+

else

+

Periodical = format_periodical (ScriptPeriodical, ScriptPeriodical_origin, Periodical, TransPeriodical, TransPeriodical_origin);

+

end

+

end

+

local Language = A['Language'];

+

if utilities.is_set (Language) then

+

Language = language_parameter (Language); -- format, categories, name from ISO639-1, etc.

+

else

+

Language=''; -- language not specified so make sure this is an empty string;

+

--[[ TODO: need to extract the wrap_msg from language_parameter

+

so that we can solve parentheses bunching problem with Format/Language/TitleType

+

]]

+

end

+

--[[

+

Handle the oddity that is cite speech. This code overrides whatever may be the value assigned to TitleNote (through |department=) and forces it to be " (Speech)" so that

+

the annotation directly follows the |title= parameter value in the citation rather than the |event= parameter value (if provided).

+

]]

+

if "speech" == config.CitationClass then -- cite speech only

+

TitleNote = TitleType; -- move TitleType to TitleNote so that it renders ahead of |event=

+

TitleType = ''; -- and unset

+

if utilities.is_set (Periodical) then -- if Periodical, perhaps because of an included |website= or |journal= parameter

+

if utilities.is_set (Conference) then -- and if |event= is set

+

Conference = Conference .. sepc .. " "; -- then add appropriate punctuation to the end of the Conference variable before rendering

+

end

+

end

+

end

+

-- Piece all bits together at last. Here, all should be non-nil.

+

-- We build things this way because it is more efficient in LUA

+

-- not to keep reassigning to the same string variable over and over.

+

local tcommon;

+

local tcommon2; -- used for book cite when |contributor= is set

+

if utilities.in_array (config.CitationClass, {"journal", "citation"}) and utilities.is_set (Periodical) then

+

if not (utilities.is_set (Authors) or utilities.is_set (Editors)) then

+

Others = Others:gsub ('^' .. sepc .. ' ', ''); -- when no authors and no editors, strip leading sepc and space

+

end

+

if utilities.is_set (Others) then Others = safe_join ({Others, sepc .. " "}, sepc) end -- add terminal punctuation & space; check for dup sepc; TODO why do we need to do this here?

+

tcommon = safe_join( {Others, Title, TitleNote, Conference, Periodical, Format, TitleType, Series, Language, Edition, Publisher, Agency, Volume}, sepc );

+

elseif utilities.in_array (config.CitationClass, {"book", "citation"}) and not utilities.is_set (Periodical) then -- special cases for book cites

+

if utilities.is_set (Contributors) then -- when we are citing foreword, preface, introduction, etc.

+

tcommon = safe_join( {Title, TitleNote}, sepc ); -- author and other stuff will come after this and before tcommon2

+

tcommon2 = safe_join( {Conference, Periodical, Format, TitleType, Series, Language, Volume, Others, Edition, Publisher, Agency}, sepc );

+

else

+

tcommon = safe_join( {Title, TitleNote, Conference, Periodical, Format, TitleType, Series, Language, Volume, Others, Edition, Publisher, Agency}, sepc );

+

end

+

elseif 'map' == config.CitationClass then -- special cases for cite map

+

if utilities.is_set (Chapter) then -- map in a book; TitleType is part of Chapter

+

tcommon = safe_join( {Title, Format, Edition, Scale, Series, Language, Cartography, Others, Publisher, Volume}, sepc );

+

elseif utilities.is_set (Periodical) then -- map in a periodical

+

tcommon = safe_join( {Title, TitleType, Format, Periodical, Scale, Series, Language, Cartography, Others, Publisher, Volume}, sepc );

+

else -- a sheet or stand-alone map

+

tcommon = safe_join( {Title, TitleType, Format, Edition, Scale, Series, Language, Cartography, Others, Publisher}, sepc );

+

end

+

elseif 'episode' == config.CitationClass then -- special case for cite episode

+

tcommon = safe_join( {Title, TitleNote, TitleType, Series, Language, Edition, Publisher}, sepc );

+

else -- all other CS1 templates

+

tcommon = safe_join( {Title, TitleNote, Conference, Periodical, Format, TitleType, Series, Language,

+

Volume, Others, Edition, Publisher, Agency}, sepc );

+

end

+

if #ID_list > 0 then

+

ID_list = safe_join( { sepc .. " ", table.concat( ID_list, sepc .. " " ), ID }, sepc );

+

else

+

ID_list = ID;

+

end

+

local Via = A['Via'];

+

Via = utilities.is_set (Via) and wrap_msg ('via', Via) or '';

+

local idcommon;

+

if 'audio-visual' == config.CitationClass or 'episode' == config.CitationClass then -- special case for cite AV media & cite episode position transcript

+

idcommon = safe_join( { ID_list, URL, Archived, Transcript, AccessDate, Via, Quote }, sepc );

+

else

+

idcommon = safe_join( { ID_list, URL, Archived, AccessDate, Via, Quote }, sepc );

+

end

+

local text;

+

local pgtext = Position .. Sheet .. Sheets .. Page .. Pages .. At;

+

local OrigDate = A['OrigDate'];

+

OrigDate = utilities.is_set (OrigDate) and wrap_msg ('origdate', OrigDate) or '';

+

if utilities.is_set (Date) then

+

if utilities.is_set (Authors) or utilities.is_set (Editors) then -- date follows authors or editors when authors not set

+

Date = " (" .. Date .. ")" .. OrigDate .. sepc .. " "; -- in parentheses

+

else -- neither of authors and editors set

+

if (string.sub(tcommon, -1, -1) == sepc) then -- if the last character of tcommon is sepc

+

Date = " " .. Date .. OrigDate; -- Date does not begin with sepc

+

else

+

Date = sepc .. " " .. Date .. OrigDate; -- Date begins with sepc

+

end

+

end

+

end

+

if utilities.is_set (Authors) then

+

if (not utilities.is_set (Date)) then -- when date is set it's in parentheses; no Authors termination

+

Authors = terminate_name_list (Authors, sepc); -- when no date, terminate with 0 or 1 sepc and a space

+

end

+

if utilities.is_set (Editors) then

+

local in_text = '';

+

local post_text = '';

+

if utilities.is_set (Chapter) and 0 == #c then

+

in_text = cfg.messages['in'] .. ' ';

+

if (sepc ~= '.') then

+

in_text = in_text:lower(); -- lowercase for cs2

+

end

+

end

+

if EditorCount <= 1 then

+

post_text = ' (' .. cfg.messages['editor'] .. ')'; -- be consistent with no-author, no-date case

+

else

+

post_text = ' (' .. cfg.messages['editors'] .. ')';

+

end

+

Editors = terminate_name_list (in_text .. Editors .. post_text, sepc); -- terminate with 0 or 1 sepc and a space

+

end

+

if utilities.is_set (Contributors) then -- book cite and we're citing the intro, preface, etc.

+

local by_text = sepc .. ' ' .. cfg.messages['by'] .. ' ';

+

if (sepc ~= '.') then by_text = by_text:lower() end -- lowercase for cs2

+

Authors = by_text .. Authors; -- author follows title so tweak it here

+

if utilities.is_set (Editors) and utilities.is_set (Date) then -- when Editors make sure that Authors gets terminated

+

Authors = terminate_name_list (Authors, sepc); -- terminate with 0 or 1 sepc and a space

+

end

+

if (not utilities.is_set (Date)) then -- when date is set it's in parentheses; no Contributors termination

+

Contributors = terminate_name_list (Contributors, sepc); -- terminate with 0 or 1 sepc and a space

+

end

+

text = safe_join( {Contributors, Date, Chapter, tcommon, Authors, Place, Editors, tcommon2, pgtext, idcommon }, sepc );

+

else

+

text = safe_join( {Authors, Date, Chapter, Place, Editors, tcommon, pgtext, idcommon }, sepc );

+

end

+

elseif utilities.is_set (Editors) then

+

if utilities.is_set (Date) then

+

if EditorCount <= 1 then

+

Editors = Editors .. cfg.presentation['sep_name'] .. cfg.messages['editor'];

+

else

+

Editors = Editors .. cfg.presentation['sep_name'] .. cfg.messages['editors'];

+

end

+

else

+

if EditorCount <= 1 then

+

Editors = Editors .. " (" .. cfg.messages['editor'] .. ")" .. sepc .. " "

+

else

+

Editors = Editors .. " (" .. cfg.messages['editors'] .. ")" .. sepc .. " "

+

end

+

end

+

text = safe_join( {Editors, Date, Chapter, Place, tcommon, pgtext, idcommon}, sepc );

+

else

+

if utilities.in_array (config.CitationClass, {"journal", "citation"}) and utilities.is_set (Periodical) then

+

text = safe_join( {Chapter, Place, tcommon, pgtext, Date, idcommon}, sepc );

+

else

+

text = safe_join( {Chapter, Place, tcommon, Date, pgtext, idcommon}, sepc );

+

end

+

end

+

if utilities.is_set (PostScript) and PostScript ~= sepc then

+

text = safe_join( {text, sepc}, sepc ); -- Deals with italics, spaces, etc.

+

text = text:sub(1, -sepc:len() - 1);

+

end

+

text = safe_join( {text, PostScript}, sepc );

+

-- Now enclose the whole thing in a <cite> element

+

local options_t = {};

+

options_t.class = cite_class_attribute_make (config.CitationClass, Mode);

+

local Ref = is_valid_parameter_value (A['Ref'], A:ORIGIN('Ref'), cfg.keywords_lists['ref'], nil, true); -- nil when |ref=harv; A['Ref'] else

+

if 'none' ~= cfg.keywords_xlate[(Ref and Ref:lower()) or ''] then

+

local namelist_t = {}; -- holds selected contributor, author, editor name list

+

local year = first_set ({Year, anchor_year}, 2); -- Year first for legacy citations and for YMD dates that require disambiguation

+

if #c > 0 then -- if there is a contributor list

+

namelist_t = c; -- select it

+

elseif #a > 0 then -- or an author list

+

namelist_t = a;

+

elseif #e > 0 then -- or an editor list

+

namelist_t = e;

+

end

+

local citeref_id;

+

if #namelist_t > 0 then -- if there are names in namelist_t

+

citeref_id = make_citeref_id (namelist_t, year); -- go make the CITEREF anchor

+

if mw.uri.anchorEncode (citeref_id) == ((Ref and mw.uri.anchorEncode (Ref)) or '') then -- Ref may already be encoded (by {{sfnref}}) so citeref_id must be encoded before comparison

+

utilities.set_message ('maint_ref_duplicates_default');

+

end

+

else

+

citeref_id = ''; -- unset

+

end

+

options_t.id = Ref or citeref_id;

+

end

+

if string.len (text:gsub('%b<>', '')) <= 2 then -- remove html and html-like tags; then get length of what remains;

+

z.error_cats_t = {}; -- blank the categories list

+

z.error_msgs_t = {}; -- blank the error messages list

+

OCinSoutput = nil; -- blank the metadata string

+

text = ''; -- blank the the citation

+

utilities.set_message ('err_empty_citation'); -- set empty citation message and category

+

end

+

local render_t = {}; -- here we collect the final bits for concatenation into the rendered citation

+

if utilities.is_set (options_t.id) then -- here we wrap the rendered citation in <cite ...>...</cite> tags

+

table.insert (render_t, utilities.substitute (cfg.presentation['cite-id'], {mw.uri.anchorEncode(options_t.id), mw.text.nowiki(options_t.class), text})); -- when |ref= is set or when there is a namelist

+

else

+

table.insert (render_t, utilities.substitute (cfg.presentation['cite'], {mw.text.nowiki(options_t.class), text})); -- when |ref=none or when namelist_t empty and |ref= is missing or is empty

+

end

+

if OCinSoutput then -- blanked when citation is 'empty' so don't bother to add boilerplate metadata span

+

table.insert (render_t, utilities.substitute (cfg.presentation['ocins'], OCinSoutput)); -- format and append metadata to the citation

+

end

+

local template_name = ('citation' == config.CitationClass) and 'citation' or 'cite ' .. (cfg.citation_class_map_t[config.CitationClass] or config.CitationClass);

+

local template_link = '[[Template:' .. template_name .. '|' .. template_name .. ']]';

+

local msg_prefix = '<code class="cs1-code">{{' .. template_link .. '}}</code>: ';

+

if 0 ~= #z.error_msgs_t then

+

mw.addWarning (utilities.substitute (cfg.messages.warning_msg_e, template_link));

+

table.insert (render_t, ' '); -- insert a space between citation and its error messages

+

table.sort (z.error_msgs_t); -- sort the error messages list; sorting includes wrapping and <code> tags; hidden-error sorts ahead of visible-error

+

local hidden = true; -- presume that the only error messages emited by this template are hidden

+

for _, v in ipairs (z.error_msgs_t) do -- spin through the list of error messages

+

if v:find ('cs1-visible-error', 1, true) then -- look for the visible error class name

+

hidden = false; -- found one; so don't hide the error message prefix

+

break; -- and done because no need to look further

+

end

+

end

+

z.error_msgs_t[1] = table.concat ({utilities.error_comment (msg_prefix, hidden), z.error_msgs_t[1]}); -- add error message prefix to first error message to prevent extraneous punctuation

+

table.insert (render_t, table.concat (z.error_msgs_t, '; ')); -- make a big string of error messages and add it to the rendering

+

end

+

if 0 ~= #z.maint_cats_t then

+

mw.addWarning (utilities.substitute (cfg.messages.warning_msg_m, template_link));

+

table.sort (z.maint_cats_t); -- sort the maintenance messages list

+

local maint_msgs_t = {}; -- here we collect all of the maint messages

+

if 0 == #z.error_msgs_t then -- if no error messages

+

table.insert (maint_msgs_t, msg_prefix); -- insert message prefix in maint message livery

+

end

+

for _, v in ipairs( z.maint_cats_t ) do -- append maintenance categories

+

table.insert (maint_msgs_t, -- assemble new maint message and add it to the maint_msgs_t table

+

table.concat ({v, ' (', utilities.substitute (cfg.messages[':cat wikilink'], v), ')'})

+

);

+

end

+

table.insert (render_t, utilities.substitute (cfg.presentation['hidden-maint'], table.concat (maint_msgs_t, ' '))); -- wrap the group of maint messages with proper presentation and save

+

end

+

if not no_tracking_cats then

+

local sort_key;

+

local cat_wikilink = 'cat wikilink';

+

if cfg.enable_sort_keys then -- when namespace sort keys enabled

+

local namespace_number = mw.title.getCurrentTitle().namespace; -- get namespace number for this wikitext

+

sort_key = (0 ~= namespace_number and (cfg.name_space_sort_keys[namespace_number] or cfg.name_space_sort_keys.other)) or nil; -- get sort key character; nil for mainspace

+

cat_wikilink = (not sort_key and 'cat wikilink') or 'cat wikilink sk'; -- make <cfg.messages> key

+

end

+

for _, v in ipairs (z.error_cats_t) do -- append error categories

+

table.insert (render_t, utilities.substitute (cfg.messages[cat_wikilink], {v, sort_key}));

+

end

+

for _, v in ipairs (z.maint_cats_t) do -- append maintenance categories

+

table.insert (render_t, utilities.substitute (cfg.messages[cat_wikilink], {v, sort_key}));

+

end

+

for _, v in ipairs (z.prop_cats_t) do -- append properties categories

+

table.insert (render_t, utilities.substitute (cfg.messages['cat wikilink'], v)); -- no sort keys

+

end

+

end

+

return table.concat (render_t); -- make a big string and done

end

−

return z

+

--[[--------------------------< V A L I D A T E >--------------------------------------------------------------

+

Looks for a parameter's name in one of several whitelists.

+

Parameters in the whitelist can have three values:

+

true - active, supported parameters

+

false - deprecated, supported parameters

+

nil - unsupported parameters

+

]]

+

local function validate (name, cite_class, empty)

+

local name = tostring (name);

+

local enum_name; -- parameter name with enumerator (if any) replaced with '#'

+

local state;

+

local function state_test (state, name) -- local function to do testing of state values

+

if true == state then return true; end -- valid actively supported parameter

+

if false == state then

+

if empty then return nil; end -- empty deprecated parameters are treated as unknowns

+

deprecated_parameter (name); -- parameter is deprecated but still supported

+

return true;

+

end

+

if 'tracked' == state then

+

local base_name = name:gsub ('%d', ''); -- strip enumerators from parameter names that have them to get the base name

+

utilities.add_prop_cat ('tracked-param', {base_name}, base_name); -- add a properties category; <base_name> modifies <key>

+

return true;

+

end

+

return nil;

+

end

+

if name:find ('#') then -- # is a cs1|2 reserved character so parameters with # not permitted

+

return nil;

+

end

+

-- replace wnumerator digit(s) with # (|last25= becomes |last#=) (mw.ustring because non-Western 'local' digits)

+

enum_name = mw.ustring.gsub (name, '%d+$', '#'); -- where enumerator is last charaters in parameter name (these to protect |s2cid=)

+

enum_name = mw.ustring.gsub (enum_name, '%d+([%-l])', '#%1'); -- where enumerator is in the middle of the parameter name; |author#link= is the oddity

+

if 'document' == cite_class then -- special case for {{cite document}}

+

state = whitelist.document_parameters_t[enum_name]; -- this list holds enumerated and nonenumerated parameters

+

if true == state_test (state, name) then return true; end

+

return false;

+

end

+

if utilities.in_array (cite_class, whitelist.preprint_template_list_t) then -- limited parameter sets allowed for these templates

+

state = whitelist.limited_parameters_t[enum_name]; -- this list holds enumerated and nonenumerated parameters

+

if true == state_test (state, name) then return true; end

+

state = whitelist.preprint_arguments_t[cite_class][name]; -- look in the parameter-list for the template identified by cite_class

+

if true == state_test (state, name) then return true; end

+

return false; -- not supported because not found or name is set to nil

+

end -- end limited parameter-set templates

+

if utilities.in_array (cite_class, whitelist.unique_param_template_list_t) then -- template-specific parameters for templates that accept parameters from the basic argument list

+

state = whitelist.unique_arguments_t[cite_class][name]; -- look in the template-specific parameter-lists for the template identified by cite_class

+

if true == state_test (state, name) then return true; end

+

end -- if here, fall into general validation

+

state = whitelist.common_parameters_t[enum_name]; -- all other templates; all normal parameters allowed; this list holds enumerated and nonenumerated parameters

+

if true == state_test (state, name) then return true; end

+

return false; -- not supported because not found or name is set to nil

+

end

+

--[=[-----------------------------------------------------------------------

+

check <value> for inter-language interwiki-link markup. <prefix> must be a MediaWiki-recognized language

+

code. when these values have the form (without leading colon):

+

[[<prefix>:link|label]] return label as plain-text

+

[[<prefix>:link]] return <prefix>:link as plain-text

+

return value as is else

+

]=]

+

local function inter_wiki_check (parameter, value)

+

local prefix = value:match ('%[%[(%a+):'); -- get an interwiki prefix if one exists

+

local _;

+

if prefix and cfg.inter_wiki_map[prefix:lower()] then -- if prefix is in the map, needs preceding colon so

+

utilities.set_message ('err_bad_paramlink', parameter); -- emit an error message

+

_, value, _ = utilities.is_wikilink (value); -- extract label portion from wikilink

+

end

+

return value;

+

end

+

--[[--------------------------< M I S S I N G _ P I P E _ C H E C K >------------------------------------------

+

Look at the contents of a parameter. If the content has a string of characters and digits followed by an equal

+

sign, compare the alphanumeric string to the list of cs1|2 parameters. If found, then the string is possibly a

+

parameter that is missing its pipe. There are two tests made:

+

{{cite ... |title=Title access-date=2016-03-17}} -- the first parameter has a value and whitespace separates that value from the missing pipe parameter name

+

{{cite ... |title=access-date=2016-03-17}} -- the first parameter has no value (whitespace after the first = is trimmed by MediaWiki)

+

cs1|2 shares some parameter names with XML/HTML attributes: class=, title=, etc. To prevent false positives XML/HTML

+

tags are removed before the search.

+

If a missing pipe is detected, this function adds the missing pipe maintenance category.

+

]]

+

local function missing_pipe_check (parameter, value)

+

local capture;

+

value = value:gsub ('%b<>', ''); -- remove XML/HTML tags because attributes: class=, title=, etc.

+

capture = value:match ('%s+(%a[%w%-]+)%s*=') or value:match ('^(%a[%w%-]+)%s*='); -- find and categorize parameters with possible missing pipes

+

if capture and validate (capture) then -- if the capture is a valid parameter name

+

utilities.set_message ('err_missing_pipe', parameter);

+

end

+

end

+

--[[--------------------------< H A S _ E X T R A N E O U S _ P U N C T >--------------------------------------

+

look for extraneous terminal punctuation in most parameter values; parameters listed in skip table are not checked

+

]]

+

local function has_extraneous_punc (param, value)

+

if 'number' == type (param) then

+

return;

+

end

+

param = param:gsub ('%d+', '#'); -- enumerated name-list mask params allow terminal punct; normalize

+

if cfg.punct_skip[param] then

+

return; -- parameter name found in the skip table so done

+

end

+

if value:match ('[,;:]$') then

+

utilities.set_message ('maint_extra_punct'); -- has extraneous punctuation; add maint cat

+

end

+

if value:match ('^=') then -- sometimes an extraneous '=' character appears ...

+

utilities.set_message ('maint_extra_punct'); -- has extraneous punctuation; add maint cat

+

end

+

end

+

--[[--------------------------< H A S _ E X T R A N E O U S _ U R L >------------------------------------------

+

look for extraneous url parameter values; parameters listed in skip table are not checked

+

]]

+

local function has_extraneous_url (url_param_t)

+

local url_error_t = {};

+

check_for_url (url_param_t, url_error_t); -- extraneous url check

+

if 0 ~= #url_error_t then -- non-zero when there are errors

+

table.sort (url_error_t);

+

utilities.set_message ('err_param_has_ext_link', {utilities.make_sep_list (#url_error_t, url_error_t)}); -- add this error message

+

end

+

end

+

--[[--------------------------< C I T A T I O N >--------------------------------------------------------------

+

This is used by templates such as {{cite book}} to create the actual citation text.

+

]]

+

local function citation(frame)

+

Frame = frame; -- save a copy in case we need to display an error message in preview mode

+

local config = {}; -- table to store parameters from the module {{#invoke:}}

+

for k, v in pairs( frame.args ) do -- get parameters from the {{#invoke}} frame

+

config[k] = v;

+

-- args[k] = v; -- crude debug support that allows us to render a citation from module {{#invoke:}}; skips parameter validation; TODO: keep?

+

end

+

-- i18n: set the name that your wiki uses to identify sandbox subpages from sandbox template invoke (or can be set here)

+

local sandbox = ((config.SandboxPath and '' ~= config.SandboxPath) and config.SandboxPath) or '/sandbox'; -- sandbox path from {{#invoke:Citation/CS1/sandbox|citation|SandboxPath=/...}}

+

is_sandbox = nil ~= string.find (frame:getTitle(), sandbox, 1, true); -- is this invoke the sandbox module?

+

sandbox = is_sandbox and sandbox or ''; -- use i18n sandbox to load sandbox modules when this module is the sandox; live modules else

+

local pframe = frame:getParent()

+

local styles;

+

cfg = mw.loadData ('Module:Citation/CS1/Configuration' .. sandbox); -- load sandbox versions of support modules when {{#invoke:Citation/CS1/sandbox|...}}; live modules else

+

whitelist = mw.loadData ('Module:Citation/CS1/Whitelist' .. sandbox);

+

utilities = require ('Module:Citation/CS1/Utilities' .. sandbox);

+

validation = require ('Module:Citation/CS1/Date_validation' .. sandbox);

+

identifiers = require ('Module:Citation/CS1/Identifiers' .. sandbox);

+

metadata = require ('Module:Citation/CS1/COinS' .. sandbox);

+

styles = 'Module:Citation/CS1' .. sandbox .. '/styles.css';

+

utilities.set_selected_modules (cfg); -- so that functions in Utilities can see the selected cfg tables

+

identifiers.set_selected_modules (cfg, utilities); -- so that functions in Identifiers can see the selected cfg tables and selected Utilities module

+

validation.set_selected_modules (cfg, utilities); -- so that functions in Date validataion can see selected cfg tables and the selected Utilities module

+

metadata.set_selected_modules (cfg, utilities); -- so that functions in COinS can see the selected cfg tables and selected Utilities module

+

z = utilities.z; -- table of error and category tables in Module:Citation/CS1/Utilities

+

is_preview_mode = not utilities.is_set (frame:preprocess ('{{REVISIONID}}'));

+

local args = {}; -- table where we store all of the template's arguments

+

local suggestions = {}; -- table where we store suggestions if we need to loadData them

+

local error_text; -- used as a flag

+

local capture; -- the single supported capture when matching unknown parameters using patterns

+

local empty_unknowns = {}; -- sequence table to hold empty unknown params for error message listing

+

for k, v in pairs( pframe.args ) do -- get parameters from the parent (template) frame

+

v = mw.ustring.gsub (v, '^%s*(.-)%s*$', '%1'); -- trim leading/trailing whitespace; when v is only whitespace, becomes empty string

+

if v ~= '' then

+

if ('string' == type (k)) then

+

k = mw.ustring.gsub (k, '%d', cfg.date_names.local_digits); -- for enumerated parameters, translate 'local' digits to Western 0-9

+

end

+

if not validate( k, config.CitationClass ) then

+

if type (k) ~= 'string' then -- exclude empty numbered parameters

+

if v:match("%S+") ~= nil then

+

error_text = utilities.set_message ('err_text_ignored', {v});

+

end

+

elseif validate (k:lower(), config.CitationClass) then

+

error_text = utilities.set_message ('err_parameter_ignored_suggest', {k, k:lower()}); -- suggest the lowercase version of the parameter

+

else

+

if nil == suggestions.suggestions then -- if this table is nil then we need to load it

+

suggestions = mw.loadData ('Module:Citation/CS1/Suggestions' .. sandbox); --load sandbox version of suggestion module when {{#invoke:Citation/CS1/sandbox|...}}; live module else

+

end

+

for pattern, param in pairs (suggestions.patterns) do -- loop through the patterns to see if we can suggest a proper parameter

+

capture = k:match (pattern); -- the whole match if no capture in pattern else the capture if a match

+

if capture then -- if the pattern matches

+

param = utilities.substitute (param, capture); -- add the capture to the suggested parameter (typically the enumerator)

+

if validate (param, config.CitationClass) then -- validate the suggestion to make sure that the suggestion is supported by this template (necessary for limited parameter lists)

+

error_text = utilities.set_message ('err_parameter_ignored_suggest', {k, param}); -- set the suggestion error message

+

else

+

error_text = utilities.set_message ('err_parameter_ignored', {k}); -- suggested param not supported by this template

+

v = ''; -- unset

+

end

+

end

+

end

+

if not utilities.is_set (error_text) then -- couldn't match with a pattern, is there an explicit suggestion?

+

if (suggestions.suggestions[ k:lower() ] ~= nil) and validate (suggestions.suggestions[ k:lower() ], config.CitationClass) then

+

utilities.set_message ('err_parameter_ignored_suggest', {k, suggestions.suggestions[ k:lower() ]});

+

else

+

utilities.set_message ('err_parameter_ignored', {k});

+

v = ''; -- unset value assigned to unrecognized parameters (this for the limited parameter lists)

+

end

+

end

+

end

+

end

+

args[k] = v; -- save this parameter and its value

+

elseif not utilities.is_set (v) then -- for empty parameters

+

if not validate (k, config.CitationClass, true) then -- is this empty parameter a valid parameter

+

k = ('' == k) and '(empty string)' or k; -- when k is empty string (or was space(s) trimmed to empty string), replace with descriptive text

+

table.insert (empty_unknowns, utilities.wrap_style ('parameter', k)); -- format for error message and add to the list

+

end

+

-- crude debug support that allows us to render a citation from module {{#invoke:}} TODO: keep?

+

-- elseif args[k] ~= nil or (k == 'postscript') then -- when args[k] has a value from {{#invoke}} frame (we don't normally do that)

+

-- args[k] = v; -- overwrite args[k] with empty string from pframe.args[k] (template frame); v is empty string here

+

end -- not sure about the postscript bit; that gets handled in parameter validation; historical artifact?

+

end

+

if 0 ~= #empty_unknowns then -- create empty unknown error message

+

utilities.set_message ('err_param_unknown_empty', {

+

1 == #empty_unknowns and '' or 's',

+

utilities.make_sep_list (#empty_unknowns, empty_unknowns)

+

});

+

end

+

local url_param_t = {};

+

for k, v in pairs( args ) do

+

if 'string' == type (k) then -- don't evaluate positional parameters

+

has_invisible_chars (k, v); -- look for invisible characters

+

end

+

has_extraneous_punc (k, v); -- look for extraneous terminal punctuation in parameter values

+

missing_pipe_check (k, v); -- do we think that there is a parameter that is missing a pipe?

+

args[k] = inter_wiki_check (k, v); -- when language interwiki-linked parameter missing leading colon replace with wiki-link label

+

if 'string' == type (k) and not cfg.url_skip[k] then -- when parameter k is not positional and not in url skip table

+

url_param_t[k] = v; -- make a parameter/value list for extraneous url check

+

end

+

end

+

has_extraneous_url (url_param_t); -- look for url in parameter values where a url does not belong

+

return table.concat ({

+

frame:extensionTag ('templatestyles', '', {src=styles}),

+

citation0( config, args)

+

});

+

end

+

--[[--------------------------< E X P O R T E D F U N C T I O N S >------------------------------------------

+

]]

+

return {citation = citation};

Александр Машин

Бюрократы, steward, Администраторы

1712

правок

Изменения

Модуль:Citation/CS1 (посмотреть исходный код)

Версия от 18:09, 24 декабря 2023

Навигация

Поиск