Module:Citation/CS1/Configuration: Difference between revisions

m 1 revision imported: templates
m 1 revision imported: template update
 
(One intermediate revision by one other user not shown)
Line 1: Line 1:
local lang_obj = mw.language.getContentLanguage(); -- make a language object for the local language; used here for languages and dates  
local lang_obj = mw.language.getContentLanguage(); -- make a language object for the local language; used here for languages and dates  
--[[--------------------------< S E T T I N G S >--------------------------------------------------------------
boolean settings used to control various things.  These settings are located here to make them easy to find.
]]
-- these settings are local to this module only
local local_digits_from_mediawiki = false; -- for i18n; when true, module fills date_names['local_digits'] from MediaWiki; when false, that table must be filled manually; always false at en.wiki
local local_date_names_from_mediawiki = false; -- for i18n; when true, module fills date_names['local']['long'] and date_names['local']['short'] from MediaWiki;
-- when false, manual translation is required; always false at en.wiki
-- these settings are exported to other modules
local use_identifier_redirects = true; -- when true, use the redirect name for identifier label links; always true at en.wiki
local local_lang_cat_enable = false; -- when true, categorizes pages where |language=<local wiki's language>; always false at en.wiki
local date_name_auto_xlate_enable = false; -- when true, translates English month names to the local wiki's language month names; always false at en.wiki
local date_digit_auto_xlate_enable = false; -- when true, translates Western date digits to the local wiki's language digits (date_names['local_digits']); always false at en.wiki
local enable_sort_keys = true; -- when true, module adds namespace sort keys to error and maintenance category links


--[[--------------------------< U N C A T E G O R I Z E D _ N A M E S P A C E S >------------------------------
--[[--------------------------< U N C A T E G O R I Z E D _ N A M E S P A C E S >------------------------------
Line 12: Line 31:
]]
]]


uncategorized_namespaces_t = {[2]=true}; -- init with user namespace id
local uncategorized_namespaces_t = {[2]=true}; -- init with user namespace id
for k, _ in pairs (mw.site.talkNamespaces) do -- add all talk namespace ids
for k, _ in pairs (mw.site.talkNamespaces) do -- add all talk namespace ids
uncategorized_namespaces_t[k] = true;
uncategorized_namespaces_t[k] = true;
Line 19: Line 38:
local uncategorized_subpages = {'/[Ss]andbox', '/[Tt]estcases', '/[^/]*[Ll]og', '/[Aa]rchive'}; -- list of Lua patterns found in page names of pages we should not categorize
local uncategorized_subpages = {'/[Ss]andbox', '/[Tt]estcases', '/[^/]*[Ll]og', '/[Aa]rchive'}; -- list of Lua patterns found in page names of pages we should not categorize


--[[
at en.wiki Greek characters are used as sort keys for certain items in a category so that those items are
placed at the end of a category page.  See Wikipedia:Categorization#Sort_keys.  That works well for en.wiki
because English is written using the Latn script.  This may not work well for other languages.  At en.wiki it
is desirable to place content from certain namespaces at the end of a category listing so the module adds sort
keys to error and maintenance category links when rendering a cs1|2 template on a page in that namespace.
i18n: if this does not work well for your language, set <enable_sort_keys> to false.
]]
-- Maps a namespace id (or the string 'other') to the Greek-letter sort key that
-- is attached to error and maintenance category links for pages in that namespace.
local name_space_sort_keys = {
	[4] = 'ω',		-- omega: wikipedia namespace
	[10] = 'τ',		-- tau: template namespace
	[118] = 'Δ',	-- delta: draft namespace
	other = 'ο',	-- omicron: all other non-talk namespaces except main (article)
};


--[[--------------------------< M E S S A G E S >--------------------------------------------------------------
--[[--------------------------< M E S S A G E S >--------------------------------------------------------------
Line 34: Line 69:
['archived-dead'] = 'Archived from $1 on $2',
['archived-dead'] = 'Archived from $1 on $2',
['archived-live'] = '$1 from the original on $2',
['archived-live'] = '$1 from the original on $2',
['archived-missing'] = 'Archived from the original $1 on $2',
['archived-unfit'] = 'Archived from the original on ',
['archived-unfit'] = 'Archived from the original on ',
['archived'] = 'Archived',
['archived'] = 'Archived',
Line 48: Line 82:
['inset'] = '$1 inset',
['inset'] = '$1 inset',
['interview'] = 'Interviewed by $1',
['interview'] = 'Interviewed by $1',
['lay summary'] = 'Lay summary',
['mismatch'] = '<code class="cs1-code">&#124;$1=</code> / <code class="cs1-code">&#124;$2=</code> mismatch', -- $1 is year param name; $2 is date param name
['mismatch'] = '<code class="cs1-code">&#124;$1=</code> / <code class="cs1-code">&#124;$2=</code> mismatch', -- $1 is year param name; $2 is date param name
['newsgroup'] = '[[Usenet newsgroup|Newsgroup]]:&nbsp;$1',
['newsgroup'] = '[[Usenet newsgroup|Newsgroup]]:&nbsp;$1',
Line 98: Line 131:
-- categories
-- categories
['cat wikilink'] = '[[Category:$1]]', -- $1 is the category name
['cat wikilink'] = '[[Category:$1]]', -- $1 is the category name
['cat wikilink sk'] = '[[Category:$1|$2]]', -- $1 is the category name; $2 is namespace sort key
[':cat wikilink'] = '[[:Category:$1|link]]', -- category name as maintenance message wikilink; $1 is the category name
[':cat wikilink'] = '[[:Category:$1|link]]', -- category name as maintenance message wikilink; $1 is the category name


Line 125: Line 159:


local citation_class_map_t = { -- TODO: if kept, these and all other config.CitationClass 'names' require some sort of i18n
local citation_class_map_t = { -- TODO: if kept, these and all other config.CitationClass 'names' require some sort of i18n
['arxiv'] = 'arXiv',
['audio-visual'] = 'AV media',
['audio-visual'] = 'AV media',
['AV-media-notes'] = 'AV media notes',
['AV-media-notes'] = 'AV media notes',
['biorxiv'] = 'bioRxiv',
['citeseerx'] = 'CiteSeerX',
['encyclopaedia'] = 'encyclopedia',
['encyclopaedia'] = 'encyclopedia',
['mailinglist'] = 'mailing list',
['mailinglist'] = 'mailing list',
['pressrelease'] = 'press release'
['medrxiv'] = 'medRxiv',
['pressrelease'] = 'press release',
['ssrn'] = 'SSRN',
['techreport'] = 'tech report',
}
}


Line 179: Line 219:


['ext-link-access-signal'] = '<span class="$1" title="$2">$3</span>', -- external link with appropriate lock icon
['ext-link-access-signal'] = '<span class="$1" title="$2">$3</span>', -- external link with appropriate lock icon
['free'] = {class='cs1-lock-free', title='Freely accessible'}, -- classes defined in Module:Citation/CS1/styles.css
['free'] = {class='id-lock-free', title='Freely accessible'}, -- classes defined in Module:Citation/CS1/styles.css
['registration'] = {class='cs1-lock-registration', title='Free registration required'},
['registration'] = {class='id-lock-registration', title='Free registration required'},
['limited'] = {class='cs1-lock-limited', title='Free access subject to limited trial, subscription normally required'},
['limited'] = {class='id-lock-limited', title='Free access subject to limited trial, subscription normally required'},
['subscription'] = {class='cs1-lock-subscription', title='Paid subscription required'},
['subscription'] = {class='id-lock-subscription', title='Paid subscription required'},


['interwiki-icon'] = '<span class="$1" title="$2">$3</span>',
['interwiki-icon'] = '<span class="$1" title="$2">$3</span>',
Line 242: Line 282:
['ASINTLD'] = 'asin-tld',
['ASINTLD'] = 'asin-tld',
['At'] = 'at', -- Used by InternetArchiveBot
['At'] = 'at', -- Used by InternetArchiveBot
['Authors'] = {'authors', 'people', 'credits'},
['Authors'] = {'people', 'credits'},
['BookTitle'] = {'book-title', 'booktitle'},
['BookTitle'] = {'book-title', 'booktitle'},
['Cartography'] = 'cartography',
['Cartography'] = 'cartography',
Line 248: Line 288:
['ChapterFormat'] = {'chapter-format', 'contribution-format', 'entry-format',
['ChapterFormat'] = {'chapter-format', 'contribution-format', 'entry-format',
'article-format', 'section-format'};
'article-format', 'section-format'};
['ChapterURL'] = {'chapter-url', 'contribution-url', 'entry-url', 'article-url', 'section-url', 'chapterurl'}, -- Used by InternetArchiveBot
['ChapterURL'] = {'chapter-url', 'contribution-url', 'entry-url', 'article-url', 'section-url'}, -- Used by InternetArchiveBot
['ChapterUrlAccess'] = {'chapter-url-access', 'contribution-url-access',
['ChapterUrlAccess'] = {'chapter-url-access', 'contribution-url-access',
'entry-url-access', 'article-url-access', 'section-url-access'}, -- Used by InternetArchiveBot
'entry-url-access', 'article-url-access', 'section-url-access'}, -- Used by InternetArchiveBot
Line 275: Line 315:
['Issue'] = {'issue', 'number'},
['Issue'] = {'issue', 'number'},
['Language'] = {'language', 'lang'},
['Language'] = {'language', 'lang'},
['LayDate'] = 'lay-date',
['LayFormat'] = 'lay-format',
['LaySource'] = 'lay-source',
['LayURL'] = 'lay-url',
['MailingList'] = {'mailing-list', 'mailinglist'}, -- cite mailing list only
['MailingList'] = {'mailing-list', 'mailinglist'}, -- cite mailing list only
['Map'] = 'map', -- cite map only
['Map'] = 'map', -- cite map only
Line 309: Line 345:
['ScriptChapter'] = {'script-chapter', 'script-contribution', 'script-entry',
['ScriptChapter'] = {'script-chapter', 'script-contribution', 'script-entry',
'script-article', 'script-section'},
'script-article', 'script-section'},
['ScriptEncyclopedia'] = {'script-encyclopedia', 'script-encyclopaedia'}, -- cite encyclopedia only
['ScriptMap'] = 'script-map',
['ScriptMap'] = 'script-map',
['ScriptPeriodical'] = {'script-journal', 'script-magazine', 'script-newspaper',
['ScriptPeriodical'] = {'script-journal', 'script-magazine', 'script-newspaper',
Line 326: Line 363:
['Title'] = 'title', -- Used by InternetArchiveBot
['Title'] = 'title', -- Used by InternetArchiveBot
['TitleLink'] = {'title-link', 'episode-link', 'episodelink'}, -- Used by InternetArchiveBot
['TitleLink'] = {'title-link', 'episode-link', 'episodelink'}, -- Used by InternetArchiveBot
['TitleNote'] = 'department',
['TitleNote'] = {'title-note', 'department'},
['TitleType'] = {'type', 'medium'},
['TitleType'] = {'type', 'medium'},
['TransChapter'] = {'trans-article', 'trans-chapter', 'trans-contribution',
['TransChapter'] = {'trans-article', 'trans-chapter', 'trans-contribution',
Line 332: Line 369:
['Transcript'] = 'transcript',
['Transcript'] = 'transcript',
['TranscriptFormat'] = 'transcript-format',
['TranscriptFormat'] = 'transcript-format',
['TranscriptURL'] = {'transcript-url', 'transcripturl'}, -- Used by InternetArchiveBot
['TranscriptURL'] = 'transcript-url', -- Used by InternetArchiveBot
['TransEncyclopedia'] = {'trans-encyclopedia', 'trans-encyclopaedia'}, -- cite encyclopedia only
['TransMap'] = 'trans-map', -- cite map only
['TransMap'] = 'trans-map', -- cite map only
['TransPeriodical'] = {'trans-journal', 'trans-magazine', 'trans-newspaper',
['TransPeriodical'] = {'trans-journal', 'trans-magazine', 'trans-newspaper',
Line 347: Line 385:
['Year'] = 'year',
['Year'] = 'year',


['AuthorList-First'] = {"first#", "author-first#", "author#-first", "given#",
['AuthorList-First'] = {"first#", "author-first#", "author#-first", "author-given#", "author#-given",
"author-given#", "author#-given"},
"subject-first#", "subject#-first", "subject-given#", "subject#-given",
['AuthorList-Last'] = {"last#", "author-last#", "author#-last", "surname#",
"given#"},
"author-surname#", "author#-surname", "author#", "subject#", 'host#'},
['AuthorList-Last'] = {"last#", "author-last#", "author#-last", "author-surname#", "author#-surname",
"subject-last#", "subject#-last", "subject-surname#", "subject#-surname",
"author#", 'host#', "subject#", "surname#"},
['AuthorList-Link'] = {"author-link#", "author#-link", "subject-link#",
['AuthorList-Link'] = {"author-link#", "author#-link", "subject-link#",
"subject#-link", "authorlink#", "author#link"},
"subject#-link", "authorlink#", "author#link"},
Line 394: Line 434:
'AuthorList-Mask', 'ContributorList-Mask', 'EditorList-Mask', 'InterviewerList-Mask', 'TranslatorList-Mask', -- name-list mask may have name separators
'AuthorList-Mask', 'ContributorList-Mask', 'EditorList-Mask', 'InterviewerList-Mask', 'TranslatorList-Mask', -- name-list mask may have name separators
'PostScript', 'Quote', 'ScriptQuote', 'TransQuote', 'Ref', -- miscellaneous
'PostScript', 'Quote', 'ScriptQuote', 'TransQuote', 'Ref', -- miscellaneous
'ArchiveURL', 'ChapterURL', 'ConferenceURL', 'LayURL', 'MapURL', 'TranscriptURL', 'URL', -- URL-holding parameters
'ArchiveURL', 'ChapterURL', 'ConferenceURL', 'MapURL', 'TranscriptURL', 'URL', -- URL-holding parameters
}
}


local url_meta_params = { -- table of aliases[] keys (meta parameters); each key has a table of parameter names for a value
local url_meta_params = { -- table of aliases[] keys (meta parameters); each key has a table of parameter names for a value
'ArchiveURL', 'ChapterURL', 'ConferenceURL', 'ID', 'LayURL', 'MapURL', 'TranscriptURL', 'URL', -- parameters allowed to hold urls
'ArchiveURL', 'ChapterURL', 'ConferenceURL', 'ID', 'MapURL', 'TranscriptURL', 'URL', -- parameters allowed to hold urls
'Page', 'Pages', 'At', 'QuotePage', 'QuotePages', -- insource locators allowed to hold urls
'Page', 'Pages', 'At', 'QuotePage', 'QuotePages', -- insource locators allowed to hold urls
}
}
Line 432: Line 472:
]]
]]


local single_letter_2nd_lvl_domains_t = {'cash', 'company', 'foundation', 'org', 'today'};
local single_letter_2nd_lvl_domains_t = {'cash', 'company', 'foundation', 'media', 'org', 'today'};




Line 443: Line 483:


]]
]]
local is_Latn = 'A-Za-z\195\128-\195\150\195\152-\195\182\195\184-\198\191\199\132-\201\143';
local is_Latn = 'A-Za-z\195\128-\195\150\195\152-\195\182\195\184-\198\191\199\132-\201\143\225\184\128-\225\187\191';
local special_case_translation = {
local special_case_translation = {
['AuthorList'] = 'authors list', -- used to assemble maintenance category names
['AuthorList'] = 'authors list', -- used to assemble maintenance category names
Line 476: Line 516:
{['en'] = {'website is for sale', true}, ['local'] = nil},
{['en'] = {'website is for sale', true}, ['local'] = nil},
{['en'] = {'^404', false}, ['local'] = nil},
{['en'] = {'^404', false}, ['local'] = nil},
{['en'] = {'error[ %-]404', false}, ['local'] = nil},
{['en'] = {'internet archive wayback machine', true}, ['local'] = nil},
{['en'] = {'internet archive wayback machine', true}, ['local'] = nil},
{['en'] = {'log into facebook', true}, ['local'] = nil},
{['en'] = {'log into facebook', true}, ['local'] = nil},
Line 499: Line 540:
{['en'] = {'allmusic', true}, ['local'] = nil},
{['en'] = {'allmusic', true}, ['local'] = nil},
{['en'] = {'%f[%a][Aa]uthor%f[%A]', false}, ['local'] = nil},
{['en'] = {'%f[%a][Aa]uthor%f[%A]', false}, ['local'] = nil},
{['en'] = {'^[Bb]ureau$', false}, ['local'] = nil},
{['en'] = {'business', true}, ['local'] = nil},
{['en'] = {'business', true}, ['local'] = nil},
{['en'] = {'cnn', true}, ['local'] = nil},
{['en'] = {'cnn', true}, ['local'] = nil},
{['en'] = {'collaborator', true}, ['local'] = nil},
{['en'] = {'collaborator', true}, ['local'] = nil},
{['en'] = {'^[Cc]ompany$', false}, ['local'] = nil},
{['en'] = {'contributor', true}, ['local'] = nil},
{['en'] = {'contributor', true}, ['local'] = nil},
{['en'] = {'contact us', true}, ['local'] = nil},
{['en'] = {'contact us', true}, ['local'] = nil},
{['en'] = {'correspondent', true}, ['local'] = nil},
{['en'] = {'^[Dd]esk$', false}, ['local'] = nil},
{['en'] = {'directory', true}, ['local'] = nil},
{['en'] = {'directory', true}, ['local'] = nil},
{['en'] = {'%f[%(%[][%(%[]%s*eds?%.?%s*[%)%]]?$', false}, ['local'] = nil},
{['en'] = {'%f[%(%[][%(%[]%s*eds?%.?%s*[%)%]]?$', false}, ['local'] = nil},
Line 511: Line 556:
{['en'] = {'%f[%a][Ee]dited%f[%A]', false}, ['local'] = nil},
{['en'] = {'%f[%a][Ee]dited%f[%A]', false}, ['local'] = nil},
{['en'] = {'%f[%a][Ee]ditors?%f[%A]', false}, ['local'] = nil},
{['en'] = {'%f[%a][Ee]ditors?%f[%A]', false}, ['local'] = nil},
{['en'] = {'%f[%a]]Ee]mail%f[%A]', false}, ['local'] = nil},
{['en'] = {'%f[%a][Ee]mail%f[%A]', false}, ['local'] = nil},
{['en'] = {'facebook', true}, ['local'] = nil},
{['en'] = {'facebook', true}, ['local'] = nil},
{['en'] = {'google', true}, ['local'] = nil},
{['en'] = {'google', true}, ['local'] = nil},
{['en'] = {'^[Gg]roup$', false}, ['local'] = nil},
{['en'] = {'home page', true}, ['local'] = nil},
{['en'] = {'home page', true}, ['local'] = nil},
{['en'] = {'^[Ii]nc%.?$', false}, ['local'] = nil},
{['en'] = {'^[Ii]nc%.?$', false}, ['local'] = nil},
{['en'] = {'instagram', true}, ['local'] = nil},
{['en'] = {'instagram', true}, ['local'] = nil},
{['en'] = {'interviewer', true}, ['local'] = nil},
{['en'] = {'interviewer', true}, ['local'] = nil},
{['en'] = {'^[Ll]imited$', false}, ['local'] = nil},
{['en'] = {'linkedIn', true}, ['local'] = nil},
{['en'] = {'linkedIn', true}, ['local'] = nil},
{['en'] = {'^[Nn]ews$', false}, ['local'] = nil},
{['en'] = {'^[Nn]ews$', false}, ['local'] = nil},
{['en'] = {'[Nn]ews[ %-]?[Rr]oom', false}, ['local'] = nil},
{['en'] = {'pinterest', true}, ['local'] = nil},
{['en'] = {'pinterest', true}, ['local'] = nil},
{['en'] = {'policy', true}, ['local'] = nil},
{['en'] = {'policy', true}, ['local'] = nil},
Line 561: Line 609:


local_date_names_from_mediawiki is a boolean.  When set to:
local_date_names_from_mediawiki is a boolean.  When set to:
true – module will fetch local month names from MediaWiki for both date_names['local']['long'] and date_names['local']['short']
true – module will fetch local month names from MediaWiki for both date_names['local']['long'] and date_names['local']['short']; this will unconditionally overwrite manual translations
false – module will *not* fetch local month names from MediaWiki
false – module will *not* fetch local month names from MediaWiki


Line 573: Line 621:
]]
]]


local local_date_names_from_mediawiki = true; -- when false, manual translation required for date_names['local']['long'] and date_names['local']['short']
local local_date_names_from_mediawiki = true; -- when false, manual translation required for date_names['local']['long'] and date_names['local']['short']; overwrites manual translations
-- when true, module fetches long and short month names from MediaWiki
-- when true, module fetches long and short month names from MediaWiki
local date_names = {
local date_names = {
Line 617: Line 665:
date_names[invert_t[2]][i] = name; -- invert to get [i] = 'name' for conversions from ymd
date_names[invert_t[2]][i] = name; -- invert to get [i] = 'name' for conversions from ymd
end
end
end
if local_digits_from_mediawiki then -- only when the module is configured to take local digits from MediaWiki
	local local_to_western_t = {}; -- map: digit as formatted by the content language => Western digit (a string)
	local western = 0;
	while western <= 9 do -- visit 0 through 9 in ascending order
		local local_digit = lang_obj:formatNum (western); -- content-language rendering of this digit becomes the key
		local_to_western_t[local_digit] = tostring (western); -- the value is the Western digit as a string
		western = western + 1;
	end
	date_names['local_digits'] = local_to_western_t; -- publish the finished map
end
end


Line 638: Line 694:
'{{ *([Mm]DY) *[|}]', -- 0
'{{ *([Mm]DY) *[|}]', -- 0
}
}
-- Fetch the wikitext of the current page once, at module load.  Per the original
-- author's note, Template namespace (id 10) is skipped so that unused templates
-- still appear in unused-template reports (self-transclusion makes them look used).
local title_object = mw.title.getCurrentTitle();
local content = nil; -- stays nil when the current page is in Template namespace
if title_object.namespace ~= 10 then -- every namespace except Template
	local page_text = title_object:getContent();
	if page_text then
		content = page_text;
	else
		content = ''; -- new pages edited w/ve do not have 'content' until saved; ve does not preview; phab:T221625
	end
end


local function get_date_format ()
local function get_date_format ()
local title_object = mw.title.getCurrentTitle();
if not content then -- nil content when we're in template
if title_object.namespace == 10 then -- not in template space so that unused templates appear in unused-template-reports;
return nil; -- auto-formatting does not work in Template space so don't set global_df
return nil; -- auto-formatting does not work in Template space so don't set global_df
end
end
local content = title_object:getContent() or ''; -- get the content of the article or ''; new pages edited w/ve do not have 'content' until saved; ve does not preview; phab:T221625
for _, pattern in ipairs (df_template_patterns) do -- loop through the patterns looking for {{Use dmy dates}} or {{Use mdy dates}} or any of their redirects
for _, pattern in ipairs (df_template_patterns) do -- loop through the patterns looking for {{Use dmy dates}} or {{Use mdy dates}} or any of their redirects
local start, _, match = content:find(pattern); -- match is the three letters indicating desired date format
local start, _, match = content:find(pattern); -- match is the three letters indicating desired date format
if match then
if match then
content = content:match ('%b{}', start); -- get the whole template
local use_dates_template = content:match ('%b{}', start); -- get the whole template
if content:match ('| *cs1%-dates *= *[lsy][sy]?') then -- look for |cs1-dates=publication date length access-/archive-date length
if use_dates_template:match ('| *cs1%-dates *= *[lsy][sy]?') then -- look for |cs1-dates=publication date length access-/archive-date length
return match:lower() .. '-' .. content:match ('| *cs1%-dates *= *([lsy][sy]?)');
return match:lower() .. '-' .. use_dates_template:match ('| *cs1%-dates *= *([lsy][sy]?)');
else
else
return match:lower() .. '-all'; -- no |cs1-dates= k/v pair; return value appropriate for use in |df=
return match:lower() .. '-all'; -- no |cs1-dates= k/v pair; return value appropriate for use in |df=
Line 658: Line 718:
end
end


local global_df;
local global_df; -- TODO: add this to <global_cs1_config_t>?




Line 704: Line 764:
'^[Pp]gs.?',
'^[Pp]gs.?',
},
},
vpatterns = { -- patterns for |volume=
vi_patterns_t = { -- combined to catch volume-like text in |issue= and issue-like text in |volume=
'^volumes?',
'^volumes?', -- volume-like text
'^vols?[%.:=]?'
'^vols?[%.:=]?',
},
 
ipatterns = { -- patterns for |issue=
'^issues?', --issue-like text
'^issues?',
'^iss[%.:=]?',
'^iss[%.:=]?',
'^numbers?',
'^numbers?',
'^nos?%A', -- don't match 'november' or 'nostradamus'
'^nos?%A', -- don't match 'november' or 'nostradamus'
'^nr[%.:=]?',
'^nr[%.:=]?',
'^n[%.:= ]' -- might be a valid issue without separator (space char is sep char here)
'^n[%.:= ]', -- might be a valid issue without separator (space char is sep char here)
}
'^n°', -- 'n' with degree sign (U+00B0)
'^№', -- precomposed unicode numero character (U+2116)
},
}
}


Line 850: Line 911:




--[[---------------------< S T R I P M A R K E R S >----------------------------
--[[--------------------------< C S 1 _ C O N F I G _ G E T >--------------------------------------------------


Common pattern definition location for stripmarkers so that we don't have to go
fetch and validate values from {{cs1 config}} template to fill <global_cs1_config_t>
hunting for them if (when) MediaWiki changes their form.


]]
no error messages; when errors are detected, the parameter value from {{cs1 config}} is blanked.


local stripmarkers = {
Supports all parameters and aliases associated with the metaparameters: DisplayAuthors, DisplayContributors,
['any'] = '\127[^\127]*UNIQ%-%-(%a+)%-[%a%d]+%-QINU[^\127]*\127', -- capture returns name of stripmarker
DisplayEditors, DisplayInterviewers, DisplayTranslators, NameListStyle, and Mode.  The DisplayWhatever metaparameters
['math'] = '\127[^\127]*UNIQ%-%-math%-[%a%d]+%-QINU[^\127]*\127' -- math stripmarkers used in coins_cleanup() and coins_replace_math_stripmarker()
accept numeric values only (|display-authors=etal and the like is not supported).
}


]]


--[[------------< I N V I S I B L E _ C H A R A C T E R S >---------------------
local global_cs1_config_t = {}; -- TODO: add value returned from get_date_format() to this table?


This table holds non-printing or invisible characters indexed either by name or
local function get_cs1_config ()
by Unicode group. Values are decimal representations of UTF-8 codes.  The table
if not content then -- nil content when we're in template
is organized as a table of tables because the Lua pairs keyword returns table
return nil; -- auto-formatting does not work in Template space so don't set global_df
data in an arbitrary order.  Here, we want to process the table from top to bottom
end
because the entries at the top of the table are also found in the ranges specified
 
by the entries at the bottom of the table.
local start = content:find('{{ *[Cc][Ss]1 config *[|}]'); -- <start> is offset into <content> when {{cs1 config}} found; nil else
if start then
local cs1_config_template = content:match ('%b{}', start); -- get the whole template


Also here is a pattern that recognizes stripmarkers that begin and end with the
if not cs1_config_template then
delete characters.  The nowiki stripmarker is not an error but some others are
return nil;
because the parameter values that include them become part of the template's
end
metadata before stripmarker replacement.


]]
local params_t = mw.text.split (cs1_config_template:gsub ('^{{%s*', ''):gsub ('%s*}}$', ''), '%s*|%s*'); -- remove '{{' and '}}'; make a sequence of parameter/value pairs (split on the pipe)
table.remove (params_t, 1); -- remove the template name because it isn't a parameter/value pair


local invisible_defs = {
local config_meta_params_t = {'DisplayAuthors', 'DisplayContributors', 'DisplayEditors', 'DisplayInterviewers', 'DisplayTranslators', 'NameListStyle', 'Mode'};
del = '\127', -- used to distinguish between stripmarker and del char
local meta_param_map_t = {}; -- list of accepted parameter names usable in {{cs1 config}} goes here
zwj = '\226\128\141', -- used with capture because zwj may be allowed
}
for _, meta_param in ipairs (config_meta_params_t) do -- for i18n using <config_meta_params_t>, map template parameter names to their metaparameter equivalents
if 'table' == type (aliases[meta_param]) then -- if <meta_param> is a sequence,
for _, param in ipairs (aliases[meta_param]) do -- extract its contents
meta_param_map_t[param] = meta_param; -- and add to <meta_param_map_t>
end
else
meta_param_map_t[aliases[meta_param]] = meta_param; -- not a sequence so just add the parameter to <meta_param_map_t>
end
end
 
local keywords_t = {}; -- map valid keywords to their associate metaparameter; reverse form of <keyword_lists[key] for these metaparameters
for _, metaparam_t in ipairs ({{'NameListStyle', 'name-list-style'}, {'Mode', 'mode'}}) do -- only these metaparameter / keywords_lists key pairs
for _, keyword in ipairs (keywords_lists[metaparam_t[2]]) do -- spin through the list of keywords
keywords_t[keyword] = metaparam_t[1]; -- add [keyword] = metaparameter to the map
end
end
 
for _, param in ipairs (params_t) do -- spin through the {{cs1 config}} parameters and fill <global_cs1_config_t>
local k, v = param:match ('([^=]-)%s*=%s*(.+)'); -- <k> is the parameter name; <v> is parameter's assigned value
if k then
if k:find ('^display') then -- if <k> is one of the |display-<namelist>= parameters
if v:match ('%d+') then -- the assigned value must be digits; doesn't accept 'etal'
global_cs1_config_t[meta_param_map_t[k]]=v; -- add the display param and its value to globals table
end
else
if keywords_t[v] == meta_param_map_t[k] then -- keywords_t[v] returns nil or the metaparam name; these must be the same
global_cs1_config_t[meta_param_map_t[k]]=v; -- add the parameter and its value to globals table
end
end
end
end
end
end
 
get_cs1_config (); -- fill <global_cs1_config_t>


-- Ordered sequence of {name, pattern} pairs describing invisible or non-printing
-- characters.  The order is significant: specific entries come first, and the
-- 'delete' entry must follow the 'stripmarker' entry (see the note on that line).
-- NOTE(review): several patterns put multi-byte UTF-8 sequences inside a set
-- ([...]); that presumably relies on a Unicode-aware matcher – confirm against the consumer.
local invisible_chars = {
{'replacement', '\239\191\189'}, -- U+FFFD, EF BF BD
{'zero width joiner', '('.. invisible_defs.zwj .. ')'}, -- U+200D, E2 80 8D; capture because zwj may be allowed
{'zero width space', '\226\128\139'}, -- U+200B, E2 80 8B
{'hair space', '\226\128\138'}, -- U+200A, E2 80 8A
{'soft hyphen', '\194\173'}, -- U+00AD, C2 AD
{'horizontal tab', '\009'}, -- U+0009 (HT), 09
{'line feed', '\010'}, -- U+000A (LF), 0A
{'no-break space', '\194\160'}, -- U+00A0 (NBSP), C2 A0
{'carriage return', '\013'}, -- U+000D (CR), 0D
{'stripmarker', stripmarkers.any}, -- stripmarker; may or may not be an error; capture returns the stripmarker type
{'delete', '('.. invisible_defs.del .. ')'}, -- U+007F (DEL), 7F; must be done after stripmarker test; capture to distinguish isolated del chars not part of stripmarker
{'C0 control', '[\000-\008\011\012\014-\031]'}, -- U+0000–U+001F (NULL–US), 00–1F (except HT, LF, CR (09, 0A, 0D))
{'C1 control', '[\194\128-\194\159]'}, -- U+0080–U+009F (XXX–APC), C2 80 – C2 9F
-- the entries below are disabled (commented out)
-- {'Specials', '[\239\191\185-\239\191\191]'}, -- U+FFF9-U+FFFF, EF BF B9 – EF BF BF
-- {'Private use area', '[\238\128\128-\239\163\191]'}, -- U+E000–U+F8FF, EE 80 80 – EF A3 BF
-- {'Supplementary Private Use Area-A', '[\243\176\128\128-\243\191\191\189]'}, -- U+F0000–U+FFFFD, F3 B0 80 80 – F3 BF BF BD
-- {'Supplementary Private Use Area-B', '[\244\128\128\128-\244\143\191\189]'}, -- U+100000–U+10FFFD, F4 80 80 80 – F4 8F BF BD
}


--[[
--[[---------------------< S T R I P M A R K E R S >----------------------------


Indic script makes use of zero width joiner as a character modifier so zwj
Common pattern definition location for stripmarkers so that we don't have to go
characters must be left in.  This pattern covers all of the unicode characters
hunting for them if (when) MediaWiki changes their form.
for these languages:
Devanagari 0900–097F – https://unicode.org/charts/PDF/U0900.pdf
Devanagari extended A8E0–A8FF – https://unicode.org/charts/PDF/UA8E0.pdf
Bengali 0980–09FF – https://unicode.org/charts/PDF/U0980.pdf
Gurmukhi 0A00–0A7F – https://unicode.org/charts/PDF/U0A00.pdf
Gujarati 0A80–0AFF – https://unicode.org/charts/PDF/U0A80.pdf
Oriya 0B00–0B7F – https://unicode.org/charts/PDF/U0B00.pdf
Tamil 0B80–0BFF – https://unicode.org/charts/PDF/U0B80.pdf
Telugu 0C00–0C7F – https://unicode.org/charts/PDF/U0C00.pdf
Kannada 0C80–0CFF – https://unicode.org/charts/PDF/U0C80.pdf
Malayalam 0D00–0D7F – https://unicode.org/charts/PDF/U0D00.pdf
plus the not-necessarily Indic scripts for Sinhala and Burmese:
Sinhala 0D80-0DFF - https://unicode.org/charts/PDF/U0D80.pdf
Myanmar 1000-109F - https://unicode.org/charts/PDF/U1000.pdf
Myanmar extended A AA60-AA7F - https://unicode.org/charts/PDF/UAA60.pdf
Myanmar extended B A9E0-A9FF - https://unicode.org/charts/PDF/UA9E0.pdf
the pattern is used by has_invisible_chars() and coins_cleanup()


]]
]]


local indic_script = '[\224\164\128-\224\181\191\224\163\160-\224\183\191\225\128\128-\225\130\159\234\167\160-\234\167\191\234\169\160-\234\169\191]';
-- Lua patterns for MediaWiki stripmarkers, which are delimited by DEL (\127) characters.
local stripmarkers = {
	-- matches any stripmarker; the single capture is the stripmarker's type name
	any = '\127[^\127]*UNIQ%-%-(%a+)%-[%a%d]+%-QINU[^\127]*\127',
	-- matches math stripmarkers only; per the original note, used in coins_cleanup() and coins_replace_math_stripmarker()
	math = '\127[^\127]*UNIQ%-%-math%-[%a%d]+%-QINU[^\127]*\127',
};
 
 
--[[------------< I N V I S I B L E _ C H A R A C T E R S >---------------------


-- list of emoji that use a zwj character (U+200D) to combine with another emoji
This table holds non-printing or invisible characters indexed either by name or
-- from: https://unicode.org/Public/emoji/15.0/emoji-zwj-sequences.txt; version: 15.0; 2022-05-06
by Unicode group. Values are decimal representations of UTF-8 codes. The table
-- table created by: [[:en:Module:Make emoji zwj table]]
is organized as a table of tables because the Lua pairs keyword returns table
local emoji_t = { -- indexes are decimal forms of the hex values in U+xxxx
data in an arbitrary order. Here, we want to process the table from top to bottom
[9760] = true, -- U+2620 ☠ skull and crossbones
because the entries at the top of the table are also found in the ranges specified
[9792] = true, -- U+2640 ♀ female sign
by the entries at the bottom of the table.
[9794] = true, -- U+2642 ♂ male sign
 
[9877] = true, -- U+2695 ⚕ staff of aesculapius
Also here is a pattern that recognizes stripmarkers that begin and end with the
[9878] = true, -- U+2696 ⚖ scales
delete characters.  The nowiki stripmarker is not an error but some others are
[9895] = true, -- U+26A7 ⚧ male with stroke and male and female sign
because the parameter values that include them become part of the template's
[9992] = true, -- U+2708 ✈ airplane
metadata before stripmarker replacement.
[10052] = true, -- U+2744 ❄ snowflake
 
[10084] = true, -- U+2764 ❤ heavy black heart
]]
[11035] = true, -- U+2B1B ⬛ black large square
 
[127752] = true, -- U+1F308 🌈 rainbow
local invisible_defs = {
[127787] = true, -- U+1F32B 🌫 fog
del = '\127', -- used to distinguish between stripmarker and del char
[127806] = true, -- U+1F33E 🌾 ear of rice
zwj = '\226\128\141', -- used with capture because zwj may be allowed
[127859] = true, -- U+1F373 🍳 cooking
}
[127868] = true, -- U+1F37C 🍼 baby bottle
 
[127876] = true, -- U+1F384 🎄 christmas tree
local invisible_chars = {
[127891] = true, -- U+1F393 🎓 graduation cap
{'replacement', '\239\191\189'}, -- U+FFFD, EF BF BD
[127908] = true, -- U+1F3A4 🎤 microphone
{'zero width joiner', '('.. invisible_defs.zwj .. ')'}, -- U+200D, E2 80 8D; capture because zwj may be allowed
[127912] = true, -- U+1F3A8 🎨 artist palette
{'zero width space', '\226\128\139'}, -- U+200B, E2 80 8B
[127979] = true, -- U+1F3EB 🏫 school
{'hair space', '\226\128\138'}, -- U+200A, E2 80 8A
[127981] = true, -- U+1F3ED 🏭 factory
{'soft hyphen', '\194\173'}, -- U+00AD, C2 AD
[128102] = true, -- U+1F466 👦 boy
{'horizontal tab', '\009'}, -- U+0009 (HT), 09
[128103] = true, -- U+1F467 👧 girl
{'line feed', '\010'}, -- U+000A (LF), 0A
[128104] = true, -- U+1F468 👨 man
{'no-break space', '\194\160'}, -- U+00A0 (NBSP), C2 A0
[128105] = true, -- U+1F469 👩 woman
{'carriage return', '\013'}, -- U+000D (CR), 0D
[128139] = true, -- U+1F48B 💋 kiss mark
{'stripmarker', stripmarkers.any}, -- stripmarker; may or may not be an error; capture returns the stripmaker type
[128168] = true, -- U+1F4A8 💨 dash symbol
{'delete', '('.. invisible_defs.del .. ')'}, -- U+007F (DEL), 7F; must be done after stripmarker test; capture to distinguish isolated del chars not part of stripmarker
[128171] = true, -- U+1F4AB 💫 dizzy symbol
{'C0 control', '[\000-\008\011\012\014-\031]'}, -- U+0000–U+001F (NULL–US), 00–1F (except HT, LF, CR (09, 0A, 0D))
[128187] = true, -- U+1F4BB 💻 personal computer
{'C1 control', '[\194\128-\194\159]'}, -- U+0080–U+009F (XXX–APC), C2 80 – C2 9F
[128188] = true, -- U+1F4BC 💼 brief case
-- {'Specials', '[\239\191\185-\239\191\191]'}, -- U+FFF9-U+FFFF, EF BF B9 – EF BF BF
[128293] = true, -- U+1F525 🔥 fire
-- {'Private use area', '[\238\128\128-\239\163\191]'}, -- U+E000–U+F8FF, EE 80 80 – EF A3 BF
[128295] = true, -- U+1F527 🔧 wrench
-- {'Supplementary Private Use Area-A', '[\243\176\128\128-\243\191\191\189]'}, -- U+F0000–U+FFFFD, F3 B0 80 80 – F3 BF BF BD
[128300] = true, -- U+1F52C 🔬 microscope
-- {'Supplementary Private Use Area-B', '[\244\128\128\128-\244\143\191\189]'}, -- U+100000–U+10FFFD, F4 80 80 80 – F4 8F BF BD
[128488] = true, -- U+1F5E8 🗨 left speech bubble
[128640] = true, -- U+1F680 🚀 rocket
[128658] = true, -- U+1F692 🚒 fire engine
[129309] = true, -- U+1F91D 🤝 handshake
[129455] = true, -- U+1F9AF 🦯 probing cane
[129456] = true, -- U+1F9B0 🦰 emoji component red hair
[129457] = true, -- U+1F9B1 🦱 emoji component curly hair
[129458] = true, -- U+1F9B2 🦲 emoji component bald
[129459] = true, -- U+1F9B3 🦳 emoji component white hair
[129466] = true, -- U+1F9BA 🦺 safety vest
[129468] = true, -- U+1F9BC 🦼 motorized wheelchair
[129469] = true, -- U+1F9BD 🦽 manual wheelchair
[129489] = true, -- U+1F9D1 🧑 adult
[129657] = true, -- U+1FA79 🩹 adhesive bandage
[129778] = true, -- U+1FAF2 🫲 leftwards hand
}
}


--[[


--[[----------------------< L A N G U A G E  S U P P O R T >-------------------
Indic script makes use of zero width joiner as a character modifier so zwj
 
characters must be left in.  This pattern covers all of the unicode characters
These tables and constants support various language-specific functionality.
for these languages:
 
Devanagari 0900–097F – https://unicode.org/charts/PDF/U0900.pdf
]]
Devanagari extended A8E0–A8FF – https://unicode.org/charts/PDF/UA8E0.pdf
 
Bengali 0980–09FF – https://unicode.org/charts/PDF/U0980.pdf
--local this_wiki_code = mw.getContentLanguage():getCode(); -- get this wiki's language code
Gurmukhi 0A00–0A7F – https://unicode.org/charts/PDF/U0A00.pdf
local this_wiki_code = lang_obj:getCode(); -- get this wiki's language code
Gujarati 0A80–0AFF – https://unicode.org/charts/PDF/U0A80.pdf
if string.match (mw.site.server, 'wikidata') then
Oriya 0B00–0B7F – https://unicode.org/charts/PDF/U0B00.pdf
this_wiki_code = mw.getCurrentFrame():preprocess('{{int:lang}}'); -- on Wikidata so use interface language setting instead
Tamil 0B80–0BFF – https://unicode.org/charts/PDF/U0B80.pdf
end
Telugu 0C00–0C7F – https://unicode.org/charts/PDF/U0C00.pdf
Kannada 0C80–0CFF – https://unicode.org/charts/PDF/U0C80.pdf
Malayalam 0D00–0D7F – https://unicode.org/charts/PDF/U0D00.pdf
plus the not-necessarily Indic scripts for Sinhala and Burmese:
Sinhala 0D80-0DFF - https://unicode.org/charts/PDF/U0D80.pdf
Myanmar 1000-109F - https://unicode.org/charts/PDF/U1000.pdf
Myanmar extended A AA60-AA7F - https://unicode.org/charts/PDF/UAA60.pdf
Myanmar extended B A9E0-A9FF - https://unicode.org/charts/PDF/UA9E0.pdf
the pattern is used by has_invisible_chars() and coins_cleanup()


local mw_languages_by_tag_t = mw.language.fetchLanguageNames (this_wiki_code, 'all'); -- get a table of language tag/name pairs known to Wikimedia; used for interwiki tests
]]
local mw_languages_by_name_t = {};
for k, v in pairs (mw_languages_by_tag_t) do -- build a 'reversed' table name/tag language pairs know to MediaWiki; used for |language=
v = mw.ustring.lower (v); -- lowercase for tag fetch; get name's proper case from mw_languages_by_tag_t[<tag>]
if mw_languages_by_name_t[v] then -- when name already in the table
if 2 == #k or 3 == #k then -- if tag does not have subtags
mw_languages_by_name_t[v] = k; -- prefer the shortest tag for this name
end
else -- here when name not in the table
mw_languages_by_name_t[v] = k; -- so add name and matching tag
end
end


local inter_wiki_map = {}; -- map of interwiki prefixes that are language-code prefixes
local indic_script = '[\224\164\128-\224\181\191\224\163\160-\224\183\191\225\128\128-\225\130\159\234\167\160-\234\167\191\234\169\160-\234\169\191]';
for k, v in pairs (mw.site.interwikiMap ('local')) do -- spin through the base interwiki map (limited to local)
if mw_languages_by_tag_t[v["prefix"]] then -- if the prefix matches a known language tag
inter_wiki_map[v["prefix"]] = true; -- add it to our local map
end
end


 
-- list of emoji that use a zwj character (U+200D) to combine with another emoji
--[[--------------------< S C R I P T _ L A N G _ C O D E S >-------------------
-- from: https://unicode.org/Public/emoji/15.1/emoji-zwj-sequences.txt; version: 15.1; 2023-06-05
 
-- table created by: [[:en:Module:Make emoji zwj table]]
This table is used to hold ISO 639-1 two-character and ISO 639-3 three-character
local emoji_t = { -- indexes are decimal forms of the hex values in U+xxxx
language codes that apply only to |script-title= and |script-chapter=
[8596] = true, -- U+2194 ↔ left right arrow
 
[8597] = true, -- U+2195 ↕ up down arrow
]]
[9760] = true, -- U+2620 ☠ skull and crossbones
 
[9792] = true, -- U+2640 ♀ female sign
local script_lang_codes = {
[9794] = true, -- U+2642 ♂ male sign
'ab', 'am', 'ar', 'be', 'bg', 'bn', 'bo', 'bs', 'dv', 'dz', 'el', 'fa', 'gu',  
[9877] = true, -- U+2695 ⚕ staff of aesculapius
'he', 'hi', 'hy', 'ja', 'ka', 'kk', 'km', 'kn', 'ko', 'ku', 'ky', 'lo', 'mk',
[9878] = true, -- U+2696 ⚖ scales
'ml', 'mn', 'mr', 'my', 'ne', 'or', 'ota', 'pa', 'ps', 'ru', 'sd', 'si', 'sr',
[9895] = true, -- U+26A7 ⚧ male with stroke and male and female sign
'syc', 'ta', 'te', 'tg', 'th', 'ti', 'tt', 'ug', 'uk', 'ur', 'uz', 'yi', 'yue', 'zh'
[9992] = true, -- U+2708 ✈ airplane
};
[10052] = true, -- U+2744 ❄ snowflake
 
[10084] = true, -- U+2764 ❤ heavy black heart
 
[10145] = true, -- U+27A1 ➡ black rightwards arrow
--[[---------------< L A N G U A G E  R E M A P P I N G >----------------------
[11035] = true, -- U+2B1B ⬛ black large square
 
[127752] = true, -- U+1F308 🌈 rainbow
These tables hold language information that is different (correct) from MediaWiki's definitions
[127787] = true, -- U+1F32B 🌫 fog
 
[127806] = true, -- U+1F33E 🌾 ear of rice
For each ['code'] = 'language name' in lang_code_remap{} there must be a matching ['language name'] = {'language name', 'code'} in lang_name_remap{}
[127859] = true, -- U+1F373 🍳 cooking
 
[127868] = true, -- U+1F37C 🍼 baby bottle
lang_code_remap{}:
[127876] = true, -- U+1F384 🎄 christmas tree
key is always lowercase ISO 639-1, -2, -3 language code or a valid lowercase IETF language tag
[127891] = true, -- U+1F393 🎓 graduation cap
value is properly spelled and capitalized language name associated with key
[127908] = true, -- U+1F3A4 🎤 microphone
only one language name per key;
[127912] = true, -- U+1F3A8 🎨 artist palette
key/value pair must have matching entry in lang_name_remap{}
[127979] = true, -- U+1F3EB 🏫 school
 
[127981] = true, -- U+1F3ED 🏭 factory
lang_name_remap{}:
[128102] = true, -- U+1F466 👦 boy
key is always lowercase language name
[128103] = true, -- U+1F467 👧 girl
value is a table the holds correctly spelled and capitalized language name [1] and associated code [2] (code must match a code key in lang_code_remap{})
[128104] = true, -- U+1F468 👨 man
may have multiple keys referring to a common preferred name and code; For example:
[128105] = true, -- U+1F469 👩 woman
['kolsch'] and ['kölsch'] both refer to 'Kölsch' and 'ksh'
[128139] = true, -- U+1F48B 💋 kiss mark
 
[128165] = true, -- U+1F4A5 💥 collision symbol
]]
[128168] = true, -- U+1F4A8 💨 dash symbol
 
[128171] = true, -- U+1F4AB 💫 dizzy symbol
local lang_code_remap = { -- used for |language= and |script-title= / |script-chapter=
[128187] = true, -- U+1F4BB 💻 personal computer
['als'] = 'Tosk Albanian', -- MediaWiki returns Alemannisch
[128188] = true, -- U+1F4BC 💼 brief case
['bh'] = 'Bihari', -- MediaWiki uses 'bh' as a subdomain name for Bhojpuri Wikipedia: bh.wikipedia.org
[128293] = true, -- U+1F525 🔥 fire
['bla'] = 'Blackfoot', -- MediaWiki/IANA/ISO 639: Siksika; use en.wiki preferred name
[128295] = true, -- U+1F527 🔧 wrench
['bn'] = 'Bengali', -- MediaWiki returns Bangla
[128300] = true, -- U+1F52C 🔬 microscope
['ca-valencia'] = 'Valencian', -- IETF variant of Catalan
[128488] = true, -- U+1F5E8 🗨 left speech bubble
['ilo'] = 'Ilocano', -- MediaWiki/IANA/ISO 639: Iloko; use en.wiki preferred name
[128640] = true, -- U+1F680 🚀 rocket
['ksh'] = 'Kölsch', -- MediaWiki: Colognian; use IANA/ISO 639 preferred name
[128658] = true, -- U+1F692 🚒 fire engine
['ksh-x-colog'] = 'Colognian', -- override MediaWiki ksh; no IANA/ISO 639 code for Colognian; IETF private code created at Module:Lang/data
[129001] = true, -- U+1F7E9 🟩 large green square
['mis-x-ripuar'] = 'Ripuarian', -- override MediaWiki ksh; no IANA/ISO 639 code for Ripuarian; IETF private code created at Module:Lang/data
[129003] = true, -- U+1F7EB 🟫 large brown square
['nan-tw'] = 'Taiwanese Hokkien', -- make room for MediaWiki/IANA/ISO 639 nan: Min Nan Chinese and support en.wiki preferred name
[129309] = true, -- U+1F91D 🤝 handshake
[129455] = true, -- U+1F9AF 🦯 probing cane
[129456] = true, -- U+1F9B0 🦰 emoji component red hair
[129457] = true, -- U+1F9B1 🦱 emoji component curly hair
[129458] = true, -- U+1F9B2 🦲 emoji component bald
[129459] = true, -- U+1F9B3 🦳 emoji component white hair
[129466] = true, -- U+1F9BA 🦺 safety vest
[129468] = true, -- U+1F9BC 🦼 motorized wheelchair
[129469] = true, -- U+1F9BD 🦽 manual wheelchair
[129489] = true, -- U+1F9D1 🧑 adult
[129490] = true, -- U+1F9D2 🧒 child
[129657] = true, -- U+1FA79 🩹 adhesive bandage
[129778] = true, -- U+1FAF2 🫲 leftwards hand
}
}


-- Overrides for language names.  Each key is a lowercase language name; each value is a two-element
-- sequence: [1] the properly spelled and capitalized language name, [2] the lowercase language code / tag.
-- Several keys may share one value (for example 'kolsch' and 'kölsch').
local lang_name_remap = { -- used for |language=; names require proper capitalization; tags must be lowercase
['alemannisch'] = {'Swiss German', 'gsw'}, -- not an ISO or IANA language name; MediaWiki uses 'als' as a subdomain name for Alemannic Wikipedia: als.wikipedia.org
['bangla'] = {'Bengali', 'bn'}, -- MediaWiki returns Bangla (the endonym) but we want Bengali (the exonym); here we remap
['bengali'] = {'Bengali', 'bn'}, -- MediaWiki doesn't use exonym so here we provide correct language name and 639-1 code
['bhojpuri'] = {'Bhojpuri', 'bho'}, -- MediaWiki uses 'bh' as a subdomain name for Bhojpuri Wikipedia: bh.wikipedia.org
['bihari'] = {'Bihari', 'bh'}, -- MediaWiki replaces 'Bihari' with 'Bhojpuri' so 'Bihari' cannot be found
['blackfoot'] = {'Blackfoot', 'bla'}, -- MediaWiki/IANA/ISO 639: Siksika; use en.wiki preferred name
['colognian'] = {'Colognian', 'ksh-x-colog'}, -- MediaWiki preferred name for ksh
['ilocano'] = {'Ilocano', 'ilo'}, -- MediaWiki/IANA/ISO 639: Iloko; use en.wiki preferred name
['kolsch'] = {'Kölsch', 'ksh'}, -- use IANA/ISO 639 preferred name (use non-diacritical o instead of umlaut ö)
['kölsch'] = {'Kölsch', 'ksh'}, -- use IANA/ISO 639 preferred name
['ripuarian'] = {'Ripuarian', 'mis-x-ripuar'}, -- group of dialects; no code in MediaWiki or in IANA/ISO 639
['taiwanese hokkien'] = {'Taiwanese Hokkien', 'nan-tw'}, -- make room for MediaWiki/IANA/ISO 639 nan: Min Nan Chinese
['tosk albanian'] = {'Tosk Albanian', 'als'}, -- MediaWiki replaces 'Tosk Albanian' with 'Alemannisch' so 'Tosk Albanian' cannot be found
['valencian'] = {'Valencian', 'ca-valencia'}, -- variant of Catalan; categorizes as Valencian
}


--[[----------------------< L A N G U A G E  S U P P O R T >-------------------
These tables and constants support various language-specific functionality.


--[[---------------< P R O P E R T I E S _ C A T E G O R I E S >----------------
]]


Properties categories. These are used for investigating qualities of citations.
--local this_wiki_code = mw.getContentLanguage():getCode(); -- get this wiki's language code
-- Language code used for language-name lookups: start with the content-language code reported by lang_obj ...
local this_wiki_code = lang_obj:getCode();
-- ... and, when the server name contains 'wikidata', replace it with the expansion of {{int:lang}} (the interface language setting)
if mw.site.server:match ('wikidata') then
	this_wiki_code = mw.getCurrentFrame():callParserFunction ('int', {'lang'});
end


]]
local mw_languages_by_tag_t = mw.language.fetchLanguageNames (this_wiki_code, 'all'); -- get a table of language tag/name pairs known to Wikimedia; used for interwiki tests
 
local mw_languages_by_name_t = {};
local prop_cats = {
for k, v in pairs (mw_languages_by_tag_t) do -- build a 'reversed' table name/tag language pairs know to MediaWiki; used for |language=
['foreign-lang-source'] = 'CS1 $1-language sources ($2)', -- |language= categories; $1 is foreign-language name, $2 is ISO639-1 code
v = mw.ustring.lower (v); -- lowercase for tag fetch; get name's proper case from mw_languages_by_tag_t[<tag>]
['foreign-lang-source-2'] = 'CS1 foreign language sources (ISO 639-2)|$1', -- |language= category; a cat for ISO639-2 languages; $1 is the ISO 639-2 code used as a sort key
if mw_languages_by_name_t[v] then -- when name already in the table
['jul-greg-uncertainty'] = 'CS1: Julian–Gregorian uncertainty', -- probably temporary cat to identify scope of template with dates 1 October 1582 – 1 January 1926
if 2 == #k or 3 == #k then -- if tag does not have subtags
['local-lang-source'] = 'CS1 $1-language sources ($2)', -- |language= categories; $1 is local-language name, $2 is ISO639-1 code; not emitted when local_lang_cat_enable is false
mw_languages_by_name_t[v] = k; -- prefer the shortest tag for this name
['location-test'] = 'CS1 location test',
end
['long-vol'] = 'CS1: long volume value', -- probably temporary cat to identify scope of |volume= values longer than 4 characters
else -- here when name not in the table
['script'] = 'CS1 uses $1-language script ($2)', -- |script-title=xx: has matching category; $1 is language name, $2 is ISO639-1 code
mw_languages_by_name_t[v] = k; -- so add name and matching tag
['tracked-param'] = 'CS1 tracked parameter: $1', -- $1 is base (enumerators removed) parameter name
end
['year-range-abbreviated'] = 'CS1: abbreviated year range', -- probably temporary cat to identify scope of |date=, |year= values using YYYY–YY form
end
}
 
local inter_wiki_map = {}; -- map of interwiki prefixes that are language-code prefixes
for k, v in pairs (mw.site.interwikiMap ('local')) do -- spin through the base interwiki map (limited to local)
if mw_languages_by_tag_t[v["prefix"]] then -- if the prefix matches a known language tag
inter_wiki_map[v["prefix"]] = true; -- add it to our local map
end
end




--[[-------------------< T I T L E _ T Y P E S >--------------------------------
--[[--------------------< S C R I P T _ L A N G _ C O D E S >-------------------


Here we map a template's CitationClass to TitleType (default values for |type= parameter)
This table is used to hold ISO 639-1 two-character and ISO 639-3 three-character
language codes that apply only to |script-title= and |script-chapter=


]]
]]


local title_types = {
local script_lang_codes = {
['AV-media-notes'] = 'Media notes',
'ab', 'am', 'ar', 'be', 'bg', 'bn', 'bo', 'bs', 'ce', 'dv', 'dz', 'el', 'fa', 'grc',
['interview'] = 'Interview',
'gu', 'he', 'hi', 'hy', 'ja', 'ka', 'kk', 'km', 'kn', 'ko', 'ku', 'ky', 'lo', 'mk', 'ml',
['mailinglist'] = 'Mailing list',
'mn', 'mni', 'mr', 'my', 'ne', 'or', 'ota', 'pa', 'ps', 'ru', 'sd', 'si', 'sr', 'syc',
['map'] = 'Map',
'ta', 'te', 'tg', 'th', 'ti', 'tt', 'ug', 'uk', 'ur', 'uz', 'yi', 'yue', 'zh'
['podcast'] = 'Podcast',
};
['pressrelease'] = 'Press release',
 
['report'] = 'Report',
 
['speech'] = 'Speech',
--[[---------------< L A N G U A G E  R E M A P P I N G >----------------------
['techreport'] = 'Technical report',
['thesis'] = 'Thesis',
}


These tables hold language information that is different (correct) from MediaWiki's definitions


--[[===================<< E R R O R  M E S S A G I N G >>======================
For each ['<tag>'] = 'language name' in lang_code_remap{} there must be a matching ['language name'] = {'language name', '<tag>'} in lang_name_remap{}
]]


--[[----------< E R R O R  M E S S A G E  S U P P L I M E N T S >-------------
lang_tag_remap{}:
key is always lowercase ISO 639-1, -2, -3 language tag or a valid lowercase IETF language tag
value is properly spelled and capitalized language name associated with <tag>
only one language name per <tag>;
key/value pair must have matching entry in lang_name_remap{}


I18N for those messages that are supplemented with additional specific text that
lang_name_remap{}:
describes the reason for the error
key is always lowercase language name
value is a table that holds the correctly spelled and capitalized language name [1] and associated tag [2] (tag must match a tag key in lang_tag_remap{})
may have multiple keys referring to a common preferred name and tag; For example:
['kolsch'] and ['kölsch'] both refer to 'Kölsch' and 'ksh'


TODO: merge this with special_case_translations{}?
]]
]]


local err_msg_supl = {
local lang_tag_remap = { -- used for |language= and |script-title= / |script-chapter=
['char'] = 'invalid character', -- |isbn=, |sbn=
['als'] = 'Tosk Albanian', -- MediaWiki returns Alemannisch
['check'] = 'checksum', -- |isbn=, |sbn=
['bh'] = 'Bihari', -- MediaWiki uses 'bh' as a subdomain name for Bhojpuri Wikipedia: bh.wikipedia.org
['flag'] = 'flag', -- |archive-url=
['bla'] = 'Blackfoot', -- MediaWiki/IANA/ISO 639: Siksika; use en.wiki preferred name
['form'] = 'invalid form', -- |isbn=, |sbn=
['bn'] = 'Bengali', -- MediaWiki returns Bangla
['group'] = 'invalid group id', -- |isbn=
['ca-valencia'] = 'Valencian', -- IETF variant of Catalan
['initials'] = 'initials', -- Vancouver
['fkv'] = 'Kven', -- MediaWiki returns Kvensk
['invalid language code'] = 'invalid language code', -- |script-<param>=
['gsw'] = 'Swiss German',
['journal'] = 'journal', -- |bibcode=
['ilo'] = 'Ilocano', -- MediaWiki/IANA/ISO 639: Iloko; use en.wiki preferred name
['length'] = 'length', -- |isbn=, |bibcode=, |sbn=
['ksh'] = 'Kölsch', -- MediaWiki: Colognian; use IANA/ISO 639 preferred name
['liveweb'] = 'liveweb', -- |archive-url=
['ksh-x-colog'] = 'Colognian', -- override MediaWiki ksh; no IANA/ISO 639 code for Colognian; IETF private code created at Module:Lang/data
['missing comma'] = 'missing comma', -- Vancouver
['mis-x-ripuar'] = 'Ripuarian', -- override MediaWiki ksh; no IANA/ISO 639 code for Ripuarian; IETF private code created at Module:Lang/data
['missing prefix'] = 'missing prefix', -- |script-<param>=
['nan-tw'] = 'Taiwanese Hokkien', -- make room for MediaWiki/IANA/ISO 639 nan: Min Nan Chinese and support en.wiki preferred name
['missing title part'] = 'missing title part', -- |script-<param>=
['sr-ec'] = 'Serbian (Cyrillic script)', -- MediaWiki returns српски (ћирилица)
['name'] = 'name', -- Vancouver
['sr-el'] = 'Serbian (Latin script)', -- MediaWiki returns srpski (latinica)
['non-Latin char'] = 'non-Latin character', -- Vancouver
['path'] = 'path', -- |archive-url=
['prefix'] = 'invalid prefix', -- |isbn=
['punctuation'] = 'punctuation', -- Vancouver
['save'] = 'save command', -- |archive-url=
['suffix'] = 'suffix', -- Vancouver
['timestamp'] = 'timestamp', -- |archive-url=
['unknown language code'] = 'unknown language code', -- |script-<param>=
['value'] = 'value', -- |bibcode=
['year'] = 'year', -- |bibcode=
}
}


-- Overrides for language names.  Each key is a lowercase language name; each value is a two-element
-- sequence: [1] the properly spelled and capitalized language name, [2] the lowercase language tag.
-- Several keys may share one value (for example 'kolsch' and 'kölsch', or 'kven' and 'kvensk').
local lang_name_remap = { -- used for |language=; names require proper capitalization; tags must be lowercase
['alemannic'] = {'Swiss German', 'gsw'}, -- ISO 639-2, -3 alternate for Swiss German; MediaWiki returns Alemannic for gsw; en.wiki preferred name
['alemannisch'] = {'Swiss German', 'gsw'}, -- not an ISO or IANA language name; MediaWiki uses 'als' as a subdomain name for Alemannic Wikipedia: als.wikipedia.org
['bangla'] = {'Bengali', 'bn'}, -- MediaWiki returns Bangla (the endonym) but we want Bengali (the exonym); here we remap
['bengali'] = {'Bengali', 'bn'}, -- MediaWiki doesn't use exonym so here we provide correct language name and 639-1 code
['bhojpuri'] = {'Bhojpuri', 'bho'}, -- MediaWiki uses 'bh' as a subdomain name for Bhojpuri Wikipedia: bh.wikipedia.org
['bihari'] = {'Bihari', 'bh'}, -- MediaWiki replaces 'Bihari' with 'Bhojpuri' so 'Bihari' cannot be found
['blackfoot'] = {'Blackfoot', 'bla'}, -- MediaWiki/IANA/ISO 639: Siksika; use en.wiki preferred name
['colognian'] = {'Colognian', 'ksh-x-colog'}, -- MediaWiki preferred name for ksh
['ilocano'] = {'Ilocano', 'ilo'}, -- MediaWiki/IANA/ISO 639: Iloko; use en.wiki preferred name
['kolsch'] = {'Kölsch', 'ksh'}, -- use IANA/ISO 639 preferred name (use non-diacritical o instead of umlaut ö)
['kölsch'] = {'Kölsch', 'ksh'}, -- use IANA/ISO 639 preferred name
['kven'] = {'Kven', 'fkv'}, -- Unicode CLDR have decided not to support English language name for these two...
['kvensk'] = {'Kven', 'fkv'}, -- ...they say to refer to IANA registry for English names
['ripuarian'] = {'Ripuarian', 'mis-x-ripuar'}, -- group of dialects; no code in MediaWiki or in IANA/ISO 639
['serbian (cyrillic script)'] = {'Serbian (Cyrillic script)', 'sr-cyrl'}, -- special case to get correct tag when |language=sr-ec
['serbian (latin script)'] = {'Serbian (Latin script)', 'sr-latn'}, -- special case to get correct tag when |language=sr-el
['swiss german'] = {'Swiss German', 'gsw'}, -- the preferred name itself; same value as 'alemannic' and 'alemannisch'
['taiwanese hokkien'] = {'Taiwanese Hokkien', 'nan-tw'}, -- make room for MediaWiki/IANA/ISO 639 nan: Min Nan Chinese
['tosk albanian'] = {'Tosk Albanian', 'als'}, -- MediaWiki replaces 'Tosk Albanian' with 'Alemannisch' so 'Tosk Albanian' cannot be found
['valencian'] = {'Valencian', 'ca-valencia'}, -- variant of Catalan; categorizes as Valencian
}


--[[--------------< E R R O R _ C O N D I T I O N S >---------------------------


Error condition table.  This table has two sections: errors at the top, maintenance
--[[---------------< P R O P E R T I E S _ C A T E G O R I E S >----------------
at the bottom.  Maint 'messaging' does not have a 'message' (message=nil)


The following contains a list of IDs for various error conditions defined in the
Properties categories. These are used for investigating qualities of citations.
code.  For each ID, we specify a text message to display, an error category to
include, and whether the error message should be wrapped as a hidden comment.
 
Anchor changes require identical changes to matching anchor in Help:CS1 errors
 
TODO: rename error_conditions{} to something more generic; create separate error
and maint tables inside that?


]]
]]


local error_conditions = {
local prop_cats = {
err_accessdate_missing_url = {
['foreign-lang-source'] = 'CS1 $1-language sources ($2)', -- |language= categories; $1 is foreign-language name, $2 is ISO639-1 code
message = '<code class="cs1-code">&#124;access-date=</code> requires <code class="cs1-code">&#124;url=</code>',
['foreign-lang-source-2'] = 'CS1 foreign language sources (ISO 639-2)|$1', -- |language= category; a cat for ISO639-2 languages; $1 is the ISO 639-2 code used as a sort key
anchor = 'accessdate_missing_url',
['interproj-linked-name'] = 'CS1 interproject-linked names|$1', -- any author, editor, etc that has an interproject link; $1 is interproject tag used as a sort key
category = 'CS1 errors: access-date without URL',
['interwiki-linked-name'] = 'CS1 interwiki-linked names|$1', -- any author, editor, etc that has an interwiki link; $1 is interwiki tag used as a sort key; yeilds to interproject
hidden = false
['local-lang-source'] = 'CS1 $1-language sources ($2)', -- |language= categories; $1 is local-language name, $2 is ISO639-1 code; not emitted when local_lang_cat_enable is false
},
['location-test'] = 'CS1 location test',
err_apostrophe_markup = {
['long-vol'] = 'CS1: long volume value', -- probably temporary cat to identify scope of |volume= values longer than 4 characters
message = 'Italic or bold markup not allowed in: <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
['script'] = 'CS1 uses $1-language script ($2)', -- |script-title=xx: has matching category; $1 is language name, $2 is ISO639-1 code
anchor = 'apostrophe_markup',
['tracked-param'] = 'CS1 tracked parameter: $1', -- $1 is base (enumerators removed) parameter name
category = 'CS1 errors: markup',
['year-range-abbreviated'] = 'CS1: abbreviated year range', -- probably temporary cat to identify scope of |date=, |year= values using YYYY–YY form
hidden = false
}
},
 
err_archive_missing_date = {
 
message = '<code class="cs1-code">&#124;archive-url=</code> requires <code class="cs1-code">&#124;archive-date=</code>',
--[[-------------------< T I T L E _ T Y P E S >--------------------------------
anchor = 'archive_missing_date',
 
category = 'CS1 errors: archive-url',
Here we map a template's CitationClass to TitleType (default values for |type= parameter)
hidden = false
 
},
]]
err_archive_missing_url = {
 
message = '<code class="cs1-code">&#124;archive-url=</code> requires <code class="cs1-code">&#124;url=</code>',
local title_types = {
anchor = 'archive_missing_url',
['AV-media-notes'] = 'Media notes',
category = 'CS1 errors: archive-url',
['document'] = 'Document',
hidden = false
['interview'] = 'Interview',
},
['mailinglist'] = 'Mailing list',
err_archive_url = {
['map'] = 'Map',
message = '<code class="cs1-code">&#124;archive-url=</code> is malformed: $1', -- $1 is error message detail
['podcast'] = 'Podcast',
anchor = 'archive_url',
['pressrelease'] = 'Press release',
category = 'CS1 errors: archive-url',
['report'] = 'Report',
hidden = false
['speech'] = 'Speech',
},
['techreport'] = 'Technical report',
err_arxiv_missing = {
['thesis'] = 'Thesis',
message = '<code class="cs1-code">&#124;arxiv=</code> required',
}
anchor = 'arxiv_missing',
 
category = 'CS1 errors: arXiv', -- same as bad arxiv
 
hidden = false
--[[--------------------------< B U I L D _ K N O W N _ F R E E _ D O I _ R E G I S T R A N T S _ T A B L E >--
},
 
err_asintld_missing_asin = {
build a table of doi registrants known to be free-to-read  In a doi, the registrant ID is the series of digits
message = '<code class="cs1-code">&#124;$1=</code> requires <code class="cs1-code">&#124;asin=</code>', -- $1 is parameter name
between the '10.' and the first '/': in doi 10.1100/sommat, 1100 is the registrant ID
anchor = 'asintld_missing_asin',
 
category = 'CS1 errors: ASIN TLD',
see §3.2.2 DOI prefix of the Doi Handbook p. 43
hidden = false
https://www.doi.org/doi-handbook/DOI_Handbook_Final.pdf#page=43
},
 
err_bad_arxiv = {
]]
message = 'Check <code class="cs1-code">&#124;arxiv=</code> value',
 
anchor = 'bad_arxiv',
local function build_free_doi_registrants_table()
category = 'CS1 errors: arXiv',
local registrants_t = {};
hidden = false
for _, v in ipairs ({
},
'1045', '1074', '1096', '1100', '1155', '1186', '1194', '1371', '1629', '1989', '1999', '2147', '2196', '3285', '3389', '3390',
err_bad_asin = {
'3748', '3814', '3847', '3897', '4061', '4089', '4103', '4172', '4175', '4230', '4236', '4239', '4240', '4249', '4251',
message = 'Check <code class="cs1-code">&#124;asin=</code> value',
'4252', '4253', '4254', '4291', '4292', '4329', '4330', '4331', '5194', '5210', '5306', '5312', '5313', '5314',
anchor = 'bad_asin',
'5315', '5316', '5317', '5318', '5319', '5320', '5321', '5334', '5402', '5409', '5410', '5411', '5412',
category ='CS1 errors: ASIN',
'5492', '5493', '5494', '5495', '5496', '5497', '5498', '5499', '5500', '5501', '5527', '5528', '5662',
hidden = false
'6064', '6219', '7167', '7217', '7287', '7482', '7490', '7554', '7717', '7759', '7766', '11131', '11569', '11647',
},
'11648', '12688', '12703', '12715', '12942', '12998', '13105', '14256', '14293', '14303', '15215', '15347', '15412', '15560', '16995',
err_bad_asin_tld = {
'17645', '19080', '19173', '20944', '21037', '21468', '21767', '22261', '22323', '22459', '24105', '24196', '24966',
message = 'Check <code class="cs1-code">&#124;asin-tld=</code> value',
'26775', '30845', '32545', '35711', '35712', '35713', '35995', '36648', '37126', '37532', '37871', '47128',
anchor = 'bad_asin_tld',
'47622', '47959', '52437', '52975', '53288', '54081', '54947', '55667', '55914', '57009', '58647', '59081',
category ='CS1 errors: ASIN TLD',
}) do
hidden = false
registrants_t[v] = true; -- build a k/v table of known free-to-read doi registrants
},
end
err_bad_bibcode = {
 
message = 'Check <code class="cs1-code">&#124;bibcode=</code> $1', -- $1 is error message detail
return registrants_t;
anchor = 'bad_bibcode',
end
category = 'CS1 errors: bibcode',
 
hidden = false
local extended_registrants_t = { -- known free registrants identifiable by the doi suffix incipit
},
['1016'] = {'j.heliyon'}, -- Heliyon
err_bad_biorxiv = {
['1046'] = {'j.1365-8711', 'j.1365-246x'}, -- MNRAS, GJI
message = 'Check <code class="cs1-code">&#124;biorxiv=</code> value',
['1093'] = {'mnras', 'mnrasl', 'gji', 'rasti'}, -- MNRAS, MNRAS Letters, GJI, RASTI
anchor = 'bad_biorxiv',
['1099'] = {'acmi', 'mic', '00221287', 'mgen'},                             -- Access Microbiology, Microbiology, Journal of General Microbiology, Microbial Genomics
category = 'CS1 errors: bioRxiv',
['1111'] = {'j.1365-2966', 'j.1745-3933', 'j.1365-246X'}, -- MNRAS, MNRAS Letters, GJI
hidden = false
['1210'] = {'jendso','jcemcr'}, -- Journal of the Endocrine Society, JCEM Case Reports
},
}
err_bad_citeseerx = {
 
message = 'Check <code class="cs1-code">&#124;citeseerx=</code> value',
 
anchor = 'bad_citeseerx',
--[[===================<< E R R O R  M E S S A G I N G >>======================
category = 'CS1 errors: citeseerx',
]]
 
--[[----------< E R R O R  M E S S A G E  S U P P L E M E N T S >-------------
 
I18N for those messages that are supplemented with additional specific text that
describes the reason for the error
 
TODO: merge this with special_case_translations{}?
]]
 
-- Supplemental error-message text, indexed by a short identifier.  Each value is the phrase that is
-- added to an error message to describe the specific reason for the error; the trailing comment on
-- each line names the parameter(s) or name-list style that the phrase is associated with.
-- Only the values are display text; the keys are identifiers.
local err_msg_supl = {
['char'] = 'invalid character', -- |isbn=, |sbn=
['check'] = 'checksum', -- |isbn=, |sbn=
['flag'] = 'flag', -- |archive-url=
['form'] = 'invalid form', -- |isbn=, |sbn=
['group'] = 'invalid group id', -- |isbn=
['initials'] = 'initials', -- Vancouver
['invalid language code'] = 'invalid language code', -- |script-<param>=
['journal'] = 'journal', -- |bibcode=
['length'] = 'length', -- |isbn=, |bibcode=, |sbn=
['liveweb'] = 'liveweb', -- |archive-url=
['missing comma'] = 'missing comma', -- Vancouver
['missing prefix'] = 'missing prefix', -- |script-<param>=
['missing title part'] = 'missing title part', -- |script-<param>=
['name'] = 'name', -- Vancouver
['non-Latin char'] = 'non-Latin character', -- Vancouver
['path'] = 'path', -- |archive-url=
['prefix'] = 'invalid prefix', -- |isbn=
['punctuation'] = 'punctuation', -- Vancouver
['save'] = 'save command', -- |archive-url=
['suffix'] = 'suffix', -- Vancouver
['timestamp'] = 'timestamp', -- |archive-url=
['unknown language code'] = 'unknown language code', -- |script-<param>=
['value'] = 'value', -- |bibcode=
['year'] = 'year', -- |bibcode=
}
 
 
--[[--------------< E R R O R _ C O N D I T I O N S >---------------------------
 
Error condition table.  This table has two sections: errors at the top, maintenance
at the bottom.  Maint 'messaging' does not have a 'message' (message=nil)
 
The following contains a list of IDs for various error conditions defined in the
code.  For each ID, we specify a text message to display, an error category to
include, and whether the error message should be wrapped as a hidden comment.
 
Anchor changes require identical changes to matching anchor in Help:CS1 errors
 
TODO: rename error_conditions{} to something more generic; create separate error
and maint tables inside that?
 
]]
 
local error_conditions = {
err_accessdate_missing_url = {
message = '<code class="cs1-code">&#124;access-date=</code> requires <code class="cs1-code">&#124;url=</code>',
anchor = 'accessdate_missing_url',
category = 'CS1 errors: access-date without URL',
hidden = false
hidden = false
},
},
err_bad_date = {
err_apostrophe_markup = {
message = 'Check date values in: $1', -- $1 is a parameter name list
message = 'Italic or bold markup not allowed in: <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
anchor = 'bad_date',
anchor = 'apostrophe_markup',
category = 'CS1 errors: dates',
category = 'CS1 errors: markup',
hidden = false
hidden = false
},
},
err_bad_doi = {
err_archive_date_missing_url = {
message = 'Check <code class="cs1-code">&#124;doi=</code> value',
message = '<code class="cs1-code">&#124;archive-date=</code> requires <code class="cs1-code">&#124;archive-url=</code>',
anchor = 'bad_doi',
anchor = 'archive_date_missing_url',
category = 'CS1 errors: DOI',
category = 'CS1 errors: archive-url',
hidden = false
hidden = false
},
},
err_bad_hdl = {
err_archive_date_url_ts_mismatch = {
message = 'Check <code class="cs1-code">&#124;hdl=</code> value',
message = '<code class="cs1-code">&#124;archive-date=</code> / <code class="cs1-code">&#124;archive-url=</code> timestamp mismatch; $1 suggested',
anchor = 'bad_hdl',
anchor = 'archive_date_url_ts_mismatch',
category = 'CS1 errors: HDL',
category = 'CS1 errors: archive-url',
hidden = false
hidden = false
},
},
err_bad_isbn = {
err_archive_missing_date = {
message = 'Check <code class="cs1-code">&#124;isbn=</code> value: $1', -- $1 is error message detail
message = '<code class="cs1-code">&#124;archive-url=</code> requires <code class="cs1-code">&#124;archive-date=</code>',
anchor = 'bad_isbn',
anchor = 'archive_missing_date',
category = 'CS1 errors: ISBN',
category = 'CS1 errors: archive-url',
hidden = false
hidden = false
},
},
err_bad_ismn = {
err_archive_missing_url = {
message = 'Check <code class="cs1-code">&#124;ismn=</code> value',
message = '<code class="cs1-code">&#124;archive-url=</code> requires <code class="cs1-code">&#124;url=</code>',
anchor = 'bad_ismn',
anchor = 'archive_missing_url',
category = 'CS1 errors: ISMN',
category = 'CS1 errors: archive-url',
hidden = false
hidden = false
},
},
err_bad_issn = {
err_archive_url = {
message = 'Check <code class="cs1-code">&#124;$1issn=</code> value', -- $1 is 'e' or '' for eissn or issn
message = '<code class="cs1-code">&#124;archive-url=</code> is malformed: $1', -- $1 is error message detail
anchor = 'bad_issn',
anchor = 'archive_url',
category = 'CS1 errors: ISSN',
category = 'CS1 errors: archive-url',
hidden = false
hidden = false
},
},
err_bad_jfm = {
err_arxiv_missing = {
message = 'Check <code class="cs1-code">&#124;jfm=</code> value',
message = '<code class="cs1-code">&#124;arxiv=</code> required',
anchor = 'bad_jfm',
anchor = 'arxiv_missing',
category = 'CS1 errors: JFM',
category = 'CS1 errors: arXiv', -- same as bad arxiv
hidden = false
hidden = false
},
},
err_bad_jstor = {
err_asintld_missing_asin = {
message = 'Check <code class="cs1-code">&#124;jstor=</code> value',
message = '<code class="cs1-code">&#124;$1=</code> requires <code class="cs1-code">&#124;asin=</code>', -- $1 is parameter name
anchor = 'bad_jstor',
anchor = 'asintld_missing_asin',
category = 'CS1 errors: JSTOR',
category = 'CS1 errors: ASIN TLD',
hidden = false
hidden = false
},
},
err_bad_lccn = {
err_bad_arxiv = {
message = 'Check <code class="cs1-code">&#124;lccn=</code> value',
message = 'Check <code class="cs1-code">&#124;arxiv=</code> value',
anchor = 'bad_lccn',
anchor = 'bad_arxiv',
category = 'CS1 errors: LCCN',
category = 'CS1 errors: arXiv',
hidden = false
hidden = false
},
},
err_bad_mr = {
err_bad_asin = {
message = 'Check <code class="cs1-code">&#124;mr=</code> value',
message = 'Check <code class="cs1-code">&#124;asin=</code> value',
anchor = 'bad_mr',
anchor = 'bad_asin',
category = 'CS1 errors: MR',
category ='CS1 errors: ASIN',
hidden = false
hidden = false
},
},
err_bad_oclc = {
err_bad_asin_tld = {
message = 'Check <code class="cs1-code">&#124;oclc=</code> value',
message = 'Check <code class="cs1-code">&#124;asin-tld=</code> value',
anchor = 'bad_oclc',
anchor = 'bad_asin_tld',
category = 'CS1 errors: OCLC',
category ='CS1 errors: ASIN TLD',
hidden = false
hidden = false
},
},
err_bad_ol = {
err_bad_bibcode = {
message = 'Check <code class="cs1-code">&#124;ol=</code> value',
message = 'Check <code class="cs1-code">&#124;bibcode=</code> $1', -- $1 is error message detail
anchor = 'bad_ol',
anchor = 'bad_bibcode',
category = 'CS1 errors: OL',
category = 'CS1 errors: bibcode',
hidden = false
hidden = false
},
},
err_bad_osti = {
err_bad_biorxiv = {
message = 'Check <code class="cs1-code">&#124;osti=</code> value',
message = 'Check <code class="cs1-code">&#124;biorxiv=</code> value',
anchor = 'bad_osti',
anchor = 'bad_biorxiv',
category = 'CS1 errors: OSTI',
category = 'CS1 errors: bioRxiv',
hidden = false
hidden = false
},
},
err_bad_paramlink = { -- for |title-link=, |author/editor/translator-link=, |series-link=, |episode-link=
err_bad_citeseerx = {
message = 'Check <code class="cs1-code">&#124;$1=</code> value', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;citeseerx=</code> value',
anchor = 'bad_paramlink',
anchor = 'bad_citeseerx',
category = 'CS1 errors: parameter link',
category = 'CS1 errors: citeseerx',
hidden = false
hidden = false
},
},
err_bad_pmc = {
err_bad_date = {
message = 'Check <code class="cs1-code">&#124;pmc=</code> value',
message = 'Check date values in: $1', -- $1 is a parameter name list
anchor = 'bad_pmc',
anchor = 'bad_date',
category = 'CS1 errors: PMC',
category = 'CS1 errors: dates',
hidden = false
hidden = false
},
},
err_bad_pmid = {
err_bad_doi = {
message = 'Check <code class="cs1-code">&#124;pmid=</code> value',
message = 'Check <code class="cs1-code">&#124;doi=</code> value',
anchor = 'bad_pmid',
anchor = 'bad_doi',
category = 'CS1 errors: PMID',
category = 'CS1 errors: DOI',
hidden = false
hidden = false
},
},
err_bad_rfc = {
err_bad_hdl = {
message = 'Check <code class="cs1-code">&#124;rfc=</code> value',
message = 'Check <code class="cs1-code">&#124;hdl=</code> value',
anchor = 'bad_rfc',
anchor = 'bad_hdl',
category = 'CS1 errors: RFC',
category = 'CS1 errors: HDL',
hidden = false
hidden = false
},
},
err_bad_s2cid = {
err_bad_isbn = {
message = 'Check <code class="cs1-code">&#124;s2cid=</code> value',
message = 'Check <code class="cs1-code">&#124;isbn=</code> value: $1', -- $1 is error message detail
anchor = 'bad_s2cid',
anchor = 'bad_isbn',
category = 'CS1 errors: S2CID',
category = 'CS1 errors: ISBN',
hidden = false
hidden = false
},
},
err_bad_sbn = {
err_bad_ismn = {
message = 'Check <code class="cs1-code">&#124;sbn=</code> value: $1', -- $1 is error message detail
message = 'Check <code class="cs1-code">&#124;ismn=</code> value',
anchor = 'bad_sbn',
anchor = 'bad_ismn',
category = 'CS1 errors: SBN',
category = 'CS1 errors: ISMN',
hidden = false
hidden = false
},
},
err_bad_ssrn = {
err_bad_issn = {
message = 'Check <code class="cs1-code">&#124;ssrn=</code> value',
message = 'Check <code class="cs1-code">&#124;$1issn=</code> value', -- $1 is 'e' or '' for eissn or issn
anchor = 'bad_ssrn',
anchor = 'bad_issn',
category = 'CS1 errors: SSRN',
category = 'CS1 errors: ISSN',
hidden = false
hidden = false
},
},
err_bad_url = {
err_bad_jfm = {
message = 'Check $1 value', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;jfm=</code> value',
anchor = 'bad_url',
anchor = 'bad_jfm',
category = 'CS1 errors: URL',
category = 'CS1 errors: JFM',
hidden = false
hidden = false
},
},
err_bad_usenet_id = {
err_bad_jstor = {
message = 'Check <code class="cs1-code">&#124;message-id=</code> value',
message = 'Check <code class="cs1-code">&#124;jstor=</code> value',
anchor = 'bad_message_id',
anchor = 'bad_jstor',
category = 'CS1 errors: message-id',
category = 'CS1 errors: JSTOR',
hidden = false
hidden = false
},
},
err_bad_zbl = {
err_bad_lccn = {
message = 'Check <code class="cs1-code">&#124;zbl=</code> value',
message = 'Check <code class="cs1-code">&#124;lccn=</code> value',
anchor = 'bad_zbl',
anchor = 'bad_lccn',
category = 'CS1 errors: Zbl',
category = 'CS1 errors: LCCN',
hidden = false
hidden = false
},
},
err_bare_url_missing_title = {
err_bad_medrxiv = {
message = '$1 missing title', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;medrxiv=</code> value',
anchor = 'bare_url_missing_title',
anchor = 'bad_medrxiv',
category = 'CS1 errors: bare URL',
category = 'CS1 errors: medRxiv',
hidden = false
hidden = false
},
},
err_biorxiv_missing = {
err_bad_mr = {
message = '<code class="cs1-code">&#124;biorxiv=</code> required',
message = 'Check <code class="cs1-code">&#124;mr=</code> value',
anchor = 'biorxiv_missing',
anchor = 'bad_mr',
category = 'CS1 errors: bioRxiv', -- same as bad bioRxiv
category = 'CS1 errors: MR',
hidden = false
hidden = false
},
},
err_chapter_ignored = {
err_bad_oclc = {
message = '<code class="cs1-code">&#124;$1=</code> ignored', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;oclc=</code> value',
anchor = 'chapter_ignored',
anchor = 'bad_oclc',
category = 'CS1 errors: chapter ignored',
category = 'CS1 errors: OCLC',
hidden = false
hidden = false
},
},
err_citation_missing_title = {
err_bad_ol = {
message = 'Missing or empty <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;ol=</code> value',
anchor = 'citation_missing_title',
anchor = 'bad_ol',
category = 'CS1 errors: missing title',
category = 'CS1 errors: OL',
hidden = false
hidden = false
},
},
err_citeseerx_missing = {
err_bad_osti = {
message = '<code class="cs1-code">&#124;citeseerx=</code> required',
message = 'Check <code class="cs1-code">&#124;osti=</code> value',
anchor = 'citeseerx_missing',
anchor = 'bad_osti',
category = 'CS1 errors: citeseerx', -- same as bad citeseerx
category = 'CS1 errors: OSTI',
hidden = false
hidden = false
},
},
err_cite_web_url = { -- this error applies to cite web and to cite podcast
err_bad_paramlink = { -- for |title-link=, |author/editor/translator-link=, |series-link=, |episode-link=
message = 'Missing or empty <code class="cs1-code">&#124;url=</code>',
message = 'Check <code class="cs1-code">&#124;$1=</code> value', -- $1 is parameter name
anchor = 'cite_web_url',
anchor = 'bad_paramlink',
category = 'CS1 errors: requires URL',
category = 'CS1 errors: parameter link',
hidden = false
hidden = false
},
},
err_class_ignored = {
err_bad_pmc = {
message = '<code class="cs1-code">&#124;class=</code> ignored',
message = 'Check <code class="cs1-code">&#124;pmc=</code> value',
anchor = 'class_ignored',
anchor = 'bad_pmc',
category = 'CS1 errors: class',
category = 'CS1 errors: PMC',
hidden = false
hidden = false
},
},
err_contributor_ignored = {
err_bad_pmid = {
message = '<code class="cs1-code">&#124;contributor=</code> ignored',
message = 'Check <code class="cs1-code">&#124;pmid=</code> value',
anchor = 'contributor_ignored',
anchor = 'bad_pmid',
category = 'CS1 errors: contributor',
category = 'CS1 errors: PMID',
hidden = false
hidden = false
},
},
err_contributor_missing_required_param = {
err_bad_rfc = {
message = '<code class="cs1-code">&#124;contributor=</code> requires <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;rfc=</code> value',
anchor = 'contributor_missing_required_param',
anchor = 'bad_rfc',
category = 'CS1 errors: contributor',
category = 'CS1 errors: RFC',
hidden = false
hidden = false
},
},
err_deprecated_params = {
err_bad_s2cid = {
message = 'Cite uses deprecated parameter <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;s2cid=</code> value',
anchor = 'deprecated_params',
anchor = 'bad_s2cid',
category = 'CS1 errors: deprecated parameters',
category = 'CS1 errors: S2CID',
hidden = false
hidden = false
},
},
err_disp_name = {
err_bad_sbn = {
message = 'Invalid <code class="cs1-code">&#124;$1=$2</code>', -- $1 is parameter name; $2 is the assigned value
message = 'Check <code class="cs1-code">&#124;sbn=</code> value: $1', -- $1 is error message detail
anchor = 'disp_name',
anchor = 'bad_sbn',
category = 'CS1 errors: display-names',
category = 'CS1 errors: SBN',
hidden = false,
hidden = false
},
},
err_doibroken_missing_doi = {
err_bad_ssrn = {
message = '<code class="cs1-code">&#124;$1=</code> requires <code class="cs1-code">&#124;doi=</code>', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;ssrn=</code> value',
anchor = 'doibroken_missing_doi',
anchor = 'bad_ssrn',
category = 'CS1 errors: DOI',
category = 'CS1 errors: SSRN',
hidden = false
hidden = false
},
},
err_embargo_missing_pmc = {
err_bad_url = {
message = '<code class="cs1-code">&#124;$1=</code> requires <code class="cs1-code">&#124;pmc=</code>', -- $1 is parameter name
message = 'Check $1 value', -- $1 is parameter name
anchor = 'embargo_missing_pmc',
anchor = 'bad_url',
category = 'CS1 errors: PMC embargo',
category = 'CS1 errors: URL',
hidden = false
hidden = false
},
},
err_empty_citation = {
err_bad_usenet_id = {
message = 'Empty citation',
message = 'Check <code class="cs1-code">&#124;message-id=</code> value',
anchor = 'empty_citation',
anchor = 'bad_message_id',
category = 'CS1 errors: empty citation',
category = 'CS1 errors: message-id',
hidden = false
hidden = false
},
},
err_etal = {
err_bad_zbl = {
message = 'Explicit use of et al. in: <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
message = 'Check <code class="cs1-code">&#124;zbl=</code> value',
anchor = 'explicit_et_al',
anchor = 'bad_zbl',
category = 'CS1 errors: explicit use of et al.',
category = 'CS1 errors: Zbl',
hidden = false
hidden = false
},
},
err_extra_text_edition = {
err_bare_url_missing_title = {
message = '<code class="cs1-code">&#124;edition=</code> has extra text',
message = '$1 missing title', -- $1 is parameter name
anchor = 'extra_text_edition',
anchor = 'bare_url_missing_title',
category = 'CS1 errors: extra text: edition',
category = 'CS1 errors: bare URL',
hidden = false,
hidden = false
},
},
err_extra_text_issue = {
err_biorxiv_missing = {
message = '<code class="cs1-code">&#124;$1=</code> has extra text', -- $1 is parameter name
message = '<code class="cs1-code">&#124;biorxiv=</code> required',
anchor = 'extra_text_issue',
anchor = 'biorxiv_missing',
category = 'CS1 errors: extra text: issue',
category = 'CS1 errors: bioRxiv', -- same as bad bioRxiv
hidden = false,
hidden = false
},
},
err_extra_text_pages = {
err_chapter_ignored = {
message = '<code class="cs1-code">&#124;$1=</code> has extra text', -- $1 is parameter name
message = '<code class="cs1-code">&#124;$1=</code> ignored', -- $1 is parameter name
anchor = 'extra_text_pages',
anchor = 'chapter_ignored',
category = 'CS1 errors: extra text: pages',
category = 'CS1 errors: chapter ignored',
hidden = false,
hidden = false
},
},
err_extra_text_volume = {
err_citation_missing_title = {
message = '<code class="cs1-code">&#124;$1=</code> has extra text', -- $1 is parameter name
message = 'Missing or empty <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
anchor = 'extra_text_volume',
anchor = 'citation_missing_title',
category = 'CS1 errors: extra text: volume',
category = 'CS1 errors: missing title',
hidden = true,
hidden = false
},
},
err_first_missing_last = {
err_citeseerx_missing = {
message = '<code class="cs1-code">&#124;$1=</code> missing <code class="cs1-code">&#124;$2=</code>', -- $1 is first alias, $2 is matching last alias
message = '<code class="cs1-code">&#124;citeseerx=</code> required',
anchor = 'first_missing_last',
anchor = 'citeseerx_missing',
category = 'CS1 errors: missing name', -- author, contributor, editor, interviewer, translator
category = 'CS1 errors: citeseerx', -- same as bad citeseerx
hidden = false
hidden = false
},
},
err_format_missing_url = {
err_cite_web_url = { -- this error applies to cite web and to cite podcast
message = '<code class="cs1-code">&#124;$1=</code> requires <code class="cs1-code">&#124;$2=</code>', -- $1 is format parameter $2 is url parameter
message = 'Missing or empty <code class="cs1-code">&#124;url=</code>',
anchor = 'format_missing_url',
anchor = 'cite_web_url',
category = 'CS1 errors: format without URL',
category = 'CS1 errors: requires URL',
hidden = false
hidden = false
},
},
err_generic_name = {
err_class_ignored = {
message = '<code class="cs1-code">&#124;$1=</code> has generic name', -- $1 is parameter name
message = '<code class="cs1-code">&#124;class=</code> ignored',
anchor = 'generic_name',
anchor = 'class_ignored',
category = 'CS1 errors: generic name',
category = 'CS1 errors: class',
hidden = false,
hidden = false
},
},
err_generic_title = {
err_contributor_ignored = {
message = 'Cite uses generic title',
message = '<code class="cs1-code">&#124;contributor=</code> ignored',
anchor = 'generic_title',
anchor = 'contributor_ignored',
category = 'CS1 errors: generic title',
category = 'CS1 errors: contributor',
hidden = false,
},
err_invalid_param_val = {
message = 'Invalid <code class="cs1-code">&#124;$1=$2</code>', -- $1 is parameter name $2 is parameter value
anchor = 'invalid_param_val',
category = 'CS1 errors: invalid parameter value',
hidden = false
hidden = false
},
},
err_invisible_char = {
err_contributor_missing_required_param = {
message = '$1 in $2 at position $3', -- $1 is invisible char $2 is parameter name $3 is position number
message = '<code class="cs1-code">&#124;contributor=</code> requires <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
anchor = 'invisible_char',
anchor = 'contributor_missing_required_param',
category = 'CS1 errors: invisible characters',
category = 'CS1 errors: contributor',
hidden = false
hidden = false
},
},
err_missing_name = {
err_deprecated_params = {
message = 'Missing <code class="cs1-code">&#124;$1$2=</code>', -- $1 is modified NameList; $2 is enumerator
message = 'Cite uses deprecated parameter <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
anchor = 'missing_name',
anchor = 'deprecated_params',
category = 'CS1 errors: missing name', -- author, contributor, editor, interviewer, translator
category = 'CS1 errors: deprecated parameters',
hidden = false
hidden = false
},
},
err_missing_periodical = {
err_disp_name = {
message = 'Cite $1 requires <code class="cs1-code">&#124;$2=</code>', -- $1 is cs1 template name; $2 is canonical periodical parameter name for cite $1
message = 'Invalid <code class="cs1-code">&#124;$1=$2</code>', -- $1 is parameter name; $2 is the assigned value
anchor = 'missing_periodical',
anchor = 'disp_name',
category = 'CS1 errors: missing periodical',
category = 'CS1 errors: display-names',
hidden = true
hidden = false,
},
},
err_missing_pipe = {
err_doibroken_missing_doi = {
message = 'Missing pipe in: <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
message = '<code class="cs1-code">&#124;$1=</code> requires <code class="cs1-code">&#124;doi=</code>', -- $1 is parameter name
anchor = 'missing_pipe',
anchor = 'doibroken_missing_doi',
category = 'CS1 errors: missing pipe',
category = 'CS1 errors: DOI',
hidden = false
hidden = false
},
},
err_param_access_requires_param = {
err_embargo_missing_pmc = {
message = '<code class="cs1-code">&#124;$1-access=</code> requires <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
message = '<code class="cs1-code">&#124;$1=</code> requires <code class="cs1-code">&#124;pmc=</code>', -- $1 is parameter name
anchor = 'param_access_requires_param',
anchor = 'embargo_missing_pmc',
category = 'CS1 errors: param-access',
category = 'CS1 errors: PMC embargo',
hidden = false
hidden = false
},
},
err_param_has_ext_link = {
err_empty_citation = {
message = 'External link in <code class="cs1-code">$1</code>', -- $1 is parameter name
message = 'Empty citation',
anchor = 'param_has_ext_link',
anchor = 'empty_citation',
category = 'CS1 errors: external links',
category = 'CS1 errors: empty citation',
hidden = false
hidden = false
},
},
err_parameter_ignored = {
err_etal = {
message = 'Unknown parameter <code class="cs1-code">&#124;$1=</code> ignored', -- $1 is parameter name
message = 'Explicit use of et al. in: <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
anchor = 'parameter_ignored',
anchor = 'explicit_et_al',
category = 'CS1 errors: unsupported parameter',
category = 'CS1 errors: explicit use of et al.',
hidden = false
hidden = false
},
},
err_parameter_ignored_suggest = {
err_extra_text_edition = {
message = 'Unknown parameter <code class="cs1-code">&#124;$1=</code> ignored (<code class="cs1-code">&#124;$2=</code> suggested)', -- $1 is unknown parameter $2 is suggested parameter name
message = '<code class="cs1-code">&#124;edition=</code> has extra text',
anchor = 'parameter_ignored_suggest',
anchor = 'extra_text_edition',
category = 'CS1 errors: unsupported parameter',
category = 'CS1 errors: extra text: edition',
hidden = false
hidden = false,
},
err_extra_text_issue = {
message = '<code class="cs1-code">&#124;$1=</code> has extra text', -- $1 is parameter name
anchor = 'extra_text_issue',
category = 'CS1 errors: extra text: issue',
hidden = false,
},
err_extra_text_pages = {
message = '<code class="cs1-code">&#124;$1=</code> has extra text', -- $1 is parameter name
anchor = 'extra_text_pages',
category = 'CS1 errors: extra text: pages',
hidden = false,
},
err_extra_text_volume = {
message = '<code class="cs1-code">&#124;$1=</code> has extra text', -- $1 is parameter name
anchor = 'extra_text_volume',
category = 'CS1 errors: extra text: volume',
hidden = false,
},
err_first_missing_last = {
message = '<code class="cs1-code">&#124;$1=</code> missing <code class="cs1-code">&#124;$2=</code>', -- $1 is first alias, $2 is matching last alias
anchor = 'first_missing_last',
category = 'CS1 errors: missing name', -- author, contributor, editor, interviewer, translator
hidden = false
},
err_format_missing_url = {
message = '<code class="cs1-code">&#124;$1=</code> requires <code class="cs1-code">&#124;$2=</code>', -- $1 is format parameter $2 is url parameter
anchor = 'format_missing_url',
category = 'CS1 errors: format without URL',
hidden = false
},
err_generic_name = {
message = '<code class="cs1-code">&#124;$1=</code> has generic name', -- $1 is parameter name
anchor = 'generic_name',
category = 'CS1 errors: generic name',
hidden = false,
},
err_generic_title = {
message = 'Cite uses generic title',
anchor = 'generic_title',
category = 'CS1 errors: generic title',
hidden = false,
},
err_invalid_param_val = {
message = 'Invalid <code class="cs1-code">&#124;$1=$2</code>', -- $1 is parameter name $2 is parameter value
anchor = 'invalid_param_val',
category = 'CS1 errors: invalid parameter value',
hidden = false
},
err_invisible_char = {
message = '$1 in $2 at position $3', -- $1 is invisible char $2 is parameter name $3 is position number
anchor = 'invisible_char',
category = 'CS1 errors: invisible characters',
hidden = false
},
err_medrxiv_missing = {
message = '<code class="cs1-code">&#124;medrxiv=</code> required',
anchor = 'medrxiv_missing',
category = 'CS1 errors: medRxiv', -- same as bad medRxiv
hidden = false
},
err_missing_name = {
message = 'Missing <code class="cs1-code">&#124;$1$2=</code>', -- $1 is modified NameList; $2 is enumerator
anchor = 'missing_name',
category = 'CS1 errors: missing name', -- author, contributor, editor, interviewer, translator
hidden = false
},
err_missing_periodical = {
message = 'Cite $1 requires <code class="cs1-code">&#124;$2=</code>', -- $1 is cs1 template name; $2 is canonical periodical parameter name for cite $1
anchor = 'missing_periodical',
category = 'CS1 errors: missing periodical',
hidden = false
},
err_missing_pipe = {
message = 'Missing pipe in: <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
anchor = 'missing_pipe',
category = 'CS1 errors: missing pipe',
hidden = false
},
err_missing_publisher = {
message = 'Cite $1 requires <code class="cs1-code">&#124;$2=</code>', -- $1 is cs1 template name; $2 is canonical publisher parameter name for cite $1
anchor = 'missing_publisher',
category = 'CS1 errors: missing publisher',
hidden = false
},
-- error entry whose message reports that a parameter 'has numeric name'
err_numeric_names = {
message = '<code class="cs1-code">&#124;$1=</code> has numeric name', -- $1 is parameter name
anchor = 'numeric_names',
category = 'CS1 errors: numeric name',
hidden = false,
},
err_param_access_requires_param = {
message = '<code class="cs1-code">&#124;$1-access=</code> requires <code class="cs1-code">&#124;$1=</code>', -- $1 is parameter name
anchor = 'param_access_requires_param',
category = 'CS1 errors: param-access',
hidden = false
},
err_param_has_ext_link = {
message = 'External link in <code class="cs1-code">$1</code>', -- $1 is parameter name
anchor = 'param_has_ext_link',
category = 'CS1 errors: external links',
hidden = false
},
err_parameter_ignored = {
message = 'Unknown parameter <code class="cs1-code">&#124;$1=</code> ignored', -- $1 is parameter name
anchor = 'parameter_ignored',
category = 'CS1 errors: unsupported parameter',
hidden = false
},
err_parameter_ignored_suggest = {
message = 'Unknown parameter <code class="cs1-code">&#124;$1=</code> ignored (<code class="cs1-code">&#124;$2=</code> suggested)', -- $1 is unknown parameter $2 is suggested parameter name
anchor = 'parameter_ignored_suggest',
category = 'CS1 errors: unsupported parameter',
hidden = false
},
err_periodical_ignored = {
message = '<code class="cs1-code">&#124;$1=</code> ignored', -- $1 is parameter name
anchor = 'periodical_ignored',
category = 'CS1 errors: periodical ignored',
hidden = false
},
err_redundant_parameters = {
message = 'More than one of $1 specified', -- $1 is error message detail
anchor = 'redundant_parameters',
category = 'CS1 errors: redundant parameter',
hidden = false
},
err_script_parameter = {
message = 'Invalid <code class="cs1-code">&#124;$1=</code>: $2', -- $1 is parameter name $2 is script language code or error detail
anchor = 'script_parameter',
category = 'CS1 errors: script parameters',
hidden = false
},
err_ssrn_missing = {
message = '<code class="cs1-code">&#124;ssrn=</code> required',
anchor = 'ssrn_missing',
category = 'CS1 errors: SSRN',
hidden = false
},
err_text_ignored = {
message = 'Text "$1" ignored', -- $1 is ignored text
anchor = 'text_ignored',
category = 'CS1 errors: unrecognized parameter',
hidden = false
},
err_trans_missing_title = {
message = '<code class="cs1-code">&#124;trans-$1=</code> requires <code class="cs1-code">&#124;$1=</code> or <code class="cs1-code">&#124;script-$1=</code>', -- $1 is base parameter name
anchor = 'trans_missing_title',
category = 'CS1 errors: translated title',
hidden = false
},
-- error entry whose message lists the empty unknown parameter(s) found in a cite
err_param_unknown_empty = {
message = 'Cite has empty unknown parameter$1: $2', -- $1 is 's' or empty space; $2 is empty unknown param list
anchor = 'param_unknown_empty',
category = 'CS1 errors: empty unknown parameters',
hidden = false
},
err_vancouver = {
message = 'Vancouver style error: $1 in name $2', -- $1 is error detail, $2 is the nth name
anchor = 'vancouver',
category = 'CS1 errors: Vancouver style',
hidden = false
},
err_wikilink_in_url = {
message = 'URL–wikilink conflict', -- uses ndash
anchor = 'wikilink_in_url',
category = 'CS1 errors: URL–wikilink conflict', -- uses ndash
hidden = false
},
 
 
--[[--------------------------< M A I N T >-------------------------------------
 
maint messages do not have a message (message = nil); otherwise the structure
is the same as error messages
 
]]
 
maint_archived_copy = {
message = nil,
anchor = 'archived_copy',
category = 'CS1 maint: archived copy as title',
hidden = true,
},
},
err_redundant_parameters = {
maint_bibcode = {
message = 'More than one of $1 specified', -- $1 is error message detail
message = nil,
anchor = 'redundant_parameters',
anchor = 'bibcode',
category = 'CS1 errors: redundant parameter',
category = 'CS1 maint: bibcode',
hidden = false
hidden = true,
},
},
err_script_parameter = {
maint_location_no_publisher = { -- cite book, conference, encyclopedia; citation as book cite or encyclopedia cite
message = 'Invalid <code class="cs1-code">&#124;$1=</code>: $2', -- $1 is parameter name $2 is script language code or error detail
message = nil,
anchor = 'script_parameter',
anchor = 'location_no_publisher',
category = 'CS1 errors: script parameters',
category = 'CS1 maint: location missing publisher',
hidden = false
hidden = true,
},
},
err_ssrn_missing = {
maint_bot_unknown = {
message = '<code class="cs1-code">&#124;ssrn=</code> required',
message = nil,
anchor = 'ssrn_missing',
anchor = 'bot:_unknown',
category = 'CS1 errors: SSRN', -- same as bad arxiv
category = 'CS1 maint: bot: original URL status unknown',
hidden = false
hidden = true,
},
},
err_text_ignored = {
maint_date_auto_xlated = { -- date auto-translation not supported by en.wiki
message = 'Text "$1" ignored', -- $1 is ignored text
message = nil,
anchor = 'text_ignored',
anchor = 'date_auto_xlated',
category = 'CS1 errors: unrecognized parameter',
category = 'CS1 maint: date auto-translated',
hidden = false
hidden = true,
},
},
err_trans_missing_title = {
maint_date_format = {
message = '<code class="cs1-code">&#124;trans-$1=</code> requires <code class="cs1-code">&#124;$1=</code> or <code class="cs1-code">&#124;script-$1=</code>', -- $1 is base parameter name
message = nil,
anchor = 'trans_missing_title',
anchor = 'date_format',
category = 'CS1 errors: translated title',
category = 'CS1 maint: date format',
hidden = false
hidden = true,
},
},
err_param_unknown_empty = {
maint_date_year = {
message = 'Cite has empty unknown parameter$1: $2', -- $1 is 's' or empty space; $2 is empty unknown param list
message = nil,
anchor = 'param_unknown_empty',
anchor = 'date_year',
category = 'CS1 errors: empty unknown parameters',
category = 'CS1 maint: date and year',
hidden = false
hidden = true,
},
},
err_vancouver = {
maint_doi_ignore = {
message = 'Vancouver style error: $1 in name $2', -- $1 is error detail, $2 is the nth name
anchor = 'vancouver',
category = 'CS1 errors: Vancouver style',
hidden = false
},
err_wikilink_in_url = {
message = 'URL–wikilink conflict', -- uses ndash
anchor = 'wikilink_in_url',
category = 'CS1 errors: URL–wikilink conflict', -- uses ndash
hidden = false
},
 
 
--[[--------------------------< M A I N T >-------------------------------------
 
maint messages do not have a message (message = nil); otherwise the structure
is the same as error messages
 
]]
 
maint_archived_copy = {
message = nil,
message = nil,
anchor = 'archived_copy',
anchor = 'doi_ignore',
category = 'CS1 maint: archived copy as title',
category = 'CS1 maint: ignored DOI errors',
hidden = true,
hidden = true,
},
},
maint_authors = {
maint_doi_inactive = {
message = nil,
message = nil,
anchor = 'authors',
anchor = 'doi_inactive',
category = 'CS1 maint: uses authors parameter',
category = 'CS1 maint: DOI inactive',
hidden = true,
hidden = true,
},
},
maint_bot_unknown = {
maint_doi_inactive_dated = {
message = nil,
message = nil,
anchor = 'bot:_unknown',
anchor = 'doi_inactive_dated',
category = 'CS1 maint: bot: original URL status unknown',
category = 'CS1 maint: DOI inactive as of $2$3$1', -- $1 is year, $2 is month-name or empty string, $3 is space or empty string
hidden = true,
},
maint_date_auto_xlated = { -- date auto-translation not supported by en.wiki
message = nil,
anchor = 'date_auto_xlated',
category = 'CS1 maint: date auto-translated',
hidden = true,
},
maint_date_format = {
message = nil,
anchor = 'date_format',
category = 'CS1 maint: date format',
hidden = true,
},
maint_date_year = {
message = nil,
anchor = 'date_year',
category = 'CS1 maint: date and year',
hidden = true,
},
maint_doi_ignore = {
message = nil,
anchor = 'doi_ignore',
category = 'CS1 maint: ignored DOI errors',
hidden = true,
hidden = true,
},
},
maint_doi_inactive = {
maint_doi_unflagged_free = {
message = nil,
message = nil,
anchor = 'doi_inactive',
anchor = 'doi_unflagged_free',
category = 'CS1 maint: DOI inactive',
category = 'CS1 maint: unflagged free DOI',
hidden = true,
},
maint_doi_inactive_dated = {
message = nil,
anchor = 'doi_inactive_dated',
category = 'CS1 maint: DOI inactive as of $2$3$1', -- $1 is year, $2 is month-name or empty string, $3 is space or empty string
hidden = true,
hidden = true,
},
},
Line 1,756: Line 2,000:
anchor = 'others_avm',
anchor = 'others_avm',
category = 'CS1 maint: others in cite AV media (notes)',
category = 'CS1 maint: others in cite AV media (notes)',
hidden = true,
},
maint_overridden_setting = {
message = nil,
anchor = 'overridden',
category = 'CS1 maint: overridden setting',
hidden = true,
hidden = true,
},
},
Line 1,804: Line 2,054:
anchor = 'url_status',
anchor = 'url_status',
category = 'CS1 maint: url-status',
category = 'CS1 maint: url-status',
hidden = true,
},
maint_year= {
message = nil,
anchor = 'year',
category = 'CS1 maint: year',
hidden = true,
hidden = true,
},
},
Line 1,813: Line 2,069:
},
},
}
}
--[[--------------------------< I D _ L I M I T S _ D A T A _ T >----------------------------------------------

Build <id_limits_data_t>, a table of k/v pairs where k is an identifier name and v is the upper limit for that
identifier.  The limits are read from c:Data:CS1/Identifier limits.tab, a json tabular data file maintained at
Wikimedia Commons.  Each row of the tabular data is a sequence: row[1] is the identifier, row[2] is its limit.

The values in <id_limits_data_t> are used to set handler.id_limit in the identifier handlers.

]]

local id_limits_data_t = {};

do																				-- keep the temporary names out of the module's top-level scope
	local limits_tab_t = mw.ext.data.get ("CS1/Identifier limits.tab");		-- fetch the tabular data
	for _, row_t in ipairs (limits_tab_t.data) do								-- spin through the rows
		local identifier, upper_limit = row_t[1], row_t[2];
		id_limits_data_t[identifier] = upper_limit;								-- convert the row to a k/v pair
	end
end




Line 1,854: Line 2,125:
q = 'Q118398',
q = 'Q118398',
label = 'arXiv',
label = 'arXiv',
prefix = 'https://arxiv.org/abs/', -- protocol-relative tested 2013-09-04
prefix = 'https://arxiv.org/abs/',
encode = false,
encode = false,
COinS = 'info:arxiv',
COinS = 'info:arxiv',
Line 1,925: Line 2,196:
q = 'Q46339674',
q = 'Q46339674',
label = 'eISSN',
label = 'eISSN',
prefix = 'https://www.worldcat.org/issn/',
prefix = 'https://search.worldcat.org/issn/',
COinS = 'rft.eissn',
COinS = 'rft.eissn',
encode = false,
encode = false,
Line 1,968: Line 2,239:
q = 'Q131276',
q = 'Q131276',
label = 'ISSN',
label = 'ISSN',
prefix = 'https://www.worldcat.org/issn/',
prefix = 'https://search.worldcat.org/issn/',
COinS = 'rft.issn',
COinS = 'rft.issn',
encode = false,
encode = false,
Line 1,990: Line 2,261:
q = 'Q1420342',
q = 'Q1420342',
label = 'JSTOR',
label = 'JSTOR',
prefix = 'https://www.jstor.org/stable/', -- protocol-relative tested 2013-09-04
prefix = 'https://www.jstor.org/stable/',
COinS = 'pre', -- use prefix value
COinS = 'pre', -- use prefix value
encode = false,
encode = false,
Line 2,002: Line 2,273:
q = 'Q620946',
q = 'Q620946',
label = 'LCCN',
label = 'LCCN',
prefix = 'https://lccn.loc.gov/', -- protocol-relative tested 2015-12-28
prefix = 'https://lccn.loc.gov/',
COinS = 'info:lccn',
COinS = 'info:lccn',
encode = false,
separator = '&nbsp;',
},
['MEDRXIV'] = {
parameters = {'medrxiv'},
link = 'medRxiv',
redirect = 'medRxiv (identifier)',
q = 'Q58465838',
label = 'medRxiv',
prefix = 'https://www.medrxiv.org/content/',
COinS = 'pre', -- use prefix value
access = 'free', -- free to read
encode = false,
encode = false,
separator = '&nbsp;',
separator = '&nbsp;',
Line 2,024: Line 2,307:
q = 'Q190593',
q = 'Q190593',
label = 'OCLC',
label = 'OCLC',
prefix = 'https://www.worldcat.org/oclc/',
prefix = 'https://search.worldcat.org/oclc/',
COinS = 'info:oclcnum',
COinS = 'info:oclcnum',
encode = true,
encode = true,
separator = '&nbsp;',
separator = '&nbsp;',
id_limit = 9999999999, -- 10-digits
id_limit = id_limits_data_t.OCLC or 0,
},
},
['OL'] = {
['OL'] = {
Line 2,048: Line 2,331:
q = 'Q2015776',
q = 'Q2015776',
label = 'OSTI',
label = 'OSTI',
prefix = 'https://www.osti.gov/biblio/', -- protocol-relative tested 2018-09-12
prefix = 'https://www.osti.gov/biblio/',
COinS = 'pre', -- use prefix value
COinS = 'pre', -- use prefix value
encode = true,
encode = true,
separator = '&nbsp;',
separator = '&nbsp;',
id_limit = 23010000,
id_limit = id_limits_data_t.OSTI or 0,
custom_access = 'osti-access',
custom_access = 'osti-access',
},
},
Line 2,066: Line 2,349:
encode = true,
encode = true,
separator = '&nbsp;',
separator = '&nbsp;',
id_limit = 10500000,
id_limit = id_limits_data_t.PMC or 0,
access = 'free', -- free to read
access = 'free', -- free to read
},
},
Line 2,079: Line 2,362:
encode = false,
encode = false,
separator = '&nbsp;',
separator = '&nbsp;',
id_limit = 37900000,
id_limit = id_limits_data_t.PMID or 0,
},
},
['RFC'] = {
['RFC'] = {
Line 2,091: Line 2,374:
encode = false,
encode = false,
separator = '&nbsp;',
separator = '&nbsp;',
id_limit = 9300,
id_limit = id_limits_data_t.RFC or 0,
access = 'free', -- free to read
access = 'free', -- free to read
},
},
Line 2,113: Line 2,396:
encode = true,
encode = true,
separator = '&nbsp;',
separator = '&nbsp;',
id_limit = 4600000,
id_limit = id_limits_data_t.SSRN or 0,
custom_access = 'ssrn-access',
custom_access = 'ssrn-access',
},
},
Line 2,126: Line 2,409:
encode = false,
encode = false,
separator = '&nbsp;',
separator = '&nbsp;',
id_limit = 262000000,
id_limit = id_limits_data_t.S2CID or 0,
custom_access = 's2cid-access',
custom_access = 's2cid-access',
},
},
Line 2,158: Line 2,441:


return {
return {
use_identifier_redirects = true, -- when true use redirect name for identifier label links; always true at en.wiki
use_identifier_redirects = use_identifier_redirects, -- booleans defined in the settings at the top of this module
local_lang_cat_enable = false; -- when true categorizes pages where |language=<local wiki's language>; always false at en.wiki
local_lang_cat_enable = local_lang_cat_enable,
date_name_auto_xlate_enable = false; -- when true translates English month-names to the local-wiki's language month names; always false at en.wiki
date_name_auto_xlate_enable = date_name_auto_xlate_enable,
date_digit_auto_xlate_enable = false; -- when true translates Western date digit to the local-wiki's language digits (date_names['local_digits']); always false at en.wiki
date_digit_auto_xlate_enable = date_digit_auto_xlate_enable,
enable_sort_keys = enable_sort_keys,
-- tables and variables created when this module is loaded
-- tables and variables created when this module is loaded
global_df = get_date_format (), -- this line can be replaced with "global_df = 'dmy-all'," to have all dates auto translated to dmy format.
global_df = get_date_format (), -- this line can be replaced with "global_df = 'dmy-all'," to have all dates auto translated to dmy format.
global_cs1_config_t = global_cs1_config_t, -- global settings from {{cs1 config}}
punct_skip = build_skip_table (punct_skip, punct_meta_params),
punct_skip = build_skip_table (punct_skip, punct_meta_params),
url_skip = build_skip_table (url_skip, url_meta_params),
url_skip = build_skip_table (url_skip, url_meta_params),
known_free_doi_registrants_t = build_free_doi_registrants_table(),


name_space_sort_keys = name_space_sort_keys,
aliases = aliases,
aliases = aliases,
special_case_translation = special_case_translation,
special_case_translation = special_case_translation,
Line 2,175: Line 2,462:
editor_markup_patterns = editor_markup_patterns,
editor_markup_patterns = editor_markup_patterns,
et_al_patterns = et_al_patterns,
et_al_patterns = et_al_patterns,
extended_registrants_t = extended_registrants_t,
id_handlers = id_handlers,
id_handlers = id_handlers,
keywords_lists = keywords_lists,
keywords_lists = keywords_lists,
Line 2,188: Line 2,476:
prop_cats = prop_cats,
prop_cats = prop_cats,
script_lang_codes = script_lang_codes,
script_lang_codes = script_lang_codes,
lang_code_remap = lang_code_remap,
lang_tag_remap = lang_tag_remap,
lang_name_remap = lang_name_remap,
lang_name_remap = lang_name_remap,
this_wiki_code = this_wiki_code,
this_wiki_code = this_wiki_code,