Module:Lang: Difference between revisions

Content deleted Content added
m 1 revision imported
m 1 revision imported
(5 intermediate revisions by 2 users not shown)
Line 5:
require('Module:No globalsstrict');
local getArgs = require ('Module:Arguments').getArgs;
Line 25:
local namespace = mw.title.getCurrentTitle().namespace; -- used for categorization
local this_wiki_langcontent_lang = mw.language.getContentLanguage().code; -- get this wiki's language
local this_wiki_lang_tag = content_lang.code; -- get this wiki's language tag
local this_wiki_lang_dir = content_lang:getDir(); -- get this wiki's language direction
local initial_style_state; -- set by lang_xx_normal() and lang_xx_italic()
Line 385 ⟶ 387:
else -- cheap way to determine if there are prefixes; fonipa and others don't have prefixes; # operator always returns 0
if variant_table[variant]['prefixes'][1] and not in_array (code, variant_table[variant]['prefixes']) then
return code, script, region, nil, nil, table.concat ({'unrecognized variant: ', variant, ' for code: ', code});
if is_set (private) then
private = private:lower(); -- ensure that we use and return lower case version of this
Line 419 ⟶ 421:
table.insert (out, table.concat ({'[', args.text or 'undefined', '] '})); -- for error messages output args.text if available
table.insert (out, table.concat ({'<span style=\"font-sizecolor: 100%; font-style: normal;\" class=\"error#d33\">Error: {{', template, '}}: '}));
table.insert (out, msg);
table.insert (out, table.concat ({' ([[:Category:', category, ' template errors|help]])'}));
table.insert (out, '</span>');
if (0 == namespace or 10 == namespace) and not args.nocat then -- categorize in article space (and template space to take care of broken usages)
table.insert (out, table.concat ({'[[Category:', category, ' template errors]]'}));
Line 464 ⟶ 466:
if text:find ('^\n[%*:;#]') then -- look for list markup; list markup must begin at start of text
if 'italic' == style then
return mw.ustring.text:gsub (text, '(\n[%*:;#]+)([^\n]+)', '%1<i>%2</i>'); -- insert italic markup at each list item
return text;
Line 482 ⟶ 484:
return text;
--[[--------------------------< T I T L E _ W R A P P E R _ M A K E >------------------------------------------

Makes a <span title="<title text>"><content_text></span> or <div title="<title text>"><content_text></div> where
<title text> is in the tool-tip in the wiki's local language and <content_text> is non-local-language text in
html markup.  This is done because the lang= attribute applies to the content of its enclosing tag.

Parameters:
	<title_text>	string placed verbatim inside the title="..." attribute of the wrapper tag
	<content_text>	string (already-rendered html markup) placed verbatim between the opening and closing wrapper tags
	<tag>			string 'div' or 'span' used to choose the correct wrapping tag

Returns the assembled wrapper as a single string.  Neither <title_text> nor <content_text> is escaped here.

]]

local function title_wrapper_make (title_text, content_text, tag)
	local wrapper_t = {};

	table.insert (wrapper_t, table.concat ({'<', tag}));						-- open opening wrapper tag
	table.insert (wrapper_t, ' title=\"');										-- begin title attribute
	table.insert (wrapper_t, title_text);										-- add <title_text>
	table.insert (wrapper_t, '\">');											-- end title attribute and close opening wrapper tag
	table.insert (wrapper_t, content_text);										-- add <content_text>
	table.insert (wrapper_t, table.concat ({'</', tag, '>'}));					-- add closing wrapper tag

	return table.concat (wrapper_t);											-- make a big string and done
end
Line 489 ⟶ 514:
Add the html markup to text according to the type of content that it is: <span> or <i> tags for inline content or
<div> tags for block content
The lang= attribute also applies to the content of the tag where it is placed so this is wrong because 'Spanish
language text' is English:
<i lang="es" title="Spanish language text">casa</i>
should be:
<span title="Spanish language text"><i lang="es">casa</i></span>
or for <div>...</div>:
<div title="Spanish language text"><div lang="es"><spanish-language-text></div></div>
local function make_text_html (code, text, tag, rtl, style, size, language)
local htmlhtml_t = {};
local style_added = '';
local wrapper_tag = tag; -- <tag> gets modified so save a copy for use when/if we create a wrapper span or div
if text:match ('^%*') then
table.insert (htmlhtml_t, '&#42;'); -- move proto language text prefix outside of italic markup if any; use numeric entity because plain splat confuses MediaWiki
text = text:gsub ('^%*', ''); -- remove the splat from the text
Line 509 ⟶ 543:
table.insert (htmlhtml_t, table.concat ({'<', tag})); -- open the <i>, <span>, or <div> html tag
code = code:gsub ('%-x%-.*', ''); -- strip private use subtag from code tag because meaningless outside of wikipedia
table.insert (html, table.concat ({' lang="', code, '\"'})); -- add language attribute
table.insert (html_t, table.concat ({' lang="', code, '\"'})); -- add language attribute
if (rtl or unicode.is_rtl(text)) and ('ltr' == this_wiki_lang_dir) then -- text is right-to-left on a left-to-right wiki
table.insert (htmlhtml_t, ' dir="rtl"'); -- add direction attribute for right -to -left languages
elseif not (rtl or unicode.is_rtl(text)) and ('rtl' == this_wiki_lang_dir) then -- text is left-to-right on a right-to-left wiki
table.insert (html_t, ' dir="ltr"'); -- add direction attribute for left-to-right languages
if 'normal' == style then -- when |italic=no
table.insert (htmlhtml_t, ' style=\"font-style: normal;'); -- override external markup, if any
style_added = '\"'; -- remember that style attribute added and is not yet closed
Line 523 ⟶ 560:
if is_set (size) then -- when |size=<something>
if is_set (style_added) then
table.insert (htmlhtml_t, table.concat ({' font-size: ', size, ';'})); -- add when style attribute already inserted
table.insert (htmlhtml_t, table.concat ({' style=\"font-size: ', size, ';'})); -- create style attribute
style_added = '\"'; -- remember that style attribute added and is not yet closed
table.insert (html_t, table.concat ({style_added, '>'})); -- close the opening html tag
if is_set (language) then
table.insert (htmlhtml_t, table.concat ({style_added, ' title=\"', language})text); --start theinsert titlethe text
if language:find ('languages') then
table.insert (html, ' collective text'); -- for collective languages
table.insert (html, '-language text'); -- for individual languages
table.insert (html, '\">'); -- close the opening html tag
table.insert (html, table.concat ({style_added, '>'})); -- close the style attribute and close opening html tag
table.insert (html, text); -- insert the text
table.insert (htmlhtml_t, table.concat ({'</', tag, '>'})); -- close the 'text' <i>, <span>, or <div> html tag
if rtlis_set (language) then -- legacy;create shouldn'ta be<title_text> necessarystring because all offor the rtltitle= textattribute isin wrappeda insidewrapper anspan html tag with dir="rtl" attributeor div
local title_text;
table.insert (html, '&lrm;'); -- make sure the browser knows that we're at the end of the rtl
if 'zxx' == code then -- special case for this tag 'no linguistic content'
title_text = table.concat ({language, ' text'}); -- not a language so don't use 'language' in title text
elseif mw.ustring.find (language, 'languages', 1, true) then
title_text = table.concat ({language, ' collective text'}); -- for collective languages
title_text = table.concat ({language, '-language text'}); -- for individual languages
return title_wrapper_make (title_text, table.concat (html_t), wrapper_tag);
return table.concat (html_t);
return table.concat (html); -- put it all together and done
Line 573 ⟶ 610:
if language_name:mw.ustring.find (language_name, 'languages', 1, true) then
return table.concat ({'[[Category:Articles with text in ', language_name, ']]'});
Line 579 ⟶ 616:
table.insert (cat, '[[Category:Articles containing ');
if 'en'this_wiki_lang_tag == code then
table.insert (cat, 'explicitly cited ' .. language_name); -- fallsunique backcategory toname Englishfor if regional namethe notlocal availablelanguage
table.insert (cat, language_name);
Line 611 ⟶ 648:
local function make_translit (code, language_name, translit, std, tscript, style)
local title;
local toutout_t = {};
local title_tabletitle_t = lang_data.translit_title_table; -- table of transliteration standards and the language codes and scripts that apply to those standards
local title_text = ''; -- tool tip text for title= attribute
if is_set (code) then -- when a language code is provided (always with {{lang-xx}} templates, not always with {{transl}})
if not style then -- nil for the default italic style
table.insert (tout, "<i lang=\""); -- so use <i> tag
table.insert (tout, table.concat ({'<span style=\"font-style: ', style, '\" lang=\"'})); -- non-standard style, construct a span tag for it
table.insert (tout, code);
table.insert (tout, "-Latn\" title=\""); -- transliterations are always Latin script
table.insert (tout, "<span title=\""); -- when no language code: no lang= attribute, not italic ({{transl}} only)
std = std and std:lower(); -- lower case for table indexing
if not is_set (std) and not is_set (tscript) then -- when neither standard nor script specified
table.inserttitle_text (tout,= language_name); -- write a generic tool tip
if not language_name:mw.ustring.find (language_name, 'languages', 1, true) then -- collective language names (plural 'languages' is part of the name)
table.inserttitle_text (tout,= title_text .. '-language') ; -- skip this text (individual and macro languages only)
table.inserttitle_text (tout,= title_text .. ' romanization'); -- finish the tool tip; use romanization when neither script nor standard supplied
elseif is_set (std) and is_set (tscript) then -- when both are specified
if title_tabletitle_t[std] then -- and if standard is legitimate
if title_tabletitle_t[std][tscript] then -- and if script for that standard is legitimate
if script_table[tscript] then
table.insert (tout, table.concat ({title_table[std][tscript:lower()], ' (', script_table[tscript][1], ' script) transliteration'})); -- add the appropriate text to the tool tip
title_text = title_text .. table.concat ({title_t[std][tscript:lower()], ' (', script_table[tscript], ' script) transliteration'}); -- add the appropriate text to the tool tip
title_text = title_text .. title_t[std]['default']; -- use the default if script not in std table; TODO: maint cat? error message because script not found for this standard?
table.inserttitle_text (tout,= title_text .. title_tabletitle_t[std]['default']); -- use the default if script not in std table; TODO: maint cat? error message because script not found for this standard?
Line 646 ⟶ 677:
elseif is_set (std) then -- translit-script not set, use language code
if not title_tabletitle_t[std] then return ''; end -- invalid standard, setup for error message
if title_tabletitle_t[std][code] then -- if language code is in the table (transl may not provide a language code)
-- tabletitle_text = title_text ..insert (tout, table.concat ({title_tabletitle_t[std][code:lower()], ' (', lang_table[code][1]language_name, ' language) transliteration'})); -- add the appropriate text to the tool tip
table.insert (tout, table.concat ({title_table[std][code:lower()], ' (', language_name, ' language) transliteration'})); -- add the appropriate text to the tool tip
else -- code doesn't match
table.inserttitle_text (tout,= title_text .. title_tabletitle_t[std]['default']); -- so use the standard's default
else -- here if translit-script set but translit-std not set
if title_tabletitle_t['no_std'][tscript] then
table.inserttitle_text (tout,= title_text .. title_tabletitle_t['no_std'][tscript]); -- use translit-script if set
elseif title_tabletitle_t['no_std'][code] then
table.inserttitle_text (tout,= title_text .. title_tabletitle_t['no_std'][code]); -- use language code
if is_set (tscript) then
table.inserttitle_text (tout,= title_text .. table.concat ({language_name, '-script transliteration'})); -- write a script tool tip
elseif is_set (code) then
if not language_name:mw.ustring.find (language_name, 'languages', 1, true) then -- collective language names (plural 'languages' is part of the name)
table.inserttitle_text (tout,= title_text .. '-language') ; -- skip this text (individual and macro languages only)
table.inserttitle_text (tout,= title_text .. ' transliteration'); -- finish the tool tip
table.inserttitle_text (tout,= title_text .. ' transliteration'); -- generic tool tip (can we ever get here?)
local close_tag;
table.insert (tout, '">');
if is_set (code) then -- when a language code is provided (always with {{lang-xx}} templates, not always with {{transl}})
table.insert (tout, translit);
code = code:match ('^(%a%a%a?)'); -- strip all subtags leaving only the language subtag
if is_set (code) and not style then -- when a language code is provided (always with {{lang-xx}} templates, not always with {{transl}})
table.insert (tout, "</i>"); -- close the italic tag
if not style then -- nil for the default italic style
table.insert (out_t, "<i lang=\""); -- so use <i> tag
close_tag = '</i>'; -- tag to be used when closing
table.insert (out_t, table.concat ({'<span style=\"font-style: ', style, '\" lang=\"'})); -- non-standard style, construct a span tag for it
close_tag = '</span>'; -- tag to be used when closing
table.insert (out_t, code);
table.insert (out_t, "-Latn\">"); -- transliterations are always Latin script
table.insert (out_t, "<span>"); -- when no language code: no lang= attribute, not italic ({{transl}} only)
close_tag = '</span>';
table.insert (out_t, translit); -- add the translit text
table.insert (out_t, close_tag); -- and add the appropriate </i> or </span>
if '' == title_text then -- when there is no need for a tool-tip
return table.concat (out_t); -- make a string and done
return title_wrapper_make (title_text, table.insertconcat (toutout_t), "</'span>"'); -- nowrap languagewith codea sotool-tip closespan the spanand tagdon
return table.concat (tout);
Line 849 ⟶ 898:
if override_table[ietf] then -- look for whole IETF tag in override table
name = override_table[ietf][1];
elseif override_table[code] then -- not there so try basic language codetag
name = override_table[code][1];
elseif lang_table[code] then -- shift to iana codeactive tag/name table
name = lang_table[code][1]; -- table entries sometimes have multiple names, always take the first one
elseif lang_dep_table[code] then -- try the iana deprecated tag/name table
name = lang_dep_table[code];
-- if cat then
-- table.insert (maint_cats, table.concat ({'Lang and lang-xx using deprecated ISO 639 codes|', code}));
-- table.insert (maint_msgs, table.concat ({'code: ', code, ' is deprecated'}));
-- end
name = lang_dep_table[code][1]; -- table entries sometimes have multiple names, always take the first one
Line 892 ⟶ 937:
local template = args.template or 'Lang';
maint_cats = {}; -- initialize because when this module is required into another module, these are only declared once so only initialized once
maint_msgs = {};
validate_cat_args (args); -- determine if categorization should be suppressed
Line 933 ⟶ 981:
if nil == args.italic then -- nil when |italic= absent or not set or |italic=default; args.italic controls
if ('latn' == subtags.script) or -- script is latn
(this_wiki_langthis_wiki_lang_tag ~= code and not is_set (subtags.script) and not has_poem_tag (args.text) and unicode.is_Latin (args.text)) then -- text not this wiki's language, no script specified and not in poem markup but is wholly latn script (auto-italics)
args.italic = 'italic'; -- DEFAULT for {{lang}} templates is upright; but if latn script set for font-style:italic
Line 992 ⟶ 1,040:
return _lang (args);
--[[--------------------------< T R A N S L A T I O N _ M A K E >----------------------------------------------
stand-alone function to create literal translation of main text
Also used by {{lang-x2}}
]]
local function translation_make (args_t)
local translation_t = {', '}; -- initialize output
if 'none' ~= args_t.label then -- if we want a label
table.insert (translation_t, '<small>'); -- open the <small> html tag
if 'no' == then
table.insert (translation_t, '<abbr title="literal translation">lit.</abbr>'); -- unlinked form
table.insert (translation_t, make_wikilink ('Literal translation', 'lit.')); -- linked form
table.insert (translation_t, "&thinsp;</small>"); -- close the <small> html tag
table.insert (translation_t, table.concat ({'&#39;', args_t.translation, '&#39;'})); -- use html entities to avoid wiki markup confusion
return table.concat (translation_t); -- make a big string and done
Line 1,053 ⟶ 1,126:
local template = args.template or 'Lang-xx';
maint_cats = {}; -- initialize because when this module is required into another module, these are only declared once so only initialized once
maint_msgs = {};
if args[1] and args.text then
return make_error_msg ('conflicting: {{{1}}} and |text=', args, template);
Line 1,140 ⟶ 1,216:
table.insert (out, language_name); -- language name without wikilink
if language_name:mw.ustring.find (language_name, 'languages', 1, true) then
table.insert (out, make_wikilink (language_name)); -- collective language name uses simple wikilink
elseif lang_data.article_name[code] then
table.insert (out, make_wikilink (lang_data.article_name[code][1], language_name)); -- language name with wikilink from override data
table.insert (out, make_wikilink (language_name .. ' language', language_name)); -- language name with wikilink
Line 1,164 ⟶ 1,240:
table.insert (out, '<small>');
if script_table[args['translit-script']] then -- when |translit-script= is set, try to use the script's name
translit_script_name = script_table[args['translit-script'][1]];
translit_script_name = language_name; -- fall back on language name
Line 1,186 ⟶ 1,262:
if is_set (args.translation) then -- translation (not supported in {{lang}})
table.insert (out, ',translation_make '(args));
if 'none' ~= args.label then
table.insert (out, '<small>');
if 'no' == then
table.insert (out, '<abbr title="literal translation">lit.</abbr>');
table.insert (out, make_wikilink ('Literal translation', 'lit.'));
table.insert (out, "&thinsp;</small>");
table.insert (out, table.concat ({'&#39;', args.translation, '&#39;'})); -- use html entities to avoid wiki markup confusion
Line 1,353 ⟶ 1,419:
if msg then
local template = (args['template'] and table.concat ({'{{', args['template'], '}}: '})) or ''; -- make template name (if provided by the template)
return table.concat ({'<span style=\"font-sizecolor: 100%; font-style: normal;\" class=\"error#d33\">Error: ', template, msg, '</span>'});
Line 1,362 ⟶ 1,428:
if link then -- when |link=yes, wikilink the language name
if language_name:mw.ustring.find (language_name, 'languages', 1, true) then
language_name = make_wikilink (language_name, label); -- collective language name uses simple wikilink
elseif lang_data.article_name[code] then
language_name = make_wikilink (lang_data.article_name[code][1], label or language_name); -- language name with wikilink from override data
language_name = make_wikilink (language_name .. ' language', label or language_name); -- language name with wikilink
Line 1,417 ⟶ 1,483:
template = table.concat ({'{{', args['template'], '}}: '}); -- make template name (if provided by the template)
return table.concat ({'<span style=\"font-sizecolor: 100%; font-style: normal;\" class=\"error#d33\">Error: ', template, msg, '</span>'});
Line 1,458 ⟶ 1,524:
local msg; -- for when called functions return an error message
maint_cats = {}; -- initialize because when this module is required into another module, these are only declared once so only initialized once
maint_msgs = {};
if is_set (args[3]) then -- [3] set when {{transl|code|standard|text}}
args.text = args[3]; -- get the transliterated text
Line 1,469 ⟶ 1,538:
args.text = args[2]; -- get the transliterated text
if args[1] and (args[1]:match ('^%a%a%a?%a?$') thenor -- args[2] missing; is args[1] a codelanguage or itsscript tag or is it the transliterated text?
return make_error_msgargs[1]:match ('no text', args, 'Transl^%a%a%a?%-x%-');) then -- or is args[1] is a code so we're missingprivate-use texttag
return make_error_msg ('no text', args, 'Transl'); -- args[1] is a code so we're missing text
args.text = args[1]; -- args[1] is not a code so we're missing that; assign args.text for error message
Line 1,479 ⟶ 1,549:
if is_set (args[1]) then -- IANA language code used for html lang= attribute; or ISO 15924 script code
if args[1]:match ('^%a%a%a?%a?$') or args[1]:match ('^%a%a%a?%-x%-') then -- args[1] has correct form?
args.code = args[1]:lower(); -- use the language/script code; only (2, 3, or 4 alpha characters) or private-use; lower case because table indexes are lower case
return make_error_msg (table.concat ({'unrecognized language / script code: ', args[1]}), args, 'Transl'); -- invalid language / script code
Line 1,498 ⟶ 1,568:
if override_table[args.code] then -- is code a language code defined in the override table?
language_name = override_table[args.code][1];
args.code = args.code:match ('^%a%a%a?'); -- if private use, strip all but language subtag
elseif lang_table[args.code] then -- is code a language code defined in the standard language code tables?
language_name = lang_table[args.code][1];
elseif lang_dep_table[args.code] then -- is code a language code defined in the deprecated language code tables?
language_name = lang_dep_table[args.code][1];
elseif script_table[args.code] then -- if here, code is not a language code; is it a script code?
language_name = script_table[args.code][1];
script = args.code; -- code was an ISO 15924 script so use that instead
args.code = ''; -- unset because not a language code
Line 1,536 ⟶ 1,607:
local function _category_from_tag (argsargs_t)
local subtags = {}; -- IETF subtags script, region, variant, and private
local raw_code = argsargs_t[1]; -- save a copy of the input IETF subtag
local link = 'yes' == args['']; -- make a boolean
local label = argsargs_t.label;
local code; -- the language code
local msg; -- gets an error message if IETF language tag is malformed or invalid
Line 1,547 ⟶ 1,618:
code, subtags.script, subtags.region, subtags.variant, subtags.private, msg = get_ietf_parts (raw_code);
if msg then
local template = (args['args_t.template'] and table.concat ({'{{', args['args_t.template'], '}}: '})) or ''; -- make template name (if provided by the template)
return table.concat ({'<span style=\"font-sizecolor: 100%; font-style: normal;\" class=\"error#d33\">Error: ', template, msg, '</span>'});
Line 1,555 ⟶ 1,626:
category_name = make_category (code, category_name, nil, true):gsub ('[%[%]]', '');
if link then
return category_name;
return table.concat ({'[[:', category_name, ']]'});
return category_name;
Line 1,594 ⟶ 1,669:
_name_from_tag = _name_from_tag,
_transl = _transl,
_translation_make = translation_make,