模块:Lang:修订间差异
imported>Tigerzeng |
imported>Ericliu1912 依據編輯請求更新頁面 自Module:Lang/sandbox合并優枰的版本90980088 |
||
| (未显示8个用户的25个中间版本) | |||
| 第1行: | 第1行: | ||
--[=[ | --[=[ | ||
Lua support for the {{lang}}, {{lang- | Lua support for the {{lang}}, {{langx}}, {{lang-??}}, and {{transliteration}} templates and replacement of various supporting templates. | ||
-- 中文維基百科:加入了error_msgs,用於將所有報錯情形修改爲試圖顯示正常內容並附加預設不可見的錯誤報告。 | |||
]=] | ]=] | ||
require(' | require('strict'); | ||
local getArgs = require ('Module:Arguments').getArgs; | local getArgs = require ('Module:Arguments').getArgs; | ||
local unicode = require ("Module:Unicode data"); -- for | local unicode = require ("Module:Unicode data"); -- for is_Latin() and is_rtl() | ||
local yesno = require ('Module:Yesno'); | local yesno = require ('Module:Yesno'); | ||
local lang_data = mw.loadData ('Module:Lang/data'); | local sandbox = (mw.getCurrentFrame():getTitle():match ('/sandbox') or ''); -- when called from a sandbox template or module load sandbox data and sandbox configuration | ||
local lang_data = mw.loadData ('Module:Lang/data' .. sandbox); -- language name override and transliteration tool-tip tables | |||
local lang_name_table = lang_data.lang_name_table; -- language codes, names, regions, scripts, suppressed scripts | local lang_name_table = lang_data.lang_name_table; -- language codes, names, regions, scripts, suppressed scripts | ||
local lang_table = lang_data.lang_name_table.lang; | local lang_table = lang_data.lang_name_table.lang; | ||
| 第22行: | 第26行: | ||
local synonym_table = mw.loadData ('Module:Lang/ISO 639 synonyms'); -- ISO 639-2/639-2T code translation to 639-1 code | local synonym_table = mw.loadData ('Module:Lang/ISO 639 synonyms'); -- ISO 639-2/639-2T code translation to 639-1 code | ||
local cfg = mw.loadData ('Module:Lang/configuration' .. sandbox); -- for internationalization | |||
local is_latn_data = mw.loadData ('Module:Lang/data/is latn data'); | |||
local sizeof_ranges_t = is_latn_data.sizeof_ranges_t; | |||
local namespace = mw.title.getCurrentTitle().namespace; -- used for categorization | local namespace = mw.title.getCurrentTitle().namespace; -- used for categorization | ||
local | local content_lang = mw.language.getContentLanguage(); | ||
local this_wiki_lang_tag = content_lang.code; -- get this wiki's language tag | |||
local this_wiki_lang_dir = content_lang:getDir(); -- get this wiki's language direction | |||
local initial_style_state; -- set by lang_xx_normal() and lang_xx_italic() | local initial_style_state; -- set by lang_xx_normal() and lang_xx_italic() | ||
| 第31行: | 第42行: | ||
local maint_cats = {}; -- maintenance categories go here | local maint_cats = {}; -- maintenance categories go here | ||
local maint_msgs = {}; -- and their messages go here | local maint_msgs = {}; -- and their messages go here | ||
local error_msgs = {} | |||
--[[--------------------------< M A K E _ E R R O R _ S P A N >-------------------------------------------------- | |||
]] | |||
-- Builds a visible error <span> for <template>.
-- The pieces are joined in this order: opening tag, the localized 'error' label
-- from cfg.misc_text_t.error, a full-width colon, <template>, <msg>, closing tag.
-- @param template  text placed right after the colon (callers pass the template name)
-- @param msg       message text appended directly after <template>
-- @return the assembled HTML string
local function make_error_span (template, msg)
	local pieces_t = {
		'<span class="error" style="font-size: 1em;">',
		cfg.misc_text_t.error,
		':',
		template,
		msg,
		'</span>',
	};
	return table.concat (pieces_t);
end
-- Wraps <msg> in a <span> carrying the 'lang-comment lang-comment-error' classes.
-- The inline style sets display: none, so the span is hidden unless other CSS
-- overrides it.
-- @param msg  text to place inside the span
-- @return the assembled HTML string
local function make_lang_error_span (msg)
	local open_tag = '<span class="lang-comment lang-comment-error" style="font-style: normal; display: none; margin-left: 0.3em; color: #33aa33;">';
	local close_tag = '</span>';
	return table.concat ({open_tag, msg, close_tag});
end
--[[--------------------------< S U B S T I T U T E >---------------------------------------------------------- | |||
Substitutes $1, $2, etc in <message> with data from <data_t>. Returns plain-text substituted string when | |||
<data_t> not nil; returns <message> else. | |||
]] | |||
-- Fills the $1, $2, ... placeholders in <message> with the values in <data_t>.
-- @param message  message text that may contain $n placeholders
-- @param data_t   sequence of replacement values; may be nil
-- @return the plain-text substituted string when <data_t> is given;
--         <message> unchanged when <data_t> is nil (or false)
local function substitute (message, data_t)
	if not data_t then
		return message;											-- nothing to substitute
	end
	local raw_message = mw.message.newRawMessage (message, data_t);
	return (raw_message:plain());								-- parentheses keep this to a single return value
end
--[[--------------------------< M A K E _ E R R O R _ M S G >-------------------------------------------------- | |||
Assembles an error message from template name, message text, help link, and error category. | |||
]] | |||
-- Assembles an error report, appends it to the module-level error_msgs list,
-- and returns that same report.
-- The report consists of the template's text wrapped in -{[ ... ]}-, an error
-- <span> holding the localized 'error' label, the template name, <msg>, and a
-- help link to the error category, and finally an optional category link.
-- @param msg       error message text
-- @param args_t    template arguments; reads .text, [1] or [2], and .nocat
-- @param template  template name, compared against the names in cfg.templates_t
-- @return the assembled report string (also stored as the last item of error_msgs)
local function make_error_msg (msg, args_t, template)
	-- {{lang-xx}} carries its text in the first positional parameter;
	-- {{lang}}, {{langx}}, and {{transliteration}} carry it in the second
	local text_position = (cfg.templates_t.langxx == template) and 1 or 2;
	local text = args_t.text or args_t[text_position];

	local category;
	if cfg.templates_t.transliteration ~= template then
		category = cfg.make_error_msg_t.lang_err_cat;
	else
		category = cfg.make_error_msg_t.xlit_err_cat;
	end

	-- categorize only in namespaces 0 and 10, and only when |nocat= is not set
	local category_link = '';
	if (0 == namespace or 10 == namespace) and not args_t.nocat then
		category_link = substitute ('[[Category:$1]]', {category});
	end

	text = text or cfg.make_error_msg_t.undefined;				-- text parameter missing
	if text == '' then
		text = cfg.make_error_msg_t.empty;						-- text parameter present but empty
	end

	-- The original comment says the braces around $3 are written so that, in
	-- certain situations, the template name is not expanded as a template.
	-- NOTE(review): that comment reads "{{$3}} = {{$3}}", which suggests the braces
	-- were once HTML numeric entities; confirm against the live module.
	local report = substitute ('-{[$1]}-<span class="error" style="font-size: 1em; margin-left: 0.3em;">$2:{{$3}}:$4([[:Category:$5|$6]])</span>$7',
		{
		text,
		cfg.misc_text_t.error,
		template,
		msg,
		category,
		cfg.misc_text_t.help,
		category_link
		});

	error_msgs[#error_msgs + 1] = report;
	return report;
end
--[[--------------------------< P A R A M E T E R _ V A L I D A T E >------------------------------------------ | |||
]] | |||
-- Checks every parameter name in <args_t> against the parameters known for
-- <template> and reports the ones that are not recognized.
-- Known-parameter tables consulted, all from cfg.known_params_t:
--	{{lang}}:		params_lang_t, common_params_all_t
--	{{langx}}:		params_langx_t, params_x_t, common_params_all_t
--	{{lang-xx}}:	params_lang_xx_t, params_x_t, common_params_all_t
-- @param args_t    template arguments; only the keys are inspected
-- @param template  template name, compared against cfg.templates_t.lang, .langx, .langxx
-- @return one message per unknown parameter, joined with '、'; returns nothing when
--         every parameter is known or <template> is none of the three names above
local function parameter_validate (args_t, template)
	local err_msg = cfg.parameter_validate_t.invalid_param;
	local is_known;												-- predicate: is <param> supported by <template>?

	if cfg.templates_t.lang == template then					-- for {{lang}}
		is_known = function (param)
			return cfg.known_params_t.params_lang_t[param] or	-- unique {{lang}} parameters
				cfg.known_params_t.common_params_all_t[param];	-- common to all
		end
	elseif cfg.templates_t.langx == template then				-- for {{langx}}
		is_known = function (param)
			return cfg.known_params_t.params_langx_t[param] or	-- unique {{langx}} parameters
				cfg.known_params_t.params_x_t[param] or			-- common to {{langx}} and {{lang-xx}}
				cfg.known_params_t.common_params_all_t[param];	-- common to all
		end
	elseif cfg.templates_t.langxx == template then				-- for {{lang-xx}}
		is_known = function (param)
			return cfg.known_params_t.params_lang_xx_t[param] or	-- unique {{lang-xx}} parameters
				cfg.known_params_t.params_x_t[param] or			-- common to {{langx}} and {{lang-xx}}
				cfg.known_params_t.common_params_all_t[param];	-- common to all
		end
	else
		return;													-- not a template that is validated here
	end

	local unknown_t = {};										-- one message per unknown parameter
	for param in pairs (args_t) do
		if not is_known (param) then
			unknown_t[#unknown_t + 1] = substitute (err_msg, {param});
		end
	end

	if unknown_t[1] then
		return table.concat (unknown_t, '、');
	end
end
--[[--------------------------< I S _ S E T >------------------------------------------------------------------ | --[[--------------------------< I S _ S E T >------------------------------------------------------------------ | ||
Returns true if argument is set; false otherwise. Argument is 'set' when it exists (not nil) and when it is not an empty string. | Returns true if argument is set; false otherwise. Argument is 'set' when it exists (not nil) and when it is not | ||
an empty string. | |||
]] | ]] | ||
-- Reports whether <var> holds a usable value.
-- @param var  any value
-- @return true when <var> is neither nil nor the empty string; false otherwise
local function is_set (var)
	return var ~= nil and var ~= '';
end
| 第48行: | 第172行: | ||
This function attempts to invert the italic markup of args.text by adding/removing leading/trailing italic markup | This function attempts to invert the italic markup of args.text by adding/removing leading/trailing italic markup | ||
in args.text. Like |italic=unset, |italic=invert disables automatic italic markup. Individual leading/trailing | in args.text. Like |italic=unset, |italic=invert disables automatic italic markup. Individual leading/trailing | ||
apostrophes are converted to their | apostrophes are converted to their HTML numeric entity equivalent so that the new italic markup doesn't become | ||
bold markup inadvertently. | bold markup inadvertently. | ||
| 第73行: | 第197行: | ||
seg[3] = source:match ('.+(%f[\']\'\'+)$') or ''; -- get trailing markup, if any; ignore single quote | seg[3] = source:match ('.+(%f[\']\'\'+)$') or ''; -- get trailing markup, if any; ignore single quote | ||
if '' ~= seg[1] and '' ~= seg[3] then -- extract the 'text' | if '' ~= seg[1] and '' ~= seg[3] then -- extract the 'text' | ||
seg[2] = source:match ('^\'\'+%f[^\'](.+)%f[\']\'\'+$') -- from between leading and trailing markup | seg[2] = source:match ('^\'\'+%f[^\'](.+)%f[\']\'\'+$') -- from between leading and trailing markup | ||
elseif '' ~= seg[1] then | elseif '' ~= seg[1] then | ||
| 第92行: | 第216行: | ||
--[[--------------------------< V A L I D A T E _ I T A L I C >------------------------------------------------ | --[[--------------------------< V A L I D A T E _ I T A L I C >------------------------------------------------ | ||
Validates |italic= or |italics= assigned values. | |||
When |italic= is set and has an | When |italic= is set and has an acceptable assigned value, return the matching CSS font-style property value or, | ||
for the special case 'default', return nil. | for the special case 'default', return nil. | ||
When |italic= is not set, or has an | When |italic= is not set, or has an unacceptable assigned value, return nil and a nil error message. | ||
When both |italic= and |italics= are set, returns nil and a 'conflicting' error message. | When both |italic= and |italics= are set, returns nil and a 'conflicting' error message. | ||
The return value nil causes the calling lang, lang_xx, or transl function to set args.italic according to the template's | The return value nil causes the calling lang, lang_xx, or transl function to set args.italic according to the template's | ||
defined default ('inherit' for {{lang}}, 'inherit' or 'italic' for {{lang- | defined default ('inherit' for {{lang}}, 'inherit' or 'italic' for {{lang-??}} depending on | ||
the individual template's requirements, 'italic' for {{ | the individual template's requirements, 'italic' for {{transliteration}}) or to the value appropriate to |script=, if set ({{lang}} | ||
and {{lang- | and {{lang-??}} only). | ||
Accepted values and the values that this function returns are: | Accepted values and the values that this function returns are: | ||
| 第117行: | 第241行: | ||
local function validate_italic (args) | local function validate_italic (args) | ||
local properties = {[ | local properties = {[cfg.keywords_t.affirmative] = 'italic', [cfg.keywords_t.negative] = 'normal', [cfg.keywords_t.unset] = 'inherit', [cfg.keywords_t.invert] = 'invert', [cfg.keywords_t.default] = nil}; | ||
local count = 0 | local count = 0 | ||
for _, arg in pairs {'italic', 'italics', 'i'} do | for _, arg in pairs {'italic', 'italics', 'i'} do | ||
| 第126行: | 第250行: | ||
end | end | ||
return properties[args.italic or args.italics or args.i], count > 1 and cfg.validate_italic_t.multi_italic or nil | |||
return properties[args.italic or args.italics or args.i], | |||
end | end | ||
| 第136行: | 第256行: | ||
--[=[--------------------------< V A L I D A T E _ C A T _ A R G S >---------------------------------------------------------- | --[=[--------------------------< V A L I D A T E _ C A T _ A R G S >---------------------------------------------------------- | ||
Default behavior of the {{lang}} and {{lang- | Default behavior of the {{lang}} and {{lang-??}} templates is to add categorization when the templates are used in main space. | ||
This default functionality may be suppressed by setting |nocat=yes or |cat=no. This function selects one of these two parameters | This default functionality may be suppressed by setting |nocat=yes or |cat=no. This function selects one of these two parameters | ||
to control categorization. | to control categorization. | ||
| 第157行: | 第277行: | ||
return; | return; | ||
end | end | ||
if false == yesno (args.cat) or true == yesno (args.nocat) then | if false == yesno (args.cat) or true == yesno (args.nocat) then | ||
args.nocat = true; -- set to true when args.nocat is affirmative; nil else (as if the parameter were not set in the template) | args.nocat = true; -- set to true when args.nocat is affirmative; nil else (as if the parameter were not set in the template) | ||
| 第168行: | 第288行: | ||
--[[--------------------------< I N _ A R R A Y >-------------------------------------------------------------- | --[[--------------------------< I N _ A R R A Y >-------------------------------------------------------------- | ||
Whether needle is in haystack | Whether needle is in haystack. | ||
]] | ]] | ||
local function in_array ( needle, haystack ) | local function in_array (needle, haystack) | ||
if needle == nil then | if needle == nil then | ||
return false; | return false; | ||
end | end | ||
for n,v in ipairs( haystack ) do | for n,v in ipairs (haystack) do | ||
if v == needle then | if v == needle then | ||
return n; | return n; | ||
| 第187行: | 第307行: | ||
--[[--------------------------< F O R M A T _ I E T F _ T A G >------------------------------------------------ | --[[--------------------------< F O R M A T _ I E T F _ T A G >------------------------------------------------ | ||
Prettify IETF tags to use recommended subtag formats: | |||
code: lower case | code: lower case | ||
script: sentence case | script: sentence case | ||
| 第193行: | 第313行: | ||
variant: lower case | variant: lower case | ||
private: lower case prefixed with -x- | private: lower case prefixed with -x- | ||
]] | ]] | ||
| 第202行: | 第322行: | ||
return table.concat ({code:lower(), 'x', private:lower()}, '-'); -- if private, all other tags ignored | return table.concat ({code:lower(), 'x', private:lower()}, '-'); -- if private, all other tags ignored | ||
end | end | ||
table.insert (out, code:lower()); | table.insert (out, code:lower()); | ||
if is_set (script) then | if is_set (script) then | ||
| 第212行: | 第332行: | ||
table.insert (out, region:upper()); | table.insert (out, region:upper()); | ||
end | end | ||
if is_set (variant) then | if is_set (variant) then | ||
table.insert (out, variant:lower()); | table.insert (out, variant:lower()); | ||
end | end | ||
return table.concat (out, '-'); | return table.concat (out, '-'); | ||
end | end | ||
| 第223行: | 第343行: | ||
--[[--------------------------< G E T _ I E T F _ P A R T S >-------------------------------------------------- | --[[--------------------------< G E T _ I E T F _ P A R T S >-------------------------------------------------- | ||
Extracts and returns IETF language tag parts: | |||
primary language subtag (required) - 2 or 3 character IANA language code | primary language subtag (required) - 2 or 3 character IANA language code | ||
script subtag - four character IANA script code | script subtag - four character IANA script code | ||
| 第235行: | 第355行: | ||
lang-region lang-region-variant | lang-region lang-region-variant | ||
lang-script-region lang-script-region-variant | lang-script-region lang-script-region-variant | ||
lang-x-private | lang-x-private | ||
each of lang, script, region, variant, and private, when used, must be valid | each of lang, script, region, variant, and private, when used, must be valid. | ||
Languages with both two- and three-character code synonyms are promoted to the two-character synonym because | Languages with both two- and three-character code synonyms are promoted to the two-character synonym because | ||
| 第243行: | 第363行: | ||
the synonymous three-character codes in the lang= attribute. | the synonymous three-character codes in the lang= attribute. | ||
For {{lang- | For {{lang-??}} templates, the parameters |script=, |region=, and |variant= are supported (not supported in {{lang}} | ||
because those parameters are superfluous to the IETF subtags in |code=) | because those parameters are superfluous to the IETF subtags in |code=). | ||
Returns six values; all lower case. Valid parts are returned as themselves; omitted parts are returned as empty strings, invalid | |||
parts are returned as nil; the sixth returned item is an error message (if an error detected) or nil. | parts are returned as nil; the sixth returned item is an error message (if an error detected) or nil. | ||
See http://www.rfc-editor.org/rfc/bcp/bcp47.txt section 2.1. | |||
]] | ]] | ||
local function get_ietf_parts (source, args_script, args_region, args_variant) | local function get_ietf_parts (source, args_script, args_region, args_variant) | ||
local code, script, region, variant, private; -- | local code, script, region, variant, private; -- IETF tag parts | ||
if not is_set (source) then | if not is_set (source) then | ||
return nil, nil, nil, nil, nil, | return nil, nil, nil, nil, nil, cfg.get_ietf_parts_t.missing_lang_tag; | ||
end | end | ||
local pattern = { -- table of tables holding | local override = { -- 簡寫轉換爲正確的語言標籤 | ||
['pinyin'] = 'zh-Latn-pinyin', -- 漢語拼音 | |||
['zhuyin'] = 'zh-Bopo', -- 注音符號 | |||
} | |||
source = override[source] or source | |||
local pattern = { -- table of tables holding acceptable IETF tag patterns and short names of the IETF part captured by the pattern | |||
{'^(%a%a%a?)%-(%a%a%a%a)%-(%a%a)%-(%d%d%d%d)$', 's', 'r', 'v'}, -- 1 - ll-Ssss-RR-variant (where variant is 4 digits) | {'^(%a%a%a?)%-(%a%a%a%a)%-(%a%a)%-(%d%d%d%d)$', 's', 'r', 'v'}, -- 1 - ll-Ssss-RR-variant (where variant is 4 digits) | ||
{'^(%a%a%a?)%-(%a%a%a%a)%-(%d%d%d)%-(%d%d%d%d)$', 's', 'r', 'v'}, -- 2 - ll-Ssss-DDD-variant (where region is 3 digits; variant is 4 digits) | {'^(%a%a%a?)%-(%a%a%a%a)%-(%d%d%d)%-(%d%d%d%d)$', 's', 'r', 'v'}, -- 2 - ll-Ssss-DDD-variant (where region is 3 digits; variant is 4 digits) | ||
{'^(%a%a%a?)%-(%a%a%a%a)%-(%a%a)%-(%w%w%w%w%w%w?%w?%w?)$', 's', 'r', 'v'}, -- 3 - ll-Ssss-RR-variant (where variant is 5-8 alnum characters) | {'^(%a%a%a?)%-(%a%a%a%a)%-(%a%a)%-(%w%w%w%w%w%w?%w?%w?)$', 's', 'r', 'v'}, -- 3 - ll-Ssss-RR-variant (where variant is 5-8 alnum characters) | ||
{'^(%a%a%a?)%-(%a%a%a%a)%-(%d%d%d)%-(%w%w%w%w%w%w?%w?%w?)$', 's', 'r', 'v'}, -- 4 - ll-Ssss-DDD-variant (where region is 3 digits; variant is 5-8 alnum characters) | {'^(%a%a%a?)%-(%a%a%a%a)%-(%d%d%d)%-(%w%w%w%w%w%w?%w?%w?)$', 's', 'r', 'v'}, -- 4 - ll-Ssss-DDD-variant (where region is 3 digits; variant is 5-8 alnum characters) | ||
{'^(%a%a%a?)%-(%a%a%a%a)%-(%d%d%d%d)$', 's', 'v'}, -- 5 - ll-Ssss-variant (where variant is 4 digits) | {'^(%a%a%a?)%-(%a%a%a%a)%-(%d%d%d%d)$', 's', 'v'}, -- 5 - ll-Ssss-variant (where variant is 4 digits) | ||
{'^(%a%a%a?)%-(%a%a%a%a)%-(%w%w%w%w%w%w?%w?%w?)$', 's', 'v'}, -- 6 - ll-Ssss-variant (where variant is 5-8 alnum characters) | {'^(%a%a%a?)%-(%a%a%a%a)%-(%w%w%w%w%w%w?%w?%w?)$', 's', 'v'}, -- 6 - ll-Ssss-variant (where variant is 5-8 alnum characters) | ||
{'^(%a%a%a?)%-(%a%a)%-(%d%d%d%d)$', 'r', 'v'}, -- 7 - ll-RR-variant (where variant is 4 digits) | {'^(%a%a%a?)%-(%a%a)%-(%d%d%d%d)$', 'r', 'v'}, -- 7 - ll-RR-variant (where variant is 4 digits) | ||
{'^(%a%a%a?)%-(%d%d%d)%-(%d%d%d%d)$', 'r', 'v'}, -- 8 - ll-DDD-variant (where region is 3 digits; variant is 4 digits) | {'^(%a%a%a?)%-(%d%d%d)%-(%d%d%d%d)$', 'r', 'v'}, -- 8 - ll-DDD-variant (where region is 3 digits; variant is 4 digits) | ||
{'^(%a%a%a?)%-(%a%a)%-(%w%w%w%w%w%w?%w?%w?)$', 'r', 'v'}, -- 9 - ll-RR-variant (where variant is 5-8 alnum characters) | {'^(%a%a%a?)%-(%a%a)%-(%w%w%w%w%w%w?%w?%w?)$', 'r', 'v'}, -- 9 - ll-RR-variant (where variant is 5-8 alnum characters) | ||
{'^(%a%a%a?)%-(%d%d%d)%-(%w%w%w%w%w%w?%w?%w?)$', 'r', 'v'}, -- 10 - ll-DDD-variant (where region is 3 digits; variant is 5-8 alnum characters) | {'^(%a%a%a?)%-(%d%d%d)%-(%w%w%w%w%w%w?%w?%w?)$', 'r', 'v'}, -- 10 - ll-DDD-variant (where region is 3 digits; variant is 5-8 alnum characters) | ||
{'^(%a%a%a?)%-(%d%d%d%d)$', 'v'}, -- 11 - ll-variant (where variant is 4 digits) | {'^(%a%a%a?)%-(%d%d%d%d)$', 'v'}, -- 11 - ll-variant (where variant is 4 digits) | ||
{'^(%a%a%a?)%-(%w%w%w%w%w%w?%w?%w?)$', 'v'}, -- 12 - ll-variant (where variant is 5-8 alnum characters) | {'^(%a%a%a?)%-(%w%w%w%w%w%w?%w?%w?)$', 'v'}, -- 12 - ll-variant (where variant is 5-8 alnum characters) | ||
{'^(%a%a%a?)%-(%a%a%a%a)%-(%a%a)$', 's', 'r'}, -- 13 - ll-Ssss-RR | {'^(%a%a%a?)%-(%a%a%a%a)%-(%a%a)$', 's', 'r'}, -- 13 - ll-Ssss-RR | ||
{'^(%a%a%a?)%-(%a%a%a%a)%-(%d%d%d)$', 's', 'r'}, -- 14 - ll-Ssss-DDD (region is 3 digits) | {'^(%a%a%a?)%-(%a%a%a%a)%-(%d%d%d)$', 's', 'r'}, -- 14 - ll-Ssss-DDD (region is 3 digits) | ||
{'^(%a%a%a?)%-(%a%a%a%a)$', 's'}, -- 15 - ll-Ssss | {'^(%a%a%a?)%-(%a%a%a%a)$', 's'}, -- 15 - ll-Ssss | ||
{'^(%a%a%a?)%-(%a%a)$', 'r'}, -- 16 - ll-RR | {'^(%a%a%a?)%-(%a%a)$', 'r'}, -- 16 - ll-RR | ||
{'^(%a%a%a?)%-(%d%d%d)$', 'r'}, -- 17 - ll-DDD (region is 3 digits) | {'^(%a%a%a?)%-(%d%d%d)$', 'r'}, -- 17 - ll-DDD (region is 3 digits) | ||
{'^(%a%a%a?)$'}, -- 18 - ll | {'^(%a%a%a?)$'}, -- 18 - ll | ||
{'^(%a%a%a?)%-x%-(%w%w?%w?%w?%w?%w?%w?%w?)$', 'p'}, -- 19 - ll-x-pppppppp (private is 1-8 alnum characters) | {'^(%a%a%a?)%-x%-(%w%w?%w?%w?%w?%w?%w?%w?)$', 'p'}, -- 19 - ll-x-pppppppp (private is 1-8 alnum characters) | ||
} | } | ||
local t = {}; -- table of captures; serves as a translator between captured | local t = {}; -- table of captures; serves as a translator between captured IETF tag parts and named variables | ||
for i, v in ipairs (pattern) do -- spin through the pattern table looking for a match | for i, v in ipairs (pattern) do -- spin through the pattern table looking for a match | ||
local c1, c2, c3, c4; -- captures in the 'pattern' from the pattern table go here | local c1, c2, c3, c4; -- captures in the 'pattern' from the pattern table go here | ||
c1, c2, c3, c4 = source:match (pattern[i][1]); -- one or more captures set if source matches pattern[i]) | c1, c2, c3, c4 = source:match (pattern[i][1]); -- one or more captures set if source matches pattern[i]) | ||
if c1 then -- c1 always set on match | if c1 then -- c1 always set on match | ||
| 第304行: | 第432行: | ||
}; | }; | ||
script = t.s or ''; -- translate table contents to named variables; | script = t.s or ''; -- translate table contents to named variables; | ||
region = t.r or ''; -- absent table entries are nil so set named | region = t.r or ''; -- absent table entries are nil so set named IETF parts to empty string for concatenation | ||
variant= t.v or ''; | variant= t.v or ''; | ||
private = t.p or ''; | private = t.p or ''; | ||
| 第312行: | 第440行: | ||
if not code then | if not code then | ||
return nil, nil, nil, nil, nil, | return nil, nil, nil, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_tag, {source}); -- don't know what we got but it is malformed | ||
end | end | ||
code = code:lower(); -- ensure that we use and return lower case version of this | code = code:lower(); -- ensure that we use and return lower case version of this | ||
if not (override_table[code] or lang_table[code] or synonym_table[code] or lang_dep_table[code]) then | if not (override_table[code] or lang_table[code] or synonym_table[code] or lang_dep_table[code]) then | ||
return nil, nil, nil, nil, nil, | return nil, nil, nil, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_code, {code}); -- invalid language code, don't know about the others (don't care?) | ||
end | end | ||
if synonym_table[code] then -- if 639-2/639-2T code has a 639-1 synonym | if synonym_table[code] then -- if 639-2/639-2T code has a 639-1 synonym | ||
table.insert (maint_cats, | table.insert (maint_cats, substitute (cfg.get_ietf_parts_t.maint_promo_cat, {code})); | ||
table.insert (maint_msgs, | table.insert (maint_msgs, substitute (cfg.get_ietf_parts_t.maint_promo_msg, {code, synonym_table[code]})); | ||
code = synonym_table[code]; -- use the synonym | code = synonym_table[code]; -- use the synonym | ||
end | end | ||
| 第329行: | 第457行: | ||
if is_set (script) then | if is_set (script) then | ||
if is_set (args_script) then | if is_set (args_script) then | ||
return code, nil, nil, nil, nil, | return code, nil, nil, nil, nil, cfg.get_ietf_parts_t.redundant_scr; -- both code with script and |script= not allowed | ||
end | end | ||
else | else | ||
script = args_script or ''; -- use args.script if provided | script = args_script or ''; -- use args.script if provided | ||
end | end | ||
if is_set (script) then | if is_set (script) then | ||
script = script:lower(); -- ensure that we use and return lower case version of this | script = script:lower(); -- ensure that we use and return lower case version of this | ||
if not script_table[script] then | if not script_table[script] then | ||
return code, nil, nil, nil, nil, | return code, nil, nil, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_scr_code, {script, code}); -- language code OK, invalid script, don't know about the others (don't care?) | ||
end | end | ||
end | end | ||
if suppressed_table[script] then -- ensure that code-script does not use a suppressed script | if suppressed_table[script] then -- ensure that code-script does not use a suppressed script | ||
if in_array (code, suppressed_table[script]) then | if in_array (code, suppressed_table[script]) then | ||
return code, nil, nil, nil, nil, | return code, nil, nil, nil, nil, substitute (cfg.get_ietf_parts_t.script_code, {script, code}); -- language code OK, script is suppressed for this code | ||
end | end | ||
end | end | ||
| 第349行: | 第477行: | ||
if is_set (region) then | if is_set (region) then | ||
if is_set (args_region) then | if is_set (args_region) then | ||
return code, nil, nil, nil, nil, | return code, nil, nil, nil, nil, cfg.get_ietf_parts_t.redundant_reg; -- both code with region and |region= not allowed | ||
end | end | ||
else | else | ||
region = args_region or ''; -- use args.region if provided | region = args_region or ''; -- use args.region if provided | ||
end | end | ||
if is_set (region) then | if is_set (region) then | ||
region = region:lower(); -- ensure that we use and return lower case version of this | region = region:lower(); -- ensure that we use and return lower case version of this | ||
if not region_table[region] then | if not region_table[region] then | ||
return code, script, nil, nil, nil, | return code, script, nil, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_reg_code, {region, code}); | ||
end | end | ||
end | end | ||
if is_set (variant) then | if is_set (variant) then | ||
if is_set (args_variant) then | if is_set (args_variant) then | ||
return code, nil, nil, nil, nil, | return code, nil, nil, nil, nil, cfg.get_ietf_parts_t.redundant_var; -- both code with variant and |variant= not allowed | ||
end | end | ||
else | else | ||
variant = args_variant or ''; -- use args.variant if provided | variant = args_variant or ''; -- use args.variant if provided | ||
end | end | ||
if is_set (variant) then | if is_set (variant) then | ||
variant = variant:lower(); -- ensure that we use and return lower case version of this | variant = variant:lower(); -- ensure that we use and return lower case version of this | ||
if not variant_table[variant] then -- make sure variant is valid | if not variant_table[variant] then -- make sure variant is valid | ||
return code, script, region, nil, nil, | return code, script, region, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_var, {variant}); | ||
end -- does this duplicate/replace tests in lang() and lang_xx()? | end -- does this duplicate/replace tests in lang() and lang_xx()? | ||
if is_set (script) then -- if script set it must be part of the 'prefix' | if is_set (script) then -- if script set it must be part of the 'prefix' | ||
if not in_array (table.concat ({code, '-', script}), variant_table[variant]['prefixes']) then | if not in_array (table.concat ({code, '-', script}), variant_table[variant]['prefixes']) then | ||
return code, script, region, nil, nil, | return code, script, region, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_var_code_scr, {variant, code, script}); | ||
end | end | ||
elseif is_set (region) then -- if region set, there are some prefixes that require lang code and region (en-CA-newfound) | elseif is_set (region) then -- if region set, there are some prefixes that require lang code and region (en-CA-newfound) | ||
if not in_array (code, variant_table[variant]['prefixes']) then -- first see if lang code is all that's required (en-oxendict though en-GB-oxendict is preferred) | if not in_array (code, variant_table[variant]['prefixes']) then -- first see if lang code is all that's required (en-oxendict though en-GB-oxendict is preferred) | ||
if not in_array (table.concat ({code, '-', region}), variant_table[variant]['prefixes']) then | if not in_array (table.concat ({code, '-', region}), variant_table[variant]['prefixes']) then -- now try for lang code and region (en-CA-newfound) | ||
return code, script, region, nil, nil, | return code, script, region, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_var_code_reg, {variant, code, region}); | ||
end | end | ||
end | end | ||
else | else -- cheap way to determine if there are prefixes; fonipa and others don't have prefixes; # operator always returns 0 | ||
if not in_array (code, variant_table[variant]['prefixes']) then | if variant_table[variant]['prefixes'][1] and not in_array (code, variant_table[variant]['prefixes']) then | ||
return code, script, region, nil, nil, | return code, script, region, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_var_code, {variant, code}); | ||
end | end | ||
end | end | ||
end | end | ||
if is_set (private) then | if is_set (private) then | ||
private = private:lower(); -- ensure that we use and return lower case version of this | private = private:lower(); -- ensure that we use and return lower case version of this | ||
if not override_table[table.concat ({code, '-x-', private})] then -- make sure private tag is valid; note that index | if not override_table[table.concat ({code, '-x-', private})] then -- make sure private tag is valid; note that index | ||
return code, script, region, nil, nil, | return code, script, region, nil, nil, substitute (cfg.get_ietf_parts_t.unrecog_pri, {private}); | ||
end | end | ||
end | end | ||
| 第401行: | 第529行: | ||
end | end | ||
--[=[-------------------------< M A K E _ W I K I L I N K >---------------------------------------------------- | --[=[-------------------------< M A K E _ W I K I L I N K >---------------------------------------------------- | ||
| 第455行: | 第553行: | ||
--[[--------------------------< D I V _ M A R K U P _ A D D >-------------------------------------------------- | --[[--------------------------< D I V _ M A R K U P _ A D D >-------------------------------------------------- | ||
Adds <i> and </i> tags to list-item text or to implied <p>..</p> text. Mixed not supported. | |||
]] | ]] | ||
local function div_markup_add (text, style) | local function div_markup_add (text, style) | ||
if text:find ('^\n[%*:;#]') then -- look for list markup; list markup must begin at start of text | if text:find ('^\n[%*:;#]') then -- look for list markup; list markup must begin at start of text | ||
if 'italic' == style then | if 'italic' == style then | ||
return | return text:gsub ('(\n[%*:;#]+)([^\n]+)', '%1<i>%2</i>'); -- insert italic markup at each list item | ||
else | else | ||
return text; | return text; | ||
| 第471行: | 第567行: | ||
if text:find ('\n+') then -- look for any number of \n characters in text | if text:find ('\n+') then -- look for any number of \n characters in text | ||
text = text:gsub ('([^\n])\n([^\n])', '%1 %2'); -- replace single newline characters with a space character which mimics | text = text:gsub ('([^\n])\n([^\n])', '%1 %2'); -- replace single newline characters with a space character which mimics MediaWiki | ||
if 'italic' == style then | if 'italic' == style then | ||
text = text:gsub('[^\n]+', '<p><i>%1</i></p>'); -- insert p and italic markup tags at each | text = text:gsub('[^\n]+', '<p><i>%1</i></p>'); -- insert p and italic markup tags at each implied p (two or more consecutive '\n\n' sequences) | ||
else | else | ||
text = text:gsub ('[^\n]+', '<p>%1</p>'); -- insert p markup at each | text = text:gsub ('[^\n]+', '<p>%1</p>'); -- insert p markup at each implied p | ||
text = text:gsub ('\n', ''); -- strip newline characters | text = text:gsub ('\n', ''); -- strip newline characters | ||
end | end | ||
| 第482行: | 第578行: | ||
return text; | return text; | ||
end | |||
--[[--------------------------< T I T L E _ W R A P P E R _ M A K E >------------------------------------------

Wraps <content_text> in a tool-tip element:
	<tag title="<title_text>"><content_text></tag>

<title_text> is the tool-tip, written in the wiki's local language; <content_text> is non-local-language text
that is already in HTML markup.  A separate wrapper is used because a lang= attribute applies to the whole
content of the tag that carries it, so the local-language tool-tip must not sit on the same tag as the
foreign-language lang= attribute.

<tag> is the string 'div' or 'span' and selects the wrapping element.

]]

local function title_wrapper_make (title_text, content_text, tag)
	return table.concat ({
		'<', tag, ' title="', title_text, '">',									-- opening wrapper tag with its title attribute
		content_text,															-- the wrapped content
		'</', tag, '>',															-- closing wrapper tag
		});
end
| 第487行: | 第607行: | ||
--[[--------------------------< M A K E _ T E X T _ H T M L >-------------------------------------------------- | --[[--------------------------< M A K E _ T E X T _ H T M L >-------------------------------------------------- | ||
Add the | Add the HTML markup to text according to the type of content that it is: <span> or <i> tags for inline content or | ||
<div> tags for block content | <div> tags for block content | ||
The lang= attribute also applies to the content of the tag where it is placed so this is wrong because 'Spanish | |||
language text' is English: | |||
<i lang="es" title="Spanish language text">casa</i> | |||
should be: | |||
<span title="Spanish language text"><i lang="es">casa</i></span> | |||
or for <div>...</div>: | |||
<div title="Spanish language text"><div lang="es"><spanish-language-text></div></div> | |||
]] | ]] | ||
local function make_text_html (code, text, tag, rtl, style, size, language) | local function make_text_html (code, text, tag, rtl, style, size, language) | ||
local | local html_t = {}; | ||
local style_added = ''; | local style_added = ''; | ||
local wrapper_tag = tag; -- <tag> gets modified so save a copy for use when/if we create a wrapper span or div | |||
if text:match ('^%*') then | if text:match ('^%*') then | ||
table.insert ( | table.insert (html_t, '*'); -- move proto language text prefix outside of italic markup if any; use numeric entity because plain splat confuses MediaWiki | ||
text = text:gsub ('^%*', ''); -- remove the splat from the text | text = text:gsub ('^%*', ''); -- remove the splat from the text | ||
end | end | ||
if 'span' == tag then -- default | if 'span' == tag then -- default HTML tag for inline content | ||
if 'italic' == style then -- but if italic | if 'italic' == style then -- but if italic | ||
tag = 'i'; -- change to <i> tags | tag = 'i'; -- change to <i> tags | ||
| 第509行: | 第638行: | ||
end | end | ||
table.insert ( | table.insert (html_t, table.concat ({'<', tag})); -- open the <i>, <span>, or <div> HTML tag | ||
table.insert ( | code = code:gsub ('%-x%-.*', ''); -- strip private use subtag from code tag because meaningless outside of Wikipedia | ||
table.insert (html_t, table.concat ({' lang="', code, '\"'})); -- add language attribute | |||
if rtl or unicode.is_rtl(text) then | if (rtl or unicode.is_rtl(text)) and ('ltr' == this_wiki_lang_dir) then -- text is right-to-left on a left-to-right wiki | ||
table.insert ( | table.insert (html_t, ' dir="rtl"'); -- add direction attribute for right-to-left languages | ||
elseif not (rtl or unicode.is_rtl(text)) and ('rtl' == this_wiki_lang_dir) then -- text is left-to-right on a right-to-left wiki | |||
table.insert (html_t, ' dir="ltr"'); -- add direction attribute for left-to-right languages | |||
end | end | ||
if 'normal' == style then -- when |italic=no | if 'normal' == style then -- when |italic=no | ||
table.insert ( | table.insert (html_t, ' style=\"font-style: normal;'); -- override external markup, if any | ||
style_added = '\"'; -- remember that style attribute added and is not yet closed | style_added = '\"'; -- remember that style attribute added and is not yet closed | ||
end | end | ||
| 第523行: | 第655行: | ||
if is_set (size) then -- when |size=<something> | if is_set (size) then -- when |size=<something> | ||
if is_set (style_added) then | if is_set (style_added) then | ||
table.insert ( | table.insert (html_t, table.concat ({' font-size: ', size, ';'})); -- add when style attribute already inserted | ||
else | else | ||
table.insert ( | table.insert (html_t, table.concat ({' style=\"font-size: ', size, ';'})); -- create style attribute | ||
style_added = '\"'; -- remember that style attribute added and is not yet closed | style_added = '\"'; -- remember that style attribute added and is not yet closed | ||
end | end | ||
end | end | ||
table.insert (html_t, table.concat ({style_added, '>'})); -- close the opening HTML tag | |||
table.insert (html_t, text); -- insert the text | |||
table.insert (html_t, table.concat ({'</', tag, '>'})); -- close the 'text' <i>, <span>, or <div> HTML tag | |||
if is_set (language) then -- create a <title_text> string for the title= attribute in a wrapper span or div | |||
local title_text; | |||
table. | if 'zxx' == code then -- special case for this tag 'no linguistic content' | ||
title_text = substitute ('$1$2', {language, cfg.make_text_html_t.zxx}); -- not a language so don't use 'language' in title text | |||
elseif mw.ustring.find (language, '语系', 1, true) then | |||
title_text = substitute ('$1$2', {language, cfg.make_text_html_t.collective}); -- for collective languages | |||
else | |||
title_text = substitute ('$1$2', {language, cfg.make_text_html_t.individual}); -- for individual languages | |||
end | |||
return title_wrapper_make (title_text, table.concat (html_t), wrapper_tag); | |||
else | else | ||
return table.concat (html_t); | |||
end | end | ||
end | |||
-- zh.wiki addition: Lua counterpart of the {{#ifexist:}} parser function.
-- Returns the title object's .exists value for the page named <title>.  Returns false when mw.title.new()
-- yields no title object, or when it raises an error (the error is trapped by pcall and discarded).
local function page_exists (title)
	local ok, title_obj = pcall (mw.title.new, title);
	if ok and title_obj then
		return title_obj.exists;
	end
	return false;
end
--[=[-------------------------< M A K E _ C A T E G O R Y >----------------------------------------------------

Returns a category wikilink for text in <language_name>, or an empty string when categorization is suppressed.

Upstream (en.wiki) categories, listed for reference only:
	individual language:	[[Category:Articles containing <language>-language text]]
	English:				[[Category:Articles containing explicitly cited English-language text]]
	collective languages:	[[Category:Articles with text in <language> languages]]

NOTE: zh.wiki differs from upstream.  Category names are assembled from cfg.make_category_t:

	local language (<code> equals this wiki's language tag) and <language_name> is exactly '中文', i.e.
	[[Module:Lang/data]] defines no variant name for the tag:
		[[<cat_prefix><explicit_cat><language_name><cat_postfix>]]	(e.g. [[Category:含有明确引用中文的条目]])

	any other name (including Chinese variant names), when the category page for that name exists:
		[[<cat_prefix><language_name><cat_postfix>]]				(e.g. [[Category:含有<语言>的条目]])

	otherwise the catch-all category for non-Chinese content:
		[[<cat_prefix><cat_nonezh><cat_postfix>]]					(e.g. [[Category:含有非中文内容的条目]])

The upstream collective-language category is not used on zh.wiki.

An empty string is returned outside of article space or when <nocat> is set, unless <name_get> is set, in which
case the category is always returned.

]=]

local function make_category (code, language_name, nocat, name_get)
	local suppressed = (0 ~= namespace) or nocat;								-- only categorize in article space and only when not inhibited
	if suppressed and not name_get then
		return '';																-- empty string for concatenation
	end

	local cat_t = cfg.make_category_t;

	if (this_wiki_lang_tag == code) and ('中文' == language_name) then			-- the name must be exactly '中文'
		return substitute ('[[$1$2$3$4]]', {									-- unique category name for the local language
			cat_t.cat_prefix,
			cat_t.explicit_cat,
			language_name,
			cat_t.cat_postfix,
			});
	end

	local language_cat = substitute ('$1$2$3', {								-- title of the per-language category page
		cat_t.cat_prefix,
		language_name,
		cat_t.cat_postfix,
		});

	if page_exists (language_cat) then
		return substitute ('[[$1$2$3]]', {										-- category for individual languages
			cat_t.cat_prefix,
			language_name,
			cat_t.cat_postfix,
			});
	end

	return substitute ('[[$1$2$3]]', {											-- catch-all: non-Chinese content
		cat_t.cat_prefix,
		cat_t.cat_nonezh,
		cat_t.cat_postfix,
		});
end
| 第601行: | 第768行: | ||
--[[--------------------------< M A K E _ T R A N S L I T >---------------------------------------------------- | --[[--------------------------< M A K E _ T R A N S L I T >---------------------------------------------------- | ||
Return translit <i lang=xx-Latn>...</i> where xx is the language code; else return empty string. | |||
The value |script= is not used in {{ | The value |script= is not used in {{transliteration}} for this purpose; instead it uses |code. Because language scripts | ||
are listed in the {{ | are listed in the {{transliteration}} switches they are included in the data tables. The script parameter is introduced | ||
at {{Language with name and transliteration}}. If |script= is set, this function uses it in preference to code. | at {{Language with name and transliteration}}. If |script= is set, this function uses it in preference to code. | ||
To avoid confusion, in this module and the templates that use it, the transliteration script parameter is renamed | To avoid confusion, in this module and the templates that use it, the transliteration script parameter is renamed | ||
to be |translit-script= (in this function, tscript) | to be |translit-script= (in this function, tscript). | ||
This function is used by both lang_xx() and transl() | This function is used by both lang_xx() and transl() | ||
| 第614行: | 第781行: | ||
transl() always provides language_name, translit, and one of code or tscript, never both; always provides style | transl() always provides language_name, translit, and one of code or tscript, never both; always provides style | ||
For {{ | For {{transliteration}}, style only applies when a language code is provided. | ||
]] | ]] | ||
local function make_translit (code, language_name, translit, std, tscript, style)
	-- Renders <translit> inside a <span>: with lang="<code>-Latn" when <code> is set (plus an inline font-style
	-- when <style> is given), or a bare <span> when it is not.  When tool-tip text can be assembled from <std>,
	-- <tscript>, <code>, and <language_name>, the result is wrapped in a tool-tip span.  When <std> is set but
	-- is not a key in the standards table, <translit> is returned without any markup.
	local standards_t = lang_data.translit_title_table;						-- transliteration standards and the language codes and scripts that apply to them
	local tooltip = '';															-- tool tip text for the title= attribute

	std = std and std:lower();													-- lower case for table indexing
	local have_std = is_set (std);
	local have_tscript = is_set (tscript);

	if have_std then
		local std_t = standards_t[std];
		if not std_t then														-- unknown standard: hand back the bare transliteration
			return translit;
		end

		if have_tscript then													-- standard and script both specified
			if std_t[tscript] and script_table[tscript] then					-- script is known to this standard and has a name
				tooltip = substitute ('$1$2($3)$4', {
					tooltip,
					std_t[tscript:lower()],
					script_table[tscript],
					cfg.make_translit_t.transliteration,
					});
			else
				tooltip = tooltip .. std_t['default'];							-- script not usable with this standard so use the standard's default
			end
		elseif std_t[code] then													-- standard only; language code is in the table ({{transliteration}} may not provide a code)
			tooltip = substitute ('$1$2($3)$4', {
				tooltip,
				std_t[code:lower()],
				language_name,
				cfg.make_translit_t.transliteration,
				});
		else
			tooltip = tooltip .. std_t['default'];								-- code doesn't match so use the standard's default
		end

	elseif have_tscript then													-- script specified without a standard
		local no_std_t = standards_t['no_std'];
		if no_std_t[tscript] then
			tooltip = tooltip .. no_std_t[tscript];								-- prefer the script's entry
		elseif no_std_t[code] then
			tooltip = tooltip .. no_std_t[code];								-- then the language code's entry
		else
			tooltip = substitute ('$1$2-$3$4', {								-- neither listed: write a script tool tip
				tooltip,
				language_name,
				cfg.make_translit_t.script,
				cfg.make_translit_t.transliteration,
				});
		end
		-- the original also carried a 'generic tool tip' fallback for an unset <tscript> here; <tscript> is
		-- always set on this path so that fallback could not be reached.  The en.wiki code-only '-language'
		-- tool tip is not used on zh.wiki.

	else																		-- neither standard nor script specified
		tooltip = substitute ('$1$2', {language_name, cfg.lang_xx_t.romanization});	-- zh.wiki addition: generic '<language name><romanization>' tool tip; en.wiki's '-language' suffix and engvar spelling are not used
	end

	local html;
	if is_set (code) then														-- language code provided (always with {{lang-??}} templates, not always with {{transliteration}})
		code = code:match ('^(%a%a%a?)');										-- strip all subtags leaving only the language subtag
		if style then															-- non-standard style: carry it as an inline font-style
			html = string.format ('<span style="font-style: %s" lang="%s-Latn">%s</span>', style, code, translit);
		else																	-- zh.wiki does not italicize by default
			html = string.format ('<span lang="%s-Latn">%s</span>', code, translit);
		end
	else
		html = string.format ('<span>%s</span>', translit);						-- no language code: no lang= attribute, not italic ({{transliteration}} only)
	end

	if '' == tooltip then														-- no tool tip needed
		return html;
	end
	return title_wrapper_make (tooltip, html, 'span');							-- wrap with a tool-tip span; zh.wiki applies no engvar respelling
end
| 第695行: | 第898行: | ||
This function checks the content of args.text and returns empty string if nothing is amiss else it returns an | This function checks the content of args.text and returns empty string if nothing is amiss else it returns an | ||
error message. | error message. The tests are for empty or missing text and for improper or disallowed use of apostrophe markup. | ||
Italic rendering is controlled by the |italic= template parameter so italic markup should never appear in args.text | Italic rendering is controlled by the |italic= template parameter so italic markup should never appear in args.text | ||
| 第704行: | 第907行: | ||
local function validate_text (template, args) | local function validate_text (template, args) | ||
if not is_set (args.text) then | if not is_set (args.text) then | ||
make_error_msg (cfg.validate_text_t.no_text, args, template) | |||
args.text = '' | |||
return | |||
end | end | ||
if args.text:find ("%f[\']\'\'\'\'%f[^\']") or args.text:find ("\'\'\'\'\'[\']+") then -- because we're looking, look for 4 appostrophes or 6+ appostrophes | if args.text:find ("%f[\']\'\'\'\'%f[^\']") or args.text:find ("\'\'\'\'\'[\']+") then -- because we're looking, look for 4 appostrophes or 6+ appostrophes | ||
make_error_msg (cfg.validate_text_t.malformed_markup, args, template) | |||
return | |||
end | end | ||
local style = args.italic; | local style = args.italic or args.italics or args.i; | ||
if ( | -- 中文版修改:|italic=no 和未指定 |italic= 時不檢查斜體標記 | ||
if style and (cfg.keywords_t.unset ~= style) and (cfg.keywords_t.negative ~= style) and (cfg.keywords_t.invert ~= style) then | |||
if args.text:find ("%f[\']\'\'%f[^\']") or args.text:find ("%f[\']\'\'\'\'\'%f[^\']") then -- italic but not bold, or bold italic | if args.text:find ("%f[\']\'\'%f[^\']") or args.text:find ("%f[\']\'\'\'\'\'%f[^\']") then -- italic but not bold, or bold italic | ||
make_error_msg (cfg.validate_text_t.italic_markup, args, template) | |||
return | |||
end | end | ||
end | end | ||
| 第723行: | 第931行: | ||
--[[--------------------------< R E N D E R _ M A I N T >------------------------------------------------------ | --[[--------------------------< R E N D E R _ M A I N T >------------------------------------------------------ | ||
Render maintenance messages and categories. | |||
]] | ]] | ||
local function render_maint(nocat) | local function render_maint (nocat) | ||
local maint = {}; | local maint = {}; | ||
if 0 < #maint_msgs then -- when there are maintenance messages | if 0 < #maint_msgs then -- when there are maintenance messages | ||
table.insert (maint, table.concat ({'<span class="lang-comment" style="font-style: normal; display: none; color: #33aa33; margin-left: 0.3em;">'})); -- opening <span> tag | table.insert (maint, table.concat ({'<span class="lang-comment" style="font-style: normal; display: none; color: #33aa33; margin-left: 0.3em;">'})); -- opening <span> tag | ||
for _, msg in ipairs (maint_msgs) do | for _, msg in ipairs (maint_msgs) do | ||
table.insert (maint, table.concat ({msg, ' '})); | table.insert (maint, table.concat ({msg, ''})); -- add message strings | ||
end | end | ||
table.insert (maint, '</span>'); -- close the span | table.insert (maint, '</span>'); -- close the span | ||
end | end | ||
if (0 < #maint_cats) and (0 == namespace) and not nocat then -- when there are maintenance categories; article namespace only | if (0 < #maint_cats) and (0 == namespace) and not nocat then -- when there are maintenance categories; article namespace only | ||
for _, cat in ipairs (maint_cats) do | for _, cat in ipairs (maint_cats) do | ||
| 第743行: | 第951行: | ||
end | end | ||
end | end | ||
return table.concat (maint); | return table.concat (maint); | ||
end | end | ||
| 第750行: | 第958行: | ||
--[[--------------------------< P R O T O _ P R E F I X >------------------------------------------------------ | --[[--------------------------< P R O T O _ P R E F I X >------------------------------------------------------ | ||
For proto languages, text is prefixed with a splat. We do that here as a flag for make_text_html() so that a splat | |||
will be rendered outside of italic markup (if used). | will be rendered outside of italic markup (if used). If the first character in text here is already a splat, we | ||
do nothing | do nothing. | ||
proto_param is boolean or nil; true adds splat prefix regardless of language name; false removes and | proto_param is boolean or nil; true adds splat prefix regardless of language name; false removes and inhibits | ||
regardless of language name; nil does nothing; presumes that the value in text is correct but removes extra splac | regardless of language name; nil does nothing; presumes that the value in text is correct but removes extra splats. | ||
]] | ]] | ||
| 第762行: | 第970行: | ||
if false == proto_param then -- when forced by |proto=no | if false == proto_param then -- when forced by |proto=no | ||
return text:gsub ('^%**', ''); -- return text without splat prefix regardless of language name or existing splat prefix in text | return text:gsub ('^%**', ''); -- return text without splat prefix regardless of language name or existing splat prefix in text | ||
elseif (language_name:find ('^ | elseif (language_name:find ('^原始') or (true == proto_param)) then -- language is a proto or forced by |proto=yes | ||
return text:gsub ('^%**', '*'); -- prefix proto-language text with a splat; also removes duplicate prefixing splats | return text:gsub ('^%**', '*'); -- prefix proto-language text with a splat; also removes duplicate prefixing splats | ||
end | end | ||
return text:gsub ('^%*+', '*'); -- return text unmolested except multiple splats reduced to one splat | return text:gsub ('^%*+', '*'); -- return text unmolested except multiple splats reduced to one splat | ||
end | end | ||
| 第772行: | 第980行: | ||
--[[--------------------------< H A S _ P O E M _ T A G >------------------------------------------------------ | --[[--------------------------< H A S _ P O E M _ T A G >------------------------------------------------------ | ||
Looks for a poem strip marker in text; returns true when found; false else. | |||
Auto-italic detection disabled when text has poem stripmarker because it is not possible for this code to know | |||
the content that will replace the stripmarker. | the content that will replace the stripmarker. | ||
| 第786行: | 第994行: | ||
--[[--------------------------< H T M L _ T A G _ S E L E C T >------------------------------------------------ | --[[--------------------------< H T M L _ T A G _ S E L E C T >------------------------------------------------ | ||
Inspects content of and selectively trims text. Returns text and the name of an appropriate | Inspects content of and selectively trims text. Returns text and the name of an appropriate HTML tag for text. | ||
If text contains: | If text contains: | ||
\n\n text has implied <p>..</p> tags - trim leading and trailing whitespace and return | \n\n text has implied <p>..</p> tags - trim leading and trailing whitespace and return | ||
If text begins with list markup: | If text begins with list markup: | ||
\n* unordered | \n* unordered | ||
| 第797行: | 第1,005行: | ||
trim all leading whitespace except \n and trim all trailing whitespace | trim all leading whitespace except \n and trim all trailing whitespace | ||
If text contains <poem>...</poem> stripmarker, return text unmodified and choose <div>..</div> tags because | If text contains <poem>...</poem> stripmarker, return text unmodified and choose <div>..</div> tags because | ||
the stripmarker is replaced with text wrapped in <div>..</div> tags. | the stripmarker is replaced with text wrapped in <div>..</div> tags. | ||
If the text contains any actual <div>...</div> tags, then it's again returned unmodified and <div>...</div> | |||
tags are used to wrap it, to prevent div/span inversion. | |||
]] | ]] | ||
| 第804行: | 第1,015行: | ||
local function html_tag_select (text) | local function html_tag_select (text) | ||
local tag; | local tag; | ||
if has_poem_tag (text) then -- contains poem stripmarker (we can't know the content of that) | if has_poem_tag (text) then -- contains poem stripmarker (we can't know the content of that) | ||
tag = 'div'; -- poem replacement is in div tags so lang must use div tags | tag = 'div'; -- poem replacement is in div tags so lang must use div tags | ||
elseif text:find ('<div') then -- reductive; if the text contains a div tag, we must use div tags | |||
tag = 'div'; | |||
elseif mw.text.trim (text):find ('\n\n+') then -- contains implied p tags | elseif mw.text.trim (text):find ('\n\n+') then -- contains implied p tags | ||
text = mw.text.trim (text); -- trim leading and trailing whitespace characters | text = mw.text.trim (text); -- trim leading and trailing whitespace characters | ||
| 第817行: | 第1,030行: | ||
tag = 'span'; -- so span is fine | tag = 'span'; -- so span is fine | ||
end | end | ||
return text, tag; | return text, tag; | ||
end | end | ||
| 第824行: | 第1,037行: | ||
--[[--------------------------< V A L I D A T E _ P R O T O >-------------------------------------------------- | --[[--------------------------< V A L I D A T E _ P R O T O >-------------------------------------------------- | ||
Validates value assigned to |proto=; permitted values are yes and no; yes returns as true, no returns as false, | |||
empty string (or parameter omitted) returns as nil; any other value returns | empty string (or parameter omitted) returns as nil; any other value returns nil with <proto_param> as second | ||
return value for use in error message. | |||
]] | ]] | ||
local function validate_proto (proto_param) | local function validate_proto (proto_param) | ||
if | if cfg.keywords_t.affirmative == proto_param then | ||
return true; | return true; | ||
elseif | elseif cfg.keywords_t.negative == proto_param then | ||
return false; | return false; | ||
elseif is_set (proto_param) then | elseif is_set (proto_param) then | ||
return nil, | return nil, proto_param; -- |proto= something other than 'yes' or 'no' | ||
else | else | ||
return nil; -- missing or empty | return nil; -- missing or empty | ||
| 第845行: | 第1,058行: | ||
--[[--------------------------< L A N G U A G E _ N A M E _ G E T >-------------------------------------------- | --[[--------------------------< L A N G U A G E _ N A M E _ G E T >-------------------------------------------- | ||
Common function to return language name from the data set according to IETF tag. | |||
Returns language name if found in data tables; nil else. | |||
]] | ]] | ||
| 第853行: | 第1,066行: | ||
local function language_name_get (ietf, code, cat) | local function language_name_get (ietf, code, cat) | ||
ietf = ietf:lower(); -- ietf:lower() because format_ietf_tag() returns mixed case | ietf = ietf:lower(); -- ietf:lower() because format_ietf_tag() returns mixed case | ||
local name; -- remains nil if not found | local name; -- remains nil if not found | ||
if override_table[ietf] then -- look for whole IETF tag in override table | if override_table[ietf] then -- look for whole IETF tag in override table | ||
name = override_table[ietf | name = override_table[ietf]; | ||
elseif override_table[code] then -- not there so try basic language | elseif override_table[code] then -- not there so try basic language tag | ||
name = override_table[code | name = override_table[code]; | ||
elseif lang_table[code] then -- shift to | elseif lang_table[code] then -- shift to IANA active tag/name table | ||
name = lang_table[code | name = lang_table[code]; | ||
elseif lang_dep_table[code] then | elseif lang_dep_table[code] then -- try the IANA deprecated tag/name table | ||
-- | name = lang_dep_table[code]; | ||
name = lang_dep_table[code | |||
end | end | ||
if lang_dep_table[code] and cat then -- because deprecated code may have been overridden to en.wiki preferred name | if lang_dep_table[code] and cat then -- because deprecated code may have been overridden to en.wiki preferred name | ||
table.insert (maint_cats, | table.insert (maint_cats, substitute (cfg.language_name_get_t.deprecated_cat, {code})); | ||
table.insert (maint_msgs, | table.insert (maint_msgs, substitute (cfg.language_name_get_t.deprecated_msg, {code})); | ||
end | end | ||
| 第878行: | 第1,087行: | ||
end | end | ||
--[[--------------------------< T E X T _ S C R I P T _ M A T C H _ T E S T >----------------------------------

Checks that the IETF script subtag <script> agrees with the script in which the text is written.  This module
does not attempt to recognize every script; it only knows what Latn script looks like.  So:
	text that is wholly Latn script must not carry a non-Latn script subtag
	text that is not wholly Latn script must not carry a Latn script subtag

Latf (Fraktur) and Latg (Gaelic) count as Latn for this test because Unicode treats them as font-specific
variants of Latn.

<is_latn_text> is true when the text is wholly Latn script.  <pos> and <char> identify the first offending
character and are used only in the second error message.

Returns an error message when a mismatch is detected; nil else (including when <script> is nil or empty).

]]

local function text_script_match_test (script, is_latn_text, pos, char)
	if not is_set (script) then													-- no script subtag so nothing to compare
		return;
	end

	local latn_family_t = {latn = true, latf = true, latg = true};				-- 'latf' and 'latg' are font variants; there are no Fraktur or Gaelic codepoints
	local script_is_latn = latn_family_t[script:lower()];						-- lower case to index into <latn_family_t>

	if is_latn_text and not script_is_latn then									-- wholly Latn text tagged with a non-Latn script
		return cfg.text_script_match_test_t.latn_txt_mismatch;
	elseif not is_latn_text and script_is_latn then								-- text with non-Latn characters tagged with a Latn script
		return substitute (cfg.text_script_match_test_t.latn_scr_mismatch, {pos, char});	-- message includes position of first offending character
	end
end
--[[--------------------------< B I N A R Y _ S E A R C H >---------------------------------------------------

Conducts a binary search of <ranges_t> for a sub-range that holds <target>.

Parameters:
	<target> – the number (codepoint) to look for
	<ranges_t> – sequence of {low, high} pairs; the search is only meaningful when the pairs are sorted in
		ascending order and do not overlap
	<count> – optional; number of pairs in <ranges_t>.  When omitted, the module-level <sizeof_ranges_t> is used
		so existing two-argument calls behave as before

Returns boolean true if a sub-range holding <target> is found; boolean false else (including when <ranges_t>
is empty or when <target> lies outside the span covered by the first and last sub-ranges).

]]

local function binary_search (target, ranges_t, count)
	local idx_bot = 1;															-- index of first sub-range
	local idx_top = count or sizeof_ranges_t;									-- index of last sub-range (number of sub-ranges)

	if idx_top < idx_bot then													-- nothing to search
		return false;
	end

	if (target < ranges_t[idx_bot][1]) or (target > ranges_t[idx_top][2]) then	-- target below lowest low value or above highest high value
		return false;															-- abandon
	end

	while idx_bot <= idx_top do
		local idx_mid = math.floor ((idx_bot + idx_top) / 2);					-- mid-point of the part of <ranges_t> still under consideration
		local range_t = ranges_t[idx_mid];

		if target < range_t[1] then												-- <target> below this sub-range; discard it and everything above
			idx_top = idx_mid - 1;
		elseif target > range_t[2] then											-- <target> above this sub-range; discard it and everything below
			idx_bot = idx_mid + 1;
		else																	-- low value <= <target> <= high value
			return true;
		end
	end

	return false;																-- every candidate sub-range eliminated; <target> falls in a gap
end
--[[--------------------------< I S _ L A T I N >--------------------------------------------------------------

Tests every codepoint in <text> against the lists of codepoints accepted as Latn script.

A codepoint is accepted when it is a key in is_latn_data.singles_t, or binary_search() finds it in
is_latn_data.ranges_t, or <tag> is supplied and is_latn_data.specials_t lists the codepoint for that <tag>.

Parameters:
	<text> – the string to inspect
	<tag> – optional language tag used to look up language-specific codepoints

Returns:
	boolean true and <text> with the markup removed – when <text> is wrapped in ((accept-as-written)) markup;
		the codepoints are not inspected in this case
	boolean true and <text> – when every codepoint is accepted
	boolean false, <text>, position (counted in codepoints, left to right) of the first codepoint that is not
		accepted, and that codepoint as a character – otherwise

TODO: when text has accept-as-written markup, return a non-boolean value to indicate that <text> is not wholly
latn script?  Use that return value to create non-Latn HTML lang= attribute because <text> isn't really
latn so lang=und (undetermined)? or instead, omit the -Latn subtag? (without -Latn need to force |italic=yes)

]]

local function is_latin (text, tag)
	local stripped, hits = text:gsub ('^%(%((.+)%)%)$', '%1');					-- unwrap ((...)) when it encloses the whole string
	if hits > 0 then
		return true, stripped;													-- editor asked for accept-as-written; treat as Latn without inspection
	end

	local index = 0;															-- codepoint position for error messaging
	for cp in mw.ustring.gcodepoint (stripped) do
		index = index + 1;

		local known = is_latn_data.singles_t[cp] or binary_search (cp, is_latn_data.ranges_t);	-- individually listed, or inside a listed range
		if not known and tag then
			local per_language_t = is_latn_data.specials_t[cp];					-- codepoints accepted only for particular tags
			known = per_language_t and per_language_t[tag];
		end

		if not known then
			return false, stripped, index, mw.ustring.char (cp);				-- report where and what the first unaccepted codepoint is
		end
	end

	return true, stripped;														-- nothing rejected
end
--[[--------------------------< C H I N E S E _ C O N V E R S I O N >------------------------------------------

Chinese-Wikipedia-specific: decides from the language code whether <text> is to be shielded from automatic
Traditional/Simplified Chinese conversion.

	when <code> is exactly one of zh, gan, wuu, yue, lzh, hsn (Chinese without a variant, and Sinitic varieties
		written with Chinese characters): <text> is returned unmodified
	for any other <code> (a non-Chinese language, or a Chinese tag that carries subtags such as one beginning
		with 'zh-'): <text> is wrapped in -{ }- so that conversion is not applied to it

The comparison is an exact, case-sensitive match on the whole of <code>.

Parameters:
	<code> (string) – language code, e.g. 'zh', 'gan', 'yue', 'en'
	<text> (string) – the text to process

Returns (string) the processed text.

]]

local function chinese_conversion (code, text)
	local convertible_t = {													-- codes whose text stays open to variant conversion
		['zh'] = true,
		['gan'] = true,
		['wuu'] = true,
		['yue'] = true,
		['lzh'] = true,
		['hsn'] = true,
	};

	if not convertible_t[code] then
		return '-{' .. text .. '}-';											-- everything else: disable conversion for this text
	end

	return text;
end
--[[--------------------------< _ L A N G >-------------------------------------------------------------------- | --[[--------------------------< _ L A N G >-------------------------------------------------------------------- | ||
Entry point for {{lang}}. | |||
There should be no reason to set parameters in the {{lang}} {{#invoke:}} | |||
<includeonly>{{#invoke:lang|lang}}</includeonly> | <includeonly>{{#invoke:lang|lang}}</includeonly> | ||
Parameters are received from the template's frame (parent frame). | |||
]] | ]] | ||
| 第898行: | 第1,248行: | ||
local msg; -- for error messages | local msg; -- for error messages | ||
local tag = 'span'; -- initial value for make_text_html() | local tag = 'span'; -- initial value for make_text_html() | ||
local template = args.template or | local template = args.template or cfg.templates_t.lang; | ||
maint_cats = {}; -- initialize because when this module required into another module, these only declared once so only initialzed once | |||
maint_msgs = {}; | |||
error_msgs = {} | |||
validate_cat_args (args); -- determine if categorization should be suppressed | validate_cat_args (args); -- determine if categorization should be suppressed | ||
if args[1] and args.code then | if args[1] and args.code then | ||
make_error_msg (substitute (cfg.lang_t.conflict_n_param, {'1', cfg.lang_t.conflict_n_param_types.code}), args, template) | |||
end | end | ||
args.code = args[1] or args.code; -- prefer args.code | |||
if args[2] and args.text then | if args[2] and args.text then | ||
make_error_msg (substitute (cfg.lang_t.conflict_n_param, {'2', cfg.lang_t.conflict_n_param_types.text}), args, template) | |||
end | end | ||
args.text = args[2] or args.text; -- prefer args.text | |||
validate_text (template, args) | |||
args.text, tag = html_tag_select (args.text); -- inspects text; returns appropriate HTML tag with text trimmed accordingly | |||
args.text, tag = html_tag_select (args.text); -- inspects text; returns appropriate | |||
args.rtl = args.rtl == | args.rtl = args.rtl == cfg.keywords_t.affirmative; -- convert to boolean: 'yes' -> true, other values -> false | ||
args.proto, msg = validate_proto (args.proto); -- return boolean, or nil, or nil and error message flag | args.proto, msg = validate_proto (args.proto); -- return boolean, or nil, or nil and error message flag | ||
if msg then | if msg then | ||
return make_error_msg ( | return make_error_msg (substitute (cfg.lang_t.invalid_proto, {msg}), args, template); | ||
end | end | ||
| 第931行: | 第1,281行: | ||
if msg then | if msg then | ||
make_error_msg (msg, args, template) | |||
msg = nil | |||
code = code or '' | |||
end | |||
local is_latn_text, pos, char; | |||
is_latn_text, args.text, pos, char= is_latin (args.text, code); -- make a boolean | |||
msg = text_script_match_test (subtags.script, is_latn_text, pos, char) | |||
if msg then -- if an error detected then there is an error message | |||
make_error_msg (msg, args, template) | |||
msg = nil | |||
end | end | ||
args.italic, msg = validate_italic (args); | args.italic, msg = validate_italic (args); | ||
if msg then | if msg then | ||
make_error_msg (msg, args, template) | |||
msg = nil | |||
end | end | ||
if nil == args.italic then -- nil when |italic= absent or not set or |italic=default; args.italic controls | if nil == args.italic then -- nil when |italic= absent or not set or |italic=default; args.italic controls | ||
if ('latn' == subtags.script) or | if ('latn' == subtags.script) or -- script is latn | ||
( | (this_wiki_lang_tag ~= code and not is_set (subtags.script) and not has_poem_tag (args.text) and is_latn_text) then -- text not this wiki's language, no script specified and not in poem markup but is wholly latn script (auto-italics) | ||
-- 中文版默认不应用斜体 | |||
args.italic = 'unset'; -- DEFAULT for {{lang}} templates is upright; but if latn script set for font-style:italic | args.italic = 'unset'; -- DEFAULT for {{lang}} templates is upright; but if latn script set for font-style:italic | ||
else | else | ||
| 第947行: | 第1,310行: | ||
end | end | ||
end | end | ||
if is_set (subtags.script) then -- if script set, override rtl setting | if is_set (subtags.script) then -- if script set, override rtl setting | ||
if in_array (subtags.script, lang_data.rtl_scripts) then | if in_array (subtags.script, lang_data.rtl_scripts) then | ||
| 第957行: | 第1,320行: | ||
args.code = format_ietf_tag (code, subtags.script, subtags.region, subtags.variant, subtags.private); -- format to recommended subtag styles | args.code = format_ietf_tag (code, subtags.script, subtags.region, subtags.variant, subtags.private); -- format to recommended subtag styles | ||
language_name = language_name_get (args.code, code, true); | language_name = language_name_get (args.code, code, true) or ''; -- get language name; try IETF tag first, then code w/o variant then code w/ variant | ||
if | if cfg.keywords_t.invert == args.italic and 'span' == tag then -- invert only supported for in-line content | ||
args.text = invert_italics (args.text) | args.text = invert_italics (args.text) | ||
end | end | ||
args.text = chinese_conversion (args.code, args.text) -- 中文版特化部分 | |||
args.text = proto_prefix (args.text, language_name, args.proto); -- prefix proto-language text with a splat | args.text = proto_prefix (args.text, language_name, args.proto); -- prefix proto-language text with a splat | ||
table.insert (out, make_text_html (args.code, args.text, tag, args.rtl, args.italic, args.size, language_name)); | table.insert (out, make_text_html (args.code, args.text, tag, args.rtl, args.italic, args.size, language_name)); | ||
table.insert (out, make_category (code, language_name, args.nocat)); | table.insert (out, make_category (code, language_name, args.nocat)); | ||
table.insert (out, render_maint(args.nocat)); -- maintenance messages and categories | table.insert (out, render_maint (args.nocat)); -- maintenance messages and categories | ||
if not args.noerror and error_msgs[1] then | |||
table.insert(out, make_lang_error_span(table.concat(error_msgs))) | |||
end | |||
return table.concat (out); -- put it all together and done | return table.concat (out); -- put it all together and done | ||
| 第992行: | 第1,344行: | ||
--[[--------------------------< L A N G >---------------------------------------------------------------------- | --[[--------------------------< L A N G >---------------------------------------------------------------------- | ||
Entry point for {{lang}}. | |||
There should be no reason to set parameters in the {{lang}} {{#invoke:}} | |||
<includeonly>{{#invoke:lang|lang}}</includeonly> | <includeonly>{{#invoke:lang|lang}}</includeonly> | ||
Parameters are received from the template's frame (parent frame). | |||
]] | ]] | ||
local function lang (frame) | local function lang (frame) | ||
local | local args_t = getArgs (frame, { -- this code so that we can detect and handle wiki list markup in text | ||
valueFunc = function (key, value) | valueFunc = function (key, value) | ||
if 2 == key or 'text' == key then -- the 'text' parameter; do not trim wite space | if 2 == key or 'text' == key then -- the 'text' parameter; do not trim wite space | ||
| 第1,016行: | 第1,368行: | ||
}); | }); | ||
return _lang ( | args_t.fn = nil; -- unset because not supported but this function might have been called by {{lang|fn=lang|...}} | ||
local msg = parameter_validate (args_t, cfg.templates_t.lang); -- verify that all supplied parameters are supported by {{lang-??}} | |||
if args_t.noerror then | |||
msg = '' | |||
else | |||
msg = msg and make_lang_error_span(make_error_msg(msg, args_t, cfg.templates_t.lang)) or '' | |||
end | |||
return _lang (args_t) .. msg | |||
end | end | ||
--[[--------------------------< T R A N S L A T I O N _ M A K E >----------------------------------------------

Stand-alone function to create the literal-translation suffix that follows the main text.

Output is, in order: a full-width comma; unless |label=none, a <small>-wrapped label taken from
cfg.translation_make_t.lit_xlation (plain when |link= holds the negative keyword, wikilinked otherwise) followed
by a full-width colon; and finally the translation enclosed in corner brackets.

Reads <args_t>.label, <args_t>.link, and <args_t>.translation.

Also used by {{lang-x2}}.

]]

local function translation_make (args_t)
	local parts_t = {','};													-- separator between the main text and the translation

	if 'none' ~= args_t.label then												-- a label is wanted
		local label = cfg.translation_make_t.lit_xlation;
		if cfg.keywords_t.negative ~= args_t.link then
			label = make_wikilink (label);										-- linked form unless linking was declined
		end
		parts_t[#parts_t + 1] = '<small>';
		parts_t[#parts_t + 1] = label;
		parts_t[#parts_t + 1] = ':</small>';
	end

	parts_t[#parts_t + 1] = table.concat ({'「', args_t.translation, '」'});	-- the translation itself, in corner brackets

	return table.concat (parts_t);												-- make a big string and done
end
--[[--------------------------< _ L A N G _ X X >-------------------------------------------------------------- | |||
For the {{lang-??}} templates, the only parameter required to be set in the template is the language code. All | |||
other parameters can, usually should, be written in the template call. For {{lang-??}} templates for languages | |||
that can have multiple writing systems, it may be appropriate to set |script= as well. | that can have multiple writing systems, it may be appropriate to set |script= as well. | ||
For each {{lang- | For each {{lang-??}} template choose the appropriate entry-point function so that this function knows the default | ||
styling that should be applied to text. | styling that should be applied to text. | ||
| 第1,050行: | 第1,436行: | ||
|label = 'none' to suppress all labeling (language name, 'translit.', 'lit.') | |label = 'none' to suppress all labeling (language name, 'translit.', 'lit.') | ||
any other text replaces language-name label - automatic wikilinking disabled | any other text replaces language-name label - automatic wikilinking disabled | ||
for those {{lang- | for those {{lang-??}} templates that support transliteration (those templates where |text= is not entirely latn script): | ||
|translit = text that is a transliteration of text | |translit = text that is a transliteration of text | ||
|translit-std = the standard that applies to the transliteration | |translit-std = the standard that applies to the transliteration | ||
|translit-script = ISO 15924 script name; falls back to code | |translit-script = ISO 15924 script name; falls back to code | ||
For {{lang- | For {{lang-??}}, the positional parameters are: | ||
{{{1}}} text | {{{1}}} text | ||
{{{2}}} transliterated text | {{{2}}} transliterated text | ||
| 第1,064行: | 第1,450行: | ||
]] | ]] | ||
local function _lang_xx (args) | local function _lang_xx (args, base_template) -- base_template will be either of 'Langx' or 'Lang-xx' | ||
local out = {}; | local out = {}; | ||
local language_name; -- used to make display text, article links | local language_name; -- used to make display text, article links | ||
| 第1,073行: | 第1,459行: | ||
local translit_script_name; -- name associated with IANA (ISO 15924) script code | local translit_script_name; -- name associated with IANA (ISO 15924) script code | ||
local translit; | local translit; | ||
local msg; -- for error messages | local msg; -- for error messages | ||
local tag = 'span'; -- initial value for make_text_html() | local tag = 'span'; -- initial value for make_text_html() | ||
local template = args.template or ' | local template = args.template or base_template; | ||
maint_cats = {}; -- initialize because when this module required into another module, these only declared once so only initialzed once | |||
maint_msgs = {}; | |||
error_msgs = {} | |||
local text_idx = (cfg.templates_t.langx == base_template) and 2 or 1; -- for {{langx}} 'text' positional parameter is '2' | |||
local translit_idx = (cfg.templates_t.langx == base_template) and 3 or 2; | |||
local xlate_idx = (cfg.templates_t.langx == base_template) and 4 or 3; | |||
if args[ | if args[text_idx] and args.text then | ||
make_error_msg (substitute (cfg.lang_t.conflict_n_param, {text_idx, cfg.lang_t.conflict_n_param_types.text}), args, template) | |||
end | end | ||
args.text = args[text_idx] or args.text; -- prefer positional 'text' parameter | |||
validate_text (template, args) | |||
args.text, tag = html_tag_select (args.text); -- inspects text; returns appropriate | args.text, tag = html_tag_select (args.text); -- inspects text; returns appropriate HTML tag with text trimmed accordingly | ||
if args[ | if args[translit_idx] and args.translit then | ||
make_error_msg (substitute (cfg.lang_t.conflict_n_param, {translit_idx, cfg.lang_t.conflict_n_param_types.translit}), args, template) | |||
end | end | ||
args.translit = args[translit_idx] or args.translit; -- prefer positional 'translit' parameter | |||
if args[ | |||
if args[xlate_idx] and (args.translation or args.lit) then | |||
make_error_msg (substitute (cfg.lang_xx_t.conflict_n_lit, {xlate_idx}), args, template) | |||
elseif args.translation and args.lit then | elseif args.translation and args.lit then | ||
make_error_msg (cfg.lang_xx_t.conflict_lit, args, template) | |||
end | end | ||
args.translation = args[xlate_idx] or args.translation or args.lit; -- prefer positional 'translation' parameter | |||
if args.links and args.link then | if args.links and args.link then | ||
make_error_msg (cfg.lang_xx_t.conflict_link, args, template) | |||
end | end | ||
args.link = args.link or args.links; -- prefer args.link | |||
validate_cat_args (args); -- determine if categorization should be suppressed | validate_cat_args (args); -- determine if categorization should be suppressed | ||
args.rtl = args.rtl == | args.rtl = args.rtl == cfg.keywords_t.affirmative; -- convert to boolean: 'yes' -> true, other values -> false | ||
code, subtags.script, subtags.region, subtags.variant, subtags.private, msg = get_ietf_parts (args.code, args.script, args.region, args.variant); -- private omitted because private | code, subtags.script, subtags.region, subtags.variant, subtags.private, msg = get_ietf_parts (args.code, args.script, args.region, args.variant); -- private omitted because private | ||
if msg then -- if an error detected then there is an error message | if msg then -- if an error detected then there is an error message | ||
make_error_msg (msg, args, template) | |||
msg = nil | |||
code = code or '' | |||
end | end | ||
if args.translit then | |||
local latn, pos, char; | |||
latn, args.translit, pos, char = is_latin (args.translit, (('' ~= subtags.private) and (code .. '-x-' .. subtags.private)) or code); | |||
if not latn then | |||
make_error_msg (substitute (cfg.lang_xx_t.translit_nonlatn, {pos, char}), args, template) | |||
end | |||
end | |||
local is_latn_text, text, pos, char = is_latin (args.text, code); -- make a boolean | |||
args.text = text; -- may have been modified (accept-as-written markup removed) | |||
msg = text_script_match_test (subtags.script, is_latn_text, pos, char) | |||
if msg then -- if an error detected then there is an error message | |||
make_error_msg (msg, args, template) | |||
msg = nil | |||
end | |||
args.italic, msg = validate_italic (args); | args.italic, msg = validate_italic (args); | ||
if msg then | if msg then | ||
make_error_msg (msg, args, template) | |||
msg = nil | |||
end | end | ||
if | if cfg.templates_t.langx == base_template then -- auto-italics for {{langx}} templates; adapted from {{lang}} (no support for poem tag) | ||
if nil == args.italic then -- nil when |italic= absent or not set or |italic=default; args.italic controls | |||
args.italic = 'inherit'; -- italic not set; script not latn; inherit current style | |||
end | |||
else -- {{lang-xx}} does not do auto italics; retained for those wikis that don't support {{langx}} | |||
if nil == args.italic then -- args.italic controls | |||
args.italic = initial_style_state; -- here when |italic= and |script= not set; set for font-style:<initial_style_state> | args.italic = initial_style_state; -- here when |italic= and |script= not set; set for font-style:<initial_style_state> | ||
end | end | ||
end | end | ||
if is_set (subtags.script) then -- if script set override rtl setting | if is_set (subtags.script) then -- if script set override rtl setting | ||
if in_array (subtags.script, lang_data.rtl_scripts) then | if in_array (subtags.script, lang_data.rtl_scripts) then | ||
| 第1,148行: | 第1,554行: | ||
args.proto, msg = validate_proto (args.proto); -- return boolean, or nil, or nil and error message flag | args.proto, msg = validate_proto (args.proto); -- return boolean, or nil, or nil and error message flag | ||
if msg then | if msg then | ||
return make_error_msg ( | return make_error_msg (substitute (cfg.lang_t.invalid_proto, {args.proto}), args, template); | ||
end | end | ||
args.code = format_ietf_tag (code, subtags.script, subtags.region, subtags.variant, subtags.private); -- format to recommended subtag styles | args.code = format_ietf_tag (code, subtags.script, subtags.region, subtags.variant, subtags.private); -- format to recommended subtag styles | ||
language_name = language_name_get (args.code, code, true); | language_name = language_name_get (args.code, code, true) or ''; -- get language name; try IETF tag first, then code w/o variant then code w/ variant | ||
category_name = language_name; -- category names retain IANA parenthetical diambiguators (if any) | category_name = language_name; -- category names retain IANA parenthetical diambiguators (if any) | ||
| 第1,162行: | 第1,568行: | ||
end | end | ||
else | else | ||
if | if cfg.keywords_t.negative == args.link then | ||
table.insert (out, language_name); -- language name without wikilink | table.insert (out, language_name); -- language name without wikilink | ||
else | else | ||
if lang_data.article_name[code] then | -- 中文版不需要 | ||
table.insert (out, make_wikilink (lang_data.article_name[code | -- if mw.ustring.find (language_name, 'languages', 1, true) then | ||
-- table.insert (out, make_wikilink (language_name)); -- collective language name uses simple wikilink | |||
-- elseif lang_data.article_name[args.code:lower()] then -- is IETF tag in article name over ride? | |||
-- table.insert (out, make_wikilink (lang_data.article_name[args.code:lower()], language_name)); -- language name with wikilink from override data | |||
if lang_data.article_name[code] then -- is language tag in article override | |||
table.insert (out, make_wikilink (lang_data.article_name[code], language_name)); -- language name with wikilink from override data | |||
else | else | ||
table.insert (out, make_wikilink (language_name)); -- language name with wikilink | table.insert (out, make_wikilink (language_name)); -- language name with wikilink | ||
end | end | ||
end | end | ||
| 第1,174行: | 第1,585行: | ||
end | end | ||
if | if cfg.keywords_t.invert == args.italic then | ||
args.text = invert_italics (args.text) | args.text = invert_italics (args.text) | ||
end | end | ||
args.text = chinese_conversion (args.code, args.text) -- 中文版特化部分 | |||
args.text = proto_prefix (args.text, language_name, args.proto); -- prefix proto-language text with a splat | args.text = proto_prefix (args.text, language_name, args.proto); -- prefix proto-language text with a splat | ||
table.insert (out, make_text_html (args.code, args.text, tag, args.rtl, args.italic, args.size, ('none' == args.label) and language_name or nil)) | table.insert (out, make_text_html (args.code, args.text, tag, args.rtl, args.italic, args.size, ('none' == args.label) and language_name or nil)) | ||
if is_set (args.translit) and not | if is_set (args.translit) and not is_latn_text then -- transliteration; not supported when args.text is wholly latn text (this is an imperfect test) | ||
table.insert (out, ','); -- comma to separate text from translit | table.insert (out, ','); -- comma to separate text from translit | ||
if 'none' ~= args.label then | if 'none' ~= args.label then | ||
table.insert (out, '<small>'); | table.insert (out, '<small>'); | ||
if script_table[args['translit-script']] then -- when |translit-script= is set, try to use the script's name | if script_table[args['translit-script']] then -- when |translit-script= is set, try to use the script's name | ||
translit_script_name = script_table[args['translit-script' | translit_script_name = script_table[args['translit-script']]; | ||
else | else | ||
translit_script_name = language_name; -- fall back on language name | translit_script_name = language_name; -- fall back on language name | ||
end | end | ||
if | local translit_title_obj = mw.title.makeTitle (0, substitute ('$2$1',{cfg.lang_xx_t.romanization, translit_script_name})); -- make a title object; no engvar, article titles use US spelling | ||
table.insert (out, make_wikilink ((translit_script_name or language_name) | if translit_title_obj.exists and (cfg.keywords_t.negative ~= args.link) then | ||
table.insert (out, make_wikilink (substitute ('$2$1', {cfg.lang_xx_t.romanization, translit_script_name or language_name}), | |||
substitute ('$1', {cfg.lang_xx_t.romanization})) .. ':'); -- make a wikilink if there is an article to link to; engvar the display text | |||
else | else | ||
table.insert (out, ' | table.insert (out, substitute ('$1:', {cfg.lang_xx_t.romanization})); -- else plain text per engvar | ||
end | end | ||
table.insert (out, ' | table.insert (out, '</small>'); -- close the small tag | ||
end | end | ||
translit = make_translit (args.code, language_name, args.translit, args['translit-std'], args['translit-script']) | translit = make_translit (args.code, language_name, args.translit, args['translit-std'], args['translit-script'], nil) | ||
if is_set (translit) then | if is_set (translit) then | ||
table.insert (out, translit); | table.insert (out, translit); | ||
else | else | ||
make_error_msg (substitute ('$1:$2', {cfg.lang_xx_t.invalid_xlit_std, args['translit-std'] or '[missing]'}), args, template) | |||
end | end | ||
elseif is_set (args.translit) and is_latn_text then -- when creating a transliteration of Latn script <text> | |||
make_error_msg (cfg.lang_xx_t.xlit_of_latn, args, template) | |||
end | end | ||
if is_set (args.translation) then -- translation (not supported in {{lang}}) | if is_set (args.translation) then -- translation (not supported in {{lang}}) | ||
table.insert (out, | table.insert (out, translation_make (args)); | ||
end | end | ||
table.insert (out, make_category (code, category_name, args.nocat)); | table.insert (out, make_category (code, category_name, args.nocat)); | ||
table.insert (out, render_maint(args.nocat)); -- maintenance messages and categories | table.insert (out, render_maint(args.nocat)); -- maintenance messages and categories | ||
if not args.noerror and error_msgs[1] then | |||
table.insert(out, make_lang_error_span(table.concat(error_msgs))) | |||
end | |||
return table.concat (out); -- put it all together and done | return table.concat (out); -- put it all together and done | ||
| 第1,248行: | 第1,645行: | ||
--[[--------------------------< L A N G _ X X _ A R G S _ G E T >---------------------------------------------- | --[[--------------------------< L A N G _ X X _ A R G S _ G E T >---------------------------------------------- | ||
Common function to get args table from {{lang-??}} templates. | |||
Returns table of args. | |||
Text positional parameters are not trimmed here but are selectively trimmed at html_tag_select(). | |||
]] | ]] | ||
local function lang_xx_args_get (frame) | local function lang_xx_args_get (frame, base_template) | ||
local | local args_t = getArgs(frame, | ||
{ | { | ||
parentFirst= true, -- parameters in the template override parameters set in the {{#invoke:}} | parentFirst= true, -- parameters in the template override parameters set in the {{#invoke:}} | ||
valueFunc = function (key, value) | valueFunc = function (key, value) | ||
if 1 == key then | if ((cfg.templates_t.langx == base_template) and 2 or 1) == key then -- the 'text' positional parameter; 1 for {{lang-??}}, 2 for {{langx}}; do not trim wite space | ||
return value; -- return untrimmed 'text' | return value; -- return untrimmed 'text' positional parameter | ||
elseif value then -- all other values: if the value is not nil | elseif value then -- all other values: if the value is not nil | ||
value = mw.text.trim (value); -- trim whitespace | value = mw.text.trim (value); -- trim whitespace | ||
| 第1,271行: | 第1,670行: | ||
}); | }); | ||
return | return args_t; | ||
end | end | ||
| 第1,277行: | 第1,676行: | ||
--[[--------------------------< L A N G _ X X _ I T A L I C >--------------------------------------------------

Entry point for those {{lang-??}} templates that call lang_xx_italic().

Chinese Wikipedia: italics are ignored here unless |italic_important= is set, so the initial style state is
'italic' only when that parameter is present and 'inherit' otherwise.

Unsupported-parameter errors found by parameter_validate() are rendered after the normal output unless |noerror=
is set.  The output always ends with the tracking category for pages that use Lang-xx templates.

]]

local function lang_xx_italic (frame)
	local template = cfg.templates_t.langxx;
	local args = lang_xx_args_get (frame, template);
	args.fn = nil;																-- unset because not supported but this function might have been called by {{lang|fn=lang_xx_italic|...}}

	local param_error = parameter_validate (args, template);					-- verify that all supplied parameters are supported by {{lang-??}}
	local error_html = '';
	if param_error and not args.noerror then									-- |noerror= suppresses the report
		error_html = make_lang_error_span (make_error_msg (param_error, args, template)) or '';
	end

	if args.italic_important then
		initial_style_state = 'italic';
	else
		initial_style_state = 'inherit';
	end

	return _lang_xx (args, template) .. error_html .. '[[Category:使用Lang-xx模板的页面]]'
end
| 第1,291行: | 第1,699行: | ||
--[[--------------------------< _ L A N G _ X X _ I T A L I C >------------------------------------------------

Entry point from another module; <args> is an already-prepared table of template parameters.

Chinese Wikipedia: italics are ignored unless <args>.italic_important is set, so the initial style state is
'italic' only in that case and 'inherit' otherwise.

]]

local function _lang_xx_italic (args)
	if args.italic_important then
		initial_style_state = 'italic';
	else
		initial_style_state = 'inherit';
	end

	return _lang_xx (args, cfg.templates_t.langxx);
end
| 第1,303行: | 第1,711行: | ||
--[[--------------------------< L A N G _ X X _ I N H E R I T >------------------------------------------------ | --[[--------------------------< L A N G _ X X _ I N H E R I T >------------------------------------------------ | ||
Entry point for those {{lang- | Entry point for those {{lang-??}} templates that call lang_xx_inherit(). Sets the initial style state to inherit. | ||
]] | ]] | ||
local function lang_xx_inherit (frame) | local function lang_xx_inherit (frame) | ||
local args = lang_xx_args_get (frame); | local args = lang_xx_args_get (frame, cfg.templates_t.langxx); | ||
args.fn = nil; -- unset because not supported but this function might have been called by {{lang|fn=lang_xx_inherit|...}} | |||
local msg = parameter_validate (args, cfg.templates_t.langxx); -- verify that all supplied parameters are supported by {{lang-??}} | |||
if args.noerror then | |||
msg = '' | |||
else | |||
msg = msg and make_lang_error_span(make_error_msg(msg, args, cfg.templates_t.langxx)) or '' | |||
end | |||
initial_style_state = 'inherit'; | initial_style_state = 'inherit'; | ||
return _lang_xx (args) | return _lang_xx (args, cfg.templates_t.langxx) .. msg .. '[[Category:使用Lang-xx模板的页面]]' | ||
end | end | ||
| 第1,317行: | 第1,734行: | ||
--[[--------------------------< _ L A N G _ X X _ I N H E R I T >---------------------------------------------- | --[[--------------------------< _ L A N G _ X X _ I N H E R I T >---------------------------------------------- | ||
Entry point from another module. | Entry point from another module. Sets the initial style state to inherit. | ||
]] | ]] | ||
| 第1,323行: | 第1,740行: | ||
local function _lang_xx_inherit (args) | local function _lang_xx_inherit (args) | ||
initial_style_state = 'inherit'; | initial_style_state = 'inherit'; | ||
return _lang_xx (args); | return _lang_xx (args, cfg.templates_t.langxx); | ||
end | |||
--[[--------------------------< _ L A N G X >------------------------------------------------------------------ | |||
Entry point from another module. | |||
]] | |||
local function _langx (args_t) | |||
local langx_data = mw.loadData ('Module:Lang/langx'); -- get necessary data | |||
local rtl_t = langx_data.rtl_t; -- get list of language tags for languages that are rendered right-to-left | |||
local link_t = langx_data.link_t; -- get list of language tags for {{lang-??}} templates that set |link=<something> | |||
local size_t = langx_data.size_t; -- get list of language tags for {{lang-??}} templates that set |size=<something> | |||
error_msgs = {} | |||
local msg = parameter_validate (args_t, cfg.templates_t.langx); | |||
if msg then | |||
make_error_msg (msg, args_t, cfg.templates_t.langx) | |||
msg = nil | |||
end | |||
args_t.code = args_t[1] or args_t.code; -- get the language tag; must be {{{1}}} or |code= | |||
if not args_t.code then | |||
make_error_msg (cfg.get_ietf_parts_t.missing_lang_tag, args_t, cfg.templates_t.langx) | |||
end | |||
args_t.rtl = args_t.rtl or (rtl_t[args_t.code] and cfg.keywords_t.affirmative); -- prefer |rtl= in template call, use rtl_t else | |||
args_t.link = args_t.link or link_t[args_t.code]; -- prefer |link= in template call, use link_t else | |||
args_t.size = args_t.size or size_t[args_t.code]; -- prefer |size= in template call, use size_t else | |||
args_t[1] = nil; -- unset to mimic {{lang-??}} templates which set |code=xx | |||
if not args_t.noerror and error_msgs[1] then | |||
msg = make_lang_error_span(table.concat(error_msgs)) | |||
end | |||
local lang_subtag = args_t.code; -- use only the base language subtag for unsupported tag test; some args_t.code are modified by |script= etc | |||
return _lang_xx (args_t, cfg.templates_t.langx) .. (msg or '') | |||
end | |||
--[[--------------------------< L A N G X >-------------------------------------------------------------------- | |||
Entry point for {{langx}}. | |||
This function calls _lang_xx() to render non-English text. The {{lang-??}} templates have three positional parameters | |||
but {{langx}} has four: | |||
| 1 | 2 | 3 | 4 | |||
{{lang-xx |<text> |<transl> |<xlate> }} | |||
{{langx |<tag> |<text> |<transl> |<xlate> }} | |||
The calls to lang_xx_args_get() and _lang_xx() use 'Langx' as a flag for those functions to select the proper | |||
positional parameters. | |||
{{lang-??}} depends on the calling template to select 'inherit' or 'italic' to establish the default rendering. | |||
{{langx}} can't do that. The initial version of {{langx}} relied on a list of language tags (inherit_t in ~/langx) | |||
scraped from those {{lang-??}} templates that call lang_xx_inherit() to render text in upright font. langx() now | |||
uses auto-italics code adapted from {{lang}} (doesn't support poem tags). | |||
]] | |||
local function langx (frame) | |||
local args_t = lang_xx_args_get (frame, cfg.templates_t.langx); -- get the arguments; 'Langx' is the <base_template> used to decide which positional param is 'text', 'translit', 'lit' | |||
return _langx (args_t); | |||
end | end | ||
| 第1,331行: | 第1,817行: | ||
Returns true when a language name associated with IETF language tag exists; nil else. IETF language tag must be valid. | Returns true when a language name associated with IETF language tag exists; nil else. IETF language tag must be valid. | ||
All code combinations supported by {{lang}} and the {{lang- | All code combinations supported by {{lang}} and the {{lang-??}} templates are supported by this function. | ||
Module entry point from another module | Module entry point from another module. | ||
]] | ]] | ||
| 第1,347行: | 第1,833行: | ||
--[[--------------------------< I S _ I E T F _ T A G >-------------------------------------------------------- | --[[--------------------------< I S _ I E T F _ T A G >-------------------------------------------------------- | ||
Module entry point from an {{#invoke:}} | Module entry point from an {{#invoke:}}. | ||
]] | ]] | ||
local function is_ietf_tag (frame) | local function is_ietf_tag (frame) | ||
return _is_ietf_tag (getArgs (frame)[1]); -- args[1] is the | return _is_ietf_tag (getArgs (frame)[1]); -- args[1] is the IETF language tag to be tested; also get parent frame | ||
end | end | ||
| 第1,365行: | 第1,851行: | ||
local function is_ietf_tag_frame (frame) | local function is_ietf_tag_frame (frame) | ||
return _is_ietf_tag (getArgs (frame, {frameOnly = true,})[1]); -- args[1] is the | return _is_ietf_tag (getArgs (frame, {frameOnly = true,})[1]); -- args[1] is the IETF language tag to be tested; do not get parent frame | ||
end | end | ||
| 第1,373行: | 第1,859行: | ||
Returns language name associated with IETF language tag if valid; error message else. | Returns language name associated with IETF language tag if valid; error message else. | ||
All code combinations supported by {{lang}} and the {{lang- | All code combinations supported by {{lang}} and the {{lang-??}} templates are supported by this function. | ||
Set invoke's |link= parameter to yes to get wikilinked version of the language name. | Set invoke's |link= parameter to yes to get wikilinked version of the language name. | ||
Module entry point from another module | Module entry point from another module. | ||
]] | ]] | ||
| 第1,384行: | 第1,870行: | ||
local subtags = {}; -- IETF subtags script, region, variant, and private | local subtags = {}; -- IETF subtags script, region, variant, and private | ||
local raw_code = args[1]; -- save a copy of the input IETF subtag | local raw_code = args[1]; -- save a copy of the input IETF subtag | ||
local link = | local link = cfg.keywords_t.affirmative == args['link']; -- make a boolean | ||
local label = args.label; | local label = args.label; | ||
local code; -- the language code | local code; -- the language code | ||
local msg; -- gets an error message if IETF language tag is malformed or invalid | local msg; -- gets an error message if IETF language tag is malformed or invalid | ||
local language_name = ''; | local language_name = ''; | ||
code, subtags.script, subtags.region, subtags.variant, subtags.private, msg = get_ietf_parts (raw_code); | code, subtags.script, subtags.region, subtags.variant, subtags.private, msg = get_ietf_parts (raw_code); | ||
if msg then | if msg then | ||
local template = (args['template'] and table.concat ({'{{', args['template'], '}} | local template = (args['template'] and table.concat ({'{{', args['template'], '}}:'})) or ''; -- make template name (if provided by the template) | ||
return | return make_error_span (template, msg); | ||
end | end | ||
raw_code = format_ietf_tag (code, subtags.script, subtags.region, subtags.variant, subtags.private); -- format to recommended subtag styles; private omitted because private | raw_code = format_ietf_tag (code, subtags.script, subtags.region, subtags.variant, subtags.private); -- format to recommended subtag styles; private omitted because private | ||
language_name = language_name_get (raw_code, code); -- get language name; try | language_name = language_name_get (raw_code, code); -- get language name; try IETF tag first, then code w/o variant then code w/ variant | ||
language_name = language_name:gsub ('%s+%b()', ''); | if 'yes' ~= args.raw then | ||
language_name = language_name:gsub ('%s+%b()', ''); -- remove IANA parenthetical disambiguators or qualifiers from names that have them | |||
end | |||
if link then -- when |link=yes, wikilink the language name | if link then -- when |link=yes, wikilink the language name | ||
if lang_data.article_name[ | if mw.ustring.find (language_name, '语系', 1, true) then | ||
language_name = make_wikilink (lang_data.article_name[code][ | language_name = make_wikilink (language_name, label); -- collective language name uses simple wikilink | ||
elseif lang_data.article_name[raw_code:lower()] then -- is IETF tag in article name override? | |||
language_name = make_wikilink (lang_data.article_name[raw_code:lower()], label or language_name); -- language name with wikilink from override data | |||
elseif lang_data.article_name[code] then -- is language tag in article name override? | |||
language_name = make_wikilink (lang_data.article_name[code], label or language_name); -- language name with wikilink from override data | |||
else | else | ||
language_name = make_wikilink (language_name, label or language_name); -- language name with wikilink | language_name = make_wikilink (language_name, label or language_name); -- language name with wikilink | ||
| 第1,415行: | 第1,907行: | ||
--[[--------------------------< N A M E _ F R O M _ T A G >---------------------------------------------------- | --[[--------------------------< N A M E _ F R O M _ T A G >---------------------------------------------------- | ||
Module entry point from an {{#invoke:}} | Module entry point from an {{#invoke:}}. | ||
]] | ]] | ||
local function name_from_tag (frame) -- entry point from an {{#invoke:Lang|name_from_tag|< | local function name_from_tag (frame) -- entry point from an {{#invoke:Lang|name_from_tag|<IETF tag>|link=<yes>|template=<template name>}} | ||
return _name_from_tag (getArgs(frame)) -- pass-on the args table, nothing else; getArgs() so we also get parent frame | return _name_from_tag (getArgs(frame)) -- pass-on the args table, nothing else; getArgs() so we also get parent frame | ||
end | end | ||
| 第1,426行: | 第1,918行: | ||
--[[--------------------------< _ T A G _ F R O M _ N A M E >-------------------------------------------------- | --[[--------------------------< _ T A G _ F R O M _ N A M E >-------------------------------------------------- | ||
Returns the | Returns the IETF language tag associated with the language name. Spelling of language name must be correct | ||
according to the spelling in the source tables. When a standard language name has a parenthetical disambiguator, | according to the spelling in the source tables. When a standard language name has a parenthetical disambiguator, | ||
that disambiguator must be omitted (they are not present in the data name-to-tag tables). | that disambiguator must be omitted (they are not present in the data name-to-tag tables). | ||
Module entry point from another module | Module entry point from another module. | ||
]] | ]] | ||
| 第1,438行: | 第1,930行: | ||
if args[1] and '' ~= args[1] then | if args[1] and '' ~= args[1] then | ||
local data = mw.loadData ('Module:Lang/tag from name'); | local data = mw.loadData ('Module:Lang/tag from name' .. sandbox); -- get the reversed data tables TODO: change when going live | ||
local lang = args[1]:lower(); -- allow any-case for the language name (spelling must still be correct) | local lang = args[1]:lower(); -- allow any-case for the language name (spelling must still be correct) | ||
local tag = data.rev_override_table[lang] or data.rev_lang_table[lang] or data.rev_lang_dep_table[lang]; -- get the code; look first in the override then in the standard | local tag = data.rev_override_table[lang] or data.rev_lang_table[lang] or data.rev_lang_dep_table[lang]; -- get the code; look first in the override then in the standard | ||
| 第1,445行: | 第1,937行: | ||
return tag, true; -- language name found so return tag and done; second return used by is_lang_name() | return tag, true; -- language name found so return tag and done; second return used by is_lang_name() | ||
else | else | ||
msg = | msg = substitute (cfg.tag_from_name_t.lang_not_found, {args[1]}); -- language name not found, error message | ||
end | end | ||
else | else | ||
msg = | msg = cfg.tag_from_name_t.missing_lang_name; -- language name not found, error message | ||
end | end | ||
local template = ''; | local template = ''; | ||
if args.template and '' ~= args.template then | if args.template and '' ~= args.template then | ||
template = table.concat ({'{{', args['template'], '}} | template = table.concat ({'{{', args['template'], '}}:'}); -- make template name (if provided by the template) | ||
end | end | ||
return | return make_error_span (template, msg); | ||
end | end | ||
| 第1,461行: | 第1,954行: | ||
--[[--------------------------< T A G _ F R O M _ N A M E >---------------------------------------------------- | --[[--------------------------< T A G _ F R O M _ N A M E >---------------------------------------------------- | ||
Module entry point from an {{#invoke:}} | Module entry point from an {{#invoke:}}. | ||
]] | ]] | ||
| 第1,467行: | 第1,960行: | ||
local function tag_from_name (frame) -- entry point from an {{#invoke:Lang|tag_from_name|<language name>|link=<yes>|template=<template name>}} | local function tag_from_name (frame) -- entry point from an {{#invoke:Lang|tag_from_name|<language name>|link=<yes>|template=<template name>}} | ||
local result, _ = _tag_from_name (getArgs(frame)) -- pass-on the args table, nothing else; getArgs() so we also get parent frame; suppress second return used by is_lang_name() | local result, _ = _tag_from_name (getArgs(frame)) -- pass-on the args table, nothing else; getArgs() so we also get parent frame; suppress second return used by is_lang_name() | ||
return result; | return result; | ||
end | end | ||
| 第1,473行: | 第1,966行: | ||
--[[--------------------------< I S _ L A N G _ N A M E >------------------------------------------------------ | --[[--------------------------< I S _ L A N G _ N A M E >------------------------------------------------------ | ||
Module entry point from an {{#invoke:}} | Module entry point from an {{#invoke:}}. | ||
]] | ]] | ||
| 第1,479行: | 第1,972行: | ||
local function is_lang_name (frame) | local function is_lang_name (frame) | ||
local _, result = _tag_from_name (getArgs(frame)) -- pass-on the args table, nothing else; getArgs() so we also get parent frame; suppress first return used by tag_from_name() | local _, result = _tag_from_name (getArgs(frame)) -- pass-on the args table, nothing else; getArgs() so we also get parent frame; suppress first return used by tag_from_name() | ||
return result and true or nil; | return result and true or nil; | ||
end | end | ||
| 第1,485行: | 第1,978行: | ||
--[[--------------------------< _ T R A N S L >---------------------------------------------------------------- | --[[--------------------------< _ T R A N S L >---------------------------------------------------------------- | ||
Module entry point from another module | Module entry point from another module. | ||
]] | ]] | ||
| 第1,495行: | 第1,988行: | ||
local script; -- IANA script | local script; -- IANA script | ||
local msg; -- for when called functions return an error message | local msg; -- for when called functions return an error message | ||
local template = args.template or cfg.templates_t.transliteration; | |||
if is_set (args[3]) then -- [3] set when {{ | maint_cats = {}; -- initialize because when this module is required into another module, these are only declared once so only initialized once | ||
maint_msgs = {}; | |||
error_msgs = {} | |||
if is_set (args[3]) then -- [3] set when {{transliteration|code|standard|text}} | |||
args.text = args[3]; -- get the transliterated text | args.text = args[3]; -- get the transliterated text | ||
args.translit_std = args[2] and args[2]:lower(); -- get the standard; lower case for table indexing | args.translit_std = args[2] and args[2]:lower(); -- get the standard; lower case for table indexing | ||
if not title_table[args.translit_std] then | if not title_table[args.translit_std] then | ||
make_error_msg (substitute (cfg.transl_t.unrecog_xlit_std, {args.translit_std}), args, template) | |||
args.translit_std = nil | |||
end | end | ||
else | else | ||
if is_set (args[2]) then -- [2] set when {{ | if is_set (args[2]) then -- [2] set when {{transliteration|code|text}} | ||
args.text = args[2]; -- get the transliterated text | args.text = args[2]; -- get the transliterated text | ||
else | else | ||
if args[1] and args[1]:match ('^%a%a%a?%a?$') | if args[1] and (args[1]:match ('^%a%a%a?%a?$') or -- args[2] missing; is args[1] a language or script tag or is it the transliterated text? | ||
args[1]:match ('^%a%a%a?%-x%-')) then -- or is args[1] a private-use tag | |||
make_error_msg (cfg.transl_t.no_text, args, template) -- args[1] is a code so we're missing text | |||
args.text = '' | |||
else | else | ||
make_error_msg (cfg.transl_t.missing_lang_scr, args, template) | |||
args.text = '' | |||
end | end | ||
end | end | ||
end | end | ||
if is_set (args[1]) then -- IANA language code used for | if is_set (args[1]) then -- IANA language code used for HTML lang= attribute; or ISO 15924 script code | ||
if args[1]:match ('^%a%a%a?%a?$') then | if args[1]:match ('^%a%a%a?%a?$') or args[1]:match ('^%a%a%a?%-x%-') then -- args[1] has correct form? | ||
args.code = args[1]:lower(); -- use the language/script code; only (2, 3, or 4 alpha characters); lower case because table indexes are lower case | args.code = args[1]:lower(); -- use the language/script code; only (2, 3, or 4 alpha characters) or private-use; lower case because table indexes are lower case | ||
else | else | ||
make_error_msg (substitute (cfg.transl_t.unrecog_lang_scr, {args[1]}), args, template) -- invalid language / script code | |||
args.code = '' | |||
end | end | ||
else | else | ||
make_error_msg (cfg.transl_t.missing_lang_scr, args, template) -- missing language / script code | |||
args.code = '' | |||
end | |||
local is_latn_text, pos, char; | |||
is_latn_text, args.text, pos, char= is_latin (args.text, args.code); -- is latn text? strip accept-as-written markup | |||
if not is_latn_text then -- when text is not latn | |||
make_error_msg (substitute (cfg.lang_xx_t.translit_nonlatn, {pos, char}), args, template) | |||
end | end | ||
args.italic, msg = validate_italic (args); | args.italic, msg = validate_italic (args); | ||
if msg then | if msg then | ||
make_error_msg (msg, args, template) | |||
msg = nil | |||
end | end | ||
if 'italic' == args.italic then -- 'italic' when |italic=yes; because that is same as absent or not set and |italic=default | if 'italic' == args.italic then -- 'italic' when |italic=yes; because that is same as absent or not set and |italic=default | ||
args.italic = nil; -- set to nil; | args.italic = nil; -- set to nil; | ||
end | end | ||
if override_table[args.code] then -- is code a language code defined in the override table? | if override_table[args.code] then -- is code a language code defined in the override table? | ||
language_name = override_table[args.code | language_name = override_table[args.code]; | ||
args.code = args.code:match ('^%a%a%a?'); -- if private use, strip all but language subtag | |||
elseif lang_table[args.code] then -- is code a language code defined in the standard language code tables? | elseif lang_table[args.code] then -- is code a language code defined in the standard language code tables? | ||
language_name = lang_table[args.code | language_name = lang_table[args.code]; | ||
elseif lang_dep_table[args.code] then -- is code a language code defined in the deprecated language code tables? | elseif lang_dep_table[args.code] then -- is code a language code defined in the deprecated language code tables? | ||
language_name = lang_dep_table[args.code | language_name = lang_dep_table[args.code]; | ||
elseif script_table[args.code] then -- if here, code is not a language code; is it a script code? | elseif script_table[args.code] then -- if here, code is not a language code; is it a script code? | ||
language_name = script_table[args.code | language_name = script_table[args.code]; | ||
script = args.code; -- code was an ISO 15924 script so use that instead | script = args.code; -- code was an ISO 15924 script so use that instead | ||
args.code = ''; -- unset because not a language code | args.code = ''; -- unset because not a language code | ||
else | else | ||
make_error_msg (substitute (cfg.transl_t.unrecog_lang_scr, {args.code}), args, template) -- invalid language / script code | |||
language_name = args.code | |||
end | end | ||
-- here only when all parameters passed to make_translit() are valid | -- here only when all parameters passed to make_translit() are valid | ||
return make_translit (args.code, language_name, args.text, args.translit_std, script, args.italic) | |||
if not args.noerror and error_msgs[1] then | |||
msg = make_lang_error_span(table.concat(error_msgs)) | |||
end | |||
return make_translit (args.code, language_name, args.text, args.translit_std, script, args.italic) .. (msg or '') | |||
end | end | ||
| 第1,555行: | 第2,074行: | ||
--[[--------------------------< T R A N S L >------------------------------------------------------------------ | --[[--------------------------< T R A N S L >------------------------------------------------------------------ | ||
Module entry point from an {{#invoke:}} | Module entry point from an {{#invoke:}}. | ||
]] | ]] | ||
| 第1,566行: | 第2,085行: | ||
--[[--------------------------< C A T E G O R Y _ F R O M _ T A G >-------------------------------------------- | --[[--------------------------< C A T E G O R Y _ F R O M _ T A G >-------------------------------------------- | ||
Returns category name associated with IETF language tag if valid; error message else | Returns category name associated with IETF language tag if valid; error message else. | ||
All code combinations supported by {{lang}} and the {{lang- | All code combinations supported by {{lang}} and the {{lang-??}} templates are supported by this function. | ||
Module entry point from another module | Module entry point from another module. | ||
]] | ]] | ||
local function _category_from_tag ( | local function _category_from_tag (args_t) | ||
local subtags = {}; -- IETF subtags script, region, variant, and private | local subtags = {}; -- IETF subtags script, region, variant, and private | ||
local raw_code = | local raw_code = args_t[1]; -- save a copy of the input IETF subtag | ||
local link = | local link = cfg.keywords_t.affirmative == args_t.link; -- make a boolean | ||
local label = | local label = args_t.label; | ||
local code; -- the language code | local code; -- the language code | ||
local msg; -- gets an error message if IETF language tag is malformed or invalid | local msg; -- gets an error message if IETF language tag is malformed or invalid | ||
local category_name = ''; | local category_name = ''; | ||
code, subtags.script, subtags.region, subtags.variant, subtags.private, msg = get_ietf_parts (raw_code); | code, subtags.script, subtags.region, subtags.variant, subtags.private, msg = get_ietf_parts (raw_code); | ||
if msg then | if msg then | ||
local template = ( | local template = (args_t.template and table.concat ({'{{', args_t.template, '}}:'})) or ''; -- make template name (if provided by the template) | ||
return | return make_error_span (template, msg); | ||
end | end | ||
raw_code = format_ietf_tag (code, subtags.script, subtags.region, subtags.variant, subtags.private); -- format to recommended subtag styles; private omitted because private | raw_code = format_ietf_tag (code, subtags.script, subtags.region, subtags.variant, subtags.private); -- format to recommended subtag styles; private omitted because private | ||
category_name = language_name_get (raw_code, code); -- get language name; try | category_name = language_name_get (raw_code, code); -- get language name; try IETF tag first, then code w/o variant then code w/ variant | ||
category_name = make_category (code, category_name, nil, true):gsub ('[%[%]]', ''); | category_name = make_category (code, category_name, nil, true):gsub ('[%[%]]', ''); | ||
return category_name; | if link then | ||
return table.concat ({'[[:', category_name, ']]'}); | |||
else | |||
return category_name; | |||
end | |||
end | end | ||
| 第1,599行: | 第2,122行: | ||
--[[--------------------------< C A T E G O R Y _ F R O M _ T A G >-------------------------------------------- | --[[--------------------------< C A T E G O R Y _ F R O M _ T A G >-------------------------------------------- | ||
Module entry point from an {{#invoke:}} | Module entry point from an {{#invoke:}}. | ||
]] | ]] | ||
local function category_from_tag (frame) -- entry point from an {{#invoke:Lang|category_from_tag|< | local function category_from_tag (frame) -- entry point from an {{#invoke:Lang|category_from_tag|<IETF tag>|template=<template name>}} | ||
return _category_from_tag (getArgs (frame)); -- pass-on the args table, nothing else; getArgs() so we also get parent frame | return _category_from_tag (getArgs (frame)); -- pass-on the args table, nothing else; getArgs() so we also get parent frame | ||
end | end | ||
| 第1,612行: | 第2,135行: | ||
return { | return { | ||
category_from_tag = category_from_tag, | category_from_tag = category_from_tag, -- frame entry points when this module is #invoke:ed into templates/wikitext | ||
lang = lang, -- entry point for {{lang}} | lang = lang, -- entry point for {{lang}} | ||
langx = langx, -- entry point for {{langx}} | |||
lang_xx_inherit = lang_xx_inherit, -- entry points for {{lang-??}} | lang_xx_inherit = lang_xx_inherit, -- entry points for {{lang-??}} | ||
lang_xx_italic = lang_xx_italic, | lang_xx_italic = lang_xx_italic, | ||
is_ietf_tag = is_ietf_tag, | is_ietf_tag = is_ietf_tag, | ||
is_ietf_tag_frame = is_ietf_tag_frame, | |||
is_lang_name = is_lang_name, | is_lang_name = is_lang_name, | ||
tag_from_name = tag_from_name, -- returns | tag_from_name = tag_from_name, -- returns IETF tag associated with language name | ||
name_from_tag = name_from_tag, -- used for template documentation; possible use in ISO 639 name from code templates | name_from_tag = name_from_tag, -- used for template documentation; possible use in ISO 639 name from code templates | ||
transl = transl, -- entry point for {{ | transl = transl, -- entry point for {{transliteration}} | ||
_category_from_tag = _category_from_tag, -- entry points when this module is require()d into other modules | _category_from_tag = _category_from_tag, -- API entry points when this module is require()d into other modules | ||
_lang = _lang, | _lang = _lang, | ||
_langx = _langx, | |||
_lang_xx_inherit = _lang_xx_inherit, | _lang_xx_inherit = _lang_xx_inherit, | ||
_lang_xx_italic = _lang_xx_italic, | _lang_xx_italic = _lang_xx_italic, | ||
_is_ietf_tag = _is_ietf_tag, | _is_ietf_tag = _is_ietf_tag, | ||
get_ietf_parts = get_ietf_parts, | get_ietf_parts = get_ietf_parts, | ||
_tag_from_name = _tag_from_name, | _tag_from_name = _tag_from_name, | ||
_name_from_tag = _name_from_tag, | _name_from_tag = _name_from_tag, | ||
_transl = _transl, | _transl = _transl, | ||
_translation_make = translation_make, | |||
}; | }; | ||