Module:String2: Difference between revisions
Content deleted Content added
Johnrdorazio (talk | contribs) m 1 revision imported |
Copy changes by User:Tholme from Module:String2/sandbox per edit request. |
||
Line 26: | Line 26: | ||
-- this is a piped wikilink, so we capitalise the text, not the pipe |
-- this is a piped wikilink, so we capitalise the text, not the pipe |
||
local _ |
local _ |
||
_, letterpos = mw.ustring.find(s, "|%A*%a") -- find the first letter after the pipe |
_, letterpos = mw.ustring.find(s, "|%W*%w") -- find the first letter after the pipe |
||
else |
else |
||
letterpos = mw.ustring.find(s, '%a') |
letterpos = mw.ustring.find(s, '%w') |
||
end |
end |
||
if letterpos then |
if letterpos then |
||
Line 94: | Line 94: | ||
local str = mw.text.trim(frame.args[1] or "") |
local str = mw.text.trim(frame.args[1] or "") |
||
return mw.text.nowiki(str) |
return mw.text.nowiki(str) |
||
⚫ | |||
-- posnq (position, no quotes) returns the numerical start position of the first occurrence |
|||
-- of one piece of text ("match") inside another ("str"). |
|||
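-- If no match is found, the position falls back to the "nomatch" parameter (fourth unnamed parameter, an empty string by default); nil is returned only if either of the first two parameters is blank. |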
|||
-- It takes the text to be searched in as the first unnamed parameter, which is trimmed. |
|||
-- It takes the text to match as the second unnamed parameter, which is trimmed and |
|||
-- any double quotes " are stripped out. |
|||
p.posnq = function(frame) |
|||
local args = frame.args |
|||
local pargs = frame:getParent().args |
|||
for k, v in pairs(pargs) do |
|||
args[k] = v |
|||
end |
|||
local str = mw.text.trim(args[1] or args.source or "") |
|||
local match = mw.text.trim(args[2] or args.target or ""):gsub('"', '') |
|||
if str == "" or match == "" then return nil end |
|||
local plain = mw.text.trim(args[3] or args.plain or "") |
|||
if plain == "false" then plain = false else plain = true end |
|||
local nomatch = mw.text.trim(args[4] or args.nomatch or "") |
|||
-- just take the start position |
|||
local pos = mw.ustring.find(str, match, 1, plain) or nomatch |
|||
⚫ | |||
end |
end |
||
Line 189: | Line 166: | ||
if plain:sub(1, 1) == "f" then plain = false else plain = true end |
if plain:sub(1, 1) == "f" then plain = false else plain = true end |
||
-- get the page content and look for 'text' - return position or nomatch |
-- get the page content and look for 'text' - return position or nomatch |
||
local content = titleobj:getContent() |
local content = titleobj and titleobj:getContent() |
||
return mw.ustring.find(content, text, 1, plain) or nomatch |
return content and mw.ustring.find(content, text, 1, plain) or nomatch |
||
end |
end |
||
p.findpagetext = function(frame) |
p.findpagetext = function(frame) |
||
Line 228: | Line 205: | ||
-- Escape Pattern helper function so that all characters are treated as plain text, as per Module:String |
-- Escape Pattern helper function so that all characters are treated as plain text, as per Module:String |
||
function p._escapePattern( pattern_str) |
function p._escapePattern( pattern_str) |
||
return mw.ustring.gsub( pattern_str, "([%(%)%.%%%+%-%*%?%[%^%$%]])", "%%%1" ) |
return mw.ustring.gsub( pattern_str, "([%(%)%.%%%+%-%*%?%[%^%$%]])", "%%%1" ) |
||
end |
end |
||
Line 251: | Line 228: | ||
function p.strip( frame ) |
function p.strip( frame ) |
||
local new_args = p._getParameters( frame.args, {'source', 'chars', 'plain'} ) |
local new_args = p._getParameters( frame.args, {'source', 'chars', 'plain'} ) |
||
local source_str = new_args['source'] or '' |
local source_str = new_args['source'] or '' |
||
local chars = new_args['chars'] or '' or 'characters' |
local chars = new_args['chars'] or '' or 'characters' |
||
source_str = mw.text.trim(source_str) |
source_str = mw.text.trim(source_str) |
||
if source_str == '' or chars == '' then |
if source_str == '' or chars == '' then |
||
return source_str |
return source_str |
||
end |
end |
||
local l_plain = p._getBoolean( new_args['plain'] or true ) |
local l_plain = p._getBoolean( new_args['plain'] or true ) |
||
if l_plain then |
if l_plain then |
||
chars = p._escapePattern( chars ) |
chars = p._escapePattern( chars ) |
||
end |
end |
||
local result |
local result |
||
result = mw.ustring.gsub(source_str, "["..chars.."]", '') |
result = mw.ustring.gsub(source_str, "["..chars.."]", '') |
||
return result |
return result |
||
end |
end |
||
Line 308: | Line 285: | ||
]] |
]] |
||
function p.hyphen_to_dash( str ) |
function p.hyphen_to_dash( str, spacing ) |
||
if (str == nil or str == '') then |
if (str == nil or str == '') then |
||
return str |
return str |
||
end |
end |
||
local accept |
local accept |
||
str = mw.text.decode(str, true ) -- replace html entities with their characters; semicolon mucks up the text.split |
str = mw.text.decode(str, true ) -- replace html entities with their characters; semicolon mucks up the text.split |
||
local out = {} |
local out = {} |
||
local list = mw.text.split (str, '%s*[,;]%s*') |
local list = mw.text.split (str, '%s*[,;]%s*') -- split str at comma or semicolon separators if there are any |
||
for _, item in ipairs (list) do -- for each item in the list |
for _, item in ipairs (list) do -- for each item in the list |
||
item = mw.text.trim(item) -- trim whitespace |
item = mw.text.trim(item) -- trim whitespace |
||
item, accept = item:gsub ('^%(%((.+)%)%)$', '%1') |
item, accept = item:gsub ('^%(%((.+)%)%)$', '%1') |
||
if accept == 0 and mw.ustring.match (item, '^%w*[%.%-]?%w+%s*[%-–—]%s*%w*[%.%-]?%w+$') then -- if a hyphenated range or has endash or emdash separators |
if accept == 0 and mw.ustring.match (item, '^%w*[%.%-]?%w+%s*[%-–—]%s*%w*[%.%-]?%w+$') then -- if a hyphenated range or has endash or emdash separators |
||
if item:match ('^%a+[%.%-]?%d+%s*%-%s*%a+[%.%-]?%d+$') or -- letterdigit hyphen letterdigit (optional separator between letter and digit) |
if item:match ('^%a+[%.%-]?%d+%s*%-%s*%a+[%.%-]?%d+$') or -- letterdigit hyphen letterdigit (optional separator between letter and digit) |
||
Line 329: | Line 306: | ||
item:match ('^%d+%s*%-%s*%d+$') or -- digit hyphen digit |
item:match ('^%d+%s*%-%s*%d+$') or -- digit hyphen digit |
||
item:match ('^%a+%s*%-%s*%a+$') then -- letter hyphen letter |
item:match ('^%a+%s*%-%s*%a+$') then -- letter hyphen letter |
||
item = item:gsub ('(%w*[%.%-]?%w+)%s*%-%s*(%w*[%.%-]?%w+)', '%1–%2') |
item = item:gsub ('(%w*[%.%-]?%w+)%s*%-%s*(%w*[%.%-]?%w+)', '%1–%2') -- replace hyphen, remove extraneous space characters |
||
else |
else |
||
item = mw.ustring.gsub (item, '%s*[–—]%s*', '–') |
item = mw.ustring.gsub (item, '%s*[–—]%s*', '–') -- for endash or emdash separated ranges, replace em with en, remove extraneous whitespace |
||
end |
end |
||
end |
end |
||
table.insert (out, item) |
table.insert (out, item) -- add the (possibly modified) item to the output table |
||
end |
end |
||
local temp_str = table.concat (out, ', ') |
local temp_str = table.concat (out, ',' .. spacing) -- concatenate the output table into a comma separated string |
||
temp_str, accept = temp_str:gsub ('^%(%((.+)%)%)$', '%1') |
temp_str, accept = temp_str:gsub ('^%(%((.+)%)%)$', '%1') -- remove accept-this-as-written markup when it wraps all of concatenated out |
||
if accept ~= 0 then |
if accept ~= 0 then |
||
temp_str = str:gsub ('^%(%((.+)%)%)$', '%1') |
temp_str = str:gsub ('^%(%((.+)%)%)$', '%1') -- when global markup removed, return original str; do it this way to suppress boolean second return value |
||
return temp_str; |
|||
else |
|||
return temp_str; -- else, return assembled temp_str |
|||
end |
end |
||
⚫ | |||
end |
end |
||
function p.hyphen2dash( frame ) |
function p.hyphen2dash( frame ) |
||
local str = frame.args[1] or '' |
local str = frame.args[1] or '' |
||
local spacing = frame.args[2] or ' ' -- space is part of the standard separator for normal spacing (but in conjunction with templates r/rp/ran we may need a narrower spacing) |
|||
⚫ | |||
⚫ | |||
⚫ | |||
-- Similar to [[Module:String#endswith]] |
|||
function p.startswith(frame) |
|||
return (frame.args[1]:sub(1, frame.args[2]:len()) == frame.args[2]) and 'yes' or '' |
|||
end |
end |
||