Module:Plain text: Difference between revisions
Content deleted Content added
Johnrdorazio (talk | contribs) m 1 revision imported |
implement "encode" option, strip out external link alt text |
||
Line 5: | Line 5: | ||
function p.main(frame) |
function p.main(frame) |
||
local text = frame.args[1] |
local text = frame.args[1] |
||
local encode = require('Module:yesno')(frame.args.encode) |
|||
return p._main(text) |
return p._main(text, encode) |
||
end |
end |
||
function p._main(text) |
function p._main(text, encode) |
||
if not text then return end |
if not text then return end |
||
text = mw.text.killMarkers(text) |
text = mw.text.killMarkers(text) |
||
Line 21: | Line 22: | ||
:gsub('%[%[%s*[Cc]ategory%s*:.-%]%]', '') --strip out categories |
:gsub('%[%[%s*[Cc]ategory%s*:.-%]%]', '') --strip out categories |
||
:gsub('%[%[[^%]]-|', '') --strip out piped link text |
:gsub('%[%[[^%]]-|', '') --strip out piped link text |
||
:gsub('([^%[])%[[^%[%]][^%]]-%s', '%1') --strip out external link text |
|||
:gsub('^%[[^%[%]][^%]]-%s', '') --strip out external link text |
|||
:gsub('[%[%]]', '') --then strip out remaining [ and ] |
:gsub('[%[%]]', '') --then strip out remaining [ and ] |
||
:gsub("'''''", "") --strip out bold italic markup |
:gsub("'''''", "") --strip out bold italic markup |
||
Line 28: | Line 31: | ||
:gsub("%s+$", "") --and trailing spaces |
:gsub("%s+$", "") --and trailing spaces |
||
:gsub("%s+", " ") --strip redundant spaces |
:gsub("%s+", " ") --strip redundant spaces |
||
if encode then |
|||
⚫ | |||
return mw.text.encode(text) |
|||
else |
|||
⚫ | |||
end |
|||
end |
end |
||
Revision as of 14:19, September 2, 2021
Documentation for this module may be created at Module:Plain text/doc
--converts text with wikilinks to plain text, e.g "[[foo|gah]] is [[bar]]" to "gah is bar"
--removes anything enclosed in tags that isn't nested, mediawiki strip markers (references etc), files, italic and bold markup
local p = {}
function p.main(frame)
local text = frame.args[1]
local encode = require('Module:yesno')(frame.args.encode)
return p._main(text, encode)
end
function p._main(text, encode)
if not text then return end
text = mw.text.killMarkers(text)
:gsub(' ', ' ') --replace nbsp spaces with regular spaces
:gsub('<br ?/?>', ', ') --replace br with commas
:gsub('<span.->(.-)</span>', '%1') --remove spans while keeping text inside
:gsub('<i.->(.-)</i>', '%1') --remove italics while keeping text inside
:gsub('<.->.-<.->', '') --strip out remaining tags and the text inside
:gsub('<.->', '') --remove any other tag markup
:gsub('%[%[%s*[Ff]ile%s*:.-%]%]', '') --strip out files
:gsub('%[%[%s*[Ii]mage%s*:.-%]%]', '') --strip out use of image:
:gsub('%[%[%s*[Cc]ategory%s*:.-%]%]', '') --strip out categories
:gsub('%[%[[^%]]-|', '') --strip out piped link text
:gsub('([^%[])%[[^%[%]][^%]]-%s', '%1') --strip out external link text
:gsub('^%[[^%[%]][^%]]-%s', '') --strip out external link text
:gsub('[%[%]]', '') --then strip out remaining [ and ]
:gsub("'''''", "") --strip out bold italic markup
:gsub("'''?", "") --not stripping out '''' gives correct output for bolded text in quotes
:gsub('----', '') --remove ---- lines
:gsub("^%s+", "") --strip leading
:gsub("%s+$", "") --and trailing spaces
:gsub("%s+", " ") --strip redundant spaces
if encode then
return mw.text.encode(text)
else
return text
end
end
return p