Module:Plain text
--converts text with wikilinks to plain text, e.g "gah is bar" to "gah is bar" --removes anything enclosed in tags that isn't nested, mediawiki strip markers (references etc), files, italic and bold markup requirestrict local p = {}
function p.main(frame) local text = frame.args[1] local encode = require('Module:yesno')(frame.args.encode) return p._main(text, encode) end
function p._main(text, encode)
if not text then return end
text = mw.text.killMarkers(text)
:gsub(' ', ' ') --replace nbsp spaces with regular spaces
:gsub('
', ', ') --replace br with commas
:gsub('<span.->(.-)', '%1') --remove spans while keeping text inside
:gsub('<i.->(.-)', '%1') --remove italics while keeping text inside
:gsub('<b.->(.-)', '%1') --remove bold while keeping text inside
:gsub('<em.->(.-)', '%1') --remove emphasis while keeping text inside
:gsub('<strong.->(.-)', '%1') --remove strong while keeping text inside
:gsub('<sub.->(.-)', '%1') --remove subscript markup; retain contents
:gsub('<sup.->(.-)', '%1') --remove superscript markup; retain contents
:gsub('<u.->(.-)', '%1') --remove underline markup; retain contents
:gsub('<.->.-<.->', ) --strip out remaining tags and the text inside
:gsub('<.->', ) --remove any other tag markup
:gsub('%[%[%s*[Ff][Ii][Ll][Ee]%s*:.-%]%]', ) --strip out files
:gsub('%[%[%s*[Ii][Mm][Aa][Gg][Ee]%s*:.-%]%]', ) --strip out use of image:
:gsub('%[%[%s*[Cc][Aa][Tt][Ee][Gg][Oo][Rr][Yy]%s*:.-%]%]', ) --strip out categories
:gsub('%[%^%-|', ) --strip out piped link text
:gsub('([^%[])%[[^%[%]][^%]]-%s', '%1') --strip out external link text
:gsub('^%[[^%[%]][^%]]-%s', ) --strip out external link text
:gsub('[%[%]]', ) --then strip out remaining [ and ]
:gsub("", "") --strip out bold italic markup
:gsub("?", "") --not stripping out ' gives correct output for bolded text in quotes
:gsub('%-%-%-%-+', ) --remove ---- lines
:gsub("^%s+", "") --strip leading
:gsub("%s+$", "") --and trailing spaces
:gsub("%s+", " ") --strip redundant spaces
if encode then
return mw.text.encode(text)
else
return text
end
end
return p