Module:Plain text: Difference between revisions

From escforumwiki
Jump to navigation Jump to search
en>Galobtter
(copy from Module:Citation/CS1/COinS, see its history for attribution - strip italics and bold)
m (1 revision imported)
 
(32 intermediate revisions by 8 users not shown)
Line 1: Line 1:
--converts text with wikilinks to plain text, e.g "[[foo|gah]] is [[bar]]" to "gah is bar"
--converts text with wikilinks to plain text, e.g "[[foo|gah]] is [[bar]]" to "gah is bar"
--removes anything enclosed in tags and files
--removes anything enclosed in tags that isn't nested, mediawiki strip markers (references etc), files, italic and bold markup
require[[strict]]
local p = {}
local p = {}
--copied from Module:Citation/CS1/COinS


function p.strip_apostrophe_markup (argument)
function p.main(frame)
if argument:find ( "''", 1, true ) == nil then -- Is there at least one double apostrophe?  If not, exit.
local text = frame.args[1]
return argument
local encode = require('Module:yesno')(frame.args.encode)
end
return p._main(text, encode)
end


while true do
function p._main(text, encode)
if argument:find ( "'''''", 1, true ) then -- bold italic (5)
if not text then return end
argument=argument:gsub("%'%'%'%'%'", ""); -- remove all instances of it
text = mw.text.killMarkers(text)
elseif argument:find ( "''''", 1, true ) then -- italic start and end without content (4)
:gsub(' ', ' ') --replace nbsp spaces with regular spaces
argument=argument:gsub("%'%'%'%'", "");
:gsub('<br ?/?>', ', ') --replace br with commas
elseif argument:find ( "'''", 1, true ) then -- bold (3)
:gsub('<span.->(.-)</span>', '%1') --remove spans while keeping text inside
argument=argument:gsub("%'%'%'", "");
:gsub('<i.->(.-)</i>', '%1') --remove italics while keeping text inside
elseif argument:find ( "''", 1, true ) then -- italic (2)
:gsub('<b.->(.-)</b>', '%1') --remove bold while keeping text inside
argument=argument:gsub("%'%'", "");
:gsub('<em.->(.-)</em>', '%1') --remove emphasis while keeping text inside
else
:gsub('<strong.->(.-)</strong>', '%1') --remove strong while keeping text inside
break;
:gsub('<sub.->(.-)</sub>', '%1') --remove subscript markup; retain contents
end
:gsub('<sup.->(.-)</sup>', '%1') --remove superscript markup; retain contents
:gsub('<u.->(.-)</u>', '%1') --remove underline markup; retain contents
:gsub('<.->.-<.->', '') --strip out remaining tags and the text inside
:gsub('<.->', '') --remove any other tag markup
:gsub('%[%[%s*[Ff][Ii][Ll][Ee]%s*:.-%]%]', '') --strip out files
:gsub('%[%[%s*[Ii][Mm][Aa][Gg][Ee]%s*:.-%]%]', '') --strip out use of image:
:gsub('%[%[%s*[Cc][Aa][Tt][Ee][Gg][Oo][Rr][Yy]%s*:.-%]%]', '') --strip out categories
:gsub('%[%[[^%]]-|', '') --strip out piped link text
:gsub('([^%[])%[[^%[%]][^%]]-%s', '%1') --strip out external link text
:gsub('^%[[^%[%]][^%]]-%s', '') --strip out external link text
:gsub('[%[%]]', '') --then strip out remaining [ and ]
:gsub("'''''", "") --strip out bold italic markup
:gsub("'''?", "") --not stripping out '''' gives correct output for bolded text in quotes
:gsub('----+', '') --remove ---- lines
:gsub("^%s+", "") --strip leading
:gsub("%s+$", "") --and trailing spaces
:gsub("%s+", " ") --strip redundant spaces
if encode then
return mw.text.encode(text)
else
return text
end
end
return argument; -- done
end
function p.main(frame)
text = frame.args[1]
text = mw.ustring.gsub (text, '<.->.-<.->', '') --strip out flags, plus any other tags, e.g footnotes
text = mw.ustring.gsub (text, '%[%[File:.-%]%]', '') --strip out files
text = mw.ustring.gsub (text, '%[%[.-|', '') --strip out piped link text
text = mw.ustring.gsub (text, '%[', '') --then strip out remaining [ and ]
text = mw.ustring.gsub (text, '%]', '')
strip_apostrophe_markup(text)
return text
end
end


return p
return p

Latest revision as of 21:06, 16 April 2024

Documentation for this module may be created at Module:Plain text/doc

--converts text with wikilinks to plain text, e.g "[[foo|gah]] is [[bar]]" to "gah is bar"
--removes anything enclosed in tags that isn't nested, mediawiki strip markers (references etc), files, italic and bold markup
require[[strict]]
local p = {}

function p.main(frame)
	local text = frame.args[1]
	local encode = require('Module:yesno')(frame.args.encode)
	return p._main(text, encode)
end

function p._main(text, encode)
	if not text then return end
	text = mw.text.killMarkers(text)
		:gsub('&nbsp;', ' ') --replace nbsp spaces with regular spaces
		:gsub('<br ?/?>', ', ') --replace br with commas
		:gsub('<span.->(.-)</span>', '%1') --remove spans while keeping text inside
		:gsub('<i.->(.-)</i>', '%1') --remove italics while keeping text inside
		:gsub('<b.->(.-)</b>', '%1') --remove bold while keeping text inside
		:gsub('<em.->(.-)</em>', '%1') --remove emphasis while keeping text inside
		:gsub('<strong.->(.-)</strong>', '%1') --remove strong while keeping text inside
		:gsub('<sub.->(.-)</sub>', '%1') --remove subscript markup; retain contents
		:gsub('<sup.->(.-)</sup>', '%1') --remove superscript markup; retain contents
		:gsub('<u.->(.-)</u>', '%1') --remove underline markup; retain contents
		:gsub('<.->.-<.->', '') --strip out remaining tags and the text inside
		:gsub('<.->', '') --remove any other tag markup
		:gsub('%[%[%s*[Ff][Ii][Ll][Ee]%s*:.-%]%]', '') --strip out files
		:gsub('%[%[%s*[Ii][Mm][Aa][Gg][Ee]%s*:.-%]%]', '') --strip out use of image:
		:gsub('%[%[%s*[Cc][Aa][Tt][Ee][Gg][Oo][Rr][Yy]%s*:.-%]%]', '') --strip out categories
		:gsub('%[%[[^%]]-|', '') --strip out piped link text
		:gsub('([^%[])%[[^%[%]][^%]]-%s', '%1') --strip out external link text
		:gsub('^%[[^%[%]][^%]]-%s', '') --strip out external link text
		:gsub('[%[%]]', '') --then strip out remaining [ and ]
		:gsub("'''''", "") --strip out bold italic markup
		:gsub("'''?", "") --not stripping out '''' gives correct output for bolded text in quotes
		:gsub('----+', '') --remove ---- lines
		:gsub("^%s+", "") --strip leading
		:gsub("%s+$", "") --and trailing spaces
		:gsub("%s+", " ") --strip redundant spaces
	if encode then
		return mw.text.encode(text)
	else
		return text
	end
end

return p