Toggle menu
Toggle preferences menu
Toggle personal menu
Not logged in
Your IP address will be publicly visible if you make any edits.

Module:SummarySnippet: Difference between revisions

From The Fortune Bringers
No edit summary
No edit summary
 
(17 intermediate revisions by the same user not shown)
Line 1: Line 1:
local p = {}
local p = {}


-- Trims whitespace from a string
-- Trim leading/trailing whitespace
local function trim(s)
local function trim(s)
return s:match("^%s*(.-)%s*$")
return s:match("^%s*(.-)%s*$")
Line 14: Line 14:
end
end


-- Parse input: extract page name from link-style input if needed
-- Parse link-style input
local raw = mw.ustring.match(page, "%[%[(.-)%]%]") or page
local raw = mw.ustring.match(page, "%[%[(.-)%]%]") or page
local pageText = mw.text.split(raw, "|")[1]
local pageText = mw.text.split(raw, "|")[1]


local content = mw.title.new(pageText)
local title = mw.title.new(pageText)
if not content or not content.exists then
if not title or not title.exists then
return "Page not found: " .. pageText
return "Page not found: " .. pageText
end
end


local text = content:getContent()
-- Use MediaWiki parser to preprocess and expand the page content
if not text then
local expanded = frame:preprocess('{{:' .. pageText .. '}}')
if not expanded then
return "No content."
return "No content."
end
end
 
-- Strip templates and most formatting (basic)
-- Attempt to skip content before the first section (e.g., infobox/template blob)
text = mw.text.killMarkers(text)
local body = mw.ustring.match(expanded, "==.*") or expanded
text = mw.ustring.gsub(text, '{{.-}}', '') -- remove templates
 
text = mw.ustring.gsub(text, '%[%[.-%|', '') -- remove link alt text
-- Clean up formatting
text = mw.ustring.gsub(text, '%[%[', '') -- remove opening brackets
body = mw.text.killMarkers(body)
text = mw.ustring.gsub(text, '%]%]', '') -- remove closing brackets
body = mw.ustring.gsub(body, '%[%[(.-)%|(.-)%]%]', '%2') -- [[Page|Label]] → Label
text = mw.ustring.gsub(text, "''+", "") -- remove italics/bold
body = mw.ustring.gsub(body, '%[%[', '')                 -- [[Page]] → Page
text = mw.ustring.gsub(text, "=+%s*(.-)%s*=+", "") -- remove headers
body = mw.ustring.gsub(body, '%]%]', '')
body = mw.ustring.gsub(body, "''+", "")                 -- remove bold/italics
-- Collapse whitespace
body = mw.ustring.gsub(body, "=+%s*(.-)%s*=+", "")       -- remove section headers
text = text:gsub("\n", " ")
body = mw.ustring.gsub(body, "{{.-}}", "")              -- remove remaining inline templates
text = text:gsub("%s+", " ")
 
text = trim(text)
-- Normalize whitespace
body = body:gsub("\n", " ")
-- Handle empty content after cleanup
body = body:gsub("%s+", " ")
if text == "" then
body = trim(body)
 
if body == "" then
return "No description available."
return "No description available."
end
end


-- Tag on a snippet-text class otherwise size gets overwritten and tack on a final read more
local truncated = mw.ustring.sub(body, 1, length)
local link = string.format(" [[:%s|Read more]]", pageText)
if #body > length then
return string.format('<span class="snippet-text">%s... %s</span>', mw.text.nowiki(truncatedText), link)
truncated = truncated .. "..."
end


return truncated
end
end


return p
return p

Latest revision as of 17:02, 30 May 2025

Documentation for this module may be created at Module:SummarySnippet/doc

local p = {}

-- Trim leading/trailing whitespace
local function trim(s)
	return s:match("^%s*(.-)%s*$")
end

function p.fromPage(frame)
	local page = frame.args[1]
	local length = tonumber(frame.args[2]) or 150

	if not page or page == '' then
		return "No page name provided."
	end

	-- Parse link-style input
	local raw = mw.ustring.match(page, "%[%[(.-)%]%]") or page
	local pageText = mw.text.split(raw, "|")[1]

	local title = mw.title.new(pageText)
	if not title or not title.exists then
		return "Page not found: " .. pageText
	end

	-- Use MediaWiki parser to preprocess and expand the page content
	local expanded = frame:preprocess('{{:' .. pageText .. '}}')
	if not expanded then
		return "No content."
	end

	-- Attempt to skip content before the first section (e.g., infobox/template blob)
	local body = mw.ustring.match(expanded, "==.*") or expanded

	-- Clean up formatting
	body = mw.text.killMarkers(body)
	body = mw.ustring.gsub(body, '%[%[(.-)%|(.-)%]%]', '%2') -- [[Page|Label]] → Label
	body = mw.ustring.gsub(body, '%[%[', '')                 -- [[Page]] → Page
	body = mw.ustring.gsub(body, '%]%]', '')
	body = mw.ustring.gsub(body, "''+", "")                  -- remove bold/italics
	body = mw.ustring.gsub(body, "=+%s*(.-)%s*=+", "")       -- remove section headers
	body = mw.ustring.gsub(body, "{{.-}}", "")               -- remove remaining inline templates

	-- Normalize whitespace
	body = body:gsub("\n", " ")
	body = body:gsub("%s+", " ")
	body = trim(body)

	if body == "" then
		return "No description available."
	end

	local truncated = mw.ustring.sub(body, 1, length)
	if #body > length then
		truncated = truncated .. "..."
	end

	return truncated
end

return p