Module:InfoboxExtractor

From JoJo's Bizarre Encyclopedia - JoJo Wiki
Jump to navigation Jump to search

Documentation for this module may be created at Module:InfoboxExtractor/doc

local p = {}

local ExtractSection = require("Module:ExtractSection")

local function extractInfobox(wikitext)
    local startInfobox = string.find(wikitext, "{{[^}]*Infobox")
    if not startInfobox then
        return nil
    end

    local braceCount = 0
    local endInfobox = startInfobox

    for i = startInfobox, #wikitext do
        local char = wikitext:sub(i, i)
        if char == '{' then
            braceCount = braceCount + 1
        elseif char == '}' then
            braceCount = braceCount - 1
        end

        if braceCount == 0 then
            endInfobox = i
            break
        end
    end

    return wikitext:sub(startInfobox, endInfobox)
end

local function getLabelValue(infobox, label)
    local pattern = "|" .. label .. " *= *"
    local matchStart, matchEnd = string.find(infobox, pattern)
    if not matchStart then
        return nil
    end

    local value = ""
    local braceCount = 0
    local i = matchEnd + 1
    local isNewLine = false

-- need to do - 2 so it ignores the }} at the end of the infobox
    while i <= #infobox - 2 do
        local char = infobox:sub(i, i)

        if char == '{' then
            braceCount = braceCount + 1
        elseif char == '}' then
            braceCount = braceCount - 1
        end

        if braceCount == 0 and char == '\n' then
            isNewLine = true
        elseif isNewLine and char == '|' then
            break
        else
            isNewLine = false
            value = value .. char
        end

        i = i + 1
    end

    return value
end

local function getImages(value)
    local images = {}
    local pattern = "%[%[File:([^|%]]+)"
    for image in string.gmatch(value, pattern) do
        table.insert(images, image)
    end
    return images
end

function p.extract(frame)
	local preprocess = frame.args.template == "true"
    local pageTitle = frame.args[1]
    if preprocess then
        pageTitle = frame:preprocess(pageTitle)
    end
    if not pageTitle then
        return "<strong class=\"error\">Error: Please provide a page title.</strong>"
    end

    local page = mw.title.new(pageTitle)
    if not page or not page.exists then
        return "<strong class=\"error\">Error: Page not found.</strong>"
    end

    local wikitext = page:getContent()
    local infobox = extractInfobox(wikitext)

    if not infobox then
        return "<strong class=\"error\">Error: Infobox not found.</strong>"
    end

    local label = frame.args[2]
    if not label then
        return "<strong class=\"error\">Error: Please provide a label.</strong>"
    end

    local value = getLabelValue(infobox, label)
    if not value then
        return "<strong class=\"error\">Error: Label not found in infobox.</strong>"
    end
    local tab = frame.args.tab or ""
    if tab ~= "" then
        local tabValue = ExtractSection.extractTab(value, frame.args.tab)
        if tabValue then
            value = tabValue
        end
    end

    if not value and frame.args.tab then
        return "<strong class=\"error\">Error: Tab not found in infobox.</strong>"
    end

    if label:lower() == "image" then
        local images = getImages(value)
        local imageIndex = tonumber(frame.args.imageIndex) or 1
        local size = frame.args.size or ""
        local link = frame.args.link or ""

        if imageIndex < 1 or imageIndex > #images then
            return "Error: Invalid image index."
        end

        local selectedImage = images[imageIndex]
        if link ~= "" then
        	return string.format('[[File:%s|%s|link=%s]]', selectedImage, size, link)
        else
        	return string.format('[[File:%s|%s]]', selectedImage, size)
        end
    else
        local processedValue = frame:preprocess(value)
        return processedValue
    end
end

return p