Module:Template input parse

Revision as of 01:19, 24 September 2024 by Ganaram inukshuk (talk | contribs) (Added fuzzy option for parsing a string of ratios (entries that are a single value are interpreted as a ratio with denominator 1); changed parse-numeric-pairs functions to have options to change both delimiters (between entries and within entries))
Module documentation[view] [edit] [history] [purge]
Todo: add documentation

local p = {}

-- Helper module for various modules that require entry of multiple labels/values

-- TODO:
-- Functions that return size-0 arrays should return nil instead.

-- Helper function
-- Parses entries from a delimited string and returns them in an array
-- Default delimiter is semicolon (;)
function p.parse_entries(unparsed, delimiter)
	local parsed = {}
	local delimiter = delimiter or ';'
	local expr = '([^' .. delimiter .. ']+)'
	for entry in string.gmatch(unparsed, expr) do
		local trimmed = entry:gsub("^%s*(.-)%s*$", "%1")
		table.insert(parsed, trimmed)		-- Add to array
	end
	return parsed
end

-- Helper function
-- Parses entries from a delimited string and returns them in an array
-- Values entered are convereted into numbers rather than strings.
-- Default delimiter is semicolon (;)
function p.parse_numeric_entries(unparsed, delimiter)
	local parsed = {}
	local delimiter = delimiter or ';'
	local expr = '([^' .. delimiter .. ']+)'
	for entry in string.gmatch(unparsed, expr) do
		local trimmed = entry:gsub("^%s*(.-)%s*$", "%1")
		local numeric = tonumber(trimmed)
		table.insert(parsed, numeric)		-- Add to array
	end
	return parsed
end

-- Helper function
-- Parses pairs of values separated by a delimiter; default is colon (:)
function p.parse_pair(unparsed, delimiter)
	local parsed = {}
	local delimiter = delimiter or ':'
	local expr = '([^' .. delimiter .. ']+)'
	for entry in string.gmatch(unparsed, expr) do
		local trimmed = entry:gsub("^%s*(.-)%s*$", "%1")
		table.insert(parsed, trimmed)		-- Add to array
	end
	if #parsed == 2 then
		return parsed
	else
		return nil
	end
end

-- Helper function
-- Parses a pair of numeric values
function p.parse_numeric_pair(unparsed, delimiter)
	local parsed = {}
	local delimiter = delimiter or ':'
	local expr = '([^' .. delimiter .. ']+)'
	for entry in string.gmatch(unparsed, expr) do
		local trimmed = entry:gsub("^%s*(.-)%s*$", "%1")
		local numeric = tonumber(trimmed)
		table.insert(parsed, numeric)		-- Add to array
	end
	if #parsed == 2 then
		return parsed
	else
		return nil
	end
end

-- Helper function
-- Parses a list of numeric pairs
-- Delimiter between each entry can be anything; default is semicolon; this
-- allows for entry of subgroup entries
-- Delimiter between the pair's two values can be anything; default is slash
-- as the intended use is parsing ratios a/b, so input must be formatted as such
-- "a/b; c/d; e/f"
function p.parse_numeric_pairs(unparsed, delimiter1, delimiter2)
	local delimiter1 = delimiter1 or ";"
	local delimiter2 = delimiter2 or "/"
	-- Split the string of unparsed pairs
	local parsed = p.parse_entries(unparsed, delimiter1)
	-- Then tokenize the tokens into numeric pairs
	local pairs_ = {}
	for i = 1, #parsed do
		local pair = p.parse_numeric_pair(parsed[i], delimiter2)
		if pair ~= nil and #pair == 2 then
			table.insert(pairs_, pair)
		end
	end
	return pairs_
end

-- Helper function
-- A less strict version of parse-numeric-pairs that parses singular values
-- as a ratio with denominator 1.
function p.parse_numeric_pair_fuzzy(unparsed, delimiter)
	local parsed = {}
	local delimiter = delimiter or ':'
	local expr = '([^' .. delimiter .. ']+)'
	for entry in string.gmatch(unparsed, expr) do
		local trimmed = entry:gsub("^%s*(.-)%s*$", "%1")
		local numeric = tonumber(trimmed)
		table.insert(parsed, numeric)		-- Add to array
	end
	if #parsed == 2 then
		return parsed
	elseif #parsed == 1 then
		return { parsed[1], 1 }
	else
		return nil
	end
end

-- Helper function
-- Parses a list of numeric pairs, where if values are not ratios, they're
-- interpreted as ratios with denominator 1.
function p.parse_numeric_pairs_fuzzy(unparsed, delimiter1, delimiter2)
	local delimiter1 = delimiter1 or ";"
	local delimiter2 = delimiter2 or "/"
	-- Split the string of unparsed pairs
	local parsed = p.parse_entries(unparsed, delimiter1)
	-- Then tokenize the tokens into numeric pairs
	local pairs_ = {}
	for i = 1, #parsed do
		local pair = p.parse_numeric_pair_fuzzy(parsed[i], delimiter2)
		if pair ~= nil and #pair == 2 then
			table.insert(pairs_, pair)
		end
	end
	return pairs_
end

-- Helper function
-- Parses key-value pairs separated by a semicolon
-- Pairs themselves are separated using a colon
function p.parse_kv_pairs(unparsed)
	-- Split the string of unparsed pairs
	local parsed = p.parse_entries(unparsed)
	-- Then tokenize the tokens into key-value pairs
	local pairs_ = {}
	--local num_pairs = 0
	for i = 1, #parsed do
		local pair = p.parse_pair(parsed[i])
		if pair ~= nil and #pair == 2 then
			pairs_[pair[1]] = pair[2]
			--num_pairs = num_pairs + 1
		end
	end
	return pairs_
end

function p.tester()
	
	return p.parse_numeric_pairs_fuzzy("2.5.7/6.11/6", ".", "/")	
end

return p