tinytoml/tinytoml.lua
FourierTransformer 876a176023 first commit
2024-10-31 10:19:27 -05:00

1130 lines
34 KiB
Lua

local tinytoml = {}
tinytoml._VERSION = "tinytoml 0.0.0"
tinytoml._DESCRIPTION = "a single-file pure Lua TOML parser"
tinytoml._URL = "https://github.com/FourierTransformer/tinytoml"
tinytoml._LICENSE = "MIT"
local sbyte = string.byte
local chars = {
SINGLE_QUOTE = sbyte("'"),
DOUBLE_QUOTE = sbyte('"'),
OPEN_BRACKET = sbyte("["),
CLOSE_BRACKET = sbyte("]"),
BACKSLASH = sbyte("\\"),
COMMA = sbyte(","),
POUND = sbyte("#"),
DOT = sbyte("."),
CR = sbyte("\r"),
LF = sbyte("\n"),
}
local function _error(sm, message, anchor)
local error_message = { "in ", sm.filename, " line ", sm.line_number, ": ", message }
if anchor ~= nil then
error_message[#error_message + 1] = "\n\n\t See https://toml.io/en/v1.0.0#"
error_message[#error_message + 1] = anchor
error_message[#error_message + 1] = " for more details\n"
end
error(table.concat(error_message))
end
local function _nsmerror(message, input, byte, anchor)
local error_message = { "on byte ", byte, ": ", message, "\nnear: ", string.sub(input, byte - 25, byte + 25) }
if anchor ~= nil then
error_message[#error_message + 1] = "\n\n\t See https://toml.io/en/v1.0.0#"
error_message[#error_message + 1] = anchor
error_message[#error_message + 1] = " for more details\n"
end
error(table.concat(error_message))
end
local _unpack = unpack or table.unpack
local utf8char
if (tonumber((_VERSION or ''):match('[%d.]*$')) or 0) < 5.3 then
utf8char = function(cp)
if cp < 128 then
return string.char(cp)
end
local suffix = cp % 64
local c4 = 128 + suffix
cp = (cp - suffix) / 64
if cp < 32 then
return string.char(192 + (cp), (c4))
end
suffix = cp % 64
local c3 = 128 + suffix
cp = (cp - suffix) / 64
if cp < 16 then
return string.char(224 + (cp), c3, c4)
end
suffix = cp % 64
cp = (cp - suffix) / 64
return string.char(240 + (cp), 128 + (suffix), c3, c4)
end
else
utf8char = utf8.char
end
local function validate_utf8(input, toml_sub)
local i, len = 1, #input
local byte, second, third, fourth = 0, 129, 129, 129
toml_sub = toml_sub or false
while i <= len do
byte = sbyte(input, i)
if byte <= 127 then
if toml_sub then
if byte < 9 then _nsmerror("TOML only allows some control characters, but they must be escaped in double quoted strings", input, i, "string")
elseif byte == chars.CR and sbyte(input, i + 1) ~= chars.LF then _nsmerror("TOML requires all \\r be followed by \\n", input, i, "spec")
elseif byte >= 11 and byte <= 31 and byte ~= 13 then _nsmerror("TOML only allows some control characters, but they must be escaped in double quoted strings", input, i, "string")
elseif byte == 127 then _nsmerror("TOML only allows some control characters, but they must be escaped in double quoted strings", input, i, "string") end
end
i = i + 1
elseif byte >= 194 and byte <= 223 then
second = sbyte(input, i + 1)
i = i + 2
elseif byte == 224 then
second = sbyte(input, i + 1); third = sbyte(input, i + 2)
if second ~= nil and second >= 128 and second <= 159 then return false, i end
i = i + 3
elseif byte == 237 then
second = sbyte(input, i + 1); third = sbyte(input, i + 2)
if second ~= nil and second >= 160 and second <= 191 then return false, i end
i = i + 3
elseif (byte >= 225 and byte <= 236) or byte == 238 or byte == 239 then
second = sbyte(input, i + 1); third = sbyte(input, i + 2)
i = i + 3
elseif byte == 240 then
second = sbyte(input, i + 1); third = sbyte(input, i + 2); fourth = sbyte(input, i + 3)
if second ~= nil and second >= 128 and second <= 143 then return false, i end
i = i + 4
elseif byte == 241 or byte == 242 or byte == 243 then
second = sbyte(input, i + 1); third = sbyte(input, i + 2); fourth = sbyte(input, i + 3)
i = i + 4
elseif byte == 244 then
second = sbyte(input, i + 1); third = sbyte(input, i + 2); fourth = sbyte(input, i + 3)
if second ~= nil and second >= 160 and second <= 191 then return false, i end
i = i + 4
else
return false, i
end
if second == nil or second < 128 or second > 191 then return false, i end
if third == nil or third < 128 or third > 191 then return false, i end
if fourth == nil or fourth < 128 or fourth > 191 then return false, i end
end
return true, i
end
local function find_newline(sm)
sm._, sm.end_seq = sm.input:find(".-\r?\n", sm.i)
if sm.end_seq == nil then
sm._, sm.end_seq = sm.input:find(".-$", sm.i)
end
sm.line_number = sm.line_number + 1
sm.i = sm.end_seq + 1
end
local escape_sequences = {
['b'] = '\b',
['t'] = '\t',
['n'] = '\n',
['f'] = '\f',
['r'] = '\r',
['\\'] = '\\',
['"'] = '"',
}
local function handle_backslash_escape(sm)
if sm.multiline_string then
if sm.input:find("^\\[ \t]-\r?\n", sm.i) then
sm._, sm.end_seq = sm.input:find("%S", sm.i + 1)
sm.i = sm.end_seq - 1
return "", false
end
end
sm._, sm.end_seq, sm.match = sm.input:find('^([\\btrfn"])', sm.i + 1)
local escape = escape_sequences[sm.match]
if escape then
sm.i = sm.end_seq
if sm.match == '"' then
return escape, true
else
return escape, false
end
end
sm._, sm.end_seq, sm.match, sm.ext = sm.input:find("^([uU])([0-9a-fA-F]+)", sm.i + 1)
if sm.match then
if (sm.match == "u" and #sm.ext == 4) or
(sm.match == "U" and #sm.ext == 8) then
local codepoint_to_insert = utf8char(tonumber(sm.ext, 16))
if not validate_utf8(codepoint_to_insert) then
_error(sm, "Escaped UTF-8 sequence not valid UTF-8 character: \\" .. sm.match .. sm.ext, "string")
end
sm.i = sm.end_seq
return codepoint_to_insert, false
end
end
return nil
end
local function close_string(sm)
local escape
local reset_quote
local start_field, end_field = sm.i + 1, 0
local second, third = sbyte(sm.input, sm.i + 1), sbyte(sm.input, sm.i + 2)
local quote_count = 0
local output = {}
local found_closing_quote = false
sm.multiline_string = false
if second == chars.DOUBLE_QUOTE and third == chars.DOUBLE_QUOTE then
sm.multiline_string = true
start_field = sm.i + 3
second, third = sbyte(sm.input, sm.i + 3), sbyte(sm.input, sm.i + 4)
if second == chars.LF then
start_field = start_field + 1
elseif second == chars.CR and third == chars.LF then
start_field = start_field + 2
end
sm.i = start_field - 1
end
while found_closing_quote == false and sm.i <= sm.input_length do
sm.i = sm.i + 1
sm.byte = sbyte(sm.input, sm.i)
if sm.byte == chars.BACKSLASH then
output[#output + 1] = sm.input:sub(start_field, sm.i - 1)
escape, reset_quote = handle_backslash_escape(sm)
if reset_quote then quote_count = 0 end
if escape ~= nil then
output[#output + 1] = escape
else
sm._, sm._, sm.match = sm.input:find("^(%S*)", sm.i + 1)
_error(sm, "TOML only allows specific escape sequences. Invalid escape sequence found: \\" .. sm.match, "string")
end
start_field = sm.i + 1
elseif sm.multiline_string then
if sm.byte == chars.DOUBLE_QUOTE then
quote_count = quote_count + 1
if quote_count == 5 then
end_field = sm.i - 3
output[#output + 1] = sm.input:sub(start_field, end_field)
found_closing_quote = true
break
end
else
if quote_count >= 3 then
end_field = sm.i - 4
output[#output + 1] = sm.input:sub(start_field, end_field)
found_closing_quote = true
sm.i = sm.i - 1
break
else
quote_count = 0
end
end
else
if sm.byte == chars.DOUBLE_QUOTE then
end_field = sm.i - 1
output[#output + 1] = sm.input:sub(start_field, end_field)
found_closing_quote = true
break
elseif sm.byte == chars.CR or sm.byte == chars.LF then
_error(sm, "Newlines are not allowed in single quoted basic strings. Use multi-line (triple quoted) strings instead.", "string")
end
end
end
if not found_closing_quote then
if sm.multiline_string then
_error(sm, "Unable to find closing triple-quotes for multi-line string", "string")
else
_error(sm, "Unable to find closing quote for string", "string")
end
end
sm.i = sm.i + 1
sm.value = table.concat(output)
sm.value_type = "string"
end
local function close_literal_string(sm)
sm.byte = 0
local start_field, end_field = sm.i + 1, 0
local second, third = sbyte(sm.input, sm.i + 1), sbyte(sm.input, sm.i + 2)
local quote_count = 0
sm.multiline_string = false
if second == chars.SINGLE_QUOTE and third == chars.SINGLE_QUOTE then
sm.multiline_string = true
start_field = sm.i + 3
second, third = sbyte(sm.input, sm.i + 3), sbyte(sm.input, sm.i + 4)
if second == chars.LF then
start_field = start_field + 1
elseif second == chars.CR and third == chars.LF then
start_field = start_field + 2
end
sm.i = start_field
end
while end_field ~= 0 or sm.i <= sm.input_length do
sm.i = sm.i + 1
sm.byte = sbyte(sm.input, sm.i)
if sm.multiline_string then
if sm.byte == chars.SINGLE_QUOTE then
quote_count = quote_count + 1
if quote_count == 5 then
end_field = sm.i - 3
break
end
else
if quote_count >= 3 then
end_field = sm.i - 4
sm.i = sm.i - 1
break
else
quote_count = 0
end
end
else
if sm.byte == chars.SINGLE_QUOTE then
end_field = sm.i - 1
break
elseif sm.byte == chars.CR or sm.byte == chars.LF then
_error(sm, "Newlines are not allowed in single quoted literal strings. Use multi-line (triple quoted) strings instead.", "string")
end
end
end
if end_field == 0 then
if sm.multiline_string then
_error(sm, "Unable to find closing triple quotes for multi-line literal string", "string")
else
_error(sm, "Unable to find closing quote for literal string", "string")
end
end
sm.i = sm.i + 1
sm.value = sm.input:sub(start_field, end_field)
sm.value_type = "string"
end
local function close_bare_string(sm)
sm._, sm.end_seq, sm.match = sm.input:find("^([a-zA-Z0-9-_]+)", sm.i)
if sm.match then
sm.i = sm.end_seq + 1
sm.multiline_string = false
sm.value = sm.match
sm.value_type = "string"
else
_error(sm, "Bare keys can only contain 'a-zA-Z0-9-_'. Invalid bare key found : " .. sm.input:sub(sm.i, sm.i + 50))
end
end
local function remove_underscores_number(sm, number, anchor)
if number:find("_") then
if number:find("__") then _error(sm, "Numbers cannot have consecutive underscores. Found " .. anchor .. ": " .. number, anchor) end
if number:find("^_") or number:find("_$") then _error(sm, "Underscores are not allowed at beginning or end of a number. Found " .. anchor .. " : " .. number, anchor) end
if number:find("%D_%d") or number:find("%d_%D") then _error(sm, "Underscores must have digits on either side. Found " .. anchor .. " : " .. number, anchor) end
number = number:gsub("_", "")
end
return number
end
local integer_match = {
["b"] = { "^0b([01_]+)$", 2 },
["o"] = { "^0o([0-7_]+)$", 8 },
["x"] = { "^0x([0-9a-fA-F_]+)$", 16 },
}
local function validate_integer(sm, value)
sm._, sm._, sm.match = value:find("^([-+]?[%d_]+)$")
if sm.match then
if sm.match:find("^[-+]?0[%d_]") then _error(sm, "Integers can't start with a leading 0. Found integer: " .. sm.match, "integer") end
sm.match = remove_underscores_number(sm, sm.match, "integer")
sm.value = tonumber(sm.match)
sm.value_type = "integer"
return true
end
if value:find("^0[box]") then
local pattern_bits = integer_match[value:sub(2, 2)]
sm._, sm._, sm.match = value:find(pattern_bits[1])
if sm.match then
sm.match = remove_underscores_number(sm, sm.match, "integer")
sm.value = tonumber(sm.match, pattern_bits[2])
sm.value_type = "integer"
return true
end
end
end
local function validate_float(sm, value)
sm._, sm._, sm.match, sm.ext = value:find("^([-+]?[%d_]+%.[%d_]+)(.*)$")
if sm.match then
if sm.match:find("%._") or sm.match:find("_%.") then _error(sm, "Underscores in floats must have a number on either side. Found float: " .. sm.match .. sm.ext, "float") end
if sm.match:find("^[-+]?0[%d_]") then _error(sm, "Floats can't start with a leading 0. Found float: " .. sm.match .. sm.ext, "float") end
sm.match = remove_underscores_number(sm, sm.match, "float")
if sm.ext ~= "" then
if sm.ext:find("^[eE][-+]?[%d_]+$") then
sm.ext = remove_underscores_number(sm, sm.ext, "float")
sm.value = tonumber(sm.match .. sm.ext)
sm.value_type = "float"
return true
end
else
sm.value = tonumber(sm.match)
sm.value_type = "float"
return true
end
end
sm._, sm._, sm.match = value:find("^([-+]?[%d_]+[eE][-+]?[%d_]+)$")
if sm.match then
if sm.match:find("_[eE]") or sm.match:find("[eE]_") then _error(sm, "Underscores in floats cannot be before or after the e. Found float: " .. sm.match .. sm.ext, "float") end
sm.match = remove_underscores_number(sm, sm.match, "float")
sm.value = tonumber(sm.match)
sm.value_type = "float"
return true
end
end
local max_days_in_month = { 31, 29, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31 }
local function validate_datetime(sm, value)
local hour, min, sec
sm._, sm._, sm.match, hour, min, sec, sm.ext = value:find("^((%d%d):(%d%d):(%d%d))(.*)$")
if sm.match then
if tonumber(hour) > 23 then _error(sm, "Hours must be less than 24. Found hour: " .. hour .. "in: " .. sm.match, "local-time") end
if tonumber(min) > 59 then _error(sm, "Minutes must be less than 60. Found minute: " .. min .. "in: " .. sm.match, "local-time") end
if tonumber(sec) > 60 then _error(sm, "Seconds must be less than 61. Found second: " .. sec .. "in: " .. sm.match, "local-time") end
if sm.ext ~= "" then
if sm.ext:find("^%.%d+$") then
sm.value_type = "time-local"
sm.value = sm.type_conversion[sm.value_type](sm.match .. sm.ext:sub(1, 4))
return true
end
else
sm.value_type = "time-local"
sm.value = sm.type_conversion[sm.value_type](sm.match)
return true
end
end
local year_s, month_s, day_s
local year, month, day
sm._, sm._, sm.match, year_s, month_s, day_s = value:find("^((%d%d%d%d)%-(%d%d)%-(%d%d))$")
if sm.match then
year, month, day = tonumber(year_s), tonumber(month_s), tonumber(day_s)
if month == 0 or month > 12 then _error(sm, "Month must be between 01-12. Found month: " .. month .. "in: " .. sm.match, "local-date") end
if day == 0 or day > max_days_in_month[month] then _error(sm, "Too many days in the month. Found " .. day .. " days in month " .. month .. ", which only has " .. max_days_in_month[month] .. " days in: " .. sm.match, "local-date") end
if month == 2 then
local leap_year = (year % 4 == 0) and not (year % 100 == 0) or (year % 400 == 0)
if leap_year == false then
if day > 28 then _error(sm, "Too many days in month. Found " .. day .. " days in month 02, which only has 28 days if it's not a leap year in: " .. sm.match, "local-date") end
end
end
sm.value_type = "date-local"
sm.value = sm.type_conversion[sm.value_type](sm.match)
local potential_end_seq
sm._, potential_end_seq, sm.match = sm.input:find("^ ([%S]+)", sm.i)
if sm.match and sm.match:find("^%d%d:%d%d:%d%d") then
value = value .. " " .. sm.match
sm.end_seq = potential_end_seq
sm.i = sm.end_seq + 1
else
return true
end
end
sm._, sm._, sm.match, year_s, month_s, day_s, hour, min, sec, sm.ext =
value:find("^((%d%d%d%d)%-(%d%d)%-(%d%d)[Tt ](%d%d):(%d%d):(%d%d))(.*)$")
if sm.match then
if tonumber(hour) > 23 then _error(sm, "Hours must be less than 24. Found hour: " .. hour .. "in: " .. sm.match, "") end
if tonumber(min) > 59 then _error(sm, "Minutes must be less than 60. Found minute: " .. min .. "in: " .. sm.match) end
if tonumber(sec) > 60 then _error(sm, "Seconds must be less than 61. Found second: " .. sec .. "in: " .. sm.match) end
year, month, day = tonumber(year_s), tonumber(month_s), tonumber(day_s)
if month == 0 or month > 12 then _error(sm, "Month must be between 01-12. Found month: " .. month .. "in: " .. sm.match) end
if day == 0 or day > max_days_in_month[month] then _error(sm, "Too many days in the month. Found " .. day .. " days in month " .. month .. ", which only has " .. max_days_in_month[month] .. " days in: " .. sm.match, "local-datetime") end
if month == 2 then
local leap_year = (year % 4 == 0) and not (year % 100 == 0) or (year % 400 == 0)
if leap_year == false then
if day > 28 then _error(sm, "Too many days in month. Found " .. day .. " days in month 02, which only has 28 day if it's not a leap year in: " .. sm.match, "local-datetime") end
end
end
if sm.ext ~= "" then
if sm.ext:find("^%.%d+$") then
sm.value_type = "datetime-local"
sm.value = sm.type_conversion[sm.value_type](sm.match .. sm.ext:sub(1, 4))
return true
elseif sm.ext:find("^%.%d+Z$") then
sm.value_type = "datetime"
sm.value = sm.type_conversion[sm.value_type](sm.match .. sm.ext:sub(1, 4))
return true
elseif sm.ext:find("^%.%d+[+-]%d%d:%d%d$") then
sm._, sm.end_seq, hour, min = sm.ext:find("^%.%d+[+-](%d%d):(%d%d)$")
if tonumber(hour) > 23 then _error(sm, "Hours must be less than 24. Found hour: " .. hour .. "in: " .. sm.match, "offset-date-time") end
if tonumber(min) > 59 then _error(sm, "Minutes must be less than 60. Found minute: " .. min .. "in: " .. sm.match, "offset-date-time") end
sm.value_type = "datetime"
sm.value = sm.type_conversion[sm.value_type](sm.match .. sm.ext:sub(1, 4))
return true
elseif sm.ext:find("^[Zz]$") then
sm.value_type = "datetime"
sm.value = sm.type_conversion[sm.value_type](sm.match .. sm.ext)
return true
elseif sm.ext:find("^[+-]%d%d:%d%d$") then
sm._, sm.end_seq, hour, min = sm.ext:find("^[+-](%d%d):(%d%d)$")
if tonumber(hour) > 23 then _error(sm, "Hours must be less than 24. Found hour: " .. hour .. "in: " .. sm.match, "offset-date-time") end
if tonumber(min) > 59 then _error(sm, "Minutes must be less than 60. Found minute: " .. min .. "in: " .. sm.match, "offset-date-time") end
sm.value_type = "datetime"
sm.value = sm.type_conversion[sm.value_type](sm.match .. sm.ext)
return true
end
else
sm.value_type = "datetime-local"
sm.value = sm.type_conversion[sm.value_type](sm.match)
return true
end
end
end
local validators = {
validate_integer,
validate_float,
validate_datetime,
}
local exact_matches = {
["true"] = { true, "bool" },
["false"] = { false, "bool" },
["+inf"] = { math.huge, "float" },
["inf"] = { math.huge, "float" },
["-inf"] = { -math.huge, "float" },
["+nan"] = { (0 / 0), "float" },
["nan"] = { (0 / 0), "float" },
["-nan"] = { (-(0 / 0)), "float" },
}
local function close_other_value(sm)
local successful_type
sm._, sm.end_seq, sm.match = sm.input:find("^([^ #\r\n,%[{%]}]+)", sm.i)
sm.i = sm.end_seq + 1
if sm.match == nil then
_error(sm, "Can't find value to close")
end
local value = sm.match
local exact_value = exact_matches[value]
if exact_value ~= nil then
sm.value = exact_value[1]
sm.value_type = exact_value[2]
return
end
for _, validator in ipairs(validators) do
successful_type = validator(sm, value)
if successful_type == true then
return
end
end
_error(sm, "Unable to determine type of value for: " .. value)
end
local function create_array(sm)
sm.nested_arrays = sm.nested_arrays + 1
sm.arrays[sm.nested_arrays] = {}
sm.i = sm.i + 1
end
local function add_array_comma(sm)
if sm.value_type == "array" or sm.value_type == "inline-table" then
table.insert(sm.arrays[sm.nested_arrays], sm.value)
else
table.insert(sm.arrays[sm.nested_arrays], sm.assign_value_function(sm.value, sm.value_type))
end
sm.value = nil
sm.i = sm.i + 1
end
local function close_array(sm)
if sm.value ~= nil then
add_array_comma(sm)
else
sm.i = sm.i + 1
end
sm.value = sm.arrays[sm.nested_arrays]
sm.value_type = "array"
sm.nested_arrays = sm.nested_arrays - 1
if sm.nested_arrays == 0 then
return "assign"
else
return "inside_array"
end
end
local function create_table(sm)
sm.tables = {}
sm.byte = sbyte(sm.input, sm.i + 1)
if sm.byte == chars.OPEN_BRACKET then
sm.i = sm.i + 2
sm.table_type = "arrays_of_tables"
else
sm.i = sm.i + 1
sm.table_type = "table"
end
end
local function add_table_dot(sm)
sm.tables[#sm.tables + 1] = sm.value
sm.i = sm.i + 1
end
local function close_table(sm)
sm.byte = sbyte(sm.input, sm.i + 1)
if sm.table_type == "arrays_of_tables" and sm.byte ~= chars.CLOSE_BRACKET then
_error(sm, "Arrays of Tables should be closed with ']]'", "array-of-tables")
end
if sm.byte == chars.CLOSE_BRACKET then
sm.i = sm.i + 2
else
sm.i = sm.i + 1
end
sm.tables[#sm.tables + 1] = sm.value
local out_table = sm.output
local meta_out_table = sm.meta_table
for i = 1, #sm.tables - 1 do
if out_table[sm.tables[i]] == nil then
out_table[sm.tables[i]] = {}
out_table = out_table[sm.tables[i]]
meta_out_table[sm.tables[i]] = { type = "auto-dictionary" }
meta_out_table = meta_out_table[sm.tables[i]]
else
if (meta_out_table[sm.tables[i]]).type == "value" then
_error(sm, "Cannot override value with table definition")
end
local next_table = out_table[sm.tables[i]][#out_table[sm.tables[i]]]
local next_meta_table = meta_out_table[sm.tables[i]][#meta_out_table[sm.tables[i]]]
if next_table == nil then
out_table = out_table[sm.tables[i]]
meta_out_table = meta_out_table[sm.tables[i]]
else
out_table = next_table
meta_out_table = next_meta_table
end
end
end
local final_table = sm.tables[#sm.tables]
if sm.table_type == "table" then
if out_table[final_table] == nil then
out_table[final_table] = {}
meta_out_table[final_table] = { type = "dictionary" }
elseif (meta_out_table[final_table]).type == "value" then
_error(sm, "Cannot override existing value with table")
elseif (meta_out_table[final_table]).type == "dictionary" then
_error(sm, "Cannot override existing table")
elseif (meta_out_table[final_table]).type == "array" then
_error(sm, "Cannot override existing array")
elseif (meta_out_table[final_table]).type == "value-dictionary" then
_error(sm, "Cannot override value with table definition")
end
(meta_out_table[final_table]).type = "dictionary"
sm.current_table = out_table[final_table]
sm.current_meta_table = meta_out_table[final_table]
elseif sm.table_type == "arrays_of_tables" then
if out_table[final_table] == nil then
out_table[final_table] = {}
meta_out_table[final_table] = { type = "array" }
elseif (meta_out_table[final_table]).type == "value" then
_error(sm, "Cannot override existing value with table")
elseif (meta_out_table[final_table]).type == "dictionary" then
_error(sm, "Cannot override existing table")
elseif (meta_out_table[final_table]).type == "auto-dictionary" then
_error(sm, "Cannot override existing table")
elseif (meta_out_table[final_table]).type == "value-dictionary" then
_error(sm, "Cannot override value with table definition")
end
table.insert(out_table[final_table], {})
table.insert(meta_out_table[final_table], { type = "dictionary" })
sm.current_table = out_table[final_table][#out_table[final_table]]
sm.current_meta_table = meta_out_table[final_table][#meta_out_table[final_table]]
end
end
local function assign_key(sm)
if sm.multiline_string == false then
sm.keys[#sm.keys + 1] = sm.value
else
_error(sm, "Keys must be a non multi-line string. Found key: " .. tostring(sm.value), "key")
end
sm.value = nil
sm.value_type = nil
sm.i = sm.i + 1
end
local function assign_value(sm)
local output = {}
if sm.value_type == "array" or sm.value_type == "inline-table" then
output = sm.value
else
output = sm.assign_value_function(sm.value, sm.value_type)
end
local out_table = sm.current_table
local meta_out_table = sm.current_meta_table
for i = 1, #sm.keys - 1 do
if out_table[sm.keys[i]] == nil then
out_table[sm.keys[i]] = {}
meta_out_table[sm.keys[i]] = { type = "value-dictionary" }
elseif (meta_out_table[sm.keys[i]]).type == "value" then
_error(sm, "Cannot key append over an exsiting value")
elseif (meta_out_table[sm.keys[i]]).type == "dictionary" then
_error(sm, "Cannot override existing table")
elseif (meta_out_table[sm.keys[i]]).type == "array" then
_error(sm, "Cannot override existing array")
end
out_table = out_table[sm.keys[i]]
meta_out_table = meta_out_table[sm.keys[i]]
end
local last_table = sm.keys[#sm.keys]
if out_table[last_table] ~= nil then
_error(sm, "Cannot override existing value")
end
out_table[last_table] = output
meta_out_table[last_table] = { type = "value" }
sm.keys = {}
sm.value = nil
sm.byte = sbyte(sm.input, sm.i)
if sm.byte == chars.COMMA then
sm.i = sm.i + 1
end
end
local function error_invalid_state(sm)
local error_message = "Incorrectly formatted TOML. "
local found = sm.input:sub(sm.i, sm.i); if found == "\r" or found == "\n" then found = "newline character" end
if sm.mode == "start_of_line" then error_message = error_message .. "At start of line, could not find a key. Found ="
elseif sm.mode == "inside_table" then error_message = error_message .. "In a table definition, expected a '.' or ']'. Found: " .. found
elseif sm.mode == "inside_key" then error_message = error_message .. "In a key defintion, expected a '.' or '='. Found: " .. found
elseif sm.mode == "value" then error_message = error_message .. "Unspecified value, key was specified, but no value provided."
elseif sm.mode == "inside_array" then error_message = error_message .. "Inside an array, expected a ']', '}' (if inside inline table), ',', newline, or comment. Found: " .. found
elseif sm.mode == "wait_for_newline" then error_message = error_message .. "Just assigned value or created table. Expected newline or comment."
end
_error(sm, error_message)
end
local function create_inline_table(sm)
sm.nested_inline_tables = sm.nested_inline_tables + 1
local backup = {
previous_state = sm.mode,
meta_table = sm.meta_table,
current_table = sm.current_table,
keys = { _unpack(sm.keys) },
}
local new_inline_table = {}
sm.current_table = new_inline_table
sm.inline_table_backup[sm.nested_inline_tables] = backup
sm.current_table = {}
sm.meta_table = {}
sm.keys = {}
sm.i = sm.i + 1
end
local function close_inline_table(sm)
if sm.value ~= nil then
assign_value(sm)
end
sm.i = sm.i + 1
sm.value = sm.current_table
sm.value_type = "inline-table"
local restore = sm.inline_table_backup[sm.nested_inline_tables]
sm.keys = restore.keys
sm.meta_table = restore.meta_table
sm.current_table = restore.current_table
sm.nested_inline_tables = sm.nested_inline_tables - 1
if restore.previous_state == "array" then
return "inside_array"
elseif restore.previous_state == "value" then
return "assign"
else
_error(sm, "close_inline_table should not be called from the previous state: " .. restore.previous_state .. ". Please submit an issue with your TOML file so we can look into the issue!")
end
end
local transitions = {
["start_of_line"] = {
[sbyte("#")] = { find_newline, "start_of_line" },
[sbyte("\r")] = { find_newline, "start_of_line" },
[sbyte("\n")] = { find_newline, "start_of_line" },
[sbyte('"')] = { close_string, "inside_key" },
[sbyte("'")] = { close_literal_string, "inside_key" },
[sbyte("[")] = { create_table, "table" },
[sbyte("=")] = { error_invalid_state, "error" },
[0] = { close_bare_string, "inside_key" },
},
["table"] = {
[sbyte('"')] = { close_string, "inside_table" },
[sbyte("'")] = { close_literal_string, "inside_table" },
[0] = { close_bare_string, "inside_table" },
},
["inside_table"] = {
[sbyte(".")] = { add_table_dot, "table" },
[sbyte("]")] = { close_table, "wait_for_newline" },
[0] = { error_invalid_state, "error" },
},
["key"] = {
[sbyte('"')] = { close_string, "inside_key" },
[sbyte("'")] = { close_literal_string, "inside_key" },
[sbyte("}")] = { close_inline_table, "?" },
[0] = { close_bare_string, "inside_key" },
},
["inside_key"] = {
[sbyte(".")] = { assign_key, "key" },
[sbyte("=")] = { assign_key, "value" },
[0] = { error_invalid_state, "error" },
},
["value"] = {
[sbyte("'")] = { close_literal_string, "assign" },
[sbyte('"')] = { close_string, "assign" },
[sbyte("{")] = { create_inline_table, "key" },
[sbyte("[")] = { create_array, "array" },
[sbyte("\n")] = { error_invalid_state, "error" },
[sbyte("\r")] = { error_invalid_state, "error" },
[0] = { close_other_value, "assign" },
},
["array"] = {
[sbyte("'")] = { close_literal_string, "inside_array" },
[sbyte('"')] = { close_string, "inside_array" },
[sbyte("[")] = { create_array, "array" },
[sbyte("]")] = { close_array, "?" },
[sbyte("#")] = { find_newline, "array" },
[sbyte("\r")] = { find_newline, "array" },
[sbyte("\n")] = { find_newline, "array" },
[sbyte("{")] = { create_inline_table, "key" },
[0] = { close_other_value, "inside_array" },
},
["inside_array"] = {
[sbyte(",")] = { add_array_comma, "array" },
[sbyte("]")] = { close_array, "?" },
[sbyte("}")] = { close_inline_table, "?" },
[sbyte("#")] = { find_newline, "inside_array" },
[sbyte("\r")] = { find_newline, "inside_array" },
[sbyte("\n")] = { find_newline, "inside_array" },
[0] = { error_invalid_state, "error" },
},
["assign"] = {
[sbyte(",")] = { assign_value, "key" },
[sbyte("}")] = { close_inline_table, "?" },
[0] = { assign_value, "wait_for_newline" },
},
["wait_for_newline"] = {
[sbyte("#")] = { find_newline, "start_of_line" },
[sbyte("\r")] = { find_newline, "start_of_line" },
[sbyte("\n")] = { find_newline, "start_of_line" },
[0] = { error_invalid_state, "error" },
},
}
local function generic_assign(value) return value end
local function generic_type_conversion(raw_value) return raw_value end
function tinytoml.parse(filename, options)
local sm = {}
sm.assign_value_function = generic_assign
sm.type_conversion = {
["datetime"] = generic_type_conversion,
["datetime-local"] = generic_type_conversion,
["date-local"] = generic_type_conversion,
["time-local"] = generic_type_conversion,
}
if options then
if options.load_from_string then
sm.input = filename
sm.filename = "string input"
end
if options.assign_value_function then
sm.assign_value_function = options.assign_value_function
else
end
if options.type_conversion then
for key, value in pairs(options.type_conversion) do
sm.type_conversion[(key)] = value
end
end
else
local file = io.open(filename, "r")
sm.input = file:read("*all")
sm.filename = filename
end
sm.i = 1
sm.keys = {}
sm.arrays = {}
sm.output = {}
sm.meta_table = {}
sm.line_number = 1
sm.nested_arrays = 0
sm.inline_table_backup = {}
sm.nested_inline_tables = 0
sm.table_type = "table"
sm.input_length = #sm.input
sm.current_table = sm.output
sm.current_meta_table = sm.meta_table
if sm.input_length == 0 then return {} end
local valid, char = validate_utf8(sm.input, true)
if not valid then
_nsmerror("Invalid UTF-8 character detected in input", sm.input, char, "spec")
end
sm.mode = "start_of_line"
local dynamic_next_mode = "start_of_line"
local transition = nil
sm._, sm.i = sm.input:find("[^ \t]", sm.i)
while sm.i <= sm.input_length do
sm.byte = sbyte(sm.input, sm.i)
transition = transitions[sm.mode][sm.byte]
if transition == nil then
transition = transitions[sm.mode][0]
end
if transition[2] == "?" then
dynamic_next_mode = transition[1](sm)
sm.mode = dynamic_next_mode
else
transition[1](sm)
sm.mode = transition[2]
end
sm._, sm.i = sm.input:find("[^ \t]", sm.i)
if sm.i == nil then
break
end
end
if sm.mode == "assign" then
sm.i = sm.input_length
assign_value(sm)
end
if sm.mode == "inside_array" or sm.mode == "array" then
_error(sm, "Unable to find closing bracket of array", "array")
end
if sm.nested_inline_tables ~= 0 then
_error(sm, "Unable to find closing bracket of inline table", "inline-table")
end
return sm.output
end
return tinytoml