nomsu/parser.lua

257 lines
8.3 KiB
Lua
Raw Normal View History

2018-06-18 15:46:28 -07:00
local lpeg = require('lpeg')
local re = require('re')
lpeg.setmaxstack(10000)
2018-06-24 23:21:07 -07:00
local P, R, S, C, Cmt, Carg
P, R, S, C, Cmt, Carg = lpeg.P, lpeg.R, lpeg.S, lpeg.C, lpeg.Cmt, lpeg.Carg
local match, sub
2018-06-18 15:46:28 -07:00
do
local _obj_0 = string
match, sub = _obj_0.match, _obj_0.sub
2018-06-18 15:46:28 -07:00
end
local insert, remove
do
local _obj_0 = table
insert, remove = _obj_0.insert, _obj_0.remove
end
local files = require('files')
2018-06-18 18:10:59 -07:00
local NomsuCode, LuaCode, Source
do
local _obj_0 = require("code_obj")
NomsuCode, LuaCode, Source = _obj_0.NomsuCode, _obj_0.LuaCode, _obj_0.Source
end
2018-06-18 15:46:28 -07:00
local AST = require("nomsu_tree")
local NOMSU_DEFS
do
local _with_0 = { }
_with_0.nl = P("\r") ^ -1 * P("\n")
_with_0.ws = S(" \t")
_with_0.tonumber = tonumber
_with_0.table = function()
return { }
end
_with_0.unpack = unpack or table.unpack
2018-06-18 15:46:28 -07:00
local string_escapes = {
n = "\n",
t = "\t",
b = "\b",
a = "\a",
v = "\v",
f = "\f",
r = "\r"
}
local digit, hex = R('09'), R('09', 'af', 'AF')
_with_0.escaped_char = (P("\\") * S("xX") * C(hex * hex)) / function(self)
return string.char(tonumber(self, 16))
end
_with_0.escaped_char = _with_0.escaped_char + ((P("\\") * C(digit * (digit ^ -2))) / function(self)
return string.char(tonumber(self))
end)
_with_0.escaped_char = _with_0.escaped_char + ((P("\\") * C(S("ntbavfr"))) / string_escapes)
_with_0.operator_char = S("'`~!@$^&*-+=|<>?/")
_with_0.utf8_char = (R("\194\223") * R("\128\191") + R("\224\239") * R("\128\191") * R("\128\191") + R("\240\244") * R("\128\191") * R("\128\191") * R("\128\191"))
_with_0.ident_char = R("az", "AZ", "09") + P("_") + _with_0.utf8_char
_with_0.userdata = Carg(1)
_with_0.add_comment = function(src, end_pos, start_pos, comment, userdata)
userdata.comments[start_pos] = comment
return true
end
2018-06-18 15:46:28 -07:00
_with_0.error = function(src, end_pos, start_pos, err_msg, userdata)
local seen_errors = userdata.errors
if seen_errors[start_pos] then
return true
end
2018-06-24 23:21:07 -07:00
local num_errors = 0
for _ in pairs(seen_errors) do
num_errors = num_errors + 1
end
if num_errors >= 10 then
2018-06-18 15:46:28 -07:00
seen_errors[start_pos + 1] = colored.bright(colored.yellow(colored.onred("Too many errors, canceling parsing...")))
return #src + 1
end
local err_pos = start_pos
local line_no = files.get_line_number(src, err_pos)
local prev_line = line_no == 1 and nil or files.get_line(src, line_no - 1)
local err_line = files.get_line(src, line_no)
local next_line = files.get_line(src, line_no + 1)
local i = err_pos - files.get_line_starts(src)[line_no]
2018-07-22 13:48:44 -07:00
local j = i + (end_pos - start_pos)
2018-06-18 15:46:28 -07:00
local pointer = ("-"):rep(i) .. "^"
err_msg = colored.bright(colored.yellow(colored.onred((err_msg or "Parse error") .. " at " .. tostring(userdata.source.filename) .. ":" .. tostring(line_no) .. ":")))
if prev_line then
2018-06-18 15:46:28 -07:00
err_msg = err_msg .. ("\n" .. colored.dim(prev_line))
end
if err_line then
err_line = colored.white(err_line:sub(1, i)) .. colored.bright(colored.red(err_line:sub(i + 1, j + 1))) .. colored.dim(err_line:sub(j + 2, -1))
err_msg = err_msg .. "\n" .. tostring(err_line) .. "\n" .. tostring(colored.red(pointer))
end
if next_line then
2018-06-18 15:46:28 -07:00
err_msg = err_msg .. ("\n" .. colored.dim(next_line))
end
seen_errors[start_pos] = err_msg
return true
end
NOMSU_DEFS = _with_0
end
setmetatable(NOMSU_DEFS, {
__index = function(self, key)
local make_node
make_node = function(start, value, stop, userdata)
if userdata.source then
do
local _with_0 = userdata.source
value.source = Source(_with_0.filename, _with_0.start + start - 1, _with_0.start + stop - 1)
end
end
setmetatable(value, AST[key])
if value.__init then
value:__init()
end
return value
end
self[key] = make_node
return make_node
end
})
local Parser = {
version = 2,
patterns = { }
}
2018-06-18 15:46:28 -07:00
do
local peg_tidier = re.compile([[ file <- %nl* {~ (def/comment) (%nl+ (def/comment))* %nl* ~}
2018-06-18 15:46:28 -07:00
def <- anon_def / captured_def
anon_def <- ({ident} (" "*) ":"
{~ ((%nl " "+ def_line?)+) / def_line ~}) -> "%1 <- %2"
2018-06-18 15:46:28 -07:00
captured_def <- ({ident} (" "*) "(" {ident} ")" (" "*) ":"
{~ ((%nl " "+ def_line?)+) / def_line ~}) -> "%1 <- (({} {| %3 |} {} %%userdata) -> %2)"
def_line <- (err / [^%nl])+
err <- ("(!!" { (!("!!)") .)* } "!!)") -> "(({} (%1) %%userdata) => error)"
2018-06-18 15:46:28 -07:00
ident <- [a-zA-Z_][a-zA-Z0-9_]*
comment <- "--" [^%nl]*
]])
for version = 1, Parser.version do
local peg_file = io.open("nomsu." .. tostring(version) .. ".peg")
if not peg_file and package.nomsupath then
for path in package.nomsupath:gmatch("[^;]+") do
peg_file = io.open(path .. "/nomsu." .. tostring(version) .. ".peg")
if peg_file then
break
end
end
end
assert(peg_file, "could not find nomsu .peg file")
local nomsu_peg = peg_tidier:match(peg_file:read('*a'))
peg_file:close()
Parser.patterns[version] = re.compile(nomsu_peg, NOMSU_DEFS)
end
2018-06-18 15:46:28 -07:00
end
Parser.parse = function(nomsu_code, source, version)
2018-06-18 15:46:28 -07:00
if source == nil then
source = nil
end
if version == nil then
version = nil
end
2018-06-27 10:22:58 -07:00
source = source or nomsu_code.source
2018-06-18 15:46:28 -07:00
nomsu_code = tostring(nomsu_code)
2018-07-22 13:48:44 -07:00
source = source or Source("string: " .. nomsu_code, 1, #nomsu_code)
version = version or nomsu_code:match("^#![^\n]*nomsu[ ]+-V[ ]*([0-9.]+)")
local syntax_version = version and tonumber(version:match("^[0-9]+")) or Parser.version
2018-06-18 15:46:28 -07:00
local userdata = {
errors = { },
source = source,
comments = { }
2018-06-18 15:46:28 -07:00
}
local tree = Parser.patterns[syntax_version]:match(nomsu_code, nil, userdata)
if not tree or type(tree) == 'number' then
2018-06-18 15:46:28 -07:00
error("In file " .. tostring(colored.blue(tostring(source or "<unknown>"))) .. " failed to parse:\n" .. tostring(colored.onyellow(colored.black(nomsu_code))))
end
if next(userdata.errors) then
2018-06-24 23:21:07 -07:00
local keys
do
local _accum_0 = { }
local _len_0 = 1
for k, v in pairs(userdata.errors) do
_accum_0[_len_0] = k
_len_0 = _len_0 + 1
end
keys = _accum_0
end
2018-06-18 15:46:28 -07:00
table.sort(keys)
local errors
do
local _accum_0 = { }
local _len_0 = 1
for _index_0 = 1, #keys do
local k = keys[_index_0]
_accum_0[_len_0] = userdata.errors[k]
_len_0 = _len_0 + 1
end
errors = _accum_0
end
error("Errors occurred while parsing (v" .. tostring(syntax_version) .. "):\n\n" .. table.concat(errors, "\n\n"), 0)
2018-06-18 15:46:28 -07:00
end
local comments
do
local _accum_0 = { }
local _len_0 = 1
for p, c in pairs(userdata.comments) do
_accum_0[_len_0] = {
comment = c,
pos = p
}
_len_0 = _len_0 + 1
end
comments = _accum_0
end
table.sort(comments, function(a, b)
return a.pos > b.pos
end)
local comment_i = 1
local walk_tree
walk_tree = function(t)
local comment_buff = { }
while comments[#comments] and comments[#comments].pos <= t.source.start do
table.insert(comment_buff, table.remove(comments))
end
for _index_0 = 1, #t do
local x = t[_index_0]
if AST.is_syntax_tree(x) then
walk_tree(x)
end
end
while comments[#comments] and comments[#comments].pos <= t.source.stop do
table.insert(comment_buff, table.remove(comments))
end
if #comment_buff > 0 then
t.comments = comment_buff
end
end
walk_tree(tree)
2018-06-18 15:46:28 -07:00
return tree
end
2018-07-17 15:00:57 -07:00
Parser.is_operator = function(s)
2018-07-17 23:33:49 -07:00
return not not (NOMSU_DEFS.operator_char ^ 1 * -1):match(s)
end
Parser.is_identifier = function(s)
return not not (NOMSU_DEFS.ident_char ^ 1 * -1):match(s)
2018-07-17 15:00:57 -07:00
end
2018-07-20 20:13:01 -07:00
local inline_escaper = re.compile("{~ (%utf8_char / ('\"' -> '\\\"') / ('\n' -> '\\n') / ('\t' -> '\\t') / ('\b' -> '\\b') / ('\a' -> '\\a') / ('\v' -> '\\v') / ('\f' -> '\\f') / ('\r' -> '\\r') / ('\\' -> '\\\\') / ([^ -~] -> escape) / .)* ~}", {
utf8_char = NOMSU_DEFS.utf8_char,
escape = (function(self)
return ("\\%03d"):format(self:byte())
end)
})
Parser.inline_escape = function(s)
return inline_escaper:match(s)
end
local escaper = re.compile("{~ (%utf8_char / ('\\' -> '\\\\') / [\n\r\t -~] / (. -> escape))* ~}", {
utf8_char = NOMSU_DEFS.utf8_char,
escape = (function(self)
return ("\\%03d"):format(self:byte())
end)
})
Parser.escape = function(s)
return escaper:match(s)
end
2018-06-23 00:57:31 -07:00
return Parser