Got everything mostly working.
This commit is contained in:
parent
21a6314e27
commit
4789892824
@ -31,10 +31,10 @@ compile [go to %label] to code: ".."
|
|||||||
|
|
||||||
rule [tree %tree has function call %call] =:
|
rule [tree %tree has function call %call] =:
|
||||||
lua> ".."
|
lua> ".."
|
||||||
local target = (\(%call)).value;
|
local target = (\(%call)).stub;
|
||||||
for subtree,_ in coroutine.wrap(function() nomsu:walk_tree(\(%tree)); end) do
|
for subtree,_ in coroutine.wrap(function() nomsu:walk_tree(\(%tree)); end) do
|
||||||
if type(subtree) == 'table' and subtree.type == "FunctionCall"
|
if type(subtree) == 'table' and subtree.type == "FunctionCall"
|
||||||
and nomsu.utils.equivalent(subtree.value, target, 2) then
|
and subtree.stub == target then
|
||||||
return true;
|
return true;
|
||||||
end
|
end
|
||||||
end
|
end
|
||||||
|
@ -27,6 +27,11 @@ rule [compile \%macro_def to \%body] =:
|
|||||||
local thunk = nomsu:tree_to_value(body);
|
local thunk = nomsu:tree_to_value(body);
|
||||||
nomsu:defmacro(signature, thunk, ("compile %s\\n..to %s"):format(vars.macro_def.src, body.src));
|
nomsu:defmacro(signature, thunk, ("compile %s\\n..to %s"):format(vars.macro_def.src, body.src));
|
||||||
|
|
||||||
|
compile [fizz %n] to:
|
||||||
|
"print(\(%n as lua))"
|
||||||
|
compile [pumpo] to:
|
||||||
|
"print('pumpo')"
|
||||||
|
|
||||||
rule [compile \%macro_def to code \%body] =:
|
rule [compile \%macro_def to code \%body] =:
|
||||||
lua> ".."
|
lua> ".."
|
||||||
local signature = {};
|
local signature = {};
|
||||||
|
410
nomsu.lua
410
nomsu.lua
@ -11,7 +11,7 @@ local colors = setmetatable({ }, {
|
|||||||
local colored = setmetatable({ }, {
|
local colored = setmetatable({ }, {
|
||||||
__index = function(_, color)
|
__index = function(_, color)
|
||||||
return (function(msg)
|
return (function(msg)
|
||||||
return colors[color] .. msg .. colors.reset
|
return colors[color] .. (msg or '') .. colors.reset
|
||||||
end)
|
end)
|
||||||
end
|
end
|
||||||
})
|
})
|
||||||
@ -45,210 +45,138 @@ local STRING_ESCAPES = {
|
|||||||
f = "\f",
|
f = "\f",
|
||||||
r = "\r"
|
r = "\r"
|
||||||
}
|
}
|
||||||
local indent_stack = {
|
local ESCAPE_CHAR = (P("\\") * S("ntbavfr")) / function(s)
|
||||||
0
|
return STRING_ESCAPES[s:sub(2, 2)]
|
||||||
}
|
end
|
||||||
local indent_patt = P(function(self, start)
|
local OPERATOR_CHAR = S("'~`!@$^&*-+=|<>?/")
|
||||||
local spaces = self:match("[ \t]*", start)
|
local UTF8_CHAR = (R("\194\223") * R("\128\191") + R("\224\239") * R("\128\191") * R("\128\191") + R("\240\244") * R("\128\191") * R("\128\191") * R("\128\191"))
|
||||||
if #spaces > indent_stack[#indent_stack] then
|
local IDENT_CHAR = R("az", "AZ", "09") + P("_") + UTF8_CHAR
|
||||||
insert(indent_stack, #spaces)
|
local parse
|
||||||
return start + #spaces
|
do
|
||||||
end
|
local ctx = { }
|
||||||
end)
|
local indent_patt = P(function(self, start)
|
||||||
local dedent_patt = P(function(self, start)
|
local spaces = self:match("[ \t]*", start)
|
||||||
local spaces = self:match("[ \t]*", start)
|
if #spaces > ctx.indent_stack[#ctx.indent_stack] then
|
||||||
if #spaces < indent_stack[#indent_stack] then
|
insert(ctx.indent_stack, #spaces)
|
||||||
remove(indent_stack)
|
return start + #spaces
|
||||||
return start
|
|
||||||
end
|
|
||||||
end)
|
|
||||||
local nodent_patt = P(function(self, start)
|
|
||||||
local spaces = self:match("[ \t]*", start)
|
|
||||||
if #spaces == indent_stack[#indent_stack] then
|
|
||||||
return start + #spaces
|
|
||||||
end
|
|
||||||
end)
|
|
||||||
local gt_nodent_patt = P(function(self, start)
|
|
||||||
local spaces = self:match("[ \t]*", start)
|
|
||||||
if #spaces >= indent_stack[#indent_stack] + 4 then
|
|
||||||
return start + indent_stack[#indent_stack] + 4
|
|
||||||
end
|
|
||||||
end)
|
|
||||||
local nomsu = [=[ file <- ({{| shebang?
|
|
||||||
(ignored_line %nl)*
|
|
||||||
statements (nodent statements)*
|
|
||||||
(%nl ignored_line)* %nl?
|
|
||||||
(({.+} ("" -> "Parse error")) => error)? |} }) -> File
|
|
||||||
|
|
||||||
shebang <- "#!" [^%nl]* %nl
|
|
||||||
|
|
||||||
inline_statements <- inline_statement (semicolon inline_statement)*
|
|
||||||
noeol_statements <- (inline_statement semicolon)* noeol_statement
|
|
||||||
statements <- (inline_statement semicolon)* statement
|
|
||||||
|
|
||||||
statement <- functioncall / expression
|
|
||||||
noeol_statement <- noeol_functioncall / noeol_expression
|
|
||||||
inline_statement <- inline_functioncall / inline_expression
|
|
||||||
|
|
||||||
inline_thunk <- ({ {| "{" %ws? inline_statements %ws? "}" |} }) -> Thunk
|
|
||||||
eol_thunk <- ({ {| ":" %ws? noeol_statements eol |} }) -> Thunk
|
|
||||||
indented_thunk <- ({ {| (":" / "{..}") indent
|
|
||||||
statements (nodent statements)*
|
|
||||||
(dedent / (({.+} ("" -> "Error while parsing thunk")) => error))
|
|
||||||
|} }) -> Thunk
|
|
||||||
|
|
||||||
inline_nomsu <- ({("\" inline_expression) }) -> Nomsu
|
|
||||||
eol_nomsu <- ({("\" noeol_expression) }) -> Nomsu
|
|
||||||
indented_nomsu <- ({("\" expression) }) -> Nomsu
|
|
||||||
|
|
||||||
inline_expression <- number / variable / inline_string / inline_list / inline_nomsu
|
|
||||||
/ inline_thunk / ("(" %ws? inline_statement %ws? ")")
|
|
||||||
noeol_expression <- indented_string / indented_nomsu / indented_list / indented_thunk
|
|
||||||
/ ("(..)" indent
|
|
||||||
statement
|
|
||||||
(dedent / (({.+} ("" -> "Error while parsing indented expression"))))
|
|
||||||
) / inline_expression
|
|
||||||
expression <- eol_thunk / eol_nomsu / noeol_expression
|
|
||||||
|
|
||||||
-- Function calls need at least one word in them
|
|
||||||
inline_functioncall <- ({(''=>line_no) {|
|
|
||||||
(inline_expression %ws?)* word (%ws? (inline_expression / word))*
|
|
||||||
|} }) -> FunctionCall
|
|
||||||
noeol_functioncall <- ({(''=>line_no) {|
|
|
||||||
(noeol_expression %ws?)* word (%ws? (noeol_expression / word))*
|
|
||||||
|} }) -> FunctionCall
|
|
||||||
functioncall <- ({(''=>line_no) {|
|
|
||||||
(expression (dotdot / %ws?))* word ((dotdot / %ws?) (expression / word))*
|
|
||||||
|} }) -> FunctionCall
|
|
||||||
|
|
||||||
word <- ({ { %operator / (!number %plain_word) } }) -> Word
|
|
||||||
|
|
||||||
inline_string <- ({ '"' {|
|
|
||||||
({~ (("\\" -> "\") / ('\"' -> '"') / ("\n" -> "
|
|
||||||
") / (!string_interpolation [^%nl"]))+ ~}
|
|
||||||
/ string_interpolation)* |} '"' }) -> String
|
|
||||||
|
|
||||||
indented_string <- ({ '".."' %ws? line_comment? %nl %gt_nodented? {|
|
|
||||||
({~ (("\\" -> "\") / (%nl+ {~ %gt_nodented -> "" ~}) / [^%nl\]) ~} / string_interpolation)*
|
|
||||||
|} ((!.) / (&(%nl+ !%gt_nodented)) / (({.+} ("" -> "Error while parsing String")) => error))
|
|
||||||
}) -> String
|
|
||||||
|
|
||||||
string_interpolation <- "\" ((noeol_expression dotdot?) / dotdot)
|
|
||||||
|
|
||||||
number <- ({ (("-"? (([0-9]+ "." [0-9]+) / ("." [0-9]+) / ([0-9]+)))-> tonumber) }) -> Number
|
|
||||||
|
|
||||||
-- Variables can be nameless (i.e. just %) and can't contain operators like apostrophe
|
|
||||||
-- which is a hack to allow %'s to parse as "%" and "' s" separately
|
|
||||||
variable <- ({ ("%" { %plain_word? }) }) -> Var
|
|
||||||
|
|
||||||
inline_list <- ({ {|
|
|
||||||
("[" %ws? ((inline_list_item comma)* inline_list_item comma?)? %ws? "]")
|
|
||||||
|} }) -> List
|
|
||||||
indented_list <- ({ {|
|
|
||||||
("[..]" indent
|
|
||||||
list_line (nodent list_line)*
|
|
||||||
(dedent / (({.+} ("" -> "Error while parsing list")) => error)))
|
|
||||||
|} }) -> List
|
|
||||||
list_line <- (inline_list_item comma)* ((inline_list_item %ws? ",") / (functioncall / expression))
|
|
||||||
inline_list_item <- inline_functioncall / inline_expression
|
|
||||||
|
|
||||||
block_comment <- "#.." [^%nl]* (%nl (%ws? &%nl))* %nl %indented [^%nl]+ (%nl ((%ws? (!. / &%nl)) / (!%dedented [^%nl]+)))*
|
|
||||||
line_comment <- "#" [^%nl]*
|
|
||||||
|
|
||||||
eol <- %ws? line_comment? (!. / &%nl)
|
|
||||||
ignored_line <- (%nodented (block_comment / line_comment)) / (%ws? (!. / &%nl))
|
|
||||||
indent <- eol (%nl ignored_line)* %nl %indented ((block_comment/line_comment) (%nl ignored_line)* nodent)?
|
|
||||||
nodent <- eol (%nl ignored_line)* %nl %nodented
|
|
||||||
dedent <- eol (%nl ignored_line)* (((!.) &%dedented) / (&(%nl %dedented)))
|
|
||||||
comma <- %ws? "," %ws?
|
|
||||||
semicolon <- %ws? ";" %ws?
|
|
||||||
dotdot <- nodent ".." %ws?
|
|
||||||
]=]
|
|
||||||
local CURRENT_FILE = nil
|
|
||||||
local whitespace = S(" \t") ^ 1
|
|
||||||
local operator = S("'~`!@$^&*-+=|<>?/") ^ 1
|
|
||||||
local utf8_continuation = R("\128\191")
|
|
||||||
local utf8_char = (R("\194\223") * utf8_continuation + R("\224\239") * utf8_continuation * utf8_continuation + R("\240\244") * utf8_continuation * utf8_continuation * utf8_continuation)
|
|
||||||
local plain_word = (R('az', 'AZ', '09') + S("_") + utf8_char) ^ 1
|
|
||||||
local defs = {
|
|
||||||
ws = whitespace,
|
|
||||||
nl = P("\n"),
|
|
||||||
tonumber = tonumber,
|
|
||||||
operator = operator,
|
|
||||||
plain_word = plain_word,
|
|
||||||
indented = indent_patt,
|
|
||||||
nodented = nodent_patt,
|
|
||||||
dedented = dedent_patt,
|
|
||||||
gt_nodented = gt_nodent_patt,
|
|
||||||
line_no = function(src, pos)
|
|
||||||
local line_no = 1
|
|
||||||
for _ in src:sub(1, pos):gmatch("\n") do
|
|
||||||
line_no = line_no + 1
|
|
||||||
end
|
end
|
||||||
return pos, tostring(CURRENT_FILE) .. ":" .. tostring(line_no)
|
end)
|
||||||
end,
|
local dedent_patt = P(function(self, start)
|
||||||
FunctionCall = function(src, line_no, value, errors)
|
local spaces = self:match("[ \t]*", start)
|
||||||
local stub = concat((function()
|
if #spaces < ctx.indent_stack[#ctx.indent_stack] then
|
||||||
local _accum_0 = { }
|
remove(ctx.indent_stack)
|
||||||
local _len_0 = 1
|
return start
|
||||||
for _index_0 = 1, #value do
|
end
|
||||||
local t = value[_index_0]
|
end)
|
||||||
_accum_0[_len_0] = (t.type == "Word" and t.value or "%")
|
local nodent_patt = P(function(self, start)
|
||||||
_len_0 = _len_0 + 1
|
local spaces = self:match("[ \t]*", start)
|
||||||
|
if #spaces == ctx.indent_stack[#ctx.indent_stack] then
|
||||||
|
return start + #spaces
|
||||||
|
end
|
||||||
|
end)
|
||||||
|
local gt_nodent_patt = P(function(self, start)
|
||||||
|
local spaces = self:match("[ \t]*", start)
|
||||||
|
if #spaces >= ctx.indent_stack[#ctx.indent_stack] + 4 then
|
||||||
|
return start + ctx.indent_stack[#ctx.indent_stack] + 4
|
||||||
|
end
|
||||||
|
end)
|
||||||
|
local defs = {
|
||||||
|
nl = P("\n"),
|
||||||
|
ws = S(" \t"),
|
||||||
|
tonumber = tonumber,
|
||||||
|
operator = OPERATOR_CHAR,
|
||||||
|
print = function(src, pos, msg)
|
||||||
|
return print(msg, pos, repr(src:sub(math.max(0, pos - 16), math.max(0, pos - 1)) .. "|" .. src:sub(pos, pos + 16))) or true
|
||||||
|
end,
|
||||||
|
utf8_char = (R("\194\223") * R("\128\191") + R("\224\239") * R("\128\191") * R("\128\191") + R("\240\244") * R("\128\191") * R("\128\191") * R("\128\191")),
|
||||||
|
indented = indent_patt,
|
||||||
|
nodented = nodent_patt,
|
||||||
|
dedented = dedent_patt,
|
||||||
|
gt_nodented = gt_nodent_patt,
|
||||||
|
escape_char = ESCAPE_CHAR,
|
||||||
|
error = function(src, pos, err_msg)
|
||||||
|
if ctx.source_code:sub(pos, pos) == "\n" then
|
||||||
|
pos = pos + #ctx.source_code:match("[ \t\n]*", pos)
|
||||||
end
|
end
|
||||||
return _accum_0
|
local line_no = 1
|
||||||
end)(), " ")
|
while (ctx.line_starts[line_no + 1] or math.huge) < pos do
|
||||||
return {
|
line_no = line_no + 1
|
||||||
type = "FunctionCall",
|
end
|
||||||
src = src,
|
local prev_line = line_no > 1 and ctx.source_code:match("[^\n]*", ctx.line_starts[line_no - 1]) or ""
|
||||||
line_no = line_no,
|
local err_line = ctx.source_code:match("[^\n]*", ctx.line_starts[line_no])
|
||||||
value = value,
|
local next_line = line_no < #ctx.line_starts and ctx.source_code:match("[^\n]*", ctx.line_starts[line_no + 1]) or ""
|
||||||
errors = errors,
|
local pointer = ("-"):rep(pos - ctx.line_starts[line_no]) .. "^"
|
||||||
stub = stub
|
err_msg = (err_msg or "Parse error") .. " in " .. tostring(ctx.filename) .. " on line " .. tostring(line_no) .. ":\n"
|
||||||
}
|
err_msg = err_msg .. "\n" .. tostring(prev_line) .. "\n" .. tostring(err_line) .. "\n" .. tostring(pointer) .. "\n" .. tostring(next_line) .. "\n"
|
||||||
end,
|
return error(err_msg)
|
||||||
error = function(src, pos, errors, err_msg)
|
end,
|
||||||
local line_no = 1
|
FunctionCall = function(start, value, stop)
|
||||||
for _ in src:sub(1, -#errors):gmatch("\n") do
|
local stub = concat((function()
|
||||||
line_no = line_no + 1
|
local _accum_0 = { }
|
||||||
|
local _len_0 = 1
|
||||||
|
for _index_0 = 1, #value do
|
||||||
|
local t = value[_index_0]
|
||||||
|
_accum_0[_len_0] = (t.type == "Word" and t.value or "%")
|
||||||
|
_len_0 = _len_0 + 1
|
||||||
|
end
|
||||||
|
return _accum_0
|
||||||
|
end)(), " ")
|
||||||
|
local line_no = 1
|
||||||
|
while (ctx.line_starts[line_no + 1] or math.huge) < start do
|
||||||
|
line_no = line_no + 1
|
||||||
|
end
|
||||||
|
local src = ctx.source_code:sub(start, stop - 1)
|
||||||
|
return {
|
||||||
|
type = "FunctionCall",
|
||||||
|
src = src,
|
||||||
|
line_no = tostring(ctx.filename) .. ":" .. tostring(line_no),
|
||||||
|
value = value,
|
||||||
|
stub = stub
|
||||||
|
}
|
||||||
end
|
end
|
||||||
local err_pos = #src - #errors + 1
|
}
|
||||||
if errors:sub(1, 1) == "\n" then
|
setmetatable(defs, {
|
||||||
err_pos = err_pos + #errors:match("[ \t]*", 2)
|
__index = function(self, key)
|
||||||
end
|
local fn
|
||||||
local start_of_err_line = err_pos
|
fn = function(start, value, stop)
|
||||||
while src:sub(start_of_err_line, start_of_err_line) ~= "\n" and start_of_err_line > 1 do
|
|
||||||
start_of_err_line = start_of_err_line - 1
|
|
||||||
end
|
|
||||||
local start_of_prev_line = start_of_err_line - 1
|
|
||||||
while src:sub(start_of_prev_line, start_of_prev_line) ~= "\n" and start_of_prev_line > 1 do
|
|
||||||
start_of_prev_line = start_of_prev_line - 1
|
|
||||||
end
|
|
||||||
local prev_line, err_line, next_line
|
|
||||||
prev_line, err_line, next_line = src:match("([^\n]*)\n([^\n]*)\n([^\n]*)", start_of_prev_line + 1)
|
|
||||||
local pointer = ("-"):rep(err_pos - start_of_err_line + 0) .. "^"
|
|
||||||
return error("\n" .. tostring(err_msg or "Parse error") .. " in " .. tostring(CURRENT_FILE) .. " on line " .. tostring(line_no) .. ":\n\n" .. tostring(prev_line) .. "\n" .. tostring(err_line) .. "\n" .. tostring(pointer) .. "\n" .. tostring(next_line) .. "\n")
|
|
||||||
end
|
|
||||||
}
|
|
||||||
setmetatable(defs, {
|
|
||||||
__index = function(t, key)
|
|
||||||
do
|
|
||||||
local _with_0
|
|
||||||
_with_0 = function(src, value, errors)
|
|
||||||
return {
|
return {
|
||||||
type = key,
|
start = start,
|
||||||
src = src,
|
stop = stop,
|
||||||
value = value,
|
value = value,
|
||||||
errors = errors
|
src = ctx.source_code:sub(start, stop - 1),
|
||||||
|
type = key
|
||||||
}
|
}
|
||||||
end
|
end
|
||||||
t[key] = _with_0
|
self[key] = fn
|
||||||
local _ = nil
|
return fn
|
||||||
return _with_0
|
|
||||||
end
|
end
|
||||||
|
})
|
||||||
|
local peg_tidier = re.compile([[ file <- {~ %nl* (def/comment) (%nl+ (def/comment))* %nl* ~}
|
||||||
|
def <- anon_def / captured_def
|
||||||
|
anon_def <- ({ident} (" "*) ":"
|
||||||
|
{((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- %2"
|
||||||
|
captured_def <- ({ident} (" "*) "(" {ident} ")" (" "*) ":"
|
||||||
|
{((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- ({} %3 {}) -> %2"
|
||||||
|
ident <- [a-zA-Z_][a-zA-Z0-9_]*
|
||||||
|
comment <- "--" [^%nl]*
|
||||||
|
]])
|
||||||
|
local nomsu = peg_tidier:match(io.open("nomsu.peg"):read("*a"))
|
||||||
|
nomsu = re.compile(nomsu, defs)
|
||||||
|
parse = function(source_code, filename)
|
||||||
|
local old_ctx = ctx
|
||||||
|
ctx = {
|
||||||
|
source_code = source_code,
|
||||||
|
filename = filename,
|
||||||
|
indent_stack = {
|
||||||
|
0
|
||||||
|
}
|
||||||
|
}
|
||||||
|
ctx.line_starts = re.compile("lines <- {| line ('\n' line)* |} line <- {} [^\n]*"):match(source_code)
|
||||||
|
local tree = nomsu:match(source_code)
|
||||||
|
ctx = old_ctx
|
||||||
|
return tree
|
||||||
end
|
end
|
||||||
})
|
end
|
||||||
nomsu = re.compile(nomsu, defs)
|
|
||||||
local NomsuCompiler
|
local NomsuCompiler
|
||||||
do
|
do
|
||||||
local _class_0
|
local _class_0
|
||||||
@ -272,9 +200,6 @@ do
|
|||||||
elseif type(signature) == 'table' and type(signature[1]) == 'string' then
|
elseif type(signature) == 'table' and type(signature[1]) == 'string' then
|
||||||
signature = self:get_stubs(signature)
|
signature = self:get_stubs(signature)
|
||||||
end
|
end
|
||||||
if self.debug then
|
|
||||||
self:write(colored.magenta("Defined rule " .. tostring(repr(signature))))
|
|
||||||
end
|
|
||||||
assert(type(thunk) == 'function', "Bad thunk: " .. tostring(repr(thunk)))
|
assert(type(thunk) == 'function', "Bad thunk: " .. tostring(repr(thunk)))
|
||||||
local canonical_args = nil
|
local canonical_args = nil
|
||||||
local canonical_escaped_args = nil
|
local canonical_escaped_args = nil
|
||||||
@ -562,19 +487,11 @@ do
|
|||||||
end,
|
end,
|
||||||
parse = function(self, str, filename)
|
parse = function(self, str, filename)
|
||||||
if self.debug then
|
if self.debug then
|
||||||
self:writeln(tostring(colored.bright("PARSING:")) .. "\n" .. tostring(str))
|
self:writeln(tostring(colored.bright("PARSING:")) .. "\n" .. tostring(colored.yellow(str)))
|
||||||
end
|
end
|
||||||
str = str:gsub("\r", "")
|
str = str:gsub("\r", "")
|
||||||
local old_file = CURRENT_FILE
|
local tree = parse(str, filename)
|
||||||
local old_indent_stack
|
assert(tree, "In file " .. tostring(colored.blue(filename)) .. " failed to parse:\n" .. tostring(colored.onyellow(colored.black(str))))
|
||||||
old_indent_stack, indent_stack = indent_stack, {
|
|
||||||
0
|
|
||||||
}
|
|
||||||
CURRENT_FILE = filename
|
|
||||||
local tree = nomsu:match(str)
|
|
||||||
indent_stack = old_indent_stack
|
|
||||||
CURRENT_FILE = old_file
|
|
||||||
assert(tree, "Failed to parse: " .. tostring(str))
|
|
||||||
if self.debug then
|
if self.debug then
|
||||||
self:writeln("PARSE TREE:")
|
self:writeln("PARSE TREE:")
|
||||||
self:print_tree(tree, " ")
|
self:print_tree(tree, " ")
|
||||||
@ -744,8 +661,7 @@ end);]]):format(concat(buffer, "\n"))
|
|||||||
local _list_0 = tree.value
|
local _list_0 = tree.value
|
||||||
for _index_0 = 1, #_list_0 do
|
for _index_0 = 1, #_list_0 do
|
||||||
local arg = _list_0[_index_0]
|
local arg = _list_0[_index_0]
|
||||||
local arg_inline
|
local nomsu, arg_inline = self:tree_to_nomsu(arg, force_inline)
|
||||||
nomsu, arg_inline = self:tree_to_nomsu(arg, force_inline)
|
|
||||||
if sep == " " and line_len + #nomsu > 80 then
|
if sep == " " and line_len + #nomsu > 80 then
|
||||||
sep = "\n.."
|
sep = "\n.."
|
||||||
end
|
end
|
||||||
@ -802,8 +718,7 @@ end);]]):format(concat(buffer, "\n"))
|
|||||||
local longline = 0
|
local longline = 0
|
||||||
local inline = true
|
local inline = true
|
||||||
for i, bit in ipairs(tree.value) do
|
for i, bit in ipairs(tree.value) do
|
||||||
local bit_inline
|
local nomsu, bit_inline = self:tree_to_nomsu(bit, force_inline)
|
||||||
nomsu, bit_inline = self:tree_to_nomsu(bit, force_inline)
|
|
||||||
inline = inline and bit_inline
|
inline = inline and bit_inline
|
||||||
if inline then
|
if inline then
|
||||||
if i > 1 then
|
if i > 1 then
|
||||||
@ -968,17 +883,14 @@ end)]]):format(concat(lua_bits, "\n"))
|
|||||||
break
|
break
|
||||||
end
|
end
|
||||||
if escaped_args[arg_names[arg_num]] then
|
if escaped_args[arg_names[arg_num]] then
|
||||||
arg = {
|
insert(args, "nomsu:parse(" .. tostring(repr(arg.src)) .. ", " .. tostring(repr(tree.line_no)) .. ").value[1]")
|
||||||
type = "Nomsu",
|
else
|
||||||
value = arg,
|
local expr, statement = self:tree_to_lua(arg, filename)
|
||||||
line_no = tree.line_no
|
if statement then
|
||||||
}
|
self:error("Cannot use [[" .. tostring(arg.src) .. "]] as a function argument, since it's not an expression.")
|
||||||
|
end
|
||||||
|
insert(args, expr)
|
||||||
end
|
end
|
||||||
local expr, statement = self:tree_to_lua(arg, filename)
|
|
||||||
if statement then
|
|
||||||
self:error("Cannot use [[" .. tostring(arg.src) .. "]] as a function argument, since it's not an expression.")
|
|
||||||
end
|
|
||||||
insert(args, expr)
|
|
||||||
arg_num = arg_num + 1
|
arg_num = arg_num + 1
|
||||||
_continue_0 = true
|
_continue_0 = true
|
||||||
until true
|
until true
|
||||||
@ -989,10 +901,6 @@ end)]]):format(concat(lua_bits, "\n"))
|
|||||||
remove(self.compilestack)
|
remove(self.compilestack)
|
||||||
return self.__class:comma_separated_items("nomsu:call(", args, ")"), nil
|
return self.__class:comma_separated_items("nomsu:call(", args, ")"), nil
|
||||||
elseif "String" == _exp_0 then
|
elseif "String" == _exp_0 then
|
||||||
if self.debug then
|
|
||||||
self:writeln((colored.bright("STRING:")))
|
|
||||||
self:print_tree(tree)
|
|
||||||
end
|
|
||||||
local concat_parts = { }
|
local concat_parts = { }
|
||||||
local string_buffer = ""
|
local string_buffer = ""
|
||||||
local _list_0 = tree.value
|
local _list_0 = tree.value
|
||||||
@ -1144,17 +1052,17 @@ end)]]):format(concat(lua_bits, "\n"))
|
|||||||
self:error("Nothing to get stub from")
|
self:error("Nothing to get stub from")
|
||||||
end
|
end
|
||||||
if type(x) == 'string' then
|
if type(x) == 'string' then
|
||||||
x = x:gsub("\n%s*%.%.", " ")
|
local patt = re.compile("{|(' '+ / '\n..' / {'\\'? '%' %id*} / {%id+} / {%op+})*|}", {
|
||||||
x = lpeg.Cs((operator / (function(op)
|
id = IDENT_CHAR,
|
||||||
return " " .. tostring(op) .. " "
|
op = OPERATOR_CHAR
|
||||||
end) + 1) ^ 0):match(x)
|
})
|
||||||
x = x:gsub("%s+", " "):gsub("^%s*", ""):gsub("%s*$", "")
|
local spec = concat(patt:match(x), " ")
|
||||||
local stub = x:gsub("%%%S+", "%%"):gsub("\\", "")
|
local stub = spec:gsub("%%%S+", "%%"):gsub("\\", "")
|
||||||
local arg_names
|
local arg_names
|
||||||
do
|
do
|
||||||
local _accum_0 = { }
|
local _accum_0 = { }
|
||||||
local _len_0 = 1
|
local _len_0 = 1
|
||||||
for arg in x:gmatch("%%([^%s]*)") do
|
for arg in spec:gmatch("%%([^%s]*)") do
|
||||||
_accum_0[_len_0] = arg
|
_accum_0[_len_0] = arg
|
||||||
_len_0 = _len_0 + 1
|
_len_0 = _len_0 + 1
|
||||||
end
|
end
|
||||||
@ -1163,7 +1071,7 @@ end)]]):format(concat(lua_bits, "\n"))
|
|||||||
local escaped_args = set((function()
|
local escaped_args = set((function()
|
||||||
local _accum_0 = { }
|
local _accum_0 = { }
|
||||||
local _len_0 = 1
|
local _len_0 = 1
|
||||||
for arg in x:gmatch("\\%%([^%s]*)") do
|
for arg in spec:gmatch("\\%%(%S*)") do
|
||||||
_accum_0[_len_0] = arg
|
_accum_0[_len_0] = arg
|
||||||
_len_0 = _len_0 + 1
|
_len_0 = _len_0 + 1
|
||||||
end
|
end
|
||||||
@ -1278,13 +1186,17 @@ end)]]):format(concat(lua_bits, "\n"))
|
|||||||
end,
|
end,
|
||||||
typecheck = function(self, vars, varname, desired_type)
|
typecheck = function(self, vars, varname, desired_type)
|
||||||
local x = vars[varname]
|
local x = vars[varname]
|
||||||
if type(x) == desired_type then
|
local x_type = type(x)
|
||||||
|
if x_type == desired_type then
|
||||||
return x
|
return x
|
||||||
end
|
end
|
||||||
if type(x) == 'table' and x.type == desired_type then
|
if x_type == 'table' then
|
||||||
return x
|
x_type = x.type or x_type
|
||||||
|
if x_type == desired_type then
|
||||||
|
return x
|
||||||
|
end
|
||||||
end
|
end
|
||||||
return self:error("Invalid type for %" .. tostring(varname) .. ". Expected " .. tostring(desired_type) .. ", but got " .. tostring(repr(x)) .. ".")
|
return self:error("Invalid type for %" .. tostring(varname) .. ". Expected " .. tostring(desired_type) .. ", but got " .. tostring(x_type) .. ":\n" .. tostring(repr(x)))
|
||||||
end,
|
end,
|
||||||
source_code = function(self, level)
|
source_code = function(self, level)
|
||||||
if level == nil then
|
if level == nil then
|
||||||
@ -1326,6 +1238,20 @@ end)]]):format(concat(lua_bits, "\n"))
|
|||||||
self:defmacro("__src__ %level", function(self, vars)
|
self:defmacro("__src__ %level", function(self, vars)
|
||||||
return self:repr(self:source_code(self:tree_to_value(vars.level)))
|
return self:repr(self:source_code(self:tree_to_value(vars.level)))
|
||||||
end)
|
end)
|
||||||
|
self:def("derp \\%foo derp \\%bar", function(self, vars)
|
||||||
|
local lua = "local x = " .. repr((function()
|
||||||
|
local _accum_0 = { }
|
||||||
|
local _len_0 = 1
|
||||||
|
local _list_0 = vars.foo.value
|
||||||
|
for _index_0 = 1, #_list_0 do
|
||||||
|
local t = _list_0[_index_0]
|
||||||
|
_accum_0[_len_0] = t.stub
|
||||||
|
_len_0 = _len_0 + 1
|
||||||
|
end
|
||||||
|
return _accum_0
|
||||||
|
end)()) .. ";\nlocal y = " .. self:tree_to_lua(vars.bar)
|
||||||
|
return print(colored.green(lua))
|
||||||
|
end)
|
||||||
local run_file
|
local run_file
|
||||||
run_file = function(self, vars)
|
run_file = function(self, vars)
|
||||||
if vars.filename:match(".*%.lua") then
|
if vars.filename:match(".*%.lua") then
|
||||||
@ -1333,7 +1259,7 @@ end)]]):format(concat(lua_bits, "\n"))
|
|||||||
end
|
end
|
||||||
if vars.filename:match(".*%.nom") then
|
if vars.filename:match(".*%.nom") then
|
||||||
if not self.skip_precompiled then
|
if not self.skip_precompiled then
|
||||||
local file = io.open(vars.filename:gsub("%.nom", ".compiled.nom"), "r")
|
local file = io.open(vars.filename:gsub("%.nom", ".nomc"), "r")
|
||||||
end
|
end
|
||||||
local file = file or io.open(vars.filename)
|
local file = file or io.open(vars.filename)
|
||||||
if not file then
|
if not file then
|
||||||
@ -1457,7 +1383,7 @@ if arg then
|
|||||||
c.skip_precompiled = not args.flags["-O"]
|
c.skip_precompiled = not args.flags["-O"]
|
||||||
if args.input then
|
if args.input then
|
||||||
if args.flags["-c"] and not args.output then
|
if args.flags["-c"] and not args.output then
|
||||||
args.output = args.input:gsub("%.nom", ".compiled.nom")
|
args.output = args.input:gsub("%.nom", ".nomc")
|
||||||
end
|
end
|
||||||
local compiled_output = nil
|
local compiled_output = nil
|
||||||
if args.flags["-p"] then
|
if args.flags["-p"] then
|
||||||
|
303
nomsu.moon
303
nomsu.moon
@ -10,13 +10,12 @@
|
|||||||
-- nomsu:run(your_nomsu_code)
|
-- nomsu:run(your_nomsu_code)
|
||||||
-- Or from the command line:
|
-- Or from the command line:
|
||||||
-- lua nomsu.lua [input_file [output_file or -]]
|
-- lua nomsu.lua [input_file [output_file or -]]
|
||||||
|
|
||||||
re = require 're'
|
re = require 're'
|
||||||
lpeg = require 'lpeg'
|
lpeg = require 'lpeg'
|
||||||
utils = require 'utils'
|
utils = require 'utils'
|
||||||
{:repr, :stringify, :min, :max, :equivalent, :set, :is_list, :sum} = utils
|
{:repr, :stringify, :min, :max, :equivalent, :set, :is_list, :sum} = utils
|
||||||
colors = setmetatable({}, {__index:->""})
|
colors = setmetatable({}, {__index:->""})
|
||||||
colored = setmetatable({}, {__index:(_,color)-> ((msg)-> colors[color]..msg..colors.reset)})
|
colored = setmetatable({}, {__index:(_,color)-> ((msg)-> colors[color]..(msg or '')..colors.reset)})
|
||||||
{:insert, :remove, :concat} = table
|
{:insert, :remove, :concat} = table
|
||||||
--pcall = (fn,...)-> true, fn(...)
|
--pcall = (fn,...)-> true, fn(...)
|
||||||
if _VERSION == "Lua 5.1"
|
if _VERSION == "Lua 5.1"
|
||||||
@ -40,169 +39,99 @@ if _VERSION == "Lua 5.1"
|
|||||||
|
|
||||||
lpeg.setmaxstack 10000 -- whoa
|
lpeg.setmaxstack 10000 -- whoa
|
||||||
{:P,:R,:V,:S,:Cg,:C,:Cp,:B,:Cmt} = lpeg
|
{:P,:R,:V,:S,:Cg,:C,:Cp,:B,:Cmt} = lpeg
|
||||||
|
|
||||||
STRING_ESCAPES = n:"\n", t:"\t", b:"\b", a:"\a", v:"\v", f:"\f", r:"\r"
|
STRING_ESCAPES = n:"\n", t:"\t", b:"\b", a:"\a", v:"\v", f:"\f", r:"\r"
|
||||||
|
ESCAPE_CHAR = (P("\\")*S("ntbavfr")) / (s)->STRING_ESCAPES[s\sub(2,2)]
|
||||||
|
OPERATOR_CHAR = S("'~`!@$^&*-+=|<>?/")
|
||||||
|
UTF8_CHAR = (
|
||||||
|
R("\194\223")*R("\128\191") +
|
||||||
|
R("\224\239")*R("\128\191")*R("\128\191") +
|
||||||
|
R("\240\244")*R("\128\191")*R("\128\191")*R("\128\191"))
|
||||||
|
IDENT_CHAR = R("az","AZ","09") + P("_") + UTF8_CHAR
|
||||||
|
|
||||||
-- NOTE: this treats tabs as equivalent to 1 space
|
local parse
|
||||||
indent_stack = {0}
|
do
|
||||||
indent_patt = P (start)=>
|
export parse
|
||||||
spaces = @match("[ \t]*", start)
|
ctx = {}
|
||||||
if #spaces > indent_stack[#indent_stack]
|
indent_patt = P (start)=>
|
||||||
insert(indent_stack, #spaces)
|
spaces = @match("[ \t]*", start)
|
||||||
return start + #spaces
|
if #spaces > ctx.indent_stack[#ctx.indent_stack]
|
||||||
dedent_patt = P (start)=>
|
insert(ctx.indent_stack, #spaces)
|
||||||
spaces = @match("[ \t]*", start)
|
return start + #spaces
|
||||||
if #spaces < indent_stack[#indent_stack]
|
dedent_patt = P (start)=>
|
||||||
remove(indent_stack)
|
spaces = @match("[ \t]*", start)
|
||||||
return start
|
if #spaces < ctx.indent_stack[#ctx.indent_stack]
|
||||||
nodent_patt = P (start)=>
|
remove(ctx.indent_stack)
|
||||||
spaces = @match("[ \t]*", start)
|
return start
|
||||||
if #spaces == indent_stack[#indent_stack]
|
nodent_patt = P (start)=>
|
||||||
return start + #spaces
|
spaces = @match("[ \t]*", start)
|
||||||
gt_nodent_patt = P (start)=>
|
if #spaces == ctx.indent_stack[#ctx.indent_stack]
|
||||||
-- Note! This assumes indent is 4 spaces!!!
|
return start + #spaces
|
||||||
spaces = @match("[ \t]*", start)
|
gt_nodent_patt = P (start)=>
|
||||||
if #spaces >= indent_stack[#indent_stack] + 4
|
-- Note! This assumes indent is 4 spaces!!!
|
||||||
return start + indent_stack[#indent_stack] + 4
|
spaces = @match("[ \t]*", start)
|
||||||
|
if #spaces >= ctx.indent_stack[#ctx.indent_stack] + 4
|
||||||
|
return start + ctx.indent_stack[#ctx.indent_stack] + 4
|
||||||
|
|
||||||
-- TYPES:
|
defs =
|
||||||
-- Number 1, "String", %Var, [List], (expression), {Thunk}, \Nomsu, FunctionCall, File
|
nl: P("\n"), ws: S(" \t"), :tonumber, operator: OPERATOR_CHAR
|
||||||
|
print: (src,pos,msg)-> print(msg, pos, repr(src\sub(math.max(0,pos-16),math.max(0,pos-1)).."|"..src\sub(pos,pos+16))) or true
|
||||||
|
utf8_char: (
|
||||||
|
R("\194\223")*R("\128\191") +
|
||||||
|
R("\224\239")*R("\128\191")*R("\128\191") +
|
||||||
|
R("\240\244")*R("\128\191")*R("\128\191")*R("\128\191"))
|
||||||
|
indented: indent_patt, nodented: nodent_patt, dedented: dedent_patt
|
||||||
|
gt_nodented: gt_nodent_patt, escape_char:ESCAPE_CHAR
|
||||||
|
error: (src,pos,err_msg)->
|
||||||
|
if ctx.source_code\sub(pos,pos) == "\n"
|
||||||
|
pos += #ctx.source_code\match("[ \t\n]*", pos)
|
||||||
|
line_no = 1
|
||||||
|
while (ctx.line_starts[line_no+1] or math.huge) < pos do line_no += 1
|
||||||
|
prev_line = line_no > 1 and ctx.source_code\match("[^\n]*", ctx.line_starts[line_no-1]) or ""
|
||||||
|
err_line = ctx.source_code\match("[^\n]*", ctx.line_starts[line_no])
|
||||||
|
next_line = line_no < #ctx.line_starts and ctx.source_code\match("[^\n]*", ctx.line_starts[line_no+1]) or ""
|
||||||
|
pointer = ("-")\rep(pos-ctx.line_starts[line_no]) .. "^"
|
||||||
|
err_msg = (err_msg or "Parse error").." in #{ctx.filename} on line #{line_no}:\n"
|
||||||
|
err_msg ..="\n#{prev_line}\n#{err_line}\n#{pointer}\n#{next_line}\n"
|
||||||
|
error(err_msg)
|
||||||
|
FunctionCall: (start, value, stop)->
|
||||||
|
stub = concat([(t.type == "Word" and t.value or "%") for t in *value], " ")
|
||||||
|
line_no = 1
|
||||||
|
while (ctx.line_starts[line_no+1] or math.huge) < start do line_no += 1
|
||||||
|
src = ctx.source_code\sub(start,stop-1)
|
||||||
|
return {type: "FunctionCall", :src, line_no: "#{ctx.filename}:#{line_no}", :value, :stub}
|
||||||
|
|
||||||
nomsu = [=[
|
setmetatable(defs, {__index:(key)=>
|
||||||
file <- ({{| shebang?
|
fn = (start, value, stop)->
|
||||||
(ignored_line %nl)*
|
{:start, :stop, :value, src:ctx.source_code\sub(start,stop-1), type: key}
|
||||||
statements (nodent statements)*
|
self[key] = fn
|
||||||
(%nl ignored_line)* %nl?
|
return fn
|
||||||
(({.+} ("" -> "Parse error")) => error)? |} }) -> File
|
})
|
||||||
|
|
||||||
shebang <- "#!" [^%nl]* %nl
|
-- Just for cleanliness, I put the language spec in its own file using a slightly modified
|
||||||
|
-- version of the lpeg.re syntax.
|
||||||
|
peg_tidier = re.compile [[
|
||||||
|
file <- {~ %nl* (def/comment) (%nl+ (def/comment))* %nl* ~}
|
||||||
|
def <- anon_def / captured_def
|
||||||
|
anon_def <- ({ident} (" "*) ":"
|
||||||
|
{((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- %2"
|
||||||
|
captured_def <- ({ident} (" "*) "(" {ident} ")" (" "*) ":"
|
||||||
|
{((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- ({} %3 {}) -> %2"
|
||||||
|
ident <- [a-zA-Z_][a-zA-Z0-9_]*
|
||||||
|
comment <- "--" [^%nl]*
|
||||||
|
]]
|
||||||
|
|
||||||
inline_statements <- inline_statement (semicolon inline_statement)*
|
nomsu = peg_tidier\match(io.open("nomsu.peg")\read("*a"))
|
||||||
noeol_statements <- (inline_statement semicolon)* noeol_statement
|
nomsu = re.compile(nomsu, defs)
|
||||||
statements <- (inline_statement semicolon)* statement
|
|
||||||
|
|
||||||
statement <- functioncall / expression
|
parse = (source_code, filename)->
|
||||||
noeol_statement <- noeol_functioncall / noeol_expression
|
old_ctx = ctx
|
||||||
inline_statement <- inline_functioncall / inline_expression
|
export ctx
|
||||||
|
ctx = {:source_code, :filename, indent_stack: {0}}
|
||||||
inline_thunk <- ({ {| "{" %ws? inline_statements %ws? "}" |} }) -> Thunk
|
ctx.line_starts = re.compile("lines <- {| line ('\n' line)* |} line <- {} [^\n]*")\match(source_code)
|
||||||
eol_thunk <- ({ {| ":" %ws? noeol_statements eol |} }) -> Thunk
|
tree = nomsu\match(source_code)
|
||||||
indented_thunk <- ({ {| (":" / "{..}") indent
|
ctx = old_ctx
|
||||||
statements (nodent statements)*
|
return tree
|
||||||
(dedent / (({.+} ("" -> "Error while parsing thunk")) => error))
|
|
||||||
|} }) -> Thunk
|
|
||||||
|
|
||||||
inline_nomsu <- ({("\" inline_expression) }) -> Nomsu
|
|
||||||
eol_nomsu <- ({("\" noeol_expression) }) -> Nomsu
|
|
||||||
indented_nomsu <- ({("\" expression) }) -> Nomsu
|
|
||||||
|
|
||||||
inline_expression <- number / variable / inline_string / inline_list / inline_nomsu
|
|
||||||
/ inline_thunk / ("(" %ws? inline_statement %ws? ")")
|
|
||||||
noeol_expression <- indented_string / indented_nomsu / indented_list / indented_thunk
|
|
||||||
/ ("(..)" indent
|
|
||||||
statement
|
|
||||||
(dedent / (({.+} ("" -> "Error while parsing indented expression"))))
|
|
||||||
) / inline_expression
|
|
||||||
expression <- eol_thunk / eol_nomsu / noeol_expression
|
|
||||||
|
|
||||||
-- Function calls need at least one word in them
|
|
||||||
inline_functioncall <- ({(''=>line_no) {|
|
|
||||||
(inline_expression %ws?)* word (%ws? (inline_expression / word))*
|
|
||||||
|} }) -> FunctionCall
|
|
||||||
noeol_functioncall <- ({(''=>line_no) {|
|
|
||||||
(noeol_expression %ws?)* word (%ws? (noeol_expression / word))*
|
|
||||||
|} }) -> FunctionCall
|
|
||||||
functioncall <- ({(''=>line_no) {|
|
|
||||||
(expression (dotdot / %ws?))* word ((dotdot / %ws?) (expression / word))*
|
|
||||||
|} }) -> FunctionCall
|
|
||||||
|
|
||||||
word <- ({ { %operator / (!number %plain_word) } }) -> Word
|
|
||||||
|
|
||||||
inline_string <- ({ '"' {|
|
|
||||||
({~ (("\\" -> "\") / ('\"' -> '"') / ("\n" -> "
|
|
||||||
") / (!string_interpolation [^%nl"]))+ ~}
|
|
||||||
/ string_interpolation)* |} '"' }) -> String
|
|
||||||
|
|
||||||
indented_string <- ({ '".."' %ws? line_comment? %nl %gt_nodented? {|
|
|
||||||
({~ (("\\" -> "\") / (%nl+ {~ %gt_nodented -> "" ~}) / [^%nl\]) ~} / string_interpolation)*
|
|
||||||
|} ((!.) / (&(%nl+ !%gt_nodented)) / (({.+} ("" -> "Error while parsing String")) => error))
|
|
||||||
}) -> String
|
|
||||||
|
|
||||||
string_interpolation <- "\" ((noeol_expression dotdot?) / dotdot)
|
|
||||||
|
|
||||||
number <- ({ (("-"? (([0-9]+ "." [0-9]+) / ("." [0-9]+) / ([0-9]+)))-> tonumber) }) -> Number
|
|
||||||
|
|
||||||
-- Variables can be nameless (i.e. just %) and can't contain operators like apostrophe
|
|
||||||
-- which is a hack to allow %'s to parse as "%" and "' s" separately
|
|
||||||
variable <- ({ ("%" { %plain_word? }) }) -> Var
|
|
||||||
|
|
||||||
inline_list <- ({ {|
|
|
||||||
("[" %ws? ((inline_list_item comma)* inline_list_item comma?)? %ws? "]")
|
|
||||||
|} }) -> List
|
|
||||||
indented_list <- ({ {|
|
|
||||||
("[..]" indent
|
|
||||||
list_line (nodent list_line)*
|
|
||||||
(dedent / (({.+} ("" -> "Error while parsing list")) => error)))
|
|
||||||
|} }) -> List
|
|
||||||
list_line <- (inline_list_item comma)* ((inline_list_item %ws? ",") / (functioncall / expression))
|
|
||||||
inline_list_item <- inline_functioncall / inline_expression
|
|
||||||
|
|
||||||
block_comment <- "#.." [^%nl]* (%nl (%ws? &%nl))* %nl %indented [^%nl]+ (%nl ((%ws? (!. / &%nl)) / (!%dedented [^%nl]+)))*
|
|
||||||
line_comment <- "#" [^%nl]*
|
|
||||||
|
|
||||||
eol <- %ws? line_comment? (!. / &%nl)
|
|
||||||
ignored_line <- (%nodented (block_comment / line_comment)) / (%ws? (!. / &%nl))
|
|
||||||
indent <- eol (%nl ignored_line)* %nl %indented ((block_comment/line_comment) (%nl ignored_line)* nodent)?
|
|
||||||
nodent <- eol (%nl ignored_line)* %nl %nodented
|
|
||||||
dedent <- eol (%nl ignored_line)* (((!.) &%dedented) / (&(%nl %dedented)))
|
|
||||||
comma <- %ws? "," %ws?
|
|
||||||
semicolon <- %ws? ";" %ws?
|
|
||||||
dotdot <- nodent ".." %ws?
|
|
||||||
]=]
|
|
||||||
|
|
||||||
CURRENT_FILE = nil
|
|
||||||
whitespace = S(" \t")^1
|
|
||||||
operator = S("'~`!@$^&*-+=|<>?/")^1
|
|
||||||
utf8_continuation = R("\128\191")
|
|
||||||
utf8_char = (
|
|
||||||
R("\194\223")*utf8_continuation +
|
|
||||||
R("\224\239")*utf8_continuation*utf8_continuation +
|
|
||||||
R("\240\244")*utf8_continuation*utf8_continuation*utf8_continuation)
|
|
||||||
plain_word = (R('az','AZ','09') + S("_") + utf8_char)^1
|
|
||||||
defs =
|
|
||||||
ws:whitespace, nl: P("\n"), :tonumber, :operator, :plain_word
|
|
||||||
indented: indent_patt, nodented: nodent_patt, dedented: dedent_patt, gt_nodented: gt_nodent_patt
|
|
||||||
line_no: (src, pos)->
|
|
||||||
line_no = 1
|
|
||||||
for _ in src\sub(1,pos)\gmatch("\n") do line_no += 1
|
|
||||||
return pos, "#{CURRENT_FILE}:#{line_no}"
|
|
||||||
FunctionCall: (src, line_no, value, errors)->
|
|
||||||
stub = concat([(t.type == "Word" and t.value or "%") for t in *value], " ")
|
|
||||||
{type: "FunctionCall", :src, :line_no, :value, :errors, :stub}
|
|
||||||
error: (src,pos,errors,err_msg)->
|
|
||||||
line_no = 1
|
|
||||||
for _ in src\sub(1,-#errors)\gmatch("\n") do line_no += 1
|
|
||||||
err_pos = #src - #errors + 1
|
|
||||||
if errors\sub(1,1) == "\n"
|
|
||||||
-- Indentation error
|
|
||||||
err_pos += #errors\match("[ \t]*", 2)
|
|
||||||
start_of_err_line = err_pos
|
|
||||||
while src\sub(start_of_err_line, start_of_err_line) != "\n" and start_of_err_line > 1
|
|
||||||
start_of_err_line -= 1
|
|
||||||
start_of_prev_line = start_of_err_line - 1
|
|
||||||
while src\sub(start_of_prev_line, start_of_prev_line) != "\n" and start_of_prev_line > 1
|
|
||||||
start_of_prev_line -= 1
|
|
||||||
|
|
||||||
local prev_line,err_line,next_line
|
|
||||||
prev_line,err_line,next_line = src\match("([^\n]*)\n([^\n]*)\n([^\n]*)", start_of_prev_line+1)
|
|
||||||
|
|
||||||
pointer = ("-")\rep(err_pos - start_of_err_line + 0) .. "^"
|
|
||||||
error("\n#{err_msg or "Parse error"} in #{CURRENT_FILE} on line #{line_no}:\n\n#{prev_line}\n#{err_line}\n#{pointer}\n#{next_line}\n")
|
|
||||||
|
|
||||||
setmetatable(defs, {
|
|
||||||
__index: (t,key)->
|
|
||||||
with t[key] = (src, value, errors)-> {type: key, :src, :value, :errors} do nil
|
|
||||||
})
|
|
||||||
nomsu = re.compile(nomsu, defs)
|
|
||||||
|
|
||||||
class NomsuCompiler
|
class NomsuCompiler
|
||||||
@def_number: 0
|
@def_number: 0
|
||||||
@ -237,8 +166,6 @@ class NomsuCompiler
|
|||||||
signature = @get_stubs {signature}
|
signature = @get_stubs {signature}
|
||||||
elseif type(signature) == 'table' and type(signature[1]) == 'string'
|
elseif type(signature) == 'table' and type(signature[1]) == 'string'
|
||||||
signature = @get_stubs signature
|
signature = @get_stubs signature
|
||||||
if @debug
|
|
||||||
@write colored.magenta "Defined rule #{repr signature}"
|
|
||||||
assert type(thunk) == 'function', "Bad thunk: #{repr thunk}"
|
assert type(thunk) == 'function', "Bad thunk: #{repr thunk}"
|
||||||
canonical_args = nil
|
canonical_args = nil
|
||||||
canonical_escaped_args = nil
|
canonical_escaped_args = nil
|
||||||
@ -391,16 +318,10 @@ class NomsuCompiler
|
|||||||
|
|
||||||
parse: (str, filename)=>
|
parse: (str, filename)=>
|
||||||
if @debug
|
if @debug
|
||||||
@writeln("#{colored.bright "PARSING:"}\n#{str}")
|
@writeln("#{colored.bright "PARSING:"}\n#{colored.yellow str}")
|
||||||
str = str\gsub("\r","")
|
str = str\gsub("\r","")
|
||||||
export indent_stack, CURRENT_FILE
|
tree = parse(str, filename)
|
||||||
old_file = CURRENT_FILE
|
assert tree, "In file #{colored.blue filename} failed to parse:\n#{colored.onyellow colored.black str}"
|
||||||
old_indent_stack, indent_stack = indent_stack, {0}
|
|
||||||
CURRENT_FILE = filename
|
|
||||||
tree = nomsu\match(str)
|
|
||||||
indent_stack = old_indent_stack -- Put it back, just in case.
|
|
||||||
CURRENT_FILE = old_file
|
|
||||||
assert tree, "Failed to parse: #{str}"
|
|
||||||
if @debug
|
if @debug
|
||||||
@writeln "PARSE TREE:"
|
@writeln "PARSE TREE:"
|
||||||
@print_tree tree, " "
|
@print_tree tree, " "
|
||||||
@ -660,20 +581,18 @@ end)]])\format(concat(lua_bits, "\n"))
|
|||||||
for arg in *tree.value
|
for arg in *tree.value
|
||||||
if arg.type == 'Word' then continue
|
if arg.type == 'Word' then continue
|
||||||
if escaped_args[arg_names[arg_num]]
|
if escaped_args[arg_names[arg_num]]
|
||||||
arg = {type:"Nomsu", value:arg, line_no:tree.line_no}
|
insert args, "nomsu:parse(#{repr arg.src}, #{repr tree.line_no}).value[1]"
|
||||||
expr,statement = @tree_to_lua arg, filename
|
else
|
||||||
if statement
|
expr,statement = @tree_to_lua arg, filename
|
||||||
@error "Cannot use [[#{arg.src}]] as a function argument, since it's not an expression."
|
if statement
|
||||||
insert args, expr
|
@error "Cannot use [[#{arg.src}]] as a function argument, since it's not an expression."
|
||||||
|
insert args, expr
|
||||||
arg_num += 1
|
arg_num += 1
|
||||||
|
|
||||||
remove @compilestack
|
remove @compilestack
|
||||||
return @@comma_separated_items("nomsu:call(", args, ")"), nil
|
return @@comma_separated_items("nomsu:call(", args, ")"), nil
|
||||||
|
|
||||||
when "String"
|
when "String"
|
||||||
if @debug
|
|
||||||
@writeln (colored.bright "STRING:")
|
|
||||||
@print_tree tree
|
|
||||||
concat_parts = {}
|
concat_parts = {}
|
||||||
string_buffer = ""
|
string_buffer = ""
|
||||||
for bit in *tree.value
|
for bit in *tree.value
|
||||||
@ -796,12 +715,12 @@ end)]])\format(concat(lua_bits, "\n"))
|
|||||||
-- (e.g. "say %msg") or function call (e.g. FunctionCall({Word("say"), Var("msg")))
|
-- (e.g. "say %msg") or function call (e.g. FunctionCall({Word("say"), Var("msg")))
|
||||||
if type(x) == 'string'
|
if type(x) == 'string'
|
||||||
-- Standardize format to stuff separated by spaces
|
-- Standardize format to stuff separated by spaces
|
||||||
x = x\gsub("\n%s*%.%.", " ")
|
patt = re.compile "{|(' '+ / '\n..' / {'\\'? '%' %id*} / {%id+} / {%op+})*|}",
|
||||||
x = lpeg.Cs((operator / ((op)->" #{op} ") + 1)^0)\match(x)
|
id:IDENT_CHAR, op:OPERATOR_CHAR
|
||||||
x = x\gsub("%s+"," ")\gsub("^%s*","")\gsub("%s*$","")
|
spec = concat patt\match(x), " "
|
||||||
stub = x\gsub("%%%S+","%%")\gsub("\\","")
|
stub = spec\gsub("%%%S+","%%")\gsub("\\","")
|
||||||
arg_names = [arg for arg in x\gmatch("%%([^%s]*)")]
|
arg_names = [arg for arg in spec\gmatch("%%([^%s]*)")]
|
||||||
escaped_args = set [arg for arg in x\gmatch("\\%%([^%s]*)")]
|
escaped_args = set [arg for arg in spec\gmatch("\\%%(%S*)")]
|
||||||
return stub, arg_names, escaped_args
|
return stub, arg_names, escaped_args
|
||||||
if type(x) != 'table'
|
if type(x) != 'table'
|
||||||
@error "Invalid type for getting stub: #{type(x)} for:\n#{repr x}"
|
@error "Invalid type for getting stub: #{type(x)} for:\n#{repr x}"
|
||||||
@ -846,9 +765,12 @@ end)]])\format(concat(lua_bits, "\n"))
|
|||||||
|
|
||||||
typecheck: (vars, varname, desired_type)=>
|
typecheck: (vars, varname, desired_type)=>
|
||||||
x = vars[varname]
|
x = vars[varname]
|
||||||
if type(x) == desired_type then return x
|
x_type = type(x)
|
||||||
if type(x) == 'table' and x.type == desired_type then return x
|
if x_type == desired_type then return x
|
||||||
@error "Invalid type for %#{varname}. Expected #{desired_type}, but got #{repr x}."
|
if x_type == 'table'
|
||||||
|
x_type = x.type or x_type
|
||||||
|
if x_type == desired_type then return x
|
||||||
|
@error "Invalid type for %#{varname}. Expected #{desired_type}, but got #{x_type}:\n#{repr x}"
|
||||||
|
|
||||||
source_code: (level=0)=>
|
source_code: (level=0)=>
|
||||||
@dedent @compilestack[#@compilestack-level].src
|
@dedent @compilestack[#@compilestack-level].src
|
||||||
@ -881,12 +803,16 @@ end)]])\format(concat(lua_bits, "\n"))
|
|||||||
@defmacro "__src__ %level", (vars)=>
|
@defmacro "__src__ %level", (vars)=>
|
||||||
@repr @source_code @tree_to_value vars.level
|
@repr @source_code @tree_to_value vars.level
|
||||||
|
|
||||||
|
@def "derp \\%foo derp \\%bar", (vars)=>
|
||||||
|
lua = "local x = "..repr([t.stub for t in *vars.foo.value])..";\nlocal y = "..@tree_to_lua(vars.bar)
|
||||||
|
print(colored.green lua)
|
||||||
|
|
||||||
run_file = (vars)=>
|
run_file = (vars)=>
|
||||||
if vars.filename\match(".*%.lua")
|
if vars.filename\match(".*%.lua")
|
||||||
return dofile(vars.filename)(@, vars)
|
return dofile(vars.filename)(@, vars)
|
||||||
if vars.filename\match(".*%.nom")
|
if vars.filename\match(".*%.nom")
|
||||||
if not @skip_precompiled -- Look for precompiled version
|
if not @skip_precompiled -- Look for precompiled version
|
||||||
file = io.open(vars.filename\gsub("%.nom", ".compiled.nom"), "r")
|
file = io.open(vars.filename\gsub("%.nom", ".nomc"), "r")
|
||||||
file = file or io.open(vars.filename)
|
file = file or io.open(vars.filename)
|
||||||
if not file
|
if not file
|
||||||
@error "File does not exist: #{vars.filename}"
|
@error "File does not exist: #{vars.filename}"
|
||||||
@ -922,11 +848,12 @@ if arg
|
|||||||
os.exit!
|
os.exit!
|
||||||
|
|
||||||
c = NomsuCompiler()
|
c = NomsuCompiler()
|
||||||
|
|
||||||
c.skip_precompiled = not args.flags["-O"]
|
c.skip_precompiled = not args.flags["-O"]
|
||||||
if args.input
|
if args.input
|
||||||
-- Read a file or stdin and output either the printouts or the compiled lua
|
-- Read a file or stdin and output either the printouts or the compiled lua
|
||||||
if args.flags["-c"] and not args.output
|
if args.flags["-c"] and not args.output
|
||||||
args.output = args.input\gsub("%.nom", ".compiled.nom")
|
args.output = args.input\gsub("%.nom", ".nomc")
|
||||||
compiled_output = nil
|
compiled_output = nil
|
||||||
if args.flags["-p"]
|
if args.flags["-p"]
|
||||||
_write = c.write
|
_write = c.write
|
||||||
|
92
nomsu.peg
Normal file
92
nomsu.peg
Normal file
@ -0,0 +1,92 @@
|
|||||||
|
file (File):
|
||||||
|
{| shebang?
|
||||||
|
(ignored_line %nl)*
|
||||||
|
statements (nodent statements)*
|
||||||
|
(%nl ignored_line)*
|
||||||
|
(!. / (("" -> "Parse error") => error)?) |}
|
||||||
|
|
||||||
|
shebang: "#!" [^%nl]* %nl
|
||||||
|
|
||||||
|
inline_statements: inline_statement (semicolon inline_statement)*
|
||||||
|
noeol_statements: (inline_statement semicolon noeol_statements) / noeol_statement
|
||||||
|
statements: (inline_statement semicolon statements) / statement
|
||||||
|
|
||||||
|
statement: functioncall / expression
|
||||||
|
noeol_statement: noeol_functioncall / noeol_expression
|
||||||
|
inline_statement: inline_functioncall / inline_expression
|
||||||
|
|
||||||
|
inline_thunk (Thunk): {| "{" %ws* inline_statements %ws* "}" |}
|
||||||
|
eol_thunk (Thunk): {| ":" %ws* noeol_statements eol |}
|
||||||
|
indented_thunk (Thunk):
|
||||||
|
{| (":" / "{..}") indent
|
||||||
|
statements (nodent statements)*
|
||||||
|
(dedent / (("" -> "Error while parsing thunk") => error))
|
||||||
|
|}
|
||||||
|
|
||||||
|
inline_nomsu (Nomsu): "\" inline_expression
|
||||||
|
eol_nomsu (Nomsu): "\" noeol_expression
|
||||||
|
indented_nomsu (Nomsu): "\" expression
|
||||||
|
|
||||||
|
inline_expression:
|
||||||
|
number / variable / inline_string / inline_list / inline_nomsu
|
||||||
|
/ inline_thunk / ("(" %ws* inline_statement %ws* ")")
|
||||||
|
noeol_expression:
|
||||||
|
indented_string / indented_nomsu / indented_list / indented_thunk
|
||||||
|
/ ("(..)" indent
|
||||||
|
statement
|
||||||
|
(dedent / (("" -> "Error while parsing indented expression") => error))
|
||||||
|
) / inline_expression
|
||||||
|
expression: eol_thunk / eol_nomsu / noeol_expression
|
||||||
|
|
||||||
|
-- Function calls need at least one word in them
|
||||||
|
inline_functioncall (FunctionCall):
|
||||||
|
{| (inline_expression %ws*)* word (%ws* (inline_expression / word))* |}
|
||||||
|
noeol_functioncall (FunctionCall):
|
||||||
|
{| (noeol_expression %ws*)* word (%ws* (noeol_expression / word))* |}
|
||||||
|
functioncall (FunctionCall):
|
||||||
|
{| (expression (dotdot / %ws*))* word ((dotdot / %ws*) (expression / word))* |}
|
||||||
|
|
||||||
|
word (Word): { %operator+ / (!number plain_word) }
|
||||||
|
|
||||||
|
inline_string (String):
|
||||||
|
'"' {|
|
||||||
|
({~ (('\"' -> '"') / ('\\' -> '\') / %escape_char / [^%nl\"])+ ~}
|
||||||
|
/ string_interpolation)*
|
||||||
|
|} '"'
|
||||||
|
indented_string (String):
|
||||||
|
'".."' %ws* line_comment? %nl %gt_nodented? {|
|
||||||
|
({~ (("\\" -> "\") / (%nl+ {~ %gt_nodented -> "" ~}) / [^%nl\])+ ~} / string_interpolation)*
|
||||||
|
|} ((!.) / (&(%nl+ !%gt_nodented)) / (("" -> "Error while parsing String") => error))
|
||||||
|
|
||||||
|
string_interpolation: "\" ((noeol_expression dotdot?) / dotdot)
|
||||||
|
|
||||||
|
number (Number): (("-"? (([0-9]+ "." [0-9]+) / ("." [0-9]+) / ([0-9]+)))-> tonumber)
|
||||||
|
|
||||||
|
-- Variables can be nameless (i.e. just %) and can't contain operators like apostrophe
|
||||||
|
-- which is a hack to allow %'s to parse as "%" and "' s" separately
|
||||||
|
variable (Var): "%" { plain_word? }
|
||||||
|
|
||||||
|
inline_list (List):
|
||||||
|
"[" %ws* {| (inline_list_item (comma inline_list_item)* comma?)? |} %ws* "]"
|
||||||
|
indented_list (List):
|
||||||
|
"[..]" indent {|
|
||||||
|
list_line (nodent list_line)*
|
||||||
|
|}
|
||||||
|
(dedent / (("" -> "Error while parsing list") => error))
|
||||||
|
list_line:
|
||||||
|
(inline_list_item (comma inline_list_item)* (comma (functioncall / expression)?)?)
|
||||||
|
/ (functioncall / expression)
|
||||||
|
inline_list_item: inline_functioncall / inline_expression
|
||||||
|
|
||||||
|
block_comment: "#.." [^%nl]* (%nl (%ws* &%nl))* %nl %indented [^%nl]+ (%nl ((%ws* ((!.) / &%nl)) / (!%dedented [^%nl]+)))*
|
||||||
|
line_comment: "#" [^%nl]*
|
||||||
|
|
||||||
|
eol: %ws* line_comment? (!. / &%nl)
|
||||||
|
ignored_line: (%nodented (block_comment / line_comment)) / (%ws* (!. / &%nl))
|
||||||
|
indent: eol (%nl ignored_line)* %nl %indented ((block_comment/line_comment) (%nl ignored_line)* nodent)?
|
||||||
|
nodent: eol (%nl ignored_line)* %nl %nodented
|
||||||
|
dedent: eol (%nl ignored_line)* (((!.) &%dedented) / (&(%nl %dedented)))
|
||||||
|
comma: %ws* "," %ws*
|
||||||
|
semicolon: %ws* ";" %ws*
|
||||||
|
dotdot: nodent ".." %ws*
|
||||||
|
plain_word: ([a-zA-Z0-9_] / %utf8_char)+
|
@ -190,7 +190,8 @@ local function min(list, keyFn)
|
|||||||
return keyTable[k]
|
return keyTable[k]
|
||||||
end
|
end
|
||||||
end
|
end
|
||||||
local best, bestKey = list[1], keyFn(best)
|
local best = list[1]
|
||||||
|
local bestKey = keyFn(best)
|
||||||
for i = 2, #list do
|
for i = 2, #list do
|
||||||
local key = keyFn(list[i])
|
local key = keyFn(list[i])
|
||||||
if key < bestKey then
|
if key < bestKey then
|
||||||
@ -212,7 +213,8 @@ local function max(list, keyFn)
|
|||||||
return keyTable[k]
|
return keyTable[k]
|
||||||
end
|
end
|
||||||
end
|
end
|
||||||
local best, bestKey = list[1], keyFn(best)
|
local best = list[1]
|
||||||
|
local bestKey = keyFn(best)
|
||||||
for i = 2, #list do
|
for i = 2, #list do
|
||||||
local key = keyFn(list[i])
|
local key = keyFn(list[i])
|
||||||
if key > bestKey then
|
if key > bestKey then
|
||||||
|
Loading…
Reference in New Issue
Block a user