nomsu/nomsu.moon

1156 lines
51 KiB
Plaintext
Raw Normal View History

2017-09-05 23:51:35 -07:00
#!/usr/bin/env moon
-- This file contains the source code of the Nomsu compiler.
-- Nomsu is a programming language that cross-compiles to Lua. It was designed to be good
-- at natural-language-like code that is highly self-modifying and flexible.
-- The only dependency is LPEG, which can be installed using "luarocks install lpeg"
-- File usage:
-- Either, in a lua/moonscript file:
-- Nomsu = require "nomsu"
-- nomsu = Nomsu()
-- nomsu:run(your_nomsu_code)
-- Or from the command line:
-- lua nomsu.lua [input_file [output_file or -]]
lfs = require 'lfs'
re = require 're'
lpeg = require 'lpeg'
2017-12-18 16:26:26 -08:00
utils = require 'utils'
new_uuid = require 'uuid'
immutable = require 'immutable'
2017-12-18 16:19:56 -08:00
{:repr, :stringify, :min, :max, :equivalent, :set, :is_list, :sum} = utils
colors = setmetatable({}, {__index:->""})
2017-12-30 14:31:07 -08:00
colored = setmetatable({}, {__index:(_,color)-> ((msg)-> colors[color]..(msg or '')..colors.reset)})
{:insert, :remove, :concat} = table
2018-02-27 14:31:19 -08:00
_Tuple = immutable(nil)
-- Build an immutable tuple from the array part of the table `t`.
Tuple = (t)-> _Tuple table.unpack t
-- Memoize a one-argument method. Results are stored in a weak-keyed table that
-- is keyed on `arg` only (the receiver is not part of the key).
--   fn: a function taking (self, arg)
-- Returns a wrapper with the same calling convention as `fn`.
cached = (fn)->
    cache = setmetatable({}, {__mode:"k"})
    return (self, arg)->
        -- nil cannot be used as a table key, so such calls bypass the cache
        if arg == nil then return fn(self, arg)
        result = cache[arg]
        -- Compare against nil (not truthiness) so a cached `false` is reused
        if result == nil
            result = fn(self, arg)
            cache[arg] = result
        return result
-- Use + operator for string coercive concatenation (note: "asdf" + 3 == "asdf3")
-- Use [] for accessing string characters, or s[{3,4}] for s:sub(3,4)
-- Note: This globally affects all strings in this instance of Lua!
do
    string_mt = getmetatable("")
    -- "asdf" + 3 == "asdf3": the right operand is stringified and appended
    string_mt.__add = (other)=> @ .. stringify(other)
    -- s[3] is the 3rd character, s[{3,4}] is s:sub(3,4); any other key falls
    -- through to the `string` library so method calls keep working
    string_mt.__index = (key)=>
        key_type = type(key)
        if key_type == 'number'
            return string.sub(@, key, key)
        if key_type == 'table'
            return string.sub(@, key[1], key[2])
        return string[key]
    -- Can't use this because it breaks some LPEG stuff
    --STRING_METATABLE.__mul = (other)=> string.rep(@, other)
2017-09-05 23:51:35 -07:00
-- TODO:
2017-10-02 19:35:01 -07:00
-- consider non-linear codegen, rather than doing thunks for things like comprehensions
2017-09-13 16:22:04 -07:00
-- improve indentation of generated lua code
2017-09-13 16:08:26 -07:00
-- better error reporting
-- type checking?
2017-10-23 14:55:12 -07:00
-- Add compiler options for optimization level (compile-fast vs. run-fast, etc.)
2018-01-11 01:19:03 -08:00
-- Do a pass on all actions to enforce parameters-are-nouns heuristic
2018-01-11 14:07:14 -08:00
-- Maybe do some sort of lazy definitions of actions that defer until they're used in code
-- Add a ((%x foo %y) where {x:"asdf", y:"fdsa"}) compile-time action for substitution
2017-09-05 23:51:35 -07:00
2017-08-22 01:02:41 -07:00
lpeg.setmaxstack 10000 -- whoa
{:P,:R,:V,:S,:Cg,:C,:Cp,:B,:Cmt} = lpeg
Types = {}
for t in *{"File", "Nomsu", "Block", "List", "FunctionCall", "Text", "Dict", "Number", "Word", "Var", "Comment"}
Types[t] = immutable({"id","value"}, {type:t, name:t})
Types.DictEntry = immutable({"key","value"}, {name:"DictEntry"})
Types.is_node = (n)->
type(n) == 'userdata' and n.type
NOMSU_DEFS = with {}
-- Newline supports either windows-style CR+LF or unix-style LF
.Tuple = Tuple
.DictEntry = (k,v) -> Types.DictEntry(k,v)
.nl = P("\r")^-1 * P("\n")
.ws = S(" \t")
.tonumber = tonumber
.print = (src,pos,msg)->
print(msg, pos, repr(src\sub(math.max(0,pos-16),math.max(0,pos-1)).."|"..src\sub(pos,pos+16)))
return true
string_escapes = n:"\n", t:"\t", b:"\b", a:"\a", v:"\v", f:"\f", r:"\r"
digit, hex = R('09'), R('09','af','AF')
.escaped_char = (P("\\")*S("xX")*C(hex*hex)) / => string.char(tonumber(@, 16))
.escaped_char += (P("\\")*C(digit*(digit^-2))) / => string.char(tonumber @)
.escaped_char += (P("\\")*C(S("ntbavfr"))) / string_escapes
.operator_char = S("'~`!@$^&*-+=|<>?/")
.operator = .operator_char^1
.utf8_char = (
R("\194\223")*R("\128\191") +
R("\224\239")*R("\128\191")*R("\128\191") +
R("\240\244")*R("\128\191")*R("\128\191")*R("\128\191"))
.ident_char = R("az","AZ","09") + P("_") + .utf8_char
-- If the line begins with #indent+4 spaces, the pattern matches *those* spaces
-- and adds them to the stack (not any more).
-- LPEG match-time function: succeeds when the text at `start` begins with the
-- current indentation plus one extra level, pushes that deeper indentation on
-- the stack and consumes it. Returns nothing (no match) otherwise.
.indent = P (start)=>
    stack = lpeg.userdata.indent_stack
    nodent = stack[#stack]
    -- One level is 4 spaces; this must agree with `.dedent`, which pops a
    -- level when the leading whitespace is at least 4 spaces shorter.
    indented = nodent.."    "
    if @sub(start, start+#indented-1) == indented
        insert(stack, indented)
        return start + #indented
-- If the number of leading space characters is <= the number of space on the top of the
-- stack minus 4, this pattern matches and pops off the top of the stack exactly once.
-- LPEG match-time function: pops one indentation level (without consuming any
-- input) when the run of spaces at `start` is at least 4 shorter than the
-- indentation on top of the stack.
.dedent = P (start)=>
    stack = lpeg.userdata.indent_stack
    current = stack[#stack]
    leading = @match("[ ]*", start)
    if #leading <= #current-4
        remove(stack)
        return start
-- If the number of leading space characters is >= the number on the top of the
-- stack, this pattern matches and does not modify the stack.
-- LPEG match-time function: consumes the current indentation when the text at
-- `start` begins with it; the indentation stack is left untouched.
.nodent = P (start)=>
    stack = lpeg.userdata.indent_stack
    current = stack[#stack]
    stop = start + #current
    if @sub(start, stop-1) == current
        return stop
-- Raise a parse error that names the file and line and shows the offending
-- line (with a "----^" pointer) between its neighbouring lines.
--   src: unused; the source text is read from lpeg.userdata instead
--   pos: position in the source where parsing failed
--   err_msg: optional message prefix (defaults to "Parse error")
.error = (src,pos,err_msg)->
    {:source_code, :line_starts, :filename} = lpeg.userdata
    -- If the failure is reported on a line break, skip ahead over whitespace
    if source_code\sub(pos,pos)\match("[\r\n]")
        pos += #source_code\match("[ \t\n\r]*", pos)
    line_no = 1
    while (line_starts[line_no+1] or math.huge) < pos
        line_no += 1
    line_at = (n)-> source_code\match("[^\r\n]*", line_starts[n])
    prev_line = if line_no > 1 then line_at(line_no-1) else ""
    err_line = line_at(line_no)
    next_line = if line_no < #line_starts then line_at(line_no+1) else ""
    pointer = ("-")\rep(pos-line_starts[line_no]) .. "^"
    err_msg = (err_msg or "Parse error").." in #{filename} on line #{line_no}:\n"
    err_msg ..="\n#{prev_line}\n#{err_line}\n#{pointer}\n#{next_line}\n"
    error(err_msg)
node_id = 0
-- Any name the grammar looks up that is not defined above is treated as a node
-- type: a constructor for Types[key] is created on demand and memoized.
setmetatable(NOMSU_DEFS, {__index:(key)=>
    make_node = (start, value, stop)->
        node_id += 1
        -- Raw tables are rejected as node values
        if type(value) == 'table' then error(value)-- = Tuple(value)
        node = Types[key](node_id, value)
        -- Remember where in which source this node came from
        userdata = lpeg.userdata
        userdata.tree_metadata[node] = {
            :start
            :stop
            filename: userdata.filename
            source_code: userdata.source_code
        }
        return node
    self[key] = make_node
    return make_node
})
-- Compile the Nomsu grammar. The language spec lives in "nomsu.peg", written
-- in a slightly modified version of the lpeg.re syntax; `peg_tidier` rewrites
-- it into plain lpeg.re before it is compiled against NOMSU_DEFS.
NOMSU = do
    peg_tidier = re.compile [[
    file <- {~ %nl* (def/comment) (%nl+ (def/comment))* %nl* ~}
    def <- anon_def / captured_def
    anon_def <- ({ident} (" "*) ":"
        {((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- %2"
    captured_def <- ({ident} (" "*) "(" {ident} ")" (" "*) ":"
        {((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- ({} %3 {}) -> %2"
    ident <- [a-zA-Z_][a-zA-Z0-9_]*
    comment <- "--" [^%nl]*
    ]]
    -- Fail with a readable message if the grammar file is missing, and make
    -- sure the handle is closed once the text has been read.
    peg_file = assert(io.open("nomsu.peg"), "Could not open grammar file: nomsu.peg")
    raw_peg = peg_file\read("*a")
    peg_file\close!
    nomsu_peg = assert(peg_tidier\match(raw_peg), "Failed to tidy the grammar in nomsu.peg")
    re.compile(nomsu_peg, NOMSU_DEFS)
2017-09-13 16:22:04 -07:00
class NomsuCompiler
-- Set up a fresh compiler: ID table, bookkeeping tables, the environment that
-- generated Lua code runs in, and finally the core definitions.
new: =>
    -- Weak-key mapping from objects to randomly generated unique IDs.
    -- nil and NaN can't be table keys, so each gets a surrogate key object.
    nil_surrogate, NaN_surrogate = {}, {}
    lazy_id = (ids, key)->
        if key == nil then return ids[nil_surrogate]
        elseif key != key then return ids[NaN_surrogate]
        id = new_uuid!
        ids[key] = id
        return id
    @ids = setmetatable({}, {__mode:"k", __index:lazy_id})

    weak_keyed = -> setmetatable({}, {__mode:"k"})
    @file_metadata = weak_keyed!
    @tree_metadata = weak_keyed!
    @action_metadata = weak_keyed!
    @use_stack = {}
    @compilestack = {}
    @debug = false

    @environment = {
        -- Discretionary/convenience stuff
        nomsu:@, :repr, :stringify, :utils, :lpeg, :re,
        -- Lua stuff:
        :next, :unpack, :setmetatable, :coroutine, :rawequal, :getmetatable, :pcall,
        :error, :package, :os, :require, :tonumber, :tostring, :string, :xpcall, :module,
        :print, :loadfile, :rawset, :_VERSION, :collectgarbage, :rawget, :bit32, :rawlen,
        :table, :assert, :dofile, :loadstring, :type, :select, :debug, :math, :io, :pairs,
        :load, :ipairs,
    }
    -- Looking up an action that was never defined is an error
    undefined_action = (actions, key)->
        error("Attempt to run undefined action: #{key}", 0)
    @environment.ACTIONS = setmetatable({}, {__index:undefined_action})
    @environment.LOADED = {}
    @environment.Types = Types
    @initialize_core!
-- Register `fn` as the implementation of every alias in `signature`.
--   signature: a string or a list of strings such as "say %msg"
--   source: stored as-is in the action's metadata
--   fn: the Lua function to run; unless it is variadic, its parameter names
--       must include every %variable that appears in each alias
-- Raises an error for a non-function `fn`, an invalid signature, or an alias
-- argument that has no matching parameter in `fn`.
define_action: (signature, source, fn)=>
    if @debug
        print "#{colored.bright "DEFINING ACTION:"} #{colored.green repr(signature)}"
    if type(fn) != 'function'
        error("Bad fn: #{repr fn}", 0)
    if type(signature) == 'string'
        signature = {signature}
    elseif type(signature) != 'table' or signature.type != nil
        error("Invalid signature, expected list of strings, but got: #{repr signature}", 0)
    stubs = @get_stubs_from_signature signature
    stub_args = @get_args_from_signature signature
    fn_info = debug.getinfo(fn, "u")
    local fn_arg_positions, arg_orders
    unless fn_info.isvararg
        -- Map from parameter name -> position in fn's parameter list
        fn_arg_positions = {debug.getlocal(fn, i), i for i=1,fn_info.nparams}
        arg_orders = {} -- Map from stub -> index where each arg in the stub goes in the function call
    for sig_i=1,#stubs
        stub, args = stubs[sig_i], stub_args[sig_i]
        if @debug
            print "#{colored.bright "ALIAS:"} #{colored.underscore colored.magenta repr(stub)} #{colored.bright "WITH ARGS"} #{colored.dim repr(args)} ON: #{@environment.ACTIONS}"
        @environment.ACTIONS[stub] = fn
        unless fn_info.isvararg
            -- Look each argument up explicitly: a missing one would otherwise
            -- leave a nil hole in the list, making a length check unreliable
            arg_positions = {}
            for a in *args
                position = fn_arg_positions[a]
                unless position
                    error("Mismatch in args between lua function's #{repr fn_arg_positions} and stub's #{repr args} for #{repr stub}", 0)
                insert arg_positions, position
            arg_orders[stub] = arg_positions
    @action_metadata[fn] = {
        :fn, :source, aliases:stubs, :arg_orders,
        arg_positions:fn_arg_positions, def_number:@@def_number,
    }
-- Define an action exactly like define_action, then flag it as compile-time
-- in its metadata. (`src` is accepted but not used.)
define_compile_action: (signature, source, fn, src)=>
    @define_action signature, source, fn
    metadata = @action_metadata[fn]
    metadata.compile_time = true
2017-12-15 15:30:05 -08:00
-- Placeholder: currently always raises "Not currently functional." and never
-- reads `scope` or `after`.
serialize_defs: (scope=nil, after=nil)=>
    -- TODO: repair
    error("Not currently functional.", 0)
-- TODO: figure out whether indent/dedent should affect first line
-- Strip the common leading whitespace from every line of `code` after the
-- first. Single-line input is returned unchanged.
dedent: (code)=>
    unless code\find("\n")
        return code
    -- `spaces`: smallest indentation among lines starting with ".."
    -- `indent_spaces`: smallest indentation among all other non-blank lines
    spaces, indent_spaces = math.huge, math.huge
    -- Only lines that follow a newline are examined (the first line is skipped)
    for line in code\gmatch("\n([^\n]*)")
        if line\match("^%s*#.*") or line\match("^%s*$")
            continue -- skip comments and blank lines
        elseif s = line\match("^(%s*)%.%..*")
            spaces = math.min(spaces, #s)
        elseif s = line\match("^(%s*)%S.*")
            indent_spaces = math.min(indent_spaces, #s)
    -- The parentheses around gsub drop its second return value (the count)
    if spaces != math.huge and spaces < indent_spaces
        return (code\gsub("\n"..(" ")\rep(spaces), "\n"))
    elseif indent_spaces != math.huge
        return (code\gsub("\n"..(" ")\rep(indent_spaces), "\n "))
    else return code
-- Indent every line of `code` after the first by `levels` indentation units.
-- Returns only the indented string: the parentheses drop gsub's substitution
-- count, so the result is safe to pass straight to a variadic function.
indent: (code, levels=1)=>
    return (code\gsub("\n","\n"..(" ")\rep(levels)))
-- Return "<filename>:<line>" for the line on which `tree` starts, using the
-- metadata recorded when the tree was parsed. Results are memoized per tree.
-- Raises an error if the tree or its file has no recorded metadata.
get_line_number: cached (tree)=>
    metadata = @tree_metadata[tree]
    unless metadata
        error "Failed to find metadata for tree: #{tree}", 0
    file_info = @file_metadata[metadata.filename]
    unless file_info
        error "Failed to find file metadata for file: #{metadata.filename}", 0
    line_starts = file_info.line_starts
    -- Advance while the next line begins before the tree's start position
    first_line = 1
    while first_line < #line_starts and line_starts[first_line+1] < metadata.start
        first_line += 1
    return "#{metadata.filename}:#{first_line}"
-- Return the (dedented) source text a tree was parsed from. Trees without
-- recorded metadata (e.g. dynamically generated ones) are converted back to
-- Nomsu code instead.
get_source_code: (tree)=>
    if info = @tree_metadata[tree]
        snippet = info.source_code\sub(info.start, info.stop-1)
        return @dedent snippet
    return @tree_to_nomsu(tree)
line_counter = re.compile([[
lines <- {| line (%nl line)* |}
line <- {} (!%nl .)*
]], nl:NOMSU_DEFS.nl)
-- Parse Nomsu source text into a syntax tree.
--   nomsu_code: the source text
--   filename: a string naming the source, used for metadata and error messages
-- Returns the parsed tree; raises an error if parsing fails.
parse: (nomsu_code, filename)=>
    assert type(filename) == "string", "Bad filename type: #{type filename}"
    if @debug
        print "#{colored.bright "PARSING:"}\n#{colored.yellow nomsu_code}"
    unless @file_metadata[filename]
        @file_metadata[filename] = {
            source_code:nomsu_code, :filename, line_starts:line_counter\match(nomsu_code)
        }
    userdata = {
        source_code:nomsu_code, :filename, indent_stack: {""}, tree_metadata:@tree_metadata,
        line_starts:@file_metadata[filename].line_starts,
    }
    -- The grammar callbacks read their state from lpeg.userdata. Run the match
    -- under pcall so the previous state is restored even when the grammar's
    -- error handler raises; otherwise an enclosing parse would be corrupted.
    old_userdata, lpeg.userdata = lpeg.userdata, userdata
    ok, tree = pcall(-> NOMSU\match(nomsu_code))
    lpeg.userdata = old_userdata
    unless ok then error(tree, 0)
    assert tree, "In file #{colored.blue filename} failed to parse:\n#{colored.onyellow colored.black nomsu_code}"
    if @debug
        print "PARSE TREE:"
        @print_tree tree
    return tree
2017-09-11 13:05:25 -07:00
2018-01-10 20:45:03 -08:00
-- Parse, compile and execute Nomsu source code.
--   src: Nomsu source text (an empty string is a no-op returning nil, "")
--   filename: name used for parsing metadata and the generated header comment
--   max_operations: optional VM instruction budget; exceeding it raises
--       "Execution quota exceeded"
--   output_file: optional handle that the generated Lua is written to
-- Returns the first value returned by the generated code, then the Lua code.
run: (src, filename, max_operations=nil, output_file=nil)=>
    if src == "" then return nil, ""
    if max_operations
        timeout = ->
            debug.sethook!
            error("Execution quota exceeded. Your code took too long.", 0)
        debug.sethook timeout, "", max_operations
    local ret, lua_code
    ok, err = pcall ->
        tree = @parse(src, filename)
        assert tree, "Failed to parse: #{src}"
        assert tree.type == "File", "Attempt to run non-file: #{tree.type}"
        lua = @tree_to_lua(tree)
        lua_code = lua.statements or (lua.expr..";")
        -- The locals live on the compile result, not on the code string
        if lua.locals and #lua.locals > 0
            lua_code = "local "..concat(lua.locals, ", ")..";\n"..lua_code
        lua_code = "-- File: #{filename}\n"..lua_code
        ret = @run_lua(lua_code)
        return nil
    -- Always remove the quota hook, even when compiling or running failed,
    -- so it can't fire later inside unrelated code
    if max_operations
        debug.sethook!
    unless ok then error(err, 0)
    if output_file
        output_file\write(lua_code)
    return ret, lua_code
2018-01-10 20:45:03 -08:00
-- Run a file or a directory of files.
--   * directory: runs every non-directory entry ending in ".nom"; returns nothing
--   * "*.lua": loads and runs the file inside the compiler's environment
--   * "*.nom": runs the sibling precompiled ".lua" file if one exists (unless
--     @skip_precompiled is set), otherwise compiles and runs the Nomsu source
-- Raises an error for missing files and unsupported extensions.
run_file: (filename)=>
    file_attributes = assert(lfs.attributes(filename), "File not found: #{filename}")
    if file_attributes.mode == "directory"
        for short_filename in lfs.dir(filename)
            full_filename = filename..'/'..short_filename
            attr = lfs.attributes(full_filename)
            -- attr is nil for entries that can't be stat'ed (e.g. dangling links)
            if attr and attr.mode != "directory" and short_filename\match("%.nom$")
                @run_file full_filename
        return
    -- Read a whole file and close the handle; nil if it can't be opened
    read_all = (path)->
        file = io.open(path, "r")
        return nil unless file
        contents = file\read("*a")
        file\close!
        return contents
    -- Extensions are anchored to the end of the name so that e.g. "a.lua.nom"
    -- or "a.nomad" are not misclassified
    if filename\match("%.lua$")
        contents = read_all(filename)
        unless contents
            error("File does not exist: #{filename}", 0)
        return assert(load(contents, nil, nil, @environment))!
    if filename\match("%.nom$")
        unless @skip_precompiled -- Look for precompiled version
            lua_code = read_all((filename\gsub("%.nom$", ".lua")))
            if lua_code
                return @run_lua(lua_code)
        nomsu_code = read_all(filename)
        unless nomsu_code
            error("File does not exist: #{filename}", 0)
        return @run(nomsu_code, filename)
    else
        error("Invalid filetype for #{filename}", 0)
-- Run a file at most once and return its cached result (or `true` when the
-- file produced no value). Raises an error if the file is already in the
-- middle of being loaded, i.e. on a circular import.
use_file: (filename)=>
    loaded = @environment.LOADED
    if not loaded[filename]
        for i,f in ipairs @use_stack
            if f == filename
                loop = [@use_stack[j] for j=i,#@use_stack]
                insert loop, filename
                error("Circular import, this loops forever: #{concat loop, " -> "}")
        insert @use_stack, filename
        ok, result = pcall -> @run_file(filename)
        -- Pop the entry whether or not the file ran successfully, so the stack
        -- only ever holds files that are still being loaded
        remove @use_stack
        unless ok then error(result, 0)
        loaded[filename] = result or true
    return loaded[filename]
2018-01-10 20:45:03 -08:00
-- Compile a string of Lua code inside the compiler's environment and run it,
-- returning whatever the chunk returns. If it fails to compile, raise an error
-- that shows the code with line numbers followed by the compiler's message.
run_lua: (lua_code)=>
    chunk, err = load(lua_code, nil, nil, @environment)
    if @debug
        print "#{colored.bright "RUNNING LUA:"}\n#{colored.blue colored.bright(lua_code)}"
    unless chunk
        line_no = 1
        number_next_line = ->
            line_no += 1
            return ("\n%-3d|")\format(line_no)
        numbered = lua_code\gsub("\n", number_next_line)
        code = "1 |"..numbered
        error("Failed to compile generated code:\n#{colored.bright colored.blue colored.onblack code}\n\n#{err}", 0)
    return chunk!
2018-01-10 20:45:03 -08:00
-- Evaluate a tree and return the resulting value(s): the tree is compiled to
-- a Lua expression which is run inside the compiler's environment.
-- (`filename` is accepted but not used.)
tree_to_value: (tree, filename)=>
    -- Special case for text literals: a Text made of one plain string is
    -- returned directly without compiling anything
    is_plain_text = tree.type == 'Text' and #tree.value == 1 and type(tree.value[1]) == 'string'
    if is_plain_text
        return tree.value[1]
    lua_expr = @tree_to_lua(tree).expr
    code = "return #{lua_expr};"
    if @debug
        print "#{colored.bright "RUNNING LUA TO GET VALUE:"}\n#{colored.blue colored.bright(code)}"
    lua_thunk, err = load(code, nil, nil, @environment)
    unless lua_thunk
        error("Failed to compile generated code:\n#{colored.bright colored.blue colored.onblack code}\n\n#{colored.red err}", 0)
    return lua_thunk!
-- Convert a tree into nomsu code that satisfies the max line requirement or nil
-- if that's not possible.
--   tree: the syntax tree node to convert
--   indentation, expr_type: accepted but not currently consulted
--   max_line: the line width the output tries to stay under
-- Three mutually recursive helpers produce the code:
--   inline_expression: code with no line breaks (e.g. for use inside
--       parentheses), or nil when the node can't be written on one line
--   noeol_expression: may span lines, but is safe after other code on a line
--   expression: anything that may appear at the top level
-- Raises an error when a line of a File cannot be converted.
tree_to_nomsu: (tree, indentation="", max_line=80, expr_type=nil)=>
    assert tree, "No tree provided to tree_to_nomsu."
    assert Types.is_node(tree), "Invalid tree: #{repr(tree)}"
    is_operator = (tok)-> tok and tok.type == "Word" and NOMSU_DEFS.operator\match(tok.value)
    local inline_expression, noeol_expression, expression
    inline_expression = (tok)->
        switch tok.type
            when "Block"
                if #tok.value > 1 then return nil
                -- NOTE(review): this passes the whole value tuple rather than
                -- its only element; kept as in the original -- confirm intent
                nomsu = inline_expression tok.value
                return nomsu and "(: #{nomsu})"
            when "FunctionCall"
                buff = ""
                for i,bit in ipairs tok.value
                    if bit.type == "Word"
                        -- No space at the start or between adjacent operators
                        if i == 1 or (is_operator(bit) and is_operator(tok.value[i-1]))
                            buff ..= bit.value
                        else buff ..= " "..bit.value
                    else
                        nomsu = inline_expression bit
                        return nil unless nomsu
                        unless i == 1 or bit.type == "Block"
                            buff ..= " "
                        buff ..= if bit.type == "FunctionCall"
                            "("..nomsu..")"
                        else nomsu
                return buff
            when "List"
                bits = {}
                for bit in *tok.value
                    nomsu = inline_expression bit
                    return nil unless nomsu
                    insert bits, nomsu
                return "["..concat(bits, ", ").."]"
            when "Dict"
                bits = {}
                for bit in *tok.value
                    key_nomsu = if bit.key.type == "Word"
                        bit.key.value
                    else inline_expression bit.key
                    return nil unless key_nomsu
                    if bit.key.type == "FunctionCall"
                        key_nomsu = "("..key_nomsu..")"
                    value_nomsu = inline_expression bit.value
                    return nil unless value_nomsu
                    insert bits, key_nomsu.."="..value_nomsu
                return "{"..concat(bits, ", ").."}"
            when "Text"
                buff = '"'
                for bit in *tok.value
                    if type(bit) == 'string'
                        -- Force indented text
                        return nil if bit\find("\n")
                        buff ..= bit\gsub("\\","\\\\")\gsub("\n","\\n")
                    else
                        nomsu = inline_expression(bit)
                        return nil unless nomsu
                        buff ..= if bit.type == "Var" or bit.type == "List" or bit.type == "Dict"
                            "\\"..nomsu
                        else "\\("..nomsu..")"
                    if #buff > max_line then return nil
                return buff..'"'
            when "Nomsu"
                nomsu = inline_expression(tok.value)
                return nil if not nomsu
                return "\\("..nomsu..")"
            when "Number" then return tostring(tok.value)
            when "Var" then return "%"..tok.value
            else return nil
    noeol_expression = (tok)->
        nomsu = inline_expression(tok)
        if nomsu and #nomsu < max_line
            return nomsu
        switch tok.type
            when "Block"
                buff = ":"
                for line in *tok.value
                    nomsu = expression(line)
                    return nil unless nomsu
                    buff ..= "\n "..@indent(nomsu)
                return buff
            when "FunctionCall"
                nomsu = expression(tok)
                return nil unless nomsu
                return "(..)\n "..@indent(nomsu)
            when "List"
                buff = "[..]"
                line = "\n "
                for bit in *tok.value
                    nomsu = inline_expression bit
                    -- Wrap before an item that would overflow the line. The
                    -- check only applies when the item has an inline form.
                    if nomsu and line != "\n " and #line + #", " + #nomsu > max_line
                        buff ..= line
                        line = "\n "
                    sep = line == "\n " and "" or ", "
                    if nomsu
                        line ..= sep..nomsu
                        if #line >= max_line
                            buff ..= line
                            line = "\n "
                    else
                        multiline = expression(bit)
                        -- Give up rather than concatenating nil
                        return nil unless multiline
                        line ..= sep..multiline
                        buff ..= line
                        line = "\n "
                if line ~= "\n "
                    buff ..= line
                return buff
            when "Dict"
                buff = "{..}"
                line = "\n "
                for bit in *tok.value
                    -- Same key handling as the inline Dict case: Word keys are
                    -- written bare
                    key_nomsu = if bit.key.type == "Word"
                        bit.key.value
                    else inline_expression bit.key
                    return nil unless key_nomsu
                    if bit.key.type == "FunctionCall"
                        key_nomsu = "("..key_nomsu..")"
                    value_nomsu = inline_expression bit.value
                    if value_nomsu and #key_nomsu + #value_nomsu < max_line
                        line ..= key_nomsu.."="..value_nomsu..","
                        if #line >= max_line
                            buff ..= line
                            line = "\n "
                    else
                        multiline = expression(bit.value)
                        -- Give up rather than concatenating nil
                        return nil unless multiline
                        line ..= key_nomsu.."="..multiline
                        buff ..= line
                        line = "\n "
                if line ~= "\n "
                    buff ..= line
                return buff
            when "Text"
                buff = '".."\n '
                for bit in *tok.value
                    if type(bit) == 'string'
                        buff ..= bit\gsub("\\","\\\\")\gsub("\n","\n ")
                    else
                        nomsu = inline_expression(bit)
                        return nil unless nomsu
                        buff ..= if bit.type == "Var" or bit.type == "List" or bit.type == "Dict"
                            "\\"..nomsu
                        else "\\("..nomsu..")"
                return buff
            when "Nomsu"
                nomsu = expression(tok.value)
                return nil if not nomsu
                return "\\(..)\n "..@indent(nomsu)
            when "Comment"
                if tok.value\find("\n")
                    return "#.."..tok.value\gsub("\n","\n ")
                else
                    return "#"..tok.value
            else return inline_expression(tok)
    expression = (tok)->
        nomsu = inline_expression(tok)
        if nomsu and #nomsu < max_line
            return nomsu
        switch tok.type
            when "Block"
                if #tok.value == 1
                    nomsu = if tok.value[1].type == "FunctionCall"
                        inline_expression(tok.value[1])
                    else
                        noeol_expression(tok.value[1])
                    -- Only the first line has to fit after the ": "
                    if nomsu and #(nomsu\match("[^\n]*")) < max_line
                        return ": "..nomsu
                return noeol_expression(tok)
            when "FunctionCall"
                -- The hard task
                buff = ""
                for i,bit in ipairs tok.value
                    if bit.type == "Word"
                        if i == 1 or (is_operator(bit) and is_operator(tok.value[i-1])) or buff\sub(-2,-1) == ".."
                            buff ..= bit.value
                        else
                            buff ..= " "..bit.value
                    else
                        nomsu = inline_expression(bit)
                        if nomsu and #nomsu < max_line
                            if bit.type == "FunctionCall"
                                nomsu = "("..nomsu..")"
                        else
                            nomsu = expression(bit)
                            return nil unless nomsu
                            if bit.type == "FunctionCall"
                                nomsu = "(..)\n "..@indent(nomsu)
                            -- ".." continues the call after an indented argument
                            if i < #tok.value
                                nomsu ..= "\n.."
                        unless i == 1 or bit.type == "Block"
                            buff ..= " "
                        buff ..= nomsu
                return buff
            when "File"
                lines = {}
                for line in *tree.value
                    nomsu = expression(line)
                    unless nomsu
                        src = @get_source_code line
                        error "Failed to produce output for:\n#{colored.yellow src}", 0
                    insert lines, nomsu
                return concat lines, "\n"
            when "Comment"
                if tok.value\find("\n")
                    return "#.."..tok.value\gsub("\n","\n ")
                else
                    return "#"..tok.value
            else return noeol_expression(tok)
    return expression(tree)
-- Convert a plain Lua value (nil, boolean, number, string, or a table of
-- those) into Nomsu source code that evaluates to it.
-- Raises an error for any other type.
value_to_nomsu: (value)=>
    switch type(value)
        when "nil"
            return "(nil)"
        -- type() reports "boolean"; there is no "bool" type name
        when "boolean"
            return value and "(yes)" or "(no)"
        when "number"
            -- TODO: support NaN, inf, etc.?
            return repr(value)
        when "table"
            if is_list(value)
                return "[#{concat [@value_to_nomsu(v) for v in *value], ", "}]"
            else
                return "{#{concat ["#{@value_to_nomsu(k)}:#{@value_to_nomsu(v)}" for k,v in pairs(value)], ", "}}"
        when "string"
            if value == "\n"
                return "'\\n'"
            elseif not value\find[["]] and not value\find"\n" and not value\find"\\"
                return "\""..value.."\""
            else
                -- TODO: This might fail if it's being put inside a list or something
                return '".."\n '..(@indent value)
        else
            error("Unsupported value_to_nomsu type: #{type(value)}", 0)
@math_patt: re.compile [[ "%" (" " [*/^+-] " %")+ ]]
-- Compile a syntax tree node to Lua.
-- Returns a table with an `expr` field (Lua code for a value) and/or a
-- `statements` field (Lua code to execute), plus an optional `locals` list of
-- variable names that the statements expect to be declared.
-- Raises an error for invalid trees and for non-expressions used where a
-- value is required.
tree_to_lua: (tree)=>
    assert tree, "No tree provided."
    if not Types.is_node(tree)
        error("Invalid tree: #{repr(tree)}", 0)
    switch tree.type
        when "File"
            if #tree.value == 1
                return @tree_to_lua(tree.value[1])
            declared_locals = {}
            lua_bits = {}
            for line in *tree.value
                lua = @tree_to_lua line
                if not lua
                    error("No lua produced by #{repr line}", 0)
                if lua.locals
                    -- Declare each local only once per file
                    new_locals = [l for l in *lua.locals when not declared_locals[l]]
                    if #new_locals > 0
                        insert lua_bits, "local #{concat new_locals, ", "};"
                        for l in *new_locals do declared_locals[l] = true
                if lua.statements then insert lua_bits, lua.statements
                elseif lua.expr then insert lua_bits, "#{lua.expr};"
            return statements:concat(lua_bits, "\n")

        when "Comment"
            return statements:"--"..tree.value\gsub("\n","\n--")

        when "Nomsu"
            return expr:"nomsu:parse(#{repr @get_source_code(tree.value)}, #{repr @get_line_number(tree.value)}).value[1]"

        when "Block"
            lua_bits = {}
            locals = {}
            for arg in *tree.value
                lua = @tree_to_lua arg
                -- A block holding a single expression is itself an expression
                if #tree.value == 1 and lua.expr and not lua.statements
                    return {expr:lua.expr, locals:lua.locals}
                if lua.locals
                    for l in *lua.locals do table.insert(locals, l)
                if lua.statements then insert lua_bits, lua.statements
                elseif lua.expr then insert lua_bits, "#{lua.expr};"
            utils.deduplicate(locals)
            return statements:concat(lua_bits, "\n"), locals:(#locals > 0 and locals or nil)

        when "FunctionCall"
            insert @compilestack, tree
            stub = @tree_to_stub tree
            -- Looking up an undefined action raises, so guard the lookup
            ok, fn = pcall(-> @environment.ACTIONS[stub])
            if not ok then fn = nil
            metadata = @action_metadata[fn]
            if metadata and metadata.compile_time
                -- Compile-time actions receive the argument trees themselves
                -- and return the Lua to use
                args = [arg for arg in *tree.value when arg.type != "Word"]
                if metadata and metadata.arg_orders
                    new_args = [args[p] for p in *metadata.arg_orders[stub]]
                    args = new_args
                if @debug
                    print "#{colored.bright "RUNNING MACRO"} #{colored.underscore colored.magenta(stub)} "
                    print "#{colored.bright "WITH ARGS:"} #{colored.dim concat([(repr a)\sub(1,100) for a in *args], ", ")}"
                -- `unpack` is only a global on some Lua versions
                lua = fn((table.unpack or unpack)(args))
                remove @compilestack
                return lua
            elseif not metadata and @@math_patt\match(stub)
                -- This is a bit of a hack, but this code handles arbitrarily complex
                -- math expressions like 2*x + 3^2 without having to define a single
                -- action for every possibility.
                bits = {}
                for tok in *tree.value
                    if tok.type == "Word"
                        insert bits, tok.value
                    else
                        lua = @tree_to_lua(tok)
                        unless lua.expr
                            src = @get_source_code(tok)
                            error("non-expression value inside math expression: #{colored.yellow src}")
                        insert bits, lua.expr
                remove @compilestack
                return expr:"(#{concat bits, " "})"

            args = {}
            for tok in *tree.value
                if tok.type == "Word" then continue
                lua = @tree_to_lua(tok)
                unless lua.expr
                    line = @get_line_number(tok)
                    src = @get_source_code(tok)
                    error "#{line}: Cannot use:\n#{colored.yellow src}\nas an argument to #{stub}, since it's not an expression, it produces: #{repr lua}", 0
                insert args, lua.expr

            -- Reorder the arguments to match the implementing function
            if metadata and metadata.arg_orders
                new_args = [args[p] for p in *metadata.arg_orders[stub]]
                args = new_args

            remove @compilestack
            return expr:@@comma_separated_items("ACTIONS[#{repr stub}](", args, ")")

        when "Text"
            concat_parts = {}
            string_buffer = ""
            for bit in *tree.value
                -- Merge adjacent literal pieces into a single Lua string
                if type(bit) == "string"
                    string_buffer ..= bit
                    continue
                if string_buffer ~= ""
                    insert concat_parts, repr(string_buffer)
                    string_buffer = ""
                lua = @tree_to_lua bit
                if @debug
                    print(colored.bright "INTERP:")
                    @print_tree bit
                    print "#{colored.bright "EXPR:"} #{lua.expr}, #{colored.bright "STATEMENT:"} #{lua.statements}"
                unless lua.expr
                    line = @get_line_number(bit)
                    src = @get_source_code(bit)
                    -- Report the source text; the node itself can't be concatenated
                    error "#{line}: Cannot use #{colored.yellow src} as a string interpolation value, since it's not an expression.", 0
                insert concat_parts, "stringify(#{lua.expr})"

            if string_buffer ~= ""
                insert concat_parts, repr(string_buffer)

            if #concat_parts == 0
                return expr:"''"
            elseif #concat_parts == 1
                return expr:concat_parts[1]
            else return expr:"(#{concat(concat_parts, "..")})"

        when "List"
            items = {}
            for item in *tree.value
                lua = @tree_to_lua item
                unless lua.expr
                    line = @get_line_number(item)
                    src = @get_source_code(item)
                    error "#{line}: Cannot use #{colored.yellow src} as a list item, since it's not an expression.", 0
                insert items, lua.expr
            return expr:@@comma_separated_items("{", items, "}")

        when "Dict"
            items = {}
            for entry in *tree.value
                key_lua = if entry.key.type == "Word"
                    {expr:repr(entry.key.value)}
                else
                    @tree_to_lua entry.key
                unless key_lua.expr
                    line = @get_line_number(entry.key)
                    src = @get_source_code(entry.key)
                    error "#{line}: Cannot use #{colored.yellow src} as a dict key, since it's not an expression.", 0
                value_lua = @tree_to_lua entry.value
                unless value_lua.expr
                    line = @get_line_number(entry.value)
                    src = @get_source_code(entry.value)
                    error "#{line}: Cannot use #{colored.yellow src} as a dict value, since it's not an expression.", 0
                -- Use the short `name=value` form only when the whole key
                -- expression is a quoted identifier; the anchors stop this from
                -- picking an identifier out of the middle of a larger expression
                key_str = key_lua.expr\match([=[^["']([a-zA-Z_][a-zA-Z0-9_]*)['"]$]=])
                if key_str
                    insert items, "#{key_str}=#{value_lua.expr}"
                elseif key_lua.expr\sub(1,1) == "["
                    -- Extra space so a long-bracket key doesn't produce "[["
                    insert items, "[ #{key_lua.expr}]=#{value_lua.expr}"
                else
                    insert items, "[#{key_lua.expr}]=#{value_lua.expr}"
            return expr:@@comma_separated_items("{", items, "}")

        when "Number"
            return expr:repr(tree.value)

        when "Var"
            return expr:@var_to_lua_identifier(tree.value)

        else
            error("Unknown/unimplemented thingy: #{tree.type}", 0)
2017-09-25 17:02:00 -07:00
-- Coroutine body for a pre-order traversal: yields (node, depth) for `tree`
-- and then for everything nested inside it. Non-node values are yielded too,
-- but not descended into.
walk_tree: (tree, depth=0)=>
    coroutine.yield(tree, depth)
    return unless Types.is_node(tree)
    deeper = depth + 1
    switch tree.type
        when "List", "File", "Block", "FunctionCall", "Text"
            for child in *tree.value
                @walk_tree(child, deeper)
        when "Dict"
            for entry in *tree.value
                @walk_tree(entry.key, deeper)
                @walk_tree(entry.value, deeper)
        else
            @walk_tree(tree.value, deeper)
    return nil
-- Print an outline of a tree, one node or leaf value per line, padded
-- according to its depth and wrapped in the bright green color codes.
print_tree: (tree)=>
    io.write(colors.bright..colors.green)
    for node,depth in coroutine.wrap(-> @walk_tree tree)
        padding = (" ")\rep(depth)
        if Types.is_node(node)
            print("#{padding}#{node.type}:")
        else
            print(padding..repr(node))
    io.write(colors.reset)
2017-09-25 17:02:00 -07:00
-- Return an outline of a tree as a string: one node or leaf value per line,
-- padded according to its depth.
tree_to_str: (tree)=>
    lines = {}
    for node,depth in coroutine.wrap(-> @walk_tree tree)
        padding = (" ")\rep(depth)
        line = if Types.is_node(node)
            "#{padding}#{node.type}:"
        else
            padding..repr(node)
        insert lines, line
    return concat(lines, "\n")
2017-09-11 13:05:25 -07:00
2017-09-21 13:30:59 -07:00
-- Return `str` with escape sequences replaced by the characters they denote:
-- \\ and \" plus everything matched by NOMSU_DEFS.escaped_char.
@unescape_string: (str)=>
    -- Cs is not among the names imported from lpeg at the top of the file,
    -- so it is reached through the module
    unescaper = lpeg.Cs(((P("\\\\")/"\\") + (P("\\\"")/'"') + NOMSU_DEFS.escaped_char + P(1))^0)
    return unescaper\match(str)
2017-09-21 13:30:59 -07:00
2017-09-11 13:05:25 -07:00
-- Join `items` with ", " between `open` and `close`, starting a new line each
-- time at least 80 characters have been emitted since the last line break.
@comma_separated_items: (open, items, close)=>
    pieces = {open}
    width = 0
    for index,item in ipairs(items)
        piece = item
        if index < #items
            piece = piece..", "
        pieces[#pieces+1] = piece
        width += #piece
        if width >= 80
            pieces[#pieces+1] = "\n"
            width = 0
    pieces[#pieces+1] = close
    return table.concat(pieces)
-- Return a new tree with fn mapped to each node. If fn provides a replacement,
-- use that and stop recursing, otherwise recurse.
--   tree: a node (anything that is not a node is returned unchanged)
--   fn: called with each node; a non-nil result replaces that node
-- Returns the original tree when nothing inside it changed.
tree_map: (tree, fn)=>
    unless Types.is_node(tree) then return tree
    replacement = fn(tree)
    if replacement != nil
        return replacement
    switch tree.type
        when "File", "Nomsu", "Block", "List", "FunctionCall", "Text"
            new_values, is_changed = {}, false
            for i,old_value in ipairs(tree.value)
                -- Literal string pieces (e.g. inside Text) are kept as they are
                new_value = type(old_value) != "string" and @tree_map(old_value, fn) or nil
                if new_value != nil and new_value != old_value
                    is_changed = true
                    new_values[i] = new_value
                else
                    new_values[i] = old_value
            if is_changed
                new_tree = getmetatable(tree)(tree.id, Tuple(new_values))
                -- TODO: Maybe generate new metadata?
                @tree_metadata[new_tree] = @tree_metadata[tree]
                return new_tree
        when "Dict"
            new_values, is_changed = {}, false
            for i,e in ipairs tree.value
                new_key = @tree_map(e.key, fn)
                new_value = @tree_map(e.value, fn)
                if (new_key != nil and new_key != e.key) or (new_value != nil and new_value != e.value)
                    is_changed = true
                    -- The entry constructor lives on Types; there is no bare
                    -- `DictEntry` in this scope
                    new_values[i] = Types.DictEntry(new_key, new_value)
                else
                    new_values[i] = e
            if is_changed
                new_tree = getmetatable(tree)(tree.id, Tuple(new_values))
                -- TODO: Maybe generate new metadata?
                @tree_metadata[new_tree] = @tree_metadata[tree]
                return new_tree
        when nil -- Raw table, probably from one of the .value of a multi-value tree (e.g. List)
            error("Invalid tree: #{repr tree}")
    return tree
tree_with_replaced_vars: (tree, replacements)=>
    -- Returns tree with each Var node swapped for replacements[<lua identifier of
    -- that var>] whenever such an entry exists (is not nil). Other nodes are left
    -- to tree_map's normal recursion.
    swap_var = (node)->
        if node.type != "Var" then return nil
        lua_name = @var_to_lua_identifier node.value
        return replacements[lua_name]
    return @tree_map tree, swap_var
tree_to_stub: cached (tree)=>
    -- Stub of a FunctionCall tree: its Word tokens joined by single spaces, with
    -- every other token shown as a bare "%". Raises if tree is not a FunctionCall.
    -- Wrapped in `cached`, so the result is memoized per tree.
    unless tree.type == "FunctionCall"
        error "Tried to get stub from non-functioncall tree: #{tree.type}", 0
    pieces = {}
    for token in *tree.value
        pieces[#pieces+1] = token.type == "Word" and token.value or "%"
    return concat(pieces, " ")
tree_to_named_stub: cached (tree)=>
    -- Like tree_to_stub, but each non-Word token is rendered as "%" followed by
    -- that token's value instead of a bare "%". Raises if tree is not a FunctionCall.
    -- Wrapped in `cached`, so the result is memoized per tree.
    unless tree.type == "FunctionCall"
        error "Tried to get stub from non-functioncall tree: #{tree.type}", 0
    pieces = {}
    for token in *tree.value
        pieces[#pieces+1] = token.type == "Word" and token.value or "%#{token.value}"
    return concat(pieces, " ")
-- Named sub-patterns made available to the `re` grammars compiled from stub_defs:
--   space:   zero or more of: a single space, or a newline followed by ".."
--   word:    one or more NOMSU_DEFS.ident_char, or one or more NOMSU_DEFS.operator
--   varname: zero or more ASCII letters/digits, underscores or NOMSU_DEFS.utf8_char
stub_defs = {
space:(P(' ') + P('\n..'))^0
word:(NOMSU_DEFS.ident_char^1 + NOMSU_DEFS.operator^1)
varname:(R('az','AZ','09') + P('_') + NOMSU_DEFS.utf8_char)^0
}
-- Substitution capture that rewrites an alias into its stub: leading and trailing
-- %space is removed, each %space run between tokens becomes a single ' ', and the
-- name after every '%' is dropped (leaving a bare '%'); words are kept as written.
stub_pattern = re.compile("{~ (%space->'') (('%' (%varname->'')) / %word)? ((%space->' ') (('%' (%varname->'')) / %word))* (%space->'') ~}", stub_defs)
get_stubs_from_signature: (signature)=>
    -- Converts a signature (a plain list of alias strings) into the list of stubs
    -- obtained by running each alias through stub_pattern.
    -- Raises (without position information, level 0) when signature is not a plain
    -- table, i.e. is not a table or has a .type field, when an entry is not a
    -- string, or when an alias fails to match stub_pattern.
    if type(signature) != 'table' or signature.type
        error("Invalid signature: #{repr signature}", 0)
    stubs = {}
    for i,alias in ipairs(signature)
        if type(alias) != 'string'
            error("Expected entries in signature to be strings, not #{type(alias)}s like: #{repr alias}\nsignature: #{repr signature}", 0)
        stubs[i] = stub_pattern\match(alias)
        unless stubs[i]
            -- Level 0 keeps this message consistent with the other signature errors
            -- here and in get_args_from_signature (no "file:line:" prefix).
            error("Failed to match stub pattern on alias: #{repr alias}", 0)
    return stubs
-- Table capture that collects, in order, the name following each '%' in an alias;
-- plain words are matched but not captured.
var_pattern = re.compile("{| %space ((('%' {%varname}) / %word) %space)+ |}", stub_defs)
get_args_from_signature: (signature)=>
    -- For each alias in signature, returns the list of its argument names converted
    -- to Lua identifiers with var_to_lua_identifier. The result is a list of lists,
    -- index-aligned with signature.
    -- Raises (level 0) if signature is not a plain table, if an entry is not a
    -- string, or if an alias does not match var_pattern.
    unless type(signature) == 'table' and not signature.type
        error("Invalid signature: #{repr signature}", 0)
    stub_args = {}
    for position, alias in ipairs(signature)
        unless type(alias) == 'string'
            error("Invalid type for signature: #{type(alias)} for:\n#{repr alias}", 0)
        names = var_pattern\match(alias)
        if not names
            error("Failed to match arg pattern on alias: #{repr alias}", 0)
        stub_args[position] = [@var_to_lua_identifier(name) for name in *names]
    return stub_args
var_to_lua_identifier: (var)=>
    -- Turns a nomsu variable name (or a Var node, whose .value is used) into a valid
    -- Lua identifier: the result always starts with "_", each underscore in the name
    -- is doubled, and every other non-alphanumeric byte becomes "_" followed by that
    -- byte's value in lowercase hexadecimal.
    name = var
    if Types.Var\is_instance(var)
        name = var.value
    escape_byte = (verboten)->
        return "__" if verboten == "_"
        return ("_%x")\format(verboten\byte!)
    -- gsub also returns a match count; only the rewritten string is kept
    escaped = name\gsub("%W", escape_byte)
    return "_"..escaped
2018-01-05 15:23:18 -08:00
2017-09-12 20:00:19 -07:00
initialize_core: =>
    -- Registers the built-in actions defined directly in this file:
    -- "immediately %block", "lua> %code", "=lua %code", "!! code location !!",
    -- "run file %filename" and "use %filename".
    -- NOTE(review): the handler parameter names (_block, _code, _filename) look like
    -- var_to_lua_identifier output for the variables in each signature; presumably
    -- the define_* methods rely on them, so they are kept verbatim -- TODO confirm.
    nomsu = self
    -- Source tag passed to each definition: the line in this function where
    -- get_line_no was called (debug level 2 is get_line_no's caller).
    get_line_no = -> "nomsu.moon:#{debug.getinfo(2).currentline}"

    -- Compiles the pieces of a text node into one chunk of Lua source: string pieces
    -- are used verbatim, interpolated trees contribute their compiled expression.
    nomsu_string_as_lua = (code)->
        pieces = {}
        for chunk in *code.value
            if type(chunk) == "string"
                insert pieces, chunk
                continue
            compiled = nomsu\tree_to_lua chunk
            if not compiled.expr
                line = @get_line_number(chunk)
                src = @get_source_code(chunk)
                error "#{line}: Cannot use #{colored.yellow src} as a string interpolation value, since it's not an expression.", 0
            insert pieces, compiled.expr
        return concat(pieces)

    -- Runs the block right away at compile time, and also emits it guarded by IMMEDIATE
    @define_compile_action "immediately %block", get_line_no!, (_block)->
        compiled = nomsu\tree_to_lua(_block)
        body = compiled.statements or (compiled.expr..";")
        if compiled.locals and #compiled.locals > 0
            local_names = concat(compiled.locals, ", ")
            body = "local #{local_names};\n#{body}"
        nomsu\run_lua(body)
        return statements:"if IMMEDIATE then\n#{body}\nend", locals:compiled.locals

    -- Inline Lua statements: text is spliced in directly, anything else is run via run_lua
    @define_compile_action "lua> %code", get_line_no!, (_code)->
        if _code.type != "Text"
            return statements:"nomsu:run_lua(#{nomsu\tree_to_lua(_code).expr});"
        return statements:nomsu_string_as_lua(_code)

    -- Inline Lua expression
    @define_compile_action "=lua %code", get_line_no!, (_code)->
        return expr:nomsu_string_as_lua(_code)

    -- Compiles to a string literal "filename:start,stop" taken from the metadata of
    -- the second-from-top entry of the compile stack
    @define_compile_action "!! code location !!", get_line_no!, ->
        stack = nomsu.compilestack
        metadata = @tree_metadata[stack[#stack-1]]
        return expr: repr("#{metadata.filename}:#{metadata.start},#{metadata.stop}")

    @define_action "run file %filename", get_line_no!, (_filename)->
        return nomsu\run_file(_filename)

    -- The file is loaded once at compile time, and the emitted code loads it again
    @define_compile_action "use %filename", get_line_no!, (_filename)->
        path = nomsu\tree_to_value(_filename)
        nomsu\use_file(path)
        return expr:"nomsu:use_file(#{repr path})"
2017-09-12 20:00:19 -07:00
-- Only run this code if this file was run directly with command line arguments, and not require()'d:
if arg and debug.getinfo(2).func != require
    export colors
    colors = require 'consolecolors'
    -- The command line arguments are joined with ";" and parsed by this grammar:
    -- any number of flags, then optionally an input ("-" is stdin) which may be
    -- followed by "-o" and an output.
    parser = re.compile([[
        args <- {| {:flags: flags? :} ({:input: input :} ";" ("-o;"{:output: output :} ";")?)? (";")? |} !.
        flags <- (({| ({flag} ";")* |}) -> set)
        flag <- "-c" / "-i" / "-p" / "-O" / "--help" / "-h" / "-v"
        input <- "-" / [^;]+
        output <- "-" / [^;]+
    ]], {:set})
    args = concat(arg, ";")..";"
    -- A failed parse yields an empty table, which falls into the usage message below
    args = parser\match(args) or {}
    if not args.flags or args.flags["--help"] or args.flags["-h"]
        print "Usage: lua nomsu.lua [-c] [-i] [-p] [-O] [--help] [input [-o output]]"
        os.exit!

    nomsu = NomsuCompiler()

    -- Does the work requested on the command line: runs/compiles the input (if any)
    -- and then starts the REPL when -i was given.
    run = ->
        if args.flags["-v"]
            nomsu.debug = true
        nomsu.skip_precompiled = not args.flags["-O"]
        if args.input
            -- Read a file or stdin and output either the printouts or the compiled lua
            if args.flags["-c"] and not args.output
                -- Only a trailing ".nom" counts as the extension. When there is none,
                -- append ".lua" instead: an output path equal to the input path would
                -- be truncated by io.open(..., 'w') below before the source is read.
                derived, swapped = args.input\gsub("%.nom$", ".lua")
                if swapped == 0 and args.input != "-"
                    derived = args.input..".lua"
                args.output = derived
            compiled_output, owns_output = nil, false
            if args.flags["-p"]
                -- Silence nomsu-level print so that only the compiled code reaches stdout
                nomsu.environment.print = ->
                compiled_output = io.output()
            elseif args.output
                -- Fail with the OS error message rather than a nil index later on
                compiled_output = assert(io.open(args.output, 'w'))
                owns_output = true
            -- Anchored so that only a real ".lua" suffix selects the precompiled path
            if args.input\match("%.lua$")
                retval = dofile(args.input)(nomsu, {})
            else
                local retval, code
                if args.input == '-'
                    retval, code = nomsu\run(io.read('*a'), 'stdin')
                else
                    retval, code = nomsu\run_file(args.input)
                if compiled_output
                    compiled_output\write("local IMMEDIATE = true;\n")
                    compiled_output\write(code)
            -- Close (and thereby flush) the file opened above; stdout is left alone
            if owns_output
                compiled_output\close!
            if args.flags["-p"]
                nomsu.environment.print = print
        if args.flags["-i"]
            -- REPL
            nomsu\run('use "core"', "stdin")
            while true
                io.write(colored.bright colored.yellow ">> ")
                buff = ""
                -- Accumulate lines until a blank line or end of input
                while true
                    line = io.read("*L")
                    if line == "\n" or not line
                        break
                    line = line\gsub("\t", " ")
                    buff ..= line
                    io.write(colored.dim colored.yellow ".. ")
                -- Submitting nothing at all ends the REPL
                if #buff == 0
                    break
                ok, ret = pcall(-> nomsu\run(buff, "stdin"))
                if ok and ret != nil
                    print "= "..repr(ret)
                elseif not ok
                    print colored.bright colored.red ret

    -- xpcall message handler: prints the error and a stack trace (annotated with
    -- nomsu action names and source locations where known), then exits with failure.
    err_hand = (error_message)->
        -- TODO: write properly to stderr
        print("#{colored.red "ERROR:"} #{colored.bright colored.yellow colored.onred (error_message or "")}")
        print("stack traceback:")
        -- TODO: properly print out the calling site of nomsu code, not just the *called* code
        ok, to_lua = pcall -> require('moonscript.base').to_lua
        if not ok then to_lua = -> nil
        -- Mapping compiled lines back to nomsu.moon is best-effort: nomsu.moon may not
        -- be readable from the working directory, and this handler must not itself fail.
        local nomsu_source, line_table
        if nomsu_file = io.open("nomsu.moon")
            nomsu_source = nomsu_file\read("*a")
            nomsu_file\close!
            _, line_table = to_lua(nomsu_source)
            -- On a compile failure the second return value is an error message, not a table
            if type(line_table) != "table" then line_table = nil
        level = 2
        while true
            calling_fn = debug.getinfo(level)
            if not calling_fn then break
            if calling_fn.func == run then break
            level += 1
            name = calling_fn.name
            if name == "run_lua_fn" then continue
            line = nil
            if metadata = nomsu.action_metadata[calling_fn.func]
                -- Nomsu action: show where it was defined and the start of its source text
                filename, start, stop = metadata.source\match("([^:]*):([0-9]*),([0-9]*)")
                source_file = filename and io.open(filename)
                if source_file
                    file = source_file\read("*a")
                    source_file\close!
                    line_no = 1
                    for _ in file\sub(1,tonumber(start))\gmatch("\n") do line_no += 1
                    offending_statement = file\sub(tonumber(start),tonumber(stop))
                    if #offending_statement > 50
                        offending_statement = offending_statement\sub(1,50).."..."
                    offending_statement = colored.red(offending_statement)
                    line = colored.yellow(filename..":"..tostring(line_no).."\n "..offending_statement)
                else
                    -- Unparseable source tag or unreadable file: show the raw tag
                    line = colored.yellow(metadata.source)
                name = colored.bright(colored.yellow(metadata.aliases[1]))
            else
                if calling_fn.istailcall and not name
                    name = "<tail call>"
                if calling_fn.short_src == "./nomsu.moon" and line_table
                    -- line_table maps a compiled line to a character offset in nomsu.moon
                    char = line_table[calling_fn.currentline]
                    line_num = 1
                    for _ in nomsu_source\sub(1,char)\gmatch("\n") do line_num += 1
                    line = colored.cyan("#{calling_fn.short_src}:#{line_num}")
                    name = colored.bright(colored.cyan(name or "???"))
                else
                    line = colored.blue("#{calling_fn.short_src}:#{calling_fn.currentline}")
                    name = colored.bright(colored.blue(name or "???"))
            _from = colored.dim colored.white "|"
            print(("%32s %s %s")\format(name, _from, line))
        os.exit(false, true)

    -- Note: xpcall has a slightly different API in Lua <=5.1 vs. >=5.2, but this works
    -- for both APIs
    xpcall(run, err_hand)
2017-09-12 20:00:19 -07:00
2017-09-13 16:22:04 -07:00
-- Module value: NomsuCompiler itself, so code that require()s this file can
-- instantiate its own compiler by calling it.
return NomsuCompiler