#!/usr/bin/env moon
-- This file contains the source code of the Nomsu compiler.
-- Nomsu is a programming language that cross-compiles to Lua. It was designed to be good
-- at natural-language-like code that is highly self-modifying and flexible.
-- The only dependency is LPEG, which can be installed using "luarocks install lpeg"
-- File usage:
--    Either, in a lua/moonscript file:
--        Nomsu = require "nomsu"
--        nomsu = Nomsu()
--        nomsu:run(your_nomsu_code)
--    Or from the command line:
--        lua nomsu.lua [input_file [output_file or -]]
lfs = require 'lfs'
re = require 're'
lpeg = require 'lpeg'
utils = require 'utils'
new_uuid = require 'uuid'
immutable = require 'immutable'
{:repr, :stringify, :min, :max, :equivalent, :set, :is_list, :sum} = utils

-- `colors` yields "" for every key, so colouring is a no-op until the table is
-- replaced with a real colour table.
colors = setmetatable({}, {__index:->""})
-- `colored.<name>` builds a function that wraps a message in colors[<name>] ... colors.reset.
-- A missing message is treated as the empty string.
colored = setmetatable({}, {
    __index: (_, color)->
        (msg)-> colors[color]..(msg or '')..colors.reset
})
{:insert, :remove, :concat} = table

-- Use + operator for string coercive concatenation (note: "asdf" + 3 == "asdf3")
-- Use [] for accessing string characters, or s[{3,4}] for s:sub(3,4)
-- Note: This globally affects all strings in this instance of Lua!
do
    string_mt = getmetatable("")
    -- "abc" + x  ==>  "abc"..stringify(x)
    string_mt.__add = (other)=> @ .. stringify(other)
    -- Numeric keys pick a single character, a {from, to} table picks a substring,
    -- and anything else falls through to the `string` library (so s\upper! etc. still work).
    string_mt.__index = (key)=>
        switch type(key)
            when 'number'
                return string.sub(@, key, key)
            when 'table'
                return string.sub(@, key[1], key[2])
            else
                return string[key]
    -- Can't use this because it breaks some LPEG stuff
    --string_mt.__mul = (other)=> string.rep(@, other)

-- TODO:
-- consider non-linear codegen, rather than doing thunks for things like comprehensions
-- improve indentation of generated lua code
-- better error reporting
-- type checking?
-- Add compiler options for optimization level (compile-fast vs. run-fast, etc.)
-- Do a pass on all actions to enforce parameters-are-nouns heuristic
-- Maybe do some sort of lazy definitions of actions that defer until they're used in code
-- Add a ((%x foo %y) where {x:"asdf", y:"fdsa"}) compile-time action for substitution

lpeg.setmaxstack 10000 -- whoa
{:P,:R,:V,:S,:Cg,:C,:Cp,:B,:Cmt} = lpeg

-- Immutable node types for the parse tree. Every node type has the fields
-- (id, value); DictEntry has (key, value) and Tuple is a plain immutable sequence.
Types = {}
type_tostring = =>
    "#{@name}(#{concat [repr(x) for x in *@], ", "})"
Tuple = immutable(nil, {name:"Tuple"})
for t in *{"File", "Nomsu", "Block", "List", "FunctionCall", "Text", "Dict", "Number", "Word", "Var", "Comment", "IndexChain"}
    Types[t] = immutable({"id","value"}, {type:t, name:t, __tostring:type_tostring})
Types.DictEntry = immutable({"key","value"}, {name:"DictEntry"})
-- Truthy (the node's type name) for userdata that carries a `type` field.
Types.is_node = (n)-> type(n) == 'userdata' and n.type

-- Definitions handed to re.compile() for the nomsu grammar. The parser state
-- (indent stack, source code, line starts, ...) is read from `lpeg.userdata`.
NOMSU_DEFS = with {}
    .Tuple = (values)->
        return Tuple(table.unpack(values))
    .DictEntry = (k,v) -> Types.DictEntry(k,v)
    -- Newline supports either windows-style CR+LF or unix-style LF
    .nl = P("\r")^-1 * P("\n")
    .ws = S(" \t")
    .tonumber = tonumber
    -- Debugging aid: prints `msg`, the position, and the source around it; always matches.
    .print = (src,pos,msg)->
        print(msg, pos, repr(src\sub(math.max(0,pos-16),math.max(0,pos-1)).."|"..src\sub(pos,pos+16)))
        return true
    string_escapes = n:"\n", t:"\t", b:"\b", a:"\a", v:"\v", f:"\f", r:"\r"
    digit, hex = R('09'), R('09','af','AF')
    .escaped_char = (P("\\")*S("xX")*C(hex*hex)) / => string.char(tonumber(@, 16))
    .escaped_char += (P("\\")*C(digit*(digit^-2))) / => string.char(tonumber @)
    .escaped_char += (P("\\")*C(S("ntbavfr"))) / string_escapes
    .operator_char = S("'~`!@$^&*-+=|<>?/")
    .operator = .operator_char^1
    .utf8_char = (
        R("\194\223")*R("\128\191") +
        R("\224\239")*R("\128\191")*R("\128\191") +
        R("\240\244")*R("\128\191")*R("\128\191")*R("\128\191"))
    .ident_char = R("az","AZ","09") + P("_") + .utf8_char

    -- If the line begins with #indent+4 spaces, the pattern matches *those* spaces
    -- and adds them to the stack (not any more).
    .indent = P (start)=>
        nodent = lpeg.userdata.indent_stack[#lpeg.userdata.indent_stack]
        -- One indentation level is four spaces; this has to agree with the
        -- `#nodent-4` test in .dedent below.
        indented = nodent.."    "
        if @sub(start, start+#indented-1) == indented
            insert(lpeg.userdata.indent_stack, indented)
            return start + #indented
    -- If the number of leading space characters is <= the number of space on the top of the
    -- stack minus 4, this pattern matches and pops off the top of the stack exactly once.
    .dedent = P (start)=>
        nodent = lpeg.userdata.indent_stack[#lpeg.userdata.indent_stack]
        spaces = @match("[ ]*", start)
        if #spaces <= #nodent-4
            remove(lpeg.userdata.indent_stack)
            return start
    -- If the number of leading space characters is >= the number on the top of the
    -- stack, this pattern matches and does not modify the stack.
    .nodent = P (start)=>
        nodent = lpeg.userdata.indent_stack[#lpeg.userdata.indent_stack]
        if @sub(start, start+#nodent-1) == nodent
            return start + #nodent

    -- Raises a parse error that quotes the offending line (with its neighbours)
    -- and points at the failing column.
    .error = (src,pos,err_msg)->
        -- If the failure is at a line break, report the next non-whitespace position instead
        if lpeg.userdata.source_code\sub(pos,pos)\match("[\r\n]")
            pos += #lpeg.userdata.source_code\match("[ \t\n\r]*", pos)
        line_no = 1
        -- `<=` so that a position on the very first character of a line is
        -- attributed to that line rather than to the previous one.
        while (lpeg.userdata.line_starts[line_no+1] or math.huge) <= pos do line_no += 1
        prev_line = if line_no > 1
            lpeg.userdata.source_code\match("[^\r\n]*", lpeg.userdata.line_starts[line_no-1])
        else ""
        err_line = lpeg.userdata.source_code\match("[^\r\n]*", lpeg.userdata.line_starts[line_no])
        next_line = if line_no < #lpeg.userdata.line_starts
            lpeg.userdata.source_code\match("[^\r\n]*", lpeg.userdata.line_starts[line_no+1])
        else ""
        pointer = ("-")\rep(pos-lpeg.userdata.line_starts[line_no]) .. "^"
        err_msg = (err_msg or "Parse error").." in #{lpeg.userdata.filename} on line #{line_no}:\n"
        err_msg ..="\n#{prev_line}\n#{err_line}\n#{pointer}\n#{next_line}\n"
        error(err_msg)

node_id = 0
-- Any name the grammar asks for that is not defined above is treated as a node
-- constructor: (start, value, stop) -> Types[name](id, value). The constructor is
-- cached on NOMSU_DEFS, and the node's source span is recorded in
-- lpeg.userdata.tree_metadata.
setmetatable(NOMSU_DEFS, {__index:(key)=>
    make_node = (start, value, stop)->
        node_id = node_id + 1
        if type(value) == 'table' then error("Not a tuple: #{repr value}")-- = Tuple(value)
        node = Types[key](node_id, value)
        lpeg.userdata.tree_metadata[node] = {
            :start,:stop,filename:lpeg.userdata.filename,source_code:lpeg.userdata.source_code
        }
        return node
    self[key] = make_node
    return make_node
})

NOMSU = do
    -- Just for cleanliness, I put the language spec in its own file using a slightly modified
    -- version of the lpeg.re syntax.
    peg_tidier = re.compile [[
    file <- {~ %nl* (def/comment) (%nl+ (def/comment))* %nl* ~}
    def <- anon_def / captured_def
    anon_def <- ({ident} (" "*) ":"
        {((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- %2"
    captured_def <- ({ident} (" "*) "(" {ident} ")" (" "*) ":"
        {((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- ({} %3 {}) -> %2"
    ident <- [a-zA-Z_][a-zA-Z0-9_]*
    comment <- "--" [^%nl]*
    ]]
    -- Fail with a readable message if the grammar file is missing, and do not
    -- leak the file handle.
    peg_file = assert(io.open("nomsu.peg"), "Could not open grammar file: nomsu.peg")
    peg_source = peg_file\read("*a")
    peg_file\close!
    nomsu_peg = peg_tidier\match(peg_source)
    re.compile(nomsu_peg, NOMSU_DEFS)

class NomsuCompiler
    -- Sets up per-compiler state (id table, metadata tables, the sandbox
    -- environment that generated Lua runs in) and then installs the core actions.
    new:()=>
        -- Weak-key mapping from objects to randomly generated unique IDs
        NaN_surrogate = {}
        nil_surrogate = {}
        @ids = setmetatable({}, {
            __mode: "k"
            __index: (key)=>
                -- nil and NaN cannot be table keys, so stand-in objects are used for them
                if key == nil then return @[nil_surrogate]
                elseif key != key then return @[NaN_surrogate]
                id = new_uuid!
                @[key] = id
                return id
        })
        @use_stack = {}
        @compilestack = {}
        @file_metadata = setmetatable({}, {__mode:"k"})
        @tree_metadata = setmetatable({}, {__mode:"k"})
        @action_metadata = setmetatable({}, {__mode:"k"})
        @debug = false

        @environment = {
            -- Discretionary/convenience stuff
            nomsu:self, repr:repr, stringify:stringify, utils:utils, lpeg:lpeg, re:re,
            -- Lua stuff:
            :next, :unpack, :setmetatable, :coroutine, :rawequal, :getmetatable, :pcall,
            :error, :package, :os, :require, :tonumber, :tostring, :string, :xpcall, :module,
            :print, :loadfile, :rawset, :_VERSION, :collectgarbage, :rawget, :bit32, :rawlen,
            :table, :assert, :dofile, :loadstring, :type, :select, :debug, :math, :io, :pairs,
            :load, :ipairs,
        }
        for k,v in pairs(Types) do @environment[k] = v
        @environment.Tuple = Tuple
        -- Looking up an action that was never defined is an error, not a nil
        @environment.ACTIONS = setmetatable({}, {__index:(key)=>
            error("Attempt to run undefined action: #{key}", 0)
        })
        @environment.LOADED = {}
        @environment.Types = Types
        @initialize_core!

    -- Registers `fn` under every alias in `signature` (a string or a list of strings).
    -- `source` is stored verbatim in the action's metadata. For non-vararg functions
    -- the stub's argument names are matched against the function's parameter names,
    -- so each alias may list its arguments in a different order.
    define_action: (signature, source, fn)=>
        if @debug
            print "#{colored.bright "DEFINING ACTION:"} #{colored.green repr(signature)}"
        if type(fn) != 'function'
            -- error(message, level): the message comes first
            error("Bad fn: #{repr fn}", 0)
        if type(signature) == 'string'
            signature = {signature}
        elseif type(signature) != 'table' or signature.type != nil
            error("Invalid signature, expected list of strings, but got: #{repr signature}", 0)
        stubs = @get_stubs_from_signature signature
        stub_args = @get_args_from_signature signature

        fn_info = debug.getinfo(fn, "u")
        local fn_arg_positions, arg_orders
        unless fn_info.isvararg
            -- Map from parameter name -> position in fn's parameter list
            fn_arg_positions = {debug.getlocal(fn, i), i for i=1,fn_info.nparams}
            arg_orders = {} -- Map from stub -> index where each arg in the stub goes in the function call
        for sig_i=1,#stubs
            stub, args = stubs[sig_i], stub_args[sig_i]
            if @debug
                print "#{colored.bright "ALIAS:"} #{colored.underscore colored.magenta repr(stub)} #{colored.bright "WITH ARGS"} #{colored.dim repr(args)} ON: #{@environment.ACTIONS}"
            @environment.ACTIONS[stub] = fn
            unless fn_info.isvararg
                arg_positions = [fn_arg_positions[a] for a in *args]
                -- TODO: better error checking?
                if #arg_positions != #args
                    error("Mismatch in args between lua function's #{repr fn_arg_positions} and stub's #{repr args} for #{repr stub}", 0)
                arg_orders[stub] = arg_positions

        @action_metadata[fn] = {
            :fn, :source, aliases:stubs, :arg_orders,
            arg_positions:fn_arg_positions, def_number:@@def_number,
        }

    -- Same as define_action, but marks the action as a compile-time action.
    -- (`src` is accepted but not used.)
    define_compile_action: (signature, source, fn, src)=>
        @define_action(signature, source, fn)
        @action_metadata[fn].compile_time = true

    serialize_defs: (scope=nil, after=nil)=>
        -- TODO: repair
        error("Not currently functional.", 0)

    -- Strips the common leading indentation from every line after the first.
    -- Lines that are blank or start with "#" are ignored when measuring; lines that
    -- start with ".." are measured separately from ordinary lines.
    -- TODO: figure out whether indent/dedent should affect first line
    dedent: (code)=>
        unless code\find("\n")
            return code
        spaces, indent_spaces = math.huge, math.huge
        for line in code\gmatch("\n([^\n]*)")
            if line\match("^%s*#.*") or line\match("^%s*$")
                continue -- skip comments and blank lines
            elseif s = line\match("^(%s*)%.%..*")
                spaces = math.min(spaces, #s)
            elseif s = line\match("^(%s*)%S.*")
                indent_spaces = math.min(indent_spaces, #s)
        if spaces != math.huge and spaces < indent_spaces
            return (code\gsub("\n"..(" ")\rep(spaces), "\n"))
        elseif indent_spaces != math.huge
            return (code\gsub("\n"..(" ")\rep(indent_spaces), "\n "))
        else return code

    -- Inserts `levels` repetitions of the indent string after every newline.
    -- NOTE: this returns gsub's two results (string, count).
    indent: (code, levels=1)=>
        return code\gsub("\n","\n"..(" ")\rep(levels))

    -- Returns "filename:line" for the first line of `tree`, or "" when the tree has
    -- no recorded metadata. Raises if the tree's file was never registered by parse().
    get_line_number: (tree)=>
        metadata = @tree_metadata[tree]
        unless metadata
            return ""
        unless @file_metadata[metadata.filename]
            error "Failed to find file metatdata for file: #{metadata.filename}", 0
        line_starts = @file_metadata[metadata.filename].line_starts
        first_line = 1
        -- `<=`: a tree whose first character is the first character of a line
        -- belongs to that line, not the one before it.
        while first_line < #line_starts and line_starts[first_line+1] <= metadata.start
            first_line += 1
        -- metadata.stop is exclusive, so `<` is correct here. last_line is only
        -- needed by the range-style return that is commented out below.
        last_line = first_line
        while last_line < #line_starts and line_starts[last_line+1] < metadata.stop
            last_line += 1
        --return first_line == last_line and "#{metadata.filename}:#{first_line}" or "#{metadata.filename}:#{first_line}-#{last_line}"
        return "#{metadata.filename}:#{first_line}"
-- NomsuCompiler methods: source lookup, parsing, and running code/files.
    -- Return the (dedented) source code of a tree, or construct some if the tree was
    -- dynamically generated (i.e. has no recorded metadata).
    get_source_code: (tree)=>
        metadata = @tree_metadata[tree]
        unless metadata
            return @tree_to_nomsu(tree)
        return @dedent metadata.source_code\sub(metadata.start, metadata.stop-1)

    -- Captures a table with the start position of every line in the subject.
    line_counter = re.compile([[
        lines <- {| line (%nl line)* |}
        line <- {} (!%nl .)*
    ]], nl:NOMSU_DEFS.nl)

    -- Parses `nomsu_code` and returns its tree. `filename` (a string) is used
    -- for error messages and for the per-file line-start table.
    parse: (nomsu_code, filename)=>
        assert type(filename) == "string", "Bad filename type: #{type filename}"
        if @debug
            print "#{colored.bright "PARSING:"}\n#{colored.yellow nomsu_code}"

        -- The same filename can be parsed with different contents (e.g. "stdin" in
        -- the REPL), so refresh the cached line starts whenever the source changed.
        file_info = @file_metadata[filename]
        unless file_info and file_info.source_code == nomsu_code
            file_info = {
                source_code:nomsu_code, :filename, line_starts:line_counter\match(nomsu_code)
            }
            @file_metadata[filename] = file_info
        userdata = {
            source_code:nomsu_code, :filename, indent_stack: {""}, tree_metadata:@tree_metadata,
            line_starts:file_info.line_starts,
        }

        -- The grammar callbacks read their state from lpeg.userdata
        old_userdata, lpeg.userdata = lpeg.userdata, userdata
        tree = NOMSU\match(nomsu_code)
        lpeg.userdata = old_userdata

        assert tree, "In file #{colored.blue filename} failed to parse:\n#{colored.onyellow colored.black nomsu_code}"
        if @debug
            print "PARSE TREE:"
            @print_tree tree, " "
        return tree

    -- Compiles `src` to Lua and runs it. Returns the run's result and the generated
    -- Lua code. If `max_operations` is given, execution is aborted with an error once
    -- that many VM instructions have run. If `output_file` is given, the Lua code is
    -- also written to it.
    run: (src, filename, max_operations=nil, output_file=nil)=>
        if src == "" then return nil, ""
        if max_operations
            timeout = ->
                debug.sethook!
                error("Execution quota exceeded. Your code took too long.", 0)
            debug.sethook timeout, "", max_operations
        tree = @parse(src, filename)
        assert tree, "Failed to parse: #{src}"
        assert tree.type == "File", "Attempt to run non-file: #{tree.type}"

        lua = @tree_to_lua(tree)
        lua_code = lua.statements or (lua.expr..";")
        -- The locals live on the compiled `lua` table, not on the code string
        if lua.locals and #lua.locals > 0
            lua_code = "local "..concat(lua.locals, ", ")..";\n"..lua_code
        lua_code = "-- File: #{filename}\n"..lua_code
        ret = @run_lua(lua_code)
        if max_operations
            debug.sethook!
        if output_file
            output_file\write(lua_code)
        return ret, lua_code

    -- Runs a .lua file, a .nom file, or every .nom file directly inside a directory.
    -- For a .nom file, a precompiled .lua sibling is preferred unless
    -- @skip_precompiled is set.
    run_file: (filename)=>
        file_attributes = assert(lfs.attributes(filename), "File not found: #{filename}")
        if file_attributes.mode == "directory"
            for short_filename in lfs.dir(filename)
                full_filename = filename..'/'..short_filename
                attr = lfs.attributes(full_filename)
                -- attr can be nil (e.g. a dangling symlink); only real "*.nom" files are run
                if attr and attr.mode != "directory" and short_filename\match("%.nom$")
                    @run_file full_filename
            return

        -- Extensions are anchored to the end of the name so that e.g. "x.lua.nom"
        -- or "foo.nom~" are not misclassified.
        if filename\match("%.lua$")
            file = assert(io.open(filename))
            contents = file\read("*a")
            file\close!
            return assert(load(contents, nil, nil, @environment))!

        if filename\match("%.nom$")
            if not @skip_precompiled -- Look for precompiled version
                precompiled = io.open((filename\gsub("%.nom$", ".lua")), "r")
                if precompiled
                    lua_code = precompiled\read("*a")
                    precompiled\close!
                    return @run_lua(lua_code)
            file = io.open(filename)
            if not file
                error("File does not exist: #{filename}", 0)
            nomsu_code = file\read('*a')
            file\close!
            return @run(nomsu_code, filename)
        else
            error("Invalid filetype for #{filename}", 0)

    -- Runs `filename` at most once and returns its (cached) result, or true if the
    -- file returned nothing. Raises on circular imports.
    use_file: (filename)=>
        loaded = @environment.LOADED
        if not loaded[filename]
            for i,f in ipairs @use_stack
                if f == filename
                    loop = [@use_stack[j] for j=i,#@use_stack]
                    insert loop, filename
                    error("Circular import, this loops forever: #{concat loop, " -> "}")
            insert @use_stack, filename
            result = @run_file(filename)
            -- This file is done loading, so it is no longer part of the import chain.
            -- (If run_file raised, the error propagates and the entry is left in place.)
            remove @use_stack
            loaded[filename] = result or true
        return loaded[filename]

    -- Loads `lua_code` in the compiler's environment and runs it, returning whatever
    -- the chunk returns. A compile failure raises an error that shows the code with
    -- line numbers.
    run_lua: (lua_code)=>
        run_lua_fn, err = load(lua_code, nil, nil, @environment)
        if @debug
            print "#{colored.bright "RUNNING LUA:"}\n#{colored.blue colored.bright(lua_code)}"
        if not run_lua_fn
            n = 1
            fn = ->
                n = n + 1
                ("\n%-3d|")\format(n)
            -- Line 1 gets the same "%-3d|" gutter as every following line
            code = ("%-3d|")\format(1)..lua_code\gsub("\n", fn)
            error("Failed to compile generated code:\n#{colored.bright colored.blue colored.onblack code}\n\n#{err}", 0)
        return run_lua_fn!
tree_to_value: (tree, filename)=> -- Special case for text literals if tree.type == 'Text' and #tree.value == 1 and type(tree.value[1]) == 'string' return tree.value[1] code = "return #{@tree_to_lua(tree).expr};" if @debug print "#{colored.bright "RUNNING LUA TO GET VALUE:"}\n#{colored.blue colored.bright(code)}" lua_thunk, err = load(code, nil, nil, @environment) if not lua_thunk error("Failed to compile generated code:\n#{colored.bright colored.blue colored.onblack code}\n\n#{colored.red err}", 0) return lua_thunk! tree_to_nomsu: (tree, indentation="", max_line=80, expr_type=nil)=> -- Convert a tree into nomsu code that satisfies the max line requirement or nil -- if that's not possible -- expr_type is either: -- nil for code that goes at the top level and can contain anything -- "noeol" for code that can contain anything except an end-of-line component -- like a colon (i.e. it already occurs after a colon on the same line) -- "inline" for code that cannot contain indented code or an end-of-line component -- e.g. code that is meant to go inside parentheses assert tree, "No tree provided to tree_to_nomsu." 
assert Types.is_node(tree), "Invalid tree: #{repr(tree)}" join_lines = (lines)-> for line in *lines if #indentation + #line > max_line return nil return concat(lines, "\n"..indentation) is_operator = (tok)-> tok and tok.type == "Word" and NOMSU_DEFS.operator\match(tok.value) local inline_expression, noeol_expression, expression inline_expression = (tok)-> switch tok.type when "Block" if #tok.value > 1 then return nil nomsu = inline_expression tok.value return nomsu and "(: #{nomsu})" when "FunctionCall" buff = "" for i,bit in ipairs tok.value if bit.type == "Word" if i == 1 or (is_operator(bit) and is_operator(tok.value[i-1])) buff ..= bit.value else buff ..= " "..bit.value else nomsu = inline_expression bit return nil unless nomsu unless i == 1 or bit.type == "Block" buff ..= " " buff ..= if bit.type == "FunctionCall" "("..nomsu..")" else nomsu return buff when "IndexChain" bits = {} for bit in *tok.value nomsu = inline_expression bit return nil unless nomsu insert bits, nomsu return concat(bits, ".") when "List" bits = {} for bit in *tok.value nomsu = inline_expression bit return nil unless nomsu insert bits, nomsu return "["..concat(bits, ", ").."]" when "Dict" bits = {} for bit in *tok.value key_nomsu = if bit.key.type == "Word" bit.key.value else inline_expression bit.key return nil unless key_nomsu if bit.key.type == "FunctionCall" key_nomsu = "("..key_nomsu..")" value_nomsu = inline_expression bit.value return nil unless value_nomsu insert bits, key_nomsu.."="..value_nomsu return "{"..concat(bits, ", ").."}" when "Text" buff = '"' for bit in *tok.value if type(bit) == 'string' -- Force indented text return nil if bit\find("\n") buff ..= bit\gsub("\\","\\\\")\gsub("\n","\\n") else nomsu = inline_expression(bit) return nil unless nomsu buff ..= if bit.type == "Var" or bit.type == "List" or bit.type == "Dict" "\\"..nomsu else "\\("..nomsu..")" if #buff > max_line then return nil return buff..'"' when "Nomsu" nomsu = inline_expression(tok.value) return nil if 
not nomsu return "\\("..nomsu..")" when "Number" then tostring(tok.value) when "Var" then "%"..tok.value else return nil noeol_expression = (tok)-> nomsu = inline_expression(tok) if nomsu and #nomsu < max_line return nomsu switch tok.type when "Block" buff = ":" for line in *tok.value nomsu = expression(line) return nil unless nomsu buff ..= "\n "..@indent(nomsu) return buff when "FunctionCall" nomsu = expression(tok) return nil unless nomsu return "(..)\n "..@indent(nomsu) when "IndexChain" return nil when "List" buff = "[..]" line = "\n " for bit in *tok.value nomsu = inline_expression bit if line != "\n " and #line + #", " + #nomsu > max_line buff ..= line line = "\n " sep = line == "\n " and "" or ", " if nomsu line ..= sep..nomsu if #line >= max_line buff ..= line line = "\n " else line ..= sep..expression(bit) buff ..= line line = "\n " if line ~= "\n " buff ..= line return buff when "Dict" buff = "{..}" line = "\n " for bit in *tok.value key_nomsu = inline_expression bit.key return nil unless key_nomsu if bit.key.type == "FunctionCall" key_nomsu = "("..key_nomsu..")" value_nomsu = inline_expression bit.value if value_nomsu and #key_nomsu + #value_nomsu < max_line line ..= key_nomsu.."="..value_nomsu.."," if #line >= max_line buff ..= line line = "\n " else line ..= key_nomsu.."="..expression(bit.value) buff ..= line line = "\n " if line ~= "\n " buff ..= line return buff when "Text" buff = '".."\n ' for bit in *tok.value if type(bit) == 'string' buff ..= bit\gsub("\\","\\\\")\gsub("\n","\n ") else nomsu = inline_expression(bit) return nil unless nomsu buff ..= if bit.type == "Var" or bit.type == "List" or bit.type == "Dict" or bit.type == "IndexChain" "\\"..nomsu else "\\("..nomsu..")" return buff when "Nomsu" nomsu = expression(tok.value) return nil if not nomsu return "\\(..)\n "..@indent(nomsu) when "Comment" if tok.value\find("\n") return "#.."..tok.value\gsub("\n","\n ") else return "#"..tok.value else return inline_expression(tok) expression = (tok)-> 
nomsu = inline_expression(tok) if nomsu and #nomsu < max_line return nomsu switch tok.type when "Block" if #tok.value == 1 nomsu = if tok.value[1].type == "FunctionCall" inline_expression(tok.value[1]) else noeol_expression(tok.value[1]) if nomsu and #(nomsu\match("[^\n]*")) < max_line return ": "..nomsu return noeol_expression(tok) when "FunctionCall" -- The hard task buff = "" for i,bit in ipairs tok.value if bit.type == "Word" if i == 1 or (is_operator(bit) and is_operator(tok.value[i-1])) or buff\sub(-2,-1) == ".." buff ..= bit.value else buff ..= " "..bit.value else nomsu = inline_expression(bit) if nomsu and #nomsu < max_line if bit.type == "FunctionCall" nomsu = "("..nomsu..")" else nomsu = expression(bit) return nil unless nomsu if bit.type == "FunctionCall" nomsu = "(..)\n "..@indent(nomsu) if i < #tok.value nomsu ..= "\n.." unless i == 1 or bit.type == "Block" buff ..= " " buff ..= nomsu return buff when "File" lines = {} for line in *tree.value nomsu = expression(line) unless nomsu src = @get_source_code line error "Failed to produce output for:\n#{colored.yellow src}", 0 insert lines, nomsu return concat lines, "\n" when "Comment" if tok.value\find("\n") return "#.."..tok.value\gsub("\n","\n ") else return "#"..tok.value else return noeol_expression(tok) return expression(tree) value_to_nomsu: (value)=> switch type(value) when "nil" return "(nil)" when "bool" return value and "(yes)" or "(no)" when "number" -- TODO: support NaN, inf, etc.? 
return repr(value) when "table" if is_list(value) return "[#{concat [@value_to_nomsu(v) for v in *value], ", "}]" else return "{#{concat ["#{@value_to_nomsu(k)}:#{@value_to_nomsu(v)}" for k,v in pairs(value)], ", "}}" when "string" if value == "\n" return "'\\n'" elseif not value\find[["]] and not value\find"\n" and not value\find"\\" return "\""..value.."\"" else -- TODO: This might fail if it's being put inside a list or something return '".."\n '..(@indent value) else error("Unsupported value_to_nomsu type: #{type(value)}", 0) @math_patt: re.compile [[ "%" (" " [*/^+-] " %")+ ]] tree_to_lua: (tree)=> -- Return , assert tree, "No tree provided." if not Types.is_node(tree) error("Invalid tree: #{repr(tree)}", 0) switch tree.type when "File" if #tree.value == 1 return @tree_to_lua(tree.value[1]) declared_locals = {} lua_bits = {} line_no = 1 for line in *tree.value lua = @tree_to_lua line if not lua error("No lua produced by #{repr line}", 0) if lua.locals new_locals = [l for l in *lua.locals when not declared_locals[l]] if #new_locals > 0 insert lua_bits, "local #{concat new_locals, ", "};" for l in *new_locals do declared_locals[l] = true if lua.statements then insert lua_bits, lua.statements elseif lua.expr then insert lua_bits, "#{lua.expr};" return statements:concat(lua_bits, "\n") when "Comment" return statements:"--"..tree.value\gsub("\n","\n--") when "Nomsu" --return expr:"nomsu:parse(#{repr @get_source_code(tree.value)}, #{repr @get_line_number(tree.value)}).value[1]" return expr:repr(tree.value) when "Block" lua_bits = {} locals = {} for arg in *tree.value lua = @tree_to_lua arg if #tree.value == 1 and lua.expr and not lua.statements return {expr:lua.expr, locals:lua.locals} if lua.locals for l in *lua.locals do table.insert(locals, l) if lua.statements then insert lua_bits, lua.statements elseif lua.expr then insert lua_bits, "#{lua.expr};" utils.deduplicate(locals) return statements:concat(lua_bits, "\n"), locals:(#locals > 0 and locals or nil) when 
"FunctionCall" insert @compilestack, tree stub = @tree_to_stub tree ok, fn = pcall(-> @environment.ACTIONS[stub]) if not ok then fn = nil metadata = @action_metadata[fn] if metadata and metadata.compile_time args = [arg for arg in *tree.value when arg.type != "Word"] if metadata and metadata.arg_orders new_args = [args[p] for p in *metadata.arg_orders[stub]] args = new_args if @debug print "#{colored.bright "RUNNING MACRO"} #{colored.underscore colored.magenta(stub)} " print "#{colored.bright "WITH ARGS:"} #{colored.dim concat([(repr a)\sub(1,100) for a in *args], ", ")}" lua = fn(unpack(args)) remove @compilestack return lua elseif not metadata and @@math_patt\match(stub) -- This is a bit of a hack, but this code handles arbitrarily complex -- math expressions like 2*x + 3^2 without having to define a single -- action for every possibility. bits = {} for tok in *tree.value if tok.type == "Word" insert bits, tok.value else lua = @tree_to_lua(tok) unless lua.expr src = @get_source_code(tok) error("non-expression value inside math expression: #{colored.yellow src}") insert bits, lua.expr remove @compilestack return expr:"(#{concat bits, " "})" args = {} for tok in *tree.value if tok.type == "Word" then continue lua = @tree_to_lua(tok) unless lua.expr line = @get_line_number(tok) src = @get_source_code(tok) error "#{line}: Cannot use:\n#{colored.yellow src}\nas an argument to #{stub}, since it's not an expression, it produces: #{repr lua}", 0 insert args, lua.expr if metadata and metadata.arg_orders new_args = [args[p] for p in *metadata.arg_orders[stub]] args = new_args remove @compilestack return expr:@@comma_separated_items("ACTIONS[#{repr stub}](", args, ")") when "Text" concat_parts = {} string_buffer = "" for bit in *tree.value if type(bit) == "string" string_buffer ..= bit continue if string_buffer ~= "" insert concat_parts, repr(string_buffer) string_buffer = "" lua = @tree_to_lua bit if @debug print(colored.bright "INTERP:") @print_tree bit print 
"#{colored.bright "EXPR:"} #{lua.expr}, #{colored.bright "STATEMENT:"} #{lua.statements}" unless lua.expr line = @get_line_number(bit) src = @get_source_code(bit) error "#{line}: Cannot use #{colored.yellow bit} as a string interpolation value, since it's not an expression.", 0 insert concat_parts, "stringify(#{lua.expr})" if string_buffer ~= "" insert concat_parts, repr(string_buffer) if #concat_parts == 0 return expr:"''" elseif #concat_parts == 1 return expr:concat_parts[1] else return expr:"(#{concat(concat_parts, "..")})" when "IndexChain" items = {} for i, item in ipairs(tree.value) lua = @tree_to_lua item unless lua.expr line = @get_line_number(item) src = @get_source_code(item) error "#{line}: Cannot index #{colored.yellow src}, since it's not an expression.", 0 -- TODO: improve generated code by removing parens and square brackets when possible if i == 1 insert items, "(#{lua.expr})" else insert items, "[ #{lua.expr}]" return expr:concat(items,"") when "List" items = {} for item in *tree.value lua = @tree_to_lua item unless lua.expr line = @get_line_number(item) src = @get_source_code(item) error "#{line}: Cannot use #{colored.yellow src} as a list item, since it's not an expression.", 0 insert items, lua.expr return expr:@@comma_separated_items("{", items, "}") when "Dict" items = {} for entry in *tree.value key_lua = if entry.key.type == "Word" {expr:repr(entry.key.value)} else @tree_to_lua entry.key unless key_lua.expr line = @get_line_number(entry.key) src = @get_source_code(entry.key) error "#{line}: Cannot use #{colored.yellow src} as a dict key, since it's not an expression.", 0 value_lua = @tree_to_lua entry.value unless value_lua.expr line = @get_line_number(entry.value) src = @get_source_code(entry.value) error "#{line}: Cannot use #{colored.yellow src} as a dict value, since it's not an expression.", 0 key_str = key_lua.expr\match([=[["']([a-zA-Z_][a-zA-Z0-9_]*)['"]]=]) if key_str insert items, "#{key_str}=#{value_lua.expr}" elseif 
key_lua.expr\sub(1,1) == "[" insert items, "[ #{key_lua.expr}]=#{value_lua.expr}" else insert items, "[#{key_lua.expr}]=#{value_lua.expr}" return expr:@@comma_separated_items("{", items, "}") when "Number" return expr:repr(tree.value) when "Var" return expr:@var_to_lua_identifier(tree.value) else error("Unknown/unimplemented thingy: #{tree.type}", 0) walk_tree: (tree, depth=0)=> coroutine.yield(tree, depth) return unless Types.is_node(tree) switch tree.type when "List", "File", "Block", "FunctionCall", "Text", "IndexChain" for v in *tree.value @walk_tree(v, depth+1) when "Dict" for e in *tree.value @walk_tree(e.key, depth+1) @walk_tree(e.value, depth+1) else @walk_tree(tree.value, depth+1) return nil print_tree: (tree)=> io.write(colors.bright..colors.green) for node,depth in coroutine.wrap(-> @walk_tree tree) if Types.is_node(node) print("#{(" ")\rep(depth)}#{node.type}:") else print((" ")\rep(depth)..repr(node)) io.write(colors.reset) tree_to_str: (tree)=> bits = {} for node,depth in coroutine.wrap(-> @walk_tree tree) if Types.is_node(node) insert bits, ("#{(" ")\rep(depth)}#{node.type}:") else insert bits, ((" ")\rep(depth)..repr(node)) return concat(bits, "\n") @unescape_string: (str)=> Cs(((P("\\\\")/"\\") + (P("\\\"")/'"') + NOMSU_DEFS.escaped_char + P(1))^0)\match(str) @comma_separated_items: (open, items, close)=> bits = {open} so_far = 0 for i,item in ipairs(items) if i < #items then item ..= ", " insert bits, item so_far += #item if so_far >= 80 insert bits, "\n" so_far = 0 insert bits, close return concat(bits) tree_map: (tree, fn)=> -- Return a new tree with fn mapped to each node. If fn provides a replacement, -- use that and stop recursing, otherwise recurse. 
-- (Continuation of a tree-walking method whose header precedes this chunk; it calls
-- itself as @tree_map(subtree, fn), so it is presumably `tree_map: (tree, fn)=>`.)
        -- Non-node values are passed through untouched.
        unless Types.is_node(tree) then return tree
        -- If fn provides a non-nil replacement for this node, use it and don't recurse.
        replacement = fn(tree)
        if replacement != nil
            return replacement
        switch tree.type
            when "File", "Nomsu", "Block", "List", "FunctionCall", "Text", "IndexChain"
                -- Multi-value nodes: map every non-string child, and only rebuild the
                -- node if at least one child actually changed.
                new_values, is_changed = {}, false
                for i,old_value in ipairs(tree.value)
                    new_value = type(old_value) != "string" and @tree_map(old_value, fn) or nil
                    if new_value != nil and new_value != old_value
                        is_changed = true
                        new_values[i] = new_value
                    else
                        new_values[i] = old_value
                if is_changed
                    new_tree = getmetatable(tree)(tree.id, Tuple(table.unpack(new_values)))
                    return new_tree

            when "Dict"
                -- Dict nodes: map both the key and the value of every entry.
                new_values, is_changed = {}, false
                for i,e in ipairs tree.value
                    new_key = @tree_map(e.key, fn)
                    new_value = @tree_map(e.value, fn)
                    if (new_key != nil and new_key != e.key) or (new_value != nil and new_value != e.value)
                        is_changed = true
                        -- NOTE(review): only Types.DictEntry is visible in this file's header;
                        -- confirm that a bare `DictEntry` is in scope here.
                        new_values[i] = DictEntry(new_key, new_value)
                    else
                        new_values[i] = e
                if is_changed
                    new_tree = getmetatable(tree)(tree.id, Tuple(table.unpack(new_values)))
                    return new_tree
            when nil -- Raw table, probably from one of the .value of a multi-value tree (e.g. List)
                error("Invalid tree: #{repr tree}")

        -- Nothing changed (or the node type has no children to map).
        return tree

    -- Returns `tree` with every Var node replaced by `replacements[id]`, where `id` is
    -- the Var's Lua identifier (see var_to_lua_identifier). Vars without a non-nil
    -- entry in `replacements` are left alone.
    tree_with_replaced_vars: (tree, replacements)=>
        return @tree_map tree, (t)->
            if t.type == "Var"
                id = @var_to_lua_identifier t.value
                if replacements[id] != nil
                    return replacements[id]

    -- Returns the stub of a FunctionCall tree: its Word values joined by spaces, with
    -- every non-Word argument shown as "%". Raises an error for other tree types.
    tree_to_stub: (tree)=>
        if tree.type != "FunctionCall" then error "Tried to get stub from non-functioncall tree: #{tree.type}", 0
        return concat([(t.type == "Word" and t.value or "%") for t in *tree.value], " ")

    -- Like tree_to_stub, but every non-Word argument is shown as "%" followed by its value.
    tree_to_named_stub: (tree)=>
        if tree.type != "FunctionCall" then error "Tried to get stub from non-functioncall tree: #{tree.type}", 0
        return concat([(t.type == "Word" and t.value or "%#{t.value}") for t in *tree.value], " ")

    -- Shared LPeg definitions for the two signature patterns below.
    stub_defs = {
        space:(P(' ') + P('\n..'))^0
        word:(NOMSU_DEFS.ident_char^1 + NOMSU_DEFS.operator^1)
        varname:(R('az','AZ','09') + P('_') + NOMSU_DEFS.utf8_char)^0
    }
    -- Substitution capture that normalizes an alias into a stub: leading/trailing space
    -- is removed, inner space runs become one space, and variable names after "%" are dropped.
    stub_pattern = re.compile("{~ (%space->'') (('%' (%varname->'')) / %word)? ((%space->' ') (('%' (%varname->'')) / %word))* (%space->'') ~}", stub_defs)

    -- Converts a signature (a plain list of alias strings) into a list of stubs.
    -- Raises an error if the signature is not a plain table, if an alias is not a
    -- string, or if an alias does not match the stub pattern.
    get_stubs_from_signature: (signature)=>
        if type(signature) != 'table' or signature.type
            error("Invalid signature: #{repr signature}", 0)
        stubs = {}
        for i,alias in ipairs(signature)
            if type(alias) != 'string'
                error("Expected entries in signature to be strings, not #{type(alias)}s like: #{repr alias}\nsignature: #{repr signature}", 0)
            stubs[i] = stub_pattern\match(alias)
            unless stubs[i]
                -- Level 0 (no position prefix), matching every other signature error here.
                error("Failed to match stub pattern on alias: #{repr alias}", 0)
        return stubs

    -- Table capture collecting the variable names (the text after each "%") of an alias.
    var_pattern = re.compile("{| %space ((('%' {%varname}) / %word) %space)+ |}", stub_defs)

    -- For each alias in a signature, returns the list of its argument names converted
    -- to Lua identifiers. Raises an error on a malformed signature or alias.
    get_args_from_signature: (signature)=>
        if type(signature) != 'table' or signature.type
            error("Invalid signature: #{repr signature}", 0)
        stub_args = {}
        for i,alias in ipairs(signature)
            if type(alias) != 'string'
                error("Invalid type for signature: #{type(alias)} for:\n#{repr alias}", 0)
            args = var_pattern\match(alias)
            unless args
                error("Failed to match arg pattern on alias: #{repr alias}", 0)
            for j=1,#args do args[j] = @var_to_lua_identifier(args[j])
            stub_args[i] = args
        return stub_args

    var_to_lua_identifier: (var)=>
        -- Converts arbitrary nomsu vars to valid lua identifiers by replacing illegal
        -- characters with escape sequences
        -- Accepts either a Var node or a plain string. The result is "_" followed by the
        -- name, where "_" becomes "__" and any other non-alphanumeric byte becomes "_"
        -- plus its hexadecimal byte value.
        if Types.Var\is_instance(var)
            var = var.value
        -- The parentheses drop gsub's second return value (the match count).
        "_"..(var\gsub "%W", (verboten)->
            if verboten == "_" then "__" else ("_%x")\format(verboten\byte!))

    initialize_core: =>
        -- Sets up some core functionality
        -- get_line_no must be called directly from this method: it reports the line that
        -- its caller (stack level 2) is currently executing.
        get_line_no = -> "nomsu.moon:#{debug.getinfo(2).currentline}"
        nomsu = self

        -- Builds Lua source from a Text tree: literal string pieces are used verbatim and
        -- interpolated subtrees contribute their compiled Lua expression. Raises an error
        -- if an interpolated subtree does not compile to an expression.
        nomsu_string_as_lua = (code)->
            concat_parts = {}
            for bit in *code.value
                if type(bit) == "string"
                    insert concat_parts, bit
                else
                    lua = nomsu\tree_to_lua bit
                    unless lua.expr
                        line = @get_line_number(bit)
                        src = @get_source_code(bit)
                        error "#{line}: Cannot use #{colored.yellow src} as a string interpolation value, since it's not an expression.", 0
                    insert concat_parts, lua.expr
            return concat(concat_parts)

        -- Runs the block's Lua right away at compile time, and also emits it guarded by
        -- `if IMMEDIATE` in the compiled output.
        @define_compile_action "immediately %block", get_line_no!, (_block)->
            lua = nomsu\tree_to_lua(_block)
            lua_code = lua.statements or (lua.expr..";")
            if lua.locals and #lua.locals > 0
                lua_code = "local #{concat lua.locals, ", "};\n#{lua_code}"
            nomsu\run_lua(lua_code)
            return statements:"if IMMEDIATE then\n#{lua_code}\nend", locals:lua.locals

        -- Inline Lua statements. Text is spliced in at compile time; anything else is
        -- compiled to an expression that is passed to nomsu:run_lua at run time.
        @define_compile_action "lua> %code", get_line_no!, (_code)->
            if _code.type == "Text"
                lua = nomsu_string_as_lua(_code)
                return statements:lua
            else
                return statements:"nomsu:run_lua(#{nomsu\tree_to_lua(_code).expr});"

        -- Inline Lua expression.
        @define_compile_action "=lua %code", get_line_no!, (_code)->
            lua = nomsu_string_as_lua(_code)
            return expr:lua

        -- Compiles to a string literal "filename:start,stop" taken from the metadata of
        -- the second-to-last tree on the compile stack, or to an empty string literal
        -- when that tree has no metadata.
        @define_compile_action "!! code location !!", get_line_no!, ->
            tree = nomsu.compilestack[#nomsu.compilestack-1]
            metadata = @tree_metadata[tree]
            if metadata
                return expr: repr("#{metadata.filename}:#{metadata.start},#{metadata.stop}")
            else
                return expr: repr("")

        @define_action "run file %filename", get_line_no!, (_filename)->
            return nomsu\run_file(_filename)

        -- Loads the file at compile time and also emits a run-time nomsu:use_file call.
        @define_compile_action "use %filename", get_line_no!, (_filename)->
            filename = nomsu\tree_to_value(_filename)
            nomsu\use_file(filename)
            return expr:"nomsu:use_file(#{repr filename})"

-- Only run this code if this file was run directly with command line arguments, and not require()'d:
if arg and debug.getinfo(2).func != require
    export colors
    colors = require 'consolecolors'
    -- The arguments are joined with ";" and parsed with this grammar, producing a
    -- table with .flags (a set of flag strings), .input and .output.
    parser = re.compile([[
        args <- {| {:flags: flags? :} ({:input: input :} ";" ("-o;"{:output: output :} ";")?)? (";")? |} !.
        flags <- (({| ({flag} ";")* |}) -> set)
        flag <- "-c" / "-i" / "-p" / "-O" / "--help" / "-h" / "-v"
        input <- "-" / [^;]+
        output <- "-" / [^;]+
    ]], {:set})
    args = concat(arg, ";")..";"
    args = parser\match(args) or {}
    if not args or not args.flags or args.flags["--help"] or args.flags["-h"]
        print "Usage: lua nomsu.lua [-c] [-i] [-p] [-O] [--help] [input [-o output]]"
        os.exit!

    nomsu = NomsuCompiler()

    -- Main driver: optionally runs/compiles the input, then optionally starts a REPL.
    run = ->
        if args.flags["-v"]
            nomsu.debug = true

        nomsu.skip_precompiled = not args.flags["-O"]
        if args.input
            -- Read a file or stdin and output either the printouts or the compiled lua
            if args.flags["-c"] and not args.output
                -- Only a trailing ".nom" is swapped for ".lua". If the input has no such
                -- suffix, ".lua" is appended instead, so the output path can never be
                -- the input path (which would be truncated when opened for writing).
                output, replaced = args.input\gsub("%.nom$", ".lua")
                if replaced == 0 then output = args.input..".lua"
                args.output = output
            compiled_output, owns_output = nil, false
            if args.flags["-p"]
                -- print becomes a no-op while running, presumably so that only the
                -- compiled Lua reaches stdout.
                nomsu.environment.print = ->
                compiled_output = io.output()
            elseif args.output
                -- Fail with the reason from io.open instead of a later nil-index error.
                compiled_output = assert(io.open(args.output, 'w'))
                owns_output = true

            -- Only a path that ends in ".lua" is treated as precompiled Lua.
            if args.input\match("%.lua$")
                retval = dofile(args.input)(nomsu, {})
            else
                local retval, code
                if args.input == '-'
                    retval, code = nomsu\run(io.read('*a'), 'stdin')
                else
                    retval, code = nomsu\run_file(args.input)
                if compiled_output
                    compiled_output\write("local IMMEDIATE = true;\n")
                    compiled_output\write(code)

            -- Close the output file if we opened it (never the shared stdout handle).
            if owns_output
                compiled_output\close!

            if args.flags["-p"]
                nomsu.environment.print = print

        if args.flags["-i"]
            -- REPL
            nomsu\run('use "core"', "stdin")
            while true
                io.write(colored.bright colored.yellow ">> ")
                buff = ""
                -- Accumulate lines until a blank line or end of input.
                while true
                    line = io.read("*L")
                    if line == "\n" or not line
                        break
                    line = line\gsub("\t", " ")
                    buff ..= line
                    io.write(colored.dim colored.yellow ".. ")
                if #buff == 0
                    break
                ok, ret = pcall(-> nomsu\run(buff, "stdin"))
                if ok and ret != nil
                    print "= "..repr(ret)
                elseif not ok
                    print colored.bright colored.red ret

    -- Error handler that prints the message and a colorized stack traceback, then exits
    -- with a failure status. Currently unused: the xpcall call below is commented out.
    err_hand = (error_message)->
        -- TODO: write properly to stderr
        print("#{colored.red "ERROR:"} #{colored.bright colored.yellow colored.onred (error_message or "")}")
        print("stack traceback:")

        -- TODO: properly print out the calling site of nomsu code, not just the *called* code
        ok, to_lua = pcall -> require('moonscript.base').to_lua
        if not ok then to_lua = -> nil
        -- The line table is optional: if nomsu.moon can't be opened, frames from it are
        -- reported with the plain short_src:currentline form below.
        nomsu_source, line_table = nil, nil
        if nomsu_file = io.open("nomsu.moon")
            nomsu_source = nomsu_file\read("*a")
            nomsu_file\close!
            _, line_table = to_lua(nomsu_source)

        level = 2
        while true
            calling_fn = debug.getinfo(level)
            if not calling_fn then break
            if calling_fn.func == run then break
            level += 1
            name = calling_fn.name
            if name == "run_lua_fn" then continue
            line = nil
            if metadata = nomsu.action_metadata[calling_fn.func]
                -- Frame belongs to a nomsu action: show where the action was defined.
                filename, start, stop = metadata.source\match("([^:]*):([0-9]*),([0-9]*)")
                source_text = nil
                if filename
                    if source_file = io.open(filename)
                        source_text = source_file\read("*a")
                        source_file\close!
                if source_text
                    -- Convert the character offset into a line number.
                    line_no = 1
                    for _ in source_text\sub(1,tonumber(start))\gmatch("\n") do line_no += 1
                    offending_statement = source_text\sub(tonumber(start),tonumber(stop))
                    if #offending_statement > 50
                        offending_statement = offending_statement\sub(1,50).."..."
                    offending_statement = colored.red(offending_statement)
                    line = colored.yellow(filename..":"..tostring(line_no).."\n "..offending_statement)
                else
                    -- Unparseable source, or the source file can't be read.
                    line = colored.yellow(metadata.source)
                name = colored.bright(colored.yellow(metadata.aliases[1]))
            else
                if calling_fn.istailcall and not name
                    name = ""
                if calling_fn.short_src == "./nomsu.moon" and line_table
                    -- Map the compiled Lua line back to a line of nomsu.moon.
                    char = line_table[calling_fn.currentline]
                    line_num = 1
                    for _ in nomsu_source\sub(1,char)\gmatch("\n") do line_num += 1
                    line = colored.cyan("#{calling_fn.short_src}:#{line_num}")
                    name = colored.bright(colored.cyan(name or "???"))
                else
                    line = colored.blue("#{calling_fn.short_src}:#{calling_fn.currentline}")
                    name = colored.bright(colored.blue(name or "???"))
            _from = colored.dim colored.white "|"
            print(("%32s %s %s")\format(name, _from, line))

        os.exit(false, true)

    -- Note: xpcall has a slightly different API in Lua <=5.1 vs. >=5.2, but this works
    -- for both APIs
    ldt = require 'ldt'
    ldt.guard run
    --xpcall(run, err_hand)

return NomsuCompiler