#!/usr/bin/env moon -- This file contains the source code of the Nomsu compiler. -- Nomsu is a programming language that cross-compiles to Lua. It was designed to be good -- at natural-language-like code that is highly self-modifying and flexible. -- The only dependency is LPEG, which can be installed using "luarocks install lpeg" -- File usage: -- Either, in a lua/moonscript file: -- Nomsu = require "nomsu" -- nomsu = Nomsu() -- nomsu:run(your_nomsu_code) -- Or from the command line: -- lua nomsu.lua [input_file [output_file or -]] re = require 're' lpeg = require 'lpeg' utils = require 'utils' new_uuid = require 'uuid' {:repr, :stringify, :min, :max, :equivalent, :set, :is_list, :sum} = utils colors = setmetatable({}, {__index:->""}) colored = setmetatable({}, {__index:(_,color)-> ((msg)-> colors[color]..(msg or '')..colors.reset)}) {:insert, :remove, :concat} = table -- Use + operator for string coercive concatenation (note: "asdf" + 3 == "asdf3") -- Use [] for accessing string characters, or s[{3,4}] for s:sub(3,4) -- Note: This globally affects all strings in this instance of Lua! do STRING_METATABLE = getmetatable("") STRING_METATABLE.__add = (other)=> @ .. stringify(other) STRING_METATABLE.__index = (i)=> if type(i) == 'number' then return string.sub(@, i, i) elseif type(i) == 'table' then return string.sub(@, i[1], i[2]) else return string[i] --STRING_METATABLE.__mul = (other)=> string.rep(@, other) -- TODO: -- consider non-linear codegen, rather than doing thunks for things like comprehensions -- improve indentation of generated lua code -- better error reporting -- type checking? -- Add compiler options for optimization level (compile-fast vs. run-fast, etc.) -- Do a pass on all actions to enforce parameters-are-nouns heuristic -- Maybe do some sort of lazy definitions of actions that defer until they're used in code -- Change nomsu:tree_to_lua() to use a table lookup instead of a switch statement lpeg.setmaxstack 10000 -- whoa {:P,:R,:V,:S,:Cg,:C,:Cp,:B,:Cmt} = lpeg NOMSU_DEFS = with {} -- Newline supports either windows-style CR+LF or unix-style LF .nl = P("\r")^-1 * P("\n") .ws = S(" \t") .tonumber = tonumber .print = (src,pos,msg)-> print(msg, pos, repr(src\sub(math.max(0,pos-16),math.max(0,pos-1)).."|"..src\sub(pos,pos+16))) return true string_escapes = n:"\n", t:"\t", b:"\b", a:"\a", v:"\v", f:"\f", r:"\r" digit, hex = R('09'), R('09','af','AF') .escaped_char = (P("\\")*S("xX")*C(hex*hex)) / => string.char(tonumber(@, 16)) .escaped_char += (P("\\")*C(digit*(digit^-2))) / => string.char(tonumber @) .escaped_char += (P("\\")*C(S("ntbavfr"))) / string_escapes .operator_char = S("'~`!@$^&*-+=|<>?/") .operator = .operator_char^1 .utf8_char = ( R("\194\223")*R("\128\191") + R("\224\239")*R("\128\191")*R("\128\191") + R("\240\244")*R("\128\191")*R("\128\191")*R("\128\191")) .ident_char = R("az","AZ","09") + P("_") + .utf8_char -- If the number of leading space characters is greater than number in the top of the -- stack, this pattern matches and pushes the number onto the stack. .indent = P (start)=> spaces = @match("[ \t]*", start) if #spaces > lpeg.userdata.indent_stack[#lpeg.userdata.indent_stack] insert(lpeg.userdata.indent_stack, #spaces) return start + #spaces -- If the number of leading space characters is less than number in the top of the -- stack, this pattern matches and pops off the top of the stack exactly once. .dedent = P (start)=> spaces = @match("[ \t]*", start) if #spaces < lpeg.userdata.indent_stack[#lpeg.userdata.indent_stack] remove(lpeg.userdata.indent_stack) return start -- If the number of leading space characters is equal to the number on the top of the -- stack, this pattern matches and does not modify the stack. .nodent = P (start)=> spaces = @match("[ \t]*", start) if #spaces == lpeg.userdata.indent_stack[#lpeg.userdata.indent_stack] return start + #spaces -- If the number of leading space characters is 4+ more than the number on the top of the -- stack, this pattern matches the first n+4 spaces and does not modify the stack. .gt_nodent = P (start)=> -- Note! This assumes indent is exactly 4 spaces!!! spaces = @match("[ \t]*", start) if #spaces >= lpeg.userdata.indent_stack[#lpeg.userdata.indent_stack] + 4 return start + lpeg.userdata.indent_stack[#lpeg.userdata.indent_stack] + 4 .error = (src,pos,err_msg)-> if lpeg.userdata.source_code\sub(pos,pos)\match("[\r\n]") pos += #lpeg.userdata.source_code\match("[ \t\n\r]*", pos) line_no = 1 while (lpeg.userdata.line_starts[line_no+1] or math.huge) < pos do line_no += 1 prev_line = if line_no > 1 lpeg.userdata.source_code\match("[^\r\n]*", lpeg.userdata.line_starts[line_no-1]) else "" err_line = lpeg.userdata.source_code\match("[^\r\n]*", lpeg.userdata.line_starts[line_no]) next_line = if line_no < #lpeg.userdata.line_starts lpeg.userdata.source_code\match("[^\r\n]*", lpeg.userdata.line_starts[line_no+1]) else "" pointer = ("-")\rep(pos-lpeg.userdata.line_starts[line_no]) .. "^" err_msg = (err_msg or "Parse error").." in #{lpeg.userdata.filename} on line #{line_no}:\n" err_msg ..="\n#{prev_line}\n#{err_line}\n#{pointer}\n#{next_line}\n" error(err_msg) .FunctionCall = (start, value, stop)-> stub = concat([(t.type == "Word" and t.value or "%") for t in *value], " ") src = lpeg.userdata.source_code\sub(start,stop-1) return { type: "FunctionCall", :start, :stop, :value, :stub, filename:lpeg.userdata.filename, get_line_no:lpeg.userdata.get_line_no, get_src:lpeg.userdata.get_src, } setmetatable(NOMSU_DEFS, {__index:(key)=> make_node = (start, value, stop)-> { type: key, :start, :stop, :value, filename:lpeg.userdata.filename, get_src:lpeg.userdata.get_src, get_line_no:lpeg.userdata.get_line_no, } self[key] = make_node return make_node }) NOMSU = do -- Just for cleanliness, I put the language spec in its own file using a slightly modified -- version of the lpeg.re syntax. peg_tidier = re.compile [[ file <- {~ %nl* (def/comment) (%nl+ (def/comment))* %nl* ~} def <- anon_def / captured_def anon_def <- ({ident} (" "*) ":" {((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- %2" captured_def <- ({ident} (" "*) "(" {ident} ")" (" "*) ":" {((%nl " "+ [^%nl]*)+) / ([^%nl]*)}) -> "%1 <- ({} %3 {}) -> %2" ident <- [a-zA-Z_][a-zA-Z0-9_]* comment <- "--" [^%nl]* ]] nomsu_peg = peg_tidier\match(io.open("nomsu.peg")\read("*a")) re.compile(nomsu_peg, NOMSU_DEFS) class NomsuCompiler @def_number: 0 new:()=> -- Weak-key mapping from objects to randomly generated unique IDs NaN_surrogate = {} nil_surrogate = {} @ids = setmetatable({}, { __mode: "k" __index: (key)=> if key == nil then return @[nil_surrogate] elseif key != key then return @[NaN_surrogate] id = new_uuid! @[key] = id return id }) @compilestack = {} @debug = false @environment = { -- Discretionary/convenience stuff nomsu:self, repr:repr, stringify:stringify, utils:utils, lpeg:lpeg, re:re, -- Lua stuff: :next, :unpack, :setmetatable, :coroutine, :rawequal, :getmetatable, :pcall, :error, :package, :os, :require, :tonumber, :tostring, :string, :xpcall, :module, :print, :loadfile, :rawset, :_VERSION, :collectgarbage, :rawget, :bit32, :rawlen, :table, :assert, :dofile, :loadstring, :type, :select, :debug, :math, :io, :pairs, :load, :ipairs, } @environment.ACTIONS = setmetatable({}, {__index:(key)=> error("Attempt to run undefined action: #{key}", 0) }) @action_metadata = setmetatable({}, {__mode:"k"}) @environment.ACTION_METADATA = @action_metadata @environment.LOADED = {} @initialize_core! define_action: (signature, source, fn)=> if @debug print "#{colored.bright "DEFINING ACTION:"} #{colored.green repr(signature)}" if type(fn) != 'function' error 'function', "Bad fn: #{repr fn}" if type(signature) == 'string' signature = {signature} elseif type(signature) != 'table' or signature.type != nil error("Invalid signature, expected list of strings, but got: #{repr signature}", 0) stubs = @get_stubs_from_signature signature stub_args = @get_args_from_signature signature @@def_number += 1 fn_info = debug.getinfo(fn, "u") local fn_arg_positions, arg_orders unless fn_info.isvararg fn_arg_positions = {debug.getlocal(fn, i), i for i=1,fn_info.nparams} arg_orders = {} -- Map from stub -> index where each arg in the stub goes in the function call for sig_i=1,#stubs stub, args = stubs[sig_i], stub_args[sig_i] if @debug print "#{colored.bright "ALIAS:"} #{colored.underscore colored.magenta repr(stub)} #{colored.bright "WITH ARGS"} #{colored.dim repr(args)} ON: #{@environment.ACTIONS}" -- TODO: use debug.getupvalue instead of @environment.ACTIONS? @environment.ACTIONS[stub] = fn unless fn_info.isvararg arg_positions = [fn_arg_positions[a] for a in *args] -- TODO: better error checking? if #arg_positions != #args error("Mismatch in args between lua function's #{repr fn_arg_positions} and stub's #{repr args} for #{repr stub}", 0) arg_orders[stub] = arg_positions @action_metadata[fn] = { :fn, :source, aliases:stubs, :arg_orders, arg_positions:fn_arg_positions, def_number:@@def_number, } define_compile_action: (signature, source, fn, src)=> @define_action(signature, source, fn) @action_metadata[fn].compile_time = true serialize_defs: (scope=nil, after=nil)=> -- TODO: repair error("Not currently functional.", 0) dedent: (code)=> unless code\find("\n") return code spaces, indent_spaces = math.huge, math.huge for line in code\gmatch("\n([^\n]*)") if line\match("^%s*#.*") or line\match("^%s*$") continue -- skip comments and blank lines elseif s = line\match("^(%s*)%.%..*") spaces = math.min(spaces, #s) elseif s = line\match("^(%s*)%S.*") indent_spaces = math.min(indent_spaces, #s) if spaces != math.huge and spaces < indent_spaces return (code\gsub("\n"..(" ")\rep(spaces), "\n")) elseif indent_spaces != math.huge return (code\gsub("\n"..(" ")\rep(indent_spaces), "\n ")) else return code indent: (code, levels=1)=> return code\gsub("\n","\n"..(" ")\rep(levels)) line_counter = re.compile([[ lines <- {| line (%nl line)* |} line <- {} (!%nl .)* ]], nl:NOMSU_DEFS.nl) parse: (nomsu_code, filename)=> assert type(filename) == "string", "Bad filename type: #{type filename}" if @debug print "#{colored.bright "PARSING:"}\n#{colored.yellow nomsu_code}" userdata = with {source_code:nomsu_code, :filename, indent_stack: {0}} .get_src = => nomsu_code\sub(@start, @stop-1) .line_starts = line_counter\match(.source_code) .get_line_no = => unless @_line_no line_no = 1 while line_no < #.line_starts and .line_starts[line_no+1] < @start line_no += 1 @_line_no = "#{.filename}:#{line_no}" return @_line_no old_userdata, lpeg.userdata = lpeg.userdata, userdata tree = NOMSU\match(nomsu_code) lpeg.userdata = old_userdata assert tree, "In file #{colored.blue filename} failed to parse:\n#{colored.onyellow colored.black nomsu_code}" if @debug print "PARSE TREE:" @print_tree tree, " " return tree run: (src, filename, max_operations=nil, output_file=nil)=> if src == "" then return nil, "" if max_operations timeout = -> debug.sethook! error("Execution quota exceeded. Your code took too long.", 0) debug.sethook timeout, "", max_operations tree = @parse(src, filename) assert tree, "Failed to parse: #{src}" assert tree.type == "File", "Attempt to run non-file: #{tree.type}" lua = @tree_to_lua(tree) lua_code = lua.statements or (lua.expr..";") if lua_code.locals and #lua_code.locals > 0 lua_code = "local "..concat(lua_code.locals, ", ")..";\n"..lua_code lua_code = "-- File: #{filename}\n"..lua_code ret = @run_lua(lua_code) if max_operations debug.sethook! if output_file output_file\write(lua_code) return ret, lua_code run_file: (filename)=> if filename\match(".*%.lua") file = io.open(filename) contents = file\read("*a") file\close! return assert(load(contents, nil, nil, @environment))! if filename\match(".*%.nom") if not @skip_precompiled -- Look for precompiled version file = io.open(filename\gsub("%.nom", ".lua"), "r") if file lua_code = file\read("*a") file\close! return @run_lua(lua_code) file = file or io.open(filename) if not file error("File does not exist: #{filename}", 0) nomsu_code = file\read('*a') file\close! return @run(nomsu_code, filename) else error("Invalid filetype for #{filename}", 0) require_file: (filename)=> loaded = @environment.LOADED if not loaded[filename] loaded[filename] = @run_file(filename) or true return loaded[filename] run_lua: (lua_code)=> run_lua_fn, err = load(lua_code, nil, nil, @environment) if @debug print "#{colored.bright "RUNNING LUA:"}\n#{colored.blue colored.bright(lua_code)}" if not run_lua_fn n = 1 fn = -> n = n + 1 ("\n%-3d|")\format(n) code = "1 |"..lua_code\gsub("\n", fn) error("Failed to compile generated code:\n#{colored.bright colored.blue colored.onblack code}\n\n#{err}", 0) return run_lua_fn! tree_to_value: (tree, filename)=> -- Special case for text literals if tree.type == 'Text' and #tree.value == 1 and type(tree.value[1]) == 'string' return tree.value[1] code = "return #{@tree_to_lua(tree).expr};" if @debug print "#{colored.bright "RUNNING LUA TO GET VALUE:"}\n#{colored.blue colored.bright(code)}" lua_thunk, err = load(code, nil, nil, @environment) if not lua_thunk error("Failed to compile generated code:\n#{colored.bright colored.blue colored.onblack code}\n\n#{colored.red err}", 0) return lua_thunk! tree_to_nomsu: (tree, indentation="", max_line=80, expr_type=nil)=> -- Convert a tree into nomsu code that satisfies the max line requirement or nil -- if that's not possible -- expr_type is either: -- nil for code that goes at the top level and can contain anything -- "noeol" for code that can contain anything except an end-of-line component -- like a colon (i.e. it already occurs after a colon on the same line) -- "inline" for code that cannot contain indented code or an end-of-line component -- e.g. code that is meant to go inside parentheses assert tree, "No tree provided to tree_to_nomsu." assert tree.type, "Invalid tree: #{repr(tree)}" join_lines = (lines)-> for line in *lines if #indentation + #line > max_line return nil return concat(lines, "\n"..indentation) is_operator = (tok)-> tok and tok.type == "Word" and NOMSU_DEFS.operator\match(tok.value) local inline_expression, noeol_expression, expression inline_expression = (tok)-> switch tok.type when "Block" if #tok.value > 1 then return nil nomsu = inline_expression tok.value return nomsu and "(: #{nomsu})" when "FunctionCall" buff = "" for i,bit in ipairs tok.value if bit.type == "Word" if i == 1 or (is_operator(bit) and is_operator(tok.value[i-1])) buff ..= bit.value else buff ..= " "..bit.value else nomsu = inline_expression bit return nil unless nomsu unless i == 1 or bit.type == "Block" buff ..= " " buff ..= if bit.type == "FunctionCall" "("..nomsu..")" else nomsu return buff when "List" bits = {} for bit in *tok.value nomsu = inline_expression bit return nil unless nomsu insert bits, nomsu return "["..concat(bits, ", ").."]" when "Dict" bits = {} for bit in *tok.value key_nomsu = if bit.dict_key.type == "Word" bit.dict_key.value else inline_expression bit.dict_key return nil unless key_nomsu if bit.dict_key.type == "FunctionCall" key_nomsu = "("..key_nomsu..")" value_nomsu = inline_expression bit.dict_value return nil unless value_nomsu insert bits, key_nomsu.."="..value_nomsu return "{"..concat(bits, ", ").."}" when "Text" buff = '"' for bit in *tok.value if type(bit) == 'string' -- Force indented text return nil if bit\find("\n") buff ..= bit\gsub("\\","\\\\")\gsub("\n","\\n") else nomsu = inline_expression(bit) return nil unless nomsu buff ..= if bit.type == "Var" or bit.type == "List" or bit.type == "Dict" "\\"..nomsu else "\\("..nomsu..")" if #buff > max_line then return nil return buff..'"' when "Nomsu" nomsu = inline_expression(tok.value) return nil if not nomsu return "\\("..nomsu..")" when "Number" then tostring(tok.value) when "Var" then "%"..tok.value else return nil noeol_expression = (tok)-> nomsu = inline_expression(tok) if nomsu and #nomsu < max_line return nomsu switch tok.type when "Block" buff = ":" for line in *tok.value nomsu = expression(line) return nil unless nomsu buff ..= "\n "..@indent(nomsu) return buff when "FunctionCall" nomsu = expression(tok) return nil unless nomsu return "(..)\n "..@indent(nomsu) when "List" buff = "[..]" line = "\n " for bit in *tok.value nomsu = inline_expression bit if line != "\n " and #line + #", " + #nomsu > max_line buff ..= line line = "\n " sep = line == "\n " and "" or ", " if nomsu line ..= sep..nomsu if #line >= max_line buff ..= line line = "\n " else line ..= sep..expression(bit) buff ..= line line = "\n " if line ~= "\n " buff ..= line return buff when "Dict" buff = "{..}" line = "\n " for bit in *tok.value key_nomsu = inline_expression bit.dict_key return nil unless key_nomsu if bit.dict_key.type == "FunctionCall" key_nomsu = "("..key_nomsu..")" value_nomsu = inline_expression bit.dict_value if value_nomsu and #key_nomsu + #value_nomsu < max_line line ..= key_nomsu.."="..value_nomsu.."," if #line >= max_line buff ..= line line = "\n " else line ..= key_nomsu.."="..expression(bit.dict_value) buff ..= line line = "\n " if line ~= "\n " buff ..= line return buff when "Text" buff = '".."\n ' for bit in *tok.value if type(bit) == 'string' buff ..= bit\gsub("\\","\\\\")\gsub("\n","\n ") else nomsu = inline_expression(bit) return nil unless nomsu buff ..= if bit.type == "Var" or bit.type == "List" or bit.type == "Dict" "\\"..nomsu else "\\("..nomsu..")" return buff when "Nomsu" nomsu = expression(tok.value) return nil if not nomsu return "\\(..)\n "..@indent(nomsu) when "Comment" if tok.value\find("\n") return "#.."..tok.value\gsub("\n","\n ") else return "#"..tok.value else return inline_expression(tok) expression = (tok)-> nomsu = inline_expression(tok) if nomsu and #nomsu < max_line return nomsu switch tok.type when "Block" if #tok.value == 1 nomsu = if tok.value[1].type == "FunctionCall" inline_expression(tok.value[1]) else noeol_expression(tok.value[1]) if nomsu and #(nomsu\match("[^\n]*")) < max_line return ": "..nomsu return noeol_expression(tok) when "FunctionCall" -- The hard task buff = "" for i,bit in ipairs tok.value if bit.type == "Word" if i == 1 or (is_operator(bit) and is_operator(tok.value[i-1])) or buff\sub(-2,-1) == ".." buff ..= bit.value else buff ..= " "..bit.value else nomsu = inline_expression(bit) if nomsu and #nomsu < max_line if bit.type == "FunctionCall" nomsu = "("..nomsu..")" else nomsu = expression(bit) return nil unless nomsu if bit.type == "FunctionCall" nomsu = "(..)\n "..@indent(nomsu) if i < #tok.value nomsu ..= "\n.." unless i == 1 or bit.type == "Block" buff ..= " " buff ..= nomsu return buff when "File" lines = {} for line in *tree.value nomsu = expression(line) assert nomsu, "Failed to produce output for:\n#{colored.yellow line\get_src!}" insert lines, nomsu return concat lines, "\n" when "Comment" if tok.value\find("\n") return "#.."..tok.value\gsub("\n","\n ") else return "#"..tok.value else return noeol_expression(tok) return expression(tree) value_to_nomsu: (value)=> switch type(value) when "nil" return "(nil)" when "bool" return value and "(yes)" or "(no)" when "number" return repr(value) when "table" if is_list(value) return "[#{concat [@value_to_nomsu(v) for v in *value], ", "}]" else return "{#{concat ["#{@value_to_nomsu(k)}=#{@value_to_nomsu(v)}" for k,v in pairs(value)], ", "}}" when "string" if value == "\n" return "'\\n'" elseif not value\find[["]] and not value\find"\n" and not value\find"\\" return "\""..value.."\"" else -- TODO: This might fail if it's being put inside a list or something return '".."\n '..(@indent value) else error("Unsupported value_to_nomsu type: #{type(value)}", 0) @math_patt: re.compile [[ "%" (" " [*/^+-] " %")+ ]] tree_to_lua: (tree)=> -- Return , assert tree, "No tree provided." if not tree.type error("Invalid tree: #{repr(tree)}", 0) switch tree.type when "File" if #tree.value == 1 return @tree_to_lua(tree.value[1]) declared_locals = {} lua_bits = {} line_no = 1 for line in *tree.value lua = @tree_to_lua line if not lua error("No lua produced by #{repr line}", 0) if lua.locals new_locals = [l for l in *lua.locals when not declared_locals[l]] if #new_locals > 0 insert lua_bits, "local #{concat new_locals, ", "};" for l in *new_locals do declared_locals[l] = true if lua.statements then insert lua_bits, lua.statements elseif lua.expr then insert lua_bits, "#{lua.expr};" return statements:concat(lua_bits, "\n") when "Comment" return statements:"--"..tree.value\gsub("\n","\n--") when "Nomsu" return expr:"nomsu:parse(#{repr tree.value\get_src!}, #{repr tree\get_line_no!}).value[1]" when "Block" lua_bits = {} locals = {} for arg in *tree.value lua = @tree_to_lua arg if #tree.value == 1 and lua.expr and not lua.statements return {expr:lua.expr, locals:lua.locals} if lua.locals for l in *lua.locals do table.insert(locals, l) if lua.statements then insert lua_bits, lua.statements elseif lua.expr then insert lua_bits, "#{lua.expr};" utils.deduplicate(locals) return statements:concat(lua_bits, "\n"), locals:(#locals > 0 and locals or nil) when "FunctionCall" insert @compilestack, tree -- Rawget here to avoid triggering an error for accessing an undefined action fn = rawget(@environment.ACTIONS, tree.stub) metadata = @environment.ACTION_METADATA[fn] if metadata and metadata.compile_time args = [arg for arg in *tree.value when arg.type != "Word"] if metadata and metadata.arg_orders new_args = [args[p] for p in *metadata.arg_orders[tree.stub]] args = new_args if @debug print "#{colored.bright "RUNNING MACRO"} #{colored.underscore colored.magenta(tree.stub)} " print "#{colored.bright "WITH ARGS:"} #{colored.dim repr [(repr a)\sub(1,50) for a in *args]}" lua = fn(unpack(args)) remove @compilestack return lua elseif not metadata and @@math_patt\match(tree.stub) -- This is a bit of a hack, but this code handles arbitrarily complex -- math expressions like 2*x + 3^2 without having to define a single -- action for every possibility. bits = {} for tok in *tree.value if tok.type == "Word" insert bits, tok.value else lua = @tree_to_lua(tok) assert(lua.expr, "non-expression value inside math expression: #{tok\get_src!}") insert bits, lua.expr remove @compilestack return expr:"(#{concat bits, " "})" args = {} for tok in *tree.value if tok.type == "Word" then continue lua = @tree_to_lua(tok) assert lua.expr, "#{tree\get_line_no!}: Cannot use:\n#{colored.yellow tok\get_src!}\nas an argument to #{tree.stub}, since it's not an expression, it produces: #{repr lua}" insert args, lua.expr if metadata and metadata.arg_orders new_args = [args[p] for p in *metadata.arg_orders[tree.stub]] args = new_args remove @compilestack return expr:@@comma_separated_items("ACTIONS[#{repr tree.stub}](", args, ")") when "Text" concat_parts = {} string_buffer = "" for bit in *tree.value if type(bit) == "string" string_buffer ..= bit continue if string_buffer ~= "" insert concat_parts, repr(string_buffer) string_buffer = "" lua = @tree_to_lua bit if @debug print(colored.bright "INTERP:") @print_tree bit print "#{colored.bright "EXPR:"} #{lua.expr}, #{colored.bright "STATEMENT:"} #{lua.statements}" assert lua.expr, "Cannot use [[#{bit\get_src!}]] as a string interpolation value, since it's not an expression." insert concat_parts, "stringify(#{lua.expr})" if string_buffer ~= "" insert concat_parts, repr(string_buffer) if #concat_parts == 0 return expr:"''" elseif #concat_parts == 1 return expr:concat_parts[1] else return expr:"(#{concat(concat_parts, "..")})" when "List" items = {} for item in *tree.value lua = @tree_to_lua item assert lua.expr, "Cannot use [[#{item\get_src!}]] as a list item, since it's not an expression." insert items, lua.expr return expr:@@comma_separated_items("{", items, "}") when "Dict" items = {} for entry in *tree.value key_lua = if entry.dict_key.type == "Word" {expr:repr(entry.dict_key.value)} else @tree_to_lua entry.dict_key assert key_lua.expr, "Cannot use [[#{entry.dict_key\get_src!}]] as a dict key, since it's not an expression." value_lua = @tree_to_lua entry.dict_value assert value_lua.expr, "Cannot use [[#{entry.dict_value\get_src!}]] as a dict value, since it's not an expression." key_str = key_lua.expr\match([=[["']([a-zA-Z_][a-zA-Z0-9_]*)['"]]=]) if key_str insert items, "#{key_str}=#{value_lua.expr}" elseif key_lua.expr\sub(1,1) == "[" insert items, "[ #{key_lua.expr}]=#{value_lua.expr}" else insert items, "[#{key_lua.expr}]=#{value_lua.expr}" return expr:@@comma_separated_items("{", items, "}") when "Number" return expr:repr(tree.value) when "Var" return expr:@var_to_lua_identifier(tree.value) else error("Unknown/unimplemented thingy: #{tree.type}", 0) walk_tree: (tree, depth=0)=> coroutine.yield(tree, depth) if type(tree) != 'table' or not tree.type return switch tree.type when "List", "File", "Block", "FunctionCall", "Text" for v in *tree.value @walk_tree(v, depth+1) when "Dict" for e in *tree.value @walk_tree(e.dict_key, depth+1) @walk_tree(e.dict_value, depth+1) else @walk_tree(tree.value, depth+1) return nil print_tree: (tree)=> buff = colors.bright..colors.green for node,depth in coroutine.wrap(-> @walk_tree tree) if type(node) != 'table' or not node.type buff += ((" ")\rep(depth)..repr(node)).."\n" else buff += ("#{(" ")\rep(depth)}#{node.type}:").."\n" print(buff..colors.reset) tree_to_str: (tree)=> bits = {} for node,depth in coroutine.wrap(-> @walk_tree tree) if type(node) != 'table' or not node.type insert bits, ((" ")\rep(depth)..repr(node)) else insert bits, ("#{(" ")\rep(depth)}#{node.type}:") return concat(bits, "\n") @unescape_string: (str)=> Cs(((P("\\\\")/"\\") + (P("\\\"")/'"') + NOMSU_DEFS.escaped_char + P(1))^0)\match(str) @comma_separated_items: (open, items, close)=> bits = {open} so_far = 0 for i,item in ipairs(items) if i < #items then item ..= ", " insert bits, item so_far += #item if so_far >= 80 insert bits, "\n" so_far = 0 insert bits, close return concat(bits) tree_with_replaced_vars: (tree, replacements)=> if type(tree) != 'table' then return tree switch tree.type when "Var" id = @var_to_lua_identifier tree.value if replacements[id] ~= nil tree = replacements[id] when "File", "Nomsu", "Block", "List", "FunctionCall", "Text" new_value = @tree_with_replaced_vars tree.value, replacements if new_value != tree.value tree = {k,v for k,v in pairs(tree)} tree.value = new_value when "Dict" dirty = false replacements = {} for i,e in ipairs tree.value new_key = @tree_with_replaced_vars e.dict_key, replacements new_value = @tree_with_replaced_vars e.dict_value, replacements dirty or= new_key != e.dict_key or new_value != e.dict_value replacements[i] = {dict_key:new_key, dict_value:new_value} if dirty tree = {k,v for k,v in pairs(tree)} tree.value = replacements when nil -- Raw table, probably from one of the .value of a multi-value tree (e.g. List) new_values = {} any_different = false for k,v in pairs tree new_values[k] = @tree_with_replaced_vars v, replacements any_different or= (new_values[k] != tree[k]) if any_different tree = new_values return tree stub_defs = { space:(P(' ') + P('\n..'))^0 word:(NOMSU_DEFS.ident_char^1 + NOMSU_DEFS.operator^1) varname:(R('az','AZ','09') + P('_') + NOMSU_DEFS.utf8_char)^0 } stub_pattern = re.compile("{~ (%space->'') (('%' (%varname->'')) / %word)? ((%space->' ') (('%' (%varname->'')) / %word))* (%space->'') ~}", stub_defs) get_stubs_from_signature: (signature)=> if type(signature) != 'table' or signature.type error("Invalid signature: #{repr signature}", 0) stubs = {} for i,alias in ipairs(signature) if type(alias) != 'string' error("Expected entries in signature to be strings, not #{type(alias)}s like: #{repr alias}\nsignature: #{repr signature}", 0) stubs[i] = stub_pattern\match(alias) unless stubs[i] error("Failed to match stub pattern on alias: #{repr alias}") return stubs var_pattern = re.compile("{| %space ((('%' {%varname}) / %word) %space)+ |}", stub_defs) get_args_from_signature: (signature)=> if type(signature) != 'table' or signature.type error("Invalid signature: #{repr signature}", 0) stub_args = {} for i,alias in ipairs(signature) if type(alias) != 'string' error("Invalid type for signature: #{type(alias)} for:\n#{repr alias}", 0) args = var_pattern\match(alias) unless args error("Failed to match arg pattern on alias: #{repr alias}", 0) for j=1,#args do args[j] = @var_to_lua_identifier(args[j]) stub_args[i] = args return stub_args var_to_lua_identifier: (var)=> -- Converts arbitrary nomsu vars to valid lua identifiers by replacing illegal -- characters with escape sequences if type(var) == 'table' and var.type == "Var" var = var.value "_"..(var\gsub "%W", (verboten)-> if verboten == "_" then "__" else ("_%x")\format(verboten\byte!)) source_code: (level=0)=> @dedent @compilestack[#@compilestack-level]\get_src! initialize_core: => -- Sets up some core functionality get_line_no = -> "nomsu.moon:#{debug.getinfo(2).currentline}" nomsu = self nomsu_string_as_lua = (code)-> concat_parts = {} for bit in *code.value if type(bit) == "string" insert concat_parts, bit else lua = nomsu\tree_to_lua bit unless lua.expr error("Cannot use [[#{bit\get_src!}]] as a string interpolation value, since it's not an expression.", 0) insert concat_parts, lua.expr return concat(concat_parts) -- TODO: fix how 'immediately' works with locals, e.g. "immediately: %x <- 5" @define_compile_action "immediately %block", get_line_no!, (_block)-> lua = nomsu\tree_to_lua(_block) lua_code = lua.statements or (lua.expr..";") nomsu\run_lua(lua_code) return statements:"if IMMEDIATE then\n#{lua_code}\nend", locals:lua.locals @define_compile_action "lua> %code", get_line_no!, (_code)-> if _code.type == "Text" lua = nomsu_string_as_lua(_code) return statements:lua else return statements:"nomsu:run_lua(#{nomsu\tree_to_lua(_code).expr});" @define_compile_action "=lua %code", get_line_no!, (_code)-> lua = nomsu_string_as_lua(_code) return expr:lua @define_compile_action "!! code location !!", get_line_no!, -> tree = nomsu.compilestack[#nomsu.compilestack-1] return expr: repr("#{tree.filename}:#{tree.start},#{tree.stop}") @define_action "run file %filename", get_line_no!, (_filename)-> nomsu\run_file(_filename) @define_compile_action "use %filename", get_line_no!, (_filename)-> filename = nomsu\tree_to_value(_filename) nomsu\require_file(filename) return statements:"nomsu:require_file(#{repr filename});" if arg export colors colors = require 'consolecolors' parser = re.compile([[ args <- {| {:flags: flags? :} ({:input: input :} ";" ("-o;"{:output: output :} ";")?)? (";")? |} !. flags <- (({| ({flag} ";")* |}) -> set) flag <- "-c" / "-i" / "-p" / "-O" / "--help" / "-h" / "-v" input <- "-" / [^;]+ output <- "-" / [^;]+ ]], {:set}) args = concat(arg, ";")..";" args = parser\match(args) or {} if not args or not args.flags or args.flags["--help"] or args.flags["-h"] print "Usage: lua nomsu.lua [-c] [-i] [-p] [-O] [--help] [input [-o output]]" os.exit! nomsu = NomsuCompiler() run = -> if args.flags["-v"] nomsu.debug = true nomsu.skip_precompiled = not args.flags["-O"] if args.input -- Read a file or stdin and output either the printouts or the compiled lua if args.flags["-c"] and not args.output args.output = args.input\gsub("%.nom", ".lua") compiled_output = nil if args.flags["-p"] nomsu.environment.print = -> compiled_output = io.output() elseif args.output compiled_output = io.open(args.output, 'w') if args.input\match(".*%.lua") retval = dofile(args.input)(nomsu, {}) else input = if args.input == '-' io.read('*a') else io.open(args.input)\read("*a") retval, code = nomsu\run(input, args.input) if compiled_output compiled_output\write("local IMMEDIATE = true;\n") compiled_output\write(code) if args.flags["-p"] nomsu.environment.print = print if args.flags["-i"] -- REPL nomsu\run('use "lib/core.nom"', "stdin") while true buff = "" while true io.write(">> ") line = io.read("*L") if line == "\n" or not line break buff ..= line if #buff == 0 break ok, ret = pcall(-> nomsu\run(buff, "stdin")) if ok and ret != nil print "= "..repr(ret) err_hand = (error_message)-> -- TODO: write properly to stderr print("#{colored.red "ERROR:"} #{colored.bright colored.yellow colored.onred (error_message or "")}") print("stack traceback:") -- TODO: properly print out the calling site of nomsu code, not just the *called* code import to_lua from require "moonscript.base" nomsu_file = io.open("nomsu.moon") nomsu_source = nomsu_file\read("*a") _, line_table = to_lua(nomsu_source) nomsu_file\close! level = 2 while true calling_fn = debug.getinfo(level) if not calling_fn then break if calling_fn.func == run then break level += 1 name = calling_fn.name if name == "run_lua_fn" then continue line = nil if metadata = nomsu.action_metadata[calling_fn.func] filename, start, stop = metadata.source\match("([^:]*):([0-9]*),([0-9]*)") if filename file = io.open(filename)\read("*a") line_no = 1 for _ in file\sub(1,tonumber(start))\gmatch("\n") do line_no += 1 offending_statement = file\sub(tonumber(start),tonumber(stop)) if #offending_statement > 50 offending_statement = offending_statement\sub(1,50).."..." offending_statement = colored.red(offending_statement) line = colored.yellow(filename..":"..tostring(line_no).."\n "..offending_statement) else line = colored.yellow(metadata.source) name = colored.bright(colored.yellow(metadata.aliases[1])) else if calling_fn.istailcall and not name name = "" if calling_fn.short_src == "./nomsu.moon" char = line_table[calling_fn.currentline] line_num = 1 for _ in nomsu_source\sub(1,char)\gmatch("\n") do line_num += 1 line = colored.cyan("#{calling_fn.short_src}:#{line_num}") name = colored.bright(colored.cyan(name or "???")) else line = colored.blue("#{calling_fn.short_src}:#{calling_fn.currentline}") name = colored.bright(colored.blue(name or "???")) _from = colored.dim colored.white "|" print(("%32s %s %s")\format(name, _from, line)) os.exit(false, true) -- Note: xpcall has a slightly different API in Lua <=5.1 vs. >=5.2, but this works -- for both APIs xpcall(run, err_hand) return NomsuCompiler