nomsu/nomsu.4.peg

233 lines
9.0 KiB
Plaintext
Raw Normal View History

2018-09-12 15:31:59 -07:00
-- Nomsu version 4
2018-12-18 19:30:01 -08:00
file <-
2018-09-12 15:31:59 -07:00
{:curr_indent: ' '* :}
(((action / expression / inline_block / indented_block) eol !.)
/ file_chunks / empty_block)
{:curr_indent: %nil :}
!.
2018-12-18 19:30:01 -08:00
shebang <- "#!" (!"nomsu" [^%nl])* "nomsu" ws+ "-V" ws* [0-9.]+ [^%nl]* (%nl / !.)
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
eof <- !.
2018-12-18 19:30:01 -08:00
file_chunks (FileChunks) <-
{:shebang: shebang :}?
(top_block (nl_nodent section_division top_block)*)
2018-09-12 15:31:59 -07:00
blank_lines?
unexpected_indent? unexpected_chunk?
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
top_block (Block) <-
2019-01-18 20:40:18 -08:00
((blank_lines nodent) / (comment nl_nodent))? statement (nl_nodent statement)*
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
empty_block (Block) <-
2018-09-12 15:31:59 -07:00
comment? blank_lines?
2018-12-18 19:30:01 -08:00
nodent <- (unexpected_indent [^%nl]* / =curr_indent)
indent <- {~ =curr_indent (ws / (%tab -> ' '))+ ~}
blank_lines <- %nl ((nodent comment / ws*) %nl)*
eol <- ws* eol_comment? (!. / &%nl)
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
nl_nodent <- blank_lines nodent
nl_indent <- blank_lines tab_error? {:curr_indent: indent :} (comment nl_nodent)*
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
comment (Comment) <-
"#" {~ [^%nl]* (%nl+ (indent -> '') [^%nl]*)* (%nl &%nl)* ~}
2018-12-18 19:30:01 -08:00
eol_comment (Comment) <-
2018-09-12 15:31:59 -07:00
"#" {[^%nl]*}
2018-12-18 19:30:01 -08:00
unexpected_code <- ws* _unexpected_code
_unexpected_code (Error) <-
{:error: {~ [^%nl]+ -> "Couldn't parse this code." ~} :}
2018-12-18 19:30:01 -08:00
unexpected_chunk (Error) <-
{:error: {~ .+ -> "Couldn't parse this chunk of code." ~} :}
2018-12-18 19:30:01 -08:00
unexpected_indent (Error) <-
{:error: {~ (=curr_indent ws+) -> "This indentation is messed up." ~} :}
{:hint: {~ '' -> 'This line should either have the same indentation as the line above it, or exactly 4 spaces more.' ~} :}
2018-12-18 19:30:01 -08:00
missing_paren_err (Error) <-
2018-09-12 15:31:59 -07:00
{:error: {~ eol -> 'Line ended without finding a closing )-parenthesis' ~} :}
{:hint: {~ '' -> 'Put a ")" here' ~} :}
2018-12-18 19:30:01 -08:00
missing_quote_err (Error) <-
2018-09-12 15:31:59 -07:00
{:error: {~ eol -> 'Line ended before finding a closing double quotation mark' ~} :}
{:hint: {~ "" -> "Put a quotation mark here" ~} :}
2018-12-18 19:30:01 -08:00
missing_bracket_error (Error) <-
2018-09-12 15:31:59 -07:00
{:error: {~ eol -> "Line ended before finding a closing ]-bracket" ~} :}
{:hint: {~ '' -> 'Put a "]" here' ~} :}
2018-12-18 19:30:01 -08:00
missing_brace_error (Error) <-
2018-09-12 15:31:59 -07:00
{:error: {~ eol -> "Line ended before finding a closing }-brace" ~} :}
{:hint: {~ '' -> 'Put a "}" here' ~} :}
2018-12-18 19:30:01 -08:00
disallowed_interpolation (Error) <-
{:error: {~ ("\" ('\:' / '(..)' / '[..]' / '{..}') (%nl (&(%nl) / =curr_indent ' ' [^%nl]*))*) ->
"Sorry, indented text interpolations are not currently supported on the first line of multi-line text." ~} :}
{:hint: {~ '' -> 'Move the code for the first line of text to the next line by ending this line with "\" and starting the next line indented with "..", followed by the code for the first line.' ~} :}
2018-12-18 19:30:01 -08:00
tab_error (Error) <-
&(=curr_indent %tab)
{:error: {~ '' -> 'Tabs are not allowed for indentation.' ~} :}
{:hint: {~ '' -> 'Use spaces instead of tabs.' ~} :}
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
section_division <- ("~")^+3 eol
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
inline_block <-
"(" ws* inline_block ws* (eof / ")") / raw_inline_block
2018-12-18 19:30:01 -08:00
raw_inline_block (Block) <-
2018-09-12 15:31:59 -07:00
(!"::") ":" ws* ((inline_statement (ws* ";" ws* inline_statement)*) / !(eol nl_indent))
2018-12-18 19:30:01 -08:00
indented_block (Block) <-
":" eol nl_indent statement (nl_nodent statement)*
2018-09-12 15:31:59 -07:00
(%nl (ws* %nl)* nodent (comment / eol / unexpected_code))*
{:curr_indent: %nil :}
2018-12-18 19:30:01 -08:00
statement <-
2018-09-12 15:31:59 -07:00
(action / expression) (eol / unexpected_code)
2018-12-18 19:30:01 -08:00
inline_statement <- (inline_action / inline_expression)
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
noindex_inline_expression <-
2018-09-12 15:31:59 -07:00
number / variable / inline_text / inline_list / inline_dict / inline_nomsu
/ ( "("
ws* (inline_action / inline_expression) ws*
(ws* ',' ws* (inline_action / inline_expression) ws*)*
(")" / eof / missing_paren_err / unexpected_code)
2018-09-12 15:31:59 -07:00
)
2018-12-18 19:30:01 -08:00
inline_expression <- index_chain / noindex_inline_expression
indented_expression <-
2018-09-14 19:17:09 -07:00
indented_text / indented_nomsu / indented_list / indented_dict / ({|
"(..)" eol nl_indent
2018-09-12 15:31:59 -07:00
(action / expression) (eol / unexpected_code)
(%nl (ws* %nl)* nodent (comment / eol / unexpected_code))*
{:curr_indent: %nil :}
|} -> unpack)
2018-12-18 19:30:01 -08:00
expression <-
2018-09-12 15:31:59 -07:00
inline_expression / indented_expression
2018-12-18 19:30:01 -08:00
inline_nomsu (EscapedNomsu) <- "\" (inline_expression / inline_block)
indented_nomsu (EscapedNomsu) <-
2018-09-12 15:31:59 -07:00
"\" (noindex_inline_expression / inline_block / indented_expression / indented_block)
2018-12-18 19:30:01 -08:00
index_chain (IndexChain) <-
2018-09-12 15:31:59 -07:00
noindex_inline_expression ("." (text_word / noindex_inline_expression))+
2018-12-18 19:30:01 -08:00
inline_action <- inline_methodcall / _inline_action
inline_methodcall (MethodCall) <-
(inline_expression / "(" inline_block ")") ws* "::" ws* _inline_action
2018-09-12 15:31:59 -07:00
-- Actions need either at least 1 word, or at least 2 tokens
2018-12-18 19:30:01 -08:00
_inline_action (Action) <-
2018-09-12 15:31:59 -07:00
!section_division
( (inline_arg (ws* (inline_arg / word))+)
/ (word (ws* (inline_arg / word))*))
(ws* inline_block)?
2018-12-18 19:30:01 -08:00
inline_arg <- inline_expression / inline_block / "(" ws* ")"
2018-12-18 19:30:01 -08:00
action <- methodcall / _action
methodcall (MethodCall) <-
(expression / "(" inline_block ")" / indented_block)
((ws* "\")? eol nl_nodent "..")? ws* "::" ((ws* "\")? eol nl_nodent "..")? ws*
_action
2018-12-18 19:30:01 -08:00
_action (Action) <-
2018-09-12 15:31:59 -07:00
!section_division
( (arg (((ws* "\")? eol nl_nodent "..")? ws* (arg / word))+)
/ (word (((ws* "\")? eol nl_nodent "..")? ws* (arg / word))*))
2018-12-18 19:30:01 -08:00
arg <- expression / inline_block / indented_block / "(" ws* ")"
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
word <- !number { operator_char+ / ident_char+ }
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
text_word (Text) <- word
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
inline_text (Text) <-
2018-09-14 19:17:09 -07:00
!(indented_text)
'"' _inline_text* ('"' / eof / missing_quote_err / unexpected_code)
2018-12-18 19:30:01 -08:00
_inline_text <-
{~ (('\"' -> '"') / ('\\' -> '\') / escaped_char / text_char+)+ ~}
/ inline_text_interpolation / illegal_char
2018-12-18 19:30:01 -08:00
inline_text_interpolation <-
2018-09-12 15:31:59 -07:00
"\" (
2018-09-14 19:17:09 -07:00
variable / inline_list / inline_dict
2018-09-12 15:31:59 -07:00
/ ("("
ws* (inline_action / inline_expression) ws*
(ws* ',' ws* (inline_action / inline_expression) ws*)*
(")" / eof / missing_paren_err / unexpected_code))
2018-09-12 15:31:59 -07:00
)
2018-12-18 19:30:01 -08:00
text_char <- %utf8_char / !["\] %print / %tab
illegal_char (Error) <-
{:error: {~ (!(%nl / %tab / %print) .) -> "Illegal unprintable character here (it may not be visible, but it's there)" ~} :}
{:hint: {~ '' -> "This sort of thing can happen when copying and pasting code. Try deleting and retyping the code." ~} :}
2018-12-18 19:30:01 -08:00
nonterminal_quote <-
'"' &([^%nl] / %nl+ =curr_indent)
2018-12-18 19:30:01 -08:00
indented_text (Text) <-
'"'
_inline_text*
(('\' %nl+ {:curr_indent: indent :} ('..')?)
/ disallowed_interpolation? {%nl+} {:curr_indent: indent :})
(indented_plain_text / text_interpolation / illegal_char / {~ %nl+ (=curr_indent -> "") [ ]* ~})*
('"' eol / eof / missing_quote_err)
{:curr_indent: %nil :}
2018-09-12 15:31:59 -07:00
-- Tracking text-lines-within-indented-text as separate objects allows for better debugging line info
2018-12-18 19:30:01 -08:00
indented_plain_text (Text) <-
2018-09-14 19:17:09 -07:00
{~
((("\" blank_lines =curr_indent "..") -> "") / ('\\' -> '\')
/ (!text_interpolation (escaped_char / '\'))
/ (nonterminal_quote / text_char)+)+
2018-09-14 19:17:09 -07:00
~}
2018-12-18 19:30:01 -08:00
text_interpolation <-
inline_text_interpolation / ("\" (indented_expression / indented_block) (blank_lines =curr_indent "..")?)
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
number (Number) <-
(&("-"? "0x" [0-9a-fA-F]+) {:hex: '' -> 'yes' :})?
(("-"? (([0-9]+ "." [0-9]+) / ("." [0-9]+) / "0x" [0-9a-fA-F]+ / ([0-9]+)))-> tonumber)
2018-09-12 15:31:59 -07:00
-- Variables can be nameless (i.e. just %) and can only contain identifier chars.
-- This ensures you don't get weird parsings of `%x+%y` or `%'s thing`.
2018-12-18 19:30:01 -08:00
variable (Var) <- "%" {ident_char*}
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
inline_list (List) <-
2018-09-12 15:31:59 -07:00
!('[..]')
"[" ws*
(inline_list_item (ws* ',' ws* inline_list_item)* (ws* ',')?)? ws*
("]" / eof / (","? (missing_bracket_error / unexpected_code)))
2018-12-18 19:30:01 -08:00
indented_list (List) <-
2018-09-12 15:31:59 -07:00
"[..]" eol nl_indent
list_line (nl_nodent list_line)*
2018-09-12 15:31:59 -07:00
(%nl (ws* %nl)* nodent (comment / eol / unexpected_code))*
(","? unexpected_code)?
2018-12-18 19:30:01 -08:00
list_line <-
2018-09-12 15:31:59 -07:00
(inline_list_item ws* "," ws*)+ eol
/ (inline_list_item ws* "," ws*)* (action / expression / inline_block / indented_block) eol
2018-12-18 19:30:01 -08:00
inline_list_item <- inline_action / inline_expression / inline_block
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
inline_dict (Dict) <-
2018-09-12 15:31:59 -07:00
!('{..}')
"{" ws*
(inline_dict_entry (ws* ',' ws* inline_dict_entry)*)? ws*
("}" / eof / (","? (missing_brace_error / unexpected_code)))
2018-12-18 19:30:01 -08:00
indented_dict (Dict) <-
2018-09-12 15:31:59 -07:00
"{..}" eol nl_indent
dict_line (nl_nodent dict_line)*
2018-09-12 15:31:59 -07:00
(%nl (ws* %nl)* nodent (comment / eol / unexpected_code))*
(","? unexpected_code)?
2018-12-18 19:30:01 -08:00
dict_line <-
2018-09-12 15:31:59 -07:00
(inline_dict_entry ws* "," ws*)+ eol
/ (inline_dict_entry ws* "," ws*)* dict_entry eol
2018-12-18 19:30:01 -08:00
_dict_entry(DictEntry) <-
2018-09-12 15:31:59 -07:00
dict_key (ws* ":" ws* (action / expression))?
2018-12-18 19:30:01 -08:00
dict_entry <-
_dict_entry / inline_block / indented_block
2018-12-18 19:30:01 -08:00
_inline_dict_entry(DictEntry) <-
2018-09-12 15:31:59 -07:00
dict_key (ws* ":" ws* (inline_action / inline_expression)?)?
2018-12-18 19:30:01 -08:00
inline_dict_entry <-
_inline_dict_entry / inline_block
2018-12-18 19:30:01 -08:00
dict_key <-
2018-09-12 15:31:59 -07:00
text_word / inline_expression
2018-12-18 19:30:01 -08:00
operator_char <- ['`~!@$^&*+=|<>?/-]
ident_char <- [a-zA-Z0-9_] / %utf8_char
ws <- " "
2018-09-12 15:31:59 -07:00
2018-12-18 19:30:01 -08:00
escaped_char <-
2018-09-12 15:31:59 -07:00
("\"->'') (
(([xX]->'') ((({[0-9a-fA-F]^2} %number_16) -> tonumber) -> tochar))
/ ((([0-9] [0-9]^-2) -> tonumber) -> tochar)
/ ("a"->ascii_7) / ("b"->ascii_8) / ("t"->ascii_9) / ("n"->ascii_10)
/ ("v"->ascii_11) / ("f"->ascii_12) / ("r"->ascii_13)
)