// Some basic operations defined on AST nodes, mainly converting to // strings for debugging. #include #include #include "ast.h" #include "stdlib/datatypes.h" #include "stdlib/integers.h" #include "stdlib/tables.h" #include "stdlib/text.h" #include "cordhelpers.h" CONSTFUNC const char *binop_method_name(ast_e tag) { switch (tag) { case Power: case PowerUpdate: return "power"; case Multiply: case MultiplyUpdate: return "times"; case Divide: case DivideUpdate: return "divided_by"; case Mod: case ModUpdate: return "modulo"; case Mod1: case Mod1Update: return "modulo1"; case Plus: case PlusUpdate: return "plus"; case Minus: case MinusUpdate: return "minus"; case Concat: case ConcatUpdate: return "concatenated_with"; case LeftShift: case LeftShiftUpdate: return "left_shifted"; case RightShift: case RightShiftUpdate: return "right_shifted"; case UnsignedLeftShift: case UnsignedLeftShiftUpdate: return "unsigned_left_shifted"; case UnsignedRightShift: case UnsignedRightShiftUpdate: return "unsigned_right_shifted"; case And: case AndUpdate: return "bit_and"; case Or: case OrUpdate: return "bit_or"; case Xor: case XorUpdate: return "bit_xor"; default: return NULL; } }; CONSTFUNC const char *binop_operator(ast_e tag) { switch (tag) { case Multiply: case MultiplyUpdate: return "*"; case Divide: case DivideUpdate: return "/"; case Mod: case ModUpdate: return "%"; case Plus: case PlusUpdate: return "+"; case Minus: case MinusUpdate: return "-"; case LeftShift: case LeftShiftUpdate: return "<<"; case RightShift: case RightShiftUpdate: return ">>"; case And: case AndUpdate: return "&"; case Or: case OrUpdate: return "|"; case Xor: case XorUpdate: return "^"; case Equals: return "=="; case NotEquals: return "!="; case LessThan: return "<"; case LessThanOrEquals: return "<="; case GreaterThan: return ">"; case GreaterThanOrEquals: return ">="; default: return NULL; } }; static CORD ast_list_to_xml(ast_list_t *asts); static CORD arg_list_to_xml(arg_ast_t *args); static CORD when_clauses_to_xml(when_clause_t *clauses); static CORD tags_to_xml(tag_ast_t *tags); static CORD xml_escape(CORD text); static CORD optional_tagged(const char *tag, ast_t *ast); static CORD optional_tagged_type(const char *tag, type_ast_t *ast); CORD xml_escape(CORD text) { text = CORD_replace(text, "&", "&"); text = CORD_replace(text, "<", "<"); text = CORD_replace(text, ">", ">"); return text; } CORD ast_list_to_xml(ast_list_t *asts) { CORD c = CORD_EMPTY; for (; asts; asts = asts->next) { c = CORD_cat(c, ast_to_xml(asts->ast)); } return c; } CORD arg_list_to_xml(arg_ast_t *args) { CORD c = ""; for (; args; args = args->next) { CORD arg_cord = args->name ? CORD_all("name, "\">") : ""; if (args->type) arg_cord = CORD_all(arg_cord, "", type_ast_to_xml(args->type), ""); if (args->value) arg_cord = CORD_all(arg_cord, "", ast_to_xml(args->value), ""); c = CORD_all(c, arg_cord, ""); } return CORD_cat(c, ""); } CORD when_clauses_to_xml(when_clause_t *clauses) { CORD c = CORD_EMPTY; for (; clauses; clauses = clauses->next) { c = CORD_all(c, "", ast_to_xml(clauses->pattern), ast_to_xml(clauses->body), ""); } return c; } CORD tags_to_xml(tag_ast_t *tags) { CORD c = CORD_EMPTY; for (; tags; tags = tags->next) { c = CORD_all(c, "name, "\">", arg_list_to_xml(tags->fields), ""); } return c; } CORD optional_tagged(const char *tag, ast_t *ast) { return ast ? CORD_all("<", tag, ">", ast_to_xml(ast), "") : CORD_EMPTY; } CORD optional_tagged_type(const char *tag, type_ast_t *ast) { return ast ? CORD_all("<", tag, ">", type_ast_to_xml(ast), "") : CORD_EMPTY; } CORD ast_to_xml(ast_t *ast) { if (!ast) return CORD_EMPTY; switch (ast->tag) { #define T(type, ...) case type: { auto data = ast->__data.type; (void)data; return CORD_asprintf(__VA_ARGS__); } T(Unknown, "") T(None, "") T(Bool, "", data.b ? "yes" : "no") T(Var, "%s", data.name) T(Int, "%s", data.str) T(Num, "%g", data.n) T(TextLiteral, "%r", xml_escape(data.cord)) T(TextJoin, "%r", data.lang ? CORD_all(" lang=\"", data.lang, "\"") : CORD_EMPTY, ast_list_to_xml(data.children)) T(Path, "%s", data.path) T(Declare, "%r%r", ast_to_xml(data.var), type_ast_to_xml(data.type), ast_to_xml(data.value)) T(Assign, "%r%r", ast_list_to_xml(data.targets), ast_list_to_xml(data.values)) #define BINOP(name) T(name, "<" #name ">%r %r", ast_to_xml(data.lhs), ast_to_xml(data.rhs)) BINOP(Power) BINOP(PowerUpdate) BINOP(Multiply) BINOP(MultiplyUpdate) BINOP(Divide) BINOP(DivideUpdate) BINOP(Mod) BINOP(ModUpdate) BINOP(Mod1) BINOP(Mod1Update) BINOP(Plus) BINOP(PlusUpdate) BINOP(Minus) BINOP(MinusUpdate) BINOP(Concat) BINOP(ConcatUpdate) BINOP(LeftShift) BINOP(LeftShiftUpdate) BINOP(RightShift) BINOP(RightShiftUpdate) BINOP(UnsignedLeftShift) BINOP(UnsignedLeftShiftUpdate) BINOP(UnsignedRightShift) BINOP(UnsignedRightShiftUpdate) BINOP(And) BINOP(AndUpdate) BINOP(Or) BINOP(OrUpdate) BINOP(Xor) BINOP(XorUpdate) BINOP(Compare) BINOP(Equals) BINOP(NotEquals) BINOP(LessThan) BINOP(LessThanOrEquals) BINOP(GreaterThan) BINOP(GreaterThanOrEquals) #undef BINOP T(Negative, "%r", ast_to_xml(data.value)) T(Not, "%r", ast_to_xml(data.value)) T(HeapAllocate, "%r", ast_to_xml(data.value)) T(StackReference, "%r", ast_to_xml(data.value)) T(Min, "%r%r%r", ast_to_xml(data.lhs), ast_to_xml(data.rhs), optional_tagged("key", data.key)) T(Max, "%r%r%r", ast_to_xml(data.lhs), ast_to_xml(data.rhs), optional_tagged("key", data.key)) T(Array, "%r", ast_list_to_xml(data.items)) T(Set, "%r", ast_list_to_xml(data.items)) T(Table, "%r%r
", optional_tagged("default-value", data.default_value), ast_list_to_xml(data.entries), optional_tagged("fallback", data.fallback)) T(TableEntry, "%r%r", ast_to_xml(data.key), ast_to_xml(data.value)) T(Comprehension, "%r%r%r%r%r", optional_tagged("expr", data.expr), ast_list_to_xml(data.vars), optional_tagged("iter", data.iter), optional_tagged("filter", data.filter)) T(FunctionDef, "%r%r%r", ast_to_xml(data.name), arg_list_to_xml(data.args), optional_tagged_type("return-type", data.ret_type), ast_to_xml(data.body)) T(ConvertDef, "%r%r%r", arg_list_to_xml(data.args), optional_tagged_type("return-type", data.ret_type), ast_to_xml(data.body)) T(Lambda, "%r%r%r)", arg_list_to_xml(data.args), optional_tagged_type("return-type", data.ret_type), ast_to_xml(data.body)) T(FunctionCall, "%r%r", ast_to_xml(data.fn), arg_list_to_xml(data.args)) T(MethodCall, "%r%s%r", ast_to_xml(data.self), data.name, arg_list_to_xml(data.args)) T(Block, "%r", ast_list_to_xml(data.statements)) T(For, "%r%r%r%r%r", ast_list_to_xml(data.vars), optional_tagged("iterable", data.iter), optional_tagged("body", data.body), optional_tagged("empty", data.empty)) T(While, "%r%r", optional_tagged("condition", data.condition), optional_tagged("body", data.body)) T(Repeat, "%r", optional_tagged("body", data.body)) T(If, "%r%r%r", optional_tagged("condition", data.condition), optional_tagged("body", data.body), optional_tagged("else", data.else_body)) T(When, "%r%r%r", ast_to_xml(data.subject), when_clauses_to_xml(data.clauses), optional_tagged("else", data.else_body)) T(Reduction, "%r", xml_escape(binop_method_name(data.op)), optional_tagged("key", data.key), optional_tagged("iterable", data.iter)) T(Skip, "%r", data.target) T(Stop, "%r", data.target) T(PrintStatement, "%r", ast_list_to_xml(data.to_print)) T(Pass, "") T(Defer, "%r", ast_to_xml(data.body)) T(Return, "%r", ast_to_xml(data.value)) T(Extern, "%r", data.name, type_ast_to_xml(data.type)) T(StructDef, "%r%r", data.name, arg_list_to_xml(data.fields), ast_to_xml(data.namespace)) T(EnumDef, "%r%r", data.name, tags_to_xml(data.tags), ast_to_xml(data.namespace)) T(LangDef, "%r", data.name, ast_to_xml(data.namespace)) T(Index, "%r%r", optional_tagged("indexed", data.indexed), optional_tagged("index", data.index)) T(FieldAccess, "%r", data.field, ast_to_xml(data.fielded)) T(Optional, "%r", ast_to_xml(data.value)) T(NonOptional, "%r", ast_to_xml(data.value)) T(DocTest, "%r%r", optional_tagged("expression", data.expr), optional_tagged("expected", data.expected)) T(Use, "%r%r", optional_tagged("var", data.var), xml_escape(data.path)) T(InlineCCode, "%r", xml_escape(data.code)) T(Deserialize, "%r%r", type_ast_to_xml(data.type), ast_to_xml(data.value)) T(Extend, "%r", data.name, ast_to_xml(data.body)) default: return "???"; #undef T } } const char *ast_to_xml_str(ast_t *ast) { return CORD_to_const_char_star(ast_to_xml(ast)); } const char *ast_source(ast_t *ast) { if (!ast) return NULL; size_t len = (size_t)(ast->end - ast->start); char *source = GC_MALLOC_ATOMIC(len + 1); memcpy(source, ast->start, len); source[len] = '\0'; return source; } CORD type_ast_to_xml(type_ast_t *t) { if (!t) return "NULL"; switch (t->tag) { #define T(type, ...) case type: { auto data = t->__data.type; (void)data; return CORD_asprintf(__VA_ARGS__); } T(UnknownTypeAST, "") T(VarTypeAST, "%s", data.name) T(PointerTypeAST, "%r", data.is_stack ? "yes" : "no", type_ast_to_xml(data.pointed)) T(ArrayTypeAST, "%r", type_ast_to_xml(data.item)) T(SetTypeAST, "%r", type_ast_to_xml(data.item)) T(TableTypeAST, "%r %r", type_ast_to_xml(data.key), type_ast_to_xml(data.value)) T(FunctionTypeAST, "%r %r", arg_list_to_xml(data.args), type_ast_to_xml(data.ret)) T(OptionalTypeAST, "%r", data.type) #undef T default: return CORD_EMPTY; } } PUREFUNC bool is_idempotent(ast_t *ast) { switch (ast->tag) { case Int: case Bool: case Num: case Var: case None: case TextLiteral: return true; case Index: { auto index = Match(ast, Index); return is_idempotent(index->indexed) && index->index != NULL && is_idempotent(index->index); } case FieldAccess: { auto access = Match(ast, FieldAccess); return is_idempotent(access->fielded); } default: return false; } } void _visit_topologically(ast_t *ast, Table_t definitions, Table_t *visited, Closure_t fn) { void (*visit)(void*, ast_t*) = (void*)fn.fn; if (ast->tag == StructDef) { auto def = Match(ast, StructDef); if (Table$str_get(*visited, def->name)) return; Table$str_set(visited, def->name, (void*)_visit_topologically); for (arg_ast_t *field = def->fields; field; field = field->next) { if (field->type && field->type->tag == VarTypeAST) { const char *field_type_name = Match(field->type, VarTypeAST)->name; ast_t *dependency = Table$str_get(definitions, field_type_name); if (dependency) { _visit_topologically(dependency, definitions, visited, fn); } } } visit(fn.userdata, ast); } else if (ast->tag == EnumDef) { auto def = Match(ast, EnumDef); if (Table$str_get(*visited, def->name)) return; Table$str_set(visited, def->name, (void*)_visit_topologically); for (tag_ast_t *tag = def->tags; tag; tag = tag->next) { for (arg_ast_t *field = tag->fields; field; field = field->next) { if (field->type && field->type->tag == VarTypeAST) { const char *field_type_name = Match(field->type, VarTypeAST)->name; ast_t *dependency = Table$str_get(definitions, field_type_name); if (dependency) { _visit_topologically(dependency, definitions, visited, fn); } } } } visit(fn.userdata, ast); } else if (ast->tag == LangDef) { auto def = Match(ast, LangDef); if (Table$str_get(*visited, def->name)) return; visit(fn.userdata, ast); } else { visit(fn.userdata, ast); } } void visit_topologically(ast_list_t *asts, Closure_t fn) { // Visit each top-level statement in topological order: // - 'use' statements first // - then typedefs // - visiting typedefs' dependencies first // - then function/variable declarations Table_t definitions = {}; for (ast_list_t *stmt = asts; stmt; stmt = stmt->next) { if (stmt->ast->tag == StructDef) { auto def = Match(stmt->ast, StructDef); Table$str_set(&definitions, def->name, stmt->ast); } else if (stmt->ast->tag == EnumDef) { auto def = Match(stmt->ast, EnumDef); Table$str_set(&definitions, def->name, stmt->ast); } else if (stmt->ast->tag == LangDef) { auto def = Match(stmt->ast, LangDef); Table$str_set(&definitions, def->name, stmt->ast); } } void (*visit)(void*, ast_t*) = (void*)fn.fn; Table_t visited = {}; // First: 'use' statements in order: for (ast_list_t *stmt = asts; stmt; stmt = stmt->next) { if (stmt->ast->tag == Use || (stmt->ast->tag == Declare && Match(stmt->ast, Declare)->value->tag == Use)) visit(fn.userdata, stmt->ast); } // Then typedefs in topological order: for (ast_list_t *stmt = asts; stmt; stmt = stmt->next) { if (stmt->ast->tag == StructDef || stmt->ast->tag == EnumDef || stmt->ast->tag == LangDef) _visit_topologically(stmt->ast, definitions, &visited, fn); } // Then everything else in order: for (ast_list_t *stmt = asts; stmt; stmt = stmt->next) { if (!(stmt->ast->tag == StructDef || stmt->ast->tag == EnumDef || stmt->ast->tag == LangDef || stmt->ast->tag == Use || (stmt->ast->tag == Declare && Match(stmt->ast, Declare)->value->tag == Use))) { visit(fn.userdata, stmt->ast); } } } CONSTFUNC bool is_binary_operation(ast_t *ast) { switch (ast->tag) { case BINOP_CASES: return true; default: return false; } } CONSTFUNC bool is_update_assignment(ast_t *ast) { switch (ast->tag) { case PowerUpdate: case MultiplyUpdate: case DivideUpdate: case ModUpdate: case Mod1Update: case PlusUpdate: case MinusUpdate: case ConcatUpdate: case LeftShiftUpdate: case UnsignedLeftShiftUpdate: case RightShiftUpdate: case UnsignedRightShiftUpdate: case AndUpdate: case OrUpdate: case XorUpdate: return true; default: return false; } } CONSTFUNC ast_e binop_tag(ast_e tag) { switch (tag) { case PowerUpdate: return Power; case MultiplyUpdate: return Multiply; case DivideUpdate: return Divide; case ModUpdate: return Mod; case Mod1Update: return Mod1; case PlusUpdate: return Plus; case MinusUpdate: return Minus; case ConcatUpdate: return Concat; case LeftShiftUpdate: return LeftShift; case UnsignedLeftShiftUpdate: return UnsignedLeftShift; case RightShiftUpdate: return RightShift; case UnsignedRightShiftUpdate: return UnsignedRightShift; case AndUpdate: return And; case OrUpdate: return Or; case XorUpdate: return Xor; default: return Unknown; } } // vim: ts=4 sw=0 et cino=L2,l1,(0,W4,m1,\:0