tomo/tomo.c

494 lines
19 KiB
C

// The main program that runs compilation
#include <ctype.h>
#include <gc.h>
#include <gc/cord.h>
#include <libgen.h>
#include <printf.h>
#include <stdio.h>
#include <stdlib.h>
#include <sys/stat.h>
#include "ast.h"
#include "builtins/array.h"
#include "builtins/datatypes.h"
#include "builtins/text.h"
#include "compile.h"
#include "parse.h"
#include "repl.h"
#include "typecheck.h"
#include "types.h"
#define ENV_CORD(name) CORD_from_char_star(getenv(name) ? getenv(name) : "")
#define CORD_RUN(...) ({ CORD _cmd = CORD_all(__VA_ARGS__); if (verbose) CORD_printf("\x1b[33m%r\x1b[m\n", _cmd); popen(CORD_to_const_char_star(_cmd), "w"); })
typedef enum { MODE_TRANSPILE = 0, MODE_COMPILE_OBJ = 1, MODE_COMPILE_SHARED_OBJ = 2, MODE_COMPILE_EXE = 3, MODE_RUN = 4 } mode_e;
static bool verbose = false;
static bool show_codegen = false;
static CORD autofmt, cconfig, cflags, ldlibs, ldflags, cc;
static int transpile_header(env_t *base_env, const char *filename, bool force_retranspile);
static int transpile_code(env_t *base_env, const char *filename, bool force_retranspile);
static int compile_object_file(const char *filename, bool force_recompile);
static int compile_executable(env_t *base_env, const char *filename, CORD object_files);
static void build_file_dependency_graph(const char *filename, table_t *to_compile, table_t *to_link);
int main(int argc, char *argv[])
{
mode_e mode = MODE_RUN;
int after_flags = 1;
const char *libname = NULL;
for (int i = 1; i < argc; i++) {
if (streq(argv[i], "-t")) {
mode = MODE_TRANSPILE;
} else if (streq(argv[i], "-c")) {
mode = MODE_COMPILE_OBJ;
} else if (strncmp(argv[i], "-s=", 3) == 0) {
mode = MODE_COMPILE_SHARED_OBJ;
libname = argv[i] + strlen("-s=");
} else if (streq(argv[i], "-s")) {
mode = MODE_COMPILE_SHARED_OBJ;
if (i+1 >= argc)
errx(1, "You must provide at least one file to build a shared library");
libname = file_base_name(argv[i+1]);
} else if (streq(argv[i], "-r")) {
mode = MODE_RUN;
} else if (streq(argv[i], "-e")) {
mode = MODE_COMPILE_EXE;
} else if (streq(argv[i], "-h") || streq(argv[i], "--help")) {
printf("Usage: %s | %s [-r] file.tm args... | %s (-t|-c|-s) file1.tm file2.tm...\n", argv[0], argv[0], argv[0]);
return 0;
} else if (streq(argv[i], "-u")) {
// Uninstall libraries:
for (int j = i + 1; j < argc; j++) {
system(heap_strf("rm -rvf ~/.local/src/tomo/%s ~/.local/include/tomo/lib%s.h ~/.local/lib/tomo/lib%s.so",
argv[j], argv[j], argv[j]));
}
return 0;
} else if (strchr(argv[i], '=')) {
while (argv[i][0] == '-')
++argv[i];
char *eq = strchr(argv[i], '=');
*eq = '\0';
for (char *p = argv[i]; *p; p++)
*p = toupper(*p);
setenv(argv[i], eq + 1, 1);
} else {
after_flags = i;
break;
}
}
if (register_printf_specifier('T', printf_type, printf_pointer_size))
errx(1, "Couldn't set printf specifier");
if (register_printf_specifier('W', printf_ast, printf_pointer_size))
errx(1, "Couldn't set printf specifier");
setenv("TOMO_IMPORT_PATH", "~/.local/src/tomo:.", 0);
setenv("TOMO_LIB_PATH", "~/.local/lib/tomo:.", 0);
CORD home = ENV_CORD("HOME");
autofmt = ENV_CORD("AUTOFMT");
if (!autofmt) autofmt = "indent -kr -l100 -nbbo -nut -sob";
if (!autofmt[0]) autofmt = "cat";
verbose = (getenv("VERBOSE") && (streq(getenv("VERBOSE"), "1") || streq(getenv("VERBOSE"), "2")));
show_codegen = (getenv("VERBOSE") && streq(getenv("VERBOSE"), "2"));
if (after_flags >= argc) {
repl();
return 0;
}
cconfig = ENV_CORD("CCONFIG");
if (!cconfig)
cconfig = "-std=c11 -fdollars-in-identifiers -fsanitize=signed-integer-overflow -fno-sanitize-recover"
" -D_XOPEN_SOURCE=700 -D_POSIX_C_SOURCE=200809L -D_DEFAULT_SOURCE";
CORD optimization = ENV_CORD("O");
if (!optimization) optimization = CORD_EMPTY;
else optimization = CORD_all("-O", optimization);
cflags = ENV_CORD("CFLAGS");
if (!cflags)
cflags = CORD_all(cconfig, " ", optimization, " -fPIC -ggdb -I./include -I'", home, "/.local/include' -D_DEFAULT_SOURCE");
ldflags = CORD_all("-Wl,-rpath='$ORIGIN',-rpath='", home, "/.local/lib/tomo' -L. -L'", home, "/.local/lib/tomo'");
ldlibs = "-lgc -lcord -lm -ltomo";
cc = ENV_CORD("CC");
if (!cc) cc = "cc";
CORD compilation_library_name = CORD_EMPTY;
env_t *env = new_compilation_unit(&compilation_library_name);
table_t dependency_files = {};
table_t to_link = {};
for (int i = after_flags; i < argc; i++) {
const char *resolved = resolve_path(argv[i], ".", ".");
if (!resolved) errx(1, "Couldn't resolve path: %s", argv[i]);
build_file_dependency_graph(resolved, &dependency_files, &to_link);
if (mode == MODE_RUN) break;
}
int status;
// Non-lazily (re)compile header files for each source file passed to the compiler:
for (int i = after_flags; i < argc; i++) {
const char *filename = argv[i];
status = transpile_header(env, filename, true);
if (status != 0) return status;
}
// Lazily (re)compile all the header files:
for (int64_t i = 0; i < dependency_files.entries.length; i++) {
const char *filename = *(char**)(dependency_files.entries.data + i*dependency_files.entries.stride);
status = transpile_header(env, filename, false);
if (status != 0) return status;
}
env->imports = new(table_t);
// Non-lazily (re)compile object files for each source file passed to the compiler:
for (int i = after_flags; i < argc; i++) {
const char *filename = argv[i];
status = transpile_code(env, filename, true);
if (status != 0) return status;
status = compile_object_file(filename, true);
if (status != 0) return status;
if (mode == MODE_RUN) break;
}
if (mode == MODE_COMPILE_OBJ)
return 0;
// Lazily (re)compile object files for each dependency:
for (int64_t i = 0; i < dependency_files.entries.length; i++) {
const char *filename = *(char**)(dependency_files.entries.data + i*dependency_files.entries.stride);
status = transpile_code(env, filename, false);
if (status != 0) return status;
status = compile_object_file(filename, false);
if (status != 0) return status;
}
CORD object_files = CORD_EMPTY;
for (int64_t i = 0; i < dependency_files.entries.length; i++) {
const char *filename = *(char**)(dependency_files.entries.data + i*dependency_files.entries.stride);
object_files = CORD_all(object_files, filename, ".o ");
}
for (int64_t i = 0; i < to_link.entries.length; i++) {
const char *lib = *(char**)(to_link.entries.data + i*to_link.entries.stride);
ldlibs = CORD_all(ldlibs, " ", lib);
}
// For shared objects, link up all the object files into one .so file:
if (mode == MODE_COMPILE_SHARED_OBJ) {
char *libname_id = heap_str(libname);
for (char *p = libname_id; *p; p++) {
if (!isalnum(*p) && *p != '_' && *p != '$')
*p = '_';
}
compilation_library_name = libname_id;
// Build a "libwhatever.h" header that loads all the headers:
const char *h_filename = heap_strf("lib%s.h", libname);
FILE *header_prog = CORD_RUN(autofmt ? autofmt : "cat", " 2>/dev/null >", h_filename);
fputs("#pragma once\n", header_prog);
for (int i = after_flags; i < argc; i++) {
const char *filename = argv[i];
file_t *f = load_file(filename);
if (!f) errx(1, "No such file: %s", filename);
ast_t *ast = parse_file(f, NULL);
if (!ast) errx(1, "Could not parse %s", f);
env->namespace = new(namespace_t, .name=file_base_name(filename));
for (ast_list_t *stmt = Match(ast, Block)->statements; stmt; stmt = stmt->next) {
if (stmt->ast->tag == Import || (stmt->ast->tag == Declare && Match(stmt->ast, Declare)->value->tag == Import))
continue;
CORD h = compile_statement_header(env, stmt->ast);
if (h) CORD_put(h, header_prog);
}
}
if (pclose(header_prog) == -1)
errx(1, "Failed to run autoformat program on header file: %s", autofmt);
// Also output a "libwhatever.files" file that lists the .tm files it used:
const char *files_filename = heap_strf("lib%s.files", libname);
FILE *files_file = fopen(files_filename, "w");
if (!files_file)
errx(1, "Couldn't open file: %s", files_filename);
for (int i = after_flags; i < argc; i++) {
fprintf(files_file, "%s\n", argv[i]);
}
if (fclose(files_file))
errx(1, "Failed to close file: %s", files_filename);
// Build up a list of symbol renamings:
unlink("symbol_renames.txt");
FILE *prog;
for (int i = after_flags; i < argc; i++) {
prog = CORD_RUN("nm -U -fjust-symbols ", argv[i], ".o | sed 's/.*/\\0 ", libname_id, "$\\0/' >>symbol_renames.txt");
status = pclose(prog);
if (!WIFEXITED(status) || WEXITSTATUS(status) != 0)
errx(WEXITSTATUS(status), "Failed to create symbol rename table with `nm` and `sed`");
}
CORD outfile = CORD_all("lib", libname, ".so");
prog = CORD_RUN(cc, " ", cflags, " ", ldflags, " ", ldlibs, " -Wl,-soname=", outfile, " -shared ", object_files, " -o ", outfile);
status = pclose(prog);
if (!WIFEXITED(status) || WEXITSTATUS(status) != 0)
errx(WEXITSTATUS(status), "Failed to compile shared library file");
if (verbose)
CORD_printf("Compiled to %r\n", outfile);
prog = CORD_RUN("objcopy --redefine-syms=symbol_renames.txt lib", libname, ".so");
status = pclose(prog);
if (!WIFEXITED(status) || WEXITSTATUS(status) != 0)
errx(WEXITSTATUS(status), "Failed to run `objcopy` to add library prefix to symbols");
prog = CORD_RUN("patchelf --rename-dynamic-symbols symbol_renames.txt lib", libname, ".so");
status = pclose(prog);
if (!WIFEXITED(status) || WEXITSTATUS(status) != 0)
errx(WEXITSTATUS(status), "Failed to run `patchelf` to rename dynamic symbols with library prefix");
if (verbose)
CORD_printf("Successfully renamed symbols with library prefix!\n");
unlink("symbol_renames.txt");
printf("Do you want to install your library? [Y/n] ");
fflush(stdout);
switch (getchar()) {
case 'y': case 'Y': case '\n': {
system(heap_strf("mkdir -p ~/.local/lib/tomo ~/.local/include/tomo ~/.local/src/tomo/'%s'", libname));
system(heap_strf("cp -rv . ~/.local/src/tomo/'%s'", libname));
system(heap_strf("ln -sfv '../../src/tomo/%s/lib%s.so' ~/.local/lib/tomo/'lib%s.so'", libname, libname, libname));
system(heap_strf("ln -sfv '../../src/tomo/%s/lib%s.h' ~/.local/include/tomo/'lib%s.h'", libname, libname, libname));
}
default: break;
}
return 0;
} else {
const char *filename = argv[after_flags];
int executable_status = compile_executable(env, filename, object_files);
if (mode == MODE_COMPILE_EXE || executable_status != 0)
return executable_status;
char *exe_name = heap_strn(filename, strlen(filename) - strlen(".tm"));
int num_args = argc - after_flags - 1;
char *prog_args[num_args + 2];
prog_args[0] = exe_name;
for (int i = 0; i < num_args; i++)
prog_args[i+1] = argv[after_flags+1+i];
prog_args[num_args+1] = NULL;
execv(exe_name, prog_args);
errx(1, "Failed to run compiled program");
}
}
void build_file_dependency_graph(const char *filename, table_t *to_compile, table_t *to_link)
{
if (Table$str_get(*to_compile, filename))
return;
Table$str_set(to_compile, filename, filename);
size_t len = strlen(filename);
assert(strncmp(filename + len - 3, ".tm", 3) == 0);
file_t *f = load_file(filename);
if (!f)
errx(1, "No such file: %s", filename);
ast_t *ast = parse_file(f, NULL);
if (!ast)
errx(1, "Could not parse %s", f);
char *file_dir = realpath(filename, NULL);
dirname(file_dir);
for (ast_list_t *stmt = Match(ast, Block)->statements; stmt; stmt = stmt->next) {
ast_t *stmt_ast = stmt->ast;
if (stmt_ast->tag == Declare)
stmt_ast = Match(stmt_ast, Declare)->value;
if (stmt_ast->tag == Import) {
const char *path = Match(stmt_ast, Import)->path;
path = resolve_path(heap_strf("%s.tm", path), filename, "");
if (!path) errx(1, "Couldn't resolve import: %s", path);
if (Table$str_get(*to_compile, path))
continue;
Table$str_set(to_compile, path, path);
build_file_dependency_graph(path, to_compile, to_link);
} else if (stmt_ast->tag == Use) {
const char *name = Match(stmt_ast, Use)->name;
if (strncmp(name, "-l", 2) == 0) {
Table$str_set(to_link, name, name);
} else {
const char *libfile = resolve_path(heap_strf("%s/lib%s.so", name, name), filename, getenv("TOMO_IMPORT_PATH"));
if (!libfile) errx(1, "Couldn't resolve path: %s", name);
const char *lib = heap_strf("-l%s", name);
Table$str_set(to_link, lib, lib);
}
}
}
free(file_dir);
}
static bool is_stale(const char *filename, const char *relative_to)
{
struct stat target_stat;
if (stat(filename, &target_stat))
return true;
struct stat relative_to_stat;
if (stat(relative_to, &relative_to_stat))
errx(1, "File doesn't exist: %s", relative_to);
return target_stat.st_mtime < relative_to_stat.st_mtime;
}
int transpile_header(env_t *base_env, const char *filename, bool force_retranspile)
{
const char *h_filename = heap_strf("%s.h", filename);
if (!force_retranspile && !is_stale(h_filename, filename)) {
return 0;
}
file_t *f = load_file(filename);
if (!f)
errx(1, "No such file: %s", filename);
ast_t *ast = parse_file(f, NULL);
if (!ast)
errx(1, "Could not parse %s", f);
env_t *module_env = load_module_env(base_env, ast);
CORD h_code = compile_header(module_env, ast);
if (autofmt) {
FILE *prog = CORD_RUN(autofmt, " 2>/dev/null >", h_filename);
CORD_put(h_code, prog);
if (pclose(prog) == -1)
errx(1, "Failed to run autoformat program on header file: %s", autofmt);
} else {
FILE *h_file = fopen(h_filename, "w");
if (!h_file)
errx(1, "Couldn't open file: %s", h_filename);
CORD_put(h_code, h_file);
if (fclose(h_file))
errx(1, "Failed to close file: %s", h_filename);
}
if (verbose)
printf("Transpiled to %s\n", h_filename);
if (show_codegen) {
FILE *out = CORD_RUN("bat -P ", h_filename);
pclose(out);
}
return 0;
}
int transpile_code(env_t *base_env, const char *filename, bool force_retranspile)
{
const char *c_filename = heap_strf("%s.c", filename);
if (!force_retranspile && !is_stale(c_filename, filename)) {
return 0;
}
file_t *f = load_file(filename);
if (!f)
errx(1, "No such file: %s", filename);
ast_t *ast = parse_file(f, NULL);
if (!ast)
errx(1, "Could not parse %s", f);
env_t *module_env = load_module_env(base_env, ast);
CORD c_code = compile_file(module_env, ast);
if (autofmt) {
FILE *prog = CORD_RUN(autofmt, " 2>/dev/null >", c_filename);
CORD_put(c_code, prog);
if (pclose(prog) == -1)
errx(1, "Failed to output autoformatted C code to %s: %s", c_filename, autofmt);
} else {
FILE *c_file = fopen(c_filename, "w");
if (!c_file)
errx(1, "Couldn't open file: %s", c_filename);
CORD_put(c_code, c_file);
if (fclose(c_file))
errx(1, "Failed to close file: %s", c_filename);
}
if (verbose)
printf("Transpiled to %s\n", c_filename);
if (show_codegen) {
FILE *out = CORD_RUN("bat -P ", c_filename);
pclose(out);
}
return 0;
}
int compile_object_file(const char *filename, bool force_recompile)
{
const char *obj_file = heap_strf("%s.o", filename);
if (!force_recompile && !is_stale(obj_file, filename)
&& !is_stale(obj_file, heap_strf("%s.c", filename))
&& !is_stale(obj_file, heap_strf("%s.h", filename))) {
return 0;
}
CORD outfile = CORD_all(filename, ".o");
FILE *prog = CORD_RUN(cc, " ", cflags, " -c ", filename, ".c -o ", outfile);
int status = pclose(prog);
if (WIFEXITED(status) && WEXITSTATUS(status) == 0) {
if (verbose)
CORD_printf("Compiled to %r\n", outfile);
}
return WIFEXITED(status) ? WEXITSTATUS(status) : EXIT_FAILURE;
}
int compile_executable(env_t *base_env, const char *filename, CORD object_files)
{
const char *name = file_base_name(filename);
env_t *env = Table$str_get(*base_env->imports, name);
assert(env);
binding_t *main_binding = get_binding(env, "main");
if (!main_binding || main_binding->type->tag != FunctionType) {
errx(1, "No main() function has been defined for %s, so it can't be run!", filename);
}
const char *bin_name = heap_strn(filename, strlen(filename) - strlen(".tm"));
FILE *runner = CORD_RUN(autofmt, " | ", cc, " ", cflags, " ", ldflags, " ", ldlibs, " ", object_files, " -x c - -o ", bin_name);
CORD program = CORD_all(
"#include <tomo/tomo.h>\n"
"#include \"", filename, ".h\"\n"
"\n"
"int main(int argc, char *argv[]) {\n"
"tomo_init();\n"
"\n",
CORD_all(compile_cli_arg_call(env, main_binding->code, main_binding->type), "return 0;\n"),
"}\n"
);
if (show_codegen) {
FILE *out = CORD_RUN(autofmt, " | bat -P --file-name=run.c");
CORD_put(program, out);
pclose(out);
}
CORD_put(program, runner);
int status = pclose(runner);
if (WIFEXITED(status) && WEXITSTATUS(status) == 0) {
if (verbose)
printf("Compiled executable: %s\n", bin_name);
}
return WIFEXITED(status) ? WEXITSTATUS(status) : EXIT_FAILURE;
}
// vim: ts=4 sw=0 et cino=L2,l1,(0,W4,m1,\:0