mirror of
https://github.com/danog/ir.git
synced 2024-12-11 16:59:46 +01:00
1073 lines
29 KiB
C
1073 lines
29 KiB
C
/*
|
|
* IR - Lightweight JIT Compilation Framework
|
|
* (IR CLI driver)
|
|
* Copyright (C) 2022 Zend by Perforce.
|
|
* Authors: Dmitry Stogov <dmitry@php.net>
|
|
*/
|
|
|
|
#include "ir.h"
|
|
#include "ir_private.h" // TODO: move this together with loader
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
|
|
#ifdef _WIN32
|
|
# include <windows.h>
|
|
#endif
|
|
|
|
/*
 * Print the command-line usage summary to stdout.
 *
 * cmd - program name substituted into the "Usage:" line.
 *
 * The list mirrors the options parsed by main(): --run, --dump-codegen,
 * -mfastcall and (on Windows) --no-abort-fault are accepted there and are
 * therefore listed here.  --debug-regset is parsed outside of the IR_DEBUG
 * guard, so it is listed unconditionally as well.
 */
static void help(const char *cmd)
{
	printf(
#if HAVE_LLVM
		"Usage: %s [options] [--llvm-bitcode|--llvm-asm] input-file...\n"
#else
		"Usage: %s [options] input-file...\n"
#endif
		"Options:\n"
		" -O[012] - optimization level (default: 2)\n"
		" -S - dump final target assembler code\n"
		" --run - run the generated main() function\n"
#if defined(IR_TARGET_X86) || defined(IR_TARGET_X64)
		" -mavx - use AVX instruction set\n"
		" -mno-bmi1 - disable BMI1 instruction set\n"
#endif
		" -muse-fp - use base frame pointer register\n"
		" -mfastcall - use fastcall calling convention by default\n"
		" --emit-c [file-name] - convert to C source\n"
		" --emit-llvm [file-name] - convert to LLVM\n"
		" --save [file-name] - save IR\n"
		" --dot [file-name] - dump IR graph\n"
		" --dump [file-name] - dump IR table\n"
		" --dump-after-load - dump IR after load and local optimization\n"
		" --dump-after-sccp - dump IR after SCCP optimization pass\n"
		" --dump-after-gcm - dump IR after GCM optimization pass\n"
		" --dump-after-schedule - dump IR after SCHEDULE pass\n"
		" --dump-after-live-ranges - dump IR after live ranges identification\n"
		" --dump-after-coalescing - dump IR after live ranges coalescing\n"
		" --dump-after-all - dump IR after each pass\n"
		" --dump-final - dump IR after all pass\n"
		" --dump-size - dump generated code size\n"
		" --dump-use-lists - dump def->use lists\n"
		" --dump-cfg - dump CFG (Control Flow Graph)\n"
		" --dump-cfg-map - dump CFG map (instruction to BB number)\n"
		" --dump-live-ranges - dump live ranges\n"
		" --dump-codegen - dump final IR in codegen format\n"
#ifdef IR_DEBUG
		" --debug-sccp - debug SCCP optimization pass\n"
		" --debug-gcm - debug GCM optimization pass\n"
		" --debug-schedule - debug SCHEDULE optimization pass\n"
		" --debug-ra - debug register allocator\n"
#endif
		" --debug-regset <bit-mask> - restrict available register set\n"
#ifdef _WIN32
		" --no-abort-fault - suppress abort message and fault error dialogs\n"
#endif
		" --target - print JIT target\n"
		" --version\n"
		" --help\n",
		cmd);
}
|
|
|
|
/*
 * Bits of the "dump" mask built by main() and consumed by _save() and
 * ir_compile_func().
 */

/* What to write (low bits) */
#define IR_DUMP_SAVE              (1<<0)  /* ir_save()             */
#define IR_DUMP_DUMP              (1<<1)  /* ir_dump()             */
#define IR_DUMP_DOT               (1<<2)  /* ir_dump_dot()         */
#define IR_DUMP_USE_LISTS         (1<<3)  /* ir_dump_use_lists()   */
#define IR_DUMP_CFG               (1<<4)  /* ir_dump_cfg()         */
#define IR_DUMP_CFG_MAP           (1<<5)  /* ir_dump_cfg_map()     */
#define IR_DUMP_LIVE_RANGES       (1<<6)  /* ir_dump_live_ranges() */
#define IR_DUMP_CODEGEN           (1<<7)  /* ir_dump_codegen(), final pass only */

/* When to write it: one bit per compilation stage */
#define IR_DUMP_AFTER_LOAD        (1<<16)
#define IR_DUMP_AFTER_SCCP        (1<<17)
#define IR_DUMP_AFTER_GCM         (1<<18)
#define IR_DUMP_AFTER_SCHEDULE    (1<<19)
#define IR_DUMP_AFTER_LIVE_RANGES (1<<20)
#define IR_DUMP_AFTER_COALESCING  (1<<21)

/* Stage wildcards */
#define IR_DUMP_AFTER_ALL         (1<<29) /* after every stage */
#define IR_DUMP_FINAL             (1<<30) /* once, after the last stage */
|
|
|
|
/*
 * Write every dump selected in `dump` for the compilation stage `pass`.
 *
 * ctx       - IR context to dump
 * dump      - mask of IR_DUMP_* flags (what to dump)
 * pass      - the single IR_DUMP_AFTER_* or IR_DUMP_FINAL bit naming the stage
 * f         - destination stream; when NULL a "<stage>-<func_name>.ir" file
 *             (or "<func_name>.ir" without IR_DUMP_AFTER_ALL) is created in
 *             the current directory and closed again before returning
 * func_name - function name used to build that file name
 *
 * Returns 1 on success and 0 if the output file cannot be created.
 */
static int _save(ir_ctx *ctx, uint32_t dump, uint32_t pass, FILE *f, const char *func_name)
{
	char fn[4096];
	bool opened = 0; /* set when this call owns (and must close) the stream */

	if (!f) {
		/* File-name prefix; NULL means "unknown stage, fall back to stderr". */
		const char *prefix = "";

		if (dump & IR_DUMP_AFTER_ALL) {
			switch (pass) {
				case IR_DUMP_AFTER_LOAD:
					prefix = "01-load-";
					break;
				case IR_DUMP_AFTER_SCCP:
					prefix = "02-sccp-";
					break;
				case IR_DUMP_AFTER_GCM:
					prefix = "03-gcm-";
					break;
				case IR_DUMP_AFTER_SCHEDULE:
					prefix = "04-schedule-";
					break;
				case IR_DUMP_AFTER_LIVE_RANGES:
					prefix = "05-live-ranges-";
					break;
				case IR_DUMP_AFTER_COALESCING:
					prefix = "06-coalescing-";
					break;
				case IR_DUMP_FINAL:
					prefix = (dump & IR_DUMP_CODEGEN) ? "07-codegen-" : "07-final-";
					break;
				default:
					prefix = NULL;
					break;
			}
		}

		if (!prefix) {
			/*
			 * No file name exists for this stage.  The previous code still
			 * went on to fopen() the uninitialized `fn` buffer here.
			 */
			f = stderr; // TODO:
		} else {
			int len = snprintf(fn, sizeof(fn), "%s%s.ir", prefix, func_name);

			if (len < 0 || (size_t)len >= sizeof(fn)) {
				/* Refuse to create a file under a truncated name. */
				fprintf(stderr, "ERROR: Cannot create file '%s%s.ir'\n", prefix, func_name);
				return 0;
			}
			f = fopen(fn, "w+");
			if (!f) {
				fprintf(stderr, "ERROR: Cannot create file '%s'\n", fn);
				return 0;
			}
			opened = 1;
		}
	}

	/* The codegen dump replaces the plain save on the final stage. */
	if (pass == IR_DUMP_FINAL && (dump & IR_DUMP_CODEGEN)) {
		ir_dump_codegen(ctx, f);
	} else if (dump & IR_DUMP_SAVE) {
		ir_save(ctx, f);
	}
	if (dump & IR_DUMP_DUMP) {
		ir_dump(ctx, f);
	}
	if (dump & IR_DUMP_DOT) {
		ir_dump_dot(ctx, f);
	}
	if (dump & IR_DUMP_USE_LISTS) {
		ir_dump_use_lists(ctx, f);
	}
	if (dump & IR_DUMP_CFG) {
		ir_dump_cfg(ctx, f);
	}
	if (dump & IR_DUMP_CFG_MAP) {
		ir_dump_cfg_map(ctx, f);
	}
	if (dump & IR_DUMP_LIVE_RANGES) {
		ir_dump_live_ranges(ctx, f);
	}

	if (opened) {
		fclose(f);
	}
	return 1;
}
|
|
|
|
/*
 * Dump the IR for stage `pass` if that stage, or "after all", was requested.
 * Returns 0 only when a requested dump could not be written.
 */
static int ir_main_dump_pass(ir_ctx *ctx, uint32_t dump, uint32_t pass, FILE *dump_file, const char *func_name)
{
	if (!(dump & (pass | IR_DUMP_AFTER_ALL))) {
		return 1;
	}
	return _save(ctx, dump, pass, dump_file, func_name);
}

/*
 * Run the compilation pipeline on one function.
 *
 * ctx       - IR context of the function
 * opt_level - 0, 1 or 2; level 1 enables scheduling and live-range based
 *             passes, level 2 additionally runs SCCP
 * dump      - mask of IR_DUMP_* flags selecting intermediate dumps
 * dump_file - stream for the dumps (handed to _save())
 * func_name - function name (handed to _save())
 *
 * Returns 1 on success, 0 if one of the requested dumps failed.
 */
int ir_compile_func(ir_ctx *ctx, int opt_level, uint32_t dump, FILE *dump_file, const char *func_name)
{
	if (!ir_main_dump_pass(ctx, dump, IR_DUMP_AFTER_LOAD, dump_file, func_name)) {
		return 0;
	}

	if (opt_level >= 1 || (ctx->flags & (IR_GEN_NATIVE|IR_GEN_CODE))) {
		ir_build_def_use_lists(ctx);
	}

	ir_check(ctx);

	/* Global Optimization */
	if (opt_level >= 2) {
		ir_sccp(ctx);
		if (!ir_main_dump_pass(ctx, dump, IR_DUMP_AFTER_SCCP, dump_file, func_name)) {
			return 0;
		}
	}

	if (opt_level >= 1 || (ctx->flags & (IR_GEN_NATIVE|IR_GEN_CODE))) {
		ir_build_cfg(ctx);
	}

	/* Schedule */
	if (opt_level >= 1) {
		ir_build_dominators_tree(ctx);
		ir_find_loops(ctx);

		ir_gcm(ctx);
		if (!ir_main_dump_pass(ctx, dump, IR_DUMP_AFTER_GCM, dump_file, func_name)) {
			return 0;
		}

		ir_schedule(ctx);
		if (!ir_main_dump_pass(ctx, dump, IR_DUMP_AFTER_SCHEDULE, dump_file, func_name)) {
			return 0;
		}
	}

	if (ctx->flags & IR_GEN_NATIVE) {
		ir_match(ctx);
	}

	if (opt_level >= 1) {
		ir_assign_virtual_registers(ctx);

		ir_compute_live_ranges(ctx);
		if (!ir_main_dump_pass(ctx, dump, IR_DUMP_AFTER_LIVE_RANGES, dump_file, func_name)) {
			return 0;
		}

		ir_coalesce(ctx);
		if (!ir_main_dump_pass(ctx, dump, IR_DUMP_AFTER_COALESCING, dump_file, func_name)) {
			return 0;
		}

		if (ctx->flags & IR_GEN_NATIVE) {
			ir_reg_alloc(ctx);
		}

		ir_schedule_blocks(ctx);
	} else if (ctx->flags & (IR_GEN_NATIVE|IR_GEN_CODE)) {
		ir_assign_virtual_registers(ctx);
		ir_compute_dessa_moves(ctx);
	}

	/* The final dump is also triggered by a codegen dump request. */
	if (dump & (IR_DUMP_FINAL|IR_DUMP_AFTER_ALL|IR_DUMP_CODEGEN)) {
		if (!_save(ctx, dump, IR_DUMP_FINAL, dump_file, func_name)) {
			return 0;
		}
	}

	ir_check(ctx);

	return 1;
}
|
|
|
|
/* One slot of the loader's symbol array (see ir_main_loader.sym). */
typedef struct _ir_sym {
	void *addr;       /* address of the symbol; NULL while it is only declared */
	void *thunk_addr; /* placeholder handed out while `addr` is still unknown */
} ir_sym;
|
|
|
|
typedef struct _ir_main_loader {
|
|
ir_loader loader;
|
|
int opt_level;
|
|
uint32_t mflags;
|
|
uint64_t debug_regset;
|
|
uint32_t dump;
|
|
bool dump_asm;
|
|
bool dump_size;
|
|
bool run;
|
|
size_t size;
|
|
void *main;
|
|
FILE *dump_file;
|
|
FILE *c_file;
|
|
FILE *llvm_file;
|
|
ir_strtab symtab;
|
|
ir_sym *sym;
|
|
ir_ref sym_count;
|
|
void *data;
|
|
void *code_buffer;
|
|
size_t code_buffer_size;
|
|
} ir_main_loader;
|
|
|
|
/*
 * Register `name` in the symbol table, or complete an earlier declaration.
 *
 * loader - the ir_main_loader, passed as its embedded ir_loader
 * name   - symbol name
 * addr   - symbol address, or NULL to record a declaration only
 *
 * Returns 1 if a new symbol was added or a declared-but-undefined symbol
 * received its address; returns 0 if the name already exists and cannot be
 * updated (it already has an address, or `addr` is NULL).
 */
static bool ir_loader_add_sym(ir_loader *loader, const char *name, void *addr)
{
	ir_main_loader *ml = (ir_main_loader*)loader;
	/* Index the name receives if it is not in the table yet. */
	ir_ref new_id = ir_strtab_count(&ml->symtab) + 1;
	ir_ref id = ir_strtab_lookup(&ml->symtab, name, (uint32_t)strlen(name), new_id);
	ir_sym *sym;

	if (id == new_id) {
		/* New name: make sure the slot exists, then fill it. */
		if (new_id >= ml->sym_count) {
			ml->sym_count += 16;
			ml->sym = ir_mem_realloc(ml->sym, sizeof(ir_sym) * ml->sym_count);
		}
		sym = &ml->sym[new_id];
		sym->addr = addr;
		sym->thunk_addr = NULL;
		return 1;
	}

	/* Known name: only a forward declaration may be updated. */
	sym = &ml->sym[id];
	if (!addr || sym->addr) {
		return 0;
	}
	sym->addr = addr;
	if (sym->thunk_addr) {
		// TODO: Fix thunk or relocation ???
	}
	return 1;
}
|
|
|
|
/* Return true if `name` is already present in the loader's symbol table. */
static bool ir_loader_has_sym(ir_loader *loader, const char *name)
{
	ir_main_loader *ml = (ir_main_loader*)loader;

	/* ir_strtab_find() yields 0 for an unknown name. */
	return ir_strtab_find(&ml->symtab, name, (uint32_t)strlen(name)) != 0;
}
|
|
|
|
/*
 * Resolve `name` to an address.
 *
 * Names already in the symbol table yield their recorded address, or a
 * placeholder "thunk" address while they are only declared.  Unknown names
 * are resolved through ir_resolve_sym_name() and the result is cached in the
 * symbol table.
 *
 * Returns the address, or whatever ir_resolve_sym_name() returns for a name
 * it cannot resolve.
 */
static void* ir_loader_resolve_sym_name(ir_loader *loader, const char *name)
{
	ir_main_loader *ml = (ir_main_loader*)loader;
	ir_ref id = ir_strtab_find(&ml->symtab, name, (uint32_t)strlen(name));
	ir_sym *sym;

	if (!id) {
		void *resolved = ir_resolve_sym_name(name);

		/* NOTE(review): the result is cached even when it is NULL - confirm this is intended */
		ir_loader_add_sym(loader, name, resolved); /* cache */
		return resolved;
	}

	sym = &ml->sym[id];
	if (sym->addr) {
		return sym->addr;
	}
	if (!sym->thunk_addr) {
		/* Undefined declaration */
		// TODO: Add thunk or relocation ???
		sym->thunk_addr = (void*)(intptr_t)sizeof(void*);
	}
	return sym->thunk_addr;
}
|
|
|
|
/*
 * Loader callback: declaration of an external data symbol.
 *
 * Echoes the declaration to every enabled output (IR save, C, LLVM).  When
 * native code is requested (-S, --dump-size or --run) the symbol is also
 * resolved, otherwise it is only recorded as declared.
 *
 * Returns 0 if the symbol has to be resolved and cannot be; 1 otherwise,
 * including when the name is already known.
 */
static bool ir_loader_external_sym_dcl(ir_loader *loader, const char *name, uint32_t flags)
{
	ir_main_loader *ml = (ir_main_loader*) loader;
	uint32_t extern_flags = flags | IR_EXTERN;
	void *addr;

	if (ir_loader_has_sym(loader, name)) {
		return 1;
	}

	if (ml->dump_file && (ml->dump & IR_DUMP_SAVE)) {
		const char *kind = (flags & IR_CONST) ? "const" : "var";

		fprintf(ml->dump_file, "extern %s %s;\n", kind, name);
	}
	if (ml->c_file) {
		ir_emit_c_sym_decl(name, extern_flags, 0, ml->c_file);
	}
	if (ml->llvm_file) {
		ir_emit_llvm_sym_decl(name, extern_flags, 0, ml->llvm_file);
	}

	if (!(ml->dump_asm || ml->dump_size || ml->run)) {
		/* No native code: remember the name as declared only. */
		ir_loader_add_sym(loader, name, NULL);
		return 1;
	}

	addr = ir_loader_resolve_sym_name(loader, name);
	if (!addr) {
		return 0;
	}
	if (ml->dump_asm) {
		ir_disasm_add_symbol(name, (uintptr_t)addr, sizeof(void*));
	}
	return 1;
}
|
|
|
|
/*
 * Write a function declaration in IR text form to `f`:
 *
 *   [extern |static ]func NAME(TYPE, TYPE, ...): RET [__fastcall|__builtin];
 *
 * name         - function name
 * flags        - IR_EXTERN / IR_STATIC / IR_VARARG_FUNC / IR_FASTCALL_FUNC /
 *                IR_BUILTIN_FUNC bits controlling the optional parts
 * ret_type     - return type
 * params_count - number of entries in `param_types`
 * param_types  - parameter types, used as indexes into ir_type_cname
 * f            - output stream
 */
static void ir_dump_func_dcl(const char *name, uint32_t flags, ir_type ret_type, uint32_t params_count, const uint8_t *param_types, FILE *f)
{
	uint32_t idx;

	if (flags & IR_EXTERN) {
		fprintf(f, "extern ");
	} else if (flags & IR_STATIC) {
		fprintf(f, "static ");
	}

	fprintf(f, "func %s(", name);
	for (idx = 0; idx < params_count; idx++) {
		if (idx > 0) {
			fprintf(f, ", ");
		}
		fprintf(f, "%s", ir_type_cname[param_types[idx]]);
	}
	if (flags & IR_VARARG_FUNC) {
		/* The ellipsis needs a separator only after real parameters. */
		if (params_count) {
			fprintf(f, ", ");
		}
		fprintf(f, "...");
	}
	fprintf(f, "): %s", ir_type_cname[ret_type]);

	if (flags & IR_FASTCALL_FUNC) {
		fprintf(f, " __fastcall");
	} else if (flags & IR_BUILTIN_FUNC) {
		fprintf(f, " __builtin");
	}
	fprintf(f, ";\n");
}
|
|
|
|
static bool ir_loader_external_func_dcl(ir_loader *loader, const char *name, uint32_t flags,
|
|
ir_type ret_type, uint32_t params_count, const uint8_t *param_types)
|
|
{
|
|
ir_main_loader *l = (ir_main_loader*) loader;
|
|
|
|
if (ir_loader_has_sym(loader, name)) {
|
|
return 1;
|
|
}
|
|
|
|
if ((l->dump & IR_DUMP_SAVE) && (l->dump_file)) {
|
|
ir_dump_func_dcl(name, flags | IR_EXTERN, ret_type, params_count, param_types, l->dump_file);
|
|
}
|
|
if (l->c_file) {
|
|
ir_emit_c_func_decl(name, flags | IR_EXTERN, ret_type, params_count, param_types, l->c_file);
|
|
}
|
|
if (l->llvm_file) {
|
|
ir_emit_llvm_func_decl(name, flags | IR_EXTERN, ret_type, params_count, param_types, l->llvm_file);
|
|
}
|
|
if (l->dump_asm || l->dump_size || l->run) {
|
|
void *addr = ir_loader_resolve_sym_name(loader, name);
|
|
|
|
if (!addr) {
|
|
return 0;
|
|
}
|
|
if (l->dump_asm) {
|
|
ir_disasm_add_symbol(name, (uintptr_t)addr, sizeof(void*));
|
|
}
|
|
} else {
|
|
ir_loader_add_sym(loader, name, NULL);
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
static bool ir_loader_forward_func_dcl(ir_loader *loader, const char *name, uint32_t flags,
|
|
ir_type ret_type, uint32_t params_count, const uint8_t *param_types)
|
|
{
|
|
ir_main_loader *l = (ir_main_loader*) loader;
|
|
|
|
if (ir_loader_has_sym(loader, name)) {
|
|
return 1;
|
|
}
|
|
|
|
if ((l->dump & IR_DUMP_SAVE) && (l->dump_file)) {
|
|
ir_dump_func_dcl(name, flags, ret_type, params_count, param_types, l->dump_file);
|
|
}
|
|
if (l->c_file) {
|
|
ir_emit_c_func_decl(name, flags, ret_type, params_count, param_types, l->c_file);
|
|
}
|
|
|
|
ir_loader_add_sym(loader, name, NULL);
|
|
return 1;
|
|
}
|
|
|
|
/*
 * Loader callback: definition of a data symbol of `size` bytes.
 *
 * loader   - the ir_main_loader, passed as its embedded ir_loader
 * name     - symbol name
 * flags    - IR_STATIC / IR_CONST bits
 * size     - size of the symbol's storage in bytes
 * has_data - true when initializer data follows through ir_loader_sym_data()
 *
 * Echoes the declaration to every enabled output.  When native code is
 * requested (-S, --dump-size or --run) zero-filled storage is allocated and
 * registered under `name`; with `has_data` it also becomes the target of the
 * following ir_loader_sym_data() calls.  The storage is not released here.
 *
 * Returns 0 if the symbol cannot be registered (it is already defined),
 * 1 otherwise.
 */
static bool ir_loader_sym_dcl(ir_loader *loader, const char *name, uint32_t flags, size_t size, bool has_data)
{
	ir_main_loader *l = (ir_main_loader*) loader;

	if ((l->dump & IR_DUMP_SAVE) && (l->dump_file)) {
		if (flags & IR_STATIC) {
			fprintf(l->dump_file, "static ");
		}
		/*
		 * size_t must not be printed with "%ld"; cast and use "%lld", the
		 * same way main() prints the code size.
		 */
		fprintf(l->dump_file, "%s %s [%lld]%s\n", (flags & IR_CONST) ? "const" : "var", name,
			(long long int)size, has_data ? " = {" : ";");
	}
	if (l->c_file) {
		ir_emit_c_sym_decl(name, flags, has_data, l->c_file);
	}
	if (l->llvm_file) {
		ir_emit_llvm_sym_decl(name, flags, has_data, l->llvm_file);
	}
	if (l->dump_asm || l->dump_size || l->run) {
		void *data = ir_mem_malloc(size);

		if (!ir_loader_add_sym(loader, name, data)) {
			ir_mem_free(data);
			return 0;
		}
		memset(data, 0, size);
		if (has_data) {
			/* Initializer chunks are appended starting at this address. */
			l->data = data;
		}
		if (l->dump_asm) {
			ir_disasm_add_symbol(name, (uintptr_t)data, size);
		}
	} else {
		ir_loader_add_sym(loader, name, NULL);
	}
	return 1;
}
|
|
|
|
/*
 * Loader callback: one chunk of initializer data for the symbol most
 * recently defined by ir_loader_sym_dcl().
 *
 * loader - the ir_main_loader, passed as its embedded ir_loader
 * type   - element type; ir_type_size[type] gives the element size
 * count  - number of elements in `data`
 * data   - the element values
 *
 * With IR saving enabled each element is printed as a hexadecimal literal
 * (elements whose size is not 1, 2, 4 or 8 bytes are not printed).  When
 * native code is requested the bytes are appended at the current data cursor.
 *
 * Returns 0 if native code is requested but no symbol is waiting for data,
 * 1 otherwise.
 */
static bool ir_loader_sym_data(ir_loader *loader, ir_type type, uint32_t count, const void *data)
{
	ir_main_loader *l = (ir_main_loader*) loader;

	if ((l->dump & IR_DUMP_SAVE) && (l->dump_file)) {
		const unsigned char *p = (const unsigned char*)data;
		uint32_t i;

		/* Elements are read with memcpy(), so `data` needs no particular alignment. */
		switch (ir_type_size[type]) {
			case 1:
				for (i = 0; i < count; i++, p += 1) {
					fprintf(l->dump_file, "\t%s 0x%02x,\n", ir_type_cname[type], (uint32_t)*p);
				}
				break;
			case 2:
				/* Step by 2 bytes; the previous code advanced by only 1. */
				for (i = 0; i < count; i++, p += 2) {
					uint16_t v;

					memcpy(&v, p, sizeof(v));
					fprintf(l->dump_file, "\t%s 0x%04x,\n", ir_type_cname[type], (uint32_t)v);
				}
				break;
			case 4:
				for (i = 0; i < count; i++, p += 4) {
					uint32_t v;

					memcpy(&v, p, sizeof(v));
					fprintf(l->dump_file, "\t%s 0x%08x,\n", ir_type_cname[type], v);
				}
				break;
			case 8:
				for (i = 0; i < count; i++, p += 8) {
					uint64_t v;

					memcpy(&v, p, sizeof(v));
					/* uint64_t is not always "unsigned long": print through a cast. */
					fprintf(l->dump_file, "\t%s 0x%016llx,\n", ir_type_cname[type], (unsigned long long)v);
				}
				break;
			default:
				break;
		}
	}
	if (l->c_file) {
		// TODO:
	}
	if (l->llvm_file) {
		// TODO:
	}
	if (l->dump_asm || l->dump_size || l->run) {
		/* Widen before multiplying so the byte count is computed as size_t. */
		size_t size = (size_t)ir_type_size[type] * count;

		if (!l->data) {
			return 0;
		}
		// TODO: alignement
		/* NOTE(review): nothing here checks `size` against the size given to ir_loader_sym_dcl() */
		memcpy(l->data, data, size);
		l->data = (void*)((uintptr_t)l->data + size);
	}
	return 1;
}
|
|
|
|
/*
 * Loader callback: an initializer element that refers to another symbol.
 *
 * op  - IR_FUNC or IR_SYM (asserted)
 * ref - name of the referenced function or symbol
 *
 * Only the IR save output is implemented; the C, LLVM and native outputs
 * ignore the reference for now.  Always returns 1.
 */
static bool ir_loader_sym_data_ref(ir_loader *loader, ir_op op, const char *ref)
{
	ir_main_loader *ml = (ir_main_loader*) loader;

	IR_ASSERT(op == IR_FUNC || op == IR_SYM);

	if (ml->dump_file && (ml->dump & IR_DUMP_SAVE)) {
		const char *kind = (op == IR_FUNC) ? "func" : "sym";

		fprintf(ml->dump_file, "\t%s %s(%s),\n", ir_type_cname[IR_ADDR], kind, ref);
	}

	// TODO: C output (ml->c_file)
	// TODO: LLVM output (ml->llvm_file)
	// TODO: native data (ml->dump_asm || ml->dump_size || ml->run)

	return 1;
}
|
|
|
|
/*
 * Loader callback: end of a symbol's initializer data.
 *
 * Closes the "= {" block in the IR save output; the C, LLVM and native
 * outputs have nothing to do yet.  Always returns 1.
 */
static bool ir_loader_sym_data_end(ir_loader *loader)
{
	ir_main_loader *ml = (ir_main_loader*) loader;

	if (ml->dump_file && (ml->dump & IR_DUMP_SAVE)) {
		fprintf(ml->dump_file, "};\n");
	}

	// TODO: C output (ml->c_file)
	// TODO: LLVM output (ml->llvm_file)
	// TODO: native data (ml->dump_asm || ml->dump_size || ml->run)

	return 1;
}
|
|
|
|
/*
 * Loader callback: prepare `ctx` for a new function.
 *
 * Initializes the context with the loader's default function flags and
 * applies the driver settings (machine flags and register restrictions).
 * `name` is not used.  Always returns 1.
 */
static bool ir_loader_func_init(ir_loader *loader, ir_ctx *ctx, const char *name)
{
	const ir_main_loader *cfg = (const ir_main_loader*) loader;

	/* 256 and 1024 are the initial sizes given to ir_init() - presumably constant and instruction limits, confirm in ir.h */
	ir_init(ctx, loader->default_func_flags, 256, 1024);

	ctx->loader = loader;
	/* Every register outside of the --debug-regset mask is treated as fixed. */
	ctx->fixed_regset = ~cfg->debug_regset;
	ctx->mflags = cfg->mflags;
	return 1;
}
|
|
|
|
/*
 * Derive ctx->ret_type from the function body when the loader left it unset
 * ((ir_type)-1): take the type of the first RETURN value, or of a TAILCALL
 * that precedes an UNREACHABLE.
 */
static void ir_main_infer_ret_type(ir_ctx *ctx)
{
	ir_ref ref;

	// TODO: remove this
	if (ctx->ret_type != (ir_type)-1) {
		return;
	}
	for (ref = ctx->ir_base[1].op1; ref; ref = ctx->ir_base[ref].op3) {
		ir_insn *insn = &ctx->ir_base[ref];

		if (insn->op == IR_RETURN) {
			ctx->ret_type = insn->op2 ? ctx->ir_base[insn->op2].type : IR_VOID;
			break;
		} else if (insn->op == IR_UNREACHABLE && ctx->ir_base[insn->op1].op == IR_TAILCALL) {
			ctx->ret_type = ctx->ir_base[insn->op1].type;
			break;
		}
	}
}

/* Write the "func NAME(TYPES): RET" header line of a function to `f`. */
static void ir_main_dump_func_header(ir_ctx *ctx, const char *name, FILE *f)
{
	if (ctx->flags & IR_STATIC) {
		fprintf(f, "static ");
	}
	fprintf(f, "func %s(", name);
	if (ctx->ir_base[2].op == IR_PARAM) {
		/* Parameters are the run of IR_PARAM instructions starting at index 2. */
		ir_insn *insn = &ctx->ir_base[2];

		fprintf(f, "%s", ir_type_cname[insn->type]);
		insn++;
		while (insn->op == IR_PARAM) {
			fprintf(f, ", %s", ir_type_cname[insn->type]);
			insn++;
		}
		if (ctx->flags & IR_VARARG_FUNC) {
			fprintf(f, ", ...");
		}
	} else if (ctx->flags & IR_VARARG_FUNC) {
		fprintf(f, "...");
	}
	fprintf(f, "): %s", ir_type_cname[ctx->ret_type != (ir_type)-1 ? ctx->ret_type : IR_VOID]);
	if (ctx->flags & IR_FASTCALL_FUNC) {
		fprintf(f, " __fastcall");
	}
	fprintf(f, "\n");
}

/*
 * Loader callback: compile one loaded function and produce every requested
 * output for it.
 *
 * loader - the ir_main_loader, passed as its embedded ir_loader
 * ctx    - IR context holding the function
 * name   - function name; NULL stands for an anonymous function, which is
 *          treated as "main" with --run and as "test" otherwise
 *
 * Returns 1 on success and 0 if compilation, C/LLVM emission or native code
 * generation fails, or if the function name is already defined.
 */
static bool ir_loader_func_process(ir_loader *loader, ir_ctx *ctx, const char *name)
{
	ir_main_loader *l = (ir_main_loader*) loader;

	ir_main_infer_ret_type(ctx);

	if (name == NULL) {
		name = (l->run) ? "main" : "test";
	} else if ((l->dump & IR_DUMP_SAVE) && l->dump_file) {
		ir_main_dump_func_header(ctx, name, l->dump_file);
	}

	if (!ir_compile_func(ctx, l->opt_level, l->dump, l->dump_file, name)) {
		return 0;
	}

	if (l->c_file) {
		if (!ir_emit_c(ctx, name, l->c_file)) {
			fprintf(stderr, "\nERROR: %d\n", ctx->status);
			return 0;
		}
	}

	if (l->llvm_file) {
		if (!ir_emit_llvm(ctx, name, l->llvm_file)) {
			fprintf(stderr, "\nERROR: %d\n", ctx->status);
			return 0;
		}
	}

	if (l->dump_asm || l->dump_size || l->run) {
		size_t size = 0;
		void *entry;

		if (l->code_buffer) {
			/* Continue right after the code generated so far. */
			ctx->code_buffer = (char*)l->code_buffer + l->size;
			ctx->code_buffer_size = l->code_buffer_size - l->size;
			ir_mem_unprotect(l->code_buffer, l->code_buffer_size);
		}
		entry = ir_emit_code(ctx, &size);
#ifndef _WIN32
		/*
		 * Register with GDB only after a successful emit; the previous code
		 * passed `entry` and `size` on before `entry` was checked for NULL.
		 */
		if (entry && l->run) {
			if (!l->code_buffer) {
				ir_mem_unprotect(entry, size);
			}
			ir_gdb_register(name, entry, size, sizeof(void*), 0);
			if (!l->code_buffer) {
				ir_mem_protect(entry, size);
			}
		}
#endif
		if (l->code_buffer) {
			ir_mem_protect(l->code_buffer, l->code_buffer_size);
		}
		if (!entry) {
			fprintf(stderr, "\nERROR: %d\n", ctx->status);
			return 0;
		}

		l->size += size;
#if defined(IR_TARGET_AARCH64)
		l->size += ctx->veneers_size;
#endif
		l->size = IR_ALIGNED_SIZE(l->size, 16);
		if (!ir_loader_add_sym(loader, name, entry)) {
			fprintf(stderr, "\nERROR: Symbol redefinition: %s\n", name);
			return 0;
		}
		if (l->dump_asm) {
			ir_ref i;
			ir_insn *insn;

			ir_disasm_add_symbol(name, (uintptr_t)entry, size);

			/* Tell the disassembler about each function the constants refer to. */
			for (i = IR_UNUSED + 1, insn = ctx->ir_base - i; i < ctx->consts_count; i++, insn--) {
				if (insn->op == IR_FUNC) {
					const char *func_name = ir_get_str(ctx, insn->val.name);
					void *addr = ir_loader_resolve_sym_name(loader, func_name);

					ir_disasm_add_symbol(func_name, (uintptr_t)addr, sizeof(void*));
//TODO:				} else if (insn->op == IR_SYM) {
				}
			}

			ir_disasm(name, entry, size, 0, ctx, stderr);
		}
		if (l->run) {
#ifndef _WIN32
			ir_perf_map_register(name, entry, size);
			ir_perf_jitdump_open();
			ir_perf_jitdump_register(name, entry, size);
#endif
			if (strcmp(name, "main") == 0) {
				/* main() of the driver calls this entry after loading. */
				l->main = entry;
			}
		}
	}
	return 1;
}
|
|
|
|
int main(int argc, char **argv)
|
|
{
|
|
int i;
|
|
char *input = NULL;
|
|
char *dump_file = NULL, *c_file = NULL, *llvm_file = 0;
|
|
FILE *f;
|
|
bool emit_c = 0, emit_llvm = 0, dump_size = 0, dump_asm = 0, run = 0;
|
|
uint32_t dump = 0;
|
|
int opt_level = 2;
|
|
uint32_t flags = 0;
|
|
uint32_t mflags = 0;
|
|
#if defined(IR_TARGET_X86) || defined(IR_TARGET_X64)
|
|
uint32_t mflags_disabled = 0;
|
|
#endif
|
|
uint64_t debug_regset = 0xffffffffffffffff;
|
|
#ifdef _WIN32
|
|
bool abort_fault = 1;
|
|
#endif
|
|
#if HAVE_LLVM
|
|
bool load_llvm_bitcode = 0;
|
|
bool load_llvm_asm = 0;
|
|
#endif
|
|
ir_main_loader loader;
|
|
|
|
ir_consistency_check();
|
|
|
|
for (i = 1; i < argc; i++) {
|
|
if (strcmp(argv[i], "-h") == 0
|
|
|| strcmp(argv[i], "--help") == 0) {
|
|
help(argv[0]);
|
|
return 0;
|
|
} else if (strcmp(argv[i], "--version") == 0) {
|
|
printf("IR %s\n", IR_VERSION);
|
|
return 0;
|
|
} else if (strcmp(argv[i], "--target") == 0) {
|
|
printf("%s\n", IR_TARGET);
|
|
return 0;
|
|
} else if (argv[i][0] == '-' && argv[i][1] == 'O' && strlen(argv[i]) == 3) {
|
|
if (argv[i][2] == '0') {
|
|
opt_level = 0;
|
|
} else if (argv[i][2] == '1') {
|
|
opt_level = 1;
|
|
} else if (argv[i][2] == '2') {
|
|
opt_level = 2;
|
|
} else {
|
|
fprintf(stderr, "ERROR: Invalid usage' (use --help)\n");
|
|
return 1;
|
|
}
|
|
} else if (strcmp(argv[i], "--emit-c") == 0) {
|
|
emit_c = 1;
|
|
if (i + 1 < argc && argv[i + 1][0] != '-') {
|
|
c_file = argv[i + 1];
|
|
i++;
|
|
}
|
|
} else if (strcmp(argv[i], "--emit-llvm") == 0) {
|
|
emit_llvm = 1;
|
|
if (i + 1 < argc && argv[i + 1][0] != '-') {
|
|
llvm_file = argv[i + 1];
|
|
i++;
|
|
}
|
|
} else if (strcmp(argv[i], "--save") == 0) {
|
|
// TODO: check save/dot/dump/... conflicts
|
|
dump |= IR_DUMP_SAVE;
|
|
if (i + 1 < argc && argv[i + 1][0] != '-') {
|
|
dump_file = argv[i + 1];
|
|
i++;
|
|
}
|
|
} else if (strcmp(argv[i], "--dot") == 0) {
|
|
dump |= IR_DUMP_DOT;
|
|
if (i + 1 < argc && argv[i + 1][0] != '-') {
|
|
dump_file = argv[i + 1];
|
|
i++;
|
|
}
|
|
} else if (strcmp(argv[i], "--dump") == 0) {
|
|
dump |= IR_DUMP_DUMP;
|
|
if (i + 1 < argc && argv[i + 1][0] != '-') {
|
|
dump_file = argv[i + 1];
|
|
i++;
|
|
}
|
|
} else if (strcmp(argv[i], "--dump-use-lists") == 0) {
|
|
dump |= IR_DUMP_USE_LISTS;
|
|
} else if (strcmp(argv[i], "--dump-cfg") == 0) {
|
|
dump |= IR_DUMP_CFG;
|
|
} else if (strcmp(argv[i], "--dump-cfg-map") == 0) {
|
|
dump |= IR_DUMP_CFG_MAP;
|
|
} else if (strcmp(argv[i], "--dump-live-ranges") == 0) {
|
|
dump |= IR_DUMP_LIVE_RANGES;
|
|
} else if (strcmp(argv[i], "--dump-codegen") == 0) {
|
|
dump |= IR_DUMP_CODEGEN;
|
|
} else if (strcmp(argv[i], "--dump-after-load") == 0) {
|
|
dump |= IR_DUMP_AFTER_LOAD;
|
|
} else if (strcmp(argv[i], "--dump-after-sccp") == 0) {
|
|
dump |= IR_DUMP_AFTER_SCCP;
|
|
} else if (strcmp(argv[i], "--dump-after-gcm") == 0) {
|
|
dump |= IR_DUMP_AFTER_GCM;
|
|
} else if (strcmp(argv[i], "--dump-after-schedule") == 0) {
|
|
dump |= IR_DUMP_AFTER_SCHEDULE;
|
|
} else if (strcmp(argv[i], "--dump-after-live-ranges") == 0) {
|
|
dump |= IR_DUMP_AFTER_LIVE_RANGES;
|
|
} else if (strcmp(argv[i], "--dump-after-coalescing") == 0) {
|
|
dump |= IR_DUMP_AFTER_COALESCING;
|
|
} else if (strcmp(argv[i], "--dump-after-all") == 0) {
|
|
dump |= IR_DUMP_AFTER_ALL;
|
|
} else if (strcmp(argv[i], "--dump-final") == 0) {
|
|
dump |= IR_DUMP_FINAL;
|
|
} else if (strcmp(argv[i], "--dump-size") == 0) {
|
|
dump_size = 1;
|
|
} else if (strcmp(argv[i], "-S") == 0) {
|
|
dump_asm = 1;
|
|
} else if (strcmp(argv[i], "--run") == 0) {
|
|
run = 1;
|
|
#if defined(IR_TARGET_X86) || defined(IR_TARGET_X64)
|
|
} else if (strcmp(argv[i], "-mavx") == 0) {
|
|
mflags |= IR_X86_AVX;
|
|
} else if (strcmp(argv[i], "-mno-bmi1") == 0) {
|
|
mflags_disabled |= IR_X86_BMI1;
|
|
#endif
|
|
} else if (strcmp(argv[i], "-muse-fp") == 0) {
|
|
flags |= IR_USE_FRAME_POINTER;
|
|
} else if (strcmp(argv[i], "-mfastcall") == 0) {
|
|
flags |= IR_FASTCALL_FUNC;
|
|
#ifdef IR_DEBUG
|
|
} else if (strcmp(argv[i], "--debug-sccp") == 0) {
|
|
flags |= IR_DEBUG_SCCP;
|
|
} else if (strcmp(argv[i], "--debug-gcm") == 0) {
|
|
flags |= IR_DEBUG_GCM;
|
|
} else if (strcmp(argv[i], "--debug-schedule") == 0) {
|
|
flags |= IR_DEBUG_SCHEDULE;
|
|
} else if (strcmp(argv[i], "--debug-ra") == 0) {
|
|
flags |= IR_DEBUG_RA;
|
|
#endif
|
|
} else if (strcmp(argv[i], "--debug-regset") == 0) {
|
|
if (i + 1 == argc || argv[i + 1][0] == '-') {
|
|
fprintf(stderr, "ERROR: Invalid usage' (use --help)\n");
|
|
return 1;
|
|
}
|
|
debug_regset = strtoull(argv[i + 1], NULL, 0);
|
|
i++;
|
|
#ifdef _WIN32
|
|
} else if (strcmp(argv[i], "--no-abort-fault") == 0) {
|
|
abort_fault = 0;
|
|
#endif
|
|
#if HAVE_LLVM
|
|
} else if (strcmp(argv[i], "--llvm-bitcode") == 0) {
|
|
if (input || i + 1 == argc || argv[i + 1][0] == '-') {
|
|
fprintf(stderr, "ERROR: Invalid usage' (use --help)\n");
|
|
return 1;
|
|
}
|
|
load_llvm_bitcode = 1;
|
|
input = argv[++i];
|
|
} else if (strcmp(argv[i], "--llvm-asm") == 0) {
|
|
if (input || i + 1 == argc || argv[i + 1][0] == '-') {
|
|
fprintf(stderr, "ERROR: Invalid usage' (use --help)\n");
|
|
return 1;
|
|
}
|
|
load_llvm_asm = 1;
|
|
input = argv[++i];
|
|
#endif
|
|
} else if (argv[i][0] == '-') {
|
|
fprintf(stderr, "ERROR: Unknown option '%s' (use --help)\n", argv[i]);
|
|
return 1;
|
|
} else {
|
|
if (input) {
|
|
fprintf(stderr, "ERROR: Invalid usage' (use --help)\n");
|
|
return 1;
|
|
}
|
|
input = argv[i];
|
|
}
|
|
}
|
|
|
|
if (dump && !(dump & (IR_DUMP_AFTER_LOAD|IR_DUMP_AFTER_SCCP|
|
|
IR_DUMP_AFTER_GCM|IR_DUMP_AFTER_SCHEDULE|
|
|
IR_DUMP_AFTER_LIVE_RANGES|IR_DUMP_AFTER_COALESCING|IR_DUMP_FINAL))) {
|
|
dump |= IR_DUMP_FINAL;
|
|
}
|
|
|
|
if (!input) {
|
|
fprintf(stderr, "ERROR: no input file\n");
|
|
return 1;
|
|
}
|
|
|
|
#if defined(IR_TARGET_X86) || defined(IR_TARGET_X64)
|
|
uint32_t cpuinfo = ir_cpuinfo();
|
|
|
|
if (!(cpuinfo & IR_X86_SSE2)) {
|
|
fprintf(stderr, "ERROR: incompatible CPU (SSE2 is not supported)\n");
|
|
return 1;
|
|
}
|
|
|
|
if ((mflags & IR_X86_AVX) && !(cpuinfo & IR_X86_AVX)) {
|
|
fprintf(stderr, "ERROR: -mavx is not compatible with CPU (AVX is not supported)\n");
|
|
return 1;
|
|
}
|
|
if ((cpuinfo & IR_X86_BMI1) && !(mflags_disabled & IR_X86_BMI1)) {
|
|
mflags |= IR_X86_BMI1;
|
|
}
|
|
#endif
|
|
|
|
#ifdef _WIN32
|
|
if (!abort_fault) {
|
|
_set_abort_behavior(0, _WRITE_ABORT_MSG|_CALL_REPORTFAULT);
|
|
SetErrorMode(SEM_FAILCRITICALERRORS|SEM_NOGPFAULTERRORBOX);
|
|
}
|
|
#endif
|
|
|
|
flags |= IR_FUNCTION;
|
|
|
|
if (opt_level > 0) {
|
|
flags |= IR_OPT_FOLDING | IR_OPT_CFG | IR_OPT_CODEGEN;
|
|
}
|
|
if (emit_c || emit_llvm) {
|
|
flags |= IR_GEN_CODE;
|
|
}
|
|
if (dump_asm || dump_size || run) {
|
|
flags |= IR_GEN_NATIVE;
|
|
if (emit_c) {
|
|
fprintf(stderr, "ERROR: --emit-c is incompatible with native code generator (-S, --dump-size, --run)\n");
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
memset(&loader, 0, sizeof(loader));
|
|
loader.loader.default_func_flags = flags;
|
|
loader.loader.init_module = NULL;
|
|
loader.loader.external_sym_dcl = ir_loader_external_sym_dcl;
|
|
loader.loader.external_func_dcl = ir_loader_external_func_dcl;
|
|
loader.loader.forward_func_dcl = ir_loader_forward_func_dcl;
|
|
loader.loader.sym_dcl = ir_loader_sym_dcl;
|
|
loader.loader.sym_data = ir_loader_sym_data;
|
|
loader.loader.sym_data_ref = ir_loader_sym_data_ref;
|
|
loader.loader.sym_data_end = ir_loader_sym_data_end;
|
|
loader.loader.func_init = ir_loader_func_init;
|
|
loader.loader.func_process = ir_loader_func_process;
|
|
loader.loader.resolve_sym_name = ir_loader_resolve_sym_name;
|
|
loader.loader.has_sym = ir_loader_has_sym;
|
|
loader.loader.add_sym = ir_loader_add_sym;
|
|
|
|
loader.opt_level = opt_level;
|
|
loader.mflags = mflags;
|
|
loader.debug_regset = debug_regset;
|
|
loader.dump = dump;
|
|
loader.dump_asm = dump_asm;
|
|
loader.dump_size = dump_size;
|
|
loader.run = run;
|
|
|
|
ir_strtab_init(&loader.symtab, 16, 4096);
|
|
loader.sym = NULL;
|
|
loader.sym_count = 0;
|
|
|
|
//TODO: ir_loader_add_sym(&loader.loader, (void*)"printf", printf);
|
|
ir_loader_add_sym(&loader.loader, (void*)"putchar", putchar);
|
|
|
|
if (dump_file) {
|
|
loader.dump_file = fopen(dump_file, "w+");
|
|
if (!loader.dump_file) {
|
|
fprintf(stderr, "ERROR: Cannot create file '%s'\n", dump_file);
|
|
return 0;
|
|
}
|
|
} else {
|
|
loader.dump_file = stderr;
|
|
}
|
|
if (emit_c) {
|
|
if (c_file) {
|
|
loader.c_file = fopen(c_file, "w+");
|
|
if (!loader.c_file) {
|
|
fprintf(stderr, "ERROR: Cannot create file '%s'\n", c_file);
|
|
return 0;
|
|
}
|
|
} else {
|
|
loader.c_file = stderr;
|
|
}
|
|
}
|
|
if (emit_llvm) {
|
|
if (llvm_file) {
|
|
loader.llvm_file = fopen(llvm_file, "w+");
|
|
if (!loader.llvm_file) {
|
|
fprintf(stderr, "ERROR: Cannot create file '%s'\n", llvm_file);
|
|
return 0;
|
|
}
|
|
} else {
|
|
loader.llvm_file = stderr;
|
|
}
|
|
}
|
|
|
|
#if defined(IR_TARGET_AARCH64)
|
|
if (dump_asm || dump_size || run) {
|
|
/* Preallocate 2MB JIT code buffer. On AArch64 it may be necessary to generate veneers. */
|
|
loader.code_buffer_size = 2 * 1024 * 1024;
|
|
loader.code_buffer = ir_mem_mmap(loader.code_buffer_size);
|
|
if (!loader.code_buffer) {
|
|
fprintf(stderr, "ERROR: Cannot allocate JIT code buffer\n");
|
|
return 0;
|
|
}
|
|
}
|
|
#endif
|
|
|
|
#if HAVE_LLVM
|
|
if (load_llvm_bitcode) {
|
|
if (!ir_load_llvm_bitcode(&loader.loader, input)) {
|
|
fprintf(stderr, "ERROR: Cannot load LLVM file '%s'\n", input);
|
|
return 1;
|
|
}
|
|
goto finish;
|
|
} else if (load_llvm_asm) {
|
|
if (!ir_load_llvm_asm(&loader.loader, input)) {
|
|
fprintf(stderr, "ERROR: Cannot load LLVM file '%s'\n", input);
|
|
return 1;
|
|
}
|
|
goto finish;
|
|
}
|
|
#endif
|
|
|
|
f = fopen(input, "rb");
|
|
if (!f) {
|
|
fprintf(stderr, "ERROR: Cannot open input file '%s'\n", input);
|
|
return 1;
|
|
}
|
|
|
|
ir_loader_init();
|
|
|
|
if (!ir_load(&loader.loader, f)) {
|
|
fprintf(stderr, "ERROR: Cannot load input file '%s'\n", input);
|
|
}
|
|
|
|
fclose(f);
|
|
|
|
|
|
ir_loader_free();
|
|
|
|
#if HAVE_LLVM
|
|
finish:
|
|
#endif
|
|
|
|
if (loader.dump_file && loader.dump_file != stderr) {
|
|
fclose(loader.dump_file);
|
|
}
|
|
if (loader.c_file && loader.c_file != stderr) {
|
|
fclose(loader.c_file);
|
|
}
|
|
if (loader.llvm_file && loader.llvm_file != stderr) {
|
|
fclose(loader.llvm_file);
|
|
}
|
|
|
|
if (dump_size) {
|
|
fprintf(stderr, "\ncode size = %lld\n", (long long int)loader.size);
|
|
}
|
|
|
|
ir_strtab_free(&loader.symtab);
|
|
if (loader.sym) {
|
|
ir_mem_free(loader.sym);
|
|
}
|
|
|
|
if (run && loader.main) {
|
|
int (*func)(void) = loader.main;
|
|
int ret = func();
|
|
fflush(stdout);
|
|
if (ret) {
|
|
fprintf(stderr, "\nexit code = %d\n", ret);
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|