aboutsummaryrefslogtreecommitdiff
path: root/src/codegen/ssa.cpp
diff options
context:
space:
mode:
authorgingerBill <ginger.bill.22@gmail.com>2016-07-30 00:09:30 +0100
committergingerBill <ginger.bill.22@gmail.com>2016-07-30 00:17:13 +0100
commit776dc0e8f1aa506ae0096c78ff10565e56c175e7 (patch)
tree946508a869196a3bf1d005e0ddffd182a1786a1d /src/codegen/ssa.cpp
parent32ab8fcf99df786c264ca566799b022c66cca34b (diff)
Restart LLVM IR SSA generation
This is the third go and I'm going for it!
Diffstat (limited to 'src/codegen/ssa.cpp')
-rw-r--r--src/codegen/ssa.cpp746
1 files changed, 746 insertions, 0 deletions
diff --git a/src/codegen/ssa.cpp b/src/codegen/ssa.cpp
new file mode 100644
index 000000000..d17264f64
--- /dev/null
+++ b/src/codegen/ssa.cpp
@@ -0,0 +1,746 @@
+struct ssaModule;
+struct ssaProcedure;
+struct ssaBlock;
+struct ssaValue;
+
+
+struct ssaModule {
+ CheckerInfo *info;
+ BaseTypeSizes sizes;
+ gbAllocator allocator;
+
+ Map<ssaValue *> values; // Key: Entity *
+ Map<ssaValue *> members; // Key: String
+ i32 global_string_index;
+};
+
+
+struct ssaBlock {
+ i32 id;
+ AstNode *node;
+ Scope *scope;
+ String label;
+ ssaProcedure *parent;
+
+ gbArray(ssaValue *) instructions;
+ gbArray(ssaValue *) values;
+};
+
+struct ssaProcedure {
+ ssaModule *module;
+ String name;
+ Entity *entity;
+ DeclarationInfo *decl;
+ AstNode *type_expr;
+ AstNode *body;
+
+ gbArray(ssaValue *) blocks;
+ ssaBlock *curr_block;
+};
+
+
+struct ssaLocal {
+ Entity *entity;
+};
+struct ssaGlobal {
+ b32 generated;
+ Entity *entity;
+ ssaValue *value;
+};
+struct ssaStore {
+ ssaValue *address;
+ ssaValue *value;
+};
+struct ssaLoad {
+ ssaValue *address;
+};
+struct ssaBinaryOp {
+ Token op;
+ ssaValue *left, *right;
+};
+struct ssaGetElementPtr {
+ ssaValue *address;
+ Type *result_type;
+ Type *element_type;
+ gbArray(ssaValue *) indices;
+};
+
+enum ssaInstructionKind {
+ ssaInstruction_Invalid,
+
+ ssaInstruction_Local,
+ ssaInstruction_Store,
+ ssaInstruction_Load,
+ ssaInstruction_GetElementPtr,
+
+ ssaInstruction_BinaryOp,
+
+ ssaInstruction_Count,
+};
+
+struct ssaInstruction {
+ ssaInstructionKind kind;
+
+ ssaBlock *parent;
+ Type *type;
+ TokenPos pos;
+
+ union {
+ ssaLocal local;
+ ssaStore store;
+ ssaLoad load;
+ ssaGetElementPtr get_element_ptr;
+
+ ssaBinaryOp binary_op;
+ };
+};
+
+
+enum ssaValueKind {
+ ssaValue_Invalid,
+
+ ssaValue_TypeName,
+ ssaValue_Global,
+ ssaValue_Procedure,
+ ssaValue_Constant,
+
+ ssaValue_Block,
+ ssaValue_Instruction,
+
+ ssaValue_Count,
+};
+
+struct ssaValue {
+ ssaValueKind kind;
+ i32 id;
+
+ union {
+ Entity * type_name;
+ ssaGlobal global;
+ ssaProcedure procedure;
+ TypeAndValue constant;
+ ssaBlock block;
+ ssaInstruction instruction;
+ };
+};
+
+enum ssaLvalueKind {
+ ssaLvalue_Blank,
+ ssaLvalue_Address,
+
+ ssaLvalue_Count,
+};
+
+struct ssaLvalue {
+ ssaLvalueKind kind;
+ union {
+ struct {} blank;
+ struct {
+ ssaValue *value;
+ AstNode *expr;
+ } address;
+ };
+};
+
+void ssa_module_init(ssaModule *m, Checker *c) {
+ m->allocator = gb_heap_allocator();
+ m->info = &c->info;
+ m->sizes = c->sizes;
+
+ map_init(&m->values, m->allocator);
+ map_init(&m->members, m->allocator);
+}
+
+void ssa_module_destroy(ssaModule *m) {
+ map_destroy(&m->values);
+ map_destroy(&m->members);
+}
+
+void ssa_module_add_value(ssaModule *m, Entity *e, ssaValue *v) {
+ map_set(&m->values, hash_pointer(e), v);
+}
+
+
+Type *ssa_value_type(ssaValue *value);
+
+Type *ssa_instruction_type(ssaInstruction *instr) {
+ switch (instr->kind) {
+ case ssaInstruction_Local:
+ return instr->local.entity->type;
+ case ssaInstruction_Store:
+ return ssa_value_type(instr->store.address);
+ case ssaInstruction_Load:
+ return ssa_value_type(instr->load.address);
+ }
+ return NULL;
+}
+
+Type *ssa_value_type(ssaValue *value) {
+ switch (value->kind) {
+ case ssaValue_TypeName:
+ return value->type_name->type;
+ case ssaValue_Global:
+ return value->global.entity->type;
+ case ssaValue_Procedure:
+ return value->procedure.entity->type;
+ case ssaValue_Constant:
+ return value->constant.type;
+ case ssaValue_Instruction:
+ return ssa_instruction_type(&value->instruction);
+ }
+ return NULL;
+}
+
+
+
+
+
+
+
+
+
+
+
+ssaValue *ssa_alloc_value(gbAllocator a, ssaValueKind kind) {
+ ssaValue *v = gb_alloc_item(a, ssaValue);
+ v->kind = kind;
+ return v;
+}
+
+ssaValue *ssa_alloc_instruction(gbAllocator a, ssaInstructionKind kind) {
+ ssaValue *v = ssa_alloc_value(a, ssaValue_Instruction);
+ v->instruction.kind = kind;
+ return v;
+}
+
+ssaValue *ssa_make_value_type_name(gbAllocator a, Entity *e) {
+ ssaValue *v = ssa_alloc_value(a, ssaValue_TypeName);
+ v->type_name = e;
+ return v;
+}
+
+ssaValue *ssa_make_value_global(gbAllocator a, Entity *e, ssaValue *value) {
+ ssaValue *v = ssa_alloc_value(a, ssaValue_Global);
+ v->global.entity = e;
+ v->global.value = value;
+ return v;
+}
+
+
+
+ssaValue *ssa_make_instruction_local(ssaProcedure *p, Entity *e) {
+ ssaValue *v = ssa_alloc_instruction(p->module->allocator, ssaInstruction_Local);
+ ssaInstruction *i = &v->instruction;
+ i->local.entity = e;
+ if (p->curr_block) {
+ gb_array_append(p->curr_block->values, v);
+ }
+ ssa_module_add_value(p->module, e, v);
+ return v;
+}
+
+
+ssaValue *ssa_make_instruction_store(ssaProcedure *p, ssaValue *address, ssaValue *value) {
+ ssaValue *v = ssa_alloc_instruction(p->module->allocator, ssaInstruction_Store);
+ ssaInstruction *i = &v->instruction;
+ i->store.address = address;
+ i->store.value = value;
+ if (p->curr_block) {
+ gb_array_append(p->curr_block->values, v);
+ }
+ return v;
+}
+
+ssaValue *ssa_make_instruction_load(ssaProcedure *p, ssaValue *address) {
+ ssaValue *v = ssa_alloc_instruction(p->module->allocator, ssaInstruction_Load);
+ ssaInstruction *i = &v->instruction;
+ i->load.address = address;
+ if (p->curr_block) {
+ gb_array_append(p->curr_block->values, v);
+ }
+ return v;
+}
+
+ssaValue *ssa_make_instruction_get_element_ptr(ssaProcedure *p, ssaValue *address) {
+ ssaValue *v = ssa_alloc_instruction(p->module->allocator, ssaInstruction_GetElementPtr);
+ ssaInstruction *i = &v->instruction;
+ i->get_element_ptr.address = address;
+ if (p->curr_block) {
+ gb_array_append(p->curr_block->values, v);
+ }
+ return v;
+}
+
+ssaValue *ssa_make_instruction_binary_op(ssaProcedure *p, Token op, ssaValue *left, ssaValue *right) {
+ ssaValue *v = ssa_alloc_instruction(p->module->allocator, ssaInstruction_BinaryOp);
+ ssaInstruction *i = &v->instruction;
+ i->binary_op.op = op;
+ i->binary_op.left = left;
+ i->binary_op.right = right;
+ if (p->curr_block) {
+ gb_array_append(p->curr_block->values, v);
+ }
+ return v;
+}
+
+
+ssaValue *ssa_make_value_constant(gbAllocator a, Type *type, ExactValue value) {
+ ssaValue *v = ssa_alloc_value(a, ssaValue_Constant);
+ v->constant.type = type;
+ v->constant.value = value;
+ return v;
+}
+
+ssaValue *ssa_make_value_procedure(gbAllocator a, Entity *e, DeclarationInfo *decl, ssaModule *m) {
+ ssaValue *v = ssa_alloc_value(a, ssaValue_Procedure);
+ v->procedure.module = m;
+ v->procedure.entity = e;
+ v->procedure.decl = decl;
+ v->procedure.name = e->token.string;
+ return v;
+}
+
+ssaValue *ssa_make_value_block(gbAllocator a, ssaProcedure *proc, AstNode *node, Scope *scope, String label) {
+ ssaValue *v = ssa_alloc_value(a, ssaValue_Block);
+ v->block.label = label;
+ v->block.node = node;
+ v->block.scope = scope;
+ v->block.parent = proc;
+
+ gb_array_init(v->block.instructions, gb_heap_allocator());
+ gb_array_init(v->block.values, gb_heap_allocator());
+
+ return v;
+}
+
+
+
+ssaValue *ssa_add_global_string(ssaProcedure *proc, ExactValue value) {
+ GB_ASSERT(value.kind == ExactValue_String);
+ gbAllocator a = gb_heap_allocator();
+
+
+ isize max_len = 4+8+1;
+ u8 *str = cast(u8 *)gb_alloc_array(a, u8, max_len);
+ isize len = gb_snprintf(cast(char *)str, max_len, ".str%x", proc->module->global_string_index);
+ proc->module->global_string_index++;
+
+ String name = make_string(str, len-1);
+ Token token = {Token_String};
+ token.string = name;
+ Type *type = &basic_types[Basic_string];
+ Entity *entity = make_entity_constant(a, NULL, token, type, value);
+ ssaValue *v = ssa_make_value_constant(a, type, value);
+
+
+ ssaValue *g = ssa_make_value_global(a, entity, v);
+ g->global.generated = true;
+
+ map_set(&proc->module->values, hash_pointer(entity), g);
+ map_set(&proc->module->members, hash_string(name), g);
+
+ return g;
+}
+
+
+ssaValue *ssa_add_block(ssaProcedure *proc, AstNode *node, String label) {
+ gbAllocator a = proc->module->allocator;
+ Scope *scope = NULL;
+ Scope **found = map_get(&proc->module->info->scopes, hash_pointer(node));
+ if (found) scope = *found;
+ ssaValue *block = ssa_make_value_block(a, proc, node, scope, label);
+ gb_array_append(proc->blocks, block);
+ return block;
+}
+
+
+
+void ssa_begin_procedure_body(ssaProcedure *proc) {
+ gb_array_init(proc->blocks, gb_heap_allocator());
+ ssaValue *b = ssa_add_block(proc, proc->body, make_string("entry"));
+ proc->curr_block = &b->block;
+}
+
+
+void ssa_end_procedure_body(ssaProcedure *proc) {
+
+// Number registers
+ i32 reg_id = 0;
+ gb_for_array(i, proc->blocks) {
+ ssaBlock *b = &proc->blocks[i]->block;
+ gb_for_array(j, b->instructions) {
+ ssaValue *value = b->instructions[j];
+ ssaInstruction *instr = &value->instruction;
+ if (instr->kind == ssaInstruction_Store) {
+ continue;
+ }
+ value->id = reg_id;
+ reg_id++;
+ }
+ }
+}
+
+
+b32 ssa_is_blank_identifier(AstNode *i) {
+ GB_ASSERT(i->kind == AstNode_Identifier);
+ return are_strings_equal(i->identifier.token.string, make_string("_"));
+}
+
+
+ssaValue *ssa_block_emit(ssaBlock *b, ssaValue *instr) {
+ instr->instruction.parent = b;
+ gb_array_append(b->instructions, instr);
+ return instr;
+}
+
+ssaValue *ssa_emit(ssaProcedure *proc, ssaValue *instr) {
+ return ssa_block_emit(proc->curr_block, instr);
+}
+
+
+ssaValue *ssa_add_local(ssaProcedure *proc, Entity *e) {
+ ssaValue *instr = ssa_make_instruction_local(proc, e);
+ ssa_emit(proc, instr);
+ return instr;
+}
+
+ssaValue *ssa_add_local_for_identifier(ssaProcedure *proc, AstNode *name) {
+ Entity **found = map_get(&proc->module->info->definitions, hash_pointer(name));
+ if (found) {
+ return ssa_add_local(proc, *found);
+ }
+ return NULL;
+}
+
+
+ssaValue *ssa_emit_store(ssaProcedure *p, ssaValue *address, ssaValue *value) {
+ ssaValue *store = ssa_make_instruction_store(p, address, value);
+ ssa_emit(p, store);
+ return store;
+}
+
+ssaValue *ssa_emit_load(ssaProcedure *p, ssaValue *address) {
+ ssaValue *v = ssa_make_instruction_load(p, address);
+ ssa_emit(p, v);
+ return v;
+}
+
+ssaValue *ssa_lvalue_store(ssaLvalue lval, ssaProcedure *p, ssaValue *value) {
+ switch (lval.kind) {
+ case ssaLvalue_Address:
+ return ssa_emit_store(p, lval.address.value, value);
+ }
+ GB_PANIC("Illegal lvalue store");
+ return NULL;
+}
+
+ssaValue *ssa_lvalue_load(ssaLvalue lval, ssaProcedure *p) {
+ switch (lval.kind) {
+ case ssaLvalue_Address:
+ return ssa_emit_load(p, lval.address.value);
+ }
+ GB_PANIC("Illegal lvalue load");
+ return NULL;
+}
+
+
+ssaValue *ssa_lvalue_address(ssaLvalue lval, ssaProcedure *p) {
+ switch (lval.kind) {
+ case ssaLvalue_Address:
+ return lval.address.value;
+ }
+ return NULL;
+}
+
+ssaValue *ssa_build_expression(ssaProcedure *proc, AstNode *expr);
+ssaValue *ssa_build_single_expression(ssaProcedure *proc, AstNode *expr, TypeAndValue *tv);
+
+ssaValue *ssa_emit_conversion(ssaProcedure *proc, ssaValue *value, Type *a_type) {
+ Type *b_type = ssa_value_type(value);
+ if (are_types_identical(a_type, b_type))
+ return value;
+
+ Type *a = get_base_type(a_type);
+ Type *b = get_base_type(b_type);
+
+ if (value->kind == ssaValue_Constant) {
+ if (a->kind == Type_Basic)
+ return ssa_make_value_constant(proc->module->allocator, a_type, value->constant.value);
+ }
+
+ GB_PANIC("TODO(bill): ssa_emit_conversion");
+
+ return NULL;
+}
+
+ssaValue *ssa_emit_arith(ssaProcedure *proc, Token op, ssaValue *left, ssaValue *right, Type *type) {
+ switch (op.kind) {
+ case Token_Add:
+ case Token_Sub:
+ case Token_Mul:
+ case Token_Quo:
+ case Token_Mod:
+ case Token_And:
+ case Token_Or:
+ case Token_Xor:
+ case Token_AndNot:
+ left = ssa_emit_conversion(proc, left, type);
+ right = ssa_emit_conversion(proc, right, type);
+ break;
+ }
+
+ ssaValue *v = ssa_make_instruction_binary_op(proc, op, left, right);
+ return ssa_emit(proc, v);
+}
+
+ssaValue *ssa_build_single_expression(ssaProcedure *proc, AstNode *expr, TypeAndValue *tv) {
+ switch (expr->kind) {
+ case AstNode_Identifier: {
+ Entity *e = *map_get(&proc->module->info->uses, hash_pointer(expr));
+ if (e->kind == Entity_Builtin) {
+ // TODO(bill): Entity_Builtin
+ return NULL;
+ }
+
+ auto *found = map_get(&proc->module->values, hash_pointer(e));
+ if (found) {
+ return ssa_emit_load(proc, *found);
+ }
+ } break;
+
+ case AstNode_UnaryExpression: {
+ auto *ue = &expr->unary_expression;
+ switch (ue->op.kind) {
+ case Token_Add:
+ return ssa_build_expression(proc, ue->operand);
+ case Token_Sub:
+ return NULL;
+ case Token_Xor:
+ return NULL;
+ case Token_Not:
+ return NULL;
+ case Token_Pointer:
+ return NULL;
+ }
+ } break;
+
+ case AstNode_BinaryExpression: {
+ auto *be = &expr->binary_expression;
+ switch (be->op.kind) {
+ case Token_Add:
+ case Token_Sub:
+ case Token_Mul:
+ case Token_Quo:
+ case Token_Mod:
+ case Token_And:
+ case Token_Or:
+ case Token_Xor:
+ case Token_AndNot:
+ return ssa_emit_arith(proc, be->op,
+ ssa_build_expression(proc, be->left),
+ ssa_build_expression(proc, be->right),
+ tv->type);
+ }
+ } break;
+ case AstNode_ProcedureLiteral:
+ break;
+ case AstNode_CastExpression:
+ break;
+ case AstNode_CallExpression:
+ break;
+ case AstNode_SliceExpression:
+ break;
+ case AstNode_IndexExpression:
+ break;
+ case AstNode_SelectorExpression:
+ break;
+ }
+
+ GB_PANIC("Unexpected expression");
+ return NULL;
+}
+
+
+ssaValue *ssa_build_expression(ssaProcedure *proc, AstNode *expr) {
+ expr = unparen_expression(expr);
+
+ TypeAndValue *tv = map_get(&proc->module->info->types, hash_pointer(expr));
+ if (tv) {
+ if (tv->value.kind != ExactValue_Invalid) {
+ if (tv->value.kind == ExactValue_String) {
+ ssaValue *global_str = ssa_add_global_string(proc, tv->value);
+ return ssa_emit_load(proc, global_str);
+ }
+ return ssa_make_value_constant(proc->module->allocator, tv->type, tv->value);
+ }
+
+ ssaValue *value = NULL;
+ if (tv->mode == Addressing_Variable) {
+ gb_printf("!Addressable!\n");
+ // TODO(bill): Addressing_Variable
+ } else {
+ value = ssa_build_single_expression(proc, expr, tv);
+ }
+
+ return value;
+ }
+ return NULL;
+}
+
+
+ssaLvalue ssa_build_address(ssaProcedure *proc, AstNode *expr) {
+ switch (expr->kind) {
+ case AstNode_Identifier: {
+ if (!ssa_is_blank_identifier(expr)) {
+ Entity *e = entity_of_identifier(proc->module->info, expr);
+
+ ssaLvalue val = {ssaLvalue_Address};
+ val.address.expr = expr;
+ ssaValue **found = map_get(&proc->module->values, hash_pointer(e));
+ if (found) {
+ val.address.value = *found;
+ }
+ return val;
+ }
+ } break;
+
+ case AstNode_ParenExpression:
+ return ssa_build_address(proc, unparen_expression(expr));
+
+ case AstNode_DereferenceExpression: {
+ ssaLvalue val = {ssaLvalue_Address};
+ val.address.value = ssa_build_expression(proc, expr);
+ val.address.expr = expr;
+ return val;
+ } break;
+
+ case AstNode_SelectorExpression:
+ break;
+
+ case AstNode_IndexExpression:
+ break;
+
+ // TODO(bill): Others address
+ }
+
+ ssaLvalue blank = {ssaLvalue_Blank};
+ return blank;
+}
+
+void ssa_build_statement(ssaProcedure *proc, AstNode *s);
+
+void ssa_build_statement_list(ssaProcedure *proc, AstNode *list) {
+ for (AstNode *stmt = list ; stmt != NULL; stmt = stmt->next)
+ ssa_build_statement(proc, stmt);
+}
+
+void ssa_build_statement(ssaProcedure *proc, AstNode *s) {
+ switch (s->kind) {
+ case AstNode_EmptyStatement:
+ break;
+ case AstNode_VariableDeclaration: {
+ auto *vd = &s->variable_declaration;
+ if (vd->kind == Declaration_Mutable) {
+ if (vd->name_count == vd->value_count) { // 1:1 assigment
+
+ } else if (vd->value_count == 0) { // declared and zero-initialized
+ for (AstNode *name = vd->name_list; name != NULL; name = name->next) {
+ if (!ssa_is_blank_identifier(name)) {
+ // TODO(bill): add local
+ ssa_add_local_for_identifier(proc, name);
+ }
+ }
+ } else { // Tuple(s)
+ GB_PANIC("TODO(bill): tuple assignment variable declaration");
+ }
+ }
+ } break;
+
+ case AstNode_AssignStatement: {
+ auto *assign = &s->assign_statement;
+ switch (assign->op.kind) {
+ case Token_Eq: {
+ gbArray(ssaLvalue) lvals;
+ gb_array_init(lvals, gb_heap_allocator());
+ defer (gb_array_free(lvals));
+
+ for (AstNode *lhs = assign->lhs_list;
+ lhs != NULL;
+ lhs = lhs->next) {
+ ssaLvalue lval = {};
+ if (!ssa_is_blank_identifier(lhs)) {
+ lval = ssa_build_address(proc, lhs);
+ }
+ gb_array_append(lvals, lval);
+ }
+
+ if (assign->lhs_count == assign->rhs_count) {
+ if (assign->lhs_count == 1) {
+ AstNode *lhs = assign->lhs_list;
+ AstNode *rhs = assign->rhs_list;
+ ssaValue *init = ssa_build_expression(proc, rhs);
+ ssa_lvalue_store(lvals[0], proc, init);
+ } else {
+ GB_PANIC("TODO(bill): parallel assignment");
+ }
+ } else {
+ GB_PANIC("TODO(bill): tuple assignment");
+ }
+
+ } break;
+
+ default: // +=, -=, etc
+ break;
+ }
+ } break;
+
+ case AstNode_ExpressionStatement:
+ ssa_build_expression(proc, s->expression_statement.expression);
+ break;
+
+ case AstNode_BlockStatement:
+ ssa_build_statement_list(proc, s->block_statement.list);
+ break;
+ }
+}
+
+
+
+void ssa_build_procedure(ssaValue *value) {
+ ssaProcedure *proc = &value->procedure;
+
+ gb_printf("Building %.*s: %.*s\n", LIT(entity_strings[proc->entity->kind]), LIT(proc->name));
+
+
+ AstNode *proc_decl = proc->decl->proc_decl;
+ switch (proc_decl->kind) {
+ case AstNode_ProcedureDeclaration:
+ proc->type_expr = proc_decl->procedure_declaration.type;
+ proc->body = proc_decl->procedure_declaration.body;
+ break;
+ default:
+ return;
+ }
+
+ if (proc->body == NULL) {
+ // TODO(bill): External procedure
+ return;
+ }
+
+
+ ssa_begin_procedure_body(proc);
+ ssa_build_statement(proc, proc->body);
+ ssa_end_procedure_body(proc);
+
+}
+
+
+
+
+
+
+
+
+
+
+