2018-02-02 00:26:31 -05:00
|
|
|
import io:*
|
|
|
|
|
import mem:*
|
|
|
|
|
import map:*
|
|
|
|
|
import hash_map:*
|
|
|
|
|
import stack:*
|
|
|
|
|
import string:*
|
|
|
|
|
import util:*
|
|
|
|
|
import tree:*
|
|
|
|
|
import symbol:*
|
|
|
|
|
import ast_nodes:*
|
|
|
|
|
// for error with syntax tree
|
|
|
|
|
import pass_common:*
|
|
|
|
|
import poset:*
|
|
|
|
|
|
2018-02-27 23:53:08 +00:00
|
|
|
// Size in bytes of a value of type t.
// This is simply the size half of type_size_and_alignment.
fun type_size(t: *type): ulong {
    var size_and_align = type_size_and_alignment(t)
    return size_and_align.first
}
|
|
|
|
|
// Computes the pair (size, alignment), both in bytes, for a value of type t.
//  - anything with indirection, and function values, are pointer sized
//  - primitives use their own size as their alignment
//  - objects place members in declaration order, padding each member up to
//    its own alignment and padding the end up to the strictest member alignment
//  - unions are as large as their largest member (plus the same end padding)
// Calls error() for a base type that is not handled below.
fun type_size_and_alignment(t: *type): pair<ulong,ulong> {
    // any level of indirection is just a pointer
    if (t->indirection)
        return make_pair(#sizeof<*void>, #sizeof<*void>)
    match (t->base) {
        base_type::object() {
            var running_size: ulong = 0
            var largest_member: ulong = 0
            var strictest_align: ulong = 0
            for (var idx = 0; idx < t->type_def->type_def.variables.size; idx++;) {
                var member = type_size_and_alignment(t->type_def->type_def.variables[idx]->declaration_statement.identifier->identifier.type)
                largest_member = max(largest_member, member.first)
                strictest_align = max(strictest_align, member.second)
                // bytes needed to bring the running size up to this member's alignment
                var padding = 0
                if (member.second != 0)
                    padding = (member.second - (running_size % member.second)) % member.second
                running_size += member.first + padding
            }
            // all union members overlap, so only the largest one counts
            if (t->type_def->type_def.is_union)
                running_size = largest_member
            // round up so that consecutive objects in memory stay aligned
            if (strictest_align != 0)
                running_size += (strictest_align - (running_size % strictest_align)) % strictest_align
            return make_pair(running_size, strictest_align)
        }
        base_type::function()         return make_pair(#sizeof<*void>, #sizeof<*void>)
        base_type::boolean()          return make_pair(#sizeof<bool>, #sizeof<bool>)
        base_type::character()        return make_pair(#sizeof<char>, #sizeof<char>)
        base_type::ucharacter()       return make_pair(#sizeof<uchar>, #sizeof<uchar>)
        base_type::short_int()        return make_pair(#sizeof<short>, #sizeof<short>)
        base_type::ushort_int()       return make_pair(#sizeof<ushort>, #sizeof<ushort>)
        base_type::integer()          return make_pair(#sizeof<int>, #sizeof<int>)
        base_type::uinteger()         return make_pair(#sizeof<uint>, #sizeof<uint>)
        base_type::long_int()         return make_pair(#sizeof<long>, #sizeof<long>)
        base_type::ulong_int()        return make_pair(#sizeof<ulong>, #sizeof<ulong>)
        base_type::floating()         return make_pair(#sizeof<float>, #sizeof<float>)
        base_type::double_precision() return make_pair(#sizeof<double>, #sizeof<double>)
    }
    error(string("Invalid type for type_size: ") + t->to_string())
}
|
|
|
|
|
|
|
|
|
|
// Byte offset of the member whose identifier node is ident inside struct_type.
// Members are walked in declaration order, each one aligned to its own
// alignment. Every member of a union is at offset 0. If ident is not a member,
// the value returned is the offset just past the last member.
fun offset_into_struct(struct_type: *type, ident: *ast_node): ulong {
    var position: ulong = 0
    if (struct_type->type_def->type_def.is_union)
        return position
    for (var idx = 0; idx < struct_type->type_def->type_def.variables.size; idx++;) {
        var member = struct_type->type_def->type_def.variables[idx]->declaration_statement.identifier
        var member_layout = type_size_and_alignment(member->identifier.type)
        // round the running offset up to this member's alignment
        if (member_layout.second != 0)
            position += (member_layout.second - (position % member_layout.second)) % member_layout.second
        if (member == ident)
            return position
        position += member_layout.first
    }
    return position
}
|
2018-02-02 00:26:31 -05:00
|
|
|
|
2018-03-07 01:58:19 -05:00
|
|
|
// size in bytes of a pointer; the code generator uses it as the size of one stack slot
var register_size = #sizeof<*void>
|
|
|
|
|
// Width, in bits, of the memory access performed by an ldr / str instruction.
adt operand_size {
    b8,
    b16,
    b32,
    b64
}
|
|
|
|
|
// Maps a size in bytes (1, 2, 4 or 8) to the matching operand_size.
// Any other size is reported through error().
fun size_to_operand_size(size: ulong): operand_size {
    if (size == 8)
        return operand_size::b64()
    else if (size == 4)
        return operand_size::b32()
    else if (size == 2)
        return operand_size::b16()
    else if (size == 1)
        return operand_size::b8()
    error("invalid operand size")
}
|
2018-02-02 00:26:31 -05:00
|
|
|
// One bytecode instruction. Variants that carry operands wrap the obj of the
// same name; nop and ret carry none.
adt byte_inst {
    nop,
    imm: imm,
    add: add,
    ldr: ldr,
    str: str,
    jmp: jmp,
    jz: jz,
    call: call,
    ret
}
|
|
|
|
|
// imm: load the constant val into register reg
obj imm {
    var reg: int    // destination register
    var val: long   // constant to load
}
|
2018-02-27 23:53:08 +00:00
|
|
|
// add: to_reg = a + b, where a and b are register numbers
obj add {
    var to_reg: int // destination register
    var a: int      // first source register
    var b: int      // second source register
}
|
2018-02-27 23:53:08 +00:00
|
|
|
// ldr: to_reg = memory[from_reg + offset], reading size bits
obj ldr {
    var to_reg: int         // destination register
    var from_reg: int       // register holding the base address
    var offset: long        // constant added to the base address
    var size: operand_size  // width of the load
}
|
2018-02-27 23:53:08 +00:00
|
|
|
// str: memory[to_reg + offset] = from_reg, writing size bits
obj str {
    var to_reg: int         // register holding the base address
    var offset: long        // constant added to the base address
    var from_reg: int       // register holding the value to store
    var size: operand_size  // width of the store
}
|
2018-02-27 21:27:29 -05:00
|
|
|
// jmp: unconditional jump, pc += offset
obj jmp {
    var offset: long    // displacement relative to this instruction
}
|
2018-02-27 21:41:57 -05:00
|
|
|
// jz: jump by offset when register reg holds 0
obj jz {
    var reg: int        // register that is tested against zero
    var offset: long    // displacement relative to this instruction
}
|
2018-03-07 01:58:19 -05:00
|
|
|
// call: transfer control to the instruction index held in register reg
obj call {
    var reg: int    // register holding the target instruction index
}
|
|
|
|
|
|
|
|
|
|
// Renders an operand_size as its width in bits ("8", "16", "32" or "64").
fun to_string(s: operand_size): string {
    // only survives if a variant is not handled by the match below
    var bits = string("missed operand size")
    match (s) {
        operand_size::b8()  bits = string("8")
        operand_size::b16() bits = string("16")
        operand_size::b32() bits = string("32")
        operand_size::b64() bits = string("64")
    }
    return bits
}
|
2018-02-02 00:26:31 -05:00
|
|
|
|
2018-02-03 18:53:13 -05:00
|
|
|
// Renders a single bytecode instruction in a human readable, assembly-like form.
fun to_string(b: byte_inst): string {
    // only survives if a variant is not handled by the match below
    var text = string("Missed byte_inst case in to_string")
    match (b) {
        byte_inst::nop()    text = string("nop")
        byte_inst::imm(im)  text = string("r") + im.reg + " = imm " + im.val
        byte_inst::add(ad)  text = string("r") + ad.to_reg + " = r" + ad.a + " + r" + ad.b
        byte_inst::ldr(ld)  text = string("r") + ld.to_reg + " = ldr" + to_string(ld.size) + " r" + ld.from_reg + " (" + ld.offset + ")"
        byte_inst::str(st)  text = "str" + to_string(st.size) + " (r" + st.to_reg + "(" + st.offset + ") <= r" + st.from_reg + ")"
        byte_inst::jmp(jm)  text = string("jmp(pc += ") + jm.offset + ")"
        byte_inst::jz(jm)   text = string("jmp(r") + jm.reg + " == 0, pc += " + jm.offset + ")"
        byte_inst::call(ca) text = string("call pc = r") + ca.reg
        byte_inst::ret()    text = string("ret")
    }
    return text
}
|
|
|
|
|
|
2018-03-07 01:58:19 -05:00
|
|
|
// Produces the listing of every function (frame layout plus its slice of
// instructions), with the per-function listings separated by newlines.
fun bytecode_to_string(functions: ref vector<bytecode_function>, instructions: ref vector<byte_inst>): string {
    var listings = functions.map(fun(f: ref bytecode_function): string return f.to_string(instructions);)
    return string("\n").join(listings)
}
|
|
|
|
|
|
2018-03-07 01:58:19 -05:00
|
|
|
// Convenience constructor: builds a bytecode_function called name whose first
// instruction lives at index start of the shared instruction vector.
fun bytecode_function(name: ref string, start: int): bytecode_function {
    var result.construct(name, start): bytecode_function
    return result
}
|
2018-02-27 23:53:08 +00:00
|
|
|
// Book-keeping for one generated function: its name, the half-open range
// [instruction_start, instruction_end) it occupies in the shared instruction
// vector, and the layout of its stack frame.
obj bytecode_function (Object) {
    var name: string
    // index of the function's first instruction
    var instruction_start: int
    // index one past the function's last instruction
    var instruction_end: int
    // frame offset recorded for each parameter / local identifier node
    var var_to_frame_offset: map<*ast_node, int>
    // total number of bytes of frame recorded so far
    var frame_size: int

    // Builds an empty, unnamed function starting at instruction 0.
    fun construct(): *bytecode_function {
        instruction_start = 0
        instruction_end = 0
        name.construct()
        var_to_frame_offset.construct()
        frame_size = 0
        return this
    }
    // Builds an empty function called name_in starting at instruction_start_in.
    fun construct(name_in: ref string, instruction_start_in: int): *bytecode_function {
        instruction_start = instruction_start_in
        instruction_end = 0
        name.copy_construct(&name_in)
        var_to_frame_offset.construct()
        frame_size = 0
        return this
    }
    fun copy_construct(old: *bytecode_function) {
        instruction_start = old->instruction_start
        instruction_end = old->instruction_end
        name.copy_construct(&old->name)
        var_to_frame_offset.copy_construct(&old->var_to_frame_offset)
        frame_size = old->frame_size
    }
    fun operator=(other: ref bytecode_function) {
        // guard against self-assignment: destructing first would otherwise
        // leave us copying from our own already-destroyed members
        if (this != &other) {
            destruct()
            copy_construct(&other)
        }
    }
    fun destruct() {
        name.destruct()
        var_to_frame_offset.destruct()
    }
    // Human readable dump: header, frame layout, then every instruction in
    // [instruction_start, instruction_end) taken from instructions.
    fun to_string(instructions: ref vector<byte_inst>): string {
        var res = name + "(frame size " + frame_size + "):\n"
        res += "\t frame layout\n"
        res += "\t\tsaved RBP : RBP = 0\n"
        var_to_frame_offset.for_each(fun(n: *ast_node, o: int) {
            res += "\t\t" + n->identifier.name + ": RBP - " + o + "\n"
        })
        res += "\n\t bytecode\n"
        for (var i = instruction_start; i < instruction_end; i++;)
            res += string("\t\t") + i + string(": ") + to_string(instructions[i]) + "\n"
        return res
    }
}
|
|
|
|
|
|
|
|
|
|
obj bytecode_generator (Object) {
|
2018-02-03 18:53:13 -05:00
|
|
|
var reg_counter: int
|
2018-02-27 23:53:08 +00:00
|
|
|
var reg_max: int
|
2018-02-02 00:26:31 -05:00
|
|
|
var id_counter: int
|
|
|
|
|
var ast_name_map: hash_map<*ast_node, string>
|
2018-02-27 23:53:08 +00:00
|
|
|
var functions: vector<bytecode_function>
|
2018-03-07 01:58:19 -05:00
|
|
|
var node_function_idx: map<*ast_node, int>
|
|
|
|
|
var instructions: vector<byte_inst>
|
|
|
|
|
var fixup_function_addresses: vector<pair<int, *ast_node>>
|
2018-02-02 00:26:31 -05:00
|
|
|
// Initialises an empty generator.
fun construct(): *bytecode_generator {
    // registers 0, 1 and 2 are used by the generated code as stack pointer,
    // base pointer and return value, so allocation starts at 3
    reg_counter = 3
    reg_max = 3
    id_counter = 0
    ast_name_map.construct()
    functions.construct()
    node_function_idx.construct()
    instructions.construct()
    fixup_function_addresses.construct()
    return this
}
|
|
|
|
|
// Member-wise copy of old into this (assumed not yet constructed) generator.
fun copy_construct(old: *bytecode_generator) {
    // plain counters
    id_counter = old->id_counter
    reg_counter = old->reg_counter
    reg_max = old->reg_max
    // containers
    ast_name_map.copy_construct(&old->ast_name_map)
    functions.copy_construct(&old->functions)
    node_function_idx.copy_construct(&old->node_function_idx)
    instructions.copy_construct(&old->instructions)
    fixup_function_addresses.copy_construct(&old->fixup_function_addresses)
}
|
|
|
|
|
// Assignment: releases the current contents and copies other.
fun operator=(other: ref bytecode_generator) {
    // guard against self-assignment: destructing first would otherwise
    // leave us copying from our own already-destroyed containers
    if (this != &other) {
        destruct()
        copy_construct(&other)
    }
}
|
|
|
|
|
// Releases every container member; the integer counters need no cleanup.
fun destruct() {
    fixup_function_addresses.destruct()
    instructions.destruct()
    node_function_idx.destruct()
    functions.destruct()
    ast_name_map.destruct()
}
|
|
|
|
|
// Returns the current id counter as a string and advances the counter.
fun get_id(): string {
    var id = id_counter
    id_counter++
    return to_string(id)
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Hands out the next unused virtual register number.
fun get_reg(): int {
    var reg = reg_counter
    reg_counter++
    return reg
}
|
2018-02-27 23:53:08 +00:00
|
|
|
// Restarts register allocation at 3, first recording in reg_max the highest
// register count reached so far.
fun reset_reg() {
    if (reg_max < reg_counter)
        reg_max = reg_counter
    reg_counter = 3
}
|
2018-03-07 01:58:19 -05:00
|
|
|
/*fun generate_bytecode(name_ast_map: map<string, pair<*tree<symbol>,*ast_node>>): pair<vector<bytecode_function>, vector<byte_inst>> {*/
|
|
|
|
|
// Generates bytecode for every translation unit in name_ast_map, appending to
// functions / instructions. Afterwards:
//  - every imm recorded in fixup_function_addresses is patched with the start
//    index of the function it refers to
//  - each function's instruction_end is set to the start of the next function
//    (the last one ends at the end of the instruction vector)
fun generate_bytecode(name_ast_map: map<string, pair<*tree<symbol>,*ast_node>>) {
    // iterate through asts
    name_ast_map.for_each(fun(name: string, tree_pair: pair<*tree<symbol>,*ast_node>) {
        // iterate through children for each ast
        // do lambdas separately, so we can reconstitute the enclosing object if it has one
        tree_pair.second->translation_unit.lambdas.for_each(fun(child: *ast_node) {
            generate_function_definition(child)
        })
        tree_pair.second->translation_unit.children.for_each(fun(child: *ast_node) {
            match (*child) {
                ast_node::declaration_statement(backing) generate_declaration_statement(child)
                ast_node::compiler_intrinsic(backing) generate_compiler_intrinsic(child)
                ast_node::function(backing) generate_function_definition(child)
                ast_node::template(backing) {
                    // only instantiations of a template produce code
                    backing.instantiated.for_each(fun(node: *ast_node) {
                        match (*node) {
                            ast_node::function(backing) generate_function_definition(node)
                            ast_node::type_def(backing) {
                                backing.methods.for_each(fun(method: *ast_node) {
                                    if (is_template(method))
                                        method->template.instantiated.for_each(fun(m: *ast_node) generate_function_definition(m);)
                                    else
                                        generate_function_definition(method)
                                })
                            }
                        }
                    })
                }
                ast_node::type_def(backing) {
                    backing.methods.for_each(fun(method: *ast_node) {
                        if (is_template(method))
                            method->template.instantiated.for_each(fun(m: *ast_node) generate_function_definition(m);)
                        else
                            generate_function_definition(method)
                    })
                }
            }
        })
    })
    // now that every function has a start index, patch the placeholder imms
    fixup_function_addresses.for_each(fun(p: pair<int, *ast_node>) {
        instructions[p.first].imm.val = functions[node_function_idx[p.second]].instruction_start
    })
    // nothing to delimit if no function was generated; functions.last()
    // would otherwise be called on an empty vector
    if (functions.size > 0) {
        for (var i = 0; i < functions.size - 1; i++;)
            functions[i].instruction_end = functions[i+1].instruction_start
        functions.last().instruction_end = instructions.size
    }
    /*return make_pair(functions, instructions)*/
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Starts a new bytecode_function for node, records frame offsets for its
// parameters, emits the prologue, generates the body and finally patches the
// frame-allocation immediate with the final frame size. Always returns -1.
// Register 0 acts as the stack pointer and register 1 as the base pointer.
fun generate_function_definition(node: *ast_node): int {
    reset_reg()
    node_function_idx[node] = functions.size
    functions.add(bytecode_function(get_name(node), instructions.size))
    node->function.parameters.for_each(fun(param: *ast_node) {
        functions.last().var_to_frame_offset[param] = functions.last().frame_size
        functions.last().frame_size += type_size(param->identifier.type)
    })

    // push rbp onto the stack, which grows towards negative addresses
    var slot_reg = emit_imm(-register_size)
    emit_add(0, 0, slot_reg)
    emit_str(0, 0, 1, operand_size::b64()) // rsp[0] <= rbp
    // rbp = rsp
    var zero_reg = emit_imm(0)
    emit_add(1, 0, zero_reg)

    // rsp += <placeholder>; the imm emitted here is rewritten below to
    // -frame_size once the body has declared all of its locals
    var frame_imm_idx = instructions.size
    var frame_reg = emit_imm(0)
    emit_add(0, 0, frame_reg)

    generate(node->function.body_statement)

    instructions[frame_imm_idx].imm.val = -functions.last().frame_size
    return -1
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Reserves frame space for the declared variable in the function currently
// being generated and, when there is an initializer, stores its value into
// that slot. Always returns -1.
fun generate_declaration_statement(node: *ast_node): int {
    var identifier = node->declaration_statement.identifier
    var ident_type = identifier->identifier.type
    // grow the frame first: the recorded offset is the distance below rbp
    functions.last().frame_size += type_size(ident_type)
    functions.last().var_to_frame_offset[identifier] = functions.last().frame_size
    if (node->declaration_statement.expression) {
        var value_reg = generate(node->declaration_statement.expression)
        // the slot lives at rbp - offset; generate_identifier reads and
        // addresses it with the negated offset, so the store must too
        emit_str(1, -functions.last().var_to_frame_offset[identifier], value_reg, size_to_operand_size(type_size(get_ast_type(identifier))))
    }
    return -1
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Evaluates the right hand side, then the address of the left hand side
// (generated as an lvalue), and stores the value there. Always returns -1.
fun generate_assignment_statement(node: *ast_node): int {
    var value_reg = generate(node->assignment_statement.from)
    var address_reg = generate(node->assignment_statement.to, true)
    var width = size_to_operand_size(type_size(get_ast_type(node->assignment_statement.to)))
    emit_str(address_reg, 0, value_reg, width)
    return -1
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Emits: condition; jz over the then part; then part; and, when there is an
// else part, a jmp over it followed by the else part. Both jumps are emitted
// with offset 0 and patched once their targets are known. Always returns -1.
fun generate_if_statement(node: *ast_node): int {
    var condition_reg = generate(node->if_statement.condition)
    var skip_then_idx = instructions.size
    emit_jz(condition_reg, 0)
    generate(node->if_statement.then_part)
    if (node->if_statement.else_part) {
        var skip_else_idx = instructions.size
        emit_jmp(0)
        // a false condition lands on the first instruction of the else part
        instructions[skip_then_idx].jz.offset = instructions.size - skip_then_idx
        generate(node->if_statement.else_part)
        // the end of the then part jumps past the else part
        instructions[skip_else_idx].jmp.offset = instructions.size - skip_else_idx
    } else {
        // a false condition lands just past the then part
        instructions[skip_then_idx].jz.offset = instructions.size - skip_then_idx
    }
    return -1
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Emits a while loop:
//      top:  <condition>
//            jz  cond, end
//            <body>
//            jmp top
//      end:
// Jump offsets are relative to the jump instruction's own index. Always
// returns -1.
// NOTE: break / continue are still emitted as nops by
// generate_branching_statement, so they do not affect the loop.
fun generate_while_loop(node: *ast_node): int {
    var loop_top = instructions.size
    var condition_reg = generate(node->while_loop.condition)
    var exit_jz_idx = instructions.size
    emit_jz(condition_reg, 0)
    generate(node->while_loop.statement)
    // instructions.size is the index the jmp is about to occupy, so this is
    // the (negative) distance back to the condition
    emit_jmp(loop_top - instructions.size)
    // a false condition lands just past the back jump
    instructions[exit_jz_idx].jz.offset = instructions.size - exit_jz_idx
    return -1
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Emits a for loop:
//            <init>
//      top:  <condition>
//            jz  cond, end
//            <body>
//            <update>
//            jmp top
//      end:
// init, condition and update are each optional; without a condition no exit
// jump is emitted. Jump offsets are relative to the jump instruction's own
// index. Always returns -1.
// NOTE: break / continue are still emitted as nops by
// generate_branching_statement, so they do not affect the loop.
fun generate_for_loop(node: *ast_node): int {
    if (node->for_loop.init)
        generate(node->for_loop.init)
    var loop_top = instructions.size
    // index of the exit jz, or -1 when the loop has no condition
    var exit_jz_idx = -1
    if (node->for_loop.condition) {
        var condition_reg = generate(node->for_loop.condition)
        exit_jz_idx = instructions.size
        emit_jz(condition_reg, 0)
    }
    generate(node->for_loop.body)
    if (node->for_loop.update)
        generate(node->for_loop.update)
    // instructions.size is the index the jmp is about to occupy, so this is
    // the (negative) distance back to the condition
    emit_jmp(loop_top - instructions.size)
    if (exit_jz_idx >= 0)
        instructions[exit_jz_idx].jz.offset = instructions.size - exit_jz_idx
    return -1
}
|
2018-02-03 22:47:21 -05:00
|
|
|
// For an lvalue, returns a register holding the address of the variable's
// frame slot (rbp - offset). Otherwise returns a register loaded with the
// variable's value from that slot.
fun generate_identifier(node: *ast_node, lvalue: bool): int {
    var frame_offset = functions.last().var_to_frame_offset[node]
    if (lvalue)
        return emit_add(1, emit_imm(-frame_offset))
    return emit_ldr(1, -frame_offset, size_to_operand_size(type_size(get_ast_type(node))))
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Emits a return: the optional return value is moved into register 2, then
// the frame is torn down and ret is emitted. Always returns -1.
// The teardown is needed for value-less returns too: ret takes its return
// address from the stack pointer, which must first be moved back past the
// locals and the saved base pointer.
fun generate_return_statement(node: *ast_node): int {
    if (node->return_statement.return_value) {
        /*emit_str(1, register_size, generate(node->return_statement.return_value))*/
        // r2 = 0 + value
        emit_add(2, emit_imm(0), generate(node->return_statement.return_value))
    }
    // rsp = rbp + register_size, i.e. pop the locals and the saved rbp
    emit_add(0, 1, emit_imm(register_size))
    // rbp = saved rbp
    emit_ldr(1, 1, 0, operand_size::b64())
    emit_ret()
    return -1
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// break and continue are placeholders for now: each one emits a single nop.
// Always returns -1.
fun generate_branching_statement(node: *ast_node): int {
    match (node->branching_statement.b_type) {
        branching_type::break_stmt() {
            instructions.add(byte_inst::nop())
        }
        branching_type::continue_stmt() {
            instructions.add(byte_inst::nop())
        }
    }
    return -1
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// A cast emits no conversion code: the register of the inner value is returned as is.
fun generate_cast(node: *ast_node): int {
    var inner_reg = generate(node->cast.value)
    return inner_reg
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Loads a literal into a fresh register and returns that register.
// Booleans become 1 ("true") or 0; every other literal is parsed as an int.
fun generate_value(node: *ast_node): int {
    var literal = 0
    if (node->value.value_type->is_bool())
        literal = (node->value.string_value == "true") cast int
    else
        literal = string_to_num<int>(node->value.string_value)
    return emit_imm(literal)
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Generates every statement of the block in order. Always returns -1.
fun generate_code_block(node: *ast_node): int {
    node->code_block.children.for_each(fun(statement: *ast_node) {
        // no register value is carried from one statement to the next,
        // so numbering can restart for each of them
        reset_reg()
        generate(statement)
    })
    return -1
}
|
|
|
|
|
// this generates the function as a value, not the actual function
|
2018-02-03 18:53:13 -05:00
|
|
|
// Produces the function as a value: an imm holding the placeholder -2 is
// emitted and its index is recorded in fixup_function_addresses so that
// generate_bytecode can replace it with the function's start index.
// Returns the register that receives the address.
fun generate_function(node: *ast_node): int {
    // the imm emitted below will sit at this index
    var imm_idx = instructions.size
    fixup_function_addresses.add(make_pair(imm_idx, node))
    return emit_imm(-2)
}
|
2018-02-03 22:47:21 -05:00
|
|
|
// Generates each argument expression (their result registers are not used
// further here), then loads the callee's address and emits the call.
// Returns the register emit_call reports for the call's result.
fun generate_function_call(node: *ast_node, lvalue: bool): int {
    node->function_call.parameters.for_each(fun(argument: *ast_node) {
        generate(argument)
    })
    var target_reg = generate_function(node->function_call.func)
    return emit_call(target_reg)
}
|
|
|
|
|
|
2018-02-03 18:53:13 -05:00
|
|
|
// Compiler intrinsics are placeholders for now: a single nop is emitted.
// Always returns -1.
fun generate_compiler_intrinsic(node: *ast_node): int {
    var placeholder = byte_inst::nop()
    instructions.add(placeholder)
    return -1
}
|
|
|
|
|
|
2018-02-03 22:47:21 -05:00
|
|
|
// Generates node as an rvalue.
fun generate(node: *ast_node): int {
    return generate(node, false)
}
|
|
|
|
|
// Dispatches on the kind of node to the matching generate_* method and
// returns whatever that method returns. lvalue is only forwarded to
// function calls and identifiers. Any other node kind ends in error().
fun generate(node: *ast_node, lvalue: bool): int {
    match (*node) {
        // statements
        ast_node::declaration_statement(backing)    return generate_declaration_statement(node)
        ast_node::assignment_statement(backing)     return generate_assignment_statement(node)
        ast_node::if_statement(backing)             return generate_if_statement(node)
        ast_node::while_loop(backing)               return generate_while_loop(node)
        ast_node::for_loop(backing)                 return generate_for_loop(node)
        ast_node::function(backing)                 return generate_function(node)
        ast_node::function_call(backing)            return generate_function_call(node, lvalue)
        ast_node::compiler_intrinsic(backing)       return generate_compiler_intrinsic(node)
        ast_node::code_block(backing)               return generate_code_block(node)
        ast_node::return_statement(backing)         return generate_return_statement(node)
        ast_node::branching_statement(backing)      return generate_branching_statement(node)
        // expressions
        ast_node::cast(backing)                     return generate_cast(node)
        ast_node::value(backing)                    return generate_value(node)
        ast_node::identifier(backing)               return generate_identifier(node, lvalue)
    }
    error("Bad node")
}
|
|
|
|
|
// Returns the emitted name for node, creating and caching it on first use.
// New names are the ast name followed by a fresh id, except that a function
// called "main" is always named exactly "main".
fun get_name(node: *ast_node): string {
    var cached = ast_name_map.get_ptr_or_null(node)
    if (cached)
        return *cached
    // the id is drawn before the "main" check, so main consumes one as well
    var fresh_name = get_ast_name(node) + get_id()
    if (is_function(node) && node->function.name == "main")
        fresh_name = "main"
    ast_name_map.set(node, fresh_name)
    return fresh_name
}
|
2018-03-06 23:30:00 -05:00
|
|
|
// ulong convenience overload: the value is cast to int and emitted as an imm.
fun emit_imm(value: ulong): int {
    var narrowed = (value) cast int
    return emit_imm(narrowed)
}
|
2018-02-03 18:53:13 -05:00
|
|
|
// Emits "reg = imm value" into a freshly allocated register and returns it.
fun emit_imm(value: int): int {
    var inst: imm
    inst.val = value
    inst.reg = get_reg()
    instructions.add(byte_inst::imm(inst))
    return inst.reg
}
|
2018-02-27 23:53:08 +00:00
|
|
|
// Emits "fresh = a + b" into a newly allocated register and returns it.
fun emit_add(a: int, b: int): int {
    var dest = get_reg()
    return emit_add(dest, a, b)
}
|
|
|
|
|
// Emits "dest = a + b" (all three are register numbers) and returns dest.
fun emit_add(dest: int, a: int, b: int): int {
    var inst: add
    inst.a = a
    inst.b = b
    inst.to_reg = dest
    instructions.add(byte_inst::add(inst))
    return inst.to_reg
}
|
2018-03-07 01:58:19 -05:00
|
|
|
// Emits a load of size bits from [reg + offset] into a newly allocated
// register and returns that register.
fun emit_ldr(reg: int, offset: int, size: operand_size): int {
    var dest = get_reg()
    return emit_ldr(dest, reg, offset, size)
}
|
|
|
|
|
// Emits "dest = load size bits from [reg + offset]" and returns dest.
fun emit_ldr(dest: int, reg: int, offset: int, size: operand_size): int {
    var inst: ldr
    inst.size = size
    inst.offset = offset
    inst.from_reg = reg
    inst.to_reg = dest
    instructions.add(byte_inst::ldr(inst))
    return inst.to_reg
}
|
2018-03-07 01:58:19 -05:00
|
|
|
// Emits "store size bits of from_reg to [to_reg + offset]". Always returns -1.
fun emit_str(to_reg: int, offset: int, from_reg: int, size: operand_size): int {
    var inst: str
    inst.size = size
    inst.from_reg = from_reg
    inst.offset = offset
    inst.to_reg = to_reg
    instructions.add(byte_inst::str(inst))
    return -1
}
|
2018-02-27 21:27:29 -05:00
|
|
|
// Emits an unconditional relative jump by offset. Always returns -1.
fun emit_jmp(offset: int): int {
    var inst: jmp
    inst.offset = offset
    instructions.add(byte_inst::jmp(inst))
    return -1
}
|
2018-02-27 21:41:57 -05:00
|
|
|
// Emits a relative jump by offset that is taken when reg holds 0.
// Always returns -1.
fun emit_jz(reg: int, offset: int): int {
    var inst: jz
    inst.offset = offset
    inst.reg = reg
    instructions.add(byte_inst::jz(inst))
    return -1
}
|
2018-02-27 23:53:08 +00:00
|
|
|
// Emits a ret instruction. Always returns -1.
fun emit_ret(): int {
    var inst = byte_inst::ret()
    instructions.add(inst)
    return -1
}
|
2018-03-07 01:58:19 -05:00
|
|
|
// Emits a call to the instruction index held in reg.
// Returns 2, the register return statements place their value in.
fun emit_call(reg: int): int {
    var inst: call
    inst.reg = reg
    instructions.add(byte_inst::call(inst))
    return 2
}
|
2018-02-03 22:47:21 -05:00
|
|
|
|
2018-03-06 23:30:00 -05:00
|
|
|
// Stack ABI
|
|
|
|
|
// it's system v x64, but all params passed on stack
|
2018-02-03 22:47:21 -05:00
|
|
|
// Interprets the generated bytecode starting at the function named "main",
// printing a trace of every instruction as it goes.
// Register 0 is the stack pointer, register 1 the base pointer and register 2
// the return value; both pointers are offsets relative to the top of a
// zeroed 8MB stack. Returns the value in register 2 when a ret pops a return
// address of 0, or -1 if execution runs off the end of the instructions.
// NOTE: the stack buffer allocated here is not freed by this function.
fun evaluate(): int {
    println("evaling main")
    println(bytecode_to_string(functions, instructions))
    var main_entry = functions.find_first_satisfying(fun(block: bytecode_function): bool return block.name == "main";)

    // reg_max is only refreshed by reset_reg, so fold in the registers that
    // the last generated statement allocated before sizing the register file
    reset_reg()
    var registers.construct(reg_max): vector<long>
    registers.size = reg_max
    // start from a known state instead of whatever the allocation contained
    for (var r = 0; r < reg_max; r++;)
        registers[r] = 0
    registers[0] = -register_size // with the stack being zeroed out, this makes it a return address of 0
    registers[1] = 0xdeadbeefcafebabe

    var stack_size = 8 * 1024 * 1024
    // stack points one past the end of the buffer; valid addresses are negative offsets from it
    var stack = new<uchar>(stack_size) + stack_size
    for (var i = 0; i < stack_size; i++;)
        stack[-i + -1] = 0

    for (var i = main_entry.instruction_start; i < instructions.size; i++;) {
        println(string("evaling: ") + i + ": " + to_string(instructions[i]))
        match(instructions[i]) {
            byte_inst::nop() {}
            byte_inst::imm(im) registers[im.reg] = im.val
            byte_inst::add(a) registers[a.to_reg] = registers[a.a] + registers[a.b]
            byte_inst::ldr(l) match (l.size) {
                operand_size::b8()  registers[l.to_reg] = *(stack + registers[l.from_reg] + l.offset) cast *char
                operand_size::b16() registers[l.to_reg] = *(stack + registers[l.from_reg] + l.offset) cast *short
                operand_size::b32() registers[l.to_reg] = *(stack + registers[l.from_reg] + l.offset) cast *int
                operand_size::b64() registers[l.to_reg] = *(stack + registers[l.from_reg] + l.offset) cast *long
            }
            byte_inst::str(s) match (s.size) {
                operand_size::b8()  *(stack + registers[s.to_reg] + s.offset) cast *uchar = registers[s.from_reg]
                operand_size::b16() *(stack + registers[s.to_reg] + s.offset) cast *ushort = registers[s.from_reg]
                operand_size::b32() *(stack + registers[s.to_reg] + s.offset) cast *uint = registers[s.from_reg]
                operand_size::b64() *(stack + registers[s.to_reg] + s.offset) cast *ulong = registers[s.from_reg]
            }
            byte_inst::jmp(j) i += j.offset - 1 // to counteract pc inc
            byte_inst::jz(j) {
                if (registers[j.reg] == 0)
                    i += j.offset - 1 // to counteract pc inc
            }
            byte_inst::call(c) {
                // push the index of the next instruction as the return address
                /*registers[0] -= register_size*/
                registers[0] = registers[0] - register_size
                *(stack + registers[0]) cast *long = i + 1
                i = registers[c.reg] - 1 // to counteract pc inc
            }
            byte_inst::ret() {
                // pop the return address
                var pc = *(stack + registers[0]) cast *long
                /*registers[0] += register_size*/
                registers[0] = registers[0] + register_size
                print("returning! return value is\n\t")
                var value = registers[2]
                println(value)
                // debug dump of the 64 bytes at the top of the stack
                println("first part of memory is")
                for (var row = 0; row < 8*8; row+=8;) {
                    print(string("-") + row + string(": "))
                    for (var col = 0; col < 8; col++;) {
                        if (col == 4)
                            print(" ")
                        print(*(stack - (row+col)*#sizeof<uchar> - 1) cast *uchar)
                        print(" ")
                    }
                    println()
                }
                println("Done")
                if (pc == 0) {
                    // a return address of 0 is the one planted for main
                    return value
                } else {
                    i = pc - 1 // to counteract pc inc
                    println(string("returning to ") + pc)
                }
            }
        }
    }
    return -1
}
|
2018-02-02 00:26:31 -05:00
|
|
|
}
|