371 lines
13 KiB
OCaml
371 lines
13 KiB
OCaml
|
(*===----------------------------------------------------------------------===
|
||
|
* Code Generation
|
||
|
*===----------------------------------------------------------------------===*)
|
||
|
|
||
|
open Llvm
|
||
|
|
||
|
exception Error of string
|
||
|
|
||
|
let context = global_context ()
|
||
|
let the_module = create_module context "my cool jit"
|
||
|
let builder = builder context
|
||
|
let named_values:(string, llvalue) Hashtbl.t = Hashtbl.create 10
|
||
|
let double_type = double_type context
|
||
|
|
||
|
(* Create an alloca instruction in the entry block of the function. This
|
||
|
* is used for mutable variables etc. *)
|
||
|
let create_entry_block_alloca the_function var_name =
|
||
|
let builder = builder_at context (instr_begin (entry_block the_function)) in
|
||
|
build_alloca double_type var_name builder
|
||
|
|
||
|
let rec codegen_expr = function
|
||
|
| Ast.Number n -> const_float double_type n
|
||
|
| Ast.Variable name ->
|
||
|
let v = try Hashtbl.find named_values name with
|
||
|
| Not_found -> raise (Error "unknown variable name")
|
||
|
in
|
||
|
(* Load the value. *)
|
||
|
build_load v name builder
|
||
|
| Ast.Unary (op, operand) ->
|
||
|
let operand = codegen_expr operand in
|
||
|
let callee = "unary" ^ (String.make 1 op) in
|
||
|
let callee =
|
||
|
match lookup_function callee the_module with
|
||
|
| Some callee -> callee
|
||
|
| None -> raise (Error "unknown unary operator")
|
||
|
in
|
||
|
build_call callee [|operand|] "unop" builder
|
||
|
| Ast.Binary (op, lhs, rhs) ->
|
||
|
begin match op with
|
||
|
| '=' ->
|
||
|
(* Special case '=' because we don't want to emit the LHS as an
|
||
|
* expression. *)
|
||
|
let name =
|
||
|
match lhs with
|
||
|
| Ast.Variable name -> name
|
||
|
| _ -> raise (Error "destination of '=' must be a variable")
|
||
|
in
|
||
|
|
||
|
(* Codegen the rhs. *)
|
||
|
let val_ = codegen_expr rhs in
|
||
|
|
||
|
(* Lookup the name. *)
|
||
|
let variable = try Hashtbl.find named_values name with
|
||
|
| Not_found -> raise (Error "unknown variable name")
|
||
|
in
|
||
|
ignore(build_store val_ variable builder);
|
||
|
val_
|
||
|
| _ ->
|
||
|
let lhs_val = codegen_expr lhs in
|
||
|
let rhs_val = codegen_expr rhs in
|
||
|
begin
|
||
|
match op with
|
||
|
| '+' -> build_fadd lhs_val rhs_val "addtmp" builder
|
||
|
| '-' -> build_fsub lhs_val rhs_val "subtmp" builder
|
||
|
| '*' -> build_fmul lhs_val rhs_val "multmp" builder
|
||
|
| '<' ->
|
||
|
(* Convert bool 0/1 to double 0.0 or 1.0 *)
|
||
|
let i = build_fcmp Fcmp.Ult lhs_val rhs_val "cmptmp" builder in
|
||
|
build_uitofp i double_type "booltmp" builder
|
||
|
| _ ->
|
||
|
(* If it wasn't a builtin binary operator, it must be a user defined
|
||
|
* one. Emit a call to it. *)
|
||
|
let callee = "binary" ^ (String.make 1 op) in
|
||
|
let callee =
|
||
|
match lookup_function callee the_module with
|
||
|
| Some callee -> callee
|
||
|
| None -> raise (Error "binary operator not found!")
|
||
|
in
|
||
|
build_call callee [|lhs_val; rhs_val|] "binop" builder
|
||
|
end
|
||
|
end
|
||
|
| Ast.Call (callee, args) ->
|
||
|
(* Look up the name in the module table. *)
|
||
|
let callee =
|
||
|
match lookup_function callee the_module with
|
||
|
| Some callee -> callee
|
||
|
| None -> raise (Error "unknown function referenced")
|
||
|
in
|
||
|
let params = params callee in
|
||
|
|
||
|
(* If argument mismatch error. *)
|
||
|
if Array.length params == Array.length args then () else
|
||
|
raise (Error "incorrect # arguments passed");
|
||
|
let args = Array.map codegen_expr args in
|
||
|
build_call callee args "calltmp" builder
|
||
|
| Ast.If (cond, then_, else_) ->
|
||
|
let cond = codegen_expr cond in
|
||
|
|
||
|
(* Convert condition to a bool by comparing equal to 0.0 *)
|
||
|
let zero = const_float double_type 0.0 in
|
||
|
let cond_val = build_fcmp Fcmp.One cond zero "ifcond" builder in
|
||
|
|
||
|
(* Grab the first block so that we might later add the conditional branch
|
||
|
* to it at the end of the function. *)
|
||
|
let start_bb = insertion_block builder in
|
||
|
let the_function = block_parent start_bb in
|
||
|
|
||
|
let then_bb = append_block context "then" the_function in
|
||
|
|
||
|
(* Emit 'then' value. *)
|
||
|
position_at_end then_bb builder;
|
||
|
let then_val = codegen_expr then_ in
|
||
|
|
||
|
(* Codegen of 'then' can change the current block, update then_bb for the
|
||
|
* phi. We create a new name because one is used for the phi node, and the
|
||
|
* other is used for the conditional branch. *)
|
||
|
let new_then_bb = insertion_block builder in
|
||
|
|
||
|
(* Emit 'else' value. *)
|
||
|
let else_bb = append_block context "else" the_function in
|
||
|
position_at_end else_bb builder;
|
||
|
let else_val = codegen_expr else_ in
|
||
|
|
||
|
(* Codegen of 'else' can change the current block, update else_bb for the
|
||
|
* phi. *)
|
||
|
let new_else_bb = insertion_block builder in
|
||
|
|
||
|
(* Emit merge block. *)
|
||
|
let merge_bb = append_block context "ifcont" the_function in
|
||
|
position_at_end merge_bb builder;
|
||
|
let incoming = [(then_val, new_then_bb); (else_val, new_else_bb)] in
|
||
|
let phi = build_phi incoming "iftmp" builder in
|
||
|
|
||
|
(* Return to the start block to add the conditional branch. *)
|
||
|
position_at_end start_bb builder;
|
||
|
ignore (build_cond_br cond_val then_bb else_bb builder);
|
||
|
|
||
|
(* Set a unconditional branch at the end of the 'then' block and the
|
||
|
* 'else' block to the 'merge' block. *)
|
||
|
position_at_end new_then_bb builder; ignore (build_br merge_bb builder);
|
||
|
position_at_end new_else_bb builder; ignore (build_br merge_bb builder);
|
||
|
|
||
|
(* Finally, set the builder to the end of the merge block. *)
|
||
|
position_at_end merge_bb builder;
|
||
|
|
||
|
phi
|
||
|
| Ast.For (var_name, start, end_, step, body) ->
|
||
|
(* Output this as:
|
||
|
* var = alloca double
|
||
|
* ...
|
||
|
* start = startexpr
|
||
|
* store start -> var
|
||
|
* goto loop
|
||
|
* loop:
|
||
|
* ...
|
||
|
* bodyexpr
|
||
|
* ...
|
||
|
* loopend:
|
||
|
* step = stepexpr
|
||
|
* endcond = endexpr
|
||
|
*
|
||
|
* curvar = load var
|
||
|
* nextvar = curvar + step
|
||
|
* store nextvar -> var
|
||
|
* br endcond, loop, endloop
|
||
|
* outloop: *)
|
||
|
|
||
|
let the_function = block_parent (insertion_block builder) in
|
||
|
|
||
|
(* Create an alloca for the variable in the entry block. *)
|
||
|
let alloca = create_entry_block_alloca the_function var_name in
|
||
|
|
||
|
(* Emit the start code first, without 'variable' in scope. *)
|
||
|
let start_val = codegen_expr start in
|
||
|
|
||
|
(* Store the value into the alloca. *)
|
||
|
ignore(build_store start_val alloca builder);
|
||
|
|
||
|
(* Make the new basic block for the loop header, inserting after current
|
||
|
* block. *)
|
||
|
let loop_bb = append_block context "loop" the_function in
|
||
|
|
||
|
(* Insert an explicit fall through from the current block to the
|
||
|
* loop_bb. *)
|
||
|
ignore (build_br loop_bb builder);
|
||
|
|
||
|
(* Start insertion in loop_bb. *)
|
||
|
position_at_end loop_bb builder;
|
||
|
|
||
|
(* Within the loop, the variable is defined equal to the PHI node. If it
|
||
|
* shadows an existing variable, we have to restore it, so save it
|
||
|
* now. *)
|
||
|
let old_val =
|
||
|
try Some (Hashtbl.find named_values var_name) with Not_found -> None
|
||
|
in
|
||
|
Hashtbl.add named_values var_name alloca;
|
||
|
|
||
|
(* Emit the body of the loop. This, like any other expr, can change the
|
||
|
* current BB. Note that we ignore the value computed by the body, but
|
||
|
* don't allow an error *)
|
||
|
ignore (codegen_expr body);
|
||
|
|
||
|
(* Emit the step value. *)
|
||
|
let step_val =
|
||
|
match step with
|
||
|
| Some step -> codegen_expr step
|
||
|
(* If not specified, use 1.0. *)
|
||
|
| None -> const_float double_type 1.0
|
||
|
in
|
||
|
|
||
|
(* Compute the end condition. *)
|
||
|
let end_cond = codegen_expr end_ in
|
||
|
|
||
|
(* Reload, increment, and restore the alloca. This handles the case where
|
||
|
* the body of the loop mutates the variable. *)
|
||
|
let cur_var = build_load alloca var_name builder in
|
||
|
let next_var = build_add cur_var step_val "nextvar" builder in
|
||
|
ignore(build_store next_var alloca builder);
|
||
|
|
||
|
(* Convert condition to a bool by comparing equal to 0.0. *)
|
||
|
let zero = const_float double_type 0.0 in
|
||
|
let end_cond = build_fcmp Fcmp.One end_cond zero "loopcond" builder in
|
||
|
|
||
|
(* Create the "after loop" block and insert it. *)
|
||
|
let after_bb = append_block context "afterloop" the_function in
|
||
|
|
||
|
(* Insert the conditional branch into the end of loop_end_bb. *)
|
||
|
ignore (build_cond_br end_cond loop_bb after_bb builder);
|
||
|
|
||
|
(* Any new code will be inserted in after_bb. *)
|
||
|
position_at_end after_bb builder;
|
||
|
|
||
|
(* Restore the unshadowed variable. *)
|
||
|
begin match old_val with
|
||
|
| Some old_val -> Hashtbl.add named_values var_name old_val
|
||
|
| None -> ()
|
||
|
end;
|
||
|
|
||
|
(* for expr always returns 0.0. *)
|
||
|
const_null double_type
|
||
|
| Ast.Var (var_names, body) ->
|
||
|
let old_bindings = ref [] in
|
||
|
|
||
|
let the_function = block_parent (insertion_block builder) in
|
||
|
|
||
|
(* Register all variables and emit their initializer. *)
|
||
|
Array.iter (fun (var_name, init) ->
|
||
|
(* Emit the initializer before adding the variable to scope, this
|
||
|
* prevents the initializer from referencing the variable itself, and
|
||
|
* permits stuff like this:
|
||
|
* var a = 1 in
|
||
|
* var a = a in ... # refers to outer 'a'. *)
|
||
|
let init_val =
|
||
|
match init with
|
||
|
| Some init -> codegen_expr init
|
||
|
(* If not specified, use 0.0. *)
|
||
|
| None -> const_float double_type 0.0
|
||
|
in
|
||
|
|
||
|
let alloca = create_entry_block_alloca the_function var_name in
|
||
|
ignore(build_store init_val alloca builder);
|
||
|
|
||
|
(* Remember the old variable binding so that we can restore the binding
|
||
|
* when we unrecurse. *)
|
||
|
begin
|
||
|
try
|
||
|
let old_value = Hashtbl.find named_values var_name in
|
||
|
old_bindings := (var_name, old_value) :: !old_bindings;
|
||
|
with Not_found -> ()
|
||
|
end;
|
||
|
|
||
|
(* Remember this binding. *)
|
||
|
Hashtbl.add named_values var_name alloca;
|
||
|
) var_names;
|
||
|
|
||
|
(* Codegen the body, now that all vars are in scope. *)
|
||
|
let body_val = codegen_expr body in
|
||
|
|
||
|
(* Pop all our variables from scope. *)
|
||
|
List.iter (fun (var_name, old_value) ->
|
||
|
Hashtbl.add named_values var_name old_value
|
||
|
) !old_bindings;
|
||
|
|
||
|
(* Return the body computation. *)
|
||
|
body_val
|
||
|
|
||
|
let codegen_proto = function
|
||
|
| Ast.Prototype (name, args) | Ast.BinOpPrototype (name, args, _) ->
|
||
|
(* Make the function type: double(double,double) etc. *)
|
||
|
let doubles = Array.make (Array.length args) double_type in
|
||
|
let ft = function_type double_type doubles in
|
||
|
let f =
|
||
|
match lookup_function name the_module with
|
||
|
| None -> declare_function name ft the_module
|
||
|
|
||
|
(* If 'f' conflicted, there was already something named 'name'. If it
|
||
|
* has a body, don't allow redefinition or reextern. *)
|
||
|
| Some f ->
|
||
|
(* If 'f' already has a body, reject this. *)
|
||
|
if block_begin f <> At_end f then
|
||
|
raise (Error "redefinition of function");
|
||
|
|
||
|
(* If 'f' took a different number of arguments, reject. *)
|
||
|
if element_type (type_of f) <> ft then
|
||
|
raise (Error "redefinition of function with different # args");
|
||
|
f
|
||
|
in
|
||
|
|
||
|
(* Set names for all arguments. *)
|
||
|
Array.iteri (fun i a ->
|
||
|
let n = args.(i) in
|
||
|
set_value_name n a;
|
||
|
Hashtbl.add named_values n a;
|
||
|
) (params f);
|
||
|
f
|
||
|
|
||
|
(* Create an alloca for each argument and register the argument in the symbol
|
||
|
* table so that references to it will succeed. *)
|
||
|
let create_argument_allocas the_function proto =
|
||
|
let args = match proto with
|
||
|
| Ast.Prototype (_, args) | Ast.BinOpPrototype (_, args, _) -> args
|
||
|
in
|
||
|
Array.iteri (fun i ai ->
|
||
|
let var_name = args.(i) in
|
||
|
(* Create an alloca for this variable. *)
|
||
|
let alloca = create_entry_block_alloca the_function var_name in
|
||
|
|
||
|
(* Store the initial value into the alloca. *)
|
||
|
ignore(build_store ai alloca builder);
|
||
|
|
||
|
(* Add arguments to variable symbol table. *)
|
||
|
Hashtbl.add named_values var_name alloca;
|
||
|
) (params the_function)
|
||
|
|
||
|
let codegen_func the_fpm = function
|
||
|
| Ast.Function (proto, body) ->
|
||
|
Hashtbl.clear named_values;
|
||
|
let the_function = codegen_proto proto in
|
||
|
|
||
|
(* If this is an operator, install it. *)
|
||
|
begin match proto with
|
||
|
| Ast.BinOpPrototype (name, args, prec) ->
|
||
|
let op = name.[String.length name - 1] in
|
||
|
Hashtbl.add Parser.binop_precedence op prec;
|
||
|
| _ -> ()
|
||
|
end;
|
||
|
|
||
|
(* Create a new basic block to start insertion into. *)
|
||
|
let bb = append_block context "entry" the_function in
|
||
|
position_at_end bb builder;
|
||
|
|
||
|
try
|
||
|
(* Add all arguments to the symbol table and create their allocas. *)
|
||
|
create_argument_allocas the_function proto;
|
||
|
|
||
|
let ret_val = codegen_expr body in
|
||
|
|
||
|
(* Finish off the function. *)
|
||
|
let _ = build_ret ret_val builder in
|
||
|
|
||
|
(* Validate the generated code, checking for consistency. *)
|
||
|
Llvm_analysis.assert_valid_function the_function;
|
||
|
|
||
|
(* Optimize the function. *)
|
||
|
let _ = PassManager.run_function the_function the_fpm in
|
||
|
|
||
|
the_function
|
||
|
with e ->
|
||
|
delete_function the_function;
|
||
|
raise e
|