196 lines
6.4 KiB
OCaml
196 lines
6.4 KiB
OCaml
|
(*===---------------------------------------------------------------------===
|
||
|
* Parser
|
||
|
*===---------------------------------------------------------------------===*)
|
||
|
|
||
|
(* binop_precedence - This holds the precedence for each binary operator that is
|
||
|
* defined *)
|
||
|
let binop_precedence:(char, int) Hashtbl.t = Hashtbl.create 10
|
||
|
|
||
|
(* precedence - Get the precedence of the pending binary operator token. *)
|
||
|
let precedence c = try Hashtbl.find binop_precedence c with Not_found -> -1
|
||
|
|
||
|
(* primary
|
||
|
* ::= identifier
|
||
|
* ::= numberexpr
|
||
|
* ::= parenexpr
|
||
|
* ::= ifexpr
|
||
|
* ::= forexpr *)
|
||
|
let rec parse_primary = parser
|
||
|
(* numberexpr ::= number *)
|
||
|
| [< 'Token.Number n >] -> Ast.Number n
|
||
|
|
||
|
(* parenexpr ::= '(' expression ')' *)
|
||
|
| [< 'Token.Kwd '('; e=parse_expr; 'Token.Kwd ')' ?? "expected ')'" >] -> e
|
||
|
|
||
|
(* identifierexpr
|
||
|
* ::= identifier
|
||
|
* ::= identifier '(' argumentexpr ')' *)
|
||
|
| [< 'Token.Ident id; stream >] ->
|
||
|
let rec parse_args accumulator = parser
|
||
|
| [< e=parse_expr; stream >] ->
|
||
|
begin parser
|
||
|
| [< 'Token.Kwd ','; e=parse_args (e :: accumulator) >] -> e
|
||
|
| [< >] -> e :: accumulator
|
||
|
end stream
|
||
|
| [< >] -> accumulator
|
||
|
in
|
||
|
let rec parse_ident id = parser
|
||
|
(* Call. *)
|
||
|
| [< 'Token.Kwd '(';
|
||
|
args=parse_args [];
|
||
|
'Token.Kwd ')' ?? "expected ')'">] ->
|
||
|
Ast.Call (id, Array.of_list (List.rev args))
|
||
|
|
||
|
(* Simple variable ref. *)
|
||
|
| [< >] -> Ast.Variable id
|
||
|
in
|
||
|
parse_ident id stream
|
||
|
|
||
|
(* ifexpr ::= 'if' expr 'then' expr 'else' expr *)
|
||
|
| [< 'Token.If; c=parse_expr;
|
||
|
'Token.Then ?? "expected 'then'"; t=parse_expr;
|
||
|
'Token.Else ?? "expected 'else'"; e=parse_expr >] ->
|
||
|
Ast.If (c, t, e)
|
||
|
|
||
|
(* forexpr
|
||
|
::= 'for' identifier '=' expr ',' expr (',' expr)? 'in' expression *)
|
||
|
| [< 'Token.For;
|
||
|
'Token.Ident id ?? "expected identifier after for";
|
||
|
'Token.Kwd '=' ?? "expected '=' after for";
|
||
|
stream >] ->
|
||
|
begin parser
|
||
|
| [<
|
||
|
start=parse_expr;
|
||
|
'Token.Kwd ',' ?? "expected ',' after for";
|
||
|
end_=parse_expr;
|
||
|
stream >] ->
|
||
|
let step =
|
||
|
begin parser
|
||
|
| [< 'Token.Kwd ','; step=parse_expr >] -> Some step
|
||
|
| [< >] -> None
|
||
|
end stream
|
||
|
in
|
||
|
begin parser
|
||
|
| [< 'Token.In; body=parse_expr >] ->
|
||
|
Ast.For (id, start, end_, step, body)
|
||
|
| [< >] ->
|
||
|
raise (Stream.Error "expected 'in' after for")
|
||
|
end stream
|
||
|
| [< >] ->
|
||
|
raise (Stream.Error "expected '=' after for")
|
||
|
end stream
|
||
|
|
||
|
| [< >] -> raise (Stream.Error "unknown token when expecting an expression.")
|
||
|
|
||
|
(* unary
|
||
|
* ::= primary
|
||
|
* ::= '!' unary *)
|
||
|
and parse_unary = parser
|
||
|
(* If this is a unary operator, read it. *)
|
||
|
| [< 'Token.Kwd op when op != '(' && op != ')'; operand=parse_expr >] ->
|
||
|
Ast.Unary (op, operand)
|
||
|
|
||
|
(* If the current token is not an operator, it must be a primary expr. *)
|
||
|
| [< stream >] -> parse_primary stream
|
||
|
|
||
|
(* binoprhs
|
||
|
* ::= ('+' primary)* *)
|
||
|
and parse_bin_rhs expr_prec lhs stream =
|
||
|
match Stream.peek stream with
|
||
|
(* If this is a binop, find its precedence. *)
|
||
|
| Some (Token.Kwd c) when Hashtbl.mem binop_precedence c ->
|
||
|
let token_prec = precedence c in
|
||
|
|
||
|
(* If this is a binop that binds at least as tightly as the current binop,
|
||
|
* consume it, otherwise we are done. *)
|
||
|
if token_prec < expr_prec then lhs else begin
|
||
|
(* Eat the binop. *)
|
||
|
Stream.junk stream;
|
||
|
|
||
|
(* Parse the unary expression after the binary operator. *)
|
||
|
let rhs = parse_unary stream in
|
||
|
|
||
|
(* Okay, we know this is a binop. *)
|
||
|
let rhs =
|
||
|
match Stream.peek stream with
|
||
|
| Some (Token.Kwd c2) ->
|
||
|
(* If BinOp binds less tightly with rhs than the operator after
|
||
|
* rhs, let the pending operator take rhs as its lhs. *)
|
||
|
let next_prec = precedence c2 in
|
||
|
if token_prec < next_prec
|
||
|
then parse_bin_rhs (token_prec + 1) rhs stream
|
||
|
else rhs
|
||
|
| _ -> rhs
|
||
|
in
|
||
|
|
||
|
(* Merge lhs/rhs. *)
|
||
|
let lhs = Ast.Binary (c, lhs, rhs) in
|
||
|
parse_bin_rhs expr_prec lhs stream
|
||
|
end
|
||
|
| _ -> lhs
|
||
|
|
||
|
(* expression
|
||
|
* ::= primary binoprhs *)
|
||
|
and parse_expr = parser
|
||
|
| [< lhs=parse_unary; stream >] -> parse_bin_rhs 0 lhs stream
|
||
|
|
||
|
(* prototype
|
||
|
* ::= id '(' id* ')'
|
||
|
* ::= binary LETTER number? (id, id)
|
||
|
* ::= unary LETTER number? (id) *)
|
||
|
let parse_prototype =
|
||
|
let rec parse_args accumulator = parser
|
||
|
| [< 'Token.Ident id; e=parse_args (id::accumulator) >] -> e
|
||
|
| [< >] -> accumulator
|
||
|
in
|
||
|
let parse_operator = parser
|
||
|
| [< 'Token.Unary >] -> "unary", 1
|
||
|
| [< 'Token.Binary >] -> "binary", 2
|
||
|
in
|
||
|
let parse_binary_precedence = parser
|
||
|
| [< 'Token.Number n >] -> int_of_float n
|
||
|
| [< >] -> 30
|
||
|
in
|
||
|
parser
|
||
|
| [< 'Token.Ident id;
|
||
|
'Token.Kwd '(' ?? "expected '(' in prototype";
|
||
|
args=parse_args [];
|
||
|
'Token.Kwd ')' ?? "expected ')' in prototype" >] ->
|
||
|
(* success. *)
|
||
|
Ast.Prototype (id, Array.of_list (List.rev args))
|
||
|
| [< (prefix, kind)=parse_operator;
|
||
|
'Token.Kwd op ?? "expected an operator";
|
||
|
(* Read the precedence if present. *)
|
||
|
binary_precedence=parse_binary_precedence;
|
||
|
'Token.Kwd '(' ?? "expected '(' in prototype";
|
||
|
args=parse_args [];
|
||
|
'Token.Kwd ')' ?? "expected ')' in prototype" >] ->
|
||
|
let name = prefix ^ (String.make 1 op) in
|
||
|
let args = Array.of_list (List.rev args) in
|
||
|
|
||
|
(* Verify right number of arguments for operator. *)
|
||
|
if Array.length args != kind
|
||
|
then raise (Stream.Error "invalid number of operands for operator")
|
||
|
else
|
||
|
if kind == 1 then
|
||
|
Ast.Prototype (name, args)
|
||
|
else
|
||
|
Ast.BinOpPrototype (name, args, binary_precedence)
|
||
|
| [< >] ->
|
||
|
raise (Stream.Error "expected function name in prototype")
|
||
|
|
||
|
(* definition ::= 'def' prototype expression *)
|
||
|
let parse_definition = parser
|
||
|
| [< 'Token.Def; p=parse_prototype; e=parse_expr >] ->
|
||
|
Ast.Function (p, e)
|
||
|
|
||
|
(* toplevelexpr ::= expression *)
|
||
|
let parse_toplevel = parser
|
||
|
| [< e=parse_expr >] ->
|
||
|
(* Make an anonymous proto. *)
|
||
|
Ast.Function (Ast.Prototype ("", [||]), e)
|
||
|
|
||
|
(* external ::= 'extern' prototype *)
|
||
|
let parse_extern = parser
|
||
|
| [< 'Token.Extern; e=parse_prototype >] -> e
|