ligo/AST.mli

431 lines
9.7 KiB
OCaml
Raw Normal View History

2019-02-26 01:29:29 +04:00
(* Abstract Syntax Tree (AST) for Ligo *)
[@@@warning "-30"]
2019-02-26 01:29:29 +04:00
open Utils
(* Regions
The AST carries all the regions where tokens have been found by the
lexer, plus additional regions corresponding to whole subtrees
(like entire expressions, patterns etc.). These regions are needed
for error reporting and source-to-source transformations. To make
these pervasive regions more legible, we define singleton types for
the symbols, keywords etc. with suggestive names like "kwd_and"
denoting the _region_ of the occurrence of the keyword "and".
*)
(* Local shorthand for the type constructor reg of module Region, so
   that located values can be written with the short postfix name reg
   in the rest of this interface. *)
type 'a reg = 'a Region.reg
(* The three functions below take a projection from one element to its
   region and return a single region for a whole sequence.  The
   sequence types nseq, nsepseq and sepseq are not defined in this
   file (presumably they come from Utils, which is opened above).
   NOTE(review): the result is presumably the region spanning the
   whole sequence -- confirm against the implementation. *)
val nseq_to_region : ('a -> Region.t) -> 'a nseq -> Region.t
val nsepseq_to_region : ('a -> Region.t) -> ('a,'sep) nsepseq -> Region.t
val sepseq_to_region : ('a -> Region.t) -> ('a,'sep) sepseq -> Region.t
(* Keywords of Ligo *)
(* Every kwd_xxx type is a synonym of Region.t: a value of such a type
   is the region of one occurrence of that keyword in the source.  The
   distinct names exist only to make the AST types self-describing. *)
type kwd_begin = Region.t
type kwd_const = Region.t
type kwd_down = Region.t
type kwd_fail = Region.t
2019-02-26 01:29:29 +04:00
(* Keyword regions: each type below is a synonym of Region.t and
   denotes the region of one occurrence of the keyword named after the
   kwd_ prefix. *)
type kwd_if = Region.t
type kwd_in = Region.t
type kwd_is = Region.t
type kwd_for = Region.t
type kwd_function = Region.t
type kwd_parameter = Region.t
type kwd_storage = Region.t
type kwd_type = Region.t
type kwd_of = Region.t
type kwd_operations = Region.t
type kwd_var = Region.t
type kwd_end = Region.t
type kwd_then = Region.t
type kwd_else = Region.t
type kwd_match = Region.t
type kwd_procedure = Region.t
type kwd_null = Region.t
type kwd_record = Region.t
type kwd_step = Region.t
type kwd_to = Region.t
type kwd_mod = Region.t
type kwd_not = Region.t
type kwd_while = Region.t
type kwd_with = Region.t
(* Data constructors *)
(* Regions of occurrences of the predefined data constructors named
   after the c_ prefix.  All are synonyms of Region.t. *)
type c_False = Region.t
type c_None = Region.t
type c_Some = Region.t
type c_True = Region.t
type c_Unit = Region.t
(* Symbols *)
(* Regions of punctuation and operator tokens.  All are synonyms of
   Region.t.  The concrete lexeme behind each name (for instance cons,
   arrow or ass) is fixed by the lexer and is not visible in this
   file. *)
type semi = Region.t
type comma = Region.t
type lpar = Region.t
type rpar = Region.t
type lbrace = Region.t
type rbrace = Region.t
type lbracket = Region.t
type rbracket = Region.t
type cons = Region.t
type vbar = Region.t
type arrow = Region.t
type ass = Region.t
2019-02-26 01:29:29 +04:00
(* Regions of operator and punctuation tokens.  All are synonyms of
   Region.t.  The concrete lexeme behind each name (for instance cat
   or wild) is fixed by the lexer and is not visible in this file. *)
type equal = Region.t
type colon = Region.t
type bool_or = Region.t
type bool_and = Region.t
type lt = Region.t
type leq = Region.t
type gt = Region.t
type geq = Region.t
type neq = Region.t
type plus = Region.t
type minus = Region.t
type slash = Region.t
type times = Region.t
type dot = Region.t
type wild = Region.t
type cat = Region.t
(* Virtual tokens *)
(* Region associated with the end-of-file token; it is stored in the
   eof field of the root record t. *)
type eof = Region.t
(* Literals *)
(* Names found in the source, each kept as a string together with its
   region.  The six types are all equal to string reg; the different
   names only document the role the identifier plays. *)
type variable = string reg
type fun_name = string reg
type type_name = string reg
type field_name = string reg
type map_name = string reg
type constr = string reg
2019-02-26 01:29:29 +04:00
(* Comma-separated non-empty lists: the separators are kept as comma
   regions. *)
type 'a csv = ('a, comma) nsepseq
(* Bar-separated non-empty lists: the separators are kept as vbar
   regions. *)
type 'a bsv = ('a, vbar) nsepseq
(* Parenthesised compounds: the regions of both parentheses are kept
   around the contents, and the triple carries a region of its own. *)
type 'a par = (lpar * 'a * rpar) reg
(* Bracketed compounds: same layout as par, with square brackets. *)
type 'a brackets = (lbracket * 'a * rbracket) reg
(* Braced compounds: same layout as par, with braces. *)
type 'a braces = (lbrace * 'a * rbrace) reg
(* The Abstract Syntax Tree *)
(* Root of the tree.  The record holds, in this order: the type
   declarations, the constant declarations, one parameter declaration,
   one storage declaration, one operations declaration, the function
   and procedure declarations, one block, and the region of the
   end-of-file token.
   NOTE(review): presumably the field order mirrors the layout of a
   Ligo source file and the block is the main body -- confirm with the
   parser.  Several records of this recursive definition share field
   names (terminator, name, block, ...), which is presumably why
   warning 30 is disabled at the top of the file. *)
type t = {
types : type_decl reg list;
constants : const_decl reg list;
parameter : parameter_decl reg;
storage : storage_decl reg;
operations : operations_decl reg;
lambdas : lambda_decl list;
block : block reg;
eof : eof
}
2019-02-26 01:29:29 +04:00
(* Synonym of the root type t. *)
and ast = t
(* Parameter declaration: the keyword, the declared name, the colon,
   the type of the parameter, and an optional terminating semicolon. *)
and parameter_decl = {
kwd_parameter : kwd_parameter;
name : variable;
colon : colon;
param_type : type_expr;
terminator : semi option
}
2019-02-26 01:29:29 +04:00
(* Storage declaration: the keyword, the type of the storage, and an
   optional terminating semicolon.  Unlike parameter_decl, no name and
   no colon are recorded. *)
and storage_decl = {
kwd_storage : kwd_storage;
store_type : type_expr;
terminator : semi option
}
2019-02-26 01:29:29 +04:00
(* Operations declaration: the keyword, a type expression, and an
   optional terminating semicolon. *)
and operations_decl = {
kwd_operations : kwd_operations;
op_type : type_expr;
terminator : semi option
}
2019-02-26 01:29:29 +04:00
(* Type declarations *)
(* A type declaration records the keyword type, the declared type
   name, the keyword is, the type expression bound to the name, and
   an optional terminating semicolon. *)
and type_decl = {
kwd_type : kwd_type;
name : type_name;
kwd_is : kwd_is;
type_expr : type_expr;
terminator : semi option
}
2019-02-26 01:29:29 +04:00
(* Type expressions. *)
and type_expr =
(* Product: see cartesian. *)
Prod of cartesian
(* Sum: a non-empty list of variants separated by vertical bars. *)
| Sum of (variant, vbar) nsepseq reg
(* Record type: see record_type. *)
| Record of record_type
(* A type name followed by a parenthesised tuple of type names. *)
| TypeApp of (type_name * type_tuple) reg
(* A type expression between parentheses. *)
| ParType of type_expr par
(* A bare name.  NOTE(review): presumably a reference to a declared
   type -- the payload is a variable, not a type_name. *)
| TAlias of variable
2019-02-26 01:29:29 +04:00
(* Non-empty sequence of type expressions separated by the times
   symbol, together with the region of the whole sequence. *)
and cartesian = (type_expr, times) nsepseq reg
2019-02-26 01:29:29 +04:00
(* One alternative of a sum type: a constructor name, the keyword of,
   and a product of type expressions. *)
and variant = (constr * kwd_of * cartesian) reg
2019-02-26 01:29:29 +04:00
(* Record type: the field declarations enclosed between the keywords
   record and end. *)
and record_type = (kwd_record * field_decls * kwd_end) reg
2019-02-26 01:29:29 +04:00
(* Non-empty sequence of field declarations separated by semicolons. *)
and field_decls = (field_decl, semi) nsepseq
2019-02-26 01:29:29 +04:00
(* One record field: its name, a colon, and its type.  Note that the
   name is typed as variable, not as field_name. *)
and field_decl = (variable * colon * type_expr) reg
2019-02-26 01:29:29 +04:00
(* Parenthesised, comma-separated, non-empty list of type names (type
   names only, not arbitrary type expressions). *)
and type_tuple = (type_name, comma) nsepseq par
2019-02-26 01:29:29 +04:00
(* Function and procedure declarations *)
(* A lambda is either a function or a procedure declaration, each
   carrying its own region. *)
and lambda_decl =
FunDecl of fun_decl reg
| ProcDecl of proc_decl reg
(* Function declaration.  Besides the keyword regions it records the
   name, the parameters, the return type, the local declarations, a
   block, and an expression stored in the field return that comes
   with the keyword with.  An optional semicolon terminates it.
   NOTE(review): presumably the return expression is the value of the
   function once the block has run -- confirm with the parser. *)
and fun_decl = {
kwd_function : kwd_function;
name : variable;
param : parameters;
colon : colon;
ret_type : type_expr;
kwd_is : kwd_is;
local_decls : local_decl list;
block : block reg;
kwd_with : kwd_with;
return : expr;
terminator : semi option
}
2019-02-26 01:29:29 +04:00
(* Procedure declaration.  Same shape as fun_decl, minus the return
   type (and its colon) and minus the trailing with/return part. *)
and proc_decl = {
kwd_procedure : kwd_procedure;
name : variable;
param : parameters;
kwd_is : kwd_is;
local_decls : local_decl list;
block : block reg;
terminator : semi option
}
2019-02-26 01:29:29 +04:00
(* Parenthesised, semicolon-separated, non-empty list of parameter
   declarations. *)
and parameters = (param_decl, semi) nsepseq par
2019-02-26 01:29:29 +04:00
(* A formal parameter is introduced either by the keyword const or by
   the keyword var. *)
and param_decl =
ParamConst of param_const
| ParamVar of param_var
(* Both kinds have the same layout: keyword, name, colon, type. *)
and param_const = (kwd_const * variable * colon * type_expr) reg
and param_var = (kwd_var * variable * colon * type_expr) reg
2019-02-26 01:29:29 +04:00
(* A block: instructions enclosed between the keywords begin (field
   opening) and end (field close), with an optional semicolon kept in
   the field terminator. *)
and block = {
opening : kwd_begin;
instr : instructions;
terminator : semi option;
close : kwd_end
}
2019-02-26 01:29:29 +04:00
(* Declarations local to a function or procedure: a nested function
   or procedure, a constant, or a variable. *)
and local_decl =
LocalLam of lambda_decl
| LocalConst of const_decl reg
| LocalVar of var_decl reg
(* Constant declaration: keyword const, name, colon, type, the equal
   symbol, the initialising expression, and an optional terminating
   semicolon.  The same record is used for the top-level constants of
   the root record t. *)
and const_decl = {
kwd_const : kwd_const;
name : variable;
colon : colon;
vtype : type_expr;
equal : equal;
init : expr;
terminator : semi option
2019-03-05 14:15:02 +04:00
}
2019-02-26 01:29:29 +04:00
(* Variable declaration: same layout as const_decl, except that the
   keyword is var and the initialiser is introduced by the ass symbol
   instead of the equal symbol. *)
and var_decl = {
kwd_var : kwd_var;
name : variable;
colon : colon;
vtype : type_expr;
ass : ass;
init : expr;
terminator : semi option
}
2019-02-26 01:29:29 +04:00
(* Non-empty sequence of instructions separated by semicolons, with
   the region of the whole sequence. *)
and instructions = (instruction, semi) nsepseq reg
2019-02-26 01:29:29 +04:00
(* An instruction is either a single instruction or a nested block. *)
and instruction =
Single of single_instr
| Block of block reg
2019-02-26 01:29:29 +04:00
(* Single (non-block) instructions: conditional, pattern matching,
   assignment, loop, procedure call, the null instruction (only its
   keyword is kept), and fail followed by an expression.  ProcCall
   reuses the type fun_call, so a procedure call has the same shape as
   a function call. *)
and single_instr =
Cond of conditional reg
| Match of match_instr reg
| Ass of ass_instr
| Loop of loop
| ProcCall of fun_call
2019-02-26 01:29:29 +04:00
| Null of kwd_null
| Fail of (kwd_fail * expr) reg
(* Conditional instruction: the tested expression and the two
   branches, with the regions of the keywords if, then and else.  The
   else branch is mandatory: kwd_else and ifnot are not optional. *)
and conditional = {
kwd_if : kwd_if;
test : expr;
kwd_then : kwd_then;
ifso : instruction;
kwd_else : kwd_else;
ifnot : instruction
}
2019-02-26 01:29:29 +04:00
(* Pattern-matching instruction: the matched expression between the
   keywords match and with, an optional vertical bar before the first
   case, the cases, and the closing keyword end. *)
and match_instr = {
kwd_match : kwd_match;
expr : expr;
kwd_with : kwd_with;
lead_vbar : vbar option;
cases : cases;
kwd_end : kwd_end
}
2019-02-26 01:29:29 +04:00
(* Non-empty sequence of cases separated by vertical bars, with the
   region of the whole sequence. *)
and cases = (case, vbar) nsepseq reg
2019-02-26 01:29:29 +04:00
(* One case: a pattern, an arrow, and the instruction attached to the
   pattern. *)
and case = (pattern * arrow * instruction) reg
2019-02-26 01:29:29 +04:00
(* Assignment: a variable, the ass symbol, and an expression.  The
   left-hand side can only be a plain variable. *)
and ass_instr = (variable * ass * expr) reg
2019-02-26 01:29:29 +04:00
(* Loops come in two kinds: while loops and for loops. *)
and loop =
While of while_loop
| For of for_loop
2019-02-26 01:29:29 +04:00
(* While loop: keyword while, an expression (presumably the loop
   condition), and a block. *)
and while_loop = (kwd_while * expr * block reg) reg
2019-02-26 01:29:29 +04:00
(* For loops are either driven by an assignment and a bound (ForInt)
   or range over an expression (ForCollect). *)
and for_loop =
ForInt of for_int reg
| ForCollect of for_collect reg
2019-02-26 01:29:29 +04:00
(* For loop with a bound: keyword for, an assignment, an optional
   keyword down, keyword to, the bound expression, an optional step
   (keyword step and an expression), and the block.
   NOTE(review): presumably the assignment initialises the index and
   down selects a decreasing iteration -- confirm with the
   interpreter or compiler. *)
and for_int = {
kwd_for : kwd_for;
ass : ass_instr;
down : kwd_down option;
kwd_to : kwd_to;
bound : expr;
step : (kwd_step * expr) option;
block : block reg
}
2019-02-26 01:29:29 +04:00
(* For loop over an expression: keyword for, a variable, an optional
   arrow followed by a second variable, keyword in, the expression,
   and the block.
   NOTE(review): presumably the optional second variable is used when
   iterating over bindings (e.g. of a map) -- confirm with the
   parser. *)
and for_collect = {
kwd_for : kwd_for;
var : variable;
bind_to : (arrow * variable) option;
kwd_in : kwd_in;
expr : expr;
block : block reg
}
2019-02-26 01:29:29 +04:00
(* Expressions *)
(* Binary operations carry the two operand expressions around the
   region of the operator; unary operations carry the operator region
   followed by the operand.  Note that the nesting of the tree, not
   the type, encodes precedence and associativity. *)
and expr =
Or of (expr * bool_or * expr) reg
| And of (expr * bool_and * expr) reg
| Lt of (expr * lt * expr) reg
| Leq of (expr * leq * expr) reg
| Gt of (expr * gt * expr) reg
| Geq of (expr * geq * expr) reg
| Equal of (expr * equal * expr) reg
| Neq of (expr * neq * expr) reg
| Cat of (expr * cat * expr) reg
| Cons of (expr * cons * expr) reg
| Add of (expr * plus * expr) reg
| Sub of (expr * minus * expr) reg
| Mult of (expr * times * expr) reg
| Div of (expr * slash * expr) reg
| Mod of (expr * kwd_mod * expr) reg
| Neg of (minus * expr) reg
| Not of (kwd_not * expr) reg
2019-02-26 01:29:29 +04:00
(* Literals and variables.  Int and Bytes keep the lexeme next to a
   second component of type Z.t or MBytes.t (presumably the decoded
   value; both modules are defined outside this file). *)
| Int of (Lexer.lexeme * Z.t) reg
| Var of Lexer.lexeme reg
| String of Lexer.lexeme reg
| Bytes of (Lexer.lexeme * MBytes.t) reg
| False of c_False
| True of c_True
| Unit of c_Unit
(* Compound values.  Non-empty lists and sets are comma-separated
   between brackets and braces respectively; the empty list, the
   empty set and None have dedicated nodes that carry a type. *)
| Tuple of tuple
| List of (expr, comma) nsepseq brackets
| EmptyList of empty_list
| Set of (expr, comma) nsepseq braces
| EmptySet of empty_set
| NoneExpr of none_expr
(* Applications, map look-up and parenthesised expressions. *)
| FunCall of fun_call
| ConstrApp of constr_app
| SomeApp of (c_Some * arguments) reg
| MapLookUp of map_lookup reg
| ParExpr of expr par
2019-02-26 01:29:29 +04:00
(* Parenthesised, comma-separated, non-empty list of expressions. *)
and tuple = (expr, comma) nsepseq par
2019-02-26 01:29:29 +04:00
(* Empty list: between parentheses, an opening and a closing bracket
   followed by a colon and a type expression. *)
and empty_list =
(lbracket * rbracket * colon * type_expr) par
2019-02-26 01:29:29 +04:00
(* Empty set: between parentheses, an opening and a closing brace
   followed by a colon and a type expression. *)
and empty_set =
(lbrace * rbrace * colon * type_expr) par
2019-02-26 01:29:29 +04:00
(* The constructor None with a type: between parentheses, the
   constructor, a colon and a type expression. *)
and none_expr =
(c_None * colon * type_expr) par
2019-02-26 01:29:29 +04:00
(* Call: a function name followed by its arguments.  Also used for
   procedure calls (constructor ProcCall of single_instr). *)
and fun_call = (fun_name * arguments) reg
2019-02-26 01:29:29 +04:00
(* Arguments are a tuple, hence parenthesised and never empty. *)
and arguments = tuple
2019-02-26 01:29:29 +04:00
(* Application of a data constructor to its arguments. *)
and constr_app = (constr * arguments) reg
2019-02-26 01:29:29 +04:00
(* Map look-up: the name of the map, a dot, and an index expression
   between brackets.  Note that map_name is typed as variable here,
   not with the type map_name declared among the literals. *)
and map_lookup = {
map_name : variable;
selector : dot;
index : expr brackets
}
2019-02-26 01:29:29 +04:00
(* Patterns *)
(* A pattern is a non-empty sequence of core patterns separated by the
   cons symbol, with the region of the whole sequence.  A sequence of
   length one is thus a plain core pattern. *)
and pattern = (core_pattern, cons) nsepseq reg
2019-02-26 01:29:29 +04:00
(* Core patterns: variable, wildcard, integer, bytes and string
   literals, the constants Unit, False, True and None, Some applied to
   a parenthesised core pattern, list patterns, and parenthesised
   tuples of core patterns.  The literal cases have the same payloads
   as the corresponding cases of expr. *)
and core_pattern =
2019-02-26 01:29:29 +04:00
PVar of Lexer.lexeme reg
| PWild of wild
| PInt of (Lexer.lexeme * Z.t) reg
| PBytes of (Lexer.lexeme * MBytes.t) reg
| PString of Lexer.lexeme reg
| PUnit of c_Unit
| PFalse of c_False
| PTrue of c_True
| PNone of c_None
| PSome of (c_Some * core_pattern par) reg
| PList of list_pattern
| PTuple of (core_pattern, comma) nsepseq par
2019-02-26 01:29:29 +04:00
(* List patterns.  Sugar is a bracketed, comma-separated sequence of
   core patterns (sepseq, presumably allowing the empty sequence --
   the type is defined outside this file).  Raw is a parenthesised
   core pattern, cons symbol and pattern. *)
and list_pattern =
Sugar of (core_pattern, comma) sepseq brackets
| Raw of (core_pattern * cons * pattern) par
2019-02-26 01:29:29 +04:00
(* Projecting regions *)
(* Each function below maps a node of the given syntactic category to
   a region.  NOTE(review): presumably the region covering the whole
   node -- confirm against the implementation.  No projection is
   declared here for the type pattern, only for core_pattern. *)
val type_expr_to_region : type_expr -> Region.t
val expr_to_region : expr -> Region.t
val instr_to_region : instruction -> Region.t
val core_pattern_to_region : core_pattern -> Region.t
val local_decl_to_region : local_decl -> Region.t
(* Printing *)
(* Takes a whole AST and returns unit, so it works by side effect.
   NOTE(review): presumably prints the tokens of the tree in source
   order; the output channel and format are not visible from this
   interface -- confirm against the implementation. *)
val print_tokens : t -> unit