parser.mly 7.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234
  %{
  (**
   * Parser for the CiviC language.
   *
   * Note that some shift/reduce conflicts exist, but these need not be solved
   * since menhir can automatically resolve them
   *)
  open Lexing
  open Types

  (* Build a one-element list holding the Loc computed by
     Util.loc_from_lexpos from a start and a stop position. *)
  let loc start stop = [Loc (Util.loc_from_lexpos start stop)]

  (* Wrap every element of [dims] in a Dim node; all nodes share [dimloc].
     Element order is preserved. *)
  let make_dims dimloc dims = List.map (fun dim -> Dim (dim, dimloc)) dims

  (* Wrap every element of [args] in an Arg node, preserving order. *)
  let make_args args = List.map (fun arg -> Arg arg) args
  %}
  (* Tokens: brackets and separators *)
  %token LPAREN RPAREN
  %token LBRACK RBRACK
  %token LBRACE RBRACE
  %token SEMICOL COMMA
  (* Tokens: operators *)
  %token NOT
  %token ADD SUB MUL DIV MOD
  %token EQ NE LT LE GT GE
  %token AND OR
  (* Tokens: keywords *)
  %token ASSIGN
  %token IF ELSE WHILE DO FOR RETURN
  %token EXTERN EXPORT
  %token INT BOOL FLOAT VOID
  %token EOF
  (* Tokens carrying a value *)
  %token <bool> BOOL_CONST
  %token <float> FLOAT_CONST
  %token <int> INT_CONST
  %token <string> ID

  (* Precedence, listed from lowest to highest.
     NEG and CAST are not produced by the lexer; they are only referenced
     through %prec annotations in the expr rule. *)
  (*%right ASSIGN*)
  %left OR
  %left AND
  %left EQ NE
  %left LT LE GT GE
  %left ADD SUB
  %left MUL DIV MOD
  %right NOT NEG CAST
  %nonassoc IF
  %nonassoc ELSE

  (* Start symbol and the type of the value it produces *)
  %start <Types.node> program
  44. %%
  (* Left-recursive list. Elements are consed onto the front as they are
     parsed, so the result is in reverse order: apply List.rev to obtain
     the original order. *)
  lreclist(x):
    | (* empty *)
      { [] }
    | seen=lreclist(x) next=x
      { next :: seen }
  (* Shorthand for a comma-separated list, built on separated_list *)
  %inline clist(x):
    | items=separated_list(COMMA, x)
      { items }
  (* Basic value types. VOID is not included here; it is accepted
     separately by fun_header. *)
  basic_type:
    | INT   { Int }
    | FLOAT { Float }
    | BOOL  { Bool }
  (* Entry point: a sequence of declarations followed by end of input.
     The location covers the whole production. *)
  program:
    | decls=list(decl) EOF
      { let whole = loc $startpos $endpos in
        Program (decls, whole) }
  (* Top-level declaration: function declaration or definition, or global
     variable declaration or definition. *)
  decl:
    (* function: use location of function name *)
    | EXTERN hdr=fun_header SEMICOL
      { let (t, n, p, nameloc) = hdr in
        FunDec (t, n, p, nameloc) }

    | export=boption(EXPORT) hdr=fun_header LBRACE body=fun_body RBRACE
      { let (t, n, p, nameloc) = hdr in
        FunDef (export, t, n, p, Block body, nameloc) }

    (* global variable declaration: use location of variable name *)
    | EXTERN ctype=basic_type name=ID SEMICOL
      { (* Use the name location, like every other global declaration,
           instead of the location of the whole production. *)
        let loc = loc $startpos(name) $endpos(name) in
        GlobalDec (ctype, name, loc) }

    (* dimlist yields its elements in reverse, hence the List.rev *)
    | EXTERN ctype=basic_type LBRACK dims=dimlist RBRACK name=ID SEMICOL
      { let loc = loc $startpos(name) $endpos(name) in
        GlobalDec (ArrayDims (ctype, List.rev dims), name, loc) }

    | export=boption(EXPORT) ctype=basic_type name=ID SEMICOL
      { let loc = loc $startpos(name) $endpos(name) in
        GlobalDef (export, ctype, name, None, loc) }

    | export=boption(EXPORT) ctype=basic_type name=ID ASSIGN init=expr SEMICOL
      { let loc = loc $startpos(name) $endpos(name) in
        GlobalDef (export, ctype, name, Some init, loc) }

    | export=boption(EXPORT) ctype=basic_type LBRACK dims=clist(expr) RBRACK
      name=ID SEMICOL
      { let loc = loc $startpos(name) $endpos(name) in
        GlobalDef (export, ArrayDims (ctype, dims), name, None, loc) }
  (* Function header. Produces the tuple
     (return type, name, parameters, location), where the location is
     that of the function name. *)
  fun_header:
    | rtype=basic_type fname=ID LPAREN ps=clist(param) RPAREN
      { let nameloc = loc $startpos(fname) $endpos(fname) in
        (rtype, fname, ps, nameloc) }
    | VOID fname=ID LPAREN ps=clist(param) RPAREN
      { let nameloc = loc $startpos(fname) $endpos(fname) in
        (Void, fname, ps, nameloc) }
  (* Function parameter, scalar or array. The location is that of the
     parameter name. *)
  param:
    | ptype=basic_type pname=ID
      { let nameloc = loc $startpos(pname) $endpos(pname) in
        Param (ptype, pname, nameloc) }
    | elem=basic_type LBRACK rev_dims=dimlist RBRACK pname=ID
      { let nameloc = loc $startpos(pname) $endpos(pname) in
        (* dimlist accumulates in reverse; restore source order *)
        let dims = List.rev rev_dims in
        Param (ArrayDims (elem, dims), pname, nameloc) }
  (* One or more comma-separated dimension identifiers. Each new Dim is
     consed onto the front, so the result is in reverse source order.
     Every Dim carries the location of its own identifier. *)
  dimlist:
    | id=ID
      { let here = loc $startpos(id) $endpos(id) in
        [Dim (id, here)] }
    | earlier=dimlist COMMA id=ID
      { let here = loc $startpos(id) $endpos(id) in
        Dim (id, here) :: earlier }
  (* Function body: variable declarations, then local functions, then
     statements, then an optional return statement. The result list starts
     with a VarDecs node and a LocalFuns node, followed by the statements
     and the return statement if present. *)
  fun_body:
    | rev_vars=lreclist(var_dec) funs=list(local_fun_dec)
      stats=list(statement) ret=loption(return_statement)
      { let vars = List.rev rev_vars in
        let trailing = stats @ ret in
        VarDecs vars :: LocalFuns funs :: trailing }
  (* Return statement, produced as a one-element list so that it can be
     used with loption. The location is that of the returned expression. *)
  return_statement:
    | RETURN result=expr SEMICOL
      { let valloc = loc $startpos(result) $endpos(result) in
        [Return (result, valloc)] }
  (* Function defined inside another function body. It is built as a FunDef
     whose export flag is always false; the location is that of the
     function name, as provided by fun_header. *)
  local_fun_dec:
    | header=fun_header LBRACE stmts=fun_body RBRACE
      { let (rtype, fname, params, nameloc) = header in
        FunDef (false, rtype, fname, params, Block stmts, nameloc) }
  (* Local variable declaration, scalar or array, with or without an
     initializer. The location is always that of the variable name. *)
  var_dec:
    (* scalar, no initializer *)
    | vtype=basic_type vname=ID SEMICOL
      { let nameloc = loc $startpos(vname) $endpos(vname) in
        VarDec (vtype, vname, None, nameloc) }
    (* scalar with initializer *)
    | vtype=basic_type vname=ID ASSIGN rhs=expr SEMICOL
      { let nameloc = loc $startpos(vname) $endpos(vname) in
        VarDec (vtype, vname, Some rhs, nameloc) }
    (* array, no initializer *)
    | elem=basic_type LBRACK sizes=clist(expr) RBRACK vname=ID SEMICOL
      { let nameloc = loc $startpos(vname) $endpos(vname) in
        let vtype = ArrayDims (elem, sizes) in
        VarDec (vtype, vname, None, nameloc) }
    (* array with initializer *)
    | elem=basic_type LBRACK sizes=clist(expr) RBRACK vname=ID ASSIGN
      rhs=expr SEMICOL
      { let nameloc = loc $startpos(vname) $endpos(vname) in
        let vtype = ArrayDims (elem, sizes) in
        VarDec (vtype, vname, Some rhs, nameloc) }
  (* Statements: assignments, call statements, conditionals and loops. *)
  statement:
    (* assignment: use location of assigned variable name *)
    | name=ID ASSIGN value=expr SEMICOL
      { Assign (name, None, value, loc $startpos(name) $endpos(name)) }

    (* indexed assignment: location runs from the name to the closing bracket *)
    | name=ID LBRACK dims=clist(expr) brk=RBRACK ASSIGN value=expr SEMICOL
      { Assign (name, Some dims, value, loc $startpos(name) $endpos(brk)) }

    (* function call used as a statement: use location of function name *)
    | name=ID LPAREN args=clist(expr) RPAREN SEMICOL
      { Expr (FunCall (name, make_args args, loc $startpos(name) $endpos(name))) }

    (* if-statements and (do-)while-loops: use location of condition *)
    (* IF is declared with lower precedence than ELSE, so when an ELSE
       follows, it is shifted and attaches to the nearest if. *)
    | IF LPAREN cond=expr RPAREN body=block %prec IF
      { (* Use the condition location, as the other conditionals and loops
           do, instead of the location of the whole statement. *)
        If (cond, Block body, loc $startpos(cond) $endpos(cond)) }

    | IF LPAREN c=expr RPAREN t=block ELSE f=block %prec ELSE
      { IfElse (c, Block t, Block f, loc $startpos(c) $endpos(c)) }

    | WHILE LPAREN cond=expr RPAREN body=block
      { While (cond, Block body, loc $startpos(cond) $endpos(cond)) }

    | DO body=block WHILE LPAREN cond=expr RPAREN SEMICOL
      { DoWhile (cond, Block body, loc $startpos(cond) $endpos(cond)) }

    (* for-loop: use location of counter id *)
    (* without an explicit step, the step is the integer constant 1,
       created with an empty location list *)
    | FOR LPAREN INT cnt=ID ASSIGN start=expr COMMA stop=expr RPAREN body=block
      { let loc = loc $startpos(cnt) $endpos(cnt) in
        For (cnt, start, stop, Const (IntVal 1, []), Block body, loc) }

    | FOR LPAREN INT cnt=ID ASSIGN start=expr COMMA stop=expr COMMA step=expr
      RPAREN body=block
      { let loc = loc $startpos(cnt) $endpos(cnt) in
        For (cnt, start, stop, step, Block body, loc) }
  (* Body of a conditional or loop: either a braced sequence of statements
     or a single statement. Both forms produce a statement list. *)
  block:
    | LBRACE body=list(statement) RBRACE
      { body }
    | single=statement
      { [single] }
  (* Expressions. Unless noted, the location of a node covers the whole
     production. *)
  expr:
    (* function call *)
    | callee=ID LPAREN args=clist(expr) RPAREN
      { FunCall (callee, make_args args, loc $startpos $endpos) }
    (* parenthesized expression: the inner node is returned unchanged *)
    | LPAREN inner=expr RPAREN
      { inner }
    (* plain variable *)
    | id=ID
      { Var (id, None, loc $startpos $endpos) }
    (* binary operation; ambiguity is settled by the operator precedences *)
    | lhs=expr op=binop rhs=expr
      { Binop (op, lhs, rhs, loc $startpos $endpos) }
    (* unary minus, with the precedence of the NEG pseudo-token *)
    | SUB operand=expr %prec NEG
      { Monop (Neg, operand, loc $startpos $endpos) }
    (* logical negation *)
    | NOT operand=expr
      { Monop (Not, operand, loc $startpos $endpos) }
    (* type cast, with the precedence of the CAST pseudo-token *)
    | LPAREN target=basic_type RPAREN operand=expr %prec CAST
      { TypeCast (target, operand, loc $startpos $endpos) }
    (* constants *)
    | f=FLOAT_CONST
      { Const (FloatVal f, loc $startpos $endpos) }
    | i=INT_CONST
      { Const (IntVal i, loc $startpos $endpos) }
    | b=BOOL_CONST
      { Const (BoolVal b, loc $startpos $endpos) }
    (* variable followed by a bracketed expression list *)
    | id=ID indices=array_const
      { Var (id, Some indices, loc $startpos $endpos) }
    (* bracketed expression list on its own *)
    | elems=array_const
      { ArrayConst (elems, loc $startpos $endpos) }
  (* Binary operators. The rule is inlined into expr so that the precedence
     declarations of the individual operator tokens apply. *)
  %inline binop:
    (* arithmetic *)
    | ADD { Add } | SUB { Sub }
    | MUL { Mul } | DIV { Div } | MOD { Mod }
    (* comparison *)
    | EQ { Eq } | NE { Ne }
    | LT { Lt } | LE { Le }
    | GT { Gt } | GE { Ge }
    (* logical *)
    | AND { And } | OR { Or }
  (* Bracketed, comma-separated list of expressions. Produces the list of
     expressions; the brackets themselves are dropped. *)
  array_const:
    | LBRACK elems=clist(expr) RBRACK
      { elems }
  186. %%