typecheck.ml 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253
  1. (*
  2. * Do a number of checks:
  3. * - A void function must not return a value.
  4. * - A non-void function must return a value of the correct type.
  5. * - Array indices must be of type integer.
  6. * - The number of array indices must match the number of array dimensions.
  7. * - The type on the right-hand side of an assignment must match the type on
  8. * the left-hand side.
  9. * - The number of arguments used for a function call must match the number of
  10. * parameters for that function.
  11. * - The types of the function arguments must match the types of parameters.
  12. * - The operands of a unary or binary operation must have valid types.
  13. * - The predicate expression of an if, while, or do-while statement must be
  14. * a boolean.
  15. * - Only values having a basic type can be type cast.
  16. *)
  17. open Printf
  18. open Types
  19. open Util
  20. open Stringify
  (* Number of dimensions of an array type.
   * Raises InvalidNode when the given type is not an ArrayDims. *)
  let array_depth ctype =
    match ctype with
    | ArrayDims (_, dimensions) -> List.length dimensions
    | _ -> raise InvalidNode
  (* Reduce a type to a comparable (base type, dimension count) pair.
   * Any type that is not an ArrayDims is paired with a count of 0. *)
  let spec ctype =
    match ctype with
    | ArrayDims (base, dimensions) -> (base, List.length dimensions)
    | scalar -> (scalar, 0)
  (* Require [node] to have type [expected]; two types agree when their
   * [spec] pairs (base type and number of dimensions) are equal.
   * Raises NodeError on [node] otherwise, using [msg] when it is non-empty
   * and a generated "type mismatch" message when it is empty. *)
  let check_type ?(msg="") expected node =
    let actual = typeof node in
    if spec actual = spec expected then ()
    else
      let text =
        if msg = "" then
          sprintf "type mismatch: expected type %s, got %s"
            (type2str expected) (type2str actual)
        else
          msg
      in
      raise (NodeError (node, text))
  (* Operand types that each operator may be applied to *)
  let op_types op =
    match op with
    | Add | Mul | Eq | Ne -> [Bool; Int; Float]
    | Neg | Sub | Div | Lt | Le | Gt | Ge -> [Int; Float]
    | Mod -> [Int]
    | Not | And | Or -> [Bool]
  (* Result type of applying an operator to operands of type [opnd_type]:
   * arithmetic operators keep the operand type, while logical and
   * comparison operators always yield Bool. *)
  let op_result_type opnd_type op =
    match op with
    | Neg | Add | Sub | Mul | Div | Mod -> opnd_type
    | Not | And | Or | Eq | Ne | Lt | Le | Gt | Ge -> Bool
  (* Require the type of [node] to be one of [allowed_types].
   * [desc] names the operation being applied (e.g. an operator or
   * "typecast") and is only used in the error message.
   * Raises NodeError on [node] when its type is not allowed. *)
  let check_type_op allowed_types desc node =
    let actual = typeof node in
    if List.mem actual allowed_types then ()
    else
      raise (NodeError (node, sprintf
        "%s cannot be applied to type %s, only to %s"
        desc (type2str actual) (types2str allowed_types)))
  (* Require the number of indices in [dims] to equal the number of
   * dimensions of the declared array type [dec_type].
   * Raises NodeError on [errnode] when the counts differ; array_depth
   * raises InvalidNode when [dec_type] is not an array type. *)
  let check_dims_match dims dec_type errnode =
    let expected = array_depth dec_type in
    let got = List.length dims in
    if got <> expected then
      raise (NodeError (errnode, sprintf
        "dimension mismatch: expected %d indices, got %d" expected got))
  (* Type-check [node] and everything below it, returning the rebuilt node.
   *
   * Expression nodes (function calls, operators, conditional expressions,
   * type casts, Dim nodes, constants and variable uses) get a [Type]
   * annotation prepended to their annotation list. Statement-like nodes are
   * rebuilt with checked children. Node kinds without a dedicated case are
   * traversed through [transform_children].
   *
   * Raises NodeError when one of the checks fails. A constant zero integer
   * divisor only produces a warning through [node_warning]. *)
  let rec typecheck node =
    (* Traverse [node] first, then require the result to have type [ctype] *)
    let check_trav ctype node =
      let node = typecheck node in
      check_type ctype node;
      node
    in
    match node with
    (* The number and types of call arguments must match the parameters of
     * the called function; the call gets the function's return type *)
    | FunUse ((FunDec (ret_type, name, params, _) as dec), args, ann)
    | FunUse ((FunDef (_, ret_type, name, params, _, _) as dec), args, ann) ->
      let nargs = List.length args in
      let nparams = List.length params in
      if nargs <> nparams then begin
        let msg = sprintf
          "function \"%s\" expects %d arguments, got %d"
          name nparams nargs
        in
        raise (NodeError (node, msg))
      end;
      let args = List.map typecheck args in
      (* The lengths are known to be equal here, so iter2 cannot fail *)
      List.iter2 (fun arg param -> check_type (typeof param) arg) args params;
      FunUse (dec, args, Type ret_type :: ann)

    (* Operators match operand types and get a new type based on the
     * operator *)
    | Monop (op, opnd, ann) ->
      let opnd = typecheck opnd in
      let desc = sprintf "unary operator \"%s\"" (op2str op) in
      check_type_op (op_types op) desc opnd;
      Monop (op, opnd, Type (op_result_type (typeof opnd) op) :: ann)

    | Binop (op, left, right, ann) ->
      let left = typecheck left in
      let right = typecheck right in
      let desc = sprintf "binary operator \"%s\"" (op2str op) in
      (* The left operand must be valid for the operator, and the right
       * operand must have the same type as the left one *)
      check_type_op (op_types op) desc left;
      check_type (typeof left) right;
      (* Warn about a constant zero integer divisor; integer modulo divides
       * as well, so it is covered too *)
      begin
        match (op, right) with
        | ((Div | Mod), Const (IntVal 0, _)) ->
          node_warning right "division by zero"
        | _ -> ()
      end;
      Binop (op, left, right, Type (op_result_type (typeof left) op) :: ann)

    (* Conditions must be bool, and the false-branch type must match the
     * true-branch type *)
    | Cond (cond, texpr, fexpr, ann) ->
      let cond = check_trav Bool cond in
      let texpr = typecheck texpr in
      let fexpr = check_trav (typeof texpr) fexpr in
      Cond (cond, texpr, fexpr, Type (typeof texpr) :: ann)

    (* Only basic types can be typecasted *)
    | TypeCast (ctype, value, ann) ->
      let value = typecheck value in
      check_type_op [Bool; Int; Float] "typecast" value;
      TypeCast (ctype, value, Type ctype :: ann)

    (* Array allocation dimensions must have type int *)
    | Allocate (dec, dims, ann) ->
      Allocate (dec, List.map (check_trav Int) dims, ann)

    (* Array dimensions are always integers *)
    | Dim (name, ann) ->
      Dim (name, Type Int :: ann)

    (* Functions and parameters must be traversed to give types to Dim nodes *)
    (*
    | FunDec (ret_type, name, params, ann) ->
      FunDec (ret_type, name, List.map typecheck params, ann)
    | Param (ArrayDims (ctype, dims), name, ann) ->
      Param (ArrayDims (ctype, List.map typecheck dims), name, ann)
    *)

    (* Void functions may have no return statement, other functions must have
     * a return statement of valid type *)
    | FunDef (export, ret_type, name, params, body, ann) ->
      let params = List.map typecheck params in
      let body = typecheck body in
      (* Only a Return that is the final statement of the body is found *)
      let rec find_return = function
        | [] -> None
        | [Return (value, _) as ret] -> Some (ret, typeof value)
        | _ :: tl -> find_return tl
      in
      begin
        match (ret_type, find_return (block_body body)) with
        | (Void, Some (ret, _)) ->
          raise (NodeError (ret, "void function should not have a return value"))
        | ((Bool | Int | Float), None) ->
          let msg = sprintf
            "expected return value of type %s for function \"%s\""
            (type2str ret_type) name
          in
          raise (NodeError (node, msg))
        (* Structural comparison: types are values, not identities *)
        | ((Bool | Int | Float), Some (ret, t)) when t <> ret_type ->
          let msg = sprintf
            "function \"%s\" has return type %s, got %s"
            name (type2str ret_type) (type2str t)
          in
          raise (NodeError (ret, msg))
        | _ -> FunDef (export, ret_type, name, params, body, ann)
      end

    (* Conditions must have type bool *)
    | If (cond, body, ann) ->
      If (check_trav Bool cond, typecheck body, ann)
    | IfElse (cond, tbody, fbody, ann) ->
      IfElse (check_trav Bool cond, typecheck tbody, typecheck fbody, ann)
    | While (cond, body, ann) ->
      While (check_trav Bool cond, typecheck body, ann)
    | DoWhile (cond, body, ann) ->
      DoWhile (check_trav Bool cond, typecheck body, ann)

    (* Constants *)
    | Const (BoolVal value, ann) ->
      Const (BoolVal value, Type Bool :: ann)
    | Const (IntVal value, ann) ->
      (* Do a bound check on integers (use Int32 because default ints in
       * ocaml are 31- or 63-bit) *)
      let cmpval = Nativeint.of_int value in
      let min = Nativeint.of_int32 Int32.min_int in
      let max = Nativeint.of_int32 Int32.max_int in
      if cmpval < min || cmpval > max then (
        raise (NodeError (node, "integer value out of range (signed 32-bit)"))
      );
      Const (IntVal value, Type Int :: ann)
    | Const (FloatVal value, ann) ->
      Const (FloatVal value, Type Float :: ann)

    (* Variables inherit the type of their declaration *)
    | VarUse (dec, None, ann) ->
      VarUse (dec, None, Type (typeof dec) :: ann)
    (* An indexed array use has the base type of the array *)
    | VarUse (dec, Some dims, ann) ->
      let dims = List.map typecheck dims in
      List.iter (check_type Int) dims;
      check_dims_match dims (typeof dec) node;
      VarUse (dec, Some dims, Type (basetypeof dec) :: ann)

    (* Array pointers cannot be re-assigned, because array dimension reduction
     * makes assumptions about dimensions of an array *)
    | VarLet (dec, None, _, _) when is_array dec ->
      raise (NodeError (node, "cannot assign value to array pointer after \
                               initialisation"))

    (* Assigned values must match variable declaration *)
    | VarLet (dec, None, value, ann) ->
      VarLet (dec, None, check_trav (typeof dec) value, ann)

    | VarLet (dec, Some dims, value, ann) ->
      (* Number of assigned indices must match array definition *)
      check_dims_match dims (typeof dec) node;
      (* Array indices must be ints *)
      let dims = List.map typecheck dims in
      List.iter (check_type Int) dims;
      (* Assigned value must match array base type *)
      let value = typecheck value in
      check_type (basetypeof dec) value;
      VarLet (dec, Some dims, value, ann)

    (* ArrayConst initialisations are transformed during desugaring, so any
     * occurrences that are left are illegal *)
    | ArrayConst _ ->
      raise (NodeError (node, "array constants can only be used in array \
                               initialisation"))

    | _ -> transform_children typecheck node
  (* Entry point of the type checking phase: type-checks the tree of an Ast
   * input and raises InvalidInput for any other kind of input. *)
  let phase input =
    match input with
    | Ast tree -> Ast (typecheck tree)
    | _ -> raise (InvalidInput "typecheck")