typecheck.ml 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271
  1. (*
  2. * Do a number of checks:
  3. * - A void function must not return a value.
  4. * - A non-void function must return a value of the correct type.
  5. * - Array indices must be of type integer.
  6. * - The number of array indices must match the number of array dimensions.
  7. * - The type on the right-hand side of an assignment must match the type on
  8. * the left-hand side.
  9. * - The number of arguments used for a function call must match the number of
  10. * parameters for that function.
  11. * - The types of the function arguments must match the types of parameters.
  12. * - The operands of a unary or binary operation must have valid types.
  13. * - The predicate expression of an if, while, or do-while statement must be
  14. * a boolean.
  15. * - Only values of a basic type can be type cast.
  16. *)
  17. open Printf
  18. open Types
  19. open Util
  20. open Stringify
  (* Render a list of types for use in error messages: every type is
   * stringified with type2str and the results are joined with " or ".
   * An empty list yields the empty string.
   * ctype list -> string *)
  let types2str ctypes =
    String.concat " or " (List.map type2str ctypes)
  (* Number of dimensions of an array type.
   * Raises InvalidNode for any type that is not an ArrayDims.
   * ctype -> int *)
  let array_depth ctype =
    match ctype with
    | ArrayDims (_, dims) -> List.length dims
    | _ -> raise InvalidNode
  (* Reduce a type to the pair (base type, number of dimensions).
   * Types other than ArrayDims are returned unchanged with a dimension
   * count of 0.
   * ctype -> ctype * int *)
  let spec ctype =
    match ctype with
    | ArrayDims (base, dims) -> (base, List.length dims)
    | _ -> (ctype, 0)
  (* Stringify a type for use in a type mismatch message. For array types
   * only the base type and the dimension count are shown: the base type is
   * followed by square brackets holding the result of
   * repeat "," (number of dimensions - 1).
   * NOTE(review): presumably repeat s n concatenates n copies of s, giving
   * one comma between each pair of dimensions; confirm against Util.
   * ctype -> string *)
  let type2str_error ctype =
    match ctype with
    | ArrayDims (base, dims) ->
      let commas = repeat "," (List.length dims - 1) in
      type2str base ^ "[" ^ commas ^ "]"
    | _ ->
      type2str ctype
  (* Verify that a node has the expected type.
   * Two types are considered equal when their spec values are equal, i.e.
   * same base type and same number of dimensions.
   * msg:      optional replacement for the default mismatch message; the
   *           empty string (the default) selects the default message
   * expected: the type the node must have
   * node:     the node to check, its type is obtained with typeof
   * Raises NodeError on the node when the types differ. *)
  let check_type ?(msg="") expected node =
    let actual = typeof node in
    if spec actual = spec expected then ()
    else
      let text =
        if msg = "" then
          sprintf "type mismatch: expected type %s, got %s"
            (type2str_error expected) (type2str_error actual)
        else
          msg
      in
      raise (NodeError (node, text))
  (* Operand types that each operator accepts.
   * operator -> ctype list *)
  let op_types op =
    let numeric = [Int; Float] in
    match op with
    | Mod -> [Int]
    | Not | And | Or -> [Bool]
    | Neg | Sub | Div | Lt | Le | Gt | Ge -> numeric
    | Add | Mul | Eq | Ne -> Bool :: numeric
  (* Result type of applying an operator to operands of type opnd_type:
   * arithmetic operators keep the operand type, logical and comparison
   * operators always produce Bool. *)
  let op_result_type opnd_type op =
    match op with
    | Neg | Add | Sub | Mul | Div | Mod -> opnd_type
    | Not | And | Or | Eq | Ne | Lt | Le | Gt | Ge -> Bool
  (* Verify that the type of a node is one of the types an operation accepts.
   * allowed_types: the operand types the operation may be applied to
   * desc:          description of the operation, used to start the message
   * node:          the operand node, its type is obtained with typeof
   * Raises NodeError on the node when its type is not in allowed_types. *)
  let check_type_op allowed_types desc node =
    let actual = typeof node in
    if List.mem actual allowed_types then ()
    else
      let text =
        sprintf "%s cannot be applied to type %s, only to %s"
          desc (type2str actual) (types2str allowed_types)
      in
      raise (NodeError (node, text))
  (* Verify that the number of indices matches the number of dimensions of
   * the declared array type.
   * dims:     the list of index expressions that is used
   * dec_type: the declared type; array_depth raises InvalidNode when this is
   *           not an ArrayDims type
   * errnode:  the node to report the error on
   * Raises NodeError on errnode when the two counts differ. *)
  let check_dims_match dims dec_type errnode =
    let expected = array_depth dec_type in
    let got = List.length dims in
    (* Compare the counts structurally; physical inequality is not meant for
     * comparing values *)
    if got <> expected then begin
      let msg = sprintf
        "dimension mismatch: expected %d indices, got %d" expected got
      in
      raise (NodeError (errnode, msg))
    end
  (* Typecheck a node and everything below it.
   * Expression nodes are returned with a Type annotation prepended to their
   * annotation list; statement nodes are returned with typechecked children.
   * Node kinds without a case of their own are handled by applying typecheck
   * to their children through transform_children.
   * Raises NodeError on the first violation that is found. *)
  let rec typecheck node =
    (* Typecheck a child node and require its type to be ctype *)
    let check_trav ctype node =
      let node = typecheck node in
      check_type ctype node;
      node
    in
    match node with
    (* The number and types of arguments must match the parameters of the
     * called function, the call gets the return type of the function *)
    | FunUse ((FunDec (ret_type, name, params, _) as dec), args, ann)
    | FunUse ((FunDef (_, ret_type, name, params, _, _) as dec), args, ann) ->
      begin
        match (List.length args, List.length params) with
        | (nargs, nparams) when nargs <> nparams ->
          let msg = sprintf
            "function \"%s\" expects %d arguments, got %d"
            name nparams nargs
          in
          raise (NodeError (node, msg))
        | _ ->
          let args = List.map typecheck args in
          let check_arg_type arg param =
            check_type (typeof param) arg
          in
          List.iter2 check_arg_type args params;
          FunUse (dec, args, Type ret_type :: ann)
      end

    (* Operators match operand types and get a new type based on the operator *)
    | Monop (op, opnd, ann) ->
      let opnd = typecheck opnd in
      let desc = sprintf "unary operator \"%s\"" (op2str op) in
      check_type_op (op_types op) desc opnd;
      Monop (op, opnd, Type (op_result_type (typeof opnd) op) :: ann)

    | Binop (op, left, right, ann) ->
      let left = typecheck left in
      let right = typecheck right in
      let desc = sprintf "binary operator \"%s\"" (op2str op) in
      (* The left operand must be valid for the operator, the right operand
       * must have the same type as the left operand *)
      check_type_op (op_types op) desc left;
      check_type (typeof left) right;

      (* Warn about division by a literal integer zero *)
      begin
        match (op, right) with
        | (Div, Const (IntVal 0, _)) -> node_warning right "division by zero"
        | _ -> ()
      end;

      Binop (op, left, right, Type (op_result_type (typeof left) op) :: ann)

    (* Conditions must be bool, and the type of the false branch must match
     * the type of the true branch *)
    | Cond (cond, texpr, fexpr, ann) ->
      let cond = check_trav Bool cond in
      let texpr = typecheck texpr in
      let fexpr = check_trav (typeof texpr) fexpr in
      Cond (cond, texpr, fexpr, Type (typeof texpr) :: ann)

    (* Only basic types can be typecasted *)
    | TypeCast (ctype, value, ann) ->
      let value = typecheck value in
      check_type_op [Bool; Int; Float] "typecast" value;
      TypeCast (ctype, value, Type ctype :: ann)

    (* Array allocation dimensions must have type int *)
    | Allocate (dec, dims, ann) ->
      Allocate (dec, List.map (check_trav Int) dims, ann)

    (* Array dimensions are always integers *)
    | Dim (name, ann) ->
      Dim (name, Type Int :: ann)

    (* Functions and parameters must be traversed to give types to Dim nodes *)
    (*
    | FunDec (ret_type, name, params, ann) ->
      FunDec (ret_type, name, List.map typecheck params, ann)
    | Param (ArrayDims (ctype, dims), name, ann) ->
      Param (ArrayDims (ctype, List.map typecheck dims), name, ann)
    *)

    (* Void functions may have no return statement, other functions must have a
     * return statement of valid type *)
    | FunDef (export, ret_type, name, params, body, ann) ->
      let params = List.map typecheck params in
      let body = typecheck body in

      (* Yields the Return node and the type of its value, but only when the
       * Return is the last statement of the list *)
      let rec find_return = function
        | [] -> None
        | [Return (value, _) as ret] -> Some (ret, typeof value)
        | _ :: tl -> find_return tl
      in

      begin
        match (ret_type, find_return (block_body body)) with
        | (Void, Some (ret, _)) ->
          raise (NodeError (ret, "void function should not have a return value"))

        | ((Bool | Int | Float), None) ->
          let msg = sprintf
            "expected return value of type %s for function \"%s\""
            (type2str ret_type) name
          in
          raise (NodeError (node, msg))

        (* Types are compared structurally: physical inequality on immutable
         * values is implementation-dependent *)
        | ((Bool | Int | Float), Some (ret, t)) when t <> ret_type ->
          let msg = sprintf
            "function \"%s\" has return type %s, got %s"
            name (type2str ret_type) (type2str t)
          in
          raise (NodeError (ret, msg))

        | _ -> FunDef (export, ret_type, name, params, body, ann)
      end

    (* Conditions must have type bool *)
    | If (cond, body, ann) ->
      If (check_trav Bool cond, typecheck body, ann)
    | IfElse (cond, tbody, fbody, ann) ->
      IfElse (check_trav Bool cond, typecheck tbody, typecheck fbody, ann)
    | While (cond, body, ann) ->
      While (check_trav Bool cond, typecheck body, ann)
    | DoWhile (cond, body, ann) ->
      DoWhile (check_trav Bool cond, typecheck body, ann)

    (* Constants *)
    | Const (BoolVal value, ann) ->
      Const (BoolVal value, Type Bool :: ann)
    | Const (IntVal value, ann) ->
      (* Do a bound check on integers, using the limits of Int32 because
       * default ints in ocaml are 31- or 63-bit *)
      let cmpval = Nativeint.of_int value in
      let min = Nativeint.of_int32 Int32.min_int in
      let max = Nativeint.of_int32 Int32.max_int in
      if cmpval < min || cmpval > max then (
        raise (NodeError (node, "integer value out of range (signed 32-bit)"))
      );
      Const (IntVal value, Type Int :: ann)
    | Const (FloatVal value, ann) ->
      Const (FloatVal value, Type Float :: ann)

    (* Extern array variables are transformed to imported functions, so the
     * pointer cannot be passed *)
    | VarUse (GlobalDec (ArrayDims _, _, _), None, _) ->
      raise (NodeError (node, "imported array pointers may only be \
                               dereferenced, not used directly"))

    (* Variables inherit the type of their declaration *)
    | VarUse (dec, None, ann) ->
      VarUse (dec, None, Type (typeof dec) :: ann)

    (* Indexed variables get the base type of their declaration; all indices
     * must be ints and their number must match the declared dimensions *)
    | VarUse (dec, Some dims, ann) ->
      let dims = List.map typecheck dims in
      List.iter (check_type Int) dims;
      check_dims_match dims (typeof dec) node;
      VarUse (dec, Some dims, Type (basetypeof dec) :: ann)

    (* Array pointers cannot be re-assigned, because array dimension reduction
     * makes assumptions about dimensions of an array *)
    | VarLet (dec, None, _, _) when is_array dec ->
      raise (NodeError (node, "cannot assign value to array pointer after \
                               initialisation"))

    (* Assigned values must match variable declaration *)
    | VarLet (dec, None, value, ann) ->
      VarLet (dec, None, check_trav (typeof dec) value, ann)

    | VarLet (dec, Some dims, value, ann) ->
      (* Number of assigned indices must match array definition *)
      check_dims_match dims (typeof dec) node;

      (* Array indices must be ints *)
      let dims = List.map typecheck dims in
      List.iter (check_type Int) dims;

      (* Assigned value must match array base type *)
      let value = typecheck value in
      check_type (basetypeof dec) value;

      VarLet (dec, Some dims, value, ann)

    (* ArrayConst initialisations are transformed during desugaring, so any
     * occurrences that are left are illegal *)
    | ArrayConst _ ->
      raise (NodeError (node, "array constants can only be used in array \
                               initialisation"))

    | _ -> transform_children typecheck node
  (* Entry point of the typecheck phase: typechecks the tree held by an Ast
   * input and wraps the result in Ast again.
   * Raises InvalidInput "typecheck" for any other kind of input. *)
  let phase input =
    match input with
    | Ast node -> Ast (typecheck node)
    | _ -> raise (InvalidInput "typecheck")