typecheck.ml 9.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266
  1. (*
  2. * Do a number of checks:
  3. * - A void function must not return a value.
  4. * - A non-void function must return a value of the correct type.
  5. * - Array indices must be of type integer.
  6. * - The number of array indices must match the number of array dimensions.
  7. * - The type on the right-hand side of an assignment must match the type on
  8. * the left-hand side.
  9. * - The number of arguments used for a function call must match the number of
  10. * parameters for that function.
  11. * - The types of the function arguments must match the types of parameters.
  12. * - The operands of a unary or binary operation must have valid types.
  13. * - The predicate expression of an if, while, or do-while statement must be
  14. * a boolean.
  15. * - Only values of a basic type can be type cast.
  16. *)
  17. open Printf
  18. open Types
  19. open Util
  20. open Stringify
  (* Render a list of types as a single string for use in error messages.
   * The individual type names are separated by " or "; an empty list gives
   * the empty string.
   * ctype list -> string *)
  let types2str types =
    String.concat " or " (List.map type2str types)
  (* Number of dimensions of an array type.
   * Raises InvalidNode when the given type is not an ArrayDims type. *)
  let array_depth ctype =
    match ctype with
    | ArrayDims (_, dimensions) -> List.length dimensions
    | _ -> raise InvalidNode
  (* Reduce a type to a (base type, number of dimensions) pair, so that types
   * can be compared without looking at the dimension expressions themselves.
   * Anything that is not an ArrayDims type has zero dimensions. *)
  let spec ctype =
    match ctype with
    | ArrayDims (base, dimensions) -> (base, List.length dimensions)
    | scalar -> (scalar, 0)
  (* Require that the type of [node] has the same spec (base type and number
   * of dimensions) as [expected].
   * On a mismatch a NodeError is raised on [node]; its message is [msg] when a
   * non-empty one is supplied, and a generic type mismatch message otherwise.
   * Returns unit when the types agree. *)
  let check_type ?(msg="") expected node =
    let actual = typeof node in
    if spec actual = spec expected then ()
    else
      let text =
        if msg = "" then
          sprintf "type mismatch: expected type %s, got %s"
            (type2str expected) (type2str actual)
        else
          msg
      in
      raise (NodeError (node, text))
  (* Operand types that each operator accepts. *)
  let op_types op =
    let numeric = [Int; Float] in
    match op with
    | Add | Mul | Eq | Ne -> Bool :: numeric
    | Neg | Sub | Div | Lt | Le | Gt | Ge -> numeric
    | Mod -> [Int]
    | Not | And | Or -> [Bool]
  (* Result type of applying an operator to operands of type [opnd_type]:
   * logical and comparison operators yield Bool, arithmetic operators yield
   * the type of their operands. *)
  let op_result_type opnd_type op =
    match op with
    | Neg | Add | Sub | Mul | Div | Mod -> opnd_type
    | Not | And | Or | Eq | Ne | Lt | Le | Gt | Ge -> Bool
  (* Require that the type of [node] is one of [allowed_types].
   * [desc] describes the operation being applied and is used as the start of
   * the error message. Raises NodeError on [node] when its type is not
   * allowed, and returns unit otherwise. *)
  let check_type_op allowed_types desc node =
    let actual = typeof node in
    if List.mem actual allowed_types then ()
    else
      let text =
        sprintf "%s cannot be applied to type %s, only to %s"
          desc (type2str actual) (types2str allowed_types)
      in
      raise (NodeError (node, text))
  (* Require that the number of indices in [dims] equals the number of
   * dimensions of the array type [dec_type].
   * Raises NodeError on [errnode] when the counts differ; array_depth raises
   * InvalidNode when [dec_type] is not an array type. *)
  let check_dims_match dims dec_type errnode =
    let expected = array_depth dec_type in
    let got = List.length dims in
    if got <> expected then
      raise (NodeError (errnode, sprintf
        "dimension mismatch: expected %d indices, got %d" expected got))
  (* Type-check [node] and everything below it, returning the rebuilt node.
   *
   * Expression nodes (function calls, operators, conditionals, type casts,
   * Dim nodes, constants and variable uses) get a [Type t] annotation
   * prepended to their annotation list. Statement nodes are rebuilt around
   * their checked children. Node kinds not listed here are handled by
   * applying typecheck to their children through transform_children.
   *
   * Raises NodeError on the offending node for every violated rule. An
   * integer division by a constant zero only produces a warning. *)
  let rec typecheck node =
    (* Type-check a child node and require the result to have type [ctype] *)
    let check_trav ctype node =
      let node = typecheck node in
      check_type ctype node;
      node
    in
    match node with
    (* The number of arguments must equal the number of parameters, and each
     * argument must have the type of the corresponding parameter. The call
     * gets the return type of the function *)
    | FunUse ((FunDec (ret_type, name, params, _) as dec), args, ann)
    | FunUse ((FunDef (_, ret_type, name, params, _, _) as dec), args, ann) ->
      begin
        match (List.length args, List.length params) with
        | (nargs, nparams) when nargs <> nparams ->
          let msg = sprintf
            "function \"%s\" expects %d arguments, got %d"
            name nparams nargs
          in
          raise (NodeError (node, msg))
        | _ ->
          let args = List.map typecheck args in
          let check_arg_type arg param =
            check_type (typeof param) arg
          in
          (* The lengths are known to be equal here, so iter2 cannot fail *)
          List.iter2 check_arg_type args params;
          FunUse (dec, args, Type ret_type :: ann)
      end

    (* Operators match operand types and get a new type based on the operator *)
    | Monop (op, opnd, ann) ->
      let opnd = typecheck opnd in
      let desc = sprintf "unary operator \"%s\"" (op2str op) in
      check_type_op (op_types op) desc opnd;
      Monop (op, opnd, Type (op_result_type (typeof opnd) op) :: ann)

    | Binop (op, left, right, ann) ->
      let left = typecheck left in
      let right = typecheck right in
      let desc = sprintf "binary operator \"%s\"" (op2str op) in
      (* The left operand must be valid for the operator, and the right
       * operand must have the same type as the left one *)
      check_type_op (op_types op) desc left;
      check_type (typeof left) right;

      (* Check for division by zero *)
      begin
        match (op, right) with
        | (Div, Const (IntVal 0, _)) -> node_warning right "division by zero"
        | _ -> ()
      end;

      Binop (op, left, right, Type (op_result_type (typeof left) op) :: ann)

    (* Conditions must be bool, and right-hand type must match left-hand type *)
    | Cond (cond, texpr, fexpr, ann) ->
      let cond = check_trav Bool cond in
      let texpr = typecheck texpr in
      let fexpr = check_trav (typeof texpr) fexpr in
      Cond (cond, texpr, fexpr, Type (typeof texpr) :: ann)

    (* Only basic types can be typecasted *)
    | TypeCast (ctype, value, ann) ->
      let value = typecheck value in
      check_type_op [Bool; Int; Float] "typecast" value;
      TypeCast (ctype, value, Type (ctype) :: ann)

    (* Array allocation dimensions must have type int *)
    | Allocate (dec, dims, ann) ->
      Allocate (dec, List.map (check_trav Int) dims, ann)

    (* Array dimensions are always integers *)
    | Dim (name, ann) ->
      Dim (name, Type Int :: ann)

    (* Functions and parameters must be traversed to give types to Dim nodes *)
    (*
    | FunDec (ret_type, name, params, ann) ->
      FunDec (ret_type, name, List.map typecheck params, ann)
    | Param (ArrayDims (ctype, dims), name, ann) ->
      Param (ArrayDims (ctype, List.map typecheck dims), name, ann)
    *)

    (* Void functions may have no return statement, other functions must have a
     * return statement of valid type *)
    | FunDef (export, ret_type, name, params, body, ann) ->
      let params = List.map typecheck params in
      let body = typecheck body in

      (* Only a Return that is the last statement of the body is considered *)
      let rec find_return = function
        | [] -> None
        | [Return (value, _) as ret] -> Some (ret, typeof value)
        | _ :: tl -> find_return tl
      in

      begin
        match (ret_type, find_return (block_body body)) with
        | (Void, Some (ret, _)) ->
          raise (NodeError (ret, "void function should not have a return value"))

        | ((Bool | Int | Float), None) ->
          let msg = sprintf
            "expected return value of type %s for function \"%s\""
            (type2str ret_type) name
          in
          raise (NodeError (node, msg))

        (* Types are compared structurally; physical inequality would only
         * be correct by accident of how constant constructors are
         * represented *)
        | ((Bool | Int | Float), Some (ret, t)) when t <> ret_type ->
          let msg = sprintf
            "function \"%s\" has return type %s, got %s"
            name (type2str ret_type) (type2str t)
          in
          raise (NodeError (ret, msg))

        | _ -> FunDef (export, ret_type, name, params, body, ann)
      end

    (* Conditions must have type bool *)
    | If (cond, body, ann) ->
      If (check_trav Bool cond, typecheck body, ann)
    | IfElse (cond, tbody, fbody, ann) ->
      IfElse (check_trav Bool cond, typecheck tbody, typecheck fbody, ann)
    | While (cond, body, ann) ->
      While (check_trav Bool cond, typecheck body, ann)
    | DoWhile (cond, body, ann) ->
      DoWhile (check_trav Bool cond, typecheck body, ann)

    (* Constants *)
    | Const (BoolVal value, ann) ->
      Const (BoolVal value, Type Bool :: ann)
    | Const (IntVal value, ann) ->
      (* Do a bound check on integers (use Int32 because default ints in ocaml
       * are 31- or 63-bit) *)
      let cmpval = Nativeint.of_int value in
      let lower = Nativeint.of_int32 Int32.min_int in
      let upper = Nativeint.of_int32 Int32.max_int in
      if cmpval < lower || cmpval > upper then (
        raise (NodeError (node, "integer value out of range (signed 32-bit)"))
      );
      Const (IntVal value, Type Int :: ann)
    | Const (FloatVal value, ann) ->
      Const (FloatVal value, Type Float :: ann)

    (* Extern arrays variables are transformed to imported functions, so the
     * pointer cannot be passed *)
    | VarUse (GlobalDec (ArrayDims _, _, _), None, _) ->
      raise (NodeError (node, "imported array pointers may only be \
                               dereferenced, not used directly"))

    (* Variables inherit the type of their declaration *)
    | VarUse (dec, None, ann) ->
      VarUse (dec, None, Type (typeof dec) :: ann)

    (* Indexed variables: indices must be ints, their number must match the
     * declaration, and the result has the base type of the array *)
    | VarUse (dec, Some dims, ann) ->
      let dims = List.map typecheck dims in
      List.iter (check_type Int) dims;
      check_dims_match dims (typeof dec) node;
      VarUse (dec, Some dims, Type (basetypeof dec) :: ann)

    (* Array pointers cannot be re-assigned, because array dimension reduction
     * makes assumptions about dimensions of an array *)
    | VarLet (dec, None, _, _) when is_array dec ->
      raise (NodeError (node, "cannot assign value to array pointer after \
                               initialisation"))

    (* Assigned values must match variable declaration *)
    | VarLet (dec, None, value, ann) ->
      VarLet (dec, None, check_trav (typeof dec) value, ann)

    | VarLet (dec, Some dims, value, ann) ->
      (* Number of assigned indices must match array definition *)
      check_dims_match dims (typeof dec) node;

      (* Array indices must be ints *)
      let dims = List.map typecheck dims in
      List.iter (check_type Int) dims;

      (* Assigned value must match array base type *)
      let value = typecheck value in
      check_type (basetypeof dec) value;

      VarLet (dec, Some dims, value, ann)

    (* ArrayConst initialisations are transformed during desugaring, so any
     * occurrences that are left are illegal *)
    | ArrayConst _ ->
      raise (NodeError (node, "array constants can only be used in array \
                               initialisation"))

    | _ -> transform_children typecheck node
  (* Entry point of the type-checking phase: type-check the tree carried by an
   * Ast input and wrap the result in Ast again.
   * Raises InvalidInput "typecheck" for any other kind of input. *)
  let phase input =
    match input with
    | Ast tree -> Ast (typecheck tree)
    | _ -> raise (InvalidInput "typecheck")