1 (* Yoann Padioleau, Julia Lawall
3 * Copyright (C) 2010, University of Copenhagen DIKU and INRIA.
4 * Copyright (C) 2007, 2008, 2009 University of Urbana Champaign and DIKU
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License (GPL)
8 * version 2 as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * file license.txt for more details.
20 (*****************************************************************************)
22 (*****************************************************************************)
(* The pair returned by Common.mk_pr2_wrappers for the
 * Flag_parsing_c.verbose_type flag. Both components are used in this file
 * as string printers; presumably they are silenced when the flag is off
 * (to confirm in Common). *)
let (pr2, pr2_once) =
  Common.mk_pr2_wrappers Flag_parsing_c.verbose_type
25 (*****************************************************************************)
27 (*****************************************************************************)
29 (* What info do we want in a clean C type ? Normally it would help
30 * if we remove some of the complexity of C with for instance typedefs
31 * by expanding those typedefs or structname and enumname to their
32 * final value. Then, when we do pattern matching we can conveniently forget
33 * to handle the typedef, enumname and similar cases. But sometimes,
34 * in coccinelle for instance, we want to keep some of those original
35 * info. So right now we have an in-the-middle solution by keeping
36 * the original typename in the ast and expanding some of them
37 * in the type_annotation phase. We don't do this expansion for
38 * structname because usually when we have a struct we actually
39 * prefer to just have the structname. It's only when we access
40 * field that we need that information, but the type_annotater has
41 * already done this job so no need in the parent expression to know
42 * the full definition of the structure. But for typedef, this is different.
44 * So really the finalType we want, the completed_type notion below,
45 * corresponds to a type we think is useful enough to work on, to do
46 * pattern matching on, and one where we have all the needed information
47 * and we don't need to look again somewhere else to get the information.
52 * todo? define a new clean fulltype ? as julia did with type_cocci.ml
53 * without the parsing info, with some normalization (for instance have
54 * only structUnionName and enumName, and remove the ParenType), some
55 * abstractions (don't care for instance about name in parameters of
56 * functionType, or size of array), and with new types such as Unknown
57 * or PartialFunctionType (when don't have type of return when infer
58 * the type of function call not based on type of function but on the
59 * type of its arguments).
(* The four names below are plain abbreviations of Ast_c.fullType: the
 * type checker treats them as interchangeable, they only document which
 * stage of completion/simplification a value is expected to be in. *)
type finalType = Ast_c.fullType

type completed_and_simplified = Ast_c.fullType

type completed_typedef = Ast_c.fullType

type removed_typedef = Ast_c.fullType
73 * use Ast_c.nQ, Ast_c.defaultInt, Ast_c.emptyAnnotCocci,
74 * Ast_c.emptyMetavarsBinding, Ast_c.emptyComments
76 let (int_type
: Ast_c.fullType
) =
77 (* Lib_parsing_c.al_type (Parse_c.type_of_string "int")*)
79 (Ast_c.BaseType
(Ast_c.IntType
(Ast_c.Si
(Ast_c.Signed
, Ast_c.CInt
))))
80 [Ast_c.al_info
0 (* al *)
83 {Common.str
= "int"; Common.charpos
= 0; Common.line
= -1;
84 Common.column
= -1; Common.file
= ""};
86 {contents
= Some
(Ast_cocci.CONTEXT
(Ast_cocci.NoPos
, Ast_cocci.NOTHING
), [])};
87 Ast_c.comments_tag
= {contents
=
88 {Ast_c.mbefore
= []; Ast_c.mafter
= [];
89 Ast_c.mbefore2
= []; Ast_c.mafter2
= []
95 (* normally if the type annotater has done a good job, this should always
96 * return true. Cf type_annotater_c.typedef_fix.
98 let rec is_completed_and_simplified ty
=
99 match Ast_c.unwrap_typeC ty
with
101 | Pointer t
-> is_completed_and_simplified t
102 | Array
(e
, t
) -> is_completed_and_simplified t
103 | StructUnion
(su
, sopt
, fields
) ->
104 (* recurse fields ? Normally actually don't want,
105 * prefer to have a StructUnionName when it's possible *)
108 | Some _
-> false (* should have transformed it in a StructUnionName *)
111 (* todo? return type is completed ? params completed ? *)
118 (* we prefer StructUnionName to StructUnion when it comes to typed metavar *)
119 | StructUnionName
(su
, s
) -> true
121 (* should have completed with more information *)
122 | TypeName
(_name
, typ
) ->
126 (* recurse cos what if it's an alias of an alias ? *)
127 is_completed_and_simplified t
130 (* should have removed paren, for better matching with typed metavar.
131 * kind of iso again *)
139 true (* well we don't handle it, so can't really say it's completed *)
(* Not implemented yet: ignores its argument and always raises Todo. *)
let is_completed_typedef_fullType _x =
  raise Todo
(* Not implemented yet: ignores its argument and always raises Todo. *)
let is_removed_typedef_fullType _x =
  raise Todo
146 (*****************************************************************************)
147 (* more "virtual" fulltype, the fullType_with_no_typename *)
148 (*****************************************************************************)
(* Not implemented yet: ignores its argument and always raises Todo. *)
let remove_typedef _x =
  raise Todo
151 (*****************************************************************************)
152 (* expression exp_info annotation vs finalType *)
153 (*****************************************************************************)
155 (* builders, needed because julia added gradually more information in
156 * the expression reference annotation in ast_c.
160 (Some x
, Ast_c.NotTest
)
(* Pair a type with the Ast_c.NotLocalVar marker. *)
let make_exp_type ty =
  ty, Ast_c.NotLocalVar
(* Default builder: tag the type with make_exp_type, then hand the
 * result to make_info. *)
let make_info_def t =
  let exp_type = make_exp_type t in
  make_info exp_type
171 (None
, Ast_c.NotTest
)
174 let do_with_type f
(t
,_test
) =
177 | Some
(t
,_local
) -> f t
180 match Ast_c.get_type_expr e
with
181 | Some
(t
,_
), _test
-> Some t
182 | None
, _test
-> None
186 (*****************************************************************************)
188 (*****************************************************************************)
191 let structdef_to_struct_name ty
=
192 let (qu
, tybis
) = ty
in
193 match Ast_c.unwrap_typeC ty
with
194 | (StructUnion
(su
, sopt
, fields
)) ->
195 let iis = Ast_c.get_ii_typeC_take_care tybis
in
196 (match sopt
, iis with
197 (* todo? but what if correspond to a nested struct def ? *)
198 | Some s
, [i1
;i2
;i3
;i4
] ->
199 qu
, Ast_c.mk_tybis
(StructUnionName
(su
, s
)) [i1
;i2
]
202 | x
-> raise Impossible
204 | _
-> raise Impossible
207 (*****************************************************************************)
209 (*****************************************************************************)
(* Build the type of a function definition: the definition's f_type
 * wrapped in a FunctionType node, with two freshly created fake tokens,
 * "(" and ")", attached as its infos.
 *
 * The 'ii' component of the definition is not used (could it be ?). *)
let type_of_function (def, _ii) =
  (* each parenthesis gets its own fake info, created just before it is
   * given its string; the open paren is built first, as before *)
  let fake_paren s =
    let fake = Ast_c.fakeInfo Common.fake_parse_info in
    Ast_c.rewrap_str s fake
  in
  let fake_oparen = fake_paren "(" in
  let fake_cparen = fake_paren ")" in
  Ast_c.mk_ty (FunctionType def.f_type) [fake_oparen; fake_cparen]
225 (* pre: only a single variable *)
226 let type_of_decl decl
=
228 | Ast_c.DeclList
(xs
,ii1
) ->
230 | [] -> raise Impossible
232 (* todo? for other xs ? *)
234 let {v_namei
= _var
; v_type
= v_type
;
235 v_storage
= (_storage
,_inline
)} = x
in
237 (* TODO normalize ? what if nested structure definition ? *)
240 | Ast_c.MacroDecl _
->
241 pr2_once
"not handling MacroDecl type yet";
246 (* pre: it is indeed a struct def decl, and only a single variable *)
247 let structdef_of_decl decl
=
250 | Ast_c.DeclList
(xs
,ii1
) ->
252 | [] -> raise Impossible
254 (* todo? for other xs ? *)
256 let {v_namei
= var
; v_type
= v_type
;
257 v_storage
= (storage
,inline
)} = x
in
259 (match Ast_c.unwrap_typeC v_type
with
260 | Ast_c.StructUnion
(su
, _must_be_some
, fields
) ->
262 | _
-> raise Impossible
265 | Ast_c.MacroDecl _
-> raise Impossible
270 (*****************************************************************************)
272 (*****************************************************************************)
274 let (fake_function_type
:
275 fullType
option -> argument wrap2 list
-> fullType
option) =
278 let fake = Ast_c.fakeInfo
(Common.fake_parse_info
) in
279 let fake_oparen = Ast_c.rewrap_str
"(" fake in
280 let fake = Ast_c.fakeInfo
(Common.fake_parse_info
) in
281 let fake_cparen = Ast_c.rewrap_str
")" fake in
283 let (tyargs
: parameterType wrap2 list
) =
284 args
+> Common.map_filter
(fun (arg
,ii
) ->
287 (match Ast_c.get_onlytype_expr e
with
290 { Ast_c.p_namei
= None
;
291 p_register
= false, Ast_c.noii
;
301 if List.length args
<> List.length tyargs
304 rettype
+> Common.map_option
(fun rettype
->
305 let (ftyp: functionType
) = (rettype
, (tyargs
, (false,[]))) in
307 Ast_c.mk_ty
(FunctionType
ftyp) [fake_oparen;fake_cparen]
313 (*****************************************************************************)
315 (*****************************************************************************)
318 (* todo: the rules are far more complex, but I prefer to simplify for now.
319 * todo: should take operator as a parameter.
321 * todo: Also need handle pointer arithmetic! the type of 'pt + 2'
322 * is still the type of pt. cf parsing_cocci/type_infer.ml
324 * (* pad: in pointer arithmetic, as in ptr+1, the lub must be ptr *)
325 * | (T.Pointer
(ty1
),T.Pointer
(ty2
)) ->
326 * T.Pointer
(loop
(ty1
,ty2
))
327 * | (ty1
,T.Pointer
(ty2
)) -> T.Pointer
(ty2
)
328 * | (T.Pointer
(ty1
),ty2
) -> T.Pointer
(ty1
)
335 | Some t
, None
-> Some t
336 | None
, Some t
-> Some t
337 (* check equal ? no cos can have pointer arithmetic so t2 can be <> t1
339 * todo: right now I favor the first term because usually pointer
340 * arithmetic are written with the pointer in the first position.
342 * Also when an expression contain a typedef, as in
343 * 'dma_addr + 1' where dma_addr was declared as a variable
344 * of type dma_addr_t, then again I want to have in the lub
345 * the typedef and it is often again in the first position.
348 | Some t1
, Some t2
->
349 let t1bis = Ast_c.unwrap_typeC t1
in
350 let t2bis = Ast_c.unwrap_typeC t2
in
351 (* a small attempt to do better, no consideration of typedefs *)
352 (match op
, t1bis, t2bis with
353 (* these rules follow ANSI C. See eg:
354 http://flexor.uwaterloo.ca/library/SGI_bookshelves/SGI_Developer/books/CLanguageRef/sgi_html/ch05.html *)
355 _
,Ast_c.BaseType
(bt1
),Ast_c.BaseType
(bt2
) ->
357 Ast_c.Void
,_
-> Some t2
(* something has gone wrong *)
358 | _
,Ast_c.Void
-> Some t1
(* something has gone wrong *)
359 | Ast_c.FloatType
(Ast_c.CLongDouble
),_
-> Some t1
360 | _
,Ast_c.FloatType
(Ast_c.CLongDouble
) -> Some t2
361 | Ast_c.FloatType
(Ast_c.CDouble
),_
-> Some t1
362 | _
,Ast_c.FloatType
(Ast_c.CDouble
) -> Some t2
363 | Ast_c.FloatType
(Ast_c.CFloat
),_
-> Some t1
364 | _
,Ast_c.FloatType
(Ast_c.CFloat
) -> Some t2
366 | Ast_c.IntType
(Ast_c.Si
(Ast_c.UnSigned
,Ast_c.CLongLong
)),_
->
368 | _
,Ast_c.IntType
(Ast_c.Si
(Ast_c.UnSigned
,Ast_c.CLongLong
)) ->
370 | Ast_c.IntType
(Ast_c.Si
(Ast_c.Signed
,Ast_c.CLongLong
)),_
->
372 | _
,Ast_c.IntType
(Ast_c.Si
(Ast_c.Signed
,Ast_c.CLongLong
)) ->
374 | Ast_c.IntType
(Ast_c.Si
(Ast_c.UnSigned
,Ast_c.CLong
)),_
->
376 | _
,Ast_c.IntType
(Ast_c.Si
(Ast_c.UnSigned
,Ast_c.CLong
)) ->
378 | Ast_c.IntType
(Ast_c.Si
(Ast_c.Signed
,Ast_c.CLong
)),_
->
380 | _
,Ast_c.IntType
(Ast_c.Si
(Ast_c.Signed
,Ast_c.CLong
)) ->
382 | Ast_c.IntType
(Ast_c.Si
(Ast_c.UnSigned
,Ast_c.CInt
)),_
->
384 | _
,Ast_c.IntType
(Ast_c.Si
(Ast_c.UnSigned
,Ast_c.CInt
)) ->
386 | _
-> Some int_type
)
388 | Ast_c.Plus
,Ast_c.Pointer _
,Ast_c.BaseType
(Ast_c.IntType _
) ->
390 | Ast_c.Plus
,Ast_c.BaseType
(Ast_c.IntType _
),Ast_c.Pointer _
->
392 | Ast_c.Minus
,Ast_c.Pointer _
,Ast_c.BaseType
(Ast_c.IntType _
) ->
394 | Ast_c.Minus
,Ast_c.BaseType
(Ast_c.IntType _
),Ast_c.Pointer _
->
396 | Ast_c.Minus
,Ast_c.Pointer _
,Ast_c.Pointer _
->
398 (* todo, Pointer, Typedef, etc *)
404 | None
-> None
, Ast_c.NotTest
405 | Some ft
-> Some
(ft
, Ast_c.NotLocalVar
), Ast_c.NotTest
409 (*****************************************************************************)
411 (*****************************************************************************)
413 (* old: was using some nested find_some, but easier use ref
414 * update: handling union (used a lot in sparse)
415 * note: it is independent of the environment.
418 string -> (Ast_c.structUnion
* Ast_c.structType
) -> Ast_c.fullType
) =
419 fun fld
(su
, fields
) ->
423 let rec aux_fields fields
=
424 fields
+> List.iter
(fun x
->
426 | DeclarationField
(FieldDeclList
(onefield_multivars
, iiptvirg
)) ->
427 onefield_multivars
+> List.iter
(fun (fieldkind
, iicomma
) ->
429 | Simple
(Some name
, t
) | BitField
(Some name
, t
, _
, _
) ->
430 let s = Ast_c.str_of_name name
in
432 then Common.push2 t
res
435 | Simple
(None
, t
) ->
436 (match Ast_c.unwrap_typeC t
with
439 | StructUnion
(Union
, _
, fields
) ->
442 (* Special case of nested structure definition inside
443 * structure without associated field variable as in
444 * struct top = { ... struct xx { int subfield1; ... }; ... }
445 * cf sparse source, where can access subfields directly.
446 * It can also be used in conjunction with union.
448 | StructUnion
(Struct
, _
, fields
) ->
456 | EmptyField info
-> ()
457 | MacroDeclField _
-> pr2_once
"DeclTodo"; ()
459 | CppDirectiveStruct _
460 | IfdefStruct _
-> pr2_once
"StructCpp";
469 pr2 ("MultiFound field: " ^ fld
) ;
474 (*****************************************************************************)
476 (*****************************************************************************)
479 (* was in aliasing_function_c.ml before*)
481 (* assume normalized/completed ? so no ParenType handling to do ?
483 let rec is_function_type x
=
484 match Ast_c.unwrap_typeC x
with
485 | FunctionType _
-> true
489 (* assume normalized/completed ? so no ParenType handling to do ? *)
490 let rec function_pointer_type_opt x
=
491 match Ast_c.unwrap_typeC x
with
493 (match Ast_c.unwrap_typeC y
with
494 | FunctionType ft
-> Some ft
497 | TypeName
(_name
, Some ft2
) ->
498 (match Ast_c.unwrap_typeC ft2
with
499 | FunctionType ft
-> Some ft
505 (* bugfix: for many fields in structure, the field is a typename
506 * like irq_handler_t to a function pointer
508 | TypeName
(_name
, Some ft
) ->
509 function_pointer_type_opt ft
510 (* bugfix: in field, usually it has some ParenType *)
513 function_pointer_type_opt ft