(*
* Copyright 2005-2009, Ecole des Mines de Nantes, University of Copenhagen
* Yoann Padioleau, Julia Lawall, Rene Rydhof Hansen, Henrik Stuart, Gilles Muller
* This file is part of Coccinelle.
*
* Coccinelle is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, according to version 2 of the License.
*
* Coccinelle is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Coccinelle. If not, see .
*
* The authors reserve the right to distribute this or future versions of
* Coccinelle under other licenses.
*)
open Common
module CCI = Ctlcocci_integration
module TAC = Type_annoter_c
(*****************************************************************************)
(* This file is a kind of driver. It gathers all the important functions
* from coccinelle in one place. The different entities in coccinelle are:
* - files
* - astc
* - astcocci
* - flow (contain nodes)
* - ctl (contain rule_elems)
* This file contains functions to transform one in another.
*)
(*****************************************************************************)
(* --------------------------------------------------------------------- *)
(* C related *)
(* --------------------------------------------------------------------- *)
let cprogram_of_file file =
let (program2, _stat) = Parse_c.parse_print_error_heuristic file in
program2
let cprogram_of_file_cached file =
let (program2, _stat) = Parse_c.parse_cache file in
if !Flag_cocci.ifdef_to_if
then
program2 +> Parse_c.with_program2 (fun asts ->
Cpp_ast_c.cpp_ifdef_statementize asts
)
else program2
let cfile_of_program program2_with_ppmethod outf =
Unparse_c.pp_program program2_with_ppmethod outf
(* for memoization, contains only one entry, the one for the SP *)
let _hparse = Hashtbl.create 101
let _hctl = Hashtbl.create 101
(* --------------------------------------------------------------------- *)
(* Cocci related *)
(* --------------------------------------------------------------------- *)
let sp_of_file2 file iso =
Common.memoized _hparse (file, iso) (fun () ->
Parse_cocci.process file iso false)
let sp_of_file file iso =
Common.profile_code "parse cocci" (fun () -> sp_of_file2 file iso)
(* --------------------------------------------------------------------- *)
(* Flow related *)
(* --------------------------------------------------------------------- *)
let print_flow flow =
Ograph_extended.print_ograph_mutable flow "/tmp/test.dot" true
let ast_to_flow_with_error_messages2 x =
let flowopt =
try Ast_to_flow.ast_to_control_flow x
with Ast_to_flow.Error x ->
Ast_to_flow.report_error x;
None
in
flowopt +> do_option (fun flow ->
(* This time even if there is a deadcode, we still have a
* flow graph, so I can try the transformation and hope the
* deadcode will not bother us.
*)
try Ast_to_flow.deadcode_detection flow
with Ast_to_flow.Error (Ast_to_flow.DeadCode x) ->
Ast_to_flow.report_error (Ast_to_flow.DeadCode x);
);
flowopt
let ast_to_flow_with_error_messages a =
Common.profile_code "flow" (fun () -> ast_to_flow_with_error_messages2 a)
(* --------------------------------------------------------------------- *)
(* Ctl related *)
(* --------------------------------------------------------------------- *)
let ctls_of_ast2 ast ua pos =
List.map2
(function ast -> function (ua,pos) ->
List.combine
(if !Flag_cocci.popl
then Popl.popl ast
else Asttoctl2.asttoctl ast ua pos)
(Asttomember.asttomember ast ua))
ast (List.combine ua pos)
let ctls_of_ast ast ua =
Common.profile_code "asttoctl2" (fun () -> ctls_of_ast2 ast ua)
(*****************************************************************************)
(* Some debugging functions *)
(*****************************************************************************)
(* the inputs *)
let show_or_not_cfile2 cfile =
if !Flag_cocci.show_c then begin
Common.pr2_xxxxxxxxxxxxxxxxx ();
pr2 ("processing C file: " ^ cfile);
Common.pr2_xxxxxxxxxxxxxxxxx ();
Common.command2 ("cat " ^ cfile);
end
let show_or_not_cfile a =
Common.profile_code "show_xxx" (fun () -> show_or_not_cfile2 a)
let show_or_not_cfiles cfiles = List.iter show_or_not_cfile cfiles
let show_or_not_cocci2 coccifile isofile =
if !Flag_cocci.show_cocci then begin
Common.pr2_xxxxxxxxxxxxxxxxx ();
pr2 ("processing semantic patch file: " ^ coccifile);
isofile +> (fun s -> pr2 ("with isos from: " ^ s));
Common.pr2_xxxxxxxxxxxxxxxxx ();
Common.command2 ("cat " ^ coccifile);
pr2 "";
end
let show_or_not_cocci a b =
Common.profile_code "show_xxx" (fun () -> show_or_not_cocci2 a b)
(* the output *)
let show_or_not_diff2 cfile outfile show_only_minus =
if !Flag_cocci.show_diff then begin
match Common.fst(Compare_c.compare_default cfile outfile) with
Compare_c.Correct -> () (* diff only in spacing, etc *)
| _ ->
(* may need --strip-trailing-cr under windows *)
pr2 "diff = ";
let line =
match !Flag_parsing_c.diff_lines with
| None -> "diff -u -p " ^ cfile ^ " " ^ outfile
| Some n -> "diff -U "^n^" -p "^cfile^" "^outfile in
let xs =
let res = Common.cmd_to_list line in
match (!Flag.patch,res) with
(* create something that looks like the output of patch *)
(Some prefix,minus_file::plus_file::rest) ->
let drop_prefix file =
if prefix = ""
then "/"^file
else
(match Str.split (Str.regexp prefix) file with
[base_file] -> base_file
| _ -> failwith "prefix not found in the old file name") in
let diff_line =
match List.rev(Str.split (Str.regexp " ") line) with
new_file::old_file::cmdrev ->
if !Flag.sgrep_mode2
then
String.concat " "
(List.rev ("/tmp/nothing" :: old_file :: cmdrev))
else
let old_base_file = drop_prefix old_file in
String.concat " "
(List.rev
(("b"^old_base_file)::("a"^old_base_file)::cmdrev))
| _ -> failwith "bad command" in
let (minus_line,plus_line) =
if !Flag.sgrep_mode2
then (minus_file,plus_file)
else
match (Str.split (Str.regexp "[ \t]") minus_file,
Str.split (Str.regexp "[ \t]") plus_file) with
("---"::old_file::old_rest,"+++"::new_file::new_rest) ->
let old_base_file = drop_prefix old_file in
(String.concat " "
("---"::("a"^old_base_file)::old_rest),
String.concat " "
("+++"::("b"^old_base_file)::new_rest))
| (l1,l2) ->
failwith
(Printf.sprintf "bad diff header lines: %s %s"
(String.concat ":" l1) (String.concat ":" l2)) in
diff_line::minus_line::plus_line::rest
| _ -> res in
xs +> List.iter (fun s ->
if s =~ "^\\+" && show_only_minus
then ()
else pr s)
end
let show_or_not_diff a b c =
Common.profile_code "show_xxx" (fun () -> show_or_not_diff2 a b c)
(* the derived input *)
let show_or_not_ctl_tex2 astcocci ctls =
if !Flag_cocci.show_ctl_tex then begin
Ctltotex.totex ("/tmp/__cocci_ctl.tex") astcocci ctls;
Common.command2 ("cd /tmp; latex __cocci_ctl.tex; " ^
"dvips __cocci_ctl.dvi -o __cocci_ctl.ps;" ^
"gv __cocci_ctl.ps &");
end
let show_or_not_ctl_tex a b =
Common.profile_code "show_xxx" (fun () -> show_or_not_ctl_tex2 a b)
let show_or_not_rule_name ast rulenb =
if !Flag_cocci.show_ctl_text or !Flag.show_trying or
!Flag.show_transinfo or !Flag_cocci.show_binding_in_out
then
begin
let name =
match ast with
Ast_cocci.CocciRule (nm, (deps, drops, exists), x, _, _) -> nm
| _ -> i_to_s rulenb in
Common.pr_xxxxxxxxxxxxxxxxx ();
pr (name ^ " = ");
Common.pr_xxxxxxxxxxxxxxxxx ()
end
let show_or_not_scr_rule_name rulenb =
if !Flag_cocci.show_ctl_text or !Flag.show_trying or
!Flag.show_transinfo or !Flag_cocci.show_binding_in_out
then
begin
let name = i_to_s rulenb in
Common.pr_xxxxxxxxxxxxxxxxx ();
pr ("script rule " ^ name ^ " = ");
Common.pr_xxxxxxxxxxxxxxxxx ()
end
let show_or_not_ctl_text2 ctl ast rulenb =
if !Flag_cocci.show_ctl_text then begin
adjust_pp_with_indent (fun () ->
Format.force_newline();
Pretty_print_cocci.print_plus_flag := true;
Pretty_print_cocci.print_minus_flag := true;
Pretty_print_cocci.unparse ast;
);
pr "CTL = ";
let (ctl,_) = ctl in
adjust_pp_with_indent (fun () ->
Format.force_newline();
Pretty_print_engine.pp_ctlcocci
!Flag_cocci.show_mcodekind_in_ctl !Flag_cocci.inline_let_ctl ctl;
);
pr "";
end
let show_or_not_ctl_text a b c =
Common.profile_code "show_xxx" (fun () -> show_or_not_ctl_text2 a b c)
(* running information *)
let get_celem celem : string =
match celem with
Ast_c.Definition ({Ast_c.f_name = funcs;},_) -> funcs
| Ast_c.Declaration
(Ast_c.DeclList ([{Ast_c.v_namei = Some ((s, _),_);}, _], _)) -> s
| _ -> ""
let show_or_not_celem2 prelude celem =
let (tag,trying) =
(match celem with
| Ast_c.Definition ({Ast_c.f_name = funcs;},_) ->
Flag.current_element := funcs;
(" function: ",funcs)
| Ast_c.Declaration
(Ast_c.DeclList ([{Ast_c.v_namei = Some ((s, _),_);}, _], _)) ->
Flag.current_element := s;
(" variable ",s);
| _ ->
Flag.current_element := "something_else";
(" ","something else");
) in
if !Flag.show_trying then pr2 (prelude ^ tag ^ trying)
let show_or_not_celem a b =
Common.profile_code "show_xxx" (fun () -> show_or_not_celem2 a b)
let show_or_not_trans_info2 trans_info =
if !Flag.show_transinfo then begin
if null trans_info then pr2 "transformation info is empty"
else begin
pr2 "transformation info returned:";
let trans_info =
List.sort (function (i1,_,_) -> function (i2,_,_) -> compare i1 i2)
trans_info
in
indent_do (fun () ->
trans_info +> List.iter (fun (i, subst, re) ->
pr2 ("transform state: " ^ (Common.i_to_s i));
indent_do (fun () ->
adjust_pp_with_indent_and_header "with rule_elem: " (fun () ->
Pretty_print_cocci.print_plus_flag := true;
Pretty_print_cocci.print_minus_flag := true;
Pretty_print_cocci.rule_elem "" re;
);
adjust_pp_with_indent_and_header "with binding: " (fun () ->
Pretty_print_engine.pp_binding subst;
);
)
);
)
end
end
let show_or_not_trans_info a =
Common.profile_code "show_xxx" (fun () -> show_or_not_trans_info2 a)
let show_or_not_binding2 s binding =
if !Flag_cocci.show_binding_in_out then begin
adjust_pp_with_indent_and_header ("binding " ^ s ^ " = ") (fun () ->
Pretty_print_engine.pp_binding binding
)
end
let show_or_not_binding a b =
Common.profile_code "show_xxx" (fun () -> show_or_not_binding2 a b)
(*****************************************************************************)
(* Some helper functions *)
(*****************************************************************************)
let worth_trying cfiles tokens =
(* drop the following line for a list of list by rules. since we don't
allow multiple minirules, all the tokens within a rule should be in
a single CFG entity *)
let tokens = Common.union_all tokens in
if not !Flag_cocci.windows && not (null tokens)
then
(* could also modify the code in get_constants.ml *)
let tokens = tokens +> List.map (fun s ->
match () with
| _ when s =~ "^[A-Za-z_][A-Za-z_0-9]*$" ->
"\\b" ^ s ^ "\\b"
| _ when s =~ "^[A-Za-z_]" ->
"\\b" ^ s
| _ when s =~ ".*[A-Za-z_]$" ->
s ^ "\\b"
| _ -> s
) in
let com = sprintf "egrep -q '(%s)' %s" (join "|" tokens) (join " " cfiles)
in
(match Sys.command com with
| 0 (* success *) -> true
| _ (* failure *) ->
(if !Flag.show_misc
then Printf.printf "grep failed: %s\n" com);
false (* no match, so not worth trying *)
)
else true
let check_macro_in_sp_and_adjust tokens =
let tokens = Common.union_all tokens in
tokens +> List.iter (fun s ->
if Hashtbl.mem !Parsing_hacks._defs s
then begin
pr2 "warning: macro in semantic patch was in macro definitions";
pr2 ("disabling macro expansion for " ^ s);
Hashtbl.remove !Parsing_hacks._defs s
end
)
let contain_loop gopt =
match gopt with
| Some g ->
g#nodes#tolist +> List.exists (fun (xi, node) ->
Control_flow_c.extract_is_loop node
)
| None -> true (* means nothing, if no g then will not model check *)
let sp_contain_typed_metavar_z toplevel_list_list =
let bind x y = x or y in
let option_default = false in
let mcode _ _ = option_default in
let donothing r k e = k e in
let expression r k e =
match Ast_cocci.unwrap e with
| Ast_cocci.MetaExpr (_,_,_,Some t,_,_) -> true
| Ast_cocci.MetaExpr (_,_,_,_,Ast_cocci.LocalID,_) -> true
| _ -> k e
in
let combiner =
Visitor_ast.combiner bind option_default
mcode mcode mcode mcode mcode mcode mcode mcode mcode mcode mcode mcode
donothing donothing donothing donothing
donothing expression donothing donothing donothing donothing donothing
donothing donothing donothing donothing donothing
in
toplevel_list_list +>
List.exists
(function (nm,_,rule) ->
(List.exists combiner.Visitor_ast.combiner_top_level rule))
let sp_contain_typed_metavar rules =
sp_contain_typed_metavar_z
(List.map
(function x ->
match x with
Ast_cocci.CocciRule (a,b,c,d,_) -> (a,b,c)
| _ -> failwith "error in filter")
(List.filter
(function x ->
match x with
Ast_cocci.CocciRule (a,b,c,d,Ast_cocci.Normal) -> true
| _ -> false)
rules))
(* finding among the #include the one that we need to parse
* because they may contain useful type definition or because
* we may have to modify them
*
* For the moment we base in part our heuristic on the name of the file, e.g.
* serio.c is related we think to #include
*)
let (includes_to_parse:
(Common.filename * Parse_c.program2) list ->
Flag_cocci.include_options -> 'a) = fun xs choose_includes ->
match choose_includes with
Flag_cocci.I_UNSPECIFIED -> failwith "not possible"
| Flag_cocci.I_NO_INCLUDES -> []
| x ->
let all_includes = x = Flag_cocci.I_ALL_INCLUDES in
xs +> List.map (fun (file, cs) ->
let dir = Common.dirname file in
cs +> Common.map_filter (fun (c,_info_item) ->
match c with
| Ast_c.CppTop
(Ast_c.Include
{Ast_c.i_include = ((x,ii)); i_rel_pos = info_h_pos;}) ->
(match x with
| Ast_c.Local xs ->
let f = Filename.concat dir (Common.join "/" xs) in
(* for our tests, all the files are flat in the current dir *)
if not (Sys.file_exists f) && !Flag_cocci.relax_include_path
then
let attempt2 = Filename.concat dir (Common.last xs) in
if not (Sys.file_exists f) && all_includes
then Some (Filename.concat !Flag_cocci.include_path
(Common.join "/" xs))
else Some attempt2
else Some f
| Ast_c.NonLocal xs ->
if all_includes ||
Common.fileprefix (Common.last xs) = Common.fileprefix file
then
Some (Filename.concat !Flag_cocci.include_path
(Common.join "/" xs))
else None
| Ast_c.Weird _ -> None
)
| _ -> None))
+> List.concat
+> Common.uniq
let rec interpret_dependencies local global = function
Ast_cocci.Dep s -> List.mem s local
| Ast_cocci.AntiDep s ->
(if !Flag_ctl.steps != None
then failwith "steps and ! dependency incompatible");
not (List.mem s local)
| Ast_cocci.EverDep s -> List.mem s global
| Ast_cocci.NeverDep s ->
(if !Flag_ctl.steps != None
then failwith "steps and ! dependency incompatible");
not (List.mem s global)
| Ast_cocci.AndDep(s1,s2) ->
(interpret_dependencies local global s1) &&
(interpret_dependencies local global s2)
| Ast_cocci.OrDep(s1,s2) ->
(interpret_dependencies local global s1) or
(interpret_dependencies local global s2)
| Ast_cocci.NoDep -> true
let rec print_dependencies str local global dep =
if !Flag_cocci.show_dependencies
then
begin
pr2 str;
let seen = ref [] in
let rec loop = function
Ast_cocci.Dep s | Ast_cocci.AntiDep s ->
if not (List.mem s !seen)
then
begin
if List.mem s local
then pr2 (s^" satisfied")
else pr2 (s^" not satisfied");
seen := s :: !seen
end
| Ast_cocci.EverDep s | Ast_cocci.NeverDep s ->
if not (List.mem s !seen)
then
begin
if List.mem s global
then pr2 (s^" satisfied")
else pr2 (s^" not satisfied");
seen := s :: !seen
end
| Ast_cocci.AndDep(s1,s2) ->
loop s1;
loop s2
| Ast_cocci.OrDep(s1,s2) ->
loop s1;
loop s2
| Ast_cocci.NoDep -> () in
loop dep
end
(* --------------------------------------------------------------------- *)
(* #include relative position in the file *)
(* --------------------------------------------------------------------- *)
(* compute the set of new prefixes
* on
* "a/b/x"; (* in fact it is now a list of string so ["a";"b";"x"] *)
* "a/b/c/x";
* "a/x";
* "b/x";
* it would give for the first element
* ""; "a"; "a/b"; "a/b/x"
* for the second
* "a/b/c/x"
*
* update: if the include is inside a ifdef a put nothing. cf -test incl.
* this is because we dont want code added inside ifdef.
*)
let compute_new_prefixes xs =
xs +> Common.map_withenv (fun already xs ->
let subdirs_prefixes = Common.inits xs in
let new_first = subdirs_prefixes +> List.filter (fun x ->
not (List.mem x already)
)
in
new_first,
new_first @ already
) []
+> fst
(* does via side effect on the ref in the Include in Ast_c *)
let rec update_include_rel_pos cs =
let only_include = cs +> Common.map_filter (fun c ->
match c with
| Ast_c.CppTop (Ast_c.Include {Ast_c.i_include = ((x,_));
i_rel_pos = aref;
i_is_in_ifdef = inifdef}) ->
(match x with
| Ast_c.Weird _ -> None
| _ ->
if inifdef
then None
else Some (x, aref)
)
| _ -> None
)
in
let (locals, nonlocals) =
only_include +> Common.partition_either (fun (c, aref) ->
match c with
| Ast_c.Local x -> Left (x, aref)
| Ast_c.NonLocal x -> Right (x, aref)
| Ast_c.Weird x -> raise Impossible
) in
update_rel_pos_bis locals;
update_rel_pos_bis nonlocals;
cs
and update_rel_pos_bis xs =
let xs' = List.map fst xs in
let the_first = compute_new_prefixes xs' in
let the_last = List.rev (compute_new_prefixes (List.rev xs')) in
let merged = Common.zip xs (Common.zip the_first the_last) in
merged +> List.iter (fun ((x, aref), (the_first, the_last)) ->
aref := Some
{
Ast_c.first_of = the_first;
Ast_c.last_of = the_last;
}
)
(*****************************************************************************)
(* All the information needed around the C elements and Cocci rules *)
(*****************************************************************************)
type toplevel_c_info = {
ast_c: Ast_c.toplevel; (* contain refs so can be modified *)
tokens_c: Parser_c.token list;
fullstring: string;
flow: Control_flow_c.cflow option; (* it's the "fixed" flow *)
contain_loop: bool;
env_typing_before: TAC.environment;
env_typing_after: TAC.environment;
was_modified: bool ref;
(* id: int *)
}
type toplevel_cocci_info_script_rule = {
scr_ast_rule: string * (string * (string * string)) list * string;
language: string;
scr_dependencies: Ast_cocci.dependency;
scr_ruleid: int;
script_code: string;
}
type toplevel_cocci_info_cocci_rule = {
ctl: Lib_engine.ctlcocci * (CCI.pred list list);
metavars: Ast_cocci.metavar list;
ast_rule: Ast_cocci.rule;
isexp: bool; (* true if + code is an exp, only for Flag.make_hrule *)
rulename: string;
dependencies: Ast_cocci.dependency;
(* There are also some hardcoded rule names in parse_cocci.ml:
* let reserved_names = ["all";"optional_storage";"optional_qualifier"]
*)
dropped_isos: string list;
free_vars: Ast_cocci.meta_name list;
negated_pos_vars: Ast_cocci.meta_name list;
used_after: Ast_cocci.meta_name list;
positions: Ast_cocci.meta_name list;
ruleid: int;
ruletype: Ast_cocci.ruletype;
was_matched: bool ref;
}
type toplevel_cocci_info =
ScriptRuleCocciInfo of toplevel_cocci_info_script_rule
| CocciRuleCocciInfo of toplevel_cocci_info_cocci_rule
type kind_file = Header | Source
type file_info = {
fname : string;
full_fname : string;
was_modified_once: bool ref;
asts: toplevel_c_info list;
fpath : string;
fkind : kind_file;
}
let g_contain_typedmetavar = ref false
let last_env_toplevel_c_info xs =
(Common.last xs).env_typing_after
let concat_headers_and_c (ccs: file_info list)
: (toplevel_c_info * string) list =
(List.concat (ccs +> List.map (fun x ->
x.asts +> List.map (fun x' ->
(x', x.fname)))))
let for_unparser xs =
xs +> List.map (fun x ->
(x.ast_c, (x.fullstring, x.tokens_c)), Unparse_c.PPviastr
)
let gen_pdf_graph () =
(Ctl_engine.get_graph_files ()) +> List.iter (fun outfile ->
Printf.printf "Generation of %s%!" outfile;
let filename_stack = Ctl_engine.get_graph_comp_files outfile in
List.iter (fun filename ->
ignore (Unix.system ("dot " ^ filename ^ " -Tpdf -o " ^ filename ^ ".pdf;"))
) filename_stack;
let (head,tail) = (List.hd filename_stack, List.tl filename_stack) in
ignore(Unix.system ("cp " ^ head ^ ".pdf " ^ outfile ^ ".pdf;"));
tail +> List.iter (fun filename ->
ignore(Unix.system ("mv " ^ outfile ^ ".pdf /tmp/tmp.pdf;"));
ignore(Unix.system ("pdftk " ^ filename ^ ".pdf /tmp/tmp.pdf cat output " ^ outfile ^ ".pdf"));
);
ignore(Unix.system ("rm /tmp/tmp.pdf;"));
List.iter (fun filename ->
ignore (Unix.system ("rm " ^ filename ^ " " ^ filename ^ ".pdf;"))
) filename_stack;
Printf.printf " - Done\n")
(* --------------------------------------------------------------------- *)
let prepare_cocci ctls free_var_lists negated_pos_lists
used_after_lists positions_list metavars astcocci =
let gathered = Common.index_list_1
(zip (zip (zip (zip (zip (zip ctls metavars) astcocci) free_var_lists)
negated_pos_lists) used_after_lists) positions_list)
in
gathered +> List.map
(fun (((((((ctl_toplevel_list,metavars),ast),free_var_list),
negated_pos_list),used_after_list),positions_list),rulenb) ->
let is_script_rule r =
match r with Ast_cocci.ScriptRule _ -> true | _ -> false in
if not (List.length ctl_toplevel_list = 1) && not (is_script_rule ast)
then failwith "not handling multiple minirules";
match ast with
Ast_cocci.ScriptRule (lang,deps,mv,code) ->
let r =
{
scr_ast_rule = (lang, mv, code);
language = lang;
scr_dependencies = deps;
scr_ruleid = rulenb;
script_code = code;
}
in ScriptRuleCocciInfo r
| Ast_cocci.CocciRule
(rulename,(dependencies,dropped_isos,z),restast,isexp,ruletype) ->
CocciRuleCocciInfo (
{
ctl = List.hd ctl_toplevel_list;
metavars = metavars;
ast_rule = ast;
isexp = List.hd isexp;
rulename = rulename;
dependencies = dependencies;
dropped_isos = dropped_isos;
free_vars = List.hd free_var_list;
negated_pos_vars = List.hd negated_pos_list;
used_after = List.hd used_after_list;
positions = List.hd positions_list;
ruleid = rulenb;
ruletype = ruletype;
was_matched = ref false;
})
)
(* --------------------------------------------------------------------- *)
let build_info_program cprogram env =
let (cs, parseinfos) =
Common.unzip cprogram in
let alltoks =
parseinfos +> List.map (fun (s,toks) -> toks) +> List.flatten in
(* I use cs' but really annotate_xxx work by doing side effects on cs *)
let cs' =
Comment_annotater_c.annotate_program alltoks cs in
let cs_with_envs =
Type_annoter_c.annotate_program env (*!g_contain_typedmetavar*) cs'
in
zip cs_with_envs parseinfos +> List.map (fun ((c, (enva,envb)), parseinfo)->
let (fullstr, tokens) = parseinfo in
let flow =
ast_to_flow_with_error_messages c +> Common.map_option (fun flow ->
let flow = Ast_to_flow.annotate_loop_nodes flow in
(* remove the fake nodes for julia *)
let fixed_flow = CCI.fix_flow_ctl flow in
if !Flag_cocci.show_flow then print_flow fixed_flow;
if !Flag_cocci.show_before_fixed_flow then print_flow flow;
fixed_flow
)
in
{
ast_c = c; (* contain refs so can be modified *)
tokens_c = tokens;
fullstring = fullstr;
flow = flow;
contain_loop = contain_loop flow;
env_typing_before = enva;
env_typing_after = envb;
was_modified = ref false;
}
)
(* Optimisation. Try not unparse/reparse the whole file when have modifs *)
let rebuild_info_program cs file isexp =
cs +> List.map (fun c ->
if !(c.was_modified)
then
let file = Common.new_temp_file "cocci_small_output" ".c" in
cfile_of_program
[(c.ast_c, (c.fullstring, c.tokens_c)), Unparse_c.PPnormal]
file;
(* Common.command2 ("cat " ^ file); *)
let cprogram = cprogram_of_file file in
let xs = build_info_program cprogram c.env_typing_before in
(* TODO: assert env has not changed,
* if yes then must also reparse what follows even if not modified.
* Do that only if contain_typedmetavar of course, so good opti.
*)
(* Common.list_init xs *) (* get rid of the FinalDef *)
xs
else [c]
) +> List.concat
let rebuild_info_c_and_headers ccs isexp =
ccs +> List.iter (fun c_or_h ->
if c_or_h.asts +> List.exists (fun c -> !(c.was_modified))
then c_or_h.was_modified_once := true;
);
ccs +> List.map (fun c_or_h ->
{ c_or_h with
asts = rebuild_info_program c_or_h.asts c_or_h.full_fname isexp }
)
let prepare_c files choose_includes : file_info list =
let cprograms = List.map cprogram_of_file_cached files in
let includes = includes_to_parse (zip files cprograms) choose_includes in
(* todo?: may not be good to first have all the headers and then all the c *)
let all =
(includes +> List.map (fun hpath -> Right hpath))
++
((zip files cprograms) +> List.map (fun (file, asts) -> Left (file, asts)))
in
let env = ref !TAC.initial_env in
let ccs = all +> Common.map_filter (fun x ->
match x with
| Right hpath ->
if not (Common.lfile_exists hpath)
then begin
pr2 ("TYPE: header " ^ hpath ^ " not found");
None
end
else
let h_cs = cprogram_of_file_cached hpath in
let info_h_cs = build_info_program h_cs !env in
env :=
if null info_h_cs
then !env
else last_env_toplevel_c_info info_h_cs
;
Some {
fname = Common.basename hpath;
full_fname = hpath;
asts = info_h_cs;
was_modified_once = ref false;
fpath = hpath;
fkind = Header;
}
| Left (file, cprogram) ->
(* todo?: don't update env ? *)
let cs = build_info_program cprogram !env in
(* we do that only for the c, not for the h *)
ignore(update_include_rel_pos (cs +> List.map (fun x -> x.ast_c)));
Some {
fname = Common.basename file;
full_fname = file;
asts = cs;
was_modified_once = ref false;
fpath = file;
fkind = Source;
}
)
in
ccs
(*****************************************************************************)
(* Processing the ctls and toplevel C elements *)
(*****************************************************************************)
(* The main algorithm =~
* The algorithm is roughly:
* for_all ctl rules in SP
* for_all minirule in rule (no more)
* for_all binding (computed during previous phase)
* for_all C elements
* match control flow of function vs minirule
* with the binding and update the set of possible
* bindings, and returned the possibly modified function.
* pretty print modified C elements and reparse it.
*
*
* On ne prends que les newbinding ou returned_any_state est vrai.
* Si ca ne donne rien, on prends ce qu'il y avait au depart.
* Mais au nouveau depart de quoi ?
* - si ca donne rien apres avoir traité toutes les fonctions avec ce binding ?
* - ou alors si ca donne rien, apres avoir traité toutes les fonctions
* avec tous les bindings du round d'avant ?
*
* Julia pense qu'il faut prendre la premiere solution.
* Example: on a deux environnements candidats, E1 et E2 apres avoir traité
* la regle ctl 1. On arrive sur la regle ctl 2.
* E1 ne donne rien pour la regle 2, on garde quand meme E1 pour la regle 3.
* E2 donne un match a un endroit et rend E2' alors on utilise ca pour
* la regle 3.
*
* I have not to look at used_after_list to decide to restart from
* scratch. I just need to look if the binding list is empty.
* Indeed, let's suppose that a SP have 3 regions/rules. If we
* don't find a match for the first region, then if this first
* region does not bind metavariable used after, that is if
* used_after_list is empty, then mysat(), even if does not find a
* match, will return a Left, with an empty transformation_info,
* and so current_binding will grow. On the contrary if the first
* region must bind some metavariables used after, and that we
* dont find any such region, then mysat() will returns lots of
* Right, and current_binding will not grow, and so we will have
* an empty list of binding, and we will catch such a case.
*
* opti: julia says that because the binding is
* determined by the used_after_list, the items in the list
* are kind of sorted, so could optimise the insert_set operations.
*)
(* r(ule), c(element in C code), e(nvironment) *)
let rec apply_python_rule r cache newes e rules_that_have_matched
rules_that_have_ever_matched =
show_or_not_scr_rule_name r.scr_ruleid;
if not(interpret_dependencies rules_that_have_matched
!rules_that_have_ever_matched r.scr_dependencies)
then
begin
print_dependencies "dependencies for script not satisfied:"
rules_that_have_matched
!rules_that_have_ever_matched r.scr_dependencies;
show_or_not_binding "in environment" e;
(cache, (e, rules_that_have_matched)::newes)
end
else
begin
let (_, mv, _) = r.scr_ast_rule in
if List.for_all (Pycocci.contains_binding e) mv
then
begin
let relevant_bindings =
List.filter
(function ((re,rm),_) ->
List.exists (function (_,(r,m)) -> r = re && m = rm) mv)
e in
let new_cache =
if List.mem relevant_bindings cache
then cache
else
begin
print_dependencies "dependencies for script satisfied:"
rules_that_have_matched
!rules_that_have_ever_matched r.scr_dependencies;
show_or_not_binding "in" e;
Pycocci.build_classes (List.map (function (x,y) -> x) e);
Pycocci.construct_variables mv e;
let _ = Pycocci.pyrun_simplestring
("import coccinelle\nfrom coccinelle "^
"import *\ncocci = Cocci()\n" ^
r.script_code) in
relevant_bindings :: cache
end in
if !Pycocci.inc_match
then (new_cache, merge_env [(e, rules_that_have_matched)] newes)
else (new_cache, newes)
end
else (cache, merge_env [(e, rules_that_have_matched)] newes)
end
and apply_cocci_rule r rules_that_have_ever_matched es (ccs:file_info list ref) =
Common.profile_code r.rulename (fun () ->
show_or_not_rule_name r.ast_rule r.ruleid;
show_or_not_ctl_text r.ctl r.ast_rule r.ruleid;
let reorganized_env =
reassociate_positions r.free_vars r.negated_pos_vars !es in
(* looping over the environments *)
let (_,newes (* envs for next round/rule *)) =
List.fold_left
(function (cache,newes) ->
function ((e,rules_that_have_matched),relevant_bindings) ->
if not(interpret_dependencies rules_that_have_matched
!rules_that_have_ever_matched r.dependencies)
then
begin
print_dependencies
("dependencies for rule "^r.rulename^" not satisfied:")
rules_that_have_matched
!rules_that_have_ever_matched r.dependencies;
show_or_not_binding "in environment" e;
(cache,
merge_env
[(e +> List.filter (fun (s,v) -> List.mem s r.used_after),
rules_that_have_matched)]
newes)
end
else
let new_bindings =
try List.assoc relevant_bindings cache
with
Not_found ->
print_dependencies
("dependencies for rule "^r.rulename^" satisfied:")
rules_that_have_matched
!rules_that_have_ever_matched r.dependencies;
show_or_not_binding "in" e;
show_or_not_binding "relevant in" relevant_bindings;
(* applying the rule *)
(match r.ruletype with
Ast_cocci.Normal ->
let children_e = ref [] in
(* looping over the functions and toplevel elements in
.c and .h *)
concat_headers_and_c !ccs +> List.iter (fun (c,f) ->
if c.flow <> None
then
(* does also some side effects on c and r *)
let processed =
process_a_ctl_a_env_a_toplevel r
relevant_bindings c f in
match processed with
| None -> ()
| Some newbindings ->
newbindings +> List.iter (fun newbinding ->
children_e :=
Common.insert_set newbinding !children_e)
); (* end iter cs *)
!children_e
| Ast_cocci.Generated ->
process_a_generated_a_env_a_toplevel r
relevant_bindings !ccs;
[]) in
let old_bindings_to_keep =
Common.nub
(e +> List.filter (fun (s,v) -> List.mem s r.used_after)) in
let new_e =
if null new_bindings
then
begin
(*use the old bindings, specialized to the used_after_list*)
if !Flag_ctl.partial_match
then
printf
"Empty list of bindings, I will restart from old env";
[(old_bindings_to_keep,rules_that_have_matched)]
end
else
(* combine the new bindings with the old ones, and
specialize to the used_after_list *)
let old_variables = List.map fst old_bindings_to_keep in
(* have to explicitly discard the inherited variables
because we want the inherited value of the positions
variables not the extended one created by
reassociate_positions. want to reassociate freshly
according to the free variables of each rule. *)
let new_bindings_to_add =
Common.nub
(new_bindings +>
List.map
(List.filter
(fun (s,v) ->
List.mem s r.used_after &&
not (List.mem s old_variables)))) in
List.map
(function new_binding_to_add ->
(List.sort compare
(Common.union_set
old_bindings_to_keep new_binding_to_add),
r.rulename::rules_that_have_matched))
new_bindings_to_add in
((relevant_bindings,new_bindings)::cache,
merge_env new_e newes))
([],[]) reorganized_env in (* end iter es *)
if !(r.was_matched)
then Common.push2 r.rulename rules_that_have_ever_matched;
es := newes;
(* apply the tagged modifs and reparse *)
if not !Flag.sgrep_mode2
then ccs := rebuild_info_c_and_headers !ccs r.isexp
)
and merge_env new_e old_e =
List.fold_left
(function old_e ->
function (e,rules) as elem ->
let (same,diff) = List.partition (function (e1,_) -> e = e1) old_e in
match same with
[] -> elem :: old_e
| [(_,old_rules)] -> (e,Common.union_set rules old_rules) :: diff
| _ -> failwith "duplicate environment entries")
old_e new_e
and bigloop2 rs (ccs: file_info list) =
let es = ref [(Ast_c.emptyMetavarsBinding,[])] in
let ccs = ref ccs in
let rules_that_have_ever_matched = ref [] in
(* looping over the rules *)
rs +> List.iter (fun r ->
match r with
ScriptRuleCocciInfo r ->
if !Flag_cocci.show_ctl_text then begin
Common.pr_xxxxxxxxxxxxxxxxx ();
pr ("script: " ^ r.language);
Common.pr_xxxxxxxxxxxxxxxxx ();
adjust_pp_with_indent (fun () ->
Format.force_newline();
let (l,mv,code) = r.scr_ast_rule in
let deps = r.scr_dependencies in
Pretty_print_cocci.unparse
(Ast_cocci.ScriptRule (l,deps,mv,code)));
end;
if !Flag.show_misc then print_endline "RESULT =";
let (_, newes) =
List.fold_left
(function (cache, newes) ->
function (e, rules_that_have_matched) ->
match r.language with
"python" ->
apply_python_rule r cache newes e rules_that_have_matched
rules_that_have_ever_matched
| "test" ->
concat_headers_and_c !ccs +> List.iter (fun (c,_) ->
if c.flow <> None
then
Printf.printf "Flow: %s\r\nFlow!\r\n%!" c.fullstring);
(cache, newes)
| _ ->
Printf.printf "Unknown language: %s\n" r.language;
(cache, newes)
)
([],[]) !es in
es := newes;
| CocciRuleCocciInfo r ->
apply_cocci_rule r rules_that_have_ever_matched es ccs);
if !Flag.sgrep_mode2
then begin
(* sgrep can lead to code that is not parsable, but we must
* still call rebuild_info_c_and_headers to pretty print the
* action (MINUS), so that later the diff will show what was
* matched by sgrep. But we don't want the parsing error message
* hence the following flag setting. So this code propably
* will generate a NotParsedCorrectly for the matched parts
* and the very final pretty print and diff will work
*)
Flag_parsing_c.verbose_parsing := false;
ccs := rebuild_info_c_and_headers !ccs false
end;
!ccs (* return final C asts *)
and reassociate_positions free_vars negated_pos_vars envs =
(* issues: isolate the bindings that are relevant to a given rule.
separate out the position variables
associate all of the position variables for a given set of relevant
normal variable bindings with each set of relevant normal variable
bindings. Goal: if eg if@p (E) matches in two places, then both inherited
occurrences of E should see both bindings of p, not just its own.
Otherwise, a position constraint for something that matches in two
places will never be useful, because the position can always be
different from the other one. *)
let relevant =
List.map
(function (e,_) ->
List.filter (function (x,_) -> List.mem x free_vars) e)
envs in
let splitted_relevant =
(* separate the relevant variables into the non-position ones and the
position ones *)
List.map
(function r ->
List.fold_left
(function (non_pos,pos) ->
function (v,_) as x ->
if List.mem v negated_pos_vars
then (non_pos,x::pos)
else (x::non_pos,pos))
([],[]) r)
relevant in
let splitted_relevant =
List.map
(function (non_pos,pos) ->
(List.sort compare non_pos,List.sort compare pos))
splitted_relevant in
let non_poss =
List.fold_left
(function non_pos ->
function (np,_) ->
if List.mem np non_pos then non_pos else np::non_pos)
[] splitted_relevant in
let extended_relevant =
(* extend the position variables with the values found at other identical
variable bindings *)
List.map
(function non_pos ->
let others =
List.filter
(function (other_non_pos,other_pos) ->
(* do we want equal? or just somehow compatible? eg non_pos
binds only E, but other_non_pos binds both E and E1 *)
non_pos = other_non_pos)
splitted_relevant in
(non_pos,
List.sort compare
(non_pos @
(combine_pos negated_pos_vars
(List.map (function (_,x) -> x) others)))))
non_poss in
List.combine envs
(List.map (function (non_pos,_) -> List.assoc non_pos extended_relevant)
splitted_relevant)
and combine_pos negated_pos_vars others =
List.map
(function posvar ->
(posvar,
Ast_c.MetaPosValList
(List.sort compare
(List.fold_left
(function positions ->
function other_list ->
try
match List.assoc posvar other_list with
Ast_c.MetaPosValList l1 ->
Common.union_set l1 positions
| _ -> failwith "bad value for a position variable"
with Not_found -> positions)
[] others))))
negated_pos_vars
and bigloop a b =
Common.profile_code "bigloop" (fun () -> bigloop2 a b)
(* does side effects on C ast and on Cocci info rule *)
and process_a_ctl_a_env_a_toplevel2 r e c f =
indent_do (fun () ->
show_or_not_celem "trying" c.ast_c;
Flag.currentfile := Some (f ^ ":" ^get_celem c.ast_c);
let (trans_info, returned_any_states, inherited_bindings, newbindings) =
Common.save_excursion Flag_ctl.loop_in_src_code (fun () ->
Flag_ctl.loop_in_src_code := !Flag_ctl.loop_in_src_code||c.contain_loop;
(***************************************)
(* !Main point! The call to the engine *)
(***************************************)
let model_ctl = CCI.model_for_ctl r.dropped_isos (Common.some c.flow) e
in CCI.mysat model_ctl r.ctl (r.used_after, e)
)
in
if not returned_any_states
then None
else begin
show_or_not_celem "found match in" c.ast_c;
show_or_not_trans_info trans_info;
List.iter (show_or_not_binding "out") newbindings;
r.was_matched := true;
if not (null trans_info)
then begin
c.was_modified := true;
try
(* les "more than one var in a decl" et "already tagged token"
* font crasher coccinelle. Si on a 5 fichiers, donc on a 5
* failed. Le try limite le scope des crashes pendant la
* trasformation au fichier concerne. *)
(* modify ast via side effect *)
ignore(Transformation_c.transform r.rulename r.dropped_isos
inherited_bindings trans_info (Common.some c.flow));
with Timeout -> raise Timeout | UnixExit i -> raise (UnixExit i)
end;
Some (List.map (function x -> x@inherited_bindings) newbindings)
end
)
and process_a_ctl_a_env_a_toplevel a b c f=
Common.profile_code "process_a_ctl_a_env_a_toplevel"
(fun () -> process_a_ctl_a_env_a_toplevel2 a b c f)
and process_a_generated_a_env_a_toplevel2 r env = function
[cfile] ->
let free_vars =
List.filter
(function
(rule,_) when rule = r.rulename -> false
| (_,"ARGS") -> false
| _ -> true)
r.free_vars in
let env_domain = List.map (function (nm,vl) -> nm) env in
let metavars =
List.filter
(function md ->
let (rl,_) = Ast_cocci.get_meta_name md in
rl = r.rulename)
r.metavars in
if Common.include_set free_vars env_domain
then Unparse_hrule.pp_rule metavars r.ast_rule env cfile.full_fname
| _ -> failwith "multiple files not supported"
and process_a_generated_a_env_a_toplevel rule env ccs =
Common.profile_code "process_a_ctl_a_env_a_toplevel"
(fun () -> process_a_generated_a_env_a_toplevel2 rule env ccs)
(*****************************************************************************)
(* The main function *)
(*****************************************************************************)
let full_engine2 (coccifile, isofile) cfiles =
show_or_not_cfiles cfiles;
show_or_not_cocci coccifile isofile;
Pycocci.set_coccifile coccifile;
let isofile =
if not (Common.lfile_exists isofile)
then begin
pr2 ("warning: Can't find default iso file: " ^ isofile);
None
end
else Some isofile
in
(* useful opti when use -dir *)
let (metavars,astcocci,free_var_lists,negated_pos_lists,used_after_lists,
positions_lists,toks,_) =
sp_of_file coccifile isofile
in
let ctls =
Common.memoized _hctl (coccifile, isofile) (fun () ->
ctls_of_ast astcocci used_after_lists positions_lists)
in
let contain_typedmetavar = sp_contain_typed_metavar astcocci in
(* optimisation allowing to launch coccinelle on all the drivers *)
if !Flag_cocci.worth_trying_opt && not (worth_trying cfiles toks)
then begin
pr2 ("not worth trying:" ^ Common.join " " cfiles);
cfiles +> List.map (fun s -> s, None)
end
else begin
if !Flag.show_misc then Common.pr_xxxxxxxxxxxxxxxxx();
if !Flag.show_misc then pr "let's go";
if !Flag.show_misc then Common.pr_xxxxxxxxxxxxxxxxx();
g_contain_typedmetavar := contain_typedmetavar;
check_macro_in_sp_and_adjust toks;
let cocci_infos =
prepare_cocci ctls free_var_lists negated_pos_lists
used_after_lists positions_lists metavars astcocci in
let choose_includes =
match !Flag_cocci.include_options with
Flag_cocci.I_UNSPECIFIED ->
if contain_typedmetavar
then Flag_cocci.I_NORMAL_INCLUDES
else Flag_cocci.I_NO_INCLUDES
| x -> x in
let c_infos = prepare_c cfiles choose_includes in
show_or_not_ctl_tex astcocci ctls;
(* ! the big loop ! *)
let c_infos' = bigloop cocci_infos c_infos in
if !Flag.show_misc then Common.pr_xxxxxxxxxxxxxxxxx ();
if !Flag.show_misc then pr "Finished";
if !Flag_ctl.graphical_trace then gen_pdf_graph ();
if !Flag.show_misc then Common.pr_xxxxxxxxxxxxxxxxx();
c_infos' +> List.map (fun c_or_h ->
if !(c_or_h.was_modified_once)
then begin
let outfile = Common.new_temp_file "cocci-output" ("-" ^ c_or_h.fname)
in
if c_or_h.fkind = Header
then pr2 ("a header file was modified: " ^ c_or_h.fname);
(* and now unparse everything *)
cfile_of_program (for_unparser c_or_h.asts) outfile;
let show_only_minus = !Flag.sgrep_mode2 in
show_or_not_diff c_or_h.fpath outfile show_only_minus;
(c_or_h.fpath,
if !Flag.sgrep_mode2 then None else Some outfile
)
end
else
(c_or_h.fpath, None)
);
end
let full_engine a b =
Common.profile_code "full_engine" (fun () -> full_engine2 a b)
(*****************************************************************************)
(* check duplicate from result of full_engine *)
(*****************************************************************************)
let check_duplicate_modif2 xs =
(* opti: let groups = Common.groupBy (fun (a,resa) (b,resb) -> a =$= b) xs *)
pr2 ("Check duplication for " ^ i_to_s (List.length xs) ^ " files");
let groups = Common.group_assoc_bykey_eff xs in
groups +> Common.map_filter (fun (file, xs) ->
match xs with
| [] -> raise Impossible
| [res] -> Some (file, res)
| res::xs ->
match res with
| None ->
if not (List.for_all (fun res2 -> res2 = None) xs)
then begin
pr2 ("different modification result for " ^ file);
None
end
else Some (file, None)
| Some res ->
if not(List.for_all (fun res2 ->
match res2 with
| None -> false
| Some res2 ->
let diff = Common.cmd_to_list ("diff -u -b -B "^res^" "^res2)
in
null diff
) xs) then begin
pr2 ("different modification result for " ^ file);
None
end
else Some (file, Some res)
)
let check_duplicate_modif a =
Common.profile_code "check_duplicate" (fun () -> check_duplicate_modif2 a)