-
Notifications
You must be signed in to change notification settings - Fork 94
/
Copy pathcfg.ml
345 lines (300 loc) · 10.8 KB
/
cfg.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
(*
*
* Copyright (c) 2001-2003,
* George C. Necula <[email protected]>
* Scott McPeak <[email protected]>
* Wes Weimer <[email protected]>
* Simon Goldsmith <[email protected]>
* S.P Rahul, Aman Bhargava
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are
* met:
*
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* 3. The names of the contributors may not be used to endorse or promote
* products derived from this software without specific prior written
* permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
* IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
* PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
* OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
*)
(* Authors: Aman Bhargava, S. P. Rahul *)
(* sfg: this stuff was stolen from optim.ml - the code to print the cfg as
a dot graph is mine *)
open Pretty
open Cil
module E=Errormsg
(* entry points: cfgFun, printCfgChannel, printCfgFilename *)
(* known issues:
* - successors of an If somehow end up with two edges each
*)
(*------------------------------------------------------------*)
(* Notes regarding CFG computation:
1) Initially only succs and preds are computed. sid's are filled in
later, in whatever order is suitable (e.g. for forward problems, reverse
depth-first postorder).
2) If a stmt (return, break or continue) has no successors, then
function return must follow.
No predecessors means it is the start of the function
3) We use the fact that initially all the succs and preds are assigned []
*)
(* Fill in the CFG info for the stmts in a block
next = succ of the last stmt in this block
break = succ of any Break in this block
cont = succ of any Continue in this block
None means the succ is the function return. It does not mean the break/cont
is invalid. We assume the validity has already been checked.
rlabels = list of potential successors of computed gotos (ie. every labelled
statement whose address is retained)
*)
(* Most recently assigned statement id. cfgStmt increments it before
   numbering each statement, so ids stay unique across every function
   processed since the last reset; clearFileCFG sets it back to 0. *)
let start_id = ref 0
(** Visitor that prepends to [slr] every statement carrying a [Case],
    [CaseRange] or [Default] label.  It never descends into a [Switch]
    statement, so labels belonging to a nested switch are not collected. *)
class caseLabeledStmtFinder slr = object
  inherit nopCilVisitor

  method vstmt s =
    let is_case_label = function
      | Case _ | CaseRange _ | Default _ -> true
      | _ -> false
    in
    (* Record the statement first, then decide whether to visit below it. *)
    if List.exists is_case_label s.labels then slr := s :: !slr;
    match s.skind with
    | Switch _ -> SkipChildren
    | _ -> DoChildren
end
(** Statements of [b] that carry a case/default label, as gathered by
    [caseLabeledStmtFinder].  The list is in reverse visiting order because
    the visitor prepends each hit. *)
let findCaseLabeledStmts (b : block) : stmt list =
  let found = ref [] in
  let finder = new caseLabeledStmtFinder found in
  let _ = visitCilBlock finder b in
  !found
(** Visitor that prepends to [slr] the statement referenced by every
    [AddrOfLabel] expression it encounters. *)
class addrOfLabelFinder slr = object
  inherit nopCilVisitor

  method vexpr e =
    match e with
    | AddrOfLabel target ->
      slr := !target :: !slr;
      SkipChildren
    | _ -> DoChildren
end
(** Statements of [b] whose label address is taken somewhere in [b], as
    gathered by [addrOfLabelFinder] (reverse visiting order; a statement
    appears once per [AddrOfLabel] occurrence). *)
let findAddrOfLabelStmts (b : block) : stmt list =
  let found = ref [] in
  let finder = new addrOfLabelFinder found in
  let _ = visitCilBlock finder b in
  !found
(* entry point *)
(** Compute the control flow graph of [fd]: every statement gets a fresh
    [sid] and has its [succs] and [preds] filled in.  Also stores the last
    id handed out in [fd.smaxstmtid] and the statements, in the order they
    were numbered, in [fd.sallstmts].
    @return the number of statements numbered for this function. *)
let rec cfgFun (fd : fundec): int =
  let first_id = !start_id in
  let visited = ref [] in
  (* Possible targets of computed gotos: labels whose address is taken. *)
  let label_targets = findAddrOfLabelStmts fd.sbody in
  cfgBlock fd.sbody None None None visited label_targets;
  fd.smaxstmtid <- Some !start_id;
  (* [visited] was built by prepending, so reverse it back. *)
  fd.sallstmts <- List.rev !visited;
  !start_id - first_id
(* Fill in the CFG info for a statement list: each statement falls through
   to the one after it, and the last one falls through to [next]. *)
and cfgStmts (ss: stmt list)
    (next:stmt option) (break:stmt option) (cont:stmt option)
    (nodeList:stmt list ref) (rlabels: stmt list) =
  match ss with
  | [] -> ()
  | [only] -> cfgStmt only next break cont nodeList rlabels
  | first :: (second :: _ as rest) ->
    cfgStmt first (Some second) break cont nodeList rlabels;
    cfgStmts rest next break cont nodeList rlabels
(* Fill in the CFG info for the statements of [blk]; all the work is done
   by cfgStmts on the block's statement list. *)
and cfgBlock (blk: block)
    (next:stmt option) (break:stmt option) (cont:stmt option)
    (nodeList:stmt list ref) (rlabels: stmt list) =
  let stmts = blk.bstmts in
  cfgStmts stmts next break cont nodeList rlabels
(* Fill in the CFG info for a single stmt.
   next  = successor when control falls off the end of [s]
   break = successor of a Break reached inside [s]
   cont  = successor of a Continue reached inside [s]
   (None stands for "function return" in all three cases.)
   nodeList accumulates every visited stmt, most recent first.
   rlabels  = candidate targets of computed gotos.
   Raises Failure "CFG bug" if [s] already has successors, i.e. the CFG
   was not cleared before being recomputed. *)
and cfgStmt (s: stmt) (next:stmt option) (break:stmt option) (cont:stmt option)
    (nodeList:stmt list ref) (rlabels: stmt list) =
  (* Number the statement and remember it so that later passes can walk
     all statements through the flat list. *)
  incr start_id;
  s.sid <- !start_id;
  nodeList := s :: !nodeList;
  (match s.succs with
   | [] -> ()
   | _ :: _ ->
     (*E.s*)ignore (bug "CFG must be cleared before being computed!");
     raise (Failure "CFG bug"));
  (* Add the edge s -> target, skipping it on whichever side already has
     it (physical equality). *)
  let link (target: stmt) =
    if not (List.memq target s.succs) then s.succs <- target :: s.succs;
    if not (List.memq s target.preds) then target.preds <- s :: target.preds
  in
  let link_opt (target: stmt option) =
    match target with
    | Some t -> link t
    | None -> ()
  in
  (* Edge to the first statement of [b], or to [fallback] when [b] is
     empty. *)
  let link_block_entry (b: block) (fallback: stmt option) =
    match b.bstmts with
    | first :: _ -> link first
    | [] -> link_opt fallback
  in
  (* An instruction falls through unless it is a call to something that
     carries the noreturn attribute. *)
  let falls_through (i: instr) : bool =
    match i with
    | Call (_, Lval (Var callee, NoOffset), _, _) ->
      not (hasAttribute "noreturn" callee.vattr)
    | Call (_, fn, _, _) ->
      not (hasAttribute "noreturn" (typeAttrs (typeOf fn)))
    | _ -> true
  in
  let has_default_label (st: stmt) =
    List.exists (function Default _ -> true | _ -> false) st.labels
  in
  match s.skind with
  | Instr il ->
    if List.for_all falls_through il then link_opt next
  | Return _ -> ()
  | Goto (target, _) -> link !target
  | ComputedGoto _ -> List.iter link rlabels
  | Break _ -> link_opt break
  | Continue _ -> link_opt cont
  | If (_, then_blk, else_blk, _) ->
    (* Link the false branch first: edges are prepended, so the succs of
       an If end up as [true branch; false branch]. *)
    link_block_entry else_blk next;
    link_block_entry then_blk next;
    cfgBlock then_blk next break cont nodeList rlabels;
    cfgBlock else_blk next break cont nodeList rlabels
  | Block b ->
    link_block_entry b next;
    cfgBlock b next break cont nodeList rlabels
  | Switch (_, body, _, _) ->
    let cases = findCaseLabeledStmts body in
    (* Add successors in order *)
    List.iter link (List.rev cases);
    (* sfg: without a default case the switch may fall straight to next *)
    if not (List.exists has_default_label cases) then link_opt next;
    (* Inside a switch, Break leaves to whatever follows the switch. *)
    cfgBlock body next next cont nodeList rlabels
  | Loop (body, loc, _, _) ->
    s.skind <- Loop (body, loc, Some s, next);
    link_block_entry body (Some s);
    (* Since all loops have terminating condition true, no direct edge is
       added from the loop to the stmt that follows it; only a Break in
       the body reaches [next]. *)
    cfgBlock body (Some s) next (Some s) nodeList rlabels
  | TryExcept _ | TryFinally _ ->
    E.s (E.unimp "try/except/finally")
(*------------------------------------------------------------*)
(**************************************************************)
(* do something for all stmts in a fundec *)
(* Apply [todo] to every statement of [fd], parents before the statements
   nested inside them.  The result of [todo] is discarded. *)
let rec forallStmts (todo) (fd : fundec) =
  fasBlock todo fd.sbody
(* Apply [todo] to each statement of [b], in order, recursing into
   nested blocks through fasStmt. *)
and fasBlock (todo) (b : block) =
  List.iter (fun st -> fasStmt todo st) b.bstmts
(* Apply [todo] to [s], then to the statements nested inside it.
   try/except and try/finally statements are not supported and are
   reported through E.unimp, after [todo] has already run on them. *)
and fasStmt (todo) (s : stmt) =
  ignore (todo s);
  match s.skind with
  | Instr _ | Return _ | Goto _ | ComputedGoto _ | Break _ | Continue _ -> ()
  | Block body | Switch (_, body, _, _) | Loop (body, _, _, _) ->
    fasBlock todo body
  | If (_, then_blk, else_blk, _) ->
    fasBlock todo then_blk;
    fasBlock todo else_blk
  | TryExcept _ | TryFinally _ -> E.s (E.unimp "try/except/finally")
;;
(**************************************************************)
(* printing the control flow graph - you have to compute it first *)
(* Name of the dot node for [s]: its statement id. *)
let d_cfgnodename () (s : stmt) =
  let id = s.sid in
  dprintf "%d" id
(* Label of the dot node for [s]: "<sid>: <kind of statement>".  Only the
   kind is shown; for an If the condition expression is not printed. *)
let d_cfgnodelabel () (s : stmt) =
  let kind =
    match s.skind with
    | Instr _ -> "instr"
    | Return _ -> "return"
    | Goto _ | ComputedGoto _ -> "goto"
    | Break _ -> "break"
    | Continue _ -> "continue"
    | If _ -> "if"
    | Switch _ -> "switch"
    | Loop _ -> "loop"
    | Block _ -> "block"
    | TryFinally _ -> "try-finally"
    | TryExcept _ -> "try-except"
  in
  dprintf "%d: %s" s.sid kind
(* One dot edge "src -> dest".  [src] comes first so that the partial
   application [d_cfgedge src] can be used as an element printer. *)
let d_cfgedge (src) () (dest) =
  dprintf "%a -> %a" d_cfgnodename src d_cfgnodename dest
(* Dot description of [s]: the node declaration with its label, followed
   by one edge per successor. *)
let d_cfgnode () (s : stmt) =
  let d_edges = d_list "\n\t" (d_cfgedge s) in
  dprintf "%a [label=\"%a\"]\n\t%a"
    d_cfgnodename s
    d_cfgnodelabel s
    d_edges s.succs
(**********************************************************************)
(* entry points *)
(** Print the control flow graph of [fd], in dot form, to [chan] as a
    digraph named [CFG_<function name>].  The CFG has to be computed
    beforehand; this only reads [sid] and [succs]. *)
let printCfgChannel (chan : out_channel) (fd : fundec) =
  let emit_node (st : stmt) = fprintf chan "%a\n" d_cfgnode st in
  ignore (fprintf chan "digraph CFG_%s {\n" fd.svar.vname);
  forallStmts emit_node fd;
  ignore (fprintf chan "}\n")
(** Print the control flow graph of [fd], in dot form, to the file
    [filename] (created or truncated by [open_out]).  The channel is closed
    on every path: if printing fails, it is closed before the exception is
    re-raised, so no file descriptor is leaked.
    @raise Sys_error if the file cannot be opened or written. *)
let printCfgFilename (filename : string) (fd : fundec) =
  let chan = open_out filename in
  try
    printCfgChannel chan fd;
    close_out chan
  with e ->
    (* Best-effort close: the original failure is the one worth reporting. *)
    close_out_noerr chan;
    raise e
;;
(**********************************************************************)
(* Reset the per-statement CFG fields of every statement in [fd]:
   sid becomes -1, succs and preds become empty. *)
let clearCFGinfo (fd : fundec) =
  forallStmts
    (fun st ->
       st.sid <- -1;
       st.succs <- [];
       st.preds <- [])
    fd
(* Clear the CFG info of every function definition in [f] and restart
   statement numbering from 0. *)
let clearFileCFG (f : file) =
  start_id := 0;
  let clear_global = function
    | GFun (fd, _) -> clearCFGinfo fd
    | _ -> ()
  in
  iterGlobals f clear_global
(* Compute the CFG of every function definition in [f]; the statement
   counts returned by cfgFun are discarded. *)
let computeFileCFG (f : file) =
  let compute_global = function
    | GFun (fd, _) -> ignore (cfgFun fd)
    | _ -> ()
  in
  iterGlobals f compute_global
(* Concatenation of the sallstmts lists of all function definitions in
   [f].  Each function's list is placed in front of what was accumulated
   from the globals folded before it. *)
let allStmts (f : file) : stmt list =
  let collect acc = function
    | GFun (fd, _) -> fd.sallstmts @ acc
    | _ -> acc
  in
  foldGlobals f collect []