-
Notifications
You must be signed in to change notification settings - Fork 8
/
Copy pathslicing_evaluation.ml
349 lines (331 loc) · 17.9 KB
/
slicing_evaluation.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
open Core
open Wassail
type slicing_result = {
function_sliced: int32;
slicing_criterion: Instr.Label.t;
initial_number_of_instrs : int;
slice_size_before_adaptation : int;
slice_size_after_adaptation : int;
cfg_time : Time_float.Span.t;
spec_time : Time_float.Span.t;
control_time : Time_float.Span.t;
data_time : Time_float.Span.t;
mem_time : Time_float.Span.t;
global_time : Time_float.Span.t;
slicing_time1 : Time_float.Span.t;
slicing_time2 : Time_float.Span.t;
}
type ignored_reason =
| NoFunction
| NoInstruction of int32
type result =
| Success of slicing_result
| Ignored of ignored_reason
| SliceExtensionError of int32 * Instr.Label.t * int * string
| SliceError of int32 * Instr.Label.t * int * string
| CfgError of int32 * int * string
| LoadError of string
let all_labels (instrs : 'a Instr.t list) : Instr.Label.Set.t =
List.fold_left instrs
~init:Instr.Label.Set.empty
~f:(fun acc instr ->
Instr.Label.Set.union acc (Instr.all_labels_no_merge instr))
let time (f : unit -> 'a) : 'a * Time_float.Span.t =
let t0 = Time_float.now () in
let res = f () in
let t1 = Time_float.now () in
(res, Time_float.diff t1 t0)
let prefix : string ref = ref "."
let output (file : string) (fields : string list) =
Out_channel.with_file (Printf.sprintf "%s/%s" !prefix file) ~append:true ~f:(fun ch ->
Out_channel.output_string ch (Printf.sprintf "%s\n" (String.concat ~sep:"," fields)))
let output_slicing_result filename = function
| Success r ->
output "data.txt" [filename; (* 0 *)
Int32.to_string r.function_sliced; (* 1 *)
Instr.Label.to_string r.slicing_criterion; (* 2 *)
string_of_int r.initial_number_of_instrs; (* 3 *)
string_of_int r.slice_size_before_adaptation; (* 4 *)
string_of_int r.slice_size_after_adaptation; (* 5 *)
string_of_float (Time_float.Span.to_ms r.cfg_time); (* 6 *)
string_of_float (Time_float.Span.to_ms r.spec_time); (* 7 *)
string_of_float (Time_float.Span.to_ms r.control_time); (* 8 *)
string_of_float (Time_float.Span.to_ms r.data_time); (* 9 *)
string_of_float (Time_float.Span.to_ms r.mem_time); (* 10 *)
string_of_float (Time_float.Span.to_ms r.global_time); (* 11 *)
string_of_float (Time_float.Span.to_ms r.slicing_time1); (* 12 *)
string_of_float (Time_float.Span.to_ms r.slicing_time2)] (* 13 *)
| Ignored NoFunction ->
output "nofunction.txt" [filename]
| Ignored (NoInstruction f) ->
output "noinstruction.txt" [filename; Int32.to_string f]
| SliceExtensionError (f, criterion, size, reason) ->
output "error.txt" [filename; (* 0 *)
Int32.to_string f; (* 1 *)
Instr.Label.to_string criterion; (* 2 *)
string_of_int size; (* 3 *)
"slice-extension"; (* 4 *)
reason] (* 5 *)
| SliceError (f, criterion, size, reason) ->
output "error.txt" [filename; (* 0 *)
Int32.to_string f; (* 1 *)
Instr.Label.to_string criterion; (* 2 *)
string_of_int size; (* 3 *)
"slice"; (* 4 *)
reason] (* 5 *)
| CfgError (f, size, reason) ->
output "error.txt" [filename; (* 0 *)
Int32.to_string f; (* 1 *)
"-1"; (* 2 *)
string_of_int size; (* 3 *)
"cfg"; (* 4 *)
reason] (* 5 *)
| LoadError _ ->
output "loaderror.txt" [filename]
let slices (filename : string) (criterion_selection : [`Random | `All | `Last ]) : unit =
try
Spec_inference.propagate_globals := false;
Spec_inference.propagate_locals := false;
Spec_inference.use_const := false;
let wasm_mod = Wasm_module.of_file filename in
let funcs = wasm_mod.funcs in
if List.is_empty funcs then
output_slicing_result filename (Ignored NoFunction)
else
List.iteri funcs ~f:(fun _i func ->
let labels = Instr.Label.Set.to_array (all_labels func.code.body) in
if Array.length labels = 0 then
output_slicing_result filename (Ignored (NoInstruction func.idx))
else
try
let t0 = Time_float.now () in
let cfg_raw = Cfg_builder.build wasm_mod func.idx in
let cfg_time = Time_float.diff (Time_float.now ()) t0 in
let t0 = Time_float.now () in
let cfg, () = Spec_inference.Intra.analyze wasm_mod cfg_raw Int32Map.empty in
let spec_time = Time_float.diff (Time_float.now ()) t0 in
let cfg_instructions = Cfg.all_instructions cfg in
let preanalysis = Slicing.preanalysis cfg cfg_instructions in
List.iter (match criterion_selection with
| `Random -> [Array.get labels (Random.int (Array.length labels))]
| `All -> Array.to_list labels
| `Last -> [Array.last labels])
~f:(fun slicing_criterion ->
try
let instrs_to_keep, (control_time, data_time, mem_time, global_time, slicing_time1) = Slicing.instructions_to_keep cfg cfg_instructions preanalysis (Instr.Label.Set.singleton slicing_criterion) in
try
let t0 = Time_float.now () in
let sliced_func = Slicing.slice_to_funcinst cfg ~instrs:(Some instrs_to_keep) cfg_instructions (Instr.Label.Set.singleton slicing_criterion) in
let t1 = Time_float.now () in
let slicing_time2 = Time_float.diff t1 t0 in
let sliced_labels = all_labels sliced_func.code.body in
(* Printf.printf "fun %ld:%s -- initial: %s, before: %s, after: %d\n" func.idx (Instr.Label.to_string slicing_criterion) (Instr.Label.Set.to_string (all_labels func.code.body)) (Instr.Label.Set.to_string instrs_to_keep) (Instr.Label.Set.length sliced_labels); *)
output_slicing_result filename (Success {
function_sliced = func.idx;
slicing_criterion;
initial_number_of_instrs = Array.length labels;
slice_size_before_adaptation = Instr.Label.Set.length instrs_to_keep;
slice_size_after_adaptation = Instr.Label.Set.length sliced_labels;
cfg_time; spec_time; slicing_time1; slicing_time2; control_time; data_time; mem_time; global_time
})
with e ->
output_slicing_result filename (SliceExtensionError (func.idx, slicing_criterion, Array.length labels, Exn.to_string_mach e))
with e ->
output_slicing_result filename (SliceError (func.idx, slicing_criterion, Array.length labels, Exn.to_string_mach e)))
with e -> output_slicing_result filename (CfgError (func.idx, Array.length labels, Exn.to_string_mach e)))
with e -> output_slicing_result filename (LoadError (Exn.to_string e))
let evaluate_file (filename : string) (criterion_selection : [`All | `Random | `Last]) : unit =
slices filename criterion_selection
let evaluate =
Command.basic
~summary:"Evaluate the slicer on a a benchmark"
Command.Let_syntax.(
let%map_open filename = anon ("file" %: string)
and prefix_opt = flag "-p" (optional string) ~doc:"prefix for where to save the results file (default: current directory)"
and all = flag "-a" no_arg ~doc:"slice on all functions, for all slicing criterion"
and last = flag "-l" no_arg ~doc:"slice on all functions, for the last slicing criterion" in
fun () ->
begin match prefix_opt with
| None -> ()
| Some p -> prefix := p
end;
evaluate_file filename (if all then `All else if last then `Last else `Random))
(** Find the slicing criterion, i.e., the address at which the string ORBS is *)
let find_criterion (filename : string) : Int32.t =
(* Find the specific string in the data section *)
let wasm_mod = Wasm_module.of_file filename in
let pattern = "\nORBS:" in
let address = match List.find_map wasm_mod.datas ~f:(fun segment ->
match String.substr_index segment.dinit ~pattern with
| Some idx -> begin match (Segment_mode.offset segment.dmode) with
| (Instr.Data {instr = Instr.Const (Prim_value.I32 n); _}) :: [] -> Some (Int32.(n + (of_int_exn idx)))
| _ -> failwith "unsupported segment offset"
end
| None -> None) with
| Some idx -> idx
| None -> failwith "cannot find pattern in any data segment" in
Printf.printf "%s: %ld\n" filename address;
address
(* Generate a slice for printf function calls with a specific string *)
let generate_slice (filename : string) (output_file : string) =
let refined = false in (* Set to false if you want to slice the printf call, to true if you want to slice on the second printf argument *)
let only_function = false in (* set to false to generate the whole module *)
Spec_inference.propagate_globals := false;
Spec_inference.propagate_locals := false;
Spec_inference.use_const := false;
let wasm_mod = Wasm_module.of_file filename in
let address = find_criterion filename in
(* Find the index of the printf function (it should be exported, otherwise it is unnamed) *)
let printf_export_idx = match List.find_map wasm_mod.exported_funcs ~f:(fun (idx, name, _type) ->
if String.equal name "printf" then
Some idx
else
None) with
| Some idx -> idx
| None -> failwith "cannot find printf in exported functions" in
Spec_inference.propagate_globals := false;
Spec_inference.propagate_locals := false;
Printf.printf "printf id: %ld\n" printf_export_idx;
(* Find the function and slicing criterion: it should call printf with the string's position in the data segment as argument *)
Spec_inference.use_const := true;
Spec_inference.propagate_locals := true;
let (function_idx, slicing_criteria) = match List.find_map wasm_mod.funcs ~f:(fun func ->
let cfg = Cfg.without_empty_nodes_with_no_predecessors (Spec_analysis.analyze_intra1 wasm_mod func.idx) in
match List.filter_map (Cfg.all_instructions_list cfg) ~f:(function
| Instr.Control ({instr = Call (_, _, idx); annotation_before; label; _ }) when Int32.(idx = printf_export_idx) ->
begin match (Spec.get_or_fail annotation_before).vstack with
| _ :: first_arg :: _ when Var.equal first_arg (Var.Const (Prim_value.I32 address)) -> Some label
| _ -> None
end
| _ -> None) with
| [] -> None
| l -> Some (func.idx, l)) with
| Some r -> r
| None -> failwith "cannot find function to slice" in
Spec_inference.use_const := false;
Spec_inference.propagate_globals := false;
Spec_inference.propagate_locals := false;
let actual_slicing_criteria =
match List.find_map wasm_mod.funcs ~f:(fun func ->
if Int32.(func.idx = function_idx) then begin
Printf.printf "We are slicing function %ld\n" func.idx;
let cfg = Cfg.without_empty_nodes_with_no_predecessors (Spec_analysis.analyze_intra1 wasm_mod func.idx) in
let (_, _, use_def) = Use_def.make cfg in
match List.filter_map (Cfg.all_instructions_list cfg) ~f:(function
| Instr.Control ({instr = Call (_, _, idx); annotation_before; label; _ }) when Int32.(idx = printf_export_idx) ->
begin match (Spec.get_or_fail annotation_before).vstack with
| second_arg :: _ when List.mem slicing_criteria label ~equal:Instr.Label.equal ->
Printf.printf "second arg is: %s\n" (Var.to_string second_arg);
begin match Use_def.UseDefChains.get use_def (Use_def.Use.make label second_arg) with
| Use_def.Def.Instruction (arg_label, _) ->
Printf.printf "it is defined at: %s\n" (Instr.Label.to_string arg_label);
Some arg_label
| _ -> None
end
| _ -> None
end
| _ -> None) with
| [] -> None
| l -> Some l
end else
None) with
| Some r -> r
| None -> failwith "cannot find second argument" in
(* Perform the actual slicing *)
Spec_inference.use_const := false;
Spec_inference.propagate_globals := false;
Spec_inference.propagate_locals := false;
let cfg = Cfg.without_empty_nodes_with_no_predecessors (Spec_analysis.analyze_intra1 wasm_mod function_idx) in
let funcinst = Slicing.slice_to_funcinst cfg (Cfg.all_instructions cfg) (Instr.Label.Set.of_list (if refined then actual_slicing_criteria else slicing_criteria)) in
let module_ = Wasm_module.replace_func wasm_mod function_idx funcinst in
Out_channel.with_file output_file
~f:(fun ch ->
Out_channel.output_string ch
(if only_function
then Func_inst.to_wasm_string funcinst
else Wasm_module.to_string module_))
let gen_slice_specific =
Command.basic
~summary:"Generate a slice for a specific slicing criterion"
Command.Let_syntax.(
let%map_open file = anon ("file" %: string)
and output = anon ("output" %: string) in
fun () ->
generate_slice file output)
let find_criterion =
Command.basic
~summary:"Find the slicing criterion in a program. Prints the address the string ORBS."
Command.Let_syntax.(
let%map_open file = anon ("file" %: string) in
fun () ->
let _ = find_criterion file in ())
let count_instructions_in_slice (filename : string) (output_file : string) =
let output_func (i : Int32.t) (f : Func_inst.t) (put : string -> unit) =
put (Printf.sprintf "(func (;%ld;) (type %ld)" i f.type_idx);
if not (List.is_empty (fst f.typ)) then begin
put (Printf.sprintf " (param %s)"
(String.concat ~sep:" " (List.map (fst f.typ) ~f:Type.to_string)))
end;
if not (List.is_empty (snd f.typ)) then begin
put (Printf.sprintf " (result %s)"
(String.concat ~sep:" " (List.map (snd f.typ) ~f:Type.to_string)))
end;
put "\n";
if not (List.is_empty f.code.locals) then begin
put (Printf.sprintf " (local %s)\n" (String.concat ~sep:" " (List.map f.code.locals ~f:Type.to_string)))
end;
put (Instr.list_to_string f.code.body ?indent:(Some 2) ?sep:(Some "\n") (fun () -> ""));
put ")\n" in
let pattern = "\nORBS:" in
Spec_inference.propagate_globals := false;
Spec_inference.propagate_locals := false;
Spec_inference.use_const := false;
let wasm_mod = Wasm_module.of_file filename in
(* Find the specific string in the data section *)
let str_pos = match List.find_map wasm_mod.datas ~f:(fun segment ->
match String.substr_index segment.dinit ~pattern with
| Some idx -> begin match (Segment_mode.offset segment.dmode) with
| (Instr.Data {instr = Instr.Const (Prim_value.I32 n); _}) :: [] -> Some (Int32.(n + (of_int_exn idx)))
| _ -> failwith "unsupported segment offset"
end
| None -> None) with
| Some idx -> idx
| None -> failwith "cannot find pattern in any data segment" in
(* Find the index of the printf function (it should be exported, otherwise it is unnamed) *)
let printf_export_idx = match List.find_map wasm_mod.exported_funcs ~f:(fun (idx, name, _type) ->
if String.equal name "printf" then
Some idx
else
None) with
| Some idx -> idx
| None -> failwith "cannot find printf in exported functions" in
Spec_inference.propagate_globals := false;
Spec_inference.propagate_locals := false;
(* Find the function and slicing criterion: it should call printf with the string's position in the data segment as argument *)
let (function_idx, _slicing_criterion) = match List.find_map wasm_mod.funcs ~f:(fun func ->
Spec_inference.use_const := true;
Spec_inference.propagate_locals := true;
Out_channel.with_file output_file
~f:(fun ch -> output_func func.idx func (Out_channel.output_string ch));
let cfg = Cfg.without_empty_nodes_with_no_predecessors (Spec_analysis.analyze_intra1 wasm_mod func.idx) in
List.find_map (Cfg.all_instructions_list cfg) ~f:(function
| Instr.Control ({instr = Call (_, _, idx); annotation_before; label; _ }) when Int32.(idx = printf_export_idx) ->
begin match (Spec.get_or_fail annotation_before).vstack with
| _ :: first_arg :: _ when Var.equal first_arg (Var.Const (Prim_value.I32 str_pos)) -> Some (func.idx, label)
| _ -> None
end
| _ -> None)) with
| Some r -> r
| None -> failwith "cannot find function to slice" in
let f = List32.nth_exn wasm_mod.funcs Int32.(function_idx - wasm_mod.nfuncimports) in
let all_labels = List.fold_left f.code.body ~init:Instr.Label.Set.empty ~f:(fun acc i ->
Instr.Label.Set.union acc (Instr.all_labels_no_merge i)) in
Printf.printf "%d\n" (Instr.Label.Set.length all_labels)
let count_in_slice =
Command.basic
~summary:"Count the number of instructions in a slice for a specific slicing criterion"
Command.Let_syntax.(
let%map_open file = anon ("file" %: string)
and out = anon ("out" %: string) in
fun () ->
count_instructions_in_slice file out)