-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathanalyze.py
More file actions
388 lines (330 loc) · 15.6 KB
/
analyze.py
File metadata and controls
388 lines (330 loc) · 15.6 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
import os
import json
import shutil
import itertools
import uuid
import argparse
import subprocess
import dataclasses
import sys
from pathlib import PosixPath
from typing import Callable, TypeVar
import matplotlib.pyplot as plt # type: ignore
import numpy as np
from diff_fuzz import trace_batch, fingerprint_t, json_t, EdgeCountSnapshot
# Directory layout for benchmarking runs and their outputs.
BENCHMARKING_DIR: PosixPath = PosixPath("benchmarking").resolve()
# Where diff_fuzz.py drops each run's differentials folder (named by run UUID).
RESULTS_DIR: PosixPath = PosixPath("results").resolve()
# Where diff_fuzz.py drops each run's <uuid>.json report.
REPORTS_DIR: PosixPath = PosixPath("reports").resolve()
# Each invocation of this script writes its graphs/reports under a fresh UUID here.
ANALYSES_DIR: PosixPath = BENCHMARKING_DIR.joinpath("analyses").resolve()
# Scratch directory used while tracing differentials; must not pre-exist.
RUN_DIR: PosixPath = PosixPath("/tmp").joinpath("diff-fuzz-analyzer")
# The live fuzzer config, overwritten per run and restored from the copy below.
CONFIG_FILE_PATH: PosixPath = PosixPath("config.py").resolve()
CONFIG_COPY_PATH: PosixPath = BENCHMARKING_DIR.joinpath("config_copy.py")
T = TypeVar("T")
def attempt(f: Callable[..., T], error_message: str, *args, **kwargs) -> T | None:
try:
return f(*args, **kwargs)
except: # pylint: disable=bare-except
print(error_message, file=sys.stderr)
return None
# Check that the files exported by a given run of the fuzzer actually exist
def check_fuzz_output(run_name: str, run_uuid: str) -> None:
    """Verify that a completed fuzzer run exported its report and results.

    Args:
        run_name: Human-readable name of the run (used in error messages).
        run_uuid: UUID string identifying the run's output files.

    Raises:
        FileNotFoundError: if the run's report JSON or its differentials
            directory is missing.
    """
    # Use pathlib's own predicates instead of os.path on PosixPath objects.
    report_path: PosixPath = REPORTS_DIR.joinpath(run_uuid).with_suffix(".json")
    if not report_path.is_file():
        raise FileNotFoundError(f"{run_name} doesn't have a report file!")
    differentials_path: PosixPath = RESULTS_DIR.joinpath(run_uuid)
    if not differentials_path.is_dir():
        raise FileNotFoundError(f"{run_name} doesn't have a differentials folder!")
# Snapshot of the cumulative bug tally at a point in a fuzzing run.
@dataclasses.dataclass
class BugCount:
    """Cumulative number of bugs found up to a particular time and generation.

    Built from the report's "differentials" list, which contains one JSON
    object per bug, sorted by discovery time ascending. Each such object
    carries a base64-encoded example of the bug, the path to a file holding
    an example, the time the bug was found, and the generation it was found in.
    """

    # Cumulative number of bugs found up to and including this one.
    bug_count: int
    # Time (seconds into the run) at which the latest included bug was found.
    time: float
    # Generation in which the latest included bug was found.
    generation: int
def parse_reports(
    uuids_to_names: dict[str, str]
) -> tuple[dict[str, list[BugCount]], dict[str, dict[str, list[EdgeCountSnapshot]]]]:
    """Load every run's report JSON and extract bug and edge-coverage data.

    Returns a pair of mappings:
      * run uuid -> cumulative ``BugCount`` entries (one per differential), and
      * target name -> run uuid -> ``EdgeCountSnapshot`` entries.

    A malformed report trips an AssertionError, which the caller converts
    into a user-facing error.
    """
    bug_data_by_run: dict[str, list[BugCount]] = {}
    edge_data_by_target: dict[str, dict[str, list[EdgeCountSnapshot]]] = {}
    for uuid_str in uuids_to_names:
        with open(REPORTS_DIR.joinpath(uuid_str).with_suffix(".json"), "rb") as report_file:
            report: json_t = json.load(report_file)
        assert isinstance(report, dict)
        # Bug data: the differentials list is sorted by time, so the running
        # total is simply each entry's 1-based position.
        diffs_json: json_t = report["differentials"]
        assert isinstance(diffs_json, list)
        bug_counts: list[BugCount] = []
        for position, diff_json in enumerate(diffs_json, start=1):
            assert isinstance(diff_json, dict)
            assert isinstance(diff_json["time"], float)
            assert isinstance(diff_json["generation"], int)
            bug_counts.append(BugCount(position, diff_json["time"], diff_json["generation"]))
        bug_data_by_run[uuid_str] = bug_counts
        # Edge-coverage data, grouped per fuzz target across all runs.
        coverage: json_t = report["coverage"]
        assert isinstance(coverage, dict)
        for target in coverage.keys():
            assert isinstance(target, str)
            if target not in edge_data_by_target:
                # Pre-seed an empty series for every run so plots line up.
                edge_data_by_target[target] = {u: [] for u in uuids_to_names}
            snapshots_json: json_t = coverage[target]
            assert isinstance(snapshots_json, list)
            for snapshot_json in snapshots_json:
                assert isinstance(snapshot_json, dict)
                assert isinstance(snapshot_json["edges"], int)
                assert isinstance(snapshot_json["time"], float)
                assert isinstance(snapshot_json["generation"], int)
                edge_data_by_target[target][uuid_str].append(
                    EdgeCountSnapshot(
                        snapshot_json["edges"], snapshot_json["time"], snapshot_json["generation"]
                    )
                )
    return bug_data_by_run, edge_data_by_target
# Reads byte differentials from the given differentials directory and gives them back in a list
def read_byte_differentials(
    differentials_folder: PosixPath,
) -> list[bytes]:
    """Read every differential file in *differentials_folder*.

    Args:
        differentials_folder: Directory whose files each hold one byte
            differential exported by a fuzzer run.

    Returns:
        The raw contents of each file, in directory-listing order
        (which is arbitrary, as with ``os.listdir``).
    """
    # pathlib handles listing, joining, opening, and reading in one pass,
    # replacing the os.listdir + joinpath + open/read boilerplate.
    return [entry.read_bytes() for entry in differentials_folder.iterdir()]
# Takes a list of byte differentials and returns a dictionary of all the trace fingerprints these byte differentials result in.
# The dictionary maps each found fingerprint to a byte differential example.
def trace_byte_differentials(byte_differentials: list[bytes]) -> dict[fingerprint_t, bytes]:
    """Trace the given differentials and map each fingerprint to one example.

    Args:
        byte_differentials: Raw inputs to trace through the targets.

    Returns:
        Mapping from each fingerprint produced by ``trace_batch`` to a byte
        differential that exhibits it (later duplicates overwrite earlier
        ones, so exactly one example survives per fingerprint).

    Raises:
        ValueError: if the scratch run directory already exists.
    """
    # Use pathlib predicates/mkdir instead of os.path.exists/os.mkdir.
    if RUN_DIR.exists():
        raise ValueError(f"Run directory already exists! Please delete {RUN_DIR.resolve()}")
    RUN_DIR.mkdir()
    try:
        fingerprints: list[fingerprint_t] = trace_batch(RUN_DIR, byte_differentials)
    finally:
        # Best-effort cleanup even if tracing blew up.
        attempt(shutil.rmtree, f"Failed to cleanup the run directory at {RUN_DIR}", RUN_DIR)
    # trace_batch returns one fingerprint per input, in order, so zip pairs
    # each fingerprint with the differential that produced it.
    return dict(zip(fingerprints, byte_differentials))
def build_overlap_report(
    uuids_to_names: dict[str, str],
    machine_file_path: PosixPath,
) -> None:
    """Report how many bugs each combination of runs has in common.

    Traces every run's differentials, then for every non-empty subset of the
    runs (largest subsets first) counts the trace fingerprints shared by all
    runs in the subset. Writes a CSV to *machine_file_path* and a
    human-readable listing (with one example input per shared bug) to stderr.
    """
    run_differentials: dict[str, dict[fingerprint_t, bytes]] = {}
    for run_uuid in uuids_to_names:
        byte_differentials: list[bytes] = read_byte_differentials(RESULTS_DIR.joinpath(run_uuid))
        run_differentials[run_uuid] = trace_byte_differentials(byte_differentials)
    # Get list of combos from big to small (all-runs combo first, singletons last).
    combos_list: list[list[str]] = list(
        list(combo)
        for i in range(len(uuids_to_names), 0, -1)
        for combo in itertools.combinations(uuids_to_names.keys(), i)
    )
    combo_name_to_traces: dict[str, set[fingerprint_t]] = {}
    for combo in combos_list:
        # Save combo name before editing combo -- the pop() below mutates it.
        combo_name: str = "/".join(uuids_to_names[run_uuid] for run_uuid in combo)
        # For each combo build list of common bugs: seed with one run's
        # fingerprints, then intersect with each remaining run's set.
        common_traces: set[fingerprint_t] = set(run_differentials[combo.pop()].keys())
        for run_uuid in combo:
            common_traces = common_traces.intersection(run_differentials[run_uuid].keys())
        combo_name_to_traces[combo_name] = common_traces
    # Write to the machine readable file (binary mode + latin-1 keeps the
    # output byte-exact regardless of locale).
    with open(machine_file_path, "wb") as machine_file:
        machine_file.write("Included runs,Common bug count\n".encode("latin-1"))
        machine_file.write(
            "\n".join(
                f"{combo_name},{len(common_traces)}"
                for combo_name, common_traces in combo_name_to_traces.items()
            ).encode("latin-1")
        )
    # Choose examples for every trace; later runs overwrite earlier ones, so
    # one arbitrary example survives per fingerprint.
    trace_examples: dict[fingerprint_t, bytes] = {}
    for traces_to_bytes in run_differentials.values():
        for trace in traces_to_bytes:
            trace_examples[trace] = traces_to_bytes[trace]
    # Write to the stderr file in a readable format
    for combo_name, common_traces in combo_name_to_traces.items():
        print("-------------------------------------------", file=sys.stderr)
        print(combo_name, file=sys.stderr)
        print("Total: " + str(len(common_traces)), file=sys.stderr)
        print("-------------------------------------------", file=sys.stderr)
        # Find an example for each trace common between the runs.
        # str(bytes)[2:-1] strips the b'...' wrapper, leaving the escaped repr.
        common_examples: list[str] = list(str(trace_examples[trace])[2:-1] for trace in common_traces)
        # Sort examples and print them
        for example in sorted(common_examples):
            print(example, file=sys.stderr)
def build_edge_graphs(
    analysis_name: str,
    uuids_to_names: dict[str, str],
    analysis_dir: PosixPath,
    edge_data: dict[str, dict[str, list[EdgeCountSnapshot]]],
) -> None:
    """Plot edge coverage over time and over generations for each target.

    Writes one ``edges_<target>.png`` per target into *analysis_dir*, with a
    line per run; lines are labelled by run name via the figure legend.
    """
    for target_name, runs in edge_data.items():
        figure, (time_axis, generation_axis) = plt.subplots(2, 1, constrained_layout=True)
        figure.suptitle(f"{analysis_name} - {target_name}", fontsize=16)
        time_axis.set_xlabel("Time (s)")
        time_axis.set_ylabel("Edges")
        generation_axis.set_xlabel("Generations")
        generation_axis.set_ylabel("Edges")
        for run_uuid, snapshots in runs.items():
            # Hoist the shared y-values; both subplots use the same counts.
            edge_counts = np.array([snap.edge_count for snap in snapshots])
            time_axis.plot(
                np.array([snap.time for snap in snapshots]),
                edge_counts,
                label=uuids_to_names[run_uuid],
            )
            generation_axis.plot(
                np.array([snap.generation for snap in snapshots]),
                edge_counts,
            )
        figure.legend(loc="upper left")
        plt.savefig(analysis_dir.joinpath(f"edges_{target_name}").with_suffix(".png"), format="png")
        plt.close()
# Plot a run onto a given axis
def plot_bugs(run_name: str, differentials: list[BugCount], axis: np.ndarray) -> None:
    """Draw one run's cumulative bug counts onto the two subplots in *axis*.

    ``axis[0]`` gets bugs-vs-time (labelled with *run_name* for the legend);
    ``axis[1]`` gets bugs-vs-generation.
    """
    times = np.array([entry.time for entry in differentials])
    generations = np.array([entry.generation for entry in differentials])
    counts = np.array([entry.bug_count for entry in differentials])
    time_axis, generation_axis = axis[0], axis[1]
    time_axis.plot(times, counts, label=run_name)
    time_axis.set_xlabel("Time (s)")
    time_axis.set_ylabel("Bugs")
    generation_axis.plot(generations, counts)
    generation_axis.set_xlabel("Generations")
    generation_axis.set_ylabel("Bugs")
def build_bug_graph(
    analysis_name: str,
    uuids_to_names: dict[str, str],
    analysis_dir: PosixPath,
    bug_data: dict[str, list[BugCount]],
) -> None:
    """Write ``bug_graph.png``: cumulative bugs vs time and vs generation.

    Plots every run onto a shared pair of subplots and labels them via the
    figure legend.
    """
    fig, subplots = plt.subplots(2, 1, constrained_layout=True)
    fig.suptitle(analysis_name, fontsize=16)
    for uuid_str, display_name in uuids_to_names.items():
        plot_bugs(display_name, bug_data[uuid_str], subplots)
    fig.legend(loc="upper left")
    output_path = analysis_dir.joinpath("bug_graph").with_suffix(".png")
    plt.savefig(output_path, format="png")
    plt.close()
# Dataclass for holding information about runs in the queue.
@dataclasses.dataclass
class QueuedRun:
    """A fuzzer run waiting to be executed.

    Parsed from one CSV line of the queue file: a user-defined name, the git
    commit to check out, a timeout in seconds, and the config file to install
    for the run (defaults to the saved copy of the current config).
    """

    # User-defined display name for this run.
    name: str
    # Git commit hash (or ref) to check out before running.
    commit: str
    # Per-run time budget in seconds, enforced via timeout(1).
    timeout: int
    # Config file copied over config.py for the duration of the run.
    config_file: PosixPath
def retrieve_queued_runs(queue_file_path: PosixPath) -> list[QueuedRun]:
    """Parse the queue file into a list of QueuedRun entries.

    Each non-blank line is CSV: ``name,commit,timeout[,config_path]``. When
    no config path is given, the saved copy of the current config is used.

    Args:
        queue_file_path: Path to the ASCII queue file.

    Returns:
        The queued runs, in file order.

    Raises:
        AssertionError: on a malformed line, a missing config file, or a
            config path that aliases the live config file.
        ValueError: if a timeout field is not an integer.
    """
    queued_runs: list[QueuedRun] = []
    # Read queue file and check validity
    with open(queue_file_path, "r", encoding="ascii") as queue_file:
        for line in queue_file:
            stripped = line.strip()
            if not stripped:
                # Tolerate blank lines (e.g. a trailing newline at EOF),
                # which previously tripped the field-count assert.
                continue
            fields = stripped.split(",")
            assert len(fields) in (3, 4)
            name: str = fields[0]
            commit_hash: str = fields[1]
            timeout: int = int(fields[2])
            config_file: PosixPath = (
                PosixPath(fields[3]).resolve() if len(fields) == 4 else CONFIG_COPY_PATH
            )
            assert config_file.is_file()
            # Never point a run at the live config file -- it is overwritten
            # for every run, which would corrupt the queued configuration.
            assert config_file != CONFIG_FILE_PATH
            queued_runs.append(QueuedRun(name, commit_hash, timeout, config_file))
    return queued_runs
def execute_runs(queued_runs: list[QueuedRun]) -> dict[str, str]:
    """Execute each queued run and return a map of run UUID -> run name.

    For each run: checks out the requested commit, installs the run's config
    over the live config file, and launches ``diff_fuzz.py`` under timeout(1).
    The fuzzer's run UUID is read from its stdout. Afterwards, the original
    config and git branch are restored on a best-effort basis even if a run
    fails.
    """
    # Save original branch so we can switch back after the runs.
    original_branch: bytes = subprocess.run(
        ["git", "branch", "--show-current"], capture_output=True, check=True
    ).stdout.strip()
    uuids_to_names: dict[str, str] = {}
    # Execute queued runs
    try:
        for queued_run in queued_runs:
            subprocess.run(["git", "checkout", queued_run.commit], check=True)
            shutil.copyfile(queued_run.config_file, CONFIG_FILE_PATH)
            # timeout(1) delivers SIGINT after the run's time budget so the
            # fuzzer can shut down cleanly; --preserve-status keeps the
            # fuzzer's own exit code for the check=True below. The fuzzer
            # prints its run UUID on stdout, which keys the result map.
            uuids_to_names[
                subprocess.run(
                    [
                        "timeout",
                        "--foreground",
                        "--signal=2",  # SIGINT
                        "--preserve-status",
                        str(queued_run.timeout),
                        "python",
                        "diff_fuzz.py",
                    ],
                    capture_output=True,
                    check=True,
                )
                .stdout.decode("ascii")
                .strip()
            ] = queued_run.name
    finally:
        # Cleanup (best-effort): restore the saved config, delete the copy,
        # and return to the branch we started on.
        attempt(shutil.copyfile, "Failed to restore config file.", CONFIG_COPY_PATH, CONFIG_FILE_PATH)
        attempt(os.remove, f"Failed to remove {CONFIG_COPY_PATH}.", CONFIG_COPY_PATH)
        attempt(
            subprocess.run,
            "Failed to return to original branch.",
            ["git", "switch", original_branch],
            capture_output=True,
            check=True,
        )
    return uuids_to_names
def main() -> None:
    """Entry point: run queued fuzzing runs and produce the requested analyses.

    Reads a queue file of runs, executes each one, parses the resulting
    reports, and writes the selected graphs/reports into a fresh
    UUID-named directory under the analyses folder.
    """
    assert RESULTS_DIR.is_dir()
    assert ANALYSES_DIR.is_dir()
    assert REPORTS_DIR.is_dir()
    assert CONFIG_COPY_PATH != CONFIG_FILE_PATH
    # Retrieve arguments
    parser: argparse.ArgumentParser = argparse.ArgumentParser()
    parser.add_argument("name", help="The name of the analysis to put on the graphs")
    parser.add_argument(
        "queue_file_path", help="The path to the queue file to take runs from for the analysis"
    )
    parser.add_argument("--bug-count", help="Enable creation of bug count plot", action="store_true")
    parser.add_argument("--bug-overlap", help="Enable creation of bug overlap reports", action="store_true")
    parser.add_argument("--edge-count", help="Enable creation of edge count plot", action="store_true")
    args: argparse.Namespace = parser.parse_args()
    # Ensure at least one option is enabled
    if not any((args.bug_count, args.edge_count, args.bug_overlap)):
        raise ValueError("At least one of --bug-count, --bug-overlap, --edge-count must be passed.")
    # Copy the original config BEFORE anything else touches it: queued runs
    # default their config to this copy, and execute_runs restores from it.
    assert os.path.isfile(CONFIG_FILE_PATH)
    shutil.copyfile(CONFIG_FILE_PATH, CONFIG_COPY_PATH)
    # Check that queue file exists and get queued runs
    queue_file_path = PosixPath(args.queue_file_path).resolve()
    assert os.path.isfile(queue_file_path)
    queued_runs: list[QueuedRun] = retrieve_queued_runs(queue_file_path)
    # Run!
    uuids_to_names: dict[str, str] = execute_runs(queued_runs)
    # Parse and assert data
    for run_uuid, run_name in uuids_to_names.items():
        check_fuzz_output(run_name, run_uuid)
    try:
        bug_data, edge_data = parse_reports(uuids_to_names)
    except AssertionError as e:
        # parse_reports validates report structure with asserts; surface a
        # friendlier error while chaining the original cause.
        raise ValueError("One of the report JSON files cannot be parsed.") from e
    # Generate analysis uuid and a fresh output directory for this analysis.
    analysis_uuid: str = str(uuid.uuid4())
    analysis_dir: PosixPath = ANALYSES_DIR.joinpath(analysis_uuid)
    os.mkdir(analysis_dir)
    if args.bug_count:
        build_bug_graph(args.name, uuids_to_names, analysis_dir, bug_data)
    if args.edge_count:
        build_edge_graphs(args.name, uuids_to_names, analysis_dir, edge_data)
    if args.bug_overlap:
        build_overlap_report(
            uuids_to_names,
            analysis_dir.joinpath("overlap_machine").with_suffix(".csv"),
        )
    print(f"Analysis done! See {analysis_dir.resolve()} for results")


if __name__ == "__main__":
    main()