-
Notifications
You must be signed in to change notification settings - Fork 260
/
run_benchmark.sh
executable file
·112 lines (81 loc) · 2.27 KB
/
run_benchmark.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
#!/usr/bin/python3.9
# Copyright (c) Microsoft Corporation.
# Licensed under the MIT License.
# Run all notebooks fully to produce publishable benchmark results
# and reusable notebooks
set -ex
kernel=$1
if [ -z "$kernel" ]; then
kernel=cybersim
fi
script_dir=$(dirname "$0")
pushd "$script_dir/.."
output_dir=notebooks/output/benchmark
output_plot_dir=$output_dir/plots
run () {
base=$1
suffix=$2
cat notebook notebooks/$base.py \
| jupytext --to ipynb - \
| papermill --kernel $kernel $output_dir/$base$suffix.ipynb "${@:3}"
}
jupyter kernelspec list
mkdir $output_dir -p
mkdir $output_plot_dir -p
# run c2_interactive_interface '' # disabled: not deterministic and can fail
# run random_active_directory '' # disabled: not deterministic and can fail
# run notebook_dql_debug.py ''
run toyctf-blank ''
run toyctf-random ''
run toyctf-solved ''
run chainnetwork-optionwrapper ''
run chainnetwork-random '' -y "
iterations: 100
"
run randomnetwork ''
run notebook_benchmark '-chain' -y "
gymid: 'CyberBattleChain-v0'
iteration_count: 2000 # iteration_count = 9000
training_episode_count: 20 # training_episode_count = 50
eval_episode_count: 3 # eval_episode_count = 5
maximum_node_count: 20 # maximum_node_count = 22
maximum_total_credentials: 20 # maximum_total_credentials = 22
env_size: 10
plots_dir: $output_plot_dir
"
run notebook_benchmark '-toyctf' -y "
gymid: 'CyberBattleToyCtf-v0'
env_size: null
iteration_count: 1500
training_episode_count: 20
eval_episode_count: 10
maximum_node_count: 12
maximum_total_credentials: 10
plots_dir: $output_plot_dir
"
run notebook_benchmark '-tiny' -y "
gymid: 'CyberBattleTiny-v0'
env_size: null
iteration_count: 200
training_episode_count: 10
eval_episode_count: 10
maximum_node_count: 5
maximum_total_credentials: 3
plots_dir: $output_plot_dir
"
run notebook_dql_transfer '' -y "
plots_dir: $output_plot_dir
"
run notebook_randlookups '' -y "
plots_dir: $output_plot_dir
"
run notebook_tabularq '' -y "
plots_dir: $output_plot_dir
"
run notebook_withdefender '' -y "
plots_dir: $output_plot_dir
"
run dql_active_directory '' -y "
iteration_count: 50
"
popd