forked from cts198859/deeprl_network
-
Notifications
You must be signed in to change notification settings - Fork 0
/
config_ia2c_grid.ini
43 lines (41 loc) · 944 Bytes
/
config_ia2c_grid.ini
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
; Model and optimizer hyperparameters.
; NOTE(review): the rmsp_* keys presumably configure an RMSProp optimizer
; (decay and epsilon) - confirm against the code that reads this section.
[MODEL_CONFIG]
rmsp_alpha = 0.99
rmsp_epsilon = 1e-5
max_grad_norm = 40
gamma = 0.99
lr_init = 5e-4
; lr_decay is a schedule name, not a number; other accepted names are not
; listed in this file - check the reader before changing it.
lr_decay = constant
entropy_coef = 0.01
value_coef = 0.5
num_lstm = 64
num_fc = 64
batch_size = 120
reward_norm = 100.0
; NOTE(review): -1 presumably means "no reward clipping" - confirm.
reward_clip = -1
; Training-loop schedule.
; Values are written in scientific notation, so an integer-only parse
; (e.g. configparser getint) would reject them; the reader must parse them
; as floats first.
[TRAIN_CONFIG]
total_step = 1e6
; NOTE(review): test_interval (2e6) is larger than total_step (1e6), so a
; periodic test would presumably never trigger during training - confirm
; this is intentional.
test_interval = 2e6
log_interval = 1e4
; Environment / scenario settings.
; Keys ending in _sec are presumably expressed in seconds - confirm against
; the environment code.
[ENV_CONFIG]
clip_wave = 2.0
; NOTE(review): -1 presumably disables clipping of the wait measurement - confirm.
clip_wait = -1
control_interval_sec = 5
; agent is one of: greedy, ia2c, ia2c_fp, ma2c_som, ma2c_ic3, ma2c_nc.
agent = ia2c
; coop_gamma is the discount applied to the neighbors' impact.
coop_gamma = 0.9
; Relative path; presumably resolved against the process working directory.
data_path = ./envs/large_grid_data/
episode_length_sec = 3600
; The normalization constants are based on typical values observed in simulation.
norm_wave = 5.0
; NOTE(review): -1 presumably means the wait measurement is not normalized - confirm.
norm_wait = -1
coef_wait = 0
peak_flow1 = 1100
peak_flow2 = 925
init_density = 0
; objective is one of: queue, wait, hybrid.
objective = queue
scenario = atsc_large_grid
seed = 12
; Comma-separated list of ten seeds, no spaces; the reader is expected to
; split on ','.
test_seeds = 10000,20000,30000,40000,50000,60000,70000,80000,90000,100000
yellow_interval_sec = 2