; config_ma2c_nc_slowdown.ini
; Configuration for the ma2c_nc agent on the cacc_slowdown scenario.
[MODEL_CONFIG]
; Hyperparameters for the learning model. The meanings noted below are
; inferred from the key names only -- TODO confirm against the code that
; reads this section.
; presumably the RMSProp smoothing constant and numerical-stability epsilon
rmsp_alpha = 0.99
rmsp_epsilon = 1e-5
; presumably the gradient-norm clipping threshold
max_grad_norm = 40
; presumably the reward discount factor
gamma = 0.99
; presumably the initial learning rate, held fixed by the constant decay mode
lr_init = 5e-4
lr_decay = constant
; presumably the weights of the entropy and value terms in the training loss
entropy_coef = 0.05
value_coef = 0.5
; presumably the LSTM and fully connected layer sizes
num_lstm = 64
num_fc = 64
; NOTE(review): same value as batch_size in [ENV_CONFIG]; presumably the two
; must be kept in sync -- confirm
batch_size = 60
; The same node may be updated by ~8 propagations,
; so adjust the reward normalization accordingly.
; NOTE(review): the ~8 presumably tracks n_vehicle in [ENV_CONFIG] -- confirm
reward_norm = 5000.0
; NOTE(review): -1 looks like a "disabled" sentinel for reward clipping -- confirm
reward_clip = -1
[TRAIN_CONFIG]
; Training schedule. Values are written in scientific notation, so the
; reader must accept float syntax such as 1e6.
; NOTE(review): test_interval (1e7) is larger than total_step (1e6). If both
; count the same kind of step, no test would trigger during training --
; confirm this is the intended way to disable in-training testing.
total_step = 1e6
test_interval = 1e7
log_interval = 1e4
[ENV_CONFIG]
; Environment settings for the cacc_slowdown scenario.
; Timing, in seconds per the _sec suffix: 60 / 0.1 gives 600 control
; intervals per episode.
control_interval_sec = 0.1
episode_length_sec = 60
agent = ma2c_nc
; NOTE(review): same value as batch_size in [MODEL_CONFIG]; presumably the two
; must be kept in sync -- confirm
batch_size = 60
; NOTE(review): -1 looks like a "disabled" sentinel -- confirm
coop_gamma = -1
; constraints
; NOTE(review): units are not stated; presumably m for headway, m/s for speed
; and m/s^2 for acceleration -- confirm
headway_min = 1
headway_st = 5
headway_go = 35
speed_max = 30
; acceleration bounds are symmetric around zero
accel_max = 2.5
accel_min = -2.5
; reward
; NOTE(review): reward_v and reward_u are presumably weights on the speed and
; control terms of the reward -- confirm
reward_v = 1
reward_u = 0.1
collision_penalty = 1000
headway_target = 20
speed_target = 15
; each normalization constant is half of the corresponding target above
norm_headway = 10
norm_speed = 7.5
n_vehicle = 8
scenario = cacc_slowdown
; seed is presumably the training random seed; test_seeds holds a single value
; here -- NOTE(review): confirm whether the reader accepts a list
seed = 12
test_seeds = 10000