forked from 32af3611/acrl
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathopt_conf.json
44 lines (44 loc) · 1.45 KB
/
opt_conf.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
{
  "DATA_SOURCE_DIRECTORIES": [
    "data/cfd"
  ],
  "TRAINING_LABEL": "training",
  "TRAINING_REWARD_MODEL_ID": "models/default",
  "TRAINING_REWARD_HIDDEN_SIZES": [1024, 1024],
  "TRAINING_REWARD_BATCH_SIZE": 64,
  "TRAINING_REWARD_LR": 1e-3,
  "TRAINING_REWARD_GAMMA": 0.9999,
  "TRAINING_REWARD_TYPE": ["d_drag"],
  "TRAINING_REWARD_USE_CUMULATIVE_REWARD": true,
  "TRAINING_AGENT_MODEL_ID": null,
  "TRAINING_AGENT_N_TOTAL_EPISODES": 300000,
  "TRAINING_AGENT_N_EXPLORATION_EPISODES": 50000,
  "TRAINING_AGENT_N_STEPS_PER_EPISODE": 30,
  "TRAINING_AGENT_WARMUP_STEPS": 1000,
  "TRAINING_AGENT_LOG_FREQUENCY": 1000,
  "TRAINING_AGENT_EPSILON_START": 0.5,
  "TRAINING_AGENT_EPSILON_END": 0.0,
  "TRAINING_AGENT_GAMMA": 1.0,
  "TRAINING_AGENT_BATCH_SIZE": 64,
  "TRAINING_AGENT_SYNC_FREQUENCY": 10,
  "TRAINING_AGENT_REPLAY_BUFFER_SIZE": 50000,
  "TRAINING_AGENT_HIDDEN_SIZES": [512, 512, 512],
  "TRAINING_AGENT_OPTIMIZER": {
    "name": "rmsprop",
    "momentum": 0.0
  },
  "TRAINING_AGENT_LR_MIN": 1e-5,
  "TRAINING_AGENT_LR_MAX": null,
  "TRAINING_AGENT_LR_CYCLE": 1000,
  "TRAINING_AGENT_LR_DECAY": 0.99999,
  "TRAINING_AGENT_ACTION_STOP_NULL": false,
  "TRAINING_AGENT_ACTION_CONFIG": {
    "type": "additive",
    "magnitudes": [1e-3],
    "use_null_action": true
  },
  "TRAINING_AGENT_MEAN_CONFIG": {
    "min": 1.9e-3,
    "max": 2.1e-3
  },
  "TRAINING_RETRAINING_FREQUENCY": 10000,
  "TRAINING_RESAMPLING_FREQUENCY": 100,
  "TRAINING_RESAMPLING_OUTPUT_PREFIX": "resampling"
}