# ppo_test.yaml
# Forked from edbeeching/godot_rl_agents.
# PPO training run against the `godot` environment.
#
# NOTE(review): the nesting below was reconstructed from a copy in which all
# indentation had been lost. Section membership follows the key names; the two
# placements that could not be established from the text alone are flagged
# inline and should be confirmed against the code that loads this file.
algorithm: PPO

# Stopping criteria for the run.
# NOTE(review): presumably training halts as soon as any one of these is
# reached — confirm against the trainer that consumes this section.
stop:
  episode_reward_mean: 5000
  training_iteration: 1000
  timesteps_total: 200000000

# Settings handed to the algorithm named above.
config:
  env: godot

  # Options for the environment itself. `null` leaves the value unset here.
  env_config:
    framerate: null
    action_repeat: null
    show_window: false
    # NOTE(review): assumed to be the environment's seed because it directly
    # follows the other environment options; if the algorithm-level seed was
    # intended, move this key one level up under `config`.
    seed: 0

  framework: torch
  lambda: 0.95
  gamma: 0.95

  vf_clip_param: 1.0
  clip_param: 0.2
  entropy_coeff: 0.001
  entropy_coeff_schedule: null
  train_batch_size: 1024
  sgd_minibatch_size: 128
  num_sgd_iter: 16
  num_workers: 4
  lr: 0.0003
  num_envs_per_worker: 16
  batch_mode: truncate_episodes
  rollout_fragment_length: 16
  num_gpus: 1

  # Network settings.
  model:
    fcnet_hiddens: [256, 256]
    use_lstm: false
    lstm_cell_size: 32
    # NOTE(review): assumed to be a model option because it follows the other
    # model keys — confirm it is not meant to sit directly under `config`.
    framestack: 4

  no_done_at_end: false
  soft_horizon: false