-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathloo_dmc.sh
executable file
·54 lines (48 loc) · 3.38 KB
/
loo_dmc.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
timesteps=50000000
env_id="AcrobotSwingup-v1 AcrobotSwingupSparse-v1 BallInCupCatch-v1 CartpoleBalance-v1 CartpoleBalanceSparse-v1 CartpoleSwingup-v1 CartpoleSwingupSparse-v1 CartpoleThreePoles-v1 CartpoleTwoPoles-v1 CheetahRun-v1 FingerSpin-v1 FingerTurnEasy-v1 FingerTurnHard-v1 FishSwim-v1 FishUpright-v1 HopperHop-v1 HopperStand-v1 HumanoidRun-v1 HumanoidRunPureState-v1 HumanoidStand-v1 HumanoidWalk-v1 HumanoidCMURun-v1 HumanoidCMUStand-v1 ManipulatorBringBall-v1 ManipulatorBringPeg-v1 ManipulatorInsertBall-v1 ManipulatorInsertPeg-v1 PendulumSwingup-v1 PointMassEasy-v1 PointMassHard-v1 ReacherEasy-v1 ReacherHard-v1 SwimmerSwimmer6-v1 SwimmerSwimmer15-v1 WalkerRun-v1 WalkerStand-v1 WalkerWalk-v1"
seeds=3
workers=1000
gittag=$(git describe --tags)
for (( startseed=1; startseed<=$seeds; startseed++ ))
do
poetry run python -m cleanrl_utils.benchmark \
--env-ids $env_id \
--command "poetry run python ppo_v3/ppo_envpool_tricks_dmc.py --exp-name ppo_envpool_tricks_FINAL_loo --num-envs 128 --symlog True --two-hot True --percentile-scale True --percentile-ema-rate 0.999 --critic-ema True --critic-zero-init True --total-timesteps $timesteps --track" \
--start-seed $startseed \
--num-seeds 1 \
--workers $workers \
--slurm-gpus-per-task 1 \
--slurm-template-path ppov3.slurm_template
poetry run python -m cleanrl_utils.benchmark \
--env-ids $env_id \
--command "poetry run python ppo_v3/ppo_envpool_tricks_dmc.py --exp-name ppo_envpool_tricks_FINAL_loo_symlog --num-envs 128 --two-hot True --two-hot-range 1000 --percentile-scale True --percentile-ema-rate 0.999 --critic-ema True --critic-zero-init True --total-timesteps $timesteps --track" \
--start-seed $startseed \
--num-seeds 1 \
--workers $workers \
--slurm-gpus-per-task 1 \
--slurm-template-path ppov3.slurm_template
poetry run python -m cleanrl_utils.benchmark \
--env-ids $env_id \
--command "poetry run python ppo_v3/ppo_envpool_tricks_dmc.py --exp-name ppo_envpool_tricks_FINAL_loo_twohot --num-envs 128 --symlog True --percentile-scale True --percentile-ema-rate 0.999 --critic-ema True --total-timesteps $timesteps --track" \
--start-seed $startseed \
--num-seeds 1 \
--workers $workers \
--slurm-gpus-per-task 1 \
--slurm-template-path ppov3.slurm_template
poetry run python -m cleanrl_utils.benchmark \
--env-ids $env_id \
--command "poetry run python ppo_v3/ppo_envpool_tricks_dmc.py --exp-name ppo_envpool_tricks_FINAL_loo_percentile --num-envs 128 --symlog True --two-hot True --critic-ema True --critic-zero-init True --total-timesteps $timesteps --track" \
--start-seed $startseed \
--num-seeds 1 \
--workers $workers \
--slurm-gpus-per-task 1 \
--slurm-template-path ppov3.slurm_template
poetry run python -m cleanrl_utils.benchmark \
--env-ids $env_id \
--command "poetry run python ppo_v3/ppo_envpool_tricks_dmc.py --exp-name ppo_envpool_tricks_FINAL_loo_criticema --num-envs 128 --symlog True --two-hot True --percentile-scale True --percentile-ema-rate 0.99 --critic-zero-init True --total-timesteps $timesteps --track" \
--start-seed $startseed \
--num-seeds 1 \
--workers $workers \
--slurm-gpus-per-task 1 \
--slurm-template-path ppov3.slurm_template
done