-
Notifications
You must be signed in to change notification settings - Fork 14
/
Copy pathexec.sh
94 lines (86 loc) · 2.66 KB
/
exec.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
#!/bin/bash
# Environment name lists used by the loops further down in this script.
# Each list is a single string holding one name per line; the loops expand
# the variables unquoted so that every line turns into one loop item.
# All four lists are exported at the end of this section, which also places
# them in the environment of any child process started by this script.

gym_envs="
CartPole-v1
Pendulum-v1
Acrobot-v1
MountainCar-v0
MountainCarContinuous-v0
"

# NOTE: Seaquest-MinAtar is intentionally not part of this list (it was
# commented out in the original list).
minatar_envs="
Asterix-MinAtar
Breakout-MinAtar
Freeway-MinAtar
SpaceInvaders-MinAtar
"

bsuite_envs="
Catch-bsuite
DeepSea-bsuite
MemoryChain-bsuite
UmbrellaChain-bsuite
DiscountingChain-bsuite
MNISTBandit-bsuite
SimpleBandit-bsuite
"

misc_envs="
FourRooms-misc
MetaMaze-misc
PointRobot-misc
BernoulliBandit-misc
GaussianBandit-misc
"

export gym_envs minatar_envs bsuite_envs misc_envs
#######################################
# Run speed.py for a single environment over the fixed flag combinations.
# For n_envs 10 and 40 it runs with and without -net (optionally preceded
# by the same pair with -np); for n_envs 2000 it runs the -gpu and
# -gpu -a100 variants, each with and without -net.
# Arguments:
#   $1 - environment name, forwarded to speed.py via -env
#   $2 - "np" to additionally run the -np variants; omitted/other skips them
# Returns:
#   status of the last speed.py invocation
#######################################
run_speed_suite() {
  local env_name=$1
  local np_mode=${2:-}
  local n_envs

  for n_envs in 10 40; do
    if [[ "$np_mode" == "np" ]]; then
      python speed.py -env "$env_name" -np -n_envs "$n_envs"
      python speed.py -env "$env_name" -np -n_envs "$n_envs" -net
    fi
    python speed.py -env "$env_name" -n_envs "$n_envs"
    python speed.py -env "$env_name" -n_envs "$n_envs" -net
  done

  python speed.py -env "$env_name" -n_envs 2000 -gpu
  python speed.py -env "$env_name" -n_envs 2000 -net -gpu
  python speed.py -env "$env_name" -n_envs 2000 -gpu -a100
  python speed.py -env "$env_name" -n_envs 2000 -net -gpu -a100
}

#######################################
# Dispatch on the requested mode and loop over the environment lists.
# Globals:
#   gym_envs, minatar_envs, bsuite_envs, misc_envs (read) - whitespace
#   separated environment names
# Arguments:
#   $1 - mode: "speed", "train" or "visualize"
# Outputs:
#   an error and usage message on stderr when the mode is not recognised
# Returns:
#   status of the last python command for a valid mode, 2 otherwise
#######################################
main() {
  local mode=${1:-}
  local env_name

  # The environment lists are plain strings with one name per line, so the
  # unquoted expansions below rely on word splitting on purpose.
  # shellcheck disable=SC2086
  case "$mode" in
    speed)
      # Loop over environments and estimate runtime speed
      for env_name in $minatar_envs $gym_envs; do
        run_speed_suite "$env_name" np
      done
      for env_name in $bsuite_envs $misc_envs; do
        run_speed_suite "$env_name"
      done
      # TODO: Add bsuite numpy evaluation
      # TODO: Add V100S results and TPU evaluation
      ;;
    train)
      # Loop over environments and train agents with PPO/ES
      for env_name in $gym_envs $minatar_envs $bsuite_envs; do
        python train.py -config "agents/$env_name/ppo.yaml" --lrate 1e-04
        python train.py -config "agents/$env_name/ppo.yaml" --lrate 1e-03
        python train.py -config "agents/$env_name/ppo.yaml"
        python train.py -config "agents/$env_name/es.yaml"
      done
      # NOTE(review): this loop reads from configs/ while the loop above
      # reads from agents/ -- confirm which directory holds the misc configs.
      for env_name in $misc_envs; do
        python train.py -config "configs/$env_name/es.yaml"
      done
      ;;
    visualize)
      # Loop over environments and visualize trained PPO agent
      for env_name in $gym_envs $minatar_envs; do
        python visualize.py -env "$env_name" -train ppo
      done
      ;;
    *)
      # Diagnostics belong on stderr, and a bad invocation must not look
      # like success to the caller.
      printf '%s\n' "Provide valid argument to bash script" >&2
      printf 'Usage: %s {speed|train|visualize}\n' "${0##*/}" >&2
      return 2
      ;;
  esac
}

# Final command of the script: its status becomes the script's exit status.
main "$@"