-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathtrain_all.sh
executable file
·97 lines (89 loc) · 19.7 KB
/
train_all.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
#!/bin/bash
#
# train_all.sh - run the full sweep of train.py experiments, one after another.
#
# For every environment listed in ENV_SPECS this runs, in order:
#   1. td3
#   2. acemrl   (actor + critic workers)
#   3. opo      (actor + critic workers)
#   4. cemrl
#   5. pcemrl   (actor workers only)
#   6. pcemrl   (actor + critic workers, --parallel_critic)
#   7. aesrl    for each --aesrl_var_update in (adaptive, fixed) and each
#               --aesrl_mean_update in (baseline-relative, baseline-absolute,
#               fixed-linear, fixed-sigmoid)
#
# Paths are relative, so start the script from the directory that contains
# train.py and config/.
#
# A failing run does not stop the sweep: the failure is reported on stderr,
# the remaining runs still execute, and the script exits non-zero at the end
# if any run failed.

set -u

readonly NUM_ACTOR_WORKER=5
readonly NUM_CRITIC_WORKER=1
readonly RAY_PORT=12345
readonly REDIS_PASSWORD=12345
readonly AESRL_FIXED_VAR_N=10

# One entry per environment, in run order:
#   "<config sub-directory>:<magnitude of --aesrl_mean_update_param>"
# Plain "name:value" strings are used instead of an associative array so the
# script also works with bash versions older than 4.
readonly ENV_SPECS=(
  halfcheetah-v2:2000
  ant-v2:960
  hopper-v2:2000
  humanoid-v2:960
  swimmer-v2:960
  walker2d-v2:960
)

# Address handed to every run as --ray_address.
# The sed script removes the literal 127.0.0.1 and then prints the IPv4
# address that follows "inet " (or "inet addr:") on each remaining line, so
# the output holds one address per non-loopback interface.
detected_ips=$(ifconfig | sed -En 's/127.0.0.1//;s/.*inet (addr:)?(([0-9]*\.){3}[0-9]*).*/\2/p')
# Keep only the first address: a multi-line value would otherwise be split
# into several command-line words.
myip=${detected_ips%%$'\n'*}
if [[ -z "$myip" ]]; then
  printf '%s: could not determine a non-loopback IPv4 address via ifconfig\n' \
    "${0##*/}" >&2
  exit 1
fi

failed_runs=0

#######################################
# Run one train.py experiment with the shared connection options appended.
# Globals:   myip, RAY_PORT, REDIS_PASSWORD (read); failed_runs (written)
# Arguments: the experiment-specific train.py options (--config ... etc.)
# Outputs:   on failure, one line on stderr naming the failed options
# Returns:   always 0, so the sweep continues after a failed run
#######################################
run_train() {
  if ! python train.py "$@" \
    --ray_address "$myip" --ray_port "$RAY_PORT" \
    --redis_password "$REDIS_PASSWORD"; then
    printf '%s: run failed: train.py %s\n' "${0##*/}" "$*" >&2
    failed_runs=$((failed_runs + 1))
  fi
  return 0
}

#######################################
# Run every algorithm variant for a single environment.
# Globals:   NUM_ACTOR_WORKER, NUM_CRITIC_WORKER, AESRL_FIXED_VAR_N (read)
# Arguments: $1 - environment name (sub-directory of config/)
#            $2 - positive magnitude of --aesrl_mean_update_param
#######################################
run_env() {
  local env_name=$1
  local mean_param=$2
  local cfg_dir="config/${env_name}"
  local -a actor_args=(--num_actor_worker "$NUM_ACTOR_WORKER")
  local -a worker_args=("${actor_args[@]}" --num_critic_worker "$NUM_CRITIC_WORKER")
  local var_update mean_update param
  local -a aesrl_args

  run_train --config "${cfg_dir}/td3.json"
  run_train --config "${cfg_dir}/acemrl.json" "${worker_args[@]}"
  run_train --config "${cfg_dir}/opo.json" "${worker_args[@]}"
  run_train --config "${cfg_dir}/cemrl.json"
  run_train --config "${cfg_dir}/pcemrl.json" "${actor_args[@]}"
  run_train --config "${cfg_dir}/pcemrl.json" "${worker_args[@]}" --parallel_critic

  for var_update in adaptive fixed; do
    for mean_update in baseline-relative baseline-absolute fixed-linear fixed-sigmoid; do
      # baseline-absolute is the only mean update run with a negated parameter.
      if [[ "$mean_update" == baseline-absolute ]]; then
        param="-${mean_param}"
      else
        param=$mean_param
      fi

      aesrl_args=(
        --config "${cfg_dir}/aesrl.json"
        "${worker_args[@]}"
        --aesrl_mean_update "$mean_update"
        --aesrl_var_update "$var_update"
        --aesrl_mean_update_param "$param"
      )
      # The fixed variance update additionally passes --aesrl_fixed_var_n.
      if [[ "$var_update" == fixed ]]; then
        aesrl_args+=(--aesrl_fixed_var_n "$AESRL_FIXED_VAR_N")
      fi
      run_train "${aesrl_args[@]}"
    done
  done
}

for env_spec in "${ENV_SPECS[@]}"; do
  # Split "name:param" at the (single) colon.
  run_env "${env_spec%%:*}" "${env_spec##*:}"
done

if ((failed_runs > 0)); then
  printf '%s: %d run(s) failed\n' "${0##*/}" "$failed_runs" >&2
  exit 1
fi