-
Notifications
You must be signed in to change notification settings - Fork 42
/
eval.sh
237 lines (191 loc) · 14.1 KB
/
eval.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
# Put the current working directory first on Python's module search path.
# The commands below use paths relative to it (scripts/..., results/...), so
# this file is presumably meant to be run from the repository root.
# The ':' separator is added only when PYTHONPATH already has a value; this
# avoids a dangling empty entry when it starts out unset or empty.
export PYTHONPATH="${PWD}${PYTHONPATH:+:${PYTHONPATH}}"
## Standard POMDP (occlusion benchmark)
# python scripts/merge_csv.py --base_path results/logs/pomdp/Pendulum/V \
# --max_episode_len 200 --start_x 2000 --interval_x 1000
# python scripts/plot_csv.py --csv_path results/data/pomdp/Pendulum/V/final.csv \
# --max_x 30000 --window_size 3 # don't forget to uncomment "Arch"
# python scripts/plot_diagnose.py --csv_path results/data/pomdp/Pendulum/V/final.csv \
# --max_x 50000 --window_size 3 --instances sac-lstm-200-oar-separate,sac-lstm-200-oar-shared
# python scripts/merge_csv.py --base_path results/logs/pomdp/AntBLT/P \
# --max_episode_len 1000 --start_x 12000 --interval_x 4000
# python scripts/plot_csv.py --csv_path results/data/pomdp/AntBLT/P/final.csv \
# --window_size 20 --max_x 1500000 --best_variant td3-gru-64-oa-separate --other_methods ppo_gru,a2c_gru,VRM \
# --name Ant-P
# python scripts/plot_single_factor.py --csv_path results/data/pomdp/AntBLT/P/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/pomdp/AntBLT/V \
# --max_episode_len 1000 --start_x 12000 --interval_x 4000
# python scripts/plot_csv.py --csv_path results/data/pomdp/AntBLT/V/final.csv \
# --window_size 20 --max_x 1500000 --best_variant td3-gru-64-oa-separate --other_methods ppo_gru,a2c_gru,VRM \
# --name Ant-V
# python scripts/plot_csv.py --csv_path results/data/pomdp/AntBLT/V/final.csv \
# --window_size 20 --max_x 500000 --best_variant td3-gru-64-oa-separate
# python scripts/plot_single_factor.py --csv_path results/data/pomdp/AntBLT/V/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/pomdp/HalfCheetahBLT/P \
# --max_episode_len 1000 --start_x 12000 --interval_x 4000
# python scripts/plot_csv.py --csv_path results/data/pomdp/HalfCheetahBLT/P/final.csv \
# --window_size 20 --max_x 1500000 --best_variant td3-gru-64-oa-separate --other_methods ppo_gru,a2c_gru,VRM \
# --name Cheetah-P
# python scripts/plot_csv.py --csv_path results/data/pomdp/HalfCheetahBLT/P/final.csv \
# --window_size 20 --max_x 500000 --best_variant td3-gru-64-oa-separate
# python scripts/plot_single_factor.py --csv_path results/data/pomdp/HalfCheetahBLT/P/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/pomdp/HalfCheetahBLT/V \
# --max_episode_len 1000 --start_x 12000 --interval_x 4000
# python scripts/plot_csv.py --csv_path results/data/pomdp/HalfCheetahBLT/V/final.csv \
# --window_size 20 --max_x 1500000 --best_variant td3-gru-64-oa-separate --other_methods ppo_gru,a2c_gru,VRM \
# --name Cheetah-V
# python scripts/plot_csv.py --csv_path results/data/pomdp/HalfCheetahBLT/V/final.csv \
# --window_size 20 --max_x 500000 --best_variant td3-gru-64-oa-separate
# python scripts/plot_single_factor.py --csv_path results/data/pomdp/HalfCheetahBLT/V/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/pomdp/HopperBLT/P \
# --max_episode_len 1000 --start_x 12000 --interval_x 4000
# python scripts/plot_csv.py --csv_path results/data/pomdp/HopperBLT/P/final.csv \
# --window_size 20 --max_x 1500000 --best_variant td3-gru-64-oa-separate --other_methods ppo_gru,a2c_gru,VRM \
# --name Hopper-P
# python scripts/plot_csv.py --csv_path results/data/pomdp/HopperBLT/P/final.csv \
# --window_size 20 --max_x 500000 --best_variant td3-gru-64-oa-separate
# python scripts/plot_single_factor.py --csv_path results/data/pomdp/HopperBLT/P/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/pomdp/HopperBLT/V \
# --max_episode_len 1000 --start_x 12000 --interval_x 4000
# python scripts/plot_csv.py --csv_path results/data/pomdp/HopperBLT/V/final.csv \
# --window_size 20 --max_x 1500000 --best_variant td3-gru-64-oa-separate --other_methods ppo_gru,a2c_gru,VRM \
# --name Hopper-V
# python scripts/plot_csv.py --csv_path results/data/pomdp/HopperBLT/V/final.csv \
# --window_size 20 --max_x 500000 --best_variant td3-gru-64-oa-separate
# python scripts/plot_single_factor.py --csv_path results/data/pomdp/HopperBLT/V/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/pomdp/WalkerBLT/P \
# --max_episode_len 1000 --start_x 12000 --interval_x 4000
# python scripts/plot_csv.py --csv_path results/data/pomdp/WalkerBLT/P/final.csv \
# --window_size 20 --max_x 1500000 --best_variant td3-gru-64-oa-separate --other_methods ppo_gru,a2c_gru,VRM \
# --name Walker-P
# python scripts/plot_csv.py --csv_path results/data/pomdp/WalkerBLT/P/final.csv \
# --window_size 20 --max_x 500000 --best_variant td3-gru-64-oa-separate
# python scripts/plot_single_factor.py --csv_path results/data/pomdp/WalkerBLT/P/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/pomdp/WalkerBLT/V \
# --max_episode_len 1000 --start_x 12000 --interval_x 4000
# python scripts/plot_csv.py --csv_path results/data/pomdp/WalkerBLT/V/final.csv \
# --window_size 20 --max_x 1500000 --best_variant td3-gru-64-oa-separate --other_methods ppo_gru,a2c_gru,VRM \
# --name Walker-V
# python scripts/plot_csv.py --csv_path results/data/pomdp/WalkerBLT/V/final.csv \
# --window_size 20 --max_x 500000 --best_variant td3-gru-64-oa-separate
# python scripts/plot_single_factor.py --csv_path results/data/pomdp/WalkerBLT/V/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
## Meta RL (off-policy varibad benchmark)
# python scripts/merge_csv.py --base_path results/logs/meta/HalfCheetahVel-v0 \
# --max_episode_len 400 --start_x 240000 --interval_x 40000
# python scripts/plot_csv.py --csv_path results/data/meta/HalfCheetahVel-v0/final.csv \
# --window_size 10 --max_x 20000000 --best_variant td3-lstm-64-oar-separate --other_methods offpolicy-varibad \
# --name Cheetah-Vel --loc "lower right"
# python scripts/merge_csv.py --base_path results/logs/meta/HalfCheetahVel-v0/oracle \
# --max_episode_len 400 --start_x 240000 --interval_x 40000
# python scripts/plot_csv.py --csv_path results/data/meta/HalfCheetahVel-v0/oracle/final.csv \
# --window_size 10 --max_x 5000000
# python scripts/plot_single_factor.py --csv_path results/data/meta/HalfCheetahVel-v0/final.csv \
# --window_size 10 --factors RL,Encoder,Len
# python scripts/merge_csv.py --base_path results/logs/meta/PointRobotSparse-v0 \
# --max_episode_len 120 --start_x 60000 --interval_x 15000
# python scripts/plot_csv.py --csv_path results/data/meta/PointRobotSparse-v0/final.csv \
# --window_size 10 --best_variant td3-lstm-64-or-separate --other_methods offpolicy-varibad \
# --name Semi-Circle --loc "lower right"
# python scripts/merge_csv.py --base_path results/logs/meta/PointRobotSparse-v0/oracle \
# --max_episode_len 120 --start_x 60000 --interval_x 15000
# python scripts/plot_csv.py --csv_path results/data/meta/PointRobotSparse-v0/oracle/final.csv \
# --window_size 10 --max_x 1500000
# python scripts/plot_diagnose.py --csv_path results/data/meta/PointRobotSparse-v0/final.csv \
# --window_size 10 --instances td3-lstm-64-or-separate,td3-lstm-64-or-shared
# python scripts/plot_single_factor.py --csv_path results/data/meta/PointRobotSparse-v0/final.csv \
# --window_size 10 --factors Arch,RL,Encoder,Len
# python scripts/merge_csv.py --base_path results/logs/meta/Wind-v0 \
# --max_episode_len 75 --start_x 9000 --interval_x 3000
# python scripts/plot_csv.py --csv_path results/data/meta/Wind-v0/final.csv \
# --window_size 10 --best_variant td3-lstm-64-oa-separate --other_methods offpolicy-varibad \
# --name Wind --loc "lower right"
# python scripts/merge_csv.py --base_path results/logs/meta/Wind-v0/oracle \
# --max_episode_len 75 --start_x 9000 --interval_x 3000
# python scripts/plot_csv.py --csv_path results/data/meta/Wind-v0/oracle/final.csv \
# --window_size 10
# python scripts/plot_single_factor.py --csv_path results/data/meta/Wind-v0/final.csv \
# --window_size 10 --factors RL,Encoder,Len,Inputs
## Meta RL (on-policy varibad benchmark)
# python scripts/merge_csv.py --base_path results/logs/meta/AntDir-v0 \
# --max_episode_len 400 --start_x 240000 --interval_x 40000
# python scripts/plot_csv.py --csv_path results/data/meta/AntDir-v0/final.csv \
# --window_size 10 --max_x 100000000 --other_methods onpolicy-varibad,rl2,oracle_ppo,oracle_sac,Markovian_td3 \
# --best_variant sac-gru-400-oar-separate \
# --loc "lower right" --name Ant-Dir
# python scripts/merge_csv.py --base_path results/logs/meta/CheetahDir-v0 \
# --max_episode_len 400 --start_x 240000 --interval_x 40000
# python scripts/plot_csv.py --csv_path results/data/meta/CheetahDir-v0/final.csv \
# --window_size 10 --max_x 100000000 --other_methods onpolicy-varibad,rl2,oracle_ppo,Markovian_sac,oracle_sac \
# --best_variant sac-gru-400-oar-separate \
# --loc "lower right" --name Cheetah-Dir
# python scripts/merge_csv.py --base_path results/logs/meta/HumanoidDir-v0 \
# --max_episode_len 400 --start_x 240000 --interval_x 40000
# python scripts/plot_csv.py --csv_path results/data/meta/HumanoidDir-v0/final.csv \
# --window_size 10 --max_x 100000000 --other_methods onpolicy-varibad,rl2,oracle_ppo,oracle_sac,Markovian_sac \
# --best_variant sac-gru-400-oar-separate \
# --loc "lower right" --name Humanoid-Dir
## Robust RL
# python scripts/merge_csv.py --base_path results/logs/rmdp/MRPOHalfCheetahRandomNormal-v0 \
# --max_episode_len 1000 --start_x 50000 --interval_x 50000
# python scripts/plot_csv.py --csv_path results/data/rmdp/MRPOHalfCheetahRandomNormal-v0/final.csv \
# --window_size 20 --max_x 15000000 --best_variant td3-lstm-64-o-separate --other_methods MRPO,ppo_gru,oracle_sac,Markovian_sac \
# --name Cheetah-Robust --loc "upper right"
# python scripts/plot_single_factor.py --csv_path results/data/rmdp/MRPOHalfCheetahRandomNormal-v0/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/rmdp/MRPOHopperRandomNormal-v0 \
# --max_episode_len 1000 --start_x 50000 --interval_x 50000
# python scripts/plot_csv.py --csv_path results/data/rmdp/MRPOHopperRandomNormal-v0/final.csv \
# --window_size 20 --max_x 20000000 --best_variant td3-lstm-64-o-separate --other_methods MRPO,ppo_gru,oracle_sac,Markovian_sac \
# --name Hopper-Robust --loc "upper right"
# python scripts/plot_single_factor.py --csv_path results/data/rmdp/MRPOHopperRandomNormal-v0/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
# python scripts/merge_csv.py --base_path results/logs/rmdp/MRPOWalker2dRandomNormal-v0 \
# --max_episode_len 1000 --start_x 50000 --interval_x 50000
# python scripts/plot_csv.py --csv_path results/data/rmdp/MRPOWalker2dRandomNormal-v0/final.csv \
# --window_size 20 --max_x 20000000 --best_variant td3-lstm-64-o-separate --other_methods MRPO,ppo_gru,oracle_sac,Markovian_sac \
# --name Walker-Robust --loc "upper right"
# python scripts/plot_single_factor.py --csv_path results/data/rmdp/MRPOWalker2dRandomNormal-v0/final.csv \
# --window_size 20 --factors RL,Encoder,Len,Inputs
## Generalization in RL
# python scripts/merge_csv.py --base_path results/logs/generalize/SunblazeHalfCheetah-v0 \
# --max_episode_len 1000 --start_x 50000 --interval_x 50000
# python scripts/plot_csv.py --csv_path results/data/generalize/SunblazeHalfCheetah-v0/final.csv \
# --window_size 20 --max_x 20000000 --best_variant td3-lstm-64-o-separate
# python scripts/merge_csv.py --base_path results/logs/generalize/SunblazeHalfCheetahRandomNormal-v0 \
# --max_episode_len 1000 --start_x 50000 --interval_x 50000
# python scripts/plot_csv.py --csv_path results/data/generalize/SunblazeHalfCheetahRandomNormal-v0/final.csv \
# --window_size 20 --max_x 20000000 --best_variant td3-lstm-64-o-separate
# python scripts/plot_generalization.py --merged_path results/data/generalize/Cheetah-Generalize \
# --csv_paths results/data/generalize/SunblazeHalfCheetah-v0/final.csv,results/data/generalize/SunblazeHalfCheetahRandomNormal-v0/final.csv \
# --window_size 10 --name Cheetah-Generalize --factors RL,Len,Inputs --best_variant td3-lstm-64-o-separate \
# --other_methods oracle_td3,Markovian_sac
# python scripts/merge_csv.py --base_path results/logs/generalize/SunblazeHopper-v0 \
# --max_episode_len 1000 --start_x 50000 --interval_x 50000
# python scripts/plot_csv.py --csv_path results/data/generalize/SunblazeHopper-v0/final.csv \
# --window_size 20 --max_x 20000000 --best_variant td3-lstm-64-o-separate
# python scripts/merge_csv.py --base_path results/logs/generalize/SunblazeHopperRandomNormal-v0 \
# --max_episode_len 1000 --start_x 50000 --interval_x 50000
# python scripts/plot_csv.py --csv_path results/data/generalize/SunblazeHopperRandomNormal-v0/final.csv \
# --window_size 20 --max_x 20000000 --best_variant td3-lstm-64-o-separate
# python scripts/plot_generalization.py --merged_path results/data/generalize/Hopper-Generalize \
# --csv_paths results/data/generalize/SunblazeHopper-v0/final.csv,results/data/generalize/SunblazeHopperRandomNormal-v0/final.csv \
# --window_size 10 --name Hopper-Generalize --factors RL,Len,Inputs --best_variant td3-lstm-64-o-separate \
# --other_methods oracle_sac,Markovian_sac
## Long-term credit assignment
# python scripts/merge_csv.py --base_path results/logs/credit/Catch/40 \
# --max_episode_len 279 --start_x 13950 --interval_x 13950
# python scripts/plot_csv.py --csv_path results/data/credit/Catch/40/final.csv \
# --window_size 10 --loc "right" --max_x 2500000 \
# --name Delayed-Catch --best_variant sacd-lstm-279-o-separate
# python scripts/merge_csv.py --base_path results/logs/credit/KeytoDoor/SR \
# --max_episode_len 85 --start_x 4250 --interval_x 4250
# python scripts/plot_csv.py --csv_path results/data/credit/KeytoDoor/SR/final.csv \
# --window_size 10 --loc "lower right" --max_x 4000000 \
# --best_variant sacd-lstm-85-o-separate --name Key-to-Door