-
-
Notifications
You must be signed in to change notification settings - Fork 290
/
Copy pathinfos.py
311 lines (301 loc) · 20.1 KB
/
infos.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
"""
This file holds all URLs and reference scores.
"""
#TODO(Justin): This is duplicated. Make all __init__ file URLs and scores point to this file.
# Download location of the HDF5 file behind every registered dataset name.
# All files live under one server root, so each entry below only spells out
# the part of the path that differs ('<folder>/<file>.hdf5'); the root is
# prepended once when the mapping is built. Entry order is preserved.
DATASET_URLS = {
    name: 'http://rail.eecs.berkeley.edu/datasets/offline_rl/' + path
    for name, path in (
        # maze2d (sparse reward)
        ('maze2d-open-v0', 'maze2d/maze2d-open-sparse.hdf5'),
        ('maze2d-umaze-v1', 'maze2d/maze2d-umaze-sparse-v1.hdf5'),
        ('maze2d-medium-v1', 'maze2d/maze2d-medium-sparse-v1.hdf5'),
        ('maze2d-large-v1', 'maze2d/maze2d-large-sparse-v1.hdf5'),
        ('maze2d-eval-umaze-v1', 'maze2d/maze2d-eval-umaze-sparse-v1.hdf5'),
        ('maze2d-eval-medium-v1', 'maze2d/maze2d-eval-medium-sparse-v1.hdf5'),
        ('maze2d-eval-large-v1', 'maze2d/maze2d-eval-large-sparse-v1.hdf5'),
        # maze2d (dense reward)
        ('maze2d-open-dense-v0', 'maze2d/maze2d-open-dense.hdf5'),
        ('maze2d-umaze-dense-v1', 'maze2d/maze2d-umaze-dense-v1.hdf5'),
        ('maze2d-medium-dense-v1', 'maze2d/maze2d-medium-dense-v1.hdf5'),
        ('maze2d-large-dense-v1', 'maze2d/maze2d-large-dense-v1.hdf5'),
        ('maze2d-eval-umaze-dense-v1', 'maze2d/maze2d-eval-umaze-dense-v1.hdf5'),
        ('maze2d-eval-medium-dense-v1', 'maze2d/maze2d-eval-medium-dense-v1.hdf5'),
        ('maze2d-eval-large-dense-v1', 'maze2d/maze2d-eval-large-dense-v1.hdf5'),
        # minigrid
        ('minigrid-fourrooms-v0', 'minigrid/minigrid4rooms.hdf5'),
        ('minigrid-fourrooms-random-v0', 'minigrid/minigrid4rooms_random.hdf5'),
        # hand_dapg (pen / hammer / relocate / door)
        ('pen-human-v0', 'hand_dapg/pen-v0_demos_clipped.hdf5'),
        ('pen-cloned-v0', 'hand_dapg/pen-demos-v0-bc-combined.hdf5'),
        ('pen-expert-v0', 'hand_dapg/pen-v0_expert_clipped.hdf5'),
        ('hammer-human-v0', 'hand_dapg/hammer-v0_demos_clipped.hdf5'),
        ('hammer-cloned-v0', 'hand_dapg/hammer-demos-v0-bc-combined.hdf5'),
        ('hammer-expert-v0', 'hand_dapg/hammer-v0_expert_clipped.hdf5'),
        ('relocate-human-v0', 'hand_dapg/relocate-v0_demos_clipped.hdf5'),
        ('relocate-cloned-v0', 'hand_dapg/relocate-demos-v0-bc-combined.hdf5'),
        ('relocate-expert-v0', 'hand_dapg/relocate-v0_expert_clipped.hdf5'),
        ('door-human-v0', 'hand_dapg/door-v0_demos_clipped.hdf5'),
        ('door-cloned-v0', 'hand_dapg/door-demos-v0-bc-combined.hdf5'),
        ('door-expert-v0', 'hand_dapg/door-v0_expert_clipped.hdf5'),
        # gym_mujoco v0 (the 'medium-replay' files are named '*_mixed')
        ('halfcheetah-random-v0', 'gym_mujoco/halfcheetah_random.hdf5'),
        ('halfcheetah-medium-v0', 'gym_mujoco/halfcheetah_medium.hdf5'),
        ('halfcheetah-expert-v0', 'gym_mujoco/halfcheetah_expert.hdf5'),
        ('halfcheetah-medium-replay-v0', 'gym_mujoco/halfcheetah_mixed.hdf5'),
        ('halfcheetah-medium-expert-v0', 'gym_mujoco/halfcheetah_medium_expert.hdf5'),
        ('walker2d-random-v0', 'gym_mujoco/walker2d_random.hdf5'),
        ('walker2d-medium-v0', 'gym_mujoco/walker2d_medium.hdf5'),
        ('walker2d-expert-v0', 'gym_mujoco/walker2d_expert.hdf5'),
        ('walker2d-medium-replay-v0', 'gym_mujoco/walker_mixed.hdf5'),
        ('walker2d-medium-expert-v0', 'gym_mujoco/walker2d_medium_expert.hdf5'),
        ('hopper-random-v0', 'gym_mujoco/hopper_random.hdf5'),
        ('hopper-medium-v0', 'gym_mujoco/hopper_medium.hdf5'),
        ('hopper-expert-v0', 'gym_mujoco/hopper_expert.hdf5'),
        ('hopper-medium-replay-v0', 'gym_mujoco/hopper_mixed.hdf5'),
        ('hopper-medium-expert-v0', 'gym_mujoco/hopper_medium_expert.hdf5'),
        ('ant-random-v0', 'gym_mujoco/ant_random.hdf5'),
        ('ant-medium-v0', 'gym_mujoco/ant_medium.hdf5'),
        ('ant-expert-v0', 'gym_mujoco/ant_expert.hdf5'),
        ('ant-medium-replay-v0', 'gym_mujoco/ant_mixed.hdf5'),
        ('ant-medium-expert-v0', 'gym_mujoco/ant_medium_expert.hdf5'),
        ('ant-random-expert-v0', 'gym_mujoco/ant_random_expert.hdf5'),
        # antmaze v0
        ('antmaze-umaze-v0', 'ant_maze_new/Ant_maze_u-maze_noisy_multistart_False_multigoal_False_sparse.hdf5'),
        ('antmaze-umaze-diverse-v0', 'ant_maze_new/Ant_maze_u-maze_noisy_multistart_True_multigoal_True_sparse.hdf5'),
        ('antmaze-medium-play-v0', 'ant_maze_new/Ant_maze_big-maze_noisy_multistart_True_multigoal_False_sparse.hdf5'),
        ('antmaze-medium-diverse-v0', 'ant_maze_new/Ant_maze_big-maze_noisy_multistart_True_multigoal_True_sparse.hdf5'),
        ('antmaze-large-play-v0', 'ant_maze_new/Ant_maze_hardest-maze_noisy_multistart_True_multigoal_False_sparse.hdf5'),
        ('antmaze-large-diverse-v0', 'ant_maze_new/Ant_maze_hardest-maze_noisy_multistart_True_multigoal_True_sparse.hdf5'),
        # antmaze v2 ('*_fixed' files)
        ('antmaze-umaze-v2', 'ant_maze_v2/Ant_maze_u-maze_noisy_multistart_False_multigoal_False_sparse_fixed.hdf5'),
        ('antmaze-umaze-diverse-v2', 'ant_maze_v2/Ant_maze_u-maze_noisy_multistart_True_multigoal_True_sparse_fixed.hdf5'),
        ('antmaze-medium-play-v2', 'ant_maze_v2/Ant_maze_big-maze_noisy_multistart_True_multigoal_False_sparse_fixed.hdf5'),
        ('antmaze-medium-diverse-v2', 'ant_maze_v2/Ant_maze_big-maze_noisy_multistart_True_multigoal_True_sparse_fixed.hdf5'),
        ('antmaze-large-play-v2', 'ant_maze_v2/Ant_maze_hardest-maze_noisy_multistart_True_multigoal_False_sparse_fixed.hdf5'),
        ('antmaze-large-diverse-v2', 'ant_maze_v2/Ant_maze_hardest-maze_noisy_multistart_True_multigoal_True_sparse_fixed.hdf5'),
        # flow
        ('flow-ring-random-v0', 'flow/flow-ring-v0-random.hdf5'),
        ('flow-ring-controller-v0', 'flow/flow-ring-v0-idm.hdf5'),
        ('flow-merge-random-v0', 'flow/flow-merge-v0-random.hdf5'),
        ('flow-merge-controller-v0', 'flow/flow-merge-v0-idm.hdf5'),
        # kitchen
        ('kitchen-complete-v0', 'kitchen/mini_kitchen_microwave_kettle_light_slider-v0.hdf5'),
        ('kitchen-partial-v0', 'kitchen/kitchen_microwave_kettle_light_slider-v0.hdf5'),
        ('kitchen-mixed-v0', 'kitchen/kitchen_microwave_kettle_bottomburner_light-v0.hdf5'),
        # carla
        ('carla-lane-v0', 'carla/carla_lane_follow_flat-v0.hdf5'),
        ('carla-town-v0', 'carla/carla_town_subsamp_flat-v0.hdf5'),
        ('carla-town-full-v0', 'carla/carla_town_flat-v0.hdf5'),
        # bullet locomotion
        ('bullet-halfcheetah-random-v0', 'bullet/bullet-halfcheetah_random.hdf5'),
        ('bullet-halfcheetah-medium-v0', 'bullet/bullet-halfcheetah_medium.hdf5'),
        ('bullet-halfcheetah-expert-v0', 'bullet/bullet-halfcheetah_expert.hdf5'),
        ('bullet-halfcheetah-medium-expert-v0', 'bullet/bullet-halfcheetah_medium_expert.hdf5'),
        ('bullet-halfcheetah-medium-replay-v0', 'bullet/bullet-halfcheetah_medium_replay.hdf5'),
        ('bullet-hopper-random-v0', 'bullet/bullet-hopper_random.hdf5'),
        ('bullet-hopper-medium-v0', 'bullet/bullet-hopper_medium.hdf5'),
        ('bullet-hopper-expert-v0', 'bullet/bullet-hopper_expert.hdf5'),
        ('bullet-hopper-medium-expert-v0', 'bullet/bullet-hopper_medium_expert.hdf5'),
        ('bullet-hopper-medium-replay-v0', 'bullet/bullet-hopper_medium_replay.hdf5'),
        ('bullet-ant-random-v0', 'bullet/bullet-ant_random.hdf5'),
        ('bullet-ant-medium-v0', 'bullet/bullet-ant_medium.hdf5'),
        ('bullet-ant-expert-v0', 'bullet/bullet-ant_expert.hdf5'),
        ('bullet-ant-medium-expert-v0', 'bullet/bullet-ant_medium_expert.hdf5'),
        ('bullet-ant-medium-replay-v0', 'bullet/bullet-ant_medium_replay.hdf5'),
        ('bullet-walker2d-random-v0', 'bullet/bullet-walker2d_random.hdf5'),
        ('bullet-walker2d-medium-v0', 'bullet/bullet-walker2d_medium.hdf5'),
        ('bullet-walker2d-expert-v0', 'bullet/bullet-walker2d_expert.hdf5'),
        ('bullet-walker2d-medium-expert-v0', 'bullet/bullet-walker2d_medium_expert.hdf5'),
        ('bullet-walker2d-medium-replay-v0', 'bullet/bullet-walker2d_medium_replay.hdf5'),
        # bullet maze2d
        ('bullet-maze2d-open-v0', 'bullet/bullet-maze2d-open-sparse.hdf5'),
        ('bullet-maze2d-umaze-v0', 'bullet/bullet-maze2d-umaze-sparse.hdf5'),
        ('bullet-maze2d-medium-v0', 'bullet/bullet-maze2d-medium-sparse.hdf5'),
        ('bullet-maze2d-large-v0', 'bullet/bullet-maze2d-large-sparse.hdf5'),
    )
}
# Reference minimum score for each dataset name.
# Datasets that share one reference value are listed together, so every
# score is written exactly once; the comprehension expands each group into
# one entry per name, in the order the names appear here.
# NOTE(review): presumably the lower anchor for score normalization - confirm
# against the code that consumes this table.
REF_MIN_SCORE = {
    name: score
    for names, score in (
        # maze2d (sparse, then dense)
        (('maze2d-open-v0',), 0.01),
        (('maze2d-umaze-v1',), 23.85),
        (('maze2d-medium-v1',), 13.13),
        (('maze2d-large-v1',), 6.7),
        (('maze2d-open-dense-v0',), 11.17817),
        (('maze2d-umaze-dense-v1',), 68.537689),
        (('maze2d-medium-dense-v1',), 44.264742),
        (('maze2d-large-dense-v1',), 30.569041),
        # minigrid
        (('minigrid-fourrooms-v0', 'minigrid-fourrooms-random-v0'), 0.01442),
        # pen / hammer / relocate / door
        (('pen-human-v0', 'pen-cloned-v0', 'pen-expert-v0'), 96.262799),
        (('hammer-human-v0', 'hammer-cloned-v0', 'hammer-expert-v0'), -274.856578),
        (('relocate-human-v0', 'relocate-cloned-v0', 'relocate-expert-v0'), -6.425911),
        (('door-human-v0', 'door-cloned-v0', 'door-expert-v0'), -56.512833),
        # gym mujoco v0
        ((
            'halfcheetah-random-v0',
            'halfcheetah-medium-v0',
            'halfcheetah-expert-v0',
            'halfcheetah-medium-replay-v0',
            'halfcheetah-medium-expert-v0',
        ), -280.178953),
        ((
            'walker2d-random-v0',
            'walker2d-medium-v0',
            'walker2d-expert-v0',
            'walker2d-medium-replay-v0',
            'walker2d-medium-expert-v0',
        ), 1.629008),
        ((
            'hopper-random-v0',
            'hopper-medium-v0',
            'hopper-expert-v0',
            'hopper-medium-replay-v0',
            'hopper-medium-expert-v0',
        ), -20.272305),
        ((
            'ant-random-v0',
            'ant-medium-v0',
            'ant-expert-v0',
            'ant-medium-replay-v0',
            'ant-medium-expert-v0',
        ), -325.6),
        # antmaze v0 / v2
        ((
            'antmaze-umaze-v0',
            'antmaze-umaze-diverse-v0',
            'antmaze-medium-play-v0',
            'antmaze-medium-diverse-v0',
            'antmaze-large-play-v0',
            'antmaze-large-diverse-v0',
        ), 0.0),
        ((
            'antmaze-umaze-v2',
            'antmaze-umaze-diverse-v2',
            'antmaze-medium-play-v2',
            'antmaze-medium-diverse-v2',
            'antmaze-large-play-v2',
            'antmaze-large-diverse-v2',
        ), 0.0),
        # kitchen
        (('kitchen-complete-v0', 'kitchen-partial-v0', 'kitchen-mixed-v0'), 0.0),
        # flow
        (('flow-ring-random-v0', 'flow-ring-controller-v0'), -165.22),
        (('flow-merge-random-v0', 'flow-merge-controller-v0'), 118.67993),
        # carla
        (('carla-lane-v0',), -0.8503839912088142),
        (('carla-town-v0',), -114.81579500772153),  # random score
        # bullet locomotion
        ((
            'bullet-halfcheetah-random-v0',
            'bullet-halfcheetah-medium-v0',
            'bullet-halfcheetah-expert-v0',
            'bullet-halfcheetah-medium-expert-v0',
            'bullet-halfcheetah-medium-replay-v0',
        ), -1275.766996),
        ((
            'bullet-hopper-random-v0',
            'bullet-hopper-medium-v0',
            'bullet-hopper-expert-v0',
            'bullet-hopper-medium-expert-v0',
            'bullet-hopper-medium-replay-v0',
        ), 20.058972),
        ((
            'bullet-ant-random-v0',
            'bullet-ant-medium-v0',
            'bullet-ant-expert-v0',
            'bullet-ant-medium-expert-v0',
            'bullet-ant-medium-replay-v0',
        ), 373.705955),
        ((
            'bullet-walker2d-random-v0',
            'bullet-walker2d-medium-v0',
            'bullet-walker2d-expert-v0',
            'bullet-walker2d-medium-expert-v0',
            'bullet-walker2d-medium-replay-v0',
        ), 16.523877),
        # bullet maze2d
        (('bullet-maze2d-open-v0',), 8.75),
        (('bullet-maze2d-umaze-v0',), 32.46),
        (('bullet-maze2d-medium-v0',), 14.87),
        (('bullet-maze2d-large-v0',), 1.82),
    )
    for name in names
}
# Reference maximum score for each dataset name.
# Datasets that share one reference value are listed together, so every
# score is written exactly once; the comprehension expands each group into
# one entry per name, in the order the names appear here.
# NOTE(review): presumably the upper anchor for score normalization - confirm
# against the code that consumes this table.
REF_MAX_SCORE = {
    name: score
    for names, score in (
        # maze2d (sparse, then dense)
        (('maze2d-open-v0',), 20.66),
        (('maze2d-umaze-v1',), 161.86),
        (('maze2d-medium-v1',), 277.39),
        (('maze2d-large-v1',), 273.99),
        (('maze2d-open-dense-v0',), 27.166538620695782),
        (('maze2d-umaze-dense-v1',), 193.66285642381482),
        (('maze2d-medium-dense-v1',), 297.4552547777125),
        (('maze2d-large-dense-v1',), 303.4857382709002),
        # minigrid
        (('minigrid-fourrooms-v0', 'minigrid-fourrooms-random-v0'), 2.89685),
        # pen / hammer / relocate / door
        (('pen-human-v0', 'pen-cloned-v0', 'pen-expert-v0'), 3076.8331017826877),
        (('hammer-human-v0', 'hammer-cloned-v0', 'hammer-expert-v0'), 12794.134825156867),
        (('relocate-human-v0', 'relocate-cloned-v0', 'relocate-expert-v0'), 4233.877797728884),
        (('door-human-v0', 'door-cloned-v0', 'door-expert-v0'), 2880.5693087298737),
        # gym mujoco v0
        ((
            'halfcheetah-random-v0',
            'halfcheetah-medium-v0',
            'halfcheetah-expert-v0',
            'halfcheetah-medium-replay-v0',
            'halfcheetah-medium-expert-v0',
        ), 12135.0),
        ((
            'walker2d-random-v0',
            'walker2d-medium-v0',
            'walker2d-expert-v0',
            'walker2d-medium-replay-v0',
            'walker2d-medium-expert-v0',
        ), 4592.3),
        ((
            'hopper-random-v0',
            'hopper-medium-v0',
            'hopper-expert-v0',
            'hopper-medium-replay-v0',
            'hopper-medium-expert-v0',
        ), 3234.3),
        ((
            'ant-random-v0',
            'ant-medium-v0',
            'ant-expert-v0',
            'ant-medium-replay-v0',
            'ant-medium-expert-v0',
        ), 3879.7),
        # antmaze v0 / v2
        ((
            'antmaze-umaze-v0',
            'antmaze-umaze-diverse-v0',
            'antmaze-medium-play-v0',
            'antmaze-medium-diverse-v0',
            'antmaze-large-play-v0',
            'antmaze-large-diverse-v0',
        ), 1.0),
        ((
            'antmaze-umaze-v2',
            'antmaze-umaze-diverse-v2',
            'antmaze-medium-play-v2',
            'antmaze-medium-diverse-v2',
            'antmaze-large-play-v2',
            'antmaze-large-diverse-v2',
        ), 1.0),
        # kitchen
        (('kitchen-complete-v0', 'kitchen-partial-v0', 'kitchen-mixed-v0'), 4.0),
        # flow
        (('flow-ring-random-v0', 'flow-ring-controller-v0'), 24.42),
        (('flow-merge-random-v0', 'flow-merge-controller-v0'), 330.03179),
        # carla
        (('carla-lane-v0',), 1023.5784385429523),
        (('carla-town-v0',), 2440.1772022247314),  # avg dataset score
        # bullet locomotion
        ((
            'bullet-halfcheetah-random-v0',
            'bullet-halfcheetah-medium-v0',
            'bullet-halfcheetah-expert-v0',
            'bullet-halfcheetah-medium-expert-v0',
            'bullet-halfcheetah-medium-replay-v0',
        ), 2381.6725),
        ((
            'bullet-hopper-random-v0',
            'bullet-hopper-medium-v0',
            'bullet-hopper-expert-v0',
            'bullet-hopper-medium-expert-v0',
            'bullet-hopper-medium-replay-v0',
        ), 1441.8059623430963),
        ((
            'bullet-ant-random-v0',
            'bullet-ant-medium-v0',
            'bullet-ant-expert-v0',
            'bullet-ant-medium-expert-v0',
            'bullet-ant-medium-replay-v0',
        ), 2650.495),
        ((
            'bullet-walker2d-random-v0',
            'bullet-walker2d-medium-v0',
            'bullet-walker2d-expert-v0',
            'bullet-walker2d-medium-expert-v0',
            'bullet-walker2d-medium-replay-v0',
        ), 1623.6476303317536),
        # bullet maze2d
        (('bullet-maze2d-open-v0',), 64.15),
        (('bullet-maze2d-umaze-v0',), 153.99),
        (('bullet-maze2d-medium-v0',), 238.05),
        (('bullet-maze2d-large-v0',), 285.92),
    )
    for name in names
}
# Gym-MuJoCo v1/v2 datasets.
# Each (environment, dataset type) pair is registered twice, first with the
# '-v1' suffix and then with '-v2'. Both versions copy their reference scores
# from the environment's existing '<env>-random-v0' entry.
for env in ('halfcheetah', 'hopper', 'walker2d', 'ant'):
    for dset in ('random', 'medium', 'expert', 'medium-replay', 'full-replay', 'medium-expert'):
        for version in ('v1', 'v2'):
            # File names on the server join the parts with underscores
            # (e.g. 'hopper_medium_replay-v1'); the registered dataset name
            # is the same string with every underscore turned into a hyphen.
            dset_name = '{}_{}-{}'.format(env, dset.replace('-', '_'), version)
            env_name = dset_name.replace('_', '-')
            DATASET_URLS[env_name] = (
                'http://rail.eecs.berkeley.edu/datasets/offline_rl/gym_mujoco_{}/{}.hdf5'
                .format(version, dset_name)
            )
            REF_MIN_SCORE[env_name] = REF_MIN_SCORE[env + '-random-v0']
            REF_MAX_SCORE[env_name] = REF_MAX_SCORE[env + '-random-v0']
# Adroit v1 datasets.
# Registers '<env>-<dset>-v1' for every task / data-source combination. The
# file on the server carries the same name as the dataset, and the reference
# scores are copied from the task's existing '<env>-human-v0' entry.
for env in ('hammer', 'pen', 'relocate', 'door'):
    for dset in ('human', 'expert', 'cloned'):
        env_name = '-'.join((env, dset, 'v1'))
        DATASET_URLS[env_name] = (
            'http://rail.eecs.berkeley.edu/datasets/offline_rl/hand_dapg_v1/' + env_name + '.hdf5'
        )
        REF_MIN_SCORE[env_name] = REF_MIN_SCORE[env + '-human-v0']
        REF_MAX_SCORE[env_name] = REF_MAX_SCORE[env + '-human-v0']