@@ -77,7 +77,7 @@ def cartpole():
7777
7878@train_preference_comparisons_ex .named_config
7979def seals_ant ():
80- environment = dict (gym_id = "seals/Ant-v0 " )
80+ environment = dict (gym_id = "seals/Ant-v1 " )
8181 rl = dict (
8282 batch_size = 2048 ,
8383 rl_kwargs = dict (
@@ -104,7 +104,7 @@ def half_cheetah():
104104
105105@train_preference_comparisons_ex .named_config
106106def seals_half_cheetah ():
107- environment = dict (gym_id = "seals/HalfCheetah-v0 " )
107+ environment = dict (gym_id = "seals/HalfCheetah-v1 " )
108108 rl = dict (
109109 batch_size = 512 ,
110110 rl_kwargs = dict (
@@ -125,7 +125,7 @@ def seals_half_cheetah():
125125
126126@train_preference_comparisons_ex .named_config
127127def seals_hopper ():
128- environment = dict (gym_id = "seals/Hopper-v0 " )
128+ environment = dict (gym_id = "seals/Hopper-v1 " )
129129 policy = dict (
130130 policy_cls = "MlpPolicy" ,
131131 policy_kwargs = dict (
@@ -151,7 +151,7 @@ def seals_hopper():
151151
152152@train_preference_comparisons_ex .named_config
153153def seals_swimmer ():
154- environment = dict (gym_id = "seals/Swimmer-v0 " )
154+ environment = dict (gym_id = "seals/Swimmer-v1 " )
155155 policy = dict (
156156 policy_cls = "MlpPolicy" ,
157157 policy_kwargs = dict (
@@ -178,7 +178,7 @@ def seals_swimmer():
178178
179179@train_preference_comparisons_ex .named_config
180180def seals_walker ():
181- environment = dict (gym_id = "seals/Walker2d-v0 " )
181+ environment = dict (gym_id = "seals/Walker2d-v1 " )
182182 policy = dict (
183183 policy_cls = "MlpPolicy" ,
184184 policy_kwargs = dict (
@@ -206,7 +206,7 @@ def seals_walker():
206206@train_preference_comparisons_ex .named_config
207207def seals_humanoid ():
208208 locals ().update (** MUJOCO_SHARED_LOCALS )
209- environment = dict (gym_id = "seals/Humanoid-v0 " )
209+ environment = dict (gym_id = "seals/Humanoid-v1 " )
210210 total_timesteps = int (4e6 )
211211
212212
0 commit comments