Skip to content

Commit c9ccf5b

Browse files
committed
Upgrade environment versions in the train_preference_comparisons config.
1 parent 2459817 commit c9ccf5b

File tree

1 file changed

+6
-6
lines changed

1 file changed

+6
-6
lines changed

src/imitation/scripts/config/train_preference_comparisons.py

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -77,7 +77,7 @@ def cartpole():
 77  77
 78  78   @train_preference_comparisons_ex.named_config
 79  79   def seals_ant():
 80      -    environment = dict(gym_id="seals/Ant-v0")
     80  +    environment = dict(gym_id="seals/Ant-v1")
 81  81       rl = dict(
 82  82           batch_size=2048,
 83  83           rl_kwargs=dict(
@@ -104,7 +104,7 @@ def half_cheetah():
104 104
105 105   @train_preference_comparisons_ex.named_config
106 106   def seals_half_cheetah():
107      -    environment = dict(gym_id="seals/HalfCheetah-v0")
    107  +    environment = dict(gym_id="seals/HalfCheetah-v1")
108 108       rl = dict(
109 109           batch_size=512,
110 110           rl_kwargs=dict(
@@ -125,7 +125,7 @@ def seals_half_cheetah():
125 125
126 126   @train_preference_comparisons_ex.named_config
127 127   def seals_hopper():
128      -    environment = dict(gym_id="seals/Hopper-v0")
    128  +    environment = dict(gym_id="seals/Hopper-v1")
129 129       policy = dict(
130 130           policy_cls="MlpPolicy",
131 131           policy_kwargs=dict(
@@ -151,7 +151,7 @@ def seals_hopper():
151 151
152 152   @train_preference_comparisons_ex.named_config
153 153   def seals_swimmer():
154      -    environment = dict(gym_id="seals/Swimmer-v0")
    154  +    environment = dict(gym_id="seals/Swimmer-v1")
155 155       policy = dict(
156 156           policy_cls="MlpPolicy",
157 157           policy_kwargs=dict(
@@ -178,7 +178,7 @@ def seals_swimmer():
178 178
179 179   @train_preference_comparisons_ex.named_config
180 180   def seals_walker():
181      -    environment = dict(gym_id="seals/Walker2d-v0")
    181  +    environment = dict(gym_id="seals/Walker2d-v1")
182 182       policy = dict(
183 183           policy_cls="MlpPolicy",
184 184           policy_kwargs=dict(
@@ -206,7 +206,7 @@ def seals_walker():
206 206   @train_preference_comparisons_ex.named_config
207 207   def seals_humanoid():
208 208       locals().update(**MUJOCO_SHARED_LOCALS)
209      -    environment = dict(gym_id="seals/Humanoid-v0")
    209  +    environment = dict(gym_id="seals/Humanoid-v1")
210 210       total_timesteps = int(4e6)
211 211
212 212
0 commit comments

Comments
 (0)