Skip to content

Commit ccd804d

Browse files
authored
update atari_wrappers (#702)
* update atari_wrappers
* update atari_wrappers
1 parent abdc349 commit ccd804d

File tree

1 file changed

+9
-9
lines changed

1 file changed

+9
-9
lines changed

parl/env/atari_wrappers.py

Lines changed: 9 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -273,22 +273,22 @@ def _get_ob(self):
273273

274274

275275
class TestEnv(gym.Wrapper):
276-
def __init__(self, env, eval_episodes=3):
276+
def __init__(self, env, test_episodes=3):
277277
""" env wrapper for test and validation in atari environment.
278278
279279
Args:
280280
env (ClipRewardEnv or FrameStack): the atari env
281-
eval_episodes (int): number of episodes for evaluation
281+
test_episodes (int): number of episodes for evaluation
282282
"""
283283

284284
gym.Wrapper.__init__(self, env)
285285
self._env = env
286286
self._monitor = get_wrapper_by_cls(env, MonitorEnv)
287-
self._eval_episodes = eval_episodes
287+
self._test_episodes = test_episodes
288288
self._was_real_done = False
289289
self._eval_rewards = None
290290
self._end_episode = len(
291-
self._monitor.get_episode_rewards()) + eval_episodes
291+
self._monitor.get_episode_rewards()) + test_episodes
292292

293293
def step(self, action):
294294
ob, reward, done, info = self._env.step(action)
@@ -301,8 +301,8 @@ def reset(self, **kwargs):
301301
if self._get_curr_episode() >= self._end_episode:
302302
self._was_real_done = True
303303
self._eval_rewards = \
304-
self._monitor.get_episode_rewards()[-self._eval_episodes:]
305-
self._end_episode = self._end_episode + self._eval_episodes
304+
self._monitor.get_episode_rewards()[-self._test_episodes:]
305+
self._end_episode = self._end_episode + self._test_episodes
306306
else:
307307
self._was_real_done = False
308308
self._eval_rewards = None
@@ -324,15 +324,15 @@ def wrap_deepmind(env,
324324
framestack=True,
325325
obs_format='NHWC',
326326
test=False,
327-
eval_episodes=3):
327+
test_episodes=3):
328328
"""Configure environment for DeepMind-style Atari.
329329
330330
Args:
331331
dim (int): Dimension to resize observations to (dim x dim).
332332
framestack (bool): Whether to framestack observations.
333333
obs_format (str): observation output format
334334
test (bool): whether this is a test env
335-
eval_episodes (int): when test, number of episodes for each evaluation
335+
test_episodes (int): when test, number of episodes for each evaluation
336336
"""
337337
env = MonitorEnv(env)
338338
env = NoopResetEnv(env, noop_max=30)
@@ -346,5 +346,5 @@ def wrap_deepmind(env,
346346
if framestack:
347347
env = FrameStack(env, 4, obs_format)
348348
if test:
349-
env = TestEnv(env, eval_episodes)
349+
env = TestEnv(env, test_episodes)
350350
return env

0 commit comments

Comments
 (0)