@@ -273,22 +273,22 @@ def _get_ob(self):
273273
274274
275275class TestEnv (gym .Wrapper ):
276- def __init__ (self , env , eval_episodes = 3 ):
276+ def __init__ (self , env , test_episodes = 3 ):
277277 """ env wrapper for test and validation in atari environment.
278278
279279 Args:
280280 env (ClipRewardEnv or FrameStack): the atari env
281- eval_episodes (int): number of episodes for evaluation
281+ test_episodes (int): number of episodes for evaluation
282282 """
283283
284284 gym .Wrapper .__init__ (self , env )
285285 self ._env = env
286286 self ._monitor = get_wrapper_by_cls (env , MonitorEnv )
287- self ._eval_episodes = eval_episodes
287+ self ._test_episodes = test_episodes
288288 self ._was_real_done = False
289289 self ._eval_rewards = None
290290 self ._end_episode = len (
291- self ._monitor .get_episode_rewards ()) + eval_episodes
291+ self ._monitor .get_episode_rewards ()) + test_episodes
292292
293293 def step (self , action ):
294294 ob , reward , done , info = self ._env .step (action )
@@ -301,8 +301,8 @@ def reset(self, **kwargs):
301301 if self ._get_curr_episode () >= self ._end_episode :
302302 self ._was_real_done = True
303303 self ._eval_rewards = \
304- self ._monitor .get_episode_rewards ()[- self ._eval_episodes :]
305- self ._end_episode = self ._end_episode + self ._eval_episodes
304+ self ._monitor .get_episode_rewards ()[- self ._test_episodes :]
305+ self ._end_episode = self ._end_episode + self ._test_episodes
306306 else :
307307 self ._was_real_done = False
308308 self ._eval_rewards = None
@@ -324,15 +324,15 @@ def wrap_deepmind(env,
324324 framestack = True ,
325325 obs_format = 'NHWC' ,
326326 test = False ,
327- eval_episodes = 3 ):
327+ test_episodes = 3 ):
328328 """Configure environment for DeepMind-style Atari.
329329
330330 Args:
331331 dim (int): Dimension to resize observations to (dim x dim).
332332 framestack (bool): Whether to framestack observations.
333333 obs_format (str): observation output format
334334 test (bool): whether this is a test env
335- eval_episodes (int): when test, number of episodes for each evaluation
335+ test_episodes (int): when test, number of episodes for each evaluation
336336 """
337337 env = MonitorEnv (env )
338338 env = NoopResetEnv (env , noop_max = 30 )
@@ -346,5 +346,5 @@ def wrap_deepmind(env,
346346 if framestack :
347347 env = FrameStack (env , 4 , obs_format )
348348 if test :
349- env = TestEnv (env , eval_episodes )
349+ env = TestEnv (env , test_episodes )
350350 return env
0 commit comments