2
2
from typing import Optional , List
3
3
import copy
4
4
5
- final_eval_reward_wrapper = EasyDict (type = 'final_eval_reward ' )
5
+ eval_episode_return_wrapper = EasyDict (type = 'eval_episode_return ' )
6
6
7
7
8
8
def get_default_wrappers (env_wrapper_name : str , env_id : Optional [str ] = None ) -> List [dict ]:
9
9
if env_wrapper_name == 'mujoco_default' :
10
10
return [
11
11
EasyDict (type = 'delay_reward' , kwargs = dict (delay_reward_step = 3 )),
12
- copy .deepcopy (final_eval_reward_wrapper ),
12
+ copy .deepcopy (eval_episode_return_wrapper ),
13
13
]
14
14
elif env_wrapper_name == 'atari_default' :
15
15
wrapper_list = []
@@ -23,14 +23,14 @@ def get_default_wrappers(env_wrapper_name: str, env_id: Optional[str] = None) ->
23
23
wrapper_list .append (EasyDict (type = 'scaled_float_frame' ))
24
24
wrapper_list .append (EasyDict (type = 'clip_reward' ))
25
25
wrapper_list .append (EasyDict (type = 'frame_stack' , kwargs = dict (n_frames = 4 )))
26
- wrapper_list .append (copy .deepcopy (final_eval_reward_wrapper ))
26
+ wrapper_list .append (copy .deepcopy (eval_episode_return_wrapper ))
27
27
return wrapper_list
28
28
elif env_wrapper_name == 'gym_hybrid_default' :
29
29
return [
30
30
EasyDict (type = 'gym_hybrid_dict_action' ),
31
- copy .deepcopy (final_eval_reward_wrapper ),
31
+ copy .deepcopy (eval_episode_return_wrapper ),
32
32
]
33
33
elif env_wrapper_name == 'default' :
34
- return [copy .deepcopy (final_eval_reward_wrapper )]
34
+ return [copy .deepcopy (eval_episode_return_wrapper )]
35
35
else :
36
36
raise NotImplementedError ()
0 commit comments