Skip to content

Commit f5f971f

Browse files
Marlos C. Machado authored and psc-g committed
Parameters that actually lead to good results (200) in CartPole with C51.
PiperOrigin-RevId: 257675436
1 parent b9e932a commit f5f971f

File tree

1 file changed

+9
-7
lines changed

1 file changed

+9
-7
lines changed

dopamine/agents/rainbow/configs/c51_cartpole.gin

Lines changed: 9 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -11,26 +11,28 @@ RainbowAgent.observation_shape = %gym_lib.CARTPOLE_OBSERVATION_SHAPE
1111
RainbowAgent.observation_dtype = %gym_lib.CARTPOLE_OBSERVATION_DTYPE
1212
RainbowAgent.stack_size = %gym_lib.CARTPOLE_STACK_SIZE
1313
RainbowAgent.network = @gym_lib.cartpole_rainbow_network
14-
RainbowAgent.num_atoms = 51
15-
RainbowAgent.vmax = 10.
14+
RainbowAgent.num_atoms = 201
15+
RainbowAgent.vmax = 100.
1616
RainbowAgent.gamma = 0.99
17+
RainbowAgent.epsilon_eval = 0.
18+
RainbowAgent.epsilon_train = 0.01
1719
RainbowAgent.update_horizon = 1
1820
RainbowAgent.min_replay_history = 500
19-
RainbowAgent.update_period = 4
20-
RainbowAgent.target_update_period = 100
21+
RainbowAgent.update_period = 1
22+
RainbowAgent.target_update_period = 1
2123
RainbowAgent.epsilon_fn = @dqn_agent.identity_epsilon
2224
RainbowAgent.replay_scheme = 'uniform'
2325
RainbowAgent.tf_device = '/gpu:0' # use '/cpu:*' for non-GPU version
2426
RainbowAgent.optimizer = @tf.train.AdamOptimizer()
2527

26-
tf.train.AdamOptimizer.learning_rate = 0.001
27-
tf.train.AdamOptimizer.epsilon = 0.0003125
28+
tf.train.AdamOptimizer.learning_rate = 0.00001
29+
tf.train.AdamOptimizer.epsilon = 0.00000390625
2830

2931
create_gym_environment.environment_name = 'CartPole'
3032
create_gym_environment.version = 'v0'
3133
create_agent.agent_name = 'rainbow'
3234
Runner.create_environment_fn = @gym_lib.create_gym_environment
33-
Runner.num_iterations = 500
35+
Runner.num_iterations = 400
3436
Runner.training_steps = 1000
3537
Runner.evaluation_steps = 1000
3638
Runner.max_steps_per_episode = 200 # Default max episode length.

0 commit comments

Comments
 (0)