Skip to content

Commit 115cb27

Browse files
authored
Merge pull request #5 from Bam4d/cartpole_hyperparams_2
These hyperparameters work significantly better than the previous ones.
2 parents 0fdf6fc + faa6f19 commit 115cb27

File tree

1 file changed

+3
-3
lines changed
  • rl4j-examples/src/main/java/org/deeplearning4j/examples/rl4j

1 file changed

+3
-3
lines changed

rl4j-examples/src/main/java/org/deeplearning4j/examples/rl4j/Cartpole.java

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -46,9 +46,9 @@ public class Cartpole
4646
150000, //Max step
4747
150000, //Max size of experience replay
4848
32, //size of batches
49-
500, //target update (hard)
49+
100, //target update (hard)
5050
10, //num step noop warmup
51-
0.01, //reward scaling
51+
0.1, //reward scaling
5252
0.99, //gamma
5353
1.0, //td-error clipping
5454
0.1f, //min epsilon
@@ -58,7 +58,7 @@ public class Cartpole
5858

5959
public static DQNFactoryStdDense.Configuration CARTPOLE_NET =
6060
DQNFactoryStdDense.Configuration.builder()
61-
.l2(0.001).updater(new Adam(0.0005)).numHiddenNodes(16).numLayer(3).build();
61+
.updater(new Adam(0.001)).numHiddenNodes(16).numLayer(3).build();
6262

6363
public static void main(String[] args) throws IOException {
6464
cartPole();

0 commit comments

Comments
 (0)