File tree 3 files changed +9
-9
lines changed
rl4j-examples/src/main/java/org/deeplearning4j/examples/rl4j
3 files changed +9
-9
lines changed Original file line number Diff line number Diff line change @@ -42,11 +42,11 @@ public class A3CCartpole {
42
42
200 , //Max step By epoch
43
43
500000 , //Max step
44
44
16 , //Number of threads
45
- 5 , //t_max
45
+ 10 , //t_max
46
46
10 , //num step noop warmup
47
- 0.01 , //reward scaling
47
+ 0.1 , //reward scaling
48
48
0.99 , //gamma
49
- 10 .0 //td-error clipping
49
+ 1 .0 //td-error clipping
50
50
);
51
51
52
52
Original file line number Diff line number Diff line change @@ -41,12 +41,12 @@ public class AsyncNStepCartpole {
41
41
200 , //Max step By epoch
42
42
300000 , //Max step
43
43
16 , //Number of threads
44
- 5 , //t_max
44
+ 10 , //t_max
45
45
100 , //target update (hard)
46
46
10 , //num step noop warmup
47
- 0.01 , //reward scaling
47
+ 0.1 , //reward scaling
48
48
0.99 , //gamma
49
- 100 .0 , //td-error clipping
49
+ 1 .0 , //td-error clipping
50
50
0.1f , //min epsilon
51
51
9000 //num step for eps greedy anneal
52
52
);
Original file line number Diff line number Diff line change @@ -46,9 +46,9 @@ public class Cartpole
46
46
150000 , //Max step
47
47
150000 , //Max size of experience replay
48
48
32 , //size of batches
49
- 500 , //target update (hard)
49
+ 100 , //target update (hard)
50
50
10 , //num step noop warmup
51
- 0.01 , //reward scaling
51
+ 0.1 , //reward scaling
52
52
0.99 , //gamma
53
53
1.0 , //td-error clipping
54
54
0.1f , //min epsilon
@@ -58,7 +58,7 @@ public class Cartpole
58
58
59
59
public static DQNFactoryStdDense .Configuration CARTPOLE_NET =
60
60
DQNFactoryStdDense .Configuration .builder ()
61
- .l2 ( 0.001 ). updater (new Adam (0.0005 )).numHiddenNodes (16 ).numLayer (3 ).build ();
61
+ .updater (new Adam (0.001 )).numHiddenNodes (16 ).numLayer (3 ).build ();
62
62
63
63
public static void main (String [] args ) throws IOException {
64
64
cartPole ();
You can’t perform that action at this time.
0 commit comments