History video parameters now capture the main part of the screen, not just the corner

Bam4d · Bam4d · commit 8a05b3d5a443 · 2020-04-22T14:56:28.000+01:00
diff --git a/rl4j-examples/src/main/java/org/deeplearning4j/examples/rl4j/ALE.java b/rl4j-examples/src/main/java/org/deeplearning4j/examples/rl4j/ALE.java
@@ -17,6 +17,7 @@
 package org.deeplearning4j.examples.rl4j;
 
 import java.io.IOException;
+
 import org.deeplearning4j.rl4j.learning.HistoryProcessor;
 import org.deeplearning4j.rl4j.learning.sync.qlearning.QLearning;
 import org.deeplearning4j.rl4j.learning.sync.qlearning.discrete.QLearningDiscreteConv;
@@ -26,47 +27,46 @@
 
 /**
  * @author saudet
- *
+ * <p>
  * Main example for DQN with The Arcade Learning Environment (ALE)
- *
  */
 public class ALE {
 
     public static HistoryProcessor.Configuration ALE_HP =
-            new HistoryProcessor.Configuration(
-                    4,       //History length
-                    84,      //resize width
-                    110,     //resize height
-                    84,      //crop width
-                    84,      //crop height
-                    0,       //cropping x offset
-                    0,       //cropping y offset
-                    4        //skip mod (one frame is picked every x
-            );
+        new HistoryProcessor.Configuration(
+            4,       //History length
+            152,      //resize width
+            194,     //resize height
+            152,      //crop width
+            194,      //crop height
+            8,       //cropping x offset
+            32,       //cropping y offset
+            4       //skip mod (one frame is picked every x frames)
+        );
 
     public static QLearning.QLConfiguration ALE_QL =
-            new QLearning.QLConfiguration(
-                    123,      //Random seed
-                    10000,    //Max step By epoch
-                    8000000,  //Max step
-                    1000000,  //Max size of experience replay
-                    32,       //size of batches
-                    10000,    //target update (hard)
-                    500,      //num step noop warmup
-                    0.1,      //reward scaling
-                    0.99,     //gamma
-                    100.0,    //td-error clipping
-                    0.1f,     //min epsilon
-                    100000,   //num step for eps greedy anneal
-                    true      //double-dqn
-            );
+        new QLearning.QLConfiguration(
+            123,      //Random seed
+            10000,    //Max step By epoch
+            8000000,  //Max step
+            1000000,  //Max size of experience replay
+            32,       //size of batches
+            10000,    //target update (hard)
+            500,      //num step noop warmup
+            0.1,      //reward scaling
+            0.99,     //gamma
+            100.0,    //td-error clipping
+            0.1f,     //min epsilon
+            100000,   //num step for eps greedy anneal
+            true      //double-dqn
+        );
 
     public static DQNFactoryStdConv.Configuration ALE_NET_QL =
-            new DQNFactoryStdConv.Configuration(
-                    0.00025, //learning rate
-                    0.000,   //l2 regularization
-                    null, null
-            );
+        new DQNFactoryStdConv.Configuration(
+            0.00025, //learning rate
+            0.000,   //l2 regularization
+            null, null
+        );
 
     public static void main(String[] args) throws IOException {
 
@@ -76,7 +76,7 @@ public static void main(String[] args) throws IOException {
         //setup the emulation environment through ALE, you will need a ROM file
         ALEMDP mdp = null;
         try {
-            mdp = new ALEMDP("pong.bin");
+            mdp = new ALEMDP("/home/bam4d/konduit/ALE/ROMS/pong.bin");
         } catch (UnsatisfiedLinkError e) {
             System.out.println("To run this example, uncomment the \"ale-platform\" dependency in the pom.xml file.");
         }