From 3d6afb192a40d71d5dd692a79928cf8035718c45 Mon Sep 17 00:00:00 2001
From: Jonathan Harper <jharper@unity3d.com>
Date: Mon, 10 Dec 2018 14:59:58 -0800
Subject: [PATCH 1/2] Support both 32-bit and 64-bit types in UnityEnvironment

We check for the single brain case in UnityEnvironment by checking
for applicable non-dict types in the step arguments. However for ints
and floats we just use `np.int_` and `np.float_` for the check, which
are the defaults for your system.

This means if you are using an application (like baselines in #1448)
which uses the wrong int/float size an error will be thrown.  This
change explicitly allows both 32 and 64-bit numbers.
---
 ml-agents/mlagents/envs/environment.py | 13 +++++++++----
 1 file changed, 9 insertions(+), 4 deletions(-)

diff --git a/ml-agents/mlagents/envs/environment.py b/ml-agents/mlagents/envs/environment.py
index 06a857a225..fca09c989a 100644
--- a/ml-agents/mlagents/envs/environment.py
+++ b/ml-agents/mlagents/envs/environment.py
@@ -20,6 +20,11 @@
 
 
 class UnityEnvironment(object):
+    SINGLE_BRAIN_ACTION_TYPES = (
+        int, np.int32, np.int64, float, np.float32, np.float64, list, np.ndarray
+    )
+    SINGLE_BRAIN_TEXT_TYPES = (str, list, np.ndarray)
+
     def __init__(self, file_name=None, worker_id=0,
                  base_port=5005, seed=0,
                  docker_training=False, no_graphics=False):
@@ -270,7 +275,7 @@ def step(self, vector_action=None, memory=None, text_action=None, value=None) ->
 
         # Check that environment is loaded, and episode is currently running.
         if self._loaded and not self._global_done and self._global_done is not None:
-            if isinstance(vector_action, (int, np.int_, float, np.float_, list, np.ndarray)):
+            if isinstance(vector_action, self.SINGLE_BRAIN_ACTION_TYPES):
                 if self._num_external_brains == 1:
                     vector_action = {self._external_brain_names[0]: vector_action}
                 elif self._num_external_brains > 1:
@@ -282,7 +287,7 @@ def step(self, vector_action=None, memory=None, text_action=None, value=None) ->
                         "There are no external brains in the environment, "
                         "step cannot take a vector_action input")
 
-            if isinstance(memory, (int, np.int_, float, np.float_, list, np.ndarray)):
+            if isinstance(memory, self.SINGLE_BRAIN_ACTION_TYPES):
                 if self._num_external_brains == 1:
                     memory = {self._external_brain_names[0]: memory}
                 elif self._num_external_brains > 1:
@@ -294,7 +299,7 @@ def step(self, vector_action=None, memory=None, text_action=None, value=None) ->
                         "There are no external brains in the environment, "
                         "step cannot take a memory input")
 
-            if isinstance(text_action, (str, list, np.ndarray)):
+            if isinstance(text_action, self.SINGLE_BRAIN_TEXT_TYPES):
                 if self._num_external_brains == 1:
                     text_action = {self._external_brain_names[0]: text_action}
                 elif self._num_external_brains > 1:
@@ -306,7 +311,7 @@ def step(self, vector_action=None, memory=None, text_action=None, value=None) ->
                         "There are no external brains in the environment, "
                         "step cannot take a value input")
 
-            if isinstance(value, (int, np.int_, float, np.float_, list, np.ndarray)):
+            if isinstance(value, self.SINGLE_BRAIN_ACTION_TYPES):
                 if self._num_external_brains == 1:
                     value = {self._external_brain_names[0]: value}
                 elif self._num_external_brains > 1:

From 286aed443128c3d04c537628e5cd056b3c0a05c4 Mon Sep 17 00:00:00 2001
From: Jonathan Harper <jharper@unity3d.com>
Date: Thu, 13 Dec 2018 14:39:52 -0800
Subject: [PATCH 2/2] Correctly "flatten" non-scalar action values

---
 ml-agents/mlagents/envs/environment.py | 11 +++++------
 1 file changed, 5 insertions(+), 6 deletions(-)

diff --git a/ml-agents/mlagents/envs/environment.py b/ml-agents/mlagents/envs/environment.py
index fca09c989a..94d7147ef2 100644
--- a/ml-agents/mlagents/envs/environment.py
+++ b/ml-agents/mlagents/envs/environment.py
@@ -20,9 +20,8 @@
 
 
 class UnityEnvironment(object):
-    SINGLE_BRAIN_ACTION_TYPES = (
-        int, np.int32, np.int64, float, np.float32, np.float64, list, np.ndarray
-    )
+    SCALAR_ACTION_TYPES = (int, np.int32, np.int64, float, np.float32, np.float64)
+    SINGLE_BRAIN_ACTION_TYPES = SCALAR_ACTION_TYPES + (list, np.ndarray)
     SINGLE_BRAIN_TEXT_TYPES = (str, list, np.ndarray)
 
     def __init__(self, file_name=None, worker_id=0,
@@ -424,14 +423,14 @@ def _close(self):
         if self.proc1 is not None:
             self.proc1.kill()
 
-    @staticmethod
-    def _flatten(arr):
+    @classmethod
+    def _flatten(cls, arr):
         """
         Converts arrays to list.
         :param arr: numpy vector.
         :return: flattened list.
         """
-        if isinstance(arr, (int, np.int_, float, np.float_)):
+        if isinstance(arr, cls.SCALAR_ACTION_TYPES):
             arr = [float(arr)]
         if isinstance(arr, np.ndarray):
             arr = arr.tolist()