Provide guidance when the Unity and Python API versions are incompatible

7 年前 · 9ded88f3
--- a/python/unityagents/environment.py
+++ b/python/unityagents/environment.py

 class UnityEnvironment(object):
    def __init__(self, file_name, worker_id=0,
-                 base_port=5005, curriculum = None):
+                 base_port=5005, curriculum=None):
        """
        Starts a new unity environment and establishes a connection with the environment.
        Notice: Currently communication between Unity and Python takes place over an open socket without authentication.

        cwd = os.getcwd()
        file_name = (file_name.strip()
-            .replace('.app', '').replace('.exe', '').replace('.x86_64', '').replace('.x86', ''))
+                     .replace('.app', '').replace('.exe', '').replace('.x86_64', '').replace('.x86', ''))
        true_filename = os.path.basename(os.path.normpath(file_name))
        launch_string = None
        if platform == "linux" or platform == "linux2":
        if launch_string is None:
            self.close()
            raise UnityEnvironmentException("Couldn't launch the {0} environment. "
-            "Provided filename does not match any environments."
-            .format(true_filename))
+                                            "Provided filename does not match any environments."
+                                            .format(true_filename))
        else:
            # Launch Unity environment
            proc1 = subprocess.Popen(
-        self._socket.settimeout(30) 
+        self._socket.settimeout(30)
        try:
            try:
                self._socket.listen(1)
                p = json.loads(p)
            except socket.timeout as e:
                raise UnityEnvironmentException(
-                "The Unity environment took too long to respond. Make sure {} does not need user interaction to launch "
-                "and that the Academy and the external Brain(s) are attached to objects in the Scene.".format(
-                    str(file_name)))
-        
+                    "The Unity environment took too long to respond. Make sure {} does not need user interaction to "
+                    "launch and that the Academy and the external Brain(s) are attached to objects in the Scene."
+                    .format(str(file_name)))
+
            if "apiNumber" not in p:
                self._unity_api = "API-1"
            else:
                    "The API number is not compatible between Unity and python. Python API : {0}, Unity API : "
-                    "{1}.".format(self._python_api, self._unity_api))
+                    "{1}.\nPlease go to https://github.com/Unity-Technologies/ml-agents to download the latest version "
+                    "of ML-Agents.".format(self._python_api, self._unity_api))

            self._data = {}
            self._global_done = None
            logger.info("\n'{}' started successfully!".format(self._academy_name))
            if (self._num_external_brains == 0):
                logger.warning(" No External Brains found in the Unity Environment. "
-                    "You will not be able to pass actions to your agent(s).")
+                               "You will not be able to pass actions to your agent(s).")
        except UnityEnvironmentException:
            proc1.kill()
            self.close()
                                                             for k in self._resetParameters])) + '\n' + \
               '\n'.join([str(self._brains[b]) for b in self._brains])

-
    def _recv_bytes(self):
        s = self._conn.recv(self._buffer_size)
        message_length = struct.unpack("I", bytearray(s[:4]))[0]
        config = self._curriculum.get_lesson(progress) if config is None else config
        if old_lesson != self._curriculum.get_lesson_number():
            logger.info("\nLesson changed. Now in Lesson {0} : \t{1}"
-                .format(self._curriculum.get_lesson_number(),
-                    ', '.join([str(x)+' -> '+str(config[x]) for x in config])))
+                        .format(self._curriculum.get_lesson_number(),
+                                ', '.join([str(x) + ' -> ' + str(config[x]) for x in config])))
-                .format(self._curriculum.get_lesson_number(),
-                    ', '.join([str(x)+' -> '+str(config[x]) for x in config])))
+                        .format(self._curriculum.get_lesson_number(),
+                                ', '.join([str(x) + ' -> ' + str(config[x]) for x in config])))
        if self._loaded:
            self._conn.send(b"RESET")
            self._conn.recv(self._buffer_size)
                raise UnityActionException("Brain {0} has an invalid state. "
                                           "Expecting {1} {2} state but received {3}."
                                           .format(b, n_agent if self._brains[b].state_space_type == "discrete"
-                                            else str(self._brains[b].state_space_size * n_agent),
-                                            self._brains[b].state_space_type,
-                                            len(state_dict["states"])))
+                else str(self._brains[b].state_space_size * n_agent),
+                                                   self._brains[b].state_space_type,
+                                                   len(state_dict["states"])))
-            if n_agent > 0 :
-                actions =  np.array(state_dict["actions"]).reshape((n_agent, -1))
-            else :
+            if n_agent > 0:
+                actions = np.array(state_dict["actions"]).reshape((n_agent, -1))
+            else:
                actions = np.array([])

            observations = []
        arr = [float(x) for x in arr]
        return arr

-    def step(self, action = None, memory=None, value=None):
+    def step(self, action=None, memory=None, value=None):
        """
        Provides the environment with an action, moves the environment dynamics forward accordingly, and returns
        observation, state, and reward information to the agent.
                        "and actions as values".format(self._num_brains))
                else:
                    raise UnityActionException(
-                        "There are no external brains in the environment, " 
+                        "There are no external brains in the environment, "
-                    
+
            if isinstance(memory, (int, np.int_, float, np.float_, list, np.ndarray)):
                if self._num_external_brains == 1:
                    memory = {self._external_brain_names[0]: memory}
                        "and memories as values".format(self._num_brains))
                else:
                    raise UnityActionException(
-                        "There are no external brains in the environment, " 
+                        "There are no external brains in the environment, "
-                elif self._num_external_brains > 1:  
+                elif self._num_external_brains > 1:
-                        "There are no external brains in the environment, " 
+                        "There are no external brains in the environment, "
                        "step cannot take a value input")

            for brain_name in list(action.keys()) + list(memory.keys()) + list(value.keys()):
-                        "in the environment". format(brain_name))
+                        "in the environment".format(brain_name))

            for b in self._external_brain_names:
                n_agent = len(self._data[b].agents)
                    raise UnityActionException(
                        "There was a mismatch between the provided memory and environment's expectation: "
                        "The brain {0} expected {1} memories but was given {2}"
-                        .format(b, self._brains[b].memory_space_size * n_agent, len(memory[b])))
+                            .format(b, self._brains[b].memory_space_size * n_agent, len(memory[b])))
                if not ((self._brains[b].action_space_type == "discrete" and len(action[b]) == n_agent) or
                            (self._brains[b].action_space_type == "continuous" and len(
                                action[b]) == self._brains[b].action_space_size * n_agent)):
-                        .format(b, n_agent if self._brains[b].action_space_type == "discrete" else
+                            .format(b, n_agent if self._brains[b].action_space_type == "discrete" else
-                        str(action[b])))
+                                    str(action[b])))
            self._conn.send(b"STEP")
            self._send_action(action, memory, value)
            return self._get_state()
            self._socket.close()
            self._loaded = False
        else:
-            raise UnityEnvironmentException("No Unity environment is loaded.")
+            raise UnityEnvironmentException("No Unity environment is loaded.")