[skip ci] continue training until worker-0 is done

5 年前 · 455adc60
--- a/ml-agents/mlagents/trainers/trainer/trainer.py
+++ b/ml-agents/mlagents/trainers/trainer/trainer.py
 from mlagents.trainers.policy import Policy
 from mlagents.trainers.exception import UnityTrainerException
 from mlagents_envs.timers import hierarchical_timer
+import horovod.tensorflow as hvd


 logger = logging.getLogger("mlagents.trainers")
        stop training if it wasn't training to begin with, or if max_steps
        is reached.
        """
-        return self.is_training and self.get_step <= self.get_max_steps
+        if hvd.rank() == 0:
+            logger.info("Worker = 0, step = %s", self.get_step)
+            return self.is_training and self.get_step <= self.get_max_steps
+        else:
+            logger.info("Worker = %s, step = %s", (hvd.rank(), self.get_step))
+            return True

    @property
    def reward_buffer(self) -> Deque[float]: