[🐛 🔨] Adding the ELO to the GlobalTrainingStatus (#5202)

* Adding the ELO to the GlobalTrainingStatus
* Update ml-agents/mlagents/trainers/ghost/trainer.py

Co-authored-by: andrewcoh <54679309+andrewcoh@users.noreply.github.com>
Co-authored-by: andrewcoh <54679309+andrewcoh@users.noreply.github.com>
4 years ago · 640b2e00
--- a/ml-agents/mlagents/trainers/ghost/trainer.py
+++ b/ml-agents/mlagents/trainers/ghost/trainer.py
    BehaviorIdentifiers,
    create_name_behavior_id,
 )
+from mlagents.trainers.training_status import GlobalTrainingStatus, StatusType


 logger = get_logger(__name__)
        self.last_swap: int = 0
        self.last_team_change: int = 0

-        # Chosen because it is the initial ELO in Chess
-        self.initial_elo: float = self_play_parameters.initial_elo
+        self.initial_elo = GlobalTrainingStatus.get_parameter_state(
+            self.brain_name, StatusType.ELO
+        )
+        if self.initial_elo is None:
+            self.initial_elo = self_play_parameters.initial_elo
        self.policy_elos: List[float] = [self.initial_elo] * (
            self.window + 1
        )  # for learning policy
        """
        Forwarding call to wrapped trainers save_model.
        """
+        GlobalTrainingStatus.set_parameter_state(
+            self.brain_name, StatusType.ELO, self.current_elo
+        )
        self.trainer.save_model()

    def create_policy(
--- a/ml-agents/mlagents/trainers/training_status.py
+++ b/ml-agents/mlagents/trainers/training_status.py
    STATS_METADATA = "metadata"
    CHECKPOINTS = "checkpoints"
    FINAL_CHECKPOINT = "final_checkpoint"
+    ELO = "elo"


@attr.s(auto_attribs=True)