The Unity Machine Learning Agents Toolkit (ML-Agents) is an open-source project that enables games and simulations to serve as environments for training intelligent agents.
using UnityEngine;
using System.Collections.Generic;
using System;
using Unity.MLAgents.Actuators;
using Unity.MLAgents.Sensors;

namespace Unity.MLAgents.Policies
{
    /// <summary>
    /// The Remote Policy only works when training.
    /// When training your Agents, the RemotePolicy will be controlled by Python.
    /// </summary>
    internal class RemotePolicy : IPolicy
    {
        int m_AgentId;
        string m_FullyQualifiedBehaviorName;
        SpaceType m_SpaceType;
        ActionBuffers m_LastActionBuffer;

        internal ICommunicator m_Communicator;

        /// <inheritdoc />
        public RemotePolicy(
            ActionSpec actionSpec,
            string fullyQualifiedBehaviorName)
        {
            m_FullyQualifiedBehaviorName = fullyQualifiedBehaviorName;
            m_Communicator = Academy.Instance.Communicator;
            m_Communicator.SubscribeBrain(m_FullyQualifiedBehaviorName, actionSpec);
            actionSpec.CheckNotHybrid();
            m_SpaceType = actionSpec.NumContinuousActions > 0 ? SpaceType.Continuous : SpaceType.Discrete;
        }

        /// <inheritdoc />
        public void RequestDecision(AgentInfo info, List<ISensor> sensors)
        {
            m_AgentId = info.episodeId;
            m_Communicator?.PutObservations(m_FullyQualifiedBehaviorName, info, sensors);
        }

        /// <inheritdoc />
        public ref readonly ActionBuffers DecideAction()
        {
            m_Communicator?.DecideBatch();
            var actions = m_Communicator?.GetActions(m_FullyQualifiedBehaviorName, m_AgentId);
            // TODO figure out how to handle this with multiple space types.
            if (m_SpaceType == SpaceType.Continuous)
            {
                m_LastActionBuffer = new ActionBuffers(actions, Array.Empty<int>());
                return ref m_LastActionBuffer;
            }
            m_LastActionBuffer = ActionBuffers.FromDiscreteActions(actions);
            return ref m_LastActionBuffer;
        }

        public void Dispose()
        {
        }
    }
}
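
For context, the IPolicy contract that RemotePolicy fulfils (RequestDecision receives the agent's observations, DecideAction returns the resulting ActionBuffers) can be illustrated without a Python trainer. The ConstantPolicy below is a hypothetical sketch, not part of the ML-Agents package: it always answers with zero-valued actions shaped to the ActionSpec, using only the types and calls already visible in RemotePolicy above, plus ActionSpec.NumDiscreteActions, which is assumed here.

using System;
using System.Collections.Generic;
using Unity.MLAgents.Actuators;
using Unity.MLAgents.Sensors;

namespace Unity.MLAgents.Policies
{
    /// <summary>
    /// Hypothetical sketch of an IPolicy that always returns zero-valued actions.
    /// It follows the same contract as RemotePolicy: observations arrive through
    /// RequestDecision, and DecideAction hands back an ActionBuffers.
    /// </summary>
    internal class ConstantPolicy : IPolicy
    {
        readonly ActionSpec m_ActionSpec;
        ActionBuffers m_LastActionBuffer;

        public ConstantPolicy(ActionSpec actionSpec)
        {
            actionSpec.CheckNotHybrid();
            m_ActionSpec = actionSpec;
        }

        public void RequestDecision(AgentInfo info, List<ISensor> sensors)
        {
            // A real policy would forward or evaluate the observations here;
            // this sketch ignores them and always answers with zeros.
        }

        public ref readonly ActionBuffers DecideAction()
        {
            if (m_ActionSpec.NumContinuousActions > 0)
            {
                // Continuous space: one zero per continuous action.
                m_LastActionBuffer = new ActionBuffers(
                    new float[m_ActionSpec.NumContinuousActions], Array.Empty<int>());
            }
            else
            {
                // Discrete space: zero index for every branch
                // (ActionSpec.NumDiscreteActions is an assumption in this sketch).
                m_LastActionBuffer = ActionBuffers.FromDiscreteActions(
                    new float[m_ActionSpec.NumDiscreteActions]);
            }
            return ref m_LastActionBuffer;
        }

        public void Dispose()
        {
        }
    }
}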