MoveAgent(actionBuffers.DiscreteActions);
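// Small penalty applied on every step to encourage the agent to finish the task quickly.
// NOTE(review): if MaxStep can be 0 (ML-Agents uses 0 to mean "no step limit"), the
// division below yields -Infinity as the reward — confirm MaxStep is always positive.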
AddReward(-1f / MaxStep);
//AddReward(-1f / MaxStep);
}
public override void Heuristic(in ActionBuffers actionsOut)