浏览代码

more experiments for self-play

/asymm-envs
Andrew Cohen 4 年前
当前提交
d9f1a2f5
共有 2 个文件被更改,包括 4 次插入36 次删除
  1. 34
      Project/Assets/ML-Agents/Examples/Tennis/Scripts/HitWall.cs
  2. 6
      config/trainer_config.yaml

34
Project/Assets/ML-Agents/Examples/Tennis/Scripts/HitWall.cs


{
public GameObject areaObject;
public int lastAgentHit;
public bool net;
public enum FloorHit
{

m_AgentB.EndEpisode();
m_Area.MatchReset();
lastFloorHit = FloorHit.Service;
net = false;
lastAgentHit = -1;
}
void AgentAWins()

else
{
lastFloorHit = FloorHit.FloorAHit;
//successful serve
if (!net)
{
net = true;
}
}
}
else if (collision.gameObject.name == "floorB")

else
{
lastFloorHit = FloorHit.FloorBHit;
//successful serve
if (!net)
{
net = true;
}
}
}
else if (collision.gameObject.name == "net" && !net)
{
if (lastAgentHit == 0)
{
AgentBWins();
}
else if (lastAgentHit == 1)
{
AgentAWins();
}
}
}

}
else
{
//agent can return serve in the air
if (lastFloorHit != FloorHit.Service && !net)
{
net = true;
}
lastAgentHit = 0;
lastFloorHit = FloorHit.FloorHitUnset;

}
else
{
if (lastFloorHit != FloorHit.Service && !net)
{
net = true;
}
lastAgentHit = 1;
lastFloorHit = FloorHit.FloorHitUnset;
}

6
config/trainer_config.yaml


Goalie:
normalize: false
max_steps: 3.0e7
max_steps: 5.0e7
learning_rate_schedule: constant
batch_size: 2048
buffer_size: 20480

Striker:
normalize: false
max_steps: 3.0e7
max_steps: 5.0e7
learning_rate_schedule: constant
batch_size: 2048
buffer_size: 20480

SoccerTwos:
normalize: false
max_steps: 5.0e7
max_steps: 1.0e8
learning_rate_schedule: constant
batch_size: 2048
buffer_size: 20480

正在加载...
取消
保存