您最多选择25个主题
主题必须以中文或者字母或数字开头,可以包含连字符 (-),并且长度不得超过35个字符
132 行
3.4 KiB
132 行
3.4 KiB
using System.Collections;
|
|
using System.Collections.Generic;
|
|
using UnityEngine;
|
|
using MLAgents;
|
|
|
|
public class BouncerAgent : Agent {
|
|
|
|
[Header("Bouncer Specific")]
|
|
public GameObject banana;
|
|
public GameObject bodyObject;
|
|
Rigidbody rb;
|
|
Vector3 lookDir;
|
|
public float strength = 10f;
|
|
float jumpCooldown;
|
|
int numberJumps = 20;
|
|
int jumpLeft = 20;
|
|
|
|
ResetParameters resetParams;
|
|
|
|
public override void InitializeAgent()
|
|
{
|
|
rb = gameObject.GetComponent<Rigidbody>();
|
|
lookDir = Vector3.zero;
|
|
|
|
var academy = FindObjectOfType<Academy>() as Academy;
|
|
resetParams = academy.resetParameters;
|
|
|
|
SetResetParameters();
|
|
}
|
|
|
|
public override void CollectObservations()
|
|
{
|
|
AddVectorObs(gameObject.transform.localPosition);
|
|
AddVectorObs(banana.transform.localPosition);
|
|
}
|
|
|
|
public override void AgentAction(float[] vectorAction, string textAction)
|
|
{
|
|
for (int i = 0; i < vectorAction.Length; i++)
|
|
{
|
|
vectorAction[i] = Mathf.Clamp(vectorAction[i], -1f, 1f);
|
|
}
|
|
float x = vectorAction[0];
|
|
float y = ScaleAction(vectorAction[1], 0, 1);
|
|
float z = vectorAction[2];
|
|
rb.AddForce( new Vector3(x, y+1, z) * strength);
|
|
|
|
AddReward(-0.05f * (
|
|
vectorAction[0] * vectorAction[0] +
|
|
vectorAction[1] * vectorAction[1] +
|
|
vectorAction[2] * vectorAction[2]) / 3f);
|
|
|
|
lookDir = new Vector3(x, y, z);
|
|
}
|
|
|
|
public override void AgentReset()
|
|
{
|
|
|
|
gameObject.transform.localPosition = new Vector3(
|
|
(1 - 2 * Random.value) *5, 2, (1 - 2 * Random.value)*5);
|
|
rb.velocity = default(Vector3);
|
|
GameObject environment = gameObject.transform.parent.gameObject;
|
|
BouncerBanana[] bananas =
|
|
environment.GetComponentsInChildren<BouncerBanana>();
|
|
foreach (BouncerBanana bb in bananas)
|
|
{
|
|
bb.Respawn();
|
|
}
|
|
jumpLeft = numberJumps;
|
|
|
|
SetResetParameters();
|
|
}
|
|
|
|
public override void AgentOnDone()
|
|
{
|
|
|
|
}
|
|
|
|
private void FixedUpdate()
|
|
{
|
|
if (Physics.Raycast(transform.position, new Vector3(0f,-1f,0f), 0.51f) && jumpCooldown <= 0f)
|
|
{
|
|
RequestDecision();
|
|
jumpLeft -= 1;
|
|
jumpCooldown = 0.1f;
|
|
rb.velocity = default(Vector3);
|
|
}
|
|
|
|
jumpCooldown -= Time.fixedDeltaTime;
|
|
|
|
if (gameObject.transform.position.y < -1)
|
|
{
|
|
AddReward(-1);
|
|
Done();
|
|
return;
|
|
}
|
|
|
|
if (gameObject.transform.localPosition.x < -19 || gameObject.transform.localPosition.x >19
|
|
|| gameObject.transform.localPosition.z < -19 || gameObject.transform.localPosition.z > 19)
|
|
{
|
|
AddReward(-1);
|
|
Done();
|
|
return;
|
|
}
|
|
if (jumpLeft == 0)
|
|
{
|
|
Done();
|
|
}
|
|
|
|
}
|
|
|
|
private void Update()
|
|
{
|
|
if (lookDir.magnitude > float.Epsilon)
|
|
{
|
|
bodyObject.transform.rotation = Quaternion.Lerp(bodyObject.transform.rotation,
|
|
Quaternion.LookRotation(lookDir),
|
|
Time.deltaTime * 10f);
|
|
}
|
|
}
|
|
|
|
public void SetBananaScale()
|
|
{
|
|
var banana_scale = resetParams["banana_scale"];
|
|
banana.transform.localScale = new Vector3(banana_scale, banana_scale, banana_scale);
|
|
}
|
|
|
|
public void SetResetParameters()
|
|
{
|
|
SetBananaScale();
|
|
}
|
|
}
|