|
|
|
|
|
|
PPO_TF_CONFIG, |
|
|
|
hyperparameters=new_hyperparams, |
|
|
|
network_settings=new_networksettings, |
|
|
|
max_steps=400, |
|
|
|
max_steps=500, |
|
|
|
summary_freq=100, |
|
|
|
framework=FrameworkType.TENSORFLOW, |
|
|
|
) |
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize("use_discrete", [True, False]) |
|
|
|
def test_recurrent_sac(use_discrete): |
|
|
|
step_size = 0.5 if use_discrete else 0.2 |
|
|
|
step_size = 0.2 if use_discrete else 0.5 |
|
|
|
env = MemoryEnvironment( |
|
|
|
[BRAIN_NAME], use_discrete=use_discrete, step_size=step_size |
|
|
|
) |
|
|
|