|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize("use_discrete", [True, False]) |
|
|
|
def test_recurrent_sac(use_discrete): |
|
|
|
step_size = 0.2 if use_discrete else 0.8 |
|
|
|
step_size = 0.2 if use_discrete else 0.5 |
|
|
|
env = MemoryEnvironment( |
|
|
|
[BRAIN_NAME], use_discrete=use_discrete, step_size=step_size |
|
|
|
) |
|
|
|
|
|
|
) |
|
|
|
new_hyperparams = attr.evolve( |
|
|
|
SAC_TF_CONFIG.hyperparameters, |
|
|
|
batch_size=128, |
|
|
|
batch_size=256, |
|
|
|
learning_rate=1e-3, |
|
|
|
buffer_init_steps=1000, |
|
|
|
steps_per_update=2, |
|
|
|
|
|
|
hyperparameters=new_hyperparams, |
|
|
|
network_settings=new_networksettings, |
|
|
|
max_steps=4000, |
|
|
|
max_steps=2000, |
|
|
|
framework=FrameworkType.TENSORFLOW, |
|
|
|
) |
|
|
|
_check_environment_trains(env, {BRAIN_NAME: config}) |
|
|
|