|
|
|
|
|
|
trainer_params["output_path"] = path1 |
|
|
|
policy = create_policy_mock(trainer_params) |
|
|
|
policy.initialize_or_load() |
|
|
|
policy._set_step(2000) |
|
|
|
policy.save_model(2000) |
|
|
|
|
|
|
|
assert len(os.listdir(tmp_path)) > 0 |
|
|
|
|
|
|
policy2.initialize_or_load() |
|
|
|
_compare_two_policies(policy, policy2) |
|
|
|
assert policy2.get_current_step() == 2000 |
|
|
|
|
|
|
|
# Try initialize from path 1 |
|
|
|
trainer_params["model_path"] = path2 |
|
|
|
|
|
|
|
|
|
|
_compare_two_policies(policy2, policy3) |
|
|
|
# Assert that the steps are 0. |
|
|
|
assert policy3.get_current_step() == 0 |
|
|
|
|
|
|
|
|
|
|
|
def _compare_two_policies(policy1: NNPolicy, policy2: NNPolicy) -> None: |
|
|
|