|
|
|
|
|
|
config.hyperparameters, batch_size=120, buffer_size=12000, learning_rate=5.0e-3, |
|
|
|
use_bisim=True, predict_return=True, |
|
|
|
# separate_value_train=True, separate_policy_train=True, |
|
|
|
use_var_predict=True, with_prior=True, use_op_buffer=True, in_epoch_alter=True, in_batch_alter=False, |
|
|
|
policy_layers=0, value_layers=0, encoder_layers=2, feature_size=4, |
|
|
|
use_var_predict=True, with_prior=True, use_op_buffer=False, in_epoch_alter=False, in_batch_alter=True, |
|
|
|
policy_layers=1, value_layers=1, encoder_layers=1, feature_size=4, |
|
|
|
#use_inverse_model=True |
|
|
|
) |
|
|
|
config = attr.evolve(config, hyperparameters=new_hyperparams, max_steps=200000, summary_freq=5000) |
|
|
|
|
|
|
) |
|
|
|
new_hyperparams = attr.evolve( |
|
|
|
config.hyperparameters, batch_size=120, buffer_size=12000, use_transfer=True, |
|
|
|
transfer_path=transfer_from, |
|
|
|
use_op_buffer=True, in_epoch_alter=True, in_batch_alter=False, learning_rate=5.0e-3, |
|
|
|
transfer_path=transfer_from, separate_policy_train=True, |
|
|
|
use_op_buffer=True, in_epoch_alter=False, in_batch_alter=True, learning_rate=5.0e-3, |
|
|
|
use_var_predict=True, with_prior=True, policy_layers=1, load_policy=False, |
|
|
|
load_value=False, predict_return=True, value_layers=1, encoder_layers=1, |
|
|
|
use_var_predict=True, with_prior=True, policy_layers=0, load_policy=False, |
|
|
|
load_value=False, predict_return=True, value_layers=0, encoder_layers=2, |
|
|
|
use_bisim=True, |
|
|
|
) |
|
|
|
config = attr.evolve(config, hyperparameters=new_hyperparams, max_steps=300000, summary_freq=5000) |
|
|
|
|
|
|
if __name__ == "__main__": |
|
|
|
for obs in ["rich1", "rich2"]: # ["normal", "rich1", "rich2"]: |
|
|
|
for obs in ["normal", "rich1", "rich2"]: # ["normal", "rich1", "rich2"]: |
|
|
|
+ "_f4_pv-l1_rew_bisim-op_newalter_noreuse-soft0.1") |
|
|
|
+ "_f4_pv-l0_rew_bisim_order-ibalter_noreuse-soft0.1_noop_conlr") |
|
|
|
# for obs in ["normal", "rich1"]: |
|
|
|
# test_2d_transfer(seed=0, obs_spec_type="rich2", |
|
|
|
# transfer_from="./transfer_results/model_"+ obs +"_f4_pv-l0_rew_bisim-op_samelen_s0/Simple", |
|
|
|
# run_id="transfer_rich2_f4_pv-l0_rew_bisim-op_samelen_from_" + obs) |
|
|
|
# for obs in ["normal", "rich2"]: |
|
|
|
# for obs in ["normal"]: |
|
|
|
# test_2d_transfer(seed=0, obs_spec_type="rich1", |
|
|
|
# transfer_from="./transfer_results/model_"+ obs +"_f4_pv-l0_rew_bisim_order-ibalter_noreuse-soft0.1_nostop-op10_linlr_s0/Simple", |
|
|
|
# run_id="transfer_rich1_f4_pv-l0_soft_ibalter_sepp_from_" + obs) |
|
|
|
|
|
|
|
# for obs in ["normal"]: |
|
|
|
# transfer_from="./transfer_results/model_"+ obs +"_f4_pv-l0_rew_bisim-op_new_s0/Simple", |
|
|
|
# run_id="transfer_rich1_f4_pv-l0_rew_bisim-op_new_from" + obs) |
|
|
|
# transfer_from="./transfer_results/model_"+ obs +"_f4_pv-l0_rew_bisim-nop_newalter_noreuse-soft0.1_s0/Simple", |
|
|
|
# run_id="transfer_rich1_retrain-all_f4_pv-l0_rew_bisim-nop_noreuse-soft0.1_from_" + obs) |
|
|
|
# for i in range(5): |
|
|
|
# test_2d_model(seed=i) |