|
|
|
|
|
|
save_replay_buffer: false |
|
|
|
init_entcoef: 1.0 |
|
|
|
reward_signal_steps_per_update: 10.0 |
|
|
|
encoder_layers: 1 |
|
|
|
policy_layers: 1 |
|
|
|
encoder_layers: 2 |
|
|
|
policy_layers: 0 |
|
|
|
feature_size: 16 |
|
|
|
feature_size: 64 |
|
|
|
# separate_value_net: true |
|
|
|
separate_policy_train: true |
|
|
|
# separate_value_train: true |
|
|
|
|
|
|
train_model: false |
|
|
|
load_policy: true |
|
|
|
load_value: true |
|
|
|
transfer_path: "results/sac-ball-f16-e1p1f0/3DBall" |
|
|
|
transfer_path: "results/ball-linear-s0/3DBall" |
|
|
|
network_settings: |
|
|
|
normalize: true |
|
|
|
hidden_units: 128 |
|
|
|