# Flat settings mapping. Every key is declared exactly once.
#
# Several keys used to appear twice with conflicting values. YAML requires
# mapping keys to be unique: strict loaders reject duplicates, and lenient
# ones silently keep the last occurrence. Each such key now carries the value
# of its last declaration, so a last-wins loader sees the same settings.
# NOTE(review): confirm that the last-declared values are the intended ones.

load_model: true  # was declared twice (false, then true)

encoder_layers: 2
action_layers: 2
policy_layers: 2  # was declared twice (1, then 2)
value_layers: 2  # was declared twice (1, then 2)
feature_size: 128  # was declared twice (64, then 128)
action_feature_size: 128

reuse_encoder: true
in_epoch_alter: false
predict_return: true
use_bisim: false
separate_value_train: true  # was declared twice (false, then true)
in_batch_alter: true

# The value here was empty, which parses as null; written out explicitly.
# NOTE(review): the keys below sit at the top level, not under this key.
# If this was meant to be a parent section, they need to be indented beneath
# it - confirm against the code that consumes this file.
network_settings: null
normalize: true
model_schedule: linear
train_model: false
train_action: false