# NOTE(review): forward_layers, value_layers and in_batch_alter were each
# declared more than once in this file. Duplicate mapping keys are invalid
# YAML; strict loaders reject them and lenient loaders silently keep the last
# occurrence. Each key now appears exactly once, carrying its last-occurrence
# value, so last-wins loaders see the same settings as before.
# TODO: confirm the retained values are the intended ones.
forward_layers: 2  # earlier duplicate value 1 dropped
value_layers: 2  # earlier duplicate values 1 and 3 dropped
feature_size: 16
separate_policy_train: true
reuse_encoder: false
in_epoch_alter: false
in_batch_alter: true  # earlier duplicate value false dropped
encoder_layers: 2
policy_layers: 1