浏览代码

linear 3dball

/develop/bisim-review
Andrew Cohen 4 年前
当前提交
eace3365
共有 3 个文件被更改,包括 24 次插入和 21 次删除
  1. 15
      config/ppo_transfer/3DBall.yaml
  2. 15
      config/ppo_transfer/3DBallHard.yaml
  3. 15
      config/ppo_transfer/3DBallHardTransfer.yaml

15
config/ppo_transfer/3DBall.yaml


  learning_rate_schedule: linear
  model_schedule: linear
  load_model: false
- encoder_layers: 1
+ encoder_layers: 2
- policy_layers: 1
- forward_layers: 1
- value_layers: 1
- feature_size: 16
+ policy_layers: 0
+ forward_layers: 0
+ value_layers: 2
+ feature_size: 128
  action_feature_size: 32
  reuse_encoder: true
  in_epoch_alter: false

  predict_return: true
  use_bisim: false
- separate_value_train: false
+ separate_value_train: true
+ separate_value_net: true
- hidden_units: 64
+ hidden_units: 128
  num_layers: 1
  vis_encode_type: simple
  reward_signals:

15
config/ppo_transfer/3DBallHard.yaml


  learning_rate_schedule: linear
  model_schedule: linear
  load_model: false
- encoder_layers: 1
+ encoder_layers: 2
- policy_layers: 1
- forward_layers: 1
- value_layers: 1
- feature_size: 16
+ policy_layers: 0
+ forward_layers: 0
+ value_layers: 2
+ feature_size: 128
  action_feature_size: 32
  reuse_encoder: true
  in_epoch_alter: false

  predict_return: true
  use_bisim: false
- separate_value_train: false
+ separate_value_train: true
+ separate_value_net: true
- hidden_units: 64
+ hidden_units: 128
  num_layers: 1
  vis_encode_type: simple
  reward_signals:

15
config/ppo_transfer/3DBallHardTransfer.yaml


  num_epoch: 3
  learning_rate_schedule: linear
  model_schedule: linear
- encoder_layers: 1
+ encoder_layers: 2
- policy_layers: 1
- forward_layers: 1
- value_layers: 1
- feature_size: 16
+ policy_layers: 0
+ forward_layers: 0
+ value_layers: 2
+ feature_size: 128
  action_feature_size: 32
  reuse_encoder: true
  in_epoch_alter: false

  predict_return: true
  use_bisim: false
- separate_value_train: false
+ separate_value_train: true
+ separate_value_net: true
  train_model: false
  load_model: true
  train_action: false

  in_batch_alter: true
  network_settings:
  normalize: true
- hidden_units: 64
+ hidden_units: 128
  num_layers: 1
  vis_encode_type: simple
  reward_signals:

正在加载...
取消
保存