# Hyperparameter overrides for the WalkerDynamic section.
WalkerDynamic:
  normalize: true
  # Superseded values, kept for reference only. They used to be live keys
  # that were defined a second time further down; duplicate keys are invalid
  # YAML and lenient loaders silently keep only the last occurrence.
  # num_epoch: 3
  # time_horizon: 1000
  # batch_size: 2048
  # learning_rate_schedule: constant
  # Active values (the ones a last-wins loader was already using).
  num_epoch: 6
  time_horizon: 2048
  batch_size: 4096
  # learning_rate: 1.0e-3
  num_layers: 3
  hidden_units: 512
  # NOTE(review): no nested entries follow this key, so it loads as null.
  # Confirm whether an `extrinsic` entry (see the commented-out section
  # below) was meant to be kept here.
  reward_signals:
# WalkerDynamic:
# normalize: true
# num_epoch: 3
# time_horizon: 1000
# batch_size: 2048
# buffer_size: 20480
# max_steps: 2e7
# # max_steps: 1e8
# summary_freq: 30000
# num_layers: 3
# hidden_units: 512
# reward_signals:
# extrinsic:
# strength: 1.0
# gamma: 0.995
WalkerStatic: