num_epoch: 3
learning_rate_schedule: linear
# Network architecture settings.
# The child keys are indented so they belong to `network_settings`; written
# at the same column they would be sibling keys next to an empty (null)
# `network_settings` value.
# `normalize` and `hidden_units` were each listed twice (true / 64, then
# false / 128). Duplicate keys are invalid in YAML 1.2 and most parsers
# silently keep the last occurrence, so only the later values are kept here.
# NOTE(review): confirm that false / 128 (not true / 64) are the intended
# values.
network_settings:
  normalize: false
  hidden_units: 128
  num_layers: 2
  vis_encode_type: simple
reward_signals: