gamma: 0.99
strength: 1.0
keep_checkpoints: 5
# max_steps was previously declared twice in this mapping (10000000, then
# 4000000). Duplicate mapping keys are invalid YAML; loaders that tolerate
# them typically keep the last occurrence, so the later value is retained
# here as the single definition.
# NOTE(review): confirm that 4000000 (not 10000000) is the intended value.
max_steps: 4000000
time_horizon: 64
summary_freq: 10000