# Scalar settings that sit alongside the self_play section.
time_horizon: 50
normalize: true
# Options for self_play are nested beneath it. When they are left at the
# parent's indentation, `self_play:` parses as null and the options become
# its sibling keys instead of its children.
self_play:
  # `window` used to be listed twice at this level (10, then 100). Duplicate
  # mapping keys are invalid YAML and most parsers silently keep the last
  # value, so 100 is retained as the effective setting.
  # NOTE(review): confirm that 100, not 10, is the intended window.
  window: 100
  play_against_latest_model_ratio: 0.5
  save_steps: 50000
  swap_steps: 2000