---
# PPO experiment definition covering four Atari environments.
# Runs on a single g3.16xl node
# See https://github.com/ray-project/rl-experiments for results
atari-ppo:
  env:
    # NOTE(review): presumably expands to one trial per listed environment
    # -- confirm against the consumer of this file.
    grid_search:
      - BreakoutNoFrameskip-v4
      - BeamRiderNoFrameskip-v4
      - QbertNoFrameskip-v4
      - SpaceInvadersNoFrameskip-v4
  run: PPO
  config:
    # Works for both torch and tf.
    framework: tf
    lambda: 0.95
    kl_coeff: 0.5
    clip_rewards: true
    clip_param: 0.1
    vf_clip_param: 10.0
    entropy_coeff: 0.01
    train_batch_size: 5000
    rollout_fragment_length: 100
    sgd_minibatch_size: 500
    num_sgd_iter: 10
    num_workers: 10
    num_envs_per_worker: 5
    batch_mode: truncate_episodes
    observation_filter: NoFilter
    model:
      vf_share_layers: true
    # NOTE(review): num_gpus is kept at the config level rather than under
    # model -- confirm this matches the intended nesting.
    num_gpus: 1