---
# hopper-ppo.yaml
# PPO experiment settings for the Hopper-v1 environment.
# NOTE(review): the nesting below was reconstructed from a flattened listing
# (env/run/config under the experiment name, all hyperparameters under
# `config`) — confirm against the consuming tool's schema.
hopper-ppo:
  env: Hopper-v1
  run: PPO
  config:
    # Works for both torch and tf.
    framework: tf
    gamma: 0.995
    kl_coeff: 1.0
    num_sgd_iter: 20
    lr: 0.0001
    sgd_minibatch_size: 32768
    train_batch_size: 160000
    num_workers: 64
    num_gpus: 4
    batch_mode: complete_episodes
    observation_filter: MeanStdFilter