---
# cartpole-ppo-hyperband.yaml
# Experiment `cartpole-ppo`: runs PPO on the CartPole-v0 environment.
# NOTE(review): the file name mentions hyperband, but no scheduler is
# configured in this file -- presumably the launcher supplies it; confirm.
cartpole-ppo:
  env: CartPole-v0
  run: PPO
  # Presumably how many times the search space below is sampled -- confirm.
  num_samples: 3
  # Stopping thresholds: mean episode reward, and total run time
  # (seconds, judging by the `_s` suffix -- confirm).
  stop:
    episode_reward_mean: 200
    time_total_s: 180
  config:
    # Works for both torch and tf.
    framework: tf
    num_workers: 1
    # The two grid_search keys below span 2 x 3 = 6 value combinations.
    num_sgd_iter:
      grid_search: [1, 4]
    sgd_minibatch_size:
      grid_search: [128, 256, 512]
    observation_filter: MeanStdFilter