# cartpole-ppo.yaml
#
# Experiment definition named `cartpole-ppo`: runs `PPO` on `CartPole-v0`.
# NOTE(review): the nesting below was reconstructed from a flattened listing
# (indentation had been lost); confirm it against the consumer's schema.
---
cartpole-ppo:
  env: CartPole-v0
  run: PPO

  # Stopping criteria.
  # NOTE(review): presumably the run ends as soon as either threshold is
  # reached — confirm with the experiment runner's documentation.
  stop:
    episode_reward_mean: 150
    timesteps_total: 100000

  # Settings handed to the `PPO` run selected above.
  config:
    # Works for both torch and tf.
    framework: tf
    gamma: 0.99
    lr: 0.0003
    num_workers: 1
    observation_filter: MeanStdFilter
    num_sgd_iter: 6
    vf_loss_coeff: 0.01

    # Network settings: one hidden layer of width 32 with a linear activation.
    model:
      fcnet_hiddens: [32]
      fcnet_activation: linear
      vf_share_layers: true