# cartpole-appo-vtrace.yaml
#
# Experiment definition: run the APPO algorithm on the CartPole-v0
# environment with V-trace enabled.
---
cartpole-appo-vtrace:
  env: CartPole-v0
  run: APPO
  # Stopping criteria.
  # NOTE(review): presumably the run ends as soon as either threshold is
  # reached -- confirm against the experiment runner's `stop` semantics.
  stop:
    episode_reward_mean: 180
    timesteps_total: 200000
  config:
    # Works for both torch and tf.
    framework: tf
    num_envs_per_worker: 5
    num_workers: 4
    num_gpus: 0
    observation_filter: MeanStdFilter
    num_sgd_iter: 1
    vf_loss_coeff: 0.01
    vtrace: true
    vtrace_drop_last_ts: false
    model:
      # Single hidden layer of 32 units with a linear activation.
      fcnet_hiddens: [32]
      fcnet_activation: linear
      vf_share_layers: true