---
# cartpole-sac.yaml
#
# Experiment definition: runs SAC on the CartPole-v0 environment.
# NOTE(review): the mapping hierarchy below was rebuilt from the key names
# because the original indentation was lost; confirm against the schema of
# the tool that consumes this file.
cartpole-sac:
  env: CartPole-v0
  run: SAC
  # Stopping thresholds. Presumably the run ends as soon as either one is
  # reached — TODO confirm with the consumer's documentation.
  stop:
    episode_reward_mean: 100
    timesteps_total: 100000
  config:
    # Works for both torch and tf.
    framework: tf
    gamma: 0.95
    no_done_at_end: false
    target_network_update_freq: 32
    tau: 1.0
    # initial_alpha: 0.5
    train_batch_size: 32
    optimization:
      actor_learning_rate: 0.005
      critic_learning_rate: 0.005
      entropy_learning_rate: 0.0001
    # NOTE(review): the original nesting level of the disabled keys below is
    # unknown; verify where each belongs before uncommenting.
    # grad_norm_clipping: 40.0
    # evaluation_config:
    #   explore: true