# halfcheetah-pybullet-sac.yaml
---
# Experiment definition: runs SAC on HalfCheetahBulletEnv-v0.
halfcheetah-pybullet-sac:
  env: HalfCheetahBulletEnv-v0
  run: SAC
  # Stopping criterion for the run.
  stop:
    episode_reward_mean: 800.0
  config:
    # Works for both torch and tf.
    framework: tf
    horizon: 1000
    soft_horizon: false
    # Q-network: two hidden layers of 256 units with relu activation.
    Q_model:
      fcnet_activation: relu
      fcnet_hiddens: [256, 256]
    # Policy network: same layout as the Q-network.
    policy_model:
      fcnet_activation: relu
      fcnet_hiddens: [256, 256]
    tau: 0.005
    target_entropy: auto
    no_done_at_end: false
    n_step: 3
    rollout_fragment_length: 1
    prioritized_replay: true
    train_batch_size: 256
    target_network_update_freq: 1
    timesteps_per_iteration: 1000
    learning_starts: 10000
    # Separate learning rates for the actor, critic and entropy terms.
    optimization:
      actor_learning_rate: 0.0003
      critic_learning_rate: 0.0003
      entropy_learning_rate: 0.0003
    num_workers: 0
    num_gpus: 1
    metrics_smoothing_episodes: 5