---
# pong-rainbow.yaml
#
# Experiment `pong-deterministic-rainbow`: runs `DQN` on the
# `PongDeterministic-v4` environment with the settings under `config`.
#
# NOTE(review): this file was recovered from a flattened copy in which every
# line sat at the same indent. The nesting below (in particular which keys
# belong to `exploration_config` and `model`) was reconstructed from the
# option names -- confirm against the upstream file before relying on it.
pong-deterministic-rainbow:
  env: PongDeterministic-v4
  run: DQN

  # Stop criterion for the run.
  stop:
    episode_reward_mean: 20

  config:
    num_atoms: 51
    noisy: true
    gamma: 0.99
    lr: 0.0001
    hiddens: [512]
    learning_starts: 10000
    buffer_size: 50000
    rollout_fragment_length: 4
    train_batch_size: 32

    # NOTE(review): epsilon_timesteps is only 2 and final_epsilon is 0.0;
    # presumably intentional because `noisy: true` is set -- confirm.
    exploration_config:
      epsilon_timesteps: 2
      final_epsilon: 0.0

    target_network_update_freq: 500

    prioritized_replay: true
    prioritized_replay_alpha: 0.5
    final_prioritized_replay_beta: 1.0
    prioritized_replay_beta_annealing_timesteps: 400000

    n_step: 3

    # NOTE(review): verify that `gpu` is a key recognised by the RLlib
    # version this file is used with.
    gpu: true

    model:
      grayscale: true
      zero_mean: false
      dim: 42