two-step-game-maddpg.yaml 987 B

1234567891011121314151617181920212223242526272829303132333435
  # Experiment definition: run the MADDPG algorithm on the TwoStepGame
  # example environment.
  two-step-game-maddpg:
    env: ray.rllib.examples.env.two_step_game.TwoStepGame
    run: MADDPG
    # Stopping criteria for the run (a reward threshold and a timestep budget).
    stop:
      sampler_results/episode_reward_mean: 7.2
      timesteps_total: 20000
    config:
      # MADDPG only supports tf for now.
      framework: tf
      # NOTE(review): `env_config` is nested inside `env_config`; kept exactly
      # as found. Confirm against the environment that this shape is expected.
      env_config:
        env_config:
          actions_are_logits: true
      num_steps_sampled_before_learning_starts: 200
      multiagent:
        # One policy per agent; each entry is a 4-item list whose last item
        # carries the per-policy `agent_id`.
        # NOTE(review): presumably the items are (policy class, observation
        # space, action space, config overrides) with `null` meaning "use the
        # default" -- verify against the RLlib multi-agent documentation.
        policies:
          p0:
            - null
            - null
            - null
            - {agent_id: 0}
          p1:
            - null
            - null
            - null
            - {agent_id: 1}
        # YAML-capable policy_mapping_fn definition via providing a callable
        # class here.
        policy_mapping_fn:
          type: ray.rllib.examples.multi_agent_and_self_play.policy_mapping_fn.PolicyMappingFn