---
# Experiment definition: DQN on CartPole-v0 using ParameterNoise exploration.
# NOTE(review): the nesting below was reconstructed from a flattened copy of
# this file (indentation was lost); confirm it against the consumer's schema.
cartpole-dqn-w-param-noise:
  env: CartPole-v0
  run: DQN

  # Stopping criteria for the experiment.
  stop:
    episode_reward_mean: 150
    timesteps_total: 300000

  # Algorithm configuration passed to the DQN run.
  config:
    # Works for both torch and tf.
    framework: tf

    # Exploration strategy and its settings.
    exploration_config:
      type: ParameterNoise
      random_timesteps: 10000
      initial_stddev: 1.0

    batch_mode: complete_episodes
    lr: 0.0008
    num_workers: 0

    # Network settings: two hidden layers of 32 units, tanh activation.
    model:
      fcnet_hiddens: [32, 32]
      fcnet_activation: tanh