dqn-LunarLander-v2 / config.yml
nsanghi's picture
Initial commit
e6ac2d1
raw
history blame
474 Bytes
# Hyperparameter set stored as a Python OrderedDict.
#
# Structure: the `python/object/apply` tag calls collections.OrderedDict with
# the top-level sequence as its positional arguments. That sequence must hold
# exactly ONE element -- a list of [key, value] pairs -- so every pair below is
# nested two levels under the first "- ". Flattening the indentation turns each
# key and value into a separate positional argument and breaks construction.
#
# SECURITY: this tag constructs an arbitrary Python object on load. PyYAML's
# yaml.safe_load rejects it; a loader that permits Python object construction
# (e.g. yaml.UnsafeLoader) is required. Only load this file from a trusted
# source.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 128
  - - buffer_size
    - 50000
  - - exploration_final_eps
    - 0.1
  - - exploration_fraction
    - 0.12
  - - gamma
    - 0.99
  # NOTE(review): negative value; presumably a sentinel interpreted by the
  # training code rather than a literal step count -- confirm with the consumer.
  - - gradient_steps
    - -1
  - - learning_rate
    - 0.00063
  - - learning_starts
    - 0
  # Stored as a float (100000.0), not an int; presumably converted by the
  # consumer before use -- verify.
  - - n_timesteps
    - 100000.0
  - - policy
    - MlpPolicy
  # This value is a plain YAML string containing a Python expression, not a
  # YAML mapping; presumably evaluated by the consumer -- verify.
  - - policy_kwargs
    - dict(net_arch=[256, 256])
  - - target_update_interval
    - 250
  - - train_freq
    - 4