# Hyperparameter set serialized as a Python OrderedDict.
#
# Layout: the tag below calls collections.OrderedDict with a single positional
# argument, which is a list of [key, value] pairs; pair order is preserved.
#
# NOTE(review): the `!!python/object/apply` tag is PyYAML-specific and is not
# constructed by `yaml.safe_load`; loading it requires a loader that is allowed
# to call Python objects. Only load this file from a trusted source.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 256
  # Stored as a plain string, not a number; presumably the consumer parses
  # the `lin_` prefix as a schedule specification -- TODO confirm.
  - - clip_range
    - lin_0.2
  - - ent_coef
    - 0.001
  - - gae_lambda
    - 0.95
  - - gamma
    - 0.999
  # Same string form as clip_range above (`lin_` prefix + value).
  - - learning_rate
    - lin_3e-4
  - - n_envs
    - 32
  - - n_epochs
    - 10
  - - n_steps
    - 256
  # Written as a float (1e8), not an integer.
  - - n_timesteps
    - 100000000.0
  - - normalize
    - true
  - - policy
    - MlpLstmPolicy
  # The value is a single plain string containing a Python `dict(...)`
  # expression (it references `nn.ReLU`); presumably the consumer evaluates it
  # with `nn` in scope -- TODO confirm against the loader.
  - - policy_kwargs
    - dict( ortho_init=False, activation_fn=nn.ReLU, lstm_hidden_size=64, enable_critic_lstm=True, net_arch=dict(pi=[64], vf=[64]) )