Upload PPO LunarLander-v2 trained agent
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +2 -2
- ppo-LunarLander-v2/data +9 -9
- ppo-LunarLander-v2/policy.optimizer.pth +1 -1
- ppo-LunarLander-v2/policy.pth +1 -1
- results.json +1 -1
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 281.38 +/- 17.97
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7c4a07a050>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7c4a07a0e0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7c4a07a170>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7c4a07a200>", "_build": "<function ActorCriticPolicy._build at 0x7f7c4a07a290>", "forward": "<function ActorCriticPolicy.forward at 0x7f7c4a07a320>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7c4a07a3b0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f7c4a07a440>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7c4a07a4d0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7c4a07a560>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7c4a07a5f0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f7c4a071d40>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 2031616, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1674250808773494007, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVDQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMbS9ob21lL2NocmlzL2FuYWNvbmRhMy9lbnZzL2RlZXBfcmxfY2xhc3NfdW5pdDEvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjG0vaG9tZS9jaHJpcy9hbmFjb25kYTMvZW52cy9kZWVwX3JsX2NsYXNzX3VuaXQxL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAJpHBL24vva54Cc/uiIOHjaH9i674rxeOQAAgD8AAIA/Zr32vC7Rrz8Oexa//h/FvlKQczx8PT+8AAAAAAAAAAAzTwc8Hz3wuf4yyDtxfcY3JozguoScjTYAAIA/AACAPzN7ibtS0Pe5+rrBurxESzQtjzi6oPTiOQAAgD8AAIA/zaBNPClQLbp29ou7u2UGuZN0HjnCspM4AACAPwAAgD9NDaa94WCBuvXy/7k5izY1M5LGOgpKFTkAAIA/AACAP2atjbz2RC669GSVu5T26jfSTpC5/hMitwAAgD8AAIA/mo3HvFwHXLoj6US6XrbstQqrhDva52E5AACAPwAAgD8z3iG9b/0DPpuP0D1h4om+oJWhPFIMET4AAAAAAAAAAGbm0TuJjgM9QJBVOwYPnb6uSsq8QYrBPAAAAAAAAAAAZgbVvI82TLq6m+O6JJIbtnF2kztugQU6AACAPwAAgD96YSS+17xeuzj1qLs+KQ25+EeSPKUC8TkAAIA/AACAP3NdiD0b87w/blEPP6H0BD6Xgtw83pJiPgAAAAAAAAAAs07bPcO9MroKgps5VU4LNcnxcjtn27W4AACAPwAAgD9myNo8XGtkulAZ87r8HD+210nKOjZaCToAAIA/AACAP42bYr7Qmt8+NqWwPgmOuL4rl8W8OaCbPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVeRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIu9HHfMA0aECUhpRSlIwBbJRN6AOMAXSUR0D1QWU09QoDdX2UKGgGaAloD0MIjq89syRaZkCUhpRSlGgVTegDaBZHQPVBbUlLOA11fZQoaAZoCWgPQwg1tteC3u9mQJSGlFKUaBVN6ANoFkdA9UFuwh4dIXV9lChoBmgJaA9DCLfte9Rf5GBAlIaUUpRoFU3oA2gWR0D1QXK7w8W9dX2UKGgGaAloD0MITMecZ+wKZkCUhpRSlGgVTegDaBZHQPVBdretSyd1fZQoaAZoCWgPQwgSh2wg3dhnQJSGlFKUaBVN6ANoFkdA9UF3WrwOOXV9lChoBmgJaA9DCMgIqHAErmFAlIaUUpRoFU3oA2gWR0D1QXd9YOlPdX2UKGgGaAloD0MIUI4CREGJZUCUhpRSlGgVTegDaBZHQPVBeEUEgW91fZQoaAZoCWgPQwgoZOdt7HNkQJSGlFKUaBVN6ANoFkdA9UF7dx2jf3V9lChoBmgJaA9DCEBpqFFISWdAlIaUUpRoFU3oA2gWR0D1QXuTLW7OdX2UKGgGaAloD0MI4UIewY2iQUCUhpRSlGgVS4RoFkdA9UF71z6rNnV9lChoBmgJaA9DCATLETKQFmlAlIaUUpRoFU3oA2gWR0D1QXwUPhAGdX2UKGgGaAloD0MIweYcPBPoTUCUhpRSlGgVS5loFkdA9UGIi83+/HV9lChoBmgJaA9DCPMgPUUOeGRAlIaUUpRoFU3oA2gWR0D1QZdZjx0/dX2UKGgGaAloD0MIiSZQxKKuZUCUhpRSlGgVTegDaBZHQPVBm9U4rBl1fZQoaAZoCWgPQwj3WztREuhkQJSGlFKUaBVN6ANoFkdA9UGzTSThYXV9lChoBmgJaA9DCKJCdXNxSmdAlIaUUpRoFU3oA2gWR0D1QcRzqbBodX2UKGgGaAloD0MI/g+wVm2RZ0CUhpRSlGgVTegDaBZHQPVBx0WweNl1fZQoaAZoCWgPQwi1/MBVnppkQJSGlFKUaBVN6ANoFkdA9UHd7xAjZHV9lChoBmgJaA9DCCEhyhc0pGhAlIaUUpRoFU3oA2gWR0D1QefrDIikdX2UKGgGaAloD0MI/MOWHs1YZUCUhpRSlGgVTegDaBZHQPVB7DPt2LZ1fZQoaAZoCWgPQwiIK2fvDJVkQJSGlFKUaBVN6ANoFkdA9UHwpTMq0HV9lChoBmgJaA9DCNGvrZ9+XGJAlIaUUpRoFU3oA2gWR0D1QfFtBfKIdX2UKGgGaAloD0MIaqSl8va/ZECUhpRSlGgVTegDaBZHQPVB8ZdTo+x1fZQoaAZoCWgPQwh23VuRmBRhQJSGlFKUaBVN6ANoFkdA9UHyj8gp0HV9lChoBmgJaA9DCDYgQlw5sF5AlIaUUpRoFU3oA2gWR0D1QfYynk1edX2UKGgGaAloD0MIf0xr09i8YECUhpRSlGgVTegDaBZHQPVB9rUvwmV1fZQoaAZoCWgPQwhUxr/POABkQJSGlFKUaBVN6ANoFkdA9UH3AnQY13V9lChoBmgJaA9DCLABEeLKW2JAlIaUUpRoFU3oA2gWR0D1QgNT4cm0dX2UKGgGaAloD0MIa5vicVFEYkCUhpRSlGgVTegDaBZHQPVC0T6KtPp1fZQoaAZoCWgPQwiZ8iGomkZmQJSGlFKUaBVN6ANoFkdA9ULVgdsBQ3V9lChoBmgJaA9DCDhJ88e0LWhAlIaUUpRoFU3oA2gWR0D1Quz8vmHQdX2UKGgGaAloD0MINGWnH1SEY0CUhpRSlGgVTegDaBZHQPVC/lsnAqN1fZQoaAZoCWgPQwhLHk/LjzNnQJSGlFKUaBVN6ANoFkdA9UMA9gnc+XV9lChoBmgJaA9DCG3IPzMIq2ZAlIaUUpRoFU3oA2gWR0D1QxduwosqdX2UKGgGaAloD0MIuFonLkc/ZECUhpRSlGgVTegDaBZHQPVDIpcLSeB1fZQoaAZoCWgPQwhJ88e0NkxgQJSGlFKUaBVN6ANoFkdA9UMnNTtLMHV9lChoBmgJaA9DCJMcsKvJ3mZAlIaUUpRoFU3oA2gWR0D1Qyue8PFvdX2UKGgGaAloD0MIoBnEB/Z6YkCUhpRSlGgVTegDaBZHQPVDLF5Rjz91fZQoaAZoCWgPQwis4SL3dFpjQJSGlFKUaBVN6ANoFkdA9UMsghStNnV9lChoBmgJaA9DCKVKlL0lH2NAlIaUUpRoFU3oA2gWR0D1Qy1fbKzSdX2UKGgGaAloD0MILQsm/qjfY0CUhpRSlGgVTegDaBZHQPVDMUYZVGV1fZQoaAZoCWgPQwhYIHpSJjZkQJSGlFKUaBVN6ANoFkdA9UMxut4iYHV9lChoBmgJaA9DCD0Og/krk2VAlIaUUpRoFU3oA2gWR0D1QzILzf78dX2UKGgGaAloD0MIU7MHWoH9YUCUhpRSlGgVTegDaBZHQPVDQpg3Lmp1fZQoaAZoCWgPQwhTswdagZxQQJSGlFKUaBVLuWgWR0D1Q0aKJEYwdX2UKGgGaAloD0MIIm5OJQOrY0CUhpRSlGgVTegDaBZHQPVDUcep4r11fZQoaAZoCWgPQwjWOQZkr0NmQJSGlFKUaBVN6ANoFkdA9UNVvIwM6XV9lChoBmgJaA9DCMGQ1a0e/GNAlIaUUpRoFU3oA2gWR0D1Q21PykKvdX2UKGgGaAloD0MI4lmCjICGY0CUhpRSlGgVTegDaBZHQPVDfd1q33J1fZQoaAZoCWgPQwg3ixcLQ45mQJSGlFKUaBVN6ANoFkdA9UOAX2RJVnV9lChoBmgJaA9DCE8+Pbbl62dAlIaUUpRoFU3oA2gWR0D1Q5h0+1SgdX2UKGgGaAloD0MIcAnAP6WCZkCUhpRSlGgVTegDaBZHQPVDor3WWhR1fZQoaAZoCWgPQwjGFoIcFHZiQJSGlFKUaBVN6ANoFkdA9UOnFXiiqXV9lChoBmgJaA9DCA+BI4EGHmVAlIaUUpRoFU3oA2gWR0D1Q6uJWeYldX2UKGgGaAloD0MIlPdxNMeUZECUhpRSlGgVTegDaBZHQPVDrEzJp351fZQoaAZoCWgPQwhGDDuMyRFlQJSGlFKUaBVN6ANoFkdA9UOsddNWVHV9lChoBmgJaA9DCCrj32dcm2FAlIaUUpRoFU3oA2gWR0D1Q61jFAE/dX2UKGgGaAloD0MIkUYFTrbDS0CUhpRSlGgVS6poFkdA9UOvKLGaQXV9lChoBmgJaA9DCOnvpfAg72ZAlIaUUpRoFU3oA2gWR0D1Q7FGEf1ZdX2UKGgGaAloD0MIP5C8cyitaUCUhpRSlGgVTegDaBZHQPVDsg4rBj51fZQoaAZoCWgPQwix22eVmaZkQJSGlFKUaBVN6ANoFkdA9UPCbIDHO3V9lChoBmgJaA9DCKHyr+UVUGJAlIaUUpRoFU3oA2gWR0D1Q8ZjQRf4dX2UKGgGaAloD0MIERjrGxg4YUCUhpRSlGgVTegDaBZHQPVEoGF8G9p1fZQoaAZoCWgPQwjlRpG1hn9mQJSGlFKUaBVN6ANoFkdA9USkUZaV2XV9lChoBmgJaA9DCEbSbvQxI05AlIaUUpRoFUuQaBZHQPVEtvDKoyd1fZQoaAZoCWgPQwgGZ/D3izdfQJSGlFKUaBVN6ANoFkdA9US7oqwyI3V9lChoBmgJaA9DCGJlNPL5UWVAlIaUUpRoFU3oA2gWR0D1RMr7Qb++dX2UKGgGaAloD0MIUMdjBqqWYUCUhpRSlGgVTegDaBZHQPVEzYw9JSR1fZQoaAZoCWgPQwgRj8TLU/BiQJSGlFKUaBVN6ANoFkdA9UTrp+x4ZHV9lChoBmgJaA9DCB5QNuWKTmJAlIaUUpRoFU3oA2gWR0D1RO/ejEehdX2UKGgGaAloD0MI5zbhXpmNYkCUhpRSlGgVTegDaBZHQPVE9CmXPZ91fZQoaAZoCWgPQwgw2uOF9ItkQJSGlFKUaBVN6ANoFkdA9UT08NlRQHV9lChoBmgJaA9DCGK9USvMD2NAlIaUUpRoFU3oA2gWR0D1RPUUUO/ddX2UKGgGaAloD0MIGLSQgNHOaECUhpRSlGgVTegDaBZHQPVE9f+l0o11fZQoaAZoCWgPQwjnGJC9XsBjQJSGlFKUaBVN6ANoFkdA9UT31CPZI3V9lChoBmgJaA9DCILn3sOlWWFAlIaUUpRoFU3oA2gWR0D1RPnw0O3EdX2UKGgGaAloD0MIVG8NbBWzY0CUhpRSlGgVTegDaBZHQPVE+rboKUp1fZQoaAZoCWgPQwgdO6jEdfZiQJSGlFKUaBVN6ANoFkdA9UUMwKBuoHV9lChoBmgJaA9DCG9nX3mQC19AlIaUUpRoFU3oA2gWR0D1RRCigkC4dX2UKGgGaAloD0MIm3XG90VjYECUhpRSlGgVTegDaBZHQPVFHMPnSv11fZQoaAZoCWgPQwh6UiY1tOFkQJSGlFKUaBVN6ANoFkdA9UUx6A4GU3V9lChoBmgJaA9DCE1okljSE2hAlIaUUpRoFU3oA2gWR0D1RTaIKMNudX2UKGgGaAloD0MIFVYqqCieYkCUhpRSlGgVTegDaBZHQPVFRQRlHz91fZQoaAZoCWgPQwgLDFnd6mRmQJSGlFKUaBVN6ANoFkdA9UVHUlNUO3V9lChoBmgJaA9DCDmc+dUczGFAlIaUUpRoFU3oA2gWR0D1RWcnVoYfdX2UKGgGaAloD0MIy9jQzf4QZUCUhpRSlGgVTegDaBZHQPVFa4khRqJ1fZQoaAZoCWgPQwjPSIRGMHVlQJSGlFKUaBVN6ANoFkdA9UVvwfhddHV9lChoBmgJaA9DCNS4N7/hlmRAlIaUUpRoFU3oA2gWR0D1RXCHQyAQdX2UKGgGaAloD0MI1ub/VcfIZECUhpRSlGgVTegDaBZHQPVFcKt0V8F1fZQoaAZoCWgPQwjWpxyTxXJlQJSGlFKUaBVN6ANoFkdA9UVxgXdj5XV9lChoBmgJaA9DCB+94T5y0WZAlIaUUpRoFU3oA2gWR0D1RXNMSK3vdX2UKGgGaAloD0MIrI2xE153Z0CUhpRSlGgVTegDaBZHQPVFdW7Wd3B1fZQoaAZoCWgPQwhupGyRtCJlQJSGlFKUaBVN6ANoFkdA9UV2KTbFj3V9lChoBmgJaA9DCDjb3JieYVBAlIaUUpRoFUuXaBZHQPVFf7HQyAR1fZQoaAZoCWgPQwimtWlsrwpjQJSGlFKUaBVN6ANoFkdA9UWFnIEKV3V9lChoBmgJaA9DCMzxCkRPnkBAlIaUUpRoFUvJaBZHQPVFhg87p3Z1fZQoaAZoCWgPQwjwTj49tghjQJSGlFKUaBVN6ANoFkdA9UWJocvM83V9lChoBmgJaA9DCMA9z5+2FGhAlIaUUpRoFU3oA2gWR0D1RZSqebuudX2UKGgGaAloD0MIgzRj0XRQRkCUhpRSlGgVS75oFkdA9UWVYllbvHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "n_steps": 2048, "gamma": 0.999, "gae_lambda": 0.99, "ent_coef": 0.02, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 5, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVDQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMbS9ob21lL2NocmlzL2FuYWNvbmRhMy9lbnZzL2RlZXBfcmxfY2xhc3NfdW5pdDEvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjG0vaG9tZS9jaHJpcy9hbmFjb25kYTMvZW52cy9kZWVwX3JsX2NsYXNzX3VuaXQxL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.15.79.1-microsoft-standard-WSL2-x86_64-with-glibc2.31 #1 SMP Wed Nov 23 01:01:46 UTC 2022", "Python": "3.10.8", "Stable-Baselines3": "1.6.2", "PyTorch": "1.13.0", "GPU Enabled": "True", "Numpy": "1.23.4", "Gym": "0.21.0"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7c4a07a050>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7c4a07a0e0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7c4a07a170>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7c4a07a200>", "_build": "<function ActorCriticPolicy._build at 0x7f7c4a07a290>", "forward": "<function ActorCriticPolicy.forward at 0x7f7c4a07a320>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7c4a07a3b0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f7c4a07a440>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7c4a07a4d0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7c4a07a560>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7c4a07a5f0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f7c4a071d40>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 3014656, "_total_timesteps": 3000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1674252950135636214, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVDQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMbS9ob21lL2NocmlzL2FuYWNvbmRhMy9lbnZzL2RlZXBfcmxfY2xhc3NfdW5pdDEvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjG0vaG9tZS9jaHJpcy9hbmFjb25kYTMvZW52cy9kZWVwX3JsX2NsYXNzX3VuaXQxL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM2qED32mBy6Jrk7tz05mLLQrAM7zuRcNgAAgD8AAIA/zWVAPa7ttroIgDqzHKekq4QzVzjjXL4zAACAPwAAgD/mbh69KFCZvOZJgD4wzgq+AJoXvdZqnr4AAIA/AACAP5ozLr0003Q/tW0Zvhat+b4uUJe9867AvQAAAAAAAAAAszZrPZg7lD+/iYM+nqYTvwqL9j228sM9AAAAAAAAAABAvw0+KNyMP/uJ/j4rXCK/Q+cfPoasVT4AAAAAAAAAANoBoj1NNEU/YlVTO920Ab9obQo+QnTcvQAAAAAAAAAAM+LbPbHPnj7yXz6+pmyjvr5V4bucEQa+AAAAAAAAAACaAVI7H8m4u+BwLTxeSKY8fAEIvZfxiz0AAIA/AACAP5pRLzsUmJ+64ipitQpggbAQIsC6aweVNAAAgD8AAIA/ZseQPPYIVbqY3mi5GrxhtB8e7zolPYk4AACAPwAAgD/Aw2++mOquPn2D0z5+na2+M3kXvpozhz4AAAAAAAAAAGZcJzyKU3s8GkJJPsT7o75StRc+NP6dvQAAAAAAAIA/zeqYPXtig7pDfjG6gcv0uJS+YroiHVw5AACAPwAAgD9aDYy9T88VPhd0yj1Bf7m+L6MBvSocGj0AAAAAAAAAADOKrTwUgKi6wgdXOdf8VTSOQc866+52uAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVMRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMID5wzorSBcUCUhpRSlIwBbJRL+YwBdJRHQPXuRk1ZTyd1fZQoaAZoCWgPQwhVMZV+Am9zQJSGlFKUaBVNbwFoFkdA9e5Gp6po9XV9lChoBmgJaA9DCIZXkjyXJHFAlIaUUpRoFUv4aBZHQPXuR4qhDgJ1fZQoaAZoCWgPQwjrOel9IylwQJSGlFKUaBVLx2gWR0D17kjPtUn5dX2UKGgGaAloD0MI/pqsUQ8dcECUhpRSlGgVTQwBaBZHQPXuSYqtozx1fZQoaAZoCWgPQwgNbmsLj3RzQJSGlFKUaBVL6mgWR0D17kpxhDw6dX2UKGgGaAloD0MILxnHSDZ8cUCUhpRSlGgVS8xoFkdA9e5LEeZG8XV9lChoBmgJaA9DCMIXJlOFWW9AlIaUUpRoFUvPaBZHQPXuTIIhQnB1fZQoaAZoCWgPQwjGMv0ScVJyQJSGlFKUaBVL12gWR0D17k2s6JZXdX2UKGgGaAloD0MIlScQdgopcECUhpRSlGgVTR4BaBZHQPXuTePPszF1fZQoaAZoCWgPQwhig4WTtNxvQJSGlFKUaBVL2mgWR0D17k4Dp1RtdX2UKGgGaAloD0MIlGqfjgdQcECUhpRSlGgVTQEBaBZHQPXuTjYkE9t1fZQoaAZoCWgPQwj26053XiZ0QJSGlFKUaBVL9GgWR0D17k5kJa7mdX2UKGgGaAloD0MIc9nonJ+VcUCUhpRSlGgVS9poFkdA9e5O1nZkCnV9lChoBmgJaA9DCD+nID9bunFAlIaUUpRoFUvSaBZHQPXuT22jO9p1fZQoaAZoCWgPQwh0YaQX9XtyQJSGlFKUaBVL/GgWR0D17lBBHkLhdX2UKGgGaAloD0MIVg+YhwxJcUCUhpRSlGgVS91oFkdA9e5TlNUOu3V9lChoBmgJaA9DCJG3XP1Y4HBAlIaUUpRoFUvLaBZHQPXuU5X9zfd1fZQoaAZoCWgPQwiFfTuJyGhwQJSGlFKUaBVNJwFoFkdA9e5UiRwIdHV9lChoBmgJaA9DCLEYda09L3JAlIaUUpRoFU0/AWgWR0D17lZZV4ordX2UKGgGaAloD0MIda29T9UgcECUhpRSlGgVS/NoFkdA9e5Xx33Yc3V9lChoBmgJaA9DCIenV8py4XJAlIaUUpRoFU1GAWgWR0D17lfnwXqJdX2UKGgGaAloD0MIjuVd9QCzcUCUhpRSlGgVS9VoFkdA9e5ZFPBSDXV9lChoBmgJaA9DCET67etAI3FAlIaUUpRoFUvRaBZHQPXuWRK5Cnh1fZQoaAZoCWgPQwh0toDQunxxQJSGlFKUaBVNKQFoFkdA9e5aM2JizHV9lChoBmgJaA9DCIYcW8/QbnNAlIaUUpRoFUvwaBZHQPXuWpeKKpF1fZQoaAZoCWgPQwjB/uvcNIJuQJSGlFKUaBVL4WgWR0D17lrEjPfLdX2UKGgGaAloD0MIaJQu/YtJckCUhpRSlGgVS+poFkdA9e5a2ovSMXV9lChoBmgJaA9DCG3/ykoTCnNAlIaUUpRoFUvWaBZHQPXuWxYgaFV1fZQoaAZoCWgPQwjJdyl1CY1zQJSGlFKUaBVNDQFoFkdA9e5bOFQEZHV9lChoBmgJaA9DCOqu7ILBEXJAlIaUUpRoFU0OAWgWR0D17lwe9zwMdX2UKGgGaAloD0MIowbTMPyRckCUhpRSlGgVS99oFkdA9e5cizPa+XV9lChoBmgJaA9DCIiCGVOwCHJAlIaUUpRoFUvXaBZHQPXuYEDEFW51fZQoaAZoCWgPQwiGdHgI455xQJSGlFKUaBVL8GgWR0D17mHAB1cMdX2UKGgGaAloD0MIDw2LUdelbkCUhpRSlGgVS+VoFkdA9e5iFoxpL3V9lChoBmgJaA9DCM3K9iGvmXBAlIaUUpRoFUvYaBZHQPXuZVUS7Gx1fZQoaAZoCWgPQwhYrOEiN1dwQJSGlFKUaBVL+GgWR0D17mXWGyoodX2UKGgGaAloD0MINe1immnjcUCUhpRSlGgVS+poFkdA9e5mtITXa3V9lChoBmgJaA9DCA9h/DRuvW5AlIaUUpRoFUvhaBZHQPXuZ5fsu4B1fZQoaAZoCWgPQwi2LF+X4YxyQJSGlFKUaBVLyWgWR0D17mfhpg1FdX2UKGgGaAloD0MICttPxnhScUCUhpRSlGgVS+hoFkdA9e5oHCj1w3V9lChoBmgJaA9DCH9Ma9NYwm1AlIaUUpRoFUvQaBZHQPXuaJP9DQZ1fZQoaAZoCWgPQwhMHHkgciByQJSGlFKUaBVL7mgWR0D17mnhfShKdX2UKGgGaAloD0MIRWgEG1dhcECUhpRSlGgVS+1oFkdA9e5q7iZOSHV9lChoBmgJaA9DCCHn/X+c6HBAlIaUUpRoFUv4aBZHQPXuaxdszl91fZQoaAZoCWgPQwhHOC14EclxQJSGlFKUaBVL42gWR0D17mukUbkwdX2UKGgGaAloD0MIUyCzs2gickCUhpRSlGgVTSUBaBZHQPXubszeoDR1fZQoaAZoCWgPQwjGwhA5vetzQJSGlFKUaBVNCwFoFkdA9e5vXWFvh3V9lChoBmgJaA9DCC9szVaewXBAlIaUUpRoFUvEaBZHQPXucMQUYbd1fZQoaAZoCWgPQwhX7ZqQVp9xQJSGlFKUaBVL6mgWR0D17nFiItUXdX2UKGgGaAloD0MI+Kbps8OAckCUhpRSlGgVS+xoFkdA9e5zUipvP3V9lChoBmgJaA9DCO0pOSf203JAlIaUUpRoFUvlaBZHQPXudprO7g91fZQoaAZoCWgPQwiEnziA/vZwQJSGlFKUaBVL7GgWR0D17neKMNtqdX2UKGgGaAloD0MITioaa/9Pb0CUhpRSlGgVS9RoFkdA9e539oi9qXV9lChoBmgJaA9DCOEp5Ep9mnBAlIaUUpRoFUvZaBZHQPXueCQXAM51fZQoaAZoCWgPQwjUCz7NCQZyQJSGlFKUaBVL5WgWR0D17ni0jTrndX2UKGgGaAloD0MIRnu8kE4IcECUhpRSlGgVS8doFkdA9e55zHjp93V9lChoBmgJaA9DCK3boPYboHFAlIaUUpRoFUvsaBZHQPXuejPWxyJ1fZQoaAZoCWgPQwiJYYcx6dtvQJSGlFKUaBVL3mgWR0D17npnvDxcdX2UKGgGaAloD0MILC0j9Z6cckCUhpRSlGgVTQsBaBZHQPXuenT6SDB1fZQoaAZoCWgPQwjmkT8YeChLQJSGlFKUaBVLomgWR0D17nqWKMvRdX2UKGgGaAloD0MIZk0s8JUlcUCUhpRSlGgVS+5oFkdA9e58KTB68nV9lChoBmgJaA9DCFwFMdD1KHBAlIaUUpRoFUvAaBZHQPXufKqhlDp1fZQoaAZoCWgPQwjbTIV4ZK9xQJSGlFKUaBVNBAFoFkdA9e59uocaO3V9lChoBmgJaA9DCPKxu0BJmG1AlIaUUpRoFUvTaBZHQPXuftTfixV1fZQoaAZoCWgPQwhgArfuZvRwQJSGlFKUaBVL6GgWR0D17oCUs4DLdX2UKGgGaAloD0MIQ3QIHAk2ckCUhpRSlGgVS9VoFkdA9e6BGAoXsXV9lChoBmgJaA9DCCk+PiG77nFAlIaUUpRoFUvKaBZHQPXug90mtyR1fZQoaAZoCWgPQwgEOpM21X1xQJSGlFKUaBVL0GgWR0D17oSPKuB+dX2UKGgGaAloD0MIlDKpoc1nc0CUhpRSlGgVS99oFkdA9e6FmmgrY3V9lChoBmgJaA9DCBjshm3LtHBAlIaUUpRoFUv7aBZHQPXuhiLyc1B1fZQoaAZoCWgPQwjFkQciS2hwQJSGlFKUaBVL4WgWR0D17oZEbYK6dX2UKGgGaAloD0MIkUPEzSlQb0CUhpRSlGgVS9JoFkdA9e6GUj1PFnV9lChoBmgJaA9DCOYffZOmC3FAlIaUUpRoFUvmaBZHQPXuiE7FKkF1fZQoaAZoCWgPQwiI8ZpXdT5yQJSGlFKUaBVL8WgWR0D17ojRK6FudX2UKGgGaAloD0MIol7wac4ncUCUhpRSlGgVS+5oFkdA9e6JAVO9FnV9lChoBmgJaA9DCGsOEMzRnG1AlIaUUpRoFUvRaBZHQPXuiP56+nJ1fZQoaAZoCWgPQwgB323euDxtQJSGlFKUaBVL9GgWR0D17oksJ6Y3dX2UKGgGaAloD0MIiJ//Hrz+cUCUhpRSlGgVS9poFkdA9e6Mf9UCJXV9lChoBmgJaA9DCN2WyAVnOW9AlIaUUpRoFU0BAWgWR0D17oyYCyQgdX2UKGgGaAloD0MIWMhcGZTFckCUhpRSlGgVS/JoFkdA9e6M1um78XV9lChoBmgJaA9DCGx8JvunMXJAlIaUUpRoFUv0aBZHQPXukJDNQj51fZQoaAZoCWgPQwgQ6EzalM9wQJSGlFKUaBVL0WgWR0D17pOqfvnbdX2UKGgGaAloD0MIOkGbHL4qckCUhpRSlGgVS8xoFkdA9e6ULYoRZnV9lChoBmgJaA9DCAWiJ2VSzm1AlIaUUpRoFU0tAWgWR0D17pSFYdQwdX2UKGgGaAloD0MIYcQ+AdRFckCUhpRSlGgVS9JoFkdA9e6UmxIJ7nV9lChoBmgJaA9DCBajrrW3z3JAlIaUUpRoFUvmaBZHQPXulcHhS+B1fZQoaAZoCWgPQwh9z0iEBiFyQJSGlFKUaBVL2WgWR0D17pcttQ9BdX2UKGgGaAloD0MIQbgCCrWHcUCUhpRSlGgVS9VoFkdA9e6XZeNT+HV9lChoBmgJaA9DCChJ10y+UHNAlIaUUpRoFU0ZAWgWR0D17pedIXj3dX2UKGgGaAloD0MI8ExokljBckCUhpRSlGgVTTgBaBZHQPXumMsWfsh1fZQoaAZoCWgPQwhyxcVRefxwQJSGlFKUaBVL8mgWR0D17pmlqagFdX2UKGgGaAloD0MIeQJhp1hMb0CUhpRSlGgVS/poFkdA9e6Z+8scyXV9lChoBmgJaA9DCHmxMETO+21AlIaUUpRoFUv/aBZHQPXumksK9f11fZQoaAZoCWgPQwj4F0Fjpq9tQJSGlFKUaBVL6WgWR0D17p0YL9dedX2UKGgGaAloD0MIa0jcY+lObkCUhpRSlGgVTQABaBZHQPXunmpda+x1fZQoaAZoCWgPQwjiBnx+mPxxQJSGlFKUaBVLw2gWR0D17qGmw7kodX2UKGgGaAloD0MIaw97oQCrckCUhpRSlGgVS9JoFkdA9e6jKioKlnV9lChoBmgJaA9DCBXj/E0odnBAlIaUUpRoFU1PAWgWR0D17qRwWnCPdX2UKGgGaAloD0MIMSO8PYjWcUCUhpRSlGgVS85oFkdA9e6kimEXcnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 460, "n_steps": 2048, "gamma": 0.9999, "gae_lambda": 0.99, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 5, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVDQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMbS9ob21lL2NocmlzL2FuYWNvbmRhMy9lbnZzL2RlZXBfcmxfY2xhc3NfdW5pdDEvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjG0vaG9tZS9jaHJpcy9hbmFjb25kYTMvZW52cy9kZWVwX3JsX2NsYXNzX3VuaXQxL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.15.79.1-microsoft-standard-WSL2-x86_64-with-glibc2.31 #1 SMP Wed Nov 23 01:01:46 UTC 2022", "Python": "3.10.8", "Stable-Baselines3": "1.6.2", "PyTorch": "1.13.0", "GPU Enabled": "True", "Numpy": "1.23.4", "Gym": "0.21.0"}}
|
ppo-LunarLander-v2.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ccae721497a049d2bc5ab7d44b936e5b932d9403857c18d298055d800c298af
|
3 |
+
size 147330
|
ppo-LunarLander-v2/data
CHANGED
@@ -42,12 +42,12 @@
|
|
42 |
"_np_random": null
|
43 |
},
|
44 |
"n_envs": 16,
|
45 |
-
"num_timesteps":
|
46 |
-
"_total_timesteps":
|
47 |
"_num_timesteps_at_start": 0,
|
48 |
"seed": null,
|
49 |
"action_noise": null,
|
50 |
-
"start_time":
|
51 |
"learning_rate": 0.0003,
|
52 |
"tensorboard_log": null,
|
53 |
"lr_schedule": {
|
@@ -56,7 +56,7 @@
|
|
56 |
},
|
57 |
"_last_obs": {
|
58 |
":type:": "<class 'numpy.ndarray'>",
|
59 |
-
":serialized:": "
|
60 |
},
|
61 |
"_last_episode_starts": {
|
62 |
":type:": "<class 'numpy.ndarray'>",
|
@@ -66,20 +66,20 @@
|
|
66 |
"_episode_num": 0,
|
67 |
"use_sde": false,
|
68 |
"sde_sample_freq": -1,
|
69 |
-
"_current_progress_remaining": -0.
|
70 |
"ep_info_buffer": {
|
71 |
":type:": "<class 'collections.deque'>",
|
72 |
-
":serialized:": "
|
73 |
},
|
74 |
"ep_success_buffer": {
|
75 |
":type:": "<class 'collections.deque'>",
|
76 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
77 |
},
|
78 |
-
"_n_updates":
|
79 |
"n_steps": 2048,
|
80 |
-
"gamma": 0.
|
81 |
"gae_lambda": 0.99,
|
82 |
-
"ent_coef": 0.
|
83 |
"vf_coef": 0.5,
|
84 |
"max_grad_norm": 0.5,
|
85 |
"batch_size": 64,
|
|
|
42 |
"_np_random": null
|
43 |
},
|
44 |
"n_envs": 16,
|
45 |
+
"num_timesteps": 3014656,
|
46 |
+
"_total_timesteps": 3000000,
|
47 |
"_num_timesteps_at_start": 0,
|
48 |
"seed": null,
|
49 |
"action_noise": null,
|
50 |
+
"start_time": 1674252950135636214,
|
51 |
"learning_rate": 0.0003,
|
52 |
"tensorboard_log": null,
|
53 |
"lr_schedule": {
|
|
|
56 |
},
|
57 |
"_last_obs": {
|
58 |
":type:": "<class 'numpy.ndarray'>",
|
59 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM2qED32mBy6Jrk7tz05mLLQrAM7zuRcNgAAgD8AAIA/zWVAPa7ttroIgDqzHKekq4QzVzjjXL4zAACAPwAAgD/mbh69KFCZvOZJgD4wzgq+AJoXvdZqnr4AAIA/AACAP5ozLr0003Q/tW0Zvhat+b4uUJe9867AvQAAAAAAAAAAszZrPZg7lD+/iYM+nqYTvwqL9j228sM9AAAAAAAAAABAvw0+KNyMP/uJ/j4rXCK/Q+cfPoasVT4AAAAAAAAAANoBoj1NNEU/YlVTO920Ab9obQo+QnTcvQAAAAAAAAAAM+LbPbHPnj7yXz6+pmyjvr5V4bucEQa+AAAAAAAAAACaAVI7H8m4u+BwLTxeSKY8fAEIvZfxiz0AAIA/AACAP5pRLzsUmJ+64ipitQpggbAQIsC6aweVNAAAgD8AAIA/ZseQPPYIVbqY3mi5GrxhtB8e7zolPYk4AACAPwAAgD/Aw2++mOquPn2D0z5+na2+M3kXvpozhz4AAAAAAAAAAGZcJzyKU3s8GkJJPsT7o75StRc+NP6dvQAAAAAAAIA/zeqYPXtig7pDfjG6gcv0uJS+YroiHVw5AACAPwAAgD9aDYy9T88VPhd0yj1Bf7m+L6MBvSocGj0AAAAAAAAAADOKrTwUgKi6wgdXOdf8VTSOQc866+52uAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
60 |
},
|
61 |
"_last_episode_starts": {
|
62 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
66 |
"_episode_num": 0,
|
67 |
"use_sde": false,
|
68 |
"sde_sample_freq": -1,
|
69 |
+
"_current_progress_remaining": -0.004885333333333408,
|
70 |
"ep_info_buffer": {
|
71 |
":type:": "<class 'collections.deque'>",
|
72 |
+
":serialized:": "gAWVMRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMID5wzorSBcUCUhpRSlIwBbJRL+YwBdJRHQPXuRk1ZTyd1fZQoaAZoCWgPQwhVMZV+Am9zQJSGlFKUaBVNbwFoFkdA9e5Gp6po9XV9lChoBmgJaA9DCIZXkjyXJHFAlIaUUpRoFUv4aBZHQPXuR4qhDgJ1fZQoaAZoCWgPQwjrOel9IylwQJSGlFKUaBVLx2gWR0D17kjPtUn5dX2UKGgGaAloD0MI/pqsUQ8dcECUhpRSlGgVTQwBaBZHQPXuSYqtozx1fZQoaAZoCWgPQwgNbmsLj3RzQJSGlFKUaBVL6mgWR0D17kpxhDw6dX2UKGgGaAloD0MILxnHSDZ8cUCUhpRSlGgVS8xoFkdA9e5LEeZG8XV9lChoBmgJaA9DCMIXJlOFWW9AlIaUUpRoFUvPaBZHQPXuTIIhQnB1fZQoaAZoCWgPQwjGMv0ScVJyQJSGlFKUaBVL12gWR0D17k2s6JZXdX2UKGgGaAloD0MIlScQdgopcECUhpRSlGgVTR4BaBZHQPXuTePPszF1fZQoaAZoCWgPQwhig4WTtNxvQJSGlFKUaBVL2mgWR0D17k4Dp1RtdX2UKGgGaAloD0MIlGqfjgdQcECUhpRSlGgVTQEBaBZHQPXuTjYkE9t1fZQoaAZoCWgPQwj26053XiZ0QJSGlFKUaBVL9GgWR0D17k5kJa7mdX2UKGgGaAloD0MIc9nonJ+VcUCUhpRSlGgVS9poFkdA9e5O1nZkCnV9lChoBmgJaA9DCD+nID9bunFAlIaUUpRoFUvSaBZHQPXuT22jO9p1fZQoaAZoCWgPQwh0YaQX9XtyQJSGlFKUaBVL/GgWR0D17lBBHkLhdX2UKGgGaAloD0MIVg+YhwxJcUCUhpRSlGgVS91oFkdA9e5TlNUOu3V9lChoBmgJaA9DCJG3XP1Y4HBAlIaUUpRoFUvLaBZHQPXuU5X9zfd1fZQoaAZoCWgPQwiFfTuJyGhwQJSGlFKUaBVNJwFoFkdA9e5UiRwIdHV9lChoBmgJaA9DCLEYda09L3JAlIaUUpRoFU0/AWgWR0D17lZZV4ordX2UKGgGaAloD0MIda29T9UgcECUhpRSlGgVS/NoFkdA9e5Xx33Yc3V9lChoBmgJaA9DCIenV8py4XJAlIaUUpRoFU1GAWgWR0D17lfnwXqJdX2UKGgGaAloD0MIjuVd9QCzcUCUhpRSlGgVS9VoFkdA9e5ZFPBSDXV9lChoBmgJaA9DCET67etAI3FAlIaUUpRoFUvRaBZHQPXuWRK5Cnh1fZQoaAZoCWgPQwh0toDQunxxQJSGlFKUaBVNKQFoFkdA9e5aM2JizHV9lChoBmgJaA9DCIYcW8/QbnNAlIaUUpRoFUvwaBZHQPXuWpeKKpF1fZQoaAZoCWgPQwjB/uvcNIJuQJSGlFKUaBVL4WgWR0D17lrEjPfLdX2UKGgGaAloD0MIaJQu/YtJckCUhpRSlGgVS+poFkdA9e5a2ovSMXV9lChoBmgJaA9DCG3/ykoTCnNAlIaUUpRoFUvWaBZHQPXuWxYgaFV1fZQoaAZoCWgPQwjJdyl1CY1zQJSGlFKUaBVNDQFoFkdA9e5bOFQEZHV9lChoBmgJaA9DCOqu7ILBEXJAlIaUUpRoFU0OAWgWR0D17lwe9zwMdX2UKGgGaAloD0MIowbTMPyRckCUhpRSlGgVS99oFkdA9e5cizPa+XV9lChoBmgJaA9DCIiCGVOwCHJAlIaUUpRoFUvXaBZHQPXuYEDEFW51fZQoaAZoCWgPQwiGdHgI455xQJSGlFKUaBVL8GgWR0D17mHAB1cMdX2UKGgGaAloD0MIDw2LUdelbkCUhpRSlGgVS+VoFkdA9e5iFoxpL3V9lChoBmgJaA9DCM3K9iGvmXBAlIaUUpRoFUvYaBZHQPXuZVUS7Gx1fZQoaAZoCWgPQwhYrOEiN1dwQJSGlFKUaBVL+GgWR0D17mXWGyoodX2UKGgGaAloD0MINe1immnjcUCUhpRSlGgVS+poFkdA9e5mtITXa3V9lChoBmgJaA9DCA9h/DRuvW5AlIaUUpRoFUvhaBZHQPXuZ5fsu4B1fZQoaAZoCWgPQwi2LF+X4YxyQJSGlFKUaBVLyWgWR0D17mfhpg1FdX2UKGgGaAloD0MICttPxnhScUCUhpRSlGgVS+hoFkdA9e5oHCj1w3V9lChoBmgJaA9DCH9Ma9NYwm1AlIaUUpRoFUvQaBZHQPXuaJP9DQZ1fZQoaAZoCWgPQwhMHHkgciByQJSGlFKUaBVL7mgWR0D17mnhfShKdX2UKGgGaAloD0MIRWgEG1dhcECUhpRSlGgVS+1oFkdA9e5q7iZOSHV9lChoBmgJaA9DCCHn/X+c6HBAlIaUUpRoFUv4aBZHQPXuaxdszl91fZQoaAZoCWgPQwhHOC14EclxQJSGlFKUaBVL42gWR0D17mukUbkwdX2UKGgGaAloD0MIUyCzs2gickCUhpRSlGgVTSUBaBZHQPXubszeoDR1fZQoaAZoCWgPQwjGwhA5vetzQJSGlFKUaBVNCwFoFkdA9e5vXWFvh3V9lChoBmgJaA9DCC9szVaewXBAlIaUUpRoFUvEaBZHQPXucMQUYbd1fZQoaAZoCWgPQwhX7ZqQVp9xQJSGlFKUaBVL6mgWR0D17nFiItUXdX2UKGgGaAloD0MI+Kbps8OAckCUhpRSlGgVS+xoFkdA9e5zUipvP3V9lChoBmgJaA9DCO0pOSf203JAlIaUUpRoFUvlaBZHQPXudprO7g91fZQoaAZoCWgPQwiEnziA/vZwQJSGlFKUaBVL7GgWR0D17neKMNtqdX2UKGgGaAloD0MITioaa/9Pb0CUhpRSlGgVS9RoFkdA9e539oi9qXV9lChoBmgJaA9DCOEp5Ep9mnBAlIaUUpRoFUvZaBZHQPXueCQXAM51fZQoaAZoCWgPQwjUCz7NCQZyQJSGlFKUaBVL5WgWR0D17ni0jTrndX2UKGgGaAloD0MIRnu8kE4IcECUhpRSlGgVS8doFkdA9e55zHjp93V9lChoBmgJaA9DCK3boPYboHFAlIaUUpRoFUvsaBZHQPXuejPWxyJ1fZQoaAZoCWgPQwiJYYcx6dtvQJSGlFKUaBVL3mgWR0D17npnvDxcdX2UKGgGaAloD0MILC0j9Z6cckCUhpRSlGgVTQsBaBZHQPXuenT6SDB1fZQoaAZoCWgPQwjmkT8YeChLQJSGlFKUaBVLomgWR0D17nqWKMvRdX2UKGgGaAloD0MIZk0s8JUlcUCUhpRSlGgVS+5oFkdA9e58KTB68nV9lChoBmgJaA9DCFwFMdD1KHBAlIaUUpRoFUvAaBZHQPXufKqhlDp1fZQoaAZoCWgPQwjbTIV4ZK9xQJSGlFKUaBVNBAFoFkdA9e59uocaO3V9lChoBmgJaA9DCPKxu0BJmG1AlIaUUpRoFUvTaBZHQPXuftTfixV1fZQoaAZoCWgPQwhgArfuZvRwQJSGlFKUaBVL6GgWR0D17oCUs4DLdX2UKGgGaAloD0MIQ3QIHAk2ckCUhpRSlGgVS9VoFkdA9e6BGAoXsXV9lChoBmgJaA9DCCk+PiG77nFAlIaUUpRoFUvKaBZHQPXug90mtyR1fZQoaAZoCWgPQwgEOpM21X1xQJSGlFKUaBVL0GgWR0D17oSPKuB+dX2UKGgGaAloD0MIlDKpoc1nc0CUhpRSlGgVS99oFkdA9e6FmmgrY3V9lChoBmgJaA9DCBjshm3LtHBAlIaUUpRoFUv7aBZHQPXuhiLyc1B1fZQoaAZoCWgPQwjFkQciS2hwQJSGlFKUaBVL4WgWR0D17oZEbYK6dX2UKGgGaAloD0MIkUPEzSlQb0CUhpRSlGgVS9JoFkdA9e6GUj1PFnV9lChoBmgJaA9DCOYffZOmC3FAlIaUUpRoFUvmaBZHQPXuiE7FKkF1fZQoaAZoCWgPQwiI8ZpXdT5yQJSGlFKUaBVL8WgWR0D17ojRK6FudX2UKGgGaAloD0MIol7wac4ncUCUhpRSlGgVS+5oFkdA9e6JAVO9FnV9lChoBmgJaA9DCGsOEMzRnG1AlIaUUpRoFUvRaBZHQPXuiP56+nJ1fZQoaAZoCWgPQwgB323euDxtQJSGlFKUaBVL9GgWR0D17oksJ6Y3dX2UKGgGaAloD0MIiJ//Hrz+cUCUhpRSlGgVS9poFkdA9e6Mf9UCJXV9lChoBmgJaA9DCN2WyAVnOW9AlIaUUpRoFU0BAWgWR0D17oyYCyQgdX2UKGgGaAloD0MIWMhcGZTFckCUhpRSlGgVS/JoFkdA9e6M1um78XV9lChoBmgJaA9DCGx8JvunMXJAlIaUUpRoFUv0aBZHQPXukJDNQj51fZQoaAZoCWgPQwgQ6EzalM9wQJSGlFKUaBVL0WgWR0D17pOqfvnbdX2UKGgGaAloD0MIOkGbHL4qckCUhpRSlGgVS8xoFkdA9e6ULYoRZnV9lChoBmgJaA9DCAWiJ2VSzm1AlIaUUpRoFU0tAWgWR0D17pSFYdQwdX2UKGgGaAloD0MIYcQ+AdRFckCUhpRSlGgVS9JoFkdA9e6UmxIJ7nV9lChoBmgJaA9DCBajrrW3z3JAlIaUUpRoFUvmaBZHQPXulcHhS+B1fZQoaAZoCWgPQwh9z0iEBiFyQJSGlFKUaBVL2WgWR0D17pcttQ9BdX2UKGgGaAloD0MIQbgCCrWHcUCUhpRSlGgVS9VoFkdA9e6XZeNT+HV9lChoBmgJaA9DCChJ10y+UHNAlIaUUpRoFU0ZAWgWR0D17pedIXj3dX2UKGgGaAloD0MI8ExokljBckCUhpRSlGgVTTgBaBZHQPXumMsWfsh1fZQoaAZoCWgPQwhyxcVRefxwQJSGlFKUaBVL8mgWR0D17pmlqagFdX2UKGgGaAloD0MIeQJhp1hMb0CUhpRSlGgVS/poFkdA9e6Z+8scyXV9lChoBmgJaA9DCHmxMETO+21AlIaUUpRoFUv/aBZHQPXumksK9f11fZQoaAZoCWgPQwj4F0Fjpq9tQJSGlFKUaBVL6WgWR0D17p0YL9dedX2UKGgGaAloD0MIa0jcY+lObkCUhpRSlGgVTQABaBZHQPXunmpda+x1fZQoaAZoCWgPQwjiBnx+mPxxQJSGlFKUaBVLw2gWR0D17qGmw7kodX2UKGgGaAloD0MIaw97oQCrckCUhpRSlGgVS9JoFkdA9e6jKioKlnV9lChoBmgJaA9DCBXj/E0odnBAlIaUUpRoFU1PAWgWR0D17qRwWnCPdX2UKGgGaAloD0MIMSO8PYjWcUCUhpRSlGgVS85oFkdA9e6kimEXcnVlLg=="
|
73 |
},
|
74 |
"ep_success_buffer": {
|
75 |
":type:": "<class 'collections.deque'>",
|
76 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
77 |
},
|
78 |
+
"_n_updates": 460,
|
79 |
"n_steps": 2048,
|
80 |
+
"gamma": 0.9999,
|
81 |
"gae_lambda": 0.99,
|
82 |
+
"ent_coef": 0.01,
|
83 |
"vf_coef": 0.5,
|
84 |
"max_grad_norm": 0.5,
|
85 |
"batch_size": 64,
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 87929
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3edfa16c962a2ca669b127ff4afc0de4daf257caa03cbcc0975c51ca193d244
|
3 |
size 87929
|
ppo-LunarLander-v2/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43201
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f73821a49158ae24da0d03159a1bdad42fb29958999612fbb5b9397b356da4cc
|
3 |
size 43201
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 281.380566165864, "std_reward": 17.969900830330083, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-01-20T18:42:30.138340"}
|