Quentin Gallouédec
commited on
Commit
•
d64f459
1
Parent(s):
3befa29
Initial commit
Browse files- README.md +7 -2
- args.yml +8 -8
- config.yml +11 -1
- ddpg-CartpoleDMC-v0.zip +2 -2
- ddpg-CartpoleDMC-v0/actor.optimizer.pth +1 -1
- ddpg-CartpoleDMC-v0/critic.optimizer.pth +1 -1
- ddpg-CartpoleDMC-v0/data +35 -23
- ddpg-CartpoleDMC-v0/policy.pth +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
- train_eval_metrics.zip +2 -2
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: CartpoleDMC-v0
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
@@ -62,7 +62,12 @@ python -m rl_zoo3.push_to_hub --algo ddpg --env CartpoleDMC-v0 -f logs/ -orga qg
|
|
62 |
|
63 |
## Hyperparameters
|
64 |
```python
|
65 |
-
OrderedDict([('
|
|
|
|
|
|
|
|
|
|
|
66 |
('policy', 'MlpPolicy'),
|
67 |
('policy_kwargs',
|
68 |
'dict(net_arch=dict(pi=[300, 200], qf=[400, 300]))'),
|
|
|
16 |
type: CartpoleDMC-v0
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 885.50 +/- 4.94
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
62 |
|
63 |
## Hyperparameters
|
64 |
```python
|
65 |
+
OrderedDict([('batch_size', 64),
|
66 |
+
('gamma', 0.99),
|
67 |
+
('learning_rate', 0.0001),
|
68 |
+
('n_timesteps', 1000000.0),
|
69 |
+
('noise_std', 0.3),
|
70 |
+
('noise_type', 'ornstein-uhlenbeck'),
|
71 |
('policy', 'MlpPolicy'),
|
72 |
('policy_kwargs',
|
73 |
'dict(net_arch=dict(pi=[300, 200], qf=[400, 300]))'),
|
args.yml
CHANGED
@@ -10,11 +10,11 @@
|
|
10 |
- - env_kwargs
|
11 |
- null
|
12 |
- - eval_episodes
|
13 |
-
-
|
14 |
- - eval_freq
|
15 |
- 25000
|
16 |
- - gym_packages
|
17 |
-
-
|
18 |
- - hyperparams
|
19 |
- null
|
20 |
- - log_folder
|
@@ -24,7 +24,7 @@
|
|
24 |
- - max_total_trials
|
25 |
- null
|
26 |
- - n_eval_envs
|
27 |
-
-
|
28 |
- - n_evaluations
|
29 |
- null
|
30 |
- - n_jobs
|
@@ -54,15 +54,15 @@
|
|
54 |
- - save_replay_buffer
|
55 |
- false
|
56 |
- - seed
|
57 |
-
-
|
58 |
- - storage
|
59 |
- null
|
60 |
- - study_name
|
61 |
- null
|
62 |
- - tensorboard_log
|
63 |
-
-
|
64 |
- - track
|
65 |
-
-
|
66 |
- - trained_agent
|
67 |
- ''
|
68 |
- - truncate_last_trajectory
|
@@ -74,9 +74,9 @@
|
|
74 |
- - verbose
|
75 |
- 1
|
76 |
- - wandb_entity
|
77 |
-
-
|
78 |
- - wandb_project_name
|
79 |
-
-
|
80 |
- - wandb_tags
|
81 |
- []
|
82 |
- - yaml_file
|
|
|
10 |
- - env_kwargs
|
11 |
- null
|
12 |
- - eval_episodes
|
13 |
+
- 20
|
14 |
- - eval_freq
|
15 |
- 25000
|
16 |
- - gym_packages
|
17 |
+
- []
|
18 |
- - hyperparams
|
19 |
- null
|
20 |
- - log_folder
|
|
|
24 |
- - max_total_trials
|
25 |
- null
|
26 |
- - n_eval_envs
|
27 |
+
- 5
|
28 |
- - n_evaluations
|
29 |
- null
|
30 |
- - n_jobs
|
|
|
54 |
- - save_replay_buffer
|
55 |
- false
|
56 |
- - seed
|
57 |
+
- 3757117300
|
58 |
- - storage
|
59 |
- null
|
60 |
- - study_name
|
61 |
- null
|
62 |
- - tensorboard_log
|
63 |
+
- runs/CartpoleDMC-v0__ddpg__3757117300__1673811016
|
64 |
- - track
|
65 |
+
- true
|
66 |
- - trained_agent
|
67 |
- ''
|
68 |
- - truncate_last_trajectory
|
|
|
74 |
- - verbose
|
75 |
- 1
|
76 |
- - wandb_entity
|
77 |
+
- qgallouedec
|
78 |
- - wandb_project_name
|
79 |
+
- dmc
|
80 |
- - wandb_tags
|
81 |
- []
|
82 |
- - yaml_file
|
config.yml
CHANGED
@@ -1,6 +1,16 @@
|
|
1 |
!!python/object/apply:collections.OrderedDict
|
2 |
-
- - -
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
- 1000000.0
|
|
|
|
|
|
|
|
|
4 |
- - policy
|
5 |
- MlpPolicy
|
6 |
- - policy_kwargs
|
|
|
1 |
!!python/object/apply:collections.OrderedDict
|
2 |
+
- - - batch_size
|
3 |
+
- 64
|
4 |
+
- - gamma
|
5 |
+
- 0.99
|
6 |
+
- - learning_rate
|
7 |
+
- 0.0001
|
8 |
+
- - n_timesteps
|
9 |
- 1000000.0
|
10 |
+
- - noise_std
|
11 |
+
- 0.3
|
12 |
+
- - noise_type
|
13 |
+
- ornstein-uhlenbeck
|
14 |
- - policy
|
15 |
- MlpPolicy
|
16 |
- - policy_kwargs
|
ddpg-CartpoleDMC-v0.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:877cd406d523ea85172a4a93ff71c81e540dec32903d4bc68f23d8a1f8873e9a
|
3 |
+
size 3011980
|
ddpg-CartpoleDMC-v0/actor.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 502319
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:166c4143263a24cdd9d3cd802ff4559bff80a9b7965a1a7d7e73ebc2a5428b3b
|
3 |
size 502319
|
ddpg-CartpoleDMC-v0/critic.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 991855
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b00f7c9cecf7772b2df007c1577f2f50d5b7e298708baed00becbb269abe6a3f
|
3 |
size 991855
|
ddpg-CartpoleDMC-v0/data
CHANGED
@@ -4,16 +4,16 @@
|
|
4 |
":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnRkMy5wb2xpY2llc5SMCVREM1BvbGljeZSTlC4=",
|
5 |
"__module__": "stable_baselines3.td3.policies",
|
6 |
"__doc__": "\n Policy class (with both actor and critic) for TD3.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
|
7 |
-
"__init__": "<function TD3Policy.__init__ at
|
8 |
-
"_build": "<function TD3Policy._build at
|
9 |
-
"_get_constructor_parameters": "<function TD3Policy._get_constructor_parameters at
|
10 |
-
"make_actor": "<function TD3Policy.make_actor at
|
11 |
-
"make_critic": "<function TD3Policy.make_critic at
|
12 |
-
"forward": "<function TD3Policy.forward at
|
13 |
-
"_predict": "<function TD3Policy._predict at
|
14 |
-
"set_training_mode": "<function TD3Policy.set_training_mode at
|
15 |
"__abstractmethods__": "frozenset()",
|
16 |
-
"_abc_impl": "<_abc._abc_data object at
|
17 |
},
|
18 |
"verbose": 1,
|
19 |
"policy_kwargs": {
|
@@ -31,7 +31,7 @@
|
|
31 |
},
|
32 |
"observation_space": {
|
33 |
":type:": "<class 'gym.spaces.box.Box'>",
|
34 |
-
":serialized:": "gAWVMgwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBYWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWFAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/5RoC0sFhZSMAUOUdJRSlIwEaGlnaJRoEyiWFAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAf5RoC0sFhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolgUAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////
|
35 |
"dtype": "float32",
|
36 |
"_shape": [
|
37 |
5
|
@@ -60,13 +60,25 @@
|
|
60 |
"_total_timesteps": 1000000,
|
61 |
"_num_timesteps_at_start": 0,
|
62 |
"seed": 0,
|
63 |
-
"action_noise":
|
64 |
-
|
65 |
-
|
66 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
67 |
"lr_schedule": {
|
68 |
":type:": "<class 'function'>",
|
69 |
-
":serialized:": "
|
70 |
},
|
71 |
"_last_obs": null,
|
72 |
"_last_episode_starts": {
|
@@ -75,7 +87,7 @@
|
|
75 |
},
|
76 |
"_last_original_obs": {
|
77 |
":type:": "<class 'numpy.ndarray'>",
|
78 |
-
":serialized:": "
|
79 |
},
|
80 |
"_episode_num": 1000,
|
81 |
"use_sde": false,
|
@@ -83,7 +95,7 @@
|
|
83 |
"_current_progress_remaining": 0.0,
|
84 |
"ep_info_buffer": {
|
85 |
":type:": "<class 'collections.deque'>",
|
86 |
-
":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////
|
87 |
},
|
88 |
"ep_success_buffer": {
|
89 |
":type:": "<class 'collections.deque'>",
|
@@ -91,7 +103,7 @@
|
|
91 |
},
|
92 |
"_n_updates": 1000000,
|
93 |
"buffer_size": 1,
|
94 |
-
"batch_size":
|
95 |
"learning_starts": 100,
|
96 |
"tau": 0.005,
|
97 |
"gamma": 0.99,
|
@@ -102,12 +114,12 @@
|
|
102 |
":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
|
103 |
"__module__": "stable_baselines3.common.buffers",
|
104 |
"__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
105 |
-
"__init__": "<function ReplayBuffer.__init__ at
|
106 |
-
"add": "<function ReplayBuffer.add at
|
107 |
-
"sample": "<function ReplayBuffer.sample at
|
108 |
-
"_get_samples": "<function ReplayBuffer._get_samples at
|
109 |
"__abstractmethods__": "frozenset()",
|
110 |
-
"_abc_impl": "<_abc._abc_data object at
|
111 |
},
|
112 |
"replay_buffer_kwargs": {},
|
113 |
"train_freq": {
|
|
|
4 |
":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnRkMy5wb2xpY2llc5SMCVREM1BvbGljeZSTlC4=",
|
5 |
"__module__": "stable_baselines3.td3.policies",
|
6 |
"__doc__": "\n Policy class (with both actor and critic) for TD3.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
|
7 |
+
"__init__": "<function TD3Policy.__init__ at 0x139898280>",
|
8 |
+
"_build": "<function TD3Policy._build at 0x139898310>",
|
9 |
+
"_get_constructor_parameters": "<function TD3Policy._get_constructor_parameters at 0x1398983a0>",
|
10 |
+
"make_actor": "<function TD3Policy.make_actor at 0x139898430>",
|
11 |
+
"make_critic": "<function TD3Policy.make_critic at 0x1398984c0>",
|
12 |
+
"forward": "<function TD3Policy.forward at 0x139898550>",
|
13 |
+
"_predict": "<function TD3Policy._predict at 0x1398985e0>",
|
14 |
+
"set_training_mode": "<function TD3Policy.set_training_mode at 0x139898670>",
|
15 |
"__abstractmethods__": "frozenset()",
|
16 |
+
"_abc_impl": "<_abc._abc_data object at 0x139892d80>"
|
17 |
},
|
18 |
"verbose": 1,
|
19 |
"policy_kwargs": {
|
|
|
31 |
},
|
32 |
"observation_space": {
|
33 |
":type:": "<class 'gym.spaces.box.Box'>",
|
34 |
+
":serialized:": "gAWVMgwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBYWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWFAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/5RoC0sFhZSMAUOUdJRSlIwEaGlnaJRoEyiWFAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAf5RoC0sFhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolgUAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBYWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYFAAAAAAAAAAAAAAAAlGgiSwWFlGgWdJRSlIwKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwSX19yYW5kb21zdGF0ZV9jdG9ylJOUjAdNVDE5OTM3lGgujBRfX2JpdF9nZW5lcmF0b3JfY3RvcpSTlIaUUpR9lCiMDWJpdF9nZW5lcmF0b3KUjAdNVDE5OTM3lIwFc3RhdGWUfZQojANrZXmUaBMolsAJAAAAAAAAAAAAgCJI3W7TaYNo2fkCQTqkGso9PgD+gpj29/M/d+fXv7mxGN3/7aYgZyvV0Ye9Mqg636TmZE5bw2bcCxNeR8TyCBDpnUCPLrx7pKMgwAia7+EDxmTe1NYhO87+D5+vZcW2uMYIJE+6AI/OH6W3CCHYBR11hSSk3DFQo4K+FU7SurMp04MDN6NiNxRwecmWCuT2Q+JWuRXfnmbwrzFpuTQcnNAIdKd++P+QBG1UB+Uduc/saNr7TqOCD+pzMlEeyYTEbDegZvdCaXLWDoXO5FnPoSmO3TtOWUbLuE/F7yk4DT7ZPXKQtaF5n2YfUr8lL67nyWiQUkGk76JLL5uWXFW/i96GnepHUQ1/3EBqSAfbej/Qvbzt4joABFVtCIVVfSSLFxwyzLQ+se3Yp+jaNpm+ikeEUvP2OGCbBDLAtFWwver8m0VDA71UCYGErR0oumNjhtoAOeNzd/1QZU4iaVptCrkqZvcsS8MGAWmN3NO3zQBvEBrHr2s9oWEg1uLUwsyKwp3Ej3HciQGxOQ5+biDZhB8VLLl5RyiwJ+9S/ouy40Z3vBEFhfLASbWQAo2+5lsHDduWiIw+ALN2ooo4bfAFCk9UDac3plWLrtp9le1WUnu3bXM+gCtX0D2tvPg+EnEnodd0g3YprVxiDrQ9rEAggJtpC0r/JUbFkYXweRPxsx4Oeil7IVthzxTx7wDWbCPUrwvtBuYrSDD264NaeNeW2plKz69oH0zjZJf3fuK2tmM4Qi6hlKtNQCDB4GjgtEJcFyfzsYGMpFktH6A8IaEXFj7DbVUGkPdGLod9aXyFUoyzz/LM2HvGeiAFJ74L6vSsn56LFRtPI8IZa1LZlDUamoT8PxQ+nO0rMzoSPydacC/X16q4F3KTKdxRV3YOUg+7hr8pPUXAY8fKVMOC3DcK4rvdXv2i1HhuzPdGKep18KpcYboGB9YdRUfD3xFJzTj/kdWKEtIkZKArroo4WQvXK9m2O3wcasi7QvfDlEaI1P22R10kBQmIZIJEEevbBu+vAJVoT/vuYGCLT4BO7lnqtfkJCsq97mQoenp99p42vFF/79dvNbnA6u041MH3dwoahQCYbQZ1I6fYDqNz7Ga5hscD1zr1pxTYbuP/YdFgun+BM+MayFxilRd1scPzxmUVFGHawNZ/ZFFQuEwu2RyhweiDVCwi55NMfvWVB0xxdJZ/W6lCw7uNp73sfINNREqc3tt7myYn4Zx7PBOGLk2XKMJdsnIG22qn8DcWtX7B+sycFIA1bRe1tGAn3ndOOheba4LnEHg4Z5QXwlI2ri70aSBPn69o756Rc06HVYmYuKKfNl2XUlknUPXc+JoFHRIWTucRnZVGbY4yWec2J1vX3K5Sz+8sXU1aR17I8HxiawgaJ1tgggxY38Pf8SVlwL98FVa3VqjYSG8CS1kdwGeP/w+4Ru4vNX2RlOgMoEnD/9WZAwHkmPdtngENSd826EkfJL8zh8wv+gGbBEHuw2H0w3UP70+IvLePRKaYIBXifNMa+5QtAlLBzO+fN46O/m6l/OCi7RlxJR7bqHr4KkMksYw76XCA68xzLIf8cqaI2+zw2A+xPkNDyXoRPW2abw9HSOVPQWnHkFjT7xUOhjXtc30ICmIgXeHBNwndFpBzNncjnLCVawy3tZWDjgUHdoiP4wDY9INwXMzMy6dU2rbHpLcUJowkcm7gm2TZNdSS1JeA7oOj4J8r1pvm0mOvJvY7L/u5FppT8mU2Q2mEBYXA3o5TXiBmWLkL3tDZjKWvRCEdjergoQY4l/JSv0mx37ZlARhQMs8QA2XmfCRgGZq2s6/luASo4ZCOt7IE/ZuxkrpNh68hkbmDyEYAoBU3pCLojBU8aLJDIj1TbojVL/9Eg3EQ2EOvkDLO+pNjHVsZmOWeCVx+ZqjO1oaDZZ4BRSXQzSlOGR4RMzTw39kYKUxR1lhvMQbcY8tNLSEREALhIwBEd4jWk57ZWEgrYb0Az1KqsbJ7jLmYXO6hCEwoEThdFaJsMCoIX3IKVRp6sE1CRkwii25d/euBM0cwu3QkUIx7kVUi+HsjCP3gQzYmrGL6rSxdIB0i1FqVD9ph0Q/4j3vp8BXsg0vHJzaUkOb+6Oz4ZHyPHYw3msSvjEjVUldb4s8sodV/C79foirUAiXvOjHM3aYDFABKbzZdeUnLL/mG5+wVX9ef93ssJUxK8ElWb17RVrY8HAWLErz1hOp1TQ8Ew/tcVINrcivojfmlrYgNSKgnYd5w4q4IVdcM0hRZJW1I6QUl8OdYaT/88gCfOpXJsv9Cc/6HYbl3HLFjpsBRo2I1TUZ1RQbMiQSXlrF9ff6B27FUwbG01cAac66rIu4H66pNt5MRvtHsgW8P71ULDDqFdZfNr3aUi2tNZ0CJ/vC8g15/2DBfitzcSs30blUDaXoKmDbTnbzvsc45rpv0vZf5IRcbtWe4DW3UB0bFUIPlI4FdinM+OHOs3Z2ICYrQX1IRt7+/JK2iAIpLRp34P0ZRUUuYTpvlI2vT3p0EA6395THuXhqvKtVcS21MfiktsCT4K3HanLLnJmqQ4vg0jUa6pPRNdJuAzkYMCZMrzoMKBhmeHBRqg9d7nc7rIhMWyFPRvXfcMsW5vJt9QQ6mkItDxKlJqoGfeGA0zrxoXGkScZvO/BcB/7Yt1/X2GIzuTV6rrImmPBsZFgSEoQE7ySUAW1SubvRTSTzB8yWOzHZDtROzA+gE/ZNVVuSibZbhLvvehU0nFZKlTM3NaZon+XQegGgpMKKvdnWb3aD9tqIKGLAHdqAPah5QViwLM/X2xchqdCJ6W3P9lAFryrCRmjG3hBC+oPknkpqDchoTTxCjyzbgD8dT9s79WnPzP/S+Ob7kGyulItdPn10JqPB7E3nn+OG32aKG+z0dS0JCau7DZe6lI51TdzB96209Vz0vKTLJTztSeWSdF/PJZNkAQ4gqZ+RIMOnBvSET8BtdXVktZyTinZiNSYTN5sdJqIOyppvKv3Kg/xXPlRbROCtcF0sKOonlLIxATLypV5FCkWTLXYwIpsuLxkkEW5d9F0gc1DdiLMNamrcZFWdddtGGiQYolqtZN7bSg2jUyJCqWc++kcz4/AR8FSG4zwIF95A1OIMCisZ/RJGdTs2qzAOrErX0loqR7DgszURLK8VgP4fsta5Ksm/cyBybB34Pz/Gqe/yGMRkDfrT9va1MuJyhxf/wvCjwnuXrLeNs0Jh4rwUM+gfzjZGDW+IvzG2iAzH6rZFL37dnJULnz/jYGglC3cV6ljb0eZ40N5rK0VmpTVh41CAU9RTR9sdlCFXu01EWL1tfHwIee8vasEX3lGgIjAJ1NJSJiIeUUpQoSwNoDE5OTkr/////Sv////9LAHSUYk1wAoWUaBZ0lFKUjANwb3OUTXACdYwJaGFzX2dhdXNzlEsAjAVnYXVzc5RHAAAAAAAAAAB1YnViLg==",
|
35 |
"dtype": "float32",
|
36 |
"_shape": [
|
37 |
5
|
|
|
60 |
"_total_timesteps": 1000000,
|
61 |
"_num_timesteps_at_start": 0,
|
62 |
"seed": 0,
|
63 |
+
"action_noise": {
|
64 |
+
":type:": "<class 'stable_baselines3.common.noise.OrnsteinUhlenbeckActionNoise'>",
|
65 |
+
":serialized:": "gAWVVQEAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5ub2lzZZSMHE9ybnN0ZWluVWhsZW5iZWNrQWN0aW9uTm9pc2WUk5QpgZR9lCiMBl90aGV0YZRHP8MzMzMzMzOMA19tdZSMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYIAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksBhZSMAUOUdJRSlIwGX3NpZ21hlGgJKJYIAAAAAAAAADMzMzMzM9M/lGgQSwGFlGgUdJRSlIwDX2R0lEc/hHrhR64Ue4wNaW5pdGlhbF9ub2lzZZROjApub2lzZV9wcmV2lGgJKJYIAAAAAAAAAAAAAAAAAAAAlGgQSwGFlGgUdJRSlHViLg==",
|
66 |
+
"_theta": 0.15,
|
67 |
+
"_mu": "[0.]",
|
68 |
+
"_sigma": "[0.3]",
|
69 |
+
"_dt": 0.01,
|
70 |
+
"initial_noise": null,
|
71 |
+
"noise_prev": "[0.]"
|
72 |
+
},
|
73 |
+
"start_time": 1673811020596785684,
|
74 |
+
"learning_rate": {
|
75 |
+
":type:": "<class 'function'>",
|
76 |
+
":serialized:": "gAWVCQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMay9ncGZzZHN3b3JrL3Byb2plY3RzL3JlY2gvdWxpL3VwZjgyc3AvZW52X2RtYy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgkMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxrL2dwZnNkc3dvcmsvcHJvamVjdHMvcmVjaC91bGkvdXBmODJzcC9lbnZfZG1jL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
77 |
+
},
|
78 |
+
"tensorboard_log": "runs/CartpoleDMC-v0__ddpg__3757117300__1673811016/CartpoleDMC-v0",
|
79 |
"lr_schedule": {
|
80 |
":type:": "<class 'function'>",
|
81 |
+
":serialized:": "gAWVCQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMay9ncGZzZHN3b3JrL3Byb2plY3RzL3JlY2gvdWxpL3VwZjgyc3AvZW52X2RtYy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgkMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxrL2dwZnNkc3dvcmsvcHJvamVjdHMvcmVjaC91bGkvdXBmODJzcC9lbnZfZG1jL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
82 |
},
|
83 |
"_last_obs": null,
|
84 |
"_last_episode_starts": {
|
|
|
87 |
},
|
88 |
"_last_original_obs": {
|
89 |
":type:": "<class 'numpy.ndarray'>",
|
90 |
+
":serialized:": "gAWViQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYUAAAAAAAAAF4seT/vRX4/JXntPbMYHb8I7ZU+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksBSwWGlIwBQ5R0lFKULg=="
|
91 |
},
|
92 |
"_episode_num": 1000,
|
93 |
"use_sde": false,
|
|
|
95 |
"_current_progress_remaining": 0.0,
|
96 |
"ep_info_buffer": {
|
97 |
":type:": "<class 'collections.deque'>",
|
98 |
+
":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIrKxtigc8jUCUhpRSlIwBbJRN6AOMAXSUR0DIWeA+yJKrdX2UKGgGaAloD0MIox03/M55jkCUhpRSlGgVTegDaBZHQMhhHExIre91fZQoaAZoCWgPQwgYl6q0hU+NQJSGlFKUaBVN6ANoFkdAyGiDqTKT0XV9lChoBmgJaA9DCDfjNEQVQ4tAlIaUUpRoFU3oA2gWR0DIb4AbsF+vdX2UKGgGaAloD0MIfR8OEoIOhkCUhpRSlGgVTegDaBZHQMh20Mr/bTN1fZQoaAZoCWgPQwg8bCIzV+KOQJSGlFKUaBVN6ANoFkdAyH48ow22onV9lChoBmgJaA9DCAjHLHvyoYdAlIaUUpRoFU3oA2gWR0DIhSVqcmShdX2UKGgGaAloD0MIVP1K5+PsjUCUhpRSlGgVTegDaBZHQMiMizz/ZNB1fZQoaAZoCWgPQwicTrLVJUWMQJSGlFKUaBVN6ANoFkdAyJNff+jubHV9lChoBmgJaA9DCJJ6T+V0uYRAlIaUUpRoFU3oA2gWR0DImd5uXNTtdX2UKGgGaAloD0MIinYVUh49h0CUhpRSlGgVTegDaBZHQMigtxIatLd1fZQoaAZoCWgPQwicNXhfFcaLQJSGlFKUaBVN6ANoFkdAyKd28/UvwnV9lChoBmgJaA9DCNIdxM70HYRAlIaUUpRoFU3oA2gWR0DIrgV8XvYwdX2UKGgGaAloD0MIhllo57TKekCUhpRSlGgVTegDaBZHQMi1dw0GeMB1fZQoaAZoCWgPQwiVu8/x8XKOQJSGlFKUaBVN6ANoFkdAyLzSz5XU6XV9lChoBmgJaA9DCEdzZOU34odAlIaUUpRoFU3oA2gWR0DIw/TDEWIodX2UKGgGaAloD0MIR1UTRD2/jECUhpRSlGgVTegDaBZHQMjLTiyhSLt1fZQoaAZoCWgPQwjpmV5iLKGDQJSGlFKUaBVN6ANoFkdAyNK3Nzr/sHV9lChoBmgJaA9DCBueXinLXYlAlIaUUpRoFU3oA2gWR0DI2b7Z8KG+dX2UKGgGaAloD0MIw552+IsHjUCUhpRSlGgVTegDaBZHQMjg8b2criF1fZQoaAZoCWgPQwgSUOEIstaGQJSGlFKUaBVN6ANoFkdAyOfHncL0BnV9lChoBmgJaA9DCBuEud3rfYxAlIaUUpRoFU3oA2gWR0DI7kc1TBIndX2UKGgGaAloD0MINEksKbeyiECUhpRSlGgVTegDaBZHQMj1IlbVz6t1fZQoaAZoCWgPQwhh4/p3nUCOQJSGlFKUaBVN6ANoFkdAyPvwV8kUsXV9lChoBmgJaA9DCHxinSpf04VAlIaUUpRoFU3oA2gWR0DJApc9U0emdX2UKGgGaAloD0MIP3PWp9zKjkCUhpRSlGgVTegDaBZHQMkPzjyOJch1fZQoaAZoCWgPQwipFDsaB9KOQJSGlFKUaBVN6ANoFkdAyRbp+GXXy3V9lChoBmgJaA9DCJPJqZ0hwIdAlIaUUpRoFU3oA2gWR0DJHkjdYW+HdX2UKGgGaAloD0MIx4Ds9W4wekCUhpRSlGgVTegDaBZHQMkluHmig011fZQoaAZoCWgPQwhsy4Cz9PKGQJSGlFKUaBVN6ANoFkdAySy+/47A+XV9lChoBmgJaA9DCD+O5sgKJo5AlIaUUpRoFU3oA2gWR0DJM/9j9XLedX2UKGgGaAloD0MI9WVpp0Yah0CUhpRSlGgVTegDaBZHQMk62w3YL9d1fZQoaAZoCWgPQwj4HFiOEBGMQJSGlFKUaBVN6ANoFkdAyUFxSXMQmXV9lChoBmgJaA9DCMdI9gj1YoNAlIaUUpRoFU3oA2gWR0DJSFAWxhUjdX2UKGgGaAloD0MIliNkIE87g0CUhpRSlGgVTegDaBZHQMlPPVlXiit1fZQoaAZoCWgPQwhHHogsEnCBQJSGlFKUaBVN6ANoFkdAyVX+CHRCyHV9lChoBmgJaA9DCAucbAPXEY5AlIaUUpRoFU3oA2gWR0DJXYU+kgwHdX2UKGgGaAloD0MIdH0fDpKai0CUhpRSlGgVTegDaBZHQMllEFCswL51fZQoaAZoCWgPQwjovwevHaaLQJSGlFKUaBVN6ANoFkdAyWxAOnVG1HV9lChoBmgJaA9DCGppboVwE4lAlIaUUpRoFU3oA2gWR0DJc8enO0LMdX2UKGgGaAloD0MI3gAz32H8jUCUhpRSlGgVTegDaBZHQMl7PzyauwJ1fZQoaAZoCWgPQwiTOCuiRjCDQJSGlFKUaBVN6ANoFkdAyYJrYTTOPnV9lChoBmgJaA9DCAJnKVmujolAlIaUUpRoFU3oA2gWR0DJiXncgyM2dX2UKGgGaAloD0MIRwTj4BLKjECUhpRSlGgVTegDaBZHQMmQa9joZAJ1fZQoaAZoCWgPQwjYRdEDv8KBQJSGlFKUaBVN6ANoFkdAyZcI7cwg1XV9lChoBmgJaA9DCJ8B9WaUr3pAlIaUUpRoFU3oA2gWR0DJnfLZtelbdX2UKGgGaAloD0MIEalpF5OjhUCUhpRSlGgVTegDaBZHQMmkkoP07Kd1fZQoaAZoCWgPQwjGM2jo32KNQJSGlFKUaBVN6ANoFkdAyavHxKg7HXV9lChoBmgJaA9DCJiJIqQOjYtAlIaUUpRoFU3oA2gWR0DJs0u6wt8NdX2UKGgGaAloD0MIYMrAAU3AgUCUhpRSlGgVTegDaBZHQMm6czjm0Vt1fZQoaAZoCWgPQwjJBWfwl7mFQJSGlFKUaBVN6ANoFkdAycfKiTMaCXV9lChoBmgJaA9DCEvK3efYw4pAlIaUUpRoFU3oA2gWR0DJz1ez0HyFdX2UKGgGaAloD0MIntFWJVERi0CUhpRSlGgVTegDaBZHQMnWkFlK9PF1fZQoaAZoCWgPQwj9hokGKQGHQJSGlFKUaBVN6ANoFkdAyd2JqrR0EHV9lChoBmgJaA9DCF+4c2FEWI5AlIaUUpRoFU3oA2gWR0DJ5BZY5ksjdX2UKGgGaAloD0MIhIO9iUGmikCUhpRSlGgVTegDaBZHQMnq+NpM6BB1fZQoaAZoCWgPQwha8KKvgI2KQJSGlFKUaBVN6ANoFkdAyfHdxlQMyHV9lChoBmgJaA9DCMmwijeSlopAlIaUUpRoFU3oA2gWR0DJ+Ckyad+YdX2UKGgGaAloD0MItTf4wiQrjECUhpRSlGgVTegDaBZHQMn/swaaTfR1fZQoaAZoCWgPQwjMe5xpovWKQJSGlFKUaBVN6ANoFkdAygdCTvAoHHV9lChoBmgJaA9DCHP3OT5agI5AlIaUUpRoFU3oA2gWR0DKDntJpWWAdX2UKGgGaAloD0MI8Z4Dy7Gxg0CUhpRSlGgVTegDaBZHQMoWDL6+FlF1fZQoaAZoCWgPQwiBzM6i1+yMQJSGlFKUaBVN6ANoFkdAyh2DUz9CNXV9lChoBmgJaA9DCMfw2M+iJ4hAlIaUUpRoFU3oA2gWR0DKJLRaLXMAdX2UKGgGaAloD0MIFxIwulxQikCUhpRSlGgVTegDaBZHQMor+n1e0HB1fZQoaAZoCWgPQwhvZYnO0oOEQJSGlFKUaBVN6ANoFkdAyjLqQf6oEXV9lChoBmgJaA9DCC7IluVLDopAlIaUUpRoFU3oA2gWR0DKOYVr433pdX2UKGgGaAloD0MIizVc5N5niUCUhpRSlGgVTegDaBZHQMpAcgEt/Wl1fZQoaAZoCWgPQwjxDYXPlmZ/QJSGlFKUaBVN6ANoFkdAykdljiGWU3V9lChoBmgJaA9DCKbydoRT5oJAlIaUUpRoFU3oA2gWR0DKTiC35N48dX2UKGgGaAloD0MIFf4MbzbMjECUhpRSlGgVTegDaBZHQMpVpRKg7HR1fZQoaAZoCWgPQwjj/iPTQe6LQJSGlFKUaBVN6ANoFkdAyl00YNy5qnV9lChoBmgJaA9DCMa/z7iw/YtAlIaUUpRoFU3oA2gWR0DKZF4nWrfcdX2UKGgGaAloD0MIxQPKplyigUCUhpRSlGgVTegDaBZHQMpr8MZP2wp1fZQoaAZoCWgPQwgx0/avTL6OQJSGlFKUaBVN6ANoFkdAynOEgnMMZ3V9lChoBmgJaA9DCFRweEFk7I1AlIaUUpRoFU3oA2gWR0DKgFMMCtA+dX2UKGgGaAloD0MIl6jeGpjcjkCUhpRSlGgVTegDaBZHQMqHSTJyQxN1fZQoaAZoCWgPQwjtEP+wJSaHQJSGlFKUaBVN6ANoFkdAyo3tK+SKWXV9lChoBmgJaA9DCAFNhA2vq45AlIaUUpRoFU3oA2gWR0DKlOLmGM4tdX2UKGgGaAloD0MIvVErTL8hjUCUhpRSlGgVTegDaBZHQMqb5IsiB5J1fZQoaAZoCWgPQwhlx0Yg3gWCQJSGlFKUaBVN6ANoFkdAyqLDYHPeHnV9lChoBmgJaA9DCKSOjqux7ItAlIaUUpRoFU3oA2gWR0DKqnExZdOZdX2UKGgGaAloD0MI6IU7F6Ymh0CUhpRSlGgVTegDaBZHQMqx8qNAC4l1fZQoaAZoCWgPQwj9SufDE0SLQJSGlFKUaBVN6ANoFkdAyrlB8VHnU3V9lChoBmgJaA9DCKUvhJxXnYlAlIaUUpRoFU3oA2gWR0DKwNgkgOjJdX2UKGgGaAloD0MIUP2DSCbih0CUhpRSlGgVTegDaBZHQMrIAFj/dZd1fZQoaAZoCWgPQwgB/FOqJDOHQJSGlFKUaBVN6ANoFkdAys+Ebn5i3HV9lChoBmgJaA9DCPfnoiHjM3tAlIaUUpRoFU3oA2gWR0DK1sdWS2YwdX2UKGgGaAloD0MIb7ckB8yjg0CUhpRSlGgVTegDaBZHQMreEmM4tHx1fZQoaAZoCWgPQwiXVdgMkJiKQJSGlFKUaBVN6ANoFkdAyuVwMnZ00XV9lChoBmgJaA9DCOTbuwY9oolAlIaUUpRoFU3oA2gWR0DK7GoFkhA4dX2UKGgGaAloD0MIdChDVcxbiECUhpRSlGgVTegDaBZHQMrwseJgssh1fZQoaAZoCWgPQwjJ/+Tv/ueKQJSGlFKUaBVN6ANoFkdAyvTmH31zyXV9lChoBmgJaA9DCF3Ed2LW4IpAlIaUUpRoFU3oA2gWR0DK+Rp6F/QTdX2UKGgGaAloD0MIEYsYdlgMiECUhpRSlGgVTegDaBZHQMr9TdJz1bt1fZQoaAZoCWgPQwiCOA8ncCOIQJSGlFKUaBVN6ANoFkdAywGCMpgCwXV9lChoBmgJaA9DCBajrrUXs4hAlIaUUpRoFU3oA2gWR0DLBbXf4yoGdX2UKGgGaAloD0MI+grSjIV7h0CUhpRSlGgVTegDaBZHQMsJ6PNFBpp1fZQoaAZoCWgPQwhm3T8WAjqJQJSGlFKUaBVN6ANoFkdAyw4cjfNzKnV9lChoBmgJaA9DCIeiQJ9ojYZAlIaUUpRoFU3oA2gWR0DLEk8zl90BdWUu"
|
99 |
},
|
100 |
"ep_success_buffer": {
|
101 |
":type:": "<class 'collections.deque'>",
|
|
|
103 |
},
|
104 |
"_n_updates": 1000000,
|
105 |
"buffer_size": 1,
|
106 |
+
"batch_size": 64,
|
107 |
"learning_starts": 100,
|
108 |
"tau": 0.005,
|
109 |
"gamma": 0.99,
|
|
|
114 |
":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
|
115 |
"__module__": "stable_baselines3.common.buffers",
|
116 |
"__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
117 |
+
"__init__": "<function ReplayBuffer.__init__ at 0x139896dd0>",
|
118 |
+
"add": "<function ReplayBuffer.add at 0x139896e60>",
|
119 |
+
"sample": "<function ReplayBuffer.sample at 0x139896ef0>",
|
120 |
+
"_get_samples": "<function ReplayBuffer._get_samples at 0x139896f80>",
|
121 |
"__abstractmethods__": "frozenset()",
|
122 |
+
"_abc_impl": "<_abc._abc_data object at 0x139836280>"
|
123 |
},
|
124 |
"replay_buffer_kwargs": {},
|
125 |
"train_freq": {
|
ddpg-CartpoleDMC-v0/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1492509
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2b4d0b8ccac39463f11616bef8492f3180debfd1e197a9a8023faf2072d6528
|
3 |
size 1492509
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:613f7d0e18c00bd0917ad26f69552b415640cd2300288ec5f3efab70698e7b45
|
3 |
+
size 156822
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 885.5004687999999, "std_reward": 4.93610187527313, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-01-16T08:50:36.963750"}
|
train_eval_metrics.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2ab4ce5419d6105f084e517a228f67bf79a341d2cc807c442d89f1739bd5c88
|
3 |
+
size 43170
|