ldaquan1996 committed on
Commit
1d7c8ba
1 Parent(s): 93a4a96

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 237.00 +/- 42.61
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 32),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 10000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 228.00 +/- 72.88
20
  name: mean_reward
21
  verified: false
22
  ---
 
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2661585381
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 3730863654
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 10000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d6520f35b5adb07a71fdaa0958327339a36b9d0bc686f1323e2d5677dbbd5dfa
3
- size 27224318
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbe646d731812d0a85adb71b1bd1d2884e4adb9f6d7a40b627790e080bddb33b
3
+ size 27224310
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d4cd9a0644c73582456999eeeea6759a66f71daa6badfd28b57d700c976f333
3
  size 13505419
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:971d8bb029160e298a4e7bcc2068c558d91a3b4f2f755e95f09ae6f3ca553a5b
3
  size 13505419
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6868833d9e0a267277a1dd0d68fdfbe1df3b13ca0ace7075c8eb53d90bf360cb
3
  size 13504745
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46ca94c78c24a3565ec55e16e5e20c7fe100ade479bce5d5dd57925fab2d442d
3
  size 13504745
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2d7a8d48b7f0fa9321240af4092ed43710b51af7c9e77f108f457002b7d4fae
3
- size 256978
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5197dc5fc37088023037d9c41d904c537655e841166bab6a7213ae14f8a02f76
3
+ size 247900
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 237.0, "std_reward": 42.61455150532503, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-03-21T04:54:49.844926"}
 
1
+ {"mean_reward": 228.0, "std_reward": 72.8766080440082, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-03-21T07:49:27.297960"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5510d19a94740cc9aced7770deb0d63e715c46aa28e84d19f5e216b0af512f91
3
- size 16423
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23495d370c1429b3db69944ccf15a2e89577bb8d7b42299a679190b1d81477db
3
+ size 17787