nsanghi committed on
Commit
b5d8648
1 Parent(s): 0470e29

Push to Hub

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: BreakoutNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 104.50 +/- 45.47
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: BreakoutNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 42.80 +/- 16.37
20
  name: mean_reward
21
  verified: false
22
  ---
args.yml CHANGED
@@ -12,7 +12,7 @@
12
  - - eval_episodes
13
  - 10
14
  - - eval_freq
15
- - 25000
16
  - - gym_packages
17
  - []
18
  - - hyperparams
@@ -20,7 +20,7 @@
20
  - - log_folder
21
  - logs/6_c/rlzoo3/
22
  - - log_interval
23
- - -1
24
  - - max_total_trials
25
  - null
26
  - - n_eval_envs
@@ -32,7 +32,7 @@
32
  - - n_startup_trials
33
  - 10
34
  - - n_timesteps
35
- - 1000000
36
  - - n_trials
37
  - 500
38
  - - no_optim_plots
@@ -50,17 +50,17 @@
50
  - - sampler
51
  - tpe
52
  - - save_freq
53
- - 100000
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2330502263
58
  - - storage
59
  - null
60
  - - study_name
61
  - null
62
  - - tensorboard_log
63
- - runs/BreakoutNoFrameskip-v4__dqn__2330502263__1713096824
64
  - - track
65
  - true
66
  - - trained_agent
@@ -76,6 +76,6 @@
76
  - - wandb_entity
77
  - null
78
  - - wandb_project_name
79
- - dqn-breakout-gpu
80
  - - wandb_tags
81
  - []
 
12
  - - eval_episodes
13
  - 10
14
  - - eval_freq
15
+ - 10000
16
  - - gym_packages
17
  - []
18
  - - hyperparams
 
20
  - - log_folder
21
  - logs/6_c/rlzoo3/
22
  - - log_interval
23
+ - 400
24
  - - max_total_trials
25
  - null
26
  - - n_eval_envs
 
32
  - - n_startup_trials
33
  - 10
34
  - - n_timesteps
35
+ - 500000
36
  - - n_trials
37
  - 500
38
  - - no_optim_plots
 
50
  - - sampler
51
  - tpe
52
  - - save_freq
53
+ - 10000
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2363843725
58
  - - storage
59
  - null
60
  - - study_name
61
  - null
62
  - - tensorboard_log
63
+ - runs/BreakoutNoFrameskip-v4__dqn__2363843725__1713097209
64
  - - track
65
  - true
66
  - - trained_agent
 
76
  - - wandb_entity
77
  - null
78
  - - wandb_project_name
79
+ - dqn-breakout
80
  - - wandb_tags
81
  - []
dqn-BreakoutNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de7e49c22f6a089cbbf81d3a59d75a97587e605e738be0297373460ddf01dee0
3
- size 27203650
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18fb29212f83b706f1894da623327c0da8abfb5c36611b65c13f8a312c3d616b
3
+ size 27203195
dqn-BreakoutNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-BreakoutNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb5af1302fc777fa403d438c95334dac43fc6f69b90f30ace0435ea0ebb2d078
3
- size 13498044
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0145c4ec10d38d4959aa379c5ad4ea0fb68771fb3d6f6c06b1e9b7221a36e076
3
+ size 13497660
dqn-BreakoutNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f565084fcc52b4c9caec5882228a84863f58101a6d0907d758df9fda342e02fd
3
- size 13497178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d42692dca5516497d5ab50165f41419c4b9409ac9ca31c0fe6f1f199048d1cf7
3
+ size 13496986
dqn-BreakoutNoFrameskip-v4/system_info.txt CHANGED
@@ -1,9 +1,9 @@
1
- - OS: Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023
2
- - Python: 3.10.12
3
  - Stable-Baselines3: 2.1.0
4
- - PyTorch: 2.2.1+cu121
5
- - GPU Enabled: True
6
- - Numpy: 1.25.2
7
- - Cloudpickle: 2.2.1
8
  - Gymnasium: 0.29.1
9
  - OpenAI Gym: 0.26.2
 
1
+ - OS: Linux-5.15.146.1-microsoft-standard-WSL2-x86_64-with-glibc2.35 # 1 SMP Thu Jan 11 04:09:03 UTC 2024
2
+ - Python: 3.9.18
3
  - Stable-Baselines3: 2.1.0
4
+ - PyTorch: 2.1.0+cpu
5
+ - GPU Enabled: False
6
+ - Numpy: 1.26.1
7
+ - Cloudpickle: 3.0.0
8
  - Gymnasium: 0.29.1
9
  - OpenAI Gym: 0.26.2
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3c426c9a9cc6e55742562142ddc080f38ebce56f22ae3e865b43bed976ec2fc
3
- size 72778
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57af4c35b302181eb2b6cc7a8b52df379d2738019e0a22c1c8079f5ec976cfa8
3
+ size 73180
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 104.5, "std_reward": 45.47141959516989, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-04-14T13:50:20.373742"}
 
1
+ {"mean_reward": 42.8, "std_reward": 16.36948380371232, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-04-14T19:45:56.555308"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5579a530a30fc1732198ef4494531effd410b1fe66e42f7ab340687dc4368f88
3
- size 50202
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d588a8292d999fc90fa65f33f6b364c901d2e2bd16e8a560742025cb5e0c082
3
+ size 40084