kingabzpro committed on
Commit
ee9de69
1 Parent(s): 5e626a1

improved score

Browse files
Files changed (6)
  1. .gitattributes +4 -1
  2. README.md +2 -2
  3. hyperparameters.json +1 -1
  4. model.pt +2 -2
  5. replay.mp4 +2 -2
  6. results.json +1 -1
.gitattributes CHANGED
@@ -2,11 +2,13 @@
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
 
5
  *.ftz filter=lfs diff=lfs merge=lfs -text
6
  *.gz filter=lfs diff=lfs merge=lfs -text
7
  *.h5 filter=lfs diff=lfs merge=lfs -text
8
  *.joblib filter=lfs diff=lfs merge=lfs -text
9
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
 
10
  *.model filter=lfs diff=lfs merge=lfs -text
11
  *.msgpack filter=lfs diff=lfs merge=lfs -text
12
  *.npy filter=lfs diff=lfs merge=lfs -text
@@ -20,6 +22,7 @@
20
  *.pt filter=lfs diff=lfs merge=lfs -text
21
  *.pth filter=lfs diff=lfs merge=lfs -text
22
  *.rar filter=lfs diff=lfs merge=lfs -text
 
23
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
24
  *.tar.* filter=lfs diff=lfs merge=lfs -text
25
  *.tflite filter=lfs diff=lfs merge=lfs -text
@@ -29,4 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
29
  *.zip filter=lfs diff=lfs merge=lfs -text
30
  *.zst filter=lfs diff=lfs merge=lfs -text
31
  *tfevents* filter=lfs diff=lfs merge=lfs -text
32
- *.mp4 filter=lfs diff=lfs merge=lfs -text
 
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
10
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
  *.model filter=lfs diff=lfs merge=lfs -text
13
  *.msgpack filter=lfs diff=lfs merge=lfs -text
14
  *.npy filter=lfs diff=lfs merge=lfs -text
 
22
  *.pt filter=lfs diff=lfs merge=lfs -text
23
  *.pth filter=lfs diff=lfs merge=lfs -text
24
  *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
28
  *.tflite filter=lfs diff=lfs merge=lfs -text
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ replay.mp4 filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -16,12 +16,12 @@ model-index:
16
  type: Pixelcopter-PLE-v0
17
  metrics:
18
  - type: mean_reward
19
- value: 13.60 +/- 13.28
20
  name: mean_reward
21
  verified: false
22
  ---
23
 
24
  # **Reinforce** Agent playing **Pixelcopter-PLE-v0**
25
  This is a trained model of a **Reinforce** agent playing **Pixelcopter-PLE-v0** .
26
- To learn to use this model and train yours check Unit 5 of the Deep Reinforcement Learning Class: https://github.com/huggingface/deep-rl-class/tree/main/unit5
27
 
 
16
  type: Pixelcopter-PLE-v0
17
  metrics:
18
  - type: mean_reward
19
+ value: 31.30 +/- 20.84
20
  name: mean_reward
21
  verified: false
22
  ---
23
 
24
  # **Reinforce** Agent playing **Pixelcopter-PLE-v0**
25
  This is a trained model of a **Reinforce** agent playing **Pixelcopter-PLE-v0** .
26
+ To learn to use this model and train yours check Unit 4 of the Deep Reinforcement Learning Course: https://huggingface.co/deep-rl-course/unit4/introduction
27
 
hyperparameters.json CHANGED
@@ -1 +1 @@
1
- {"h_size": 64, "n_training_episodes": 50000, "n_evaluation_episodes": 10, "max_t": 10000, "gamma": 0.99, "lr": 0.0001, "env_id": "Pixelcopter-PLE-v0", "state_space": 7, "action_space": 2}
 
1
+ {"h_size": 64, "n_training_episodes": 20000, "n_evaluation_episodes": 10, "max_t": 10000, "gamma": 0.99, "lr": 0.0001, "env_id": "Pixelcopter-PLE-v0", "state_space": 7, "action_space": 2}
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10f60fa4d48c073b106f843351cb646596bc6bd97af4927b646fd690f10f21a0
3
- size 4703
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3779a795f7d49921e18a8125f54c2b27a51246976e11512b0b513bbd9c52c0b
3
+ size 38919
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ab8e6784af18e6f655dc1e98b875bf07ade70f2e35038bb164bbce0836c9fb3
3
- size 6180
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6b6892414d614d2a928af23ddf5e12a84d93319c6da8583a6b2017ce43ec062
3
+ size 9347
results.json CHANGED
@@ -1 +1 @@
1
- {"env_id": "Pixelcopter-PLE-v0", "mean_reward": 13.6, "n_evaluation_episodes": 10, "eval_datetime": "2022-08-29T10:30:53.664728"}
 
1
+ {"env_id": "Pixelcopter-PLE-v0", "mean_reward": 31.3, "n_evaluation_episodes": 10, "eval_datetime": "2023-03-06T00:39:28.930086"}