Initial car racing model
Browse files- README.md +1 -1
- config.json +0 -0
- ppo-CarRacing.zip +2 -2
- ppo-CarRacing/data +0 -0
- ppo-CarRacing/policy.optimizer.pth +1 -1
- ppo-CarRacing/policy.pth +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
README.md
CHANGED
@@ -10,7 +10,7 @@ model-index:
|
|
10 |
results:
|
11 |
- metrics:
|
12 |
- type: mean_reward
|
13 |
-
value:
|
14 |
name: mean_reward
|
15 |
task:
|
16 |
type: reinforcement-learning
|
|
|
10 |
results:
|
11 |
- metrics:
|
12 |
- type: mean_reward
|
13 |
+
value: 627.21 +/- 126.96
|
14 |
name: mean_reward
|
15 |
task:
|
16 |
type: reinforcement-learning
|
config.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
ppo-CarRacing.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71f5824945d22f258f7212bfe837423a952d2d262ed6dc658f7ffa06d6e6b828
|
3 |
+
size 27023488
|
ppo-CarRacing/data
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
ppo-CarRacing/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 17412055
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c834441ec29d574b9e77fa891e8df50c12d223275d219472fdf780c746a96c8
|
3 |
size 17412055
|
ppo-CarRacing/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 8706942
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b995535aebf34a53ded8f5fbcbbbf8fcb58456c5312e7c2893a6b8b5386d976b
|
3 |
size 8706942
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7e46a7185d38d53942bf2d03015fcb538ffe8aab7d3197dae1a5e34f79f1d40
|
3 |
+
size 845942
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 627.2098754033447, "std_reward": 126.95656141100422, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-07-03T10:57:05.029641"}
|