Cheekydave committed on
Commit
7420e46
1 Parent(s): 8f92897

Upload PPO CarRacing-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: CarRacing-v2
17
  metrics:
18
  - type: mean_reward
19
- value: -83.17 +/- 1.05
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: CarRacing-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 56.32 +/- 35.69
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
The diff for this file is too large to render. See raw diff
 
ppo-CarRacing-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5cde64c9fdcf40be21eae0773118280739a86838d671749ce0225a4de4ad9199
3
- size 26323957
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:149fa9c9cd45d4123eb5b038e3ed62ac7691c60f6695a785877792420f78305f
3
+ size 26323576
ppo-CarRacing-v2/data CHANGED
The diff for this file is too large to render. See raw diff
 
ppo-CarRacing-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe0ff6f4cf8ec2f04dbc891df9dd73be097b676c5702563808a08f724f509da6
3
  size 17416033
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ad1713a43bae37f222a58839f50b2f05f769e8e091f3c8f7a218fa53c49d7c3
3
  size 17416033
ppo-CarRacing-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:150415e1b0b84e0aad3cd70473d649f3bbd143d90037b59fd534c7b1ec37c3ae
3
  size 8710383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b932caafa555d4fedb0916465441e71dec2b71f5c49595d234c8a3de1e8f964a
3
  size 8710383
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c583f2d3e16df6aa5dbc8b57d0adf27ebeb568cb9ed8603c4b2d68d9a8f7d2a
3
- size 1193817
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:005b0fc17b51c96b5a540f319c2a41d316e7f0b90fd552caa8aa7f55d013b1c6
3
+ size 466355
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -83.17350280000001, "std_reward": 1.0504133584746358, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-11-17T16:24:25.640912"}
 
1
+ {"mean_reward": 56.3192213, "std_reward": 35.68732608885631, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-11-23T10:01:06.854190"}