Upload PPO CarRacing-v2 trained agent

Files changed (8) hide show

README.md CHANGED Viewed

@@ -16,7 +16,7 @@ model-index:
       type: CarRacing-v2
     metrics:
     - type: mean_reward
-      value: -83.17 +/- 1.05
       name: mean_reward
       verified: false
 ---

       type: CarRacing-v2
     metrics:
     - type: mean_reward
+      value: 56.32 +/- 35.69
       name: mean_reward
       verified: false
 ---

config.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

ppo-CarRacing-v2.zip CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5cde64c9fdcf40be21eae0773118280739a86838d671749ce0225a4de4ad9199
-size 26323957

 version https://git-lfs.github.com/spec/v1
+oid sha256:149fa9c9cd45d4123eb5b038e3ed62ac7691c60f6695a785877792420f78305f
+size 26323576

ppo-CarRacing-v2/data CHANGED Viewed

The diff for this file is too large to render. See raw diff

ppo-CarRacing-v2/policy.optimizer.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fe0ff6f4cf8ec2f04dbc891df9dd73be097b676c5702563808a08f724f509da6
 size 17416033

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ad1713a43bae37f222a58839f50b2f05f769e8e091f3c8f7a218fa53c49d7c3
 size 17416033

ppo-CarRacing-v2/policy.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:150415e1b0b84e0aad3cd70473d649f3bbd143d90037b59fd534c7b1ec37c3ae
 size 8710383

 version https://git-lfs.github.com/spec/v1
+oid sha256:b932caafa555d4fedb0916465441e71dec2b71f5c49595d234c8a3de1e8f964a
 size 8710383

replay.mp4 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5c583f2d3e16df6aa5dbc8b57d0adf27ebeb568cb9ed8603c4b2d68d9a8f7d2a
-size 1193817

 version https://git-lfs.github.com/spec/v1
+oid sha256:005b0fc17b51c96b5a540f319c2a41d316e7f0b90fd552caa8aa7f55d013b1c6
+size 466355

results.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"mean_reward": -83.17350280000001, "std_reward": 1.0504133584746358, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-11-17T16:24:25.640912"}


1	+ {"mean_reward": 56.3192213, "std_reward": 35.68732608885631, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-11-23T10:01:06.854190"}