MattStammers committed on
Commit
544ac9d
1 Parent(s): 2a99e34

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: PongNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 20.30 +/- 0.90
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -82,5 +82,3 @@ OrderedDict([('batch_size', 256),
82
  ```python
83
  {'render_mode': 'rgb_array'}
84
  ```
85
-
86
- Still more work to go here as well. Need to get closer to the perfect 21
 
16
  type: PongNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 21.00 +/- 0.00
20
  name: mean_reward
21
  verified: false
22
  ---
 
82
  ```python
83
  {'render_mode': 'rgb_array'}
84
  ```
 
 
ppo-PongNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e34d72818a6c7db3995c4f2028bc9628685348b8a04c6762a67c5759b9d63e7
3
- size 20437483
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b76936e23cb806928a263bd6fdb5cbfa9a448e165887af453899257c1e743170
3
+ size 20437498
ppo-PongNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
ppo-PongNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8eceebac7677b8673fa18426b62d8e456b3fcbdae6134ea252e71e499c62b98
3
  size 13511033
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f58b06572568321b8eb5fb31c45a059fdf2fd94a96492570cfc6813adf1e72d9
3
  size 13511033
ppo-PongNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39d65eecb1bab75578ac19cf3c99cafb0f3b88a690282420a0c50236b85b339b
3
  size 6757441
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1eb5a972f5e6d3510a262a357031380a7667e8bd1a9f271f92259136e8f73d7
3
  size 6757441
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:598827e83f56e9447687b9c41cdd327b04aad54744136c833c04473eddd73aa3
3
- size 65237
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46166601cb6c58f1fdab1b3dd30cec1939c81ea4e27649d6294536067746e33a
3
+ size 73911
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 20.3, "std_reward": 0.9000000000000001, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-09-05T06:50:27.253432"}
 
1
+ {"mean_reward": 21.0, "std_reward": 0.0, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-09-09T19:23:56.034135"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5443672ef416473cf95509d950e26888854d3793e8cb368307c72cf584dfc854
3
- size 483948
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cd267dfc0cf409961f284a389c9334fbc3fca789a2092ddfcb726c45761d51d
3
+ size 1598840