ws11yrin committed on
Commit
d0c6576
1 Parent(s): 20eb6ba

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 666.50 +/- 208.52
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 832.00 +/- 383.77
20
  name: mean_reward
21
  verified: false
22
  ---
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52993075153796e27aefef787c889b7036dc4640196cd27fa1ac9d0b0a3f0c1c
3
- size 27220321
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:968484aea4628dc8fa4fa7e00e942797be95da5244d5a54e0339d93d2aa805ea
3
+ size 27220312
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8579f64ca4cbc9b4a54f8b0a204fa4acb5f53f5d2d185bc6d3bface7ddc233ef
3
  size 13505852
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1feabd244e20fad6d62d5cf135b44dc3d39e4ac64a0bf4ce7a1d40a1309572b3
3
  size 13505852
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9d95413203937294ee8caa756df359e782d8312432b5a39eec67e69b42eff13
3
  size 13505178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:061614a0337d927e5774943bf9c7c1c1ccef112fdc88ea75ccab0d636b461e04
3
  size 13505178
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bedcaea2b1aa81620507c67a95b58bcec4f6dacad58301a86111d8a2c855c29e
3
- size 241433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8ceb9d8b65dde354ef145e2576583cebd17425dd0ed39d0060f7b5b5e8c5846
3
+ size 200040
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 666.5, "std_reward": 208.51918376974336, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-14T00:41:11.182994"}
 
1
+ {"mean_reward": 832.0, "std_reward": 383.7655534307372, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-14T00:43:40.409083"}