electricwapiti committed on
Commit
d5b504d
1 Parent(s): cafcd82

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 217.50 +/- 45.62
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 148.00 +/- 49.31
20
  name: mean_reward
21
  verified: false
22
  ---
args.yml CHANGED
@@ -56,7 +56,7 @@
56
  - - save_replay_buffer
57
  - false
58
  - - seed
59
- - 3492336383
60
  - - storage
61
  - null
62
  - - study_name
 
56
  - - save_replay_buffer
57
  - false
58
  - - seed
59
+ - 2338804685
60
  - - storage
61
  - null
62
  - - study_name
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05a66d1fe53d1a1eb62c02f4a74a5cb8676a05154f44b07522f85e4c7d16349e
3
- size 27220219
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20237612ce5b6e3a995949c473f90d9359aef74efe9e9dcbb64e1727d51de365
3
+ size 27220229
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c33599f41603615e39db1fc87476bca3e26a44e5923c43a8ca1be93cff9279e
3
  size 13505852
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:898f71401c573e155cd32deb2ba9765c6872f46fbb249399030868d46cfc62e0
3
  size 13505852
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fe04463b0c58569e9f7a70305c7f236afd60200852d1dffcfc5241ec31674ad
3
  size 13505178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0370e38070b52c2c3ae25cd0b07ed1e9bf0bacce42f058fccb761556214e9105
3
  size 13505178
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 217.5, "std_reward": 45.62071897723665, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-08-15T01:43:10.321113"}
 
1
+ {"mean_reward": 148.0, "std_reward": 49.3051721424842, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-08-15T03:52:01.303345"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c1c0272df962e0816e3bca5cde3081e5bb857c65d09a2564269d913dd2eaa5b
3
- size 10236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e2140a8e570ccdd97d8ed3977c29b9e2f915421b868c51dee193eef887c26c5
3
+ size 15509