AllIllusion committed on
Commit
38f8848
·
verified ·
1 Parent(s): 43e0d53

Initial commit

Browse files
README.md CHANGED
@@ -5,7 +5,6 @@ tags:
5
  - deep-reinforcement-learning
6
  - reinforcement-learning
7
  - stable-baselines3
8
- - SL-Sprout
9
  model-index:
10
  - name: DQN
11
  results:
@@ -17,7 +16,7 @@ model-index:
17
  type: SpaceInvadersNoFrameskip-v4
18
  metrics:
19
  - type: mean_reward
20
- value: 655.00 +/- 205.66
21
  name: mean_reward
22
  verified: false
23
  ---
 
5
  - deep-reinforcement-learning
6
  - reinforcement-learning
7
  - stable-baselines3
 
8
  model-index:
9
  - name: DQN
10
  results:
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 918.00 +/- 500.06
20
  name: mean_reward
21
  verified: false
22
  ---
args.yml CHANGED
@@ -56,7 +56,7 @@
56
  - - save_replay_buffer
57
  - false
58
  - - seed
59
- - 4238794954
60
  - - storage
61
  - null
62
  - - study_name
 
56
  - - save_replay_buffer
57
  - false
58
  - - seed
59
+ - 4277872922
60
  - - storage
61
  - null
62
  - - study_name
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c85f93c86202c0f4b7cc3f5bccec5fe6dd627d0c73629a6248b69682528d809a
3
- size 27220534
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59b5e5203e93f11675c93a31ac6bc2e8e5ed47c7c5cc817a44705a52574df8a6
3
+ size 27221042
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:327cc0f4b7cf05f83f33b531396cfe6be5d4bf6f44d56432db3551189e2a845e
3
- size 13505852
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8f10cd8d5a04dd1489489c3a871202a4379156c61727b71bf34f92e18312993
3
+ size 13506172
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e07cf43690e6be5b93437805496fa429f0283dc56ca9dc5957031b98fe045a58
3
- size 13505178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2bb77c1df36d561ffce45df3d22893f594aa0996d562586e02e9b51a7db1e26
3
+ size 13505370
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -2,7 +2,7 @@
2
  - Python: 3.12.9
3
  - Stable-Baselines3: 2.6.0
4
  - PyTorch: 2.5.1+cu124
5
- - GPU Enabled: False
6
  - Numpy: 1.26.4
7
  - Cloudpickle: 3.1.1
8
  - Gymnasium: 1.1.1
 
2
  - Python: 3.12.9
3
  - Stable-Baselines3: 2.6.0
4
  - PyTorch: 2.5.1+cu124
5
+ - GPU Enabled: True
6
  - Numpy: 1.26.4
7
  - Cloudpickle: 3.1.1
8
  - Gymnasium: 1.1.1
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd55744161bfbef99dbeb4278c8290c49410a358bf73d7b5fc8e34f91ca3fb13
3
- size 217844
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54e0109eaf0f948f56901ab175c3ee609ab3cae87a2adb10e0915ef98161e309
3
+ size 196397
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 655.0, "std_reward": 205.65748223684935, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2025-05-02T20:12:49.575826"}
 
1
+ {"mean_reward": 918.0, "std_reward": 500.0559968643512, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2025-05-04T13:33:03.149827"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aca83fcf905d9f1e2c356f8efd5533c1d419d6bb0756d0bd0273c951a8826ce5
3
- size 29864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf4b240a51732cf8c475936f859b4e7a9d8dc12fea6eab3d73e72656d2c78e0f
3
+ size 36963