nivaldoho committed on
Commit
e391ff1
1 Parent(s): d7b8ac7

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 316.00 +/- 141.29
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -68,7 +68,7 @@ OrderedDict([('batch_size', 64),
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.01),
70
  ('exploration_fraction', 0.025),
71
- ('frame_stack', 2),
72
  ('gamma', 0.99),
73
  ('gradient_steps', 1),
74
  ('learning_rate', 5e-05),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 488.00 +/- 176.62
20
  name: mean_reward
21
  verified: false
22
  ---
 
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.01),
70
  ('exploration_fraction', 0.025),
71
+ ('frame_stack', 4),
72
  ('gamma', 0.99),
73
  ('gradient_steps', 1),
74
  ('learning_rate', 5e-05),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 1566579183
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 1675566432
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -10,7 +10,7 @@
10
  - - exploration_fraction
11
  - 0.025
12
  - - frame_stack
13
- - 2
14
  - - gamma
15
  - 0.99
16
  - - gradient_steps
 
10
  - - exploration_fraction
11
  - 0.025
12
  - - frame_stack
13
+ - 4
14
  - - gamma
15
  - 0.99
16
  - - gradient_steps
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4b27a30aab0bbd6ff67409046976fa48bf5114fee0e876d2d968380b6b3b636
3
- size 27058634
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d9ad7baa1319b882ce73ec0fe974d6109ef04d8c8a23a387242242888763222
3
+ size 27220134
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dc27f4ee0d278017756c730ca9534cbb3b0fc68b46499fcb98ab9bb7d650125
3
- size 13473404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58083e6d9f6381afd1cacd3f7130f2c81ffe685100bf88174f7dc73e5015444a
3
+ size 13506236
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18ab39c557d5ac5bfee6709495af39ff923e4a4a833ded7d5c179c3311014a19
3
- size 13472602
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19670fa9924ed8433310a795e48a7366f97210e249ec992a7076262394b34736
3
+ size 13505370
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:433fed1cc53a6594a86ad2973dbfd969641689d854084297154ca0cc2756a104
3
- size 239906
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a344103ea306cb3883bfab7020ca7e6ca657ef09b6bc92bf0b3c5dab655c1da
3
+ size 239090
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 316.0, "std_reward": 141.2940196894405, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-01T19:39:50.737537"}
 
1
+ {"mean_reward": 488.0, "std_reward": 176.62389419328292, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-01T21:20:44.065291"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89c93cfa2b72a76d4cccfa16cc6112fb843d5be177ac2a28b99e51227e2759d7
3
- size 44351
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f4def5c3d5f6af10af5d847b0fe8da8049d3820b6557cf540b2d0b0dfaf9c0c
3
+ size 43497