nivaldoho committed on
Commit
a36bcc7
1 Parent(s): 4972f84

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 390.50 +/- 145.92
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -73,7 +73,7 @@ OrderedDict([('batch_size', 64),
73
  ('gradient_steps', 1),
74
  ('learning_rate', 5e-05),
75
  ('learning_starts', 50000),
76
- ('n_timesteps', 100000.0),
77
  ('normalize', False),
78
  ('policy', 'CnnPolicy'),
79
  ('target_update_interval', 10000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 276.50 +/- 99.35
20
  name: mean_reward
21
  verified: false
22
  ---
 
73
  ('gradient_steps', 1),
74
  ('learning_rate', 5e-05),
75
  ('learning_starts', 50000),
76
+ ('n_timesteps', 1000000.0),
77
  ('normalize', False),
78
  ('policy', 'CnnPolicy'),
79
  ('target_update_interval', 10000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2957842650
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 1822311238
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -20,7 +20,7 @@
20
  - - learning_starts
21
  - 50000
22
  - - n_timesteps
23
- - 100000.0
24
  - - normalize
25
  - false
26
  - - policy
 
20
  - - learning_starts
21
  - 50000
22
  - - n_timesteps
23
+ - 1000000.0
24
  - - normalize
25
  - false
26
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38d005501e227a0f29d2655e0fbc99ed1bb0667086241662842a33f51074c39c
3
- size 27220129
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39200e623580750db285c28b592c0eec3fabf02fbd9e42d93df9b18943c02002
3
+ size 27220136
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0db2e3b8c2168aa9ea8430b472d56db222b82461c9a8182eead1c057309a19bb
3
  size 13506236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c93480606676c3829a92ba0bea0085408563e4405d9443214eb8ff1e28668c2e
3
  size 13506236
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14cb70e22cd28ab4c9c6d60aa9439f46666e95a3479c04910dd3d3933a753560
3
  size 13505370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f70661536ab983c8a46ebbb4b7a93887a03f9f3a6e3d6524a3c61b1b77f5b339
3
  size 13505370
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:668f5267ab783777567b8c7f33c27b372a8b413e0a52bd31f23ecc08b00dba5e
3
- size 257293
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53eb0f05ee6de6e93bbbec711b0df040eca07472e77e7a671e5080c80f2314e6
3
+ size 282770
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 390.5, "std_reward": 145.91864171516949, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-01T16:41:16.100047"}
 
1
+ {"mean_reward": 276.5, "std_reward": 99.34913185327791, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-01T17:17:53.501959"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22f2ae568f607e7d6d4aea704e318b1f5c7221fc4b47bec5c9e0e5208fe4249f
3
- size 5374
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:837874989e248d13b88103834b4e47708e38d986dfd40ae696550104564e62ba
3
+ size 9475