llmvetter committed on
Commit
975c1f7
·
1 Parent(s): 9c93774

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 165.00 +/- 95.52
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -70,8 +70,8 @@ OrderedDict([('batch_size', 32),
70
  ('exploration_fraction', 0.1),
71
  ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
- ('learning_rate', 0.0001),
74
- ('learning_starts', 10000),
75
  ('n_timesteps', 100000),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 328.50 +/- 224.43
20
  name: mean_reward
21
  verified: false
22
  ---
 
70
  ('exploration_fraction', 0.1),
71
  ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
+ ('learning_rate', 0.0005),
74
+ ('learning_starts', 5000),
75
  ('n_timesteps', 100000),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 1908441606
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 3620644676
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -14,9 +14,9 @@
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
- - 0.0001
18
  - - learning_starts
19
- - 10000
20
  - - n_timesteps
21
  - 100000
22
  - - optimize_memory_usage
 
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
+ - 0.0005
18
  - - learning_starts
19
+ - 5000
20
  - - n_timesteps
21
  - 100000
22
  - - optimize_memory_usage
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e95029f8f31b20d4da7729e1eb5d70657e9350450447fe2b09c830dfc2d0079c
3
- size 27220782
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:978bffcc3dfd0ea7d1dc821bb1e688a94a15750d9d752471cf65db5138d5e2aa
3
+ size 27220781
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12572659a4b1d8002b1db5c5986d92d4c3bd71234fc790650813aa0cfaf7b3b9
3
  size 13506236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea109d3a00809d20660c3a59bbb6fcc5944e3bcc88a8eb2b6c22f56f74871d6a
3
  size 13506236
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:740233404e67f9b136fd1ee1b3ce8219ab635cf1799f4605f65d75c158faa62a
3
  size 13505370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8668d852aac9e381b5a570d014c9ba172ce85c55ef9cd222683958385eab0d3
3
  size 13505370
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0b585bcd981128fd3362327162d8f769abd13bf3fe397575cbf922b5652fe4e
3
- size 257162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c68f3d07b3171a2a3eb46a87c8561640deffb0d8c4fa1cb0765c1dfc5b363c1
3
+ size 259624
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 165.0, "std_reward": 95.524865872714, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-30T15:15:37.602754"}
 
1
+ {"mean_reward": 328.5, "std_reward": 224.43317490959308, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-30T15:36:20.082615"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac4b6138e8a31d18c951bcf178951208bfdaa62bc9de22ab5a53fd9bc9c8b565
3
- size 5190
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ea0fb038b334dca6fb5ff1b72fc30b300aee039dabfcde269b37840d6772ca9
3
+ size 5180