mobiusmatt committed on
Commit
a8dc54f
1 Parent(s): 961d5fc

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 573.50 +/- 148.90
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -67,7 +67,7 @@ OrderedDict([('batch_size', 32),
67
  ('gradient_steps', 1),
68
  ('learning_rate', 0.0001),
69
  ('learning_starts', 100000),
70
- ('n_timesteps', 1000000.0),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 274.50 +/- 31.50
20
  name: mean_reward
21
  verified: false
22
  ---
 
67
  ('gradient_steps', 1),
68
  ('learning_rate', 0.0001),
69
  ('learning_starts', 100000),
70
+ ('n_timesteps', 100000),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2503867575
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2178589186
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 100000
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90a6b16dea5688fa11d043cc76a8478cfc584e8fc32e5b06e4487508356ea961
3
- size 27224809
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d42382dc7edbe6275ffc335372780f35f178be774828bda3b2bc01dcc221e062
3
+ size 13719748
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7cc68ec005e48bb72cb10449dfb146119f2b77a1284f66fd7fb631a3c5414100
3
- size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1e067afe9912f3dd1b7925918b8cbe439229f6008e572c9c7e431ae731419f1
3
+ size 687
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8131a75037922f7cadd811f23d6dcde96ef73e7345d2b0d0714a72f9a31d825c
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3953755450f0916a0ad79f08d635f8c7b70ded68b5fc7ec2cc4271bcbf5a4cbe
3
  size 13504937
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49c6644912c65817402baaa8897a416ac8f537516810efa337c96885f201f490
3
- size 238682
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e13a11a839fea521ecfd34a27ae00521e04cfb8dd63fb3e005e2d701b498e2b
3
+ size 261744
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 573.5, "std_reward": 148.89677632507696, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-04T18:07:22.400137"}
 
1
+ {"mean_reward": 274.5, "std_reward": 31.5, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-04T19:50:40.854781"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e96d5ea312942c436786da49ac6d381cbc9d4e8d0956612e1589a83de69e28e8
3
- size 34299
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec1d2dfd2c6adc3403ae8b5a9b0ce8a084086f88935f0a8b925ba09b3fe36480
3
+ size 5795