mobiusmatt committed on
Commit
ac91261
1 Parent(s): a8dc54f

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 274.50 +/- 31.50
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -67,7 +67,7 @@ OrderedDict([('batch_size', 32),
67
  ('gradient_steps', 1),
68
  ('learning_rate', 0.0001),
69
  ('learning_starts', 100000),
70
- ('n_timesteps', 100000),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 573.00 +/- 134.45
20
  name: mean_reward
21
  verified: false
22
  ---
 
67
  ('gradient_steps', 1),
68
  ('learning_rate', 0.0001),
69
  ('learning_starts', 100000),
70
+ ('n_timesteps', 1000000),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2178589186
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2015047634
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 100000
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d42382dc7edbe6275ffc335372780f35f178be774828bda3b2bc01dcc221e062
3
- size 13719748
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3efe9d9f7c7a05c04aaa93cdfb52d46614728a7c8548bc985301f818b6b86040
3
+ size 27224809
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1e067afe9912f3dd1b7925918b8cbe439229f6008e572c9c7e431ae731419f1
3
- size 687
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b8c39e0e138b2cdd6759906021846d6ada9bc82c87a41ce1b35b992845b6827
3
+ size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3953755450f0916a0ad79f08d635f8c7b70ded68b5fc7ec2cc4271bcbf5a4cbe
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:471f3bfe75cc5a1ad2fdbbc71108580d2d3162dabb568e869e67f6afb2cad8b0
3
  size 13504937
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e13a11a839fea521ecfd34a27ae00521e04cfb8dd63fb3e005e2d701b498e2b
3
- size 261744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9d9d8842b782483c036c2c1e59944c50a9d5b4ad05577d7451c2f6109babe70
3
+ size 185645
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 274.5, "std_reward": 31.5, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-04T19:50:40.854781"}
 
1
+ {"mean_reward": 573.0, "std_reward": 134.44701558606647, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-04T21:04:02.523304"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec1d2dfd2c6adc3403ae8b5a9b0ce8a084086f88935f0a8b925ba09b3fe36480
3
- size 5795
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7f1e2221c26c9d698c2b040ea5792fb363751dee98b748c9e9b53d6187d1b48
3
+ size 35912