dallonf committed on
Commit
8e83769
1 Parent(s): d123f7f

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 606.50 +/- 139.50
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 32),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 752.50 +/- 268.05
20
  name: mean_reward
21
  verified: false
22
  ---
 
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 10000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 3491495171
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 158802615
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 10000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42d2769306656be8ded8bacea47af14cf56009b4062c9a1f42c0629a3a59cd43
3
- size 27220328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3867c5516bbfbf275c66ba93e041b9bf92146337db233fb59f18ec247332829b
3
+ size 27220333
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60e71a848de1c73be36fea2422da895347667648c8a197419a7c868ad2a7f03d
3
  size 13506236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d456c26423fa5cc05b5b5922845a56bad8889e8098bba14866d7b6d1cc8630e
3
  size 13506236
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84a0c5289fb64edfd2b062a02d443f7441facef7146a18f59c2149460fd2be2e
3
  size 13505370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d3e210ead917832b49238c90fe1617203f93a0e6abdcc6d3cb6c41425980fd5
3
  size 13505370
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7b221b40dce3f1a2949fc749964c5501f68e5c672b0b4da067f21af341f939f
3
- size 208553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c5c35c1a89799fc817230e7266c2f07fce14aae9111e375c313f2d9a3cd5358
3
+ size 210785
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 606.5, "std_reward": 139.5, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-04-22T00:06:27.394500"}
 
1
+ {"mean_reward": 752.5, "std_reward": 268.0508347310263, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-04-23T23:48:29.560357"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52463dbfd1ee47fa38e903d67e8ce83a6484c66734cb2558cf0013cb4a09ba31
3
- size 36544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2194b0007d8d2f219444ed6e516a1d7479824f6a32a283f6c20bbac273298aa0
3
+ size 276855