picklehari committed on
Commit
496327b
1 Parent(s): c75ac0e

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 268.50 +/- 78.17
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 16),
72
  ('gradient_steps', 2),
73
  ('learning_rate', 0.001),
74
  ('learning_starts', 1000000),
75
- ('n_timesteps', 10000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 567),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 14.50 +/- 16.95
20
  name: mean_reward
21
  verified: false
22
  ---
 
72
  ('gradient_steps', 2),
73
  ('learning_rate', 0.001),
74
  ('learning_starts', 1000000),
75
+ ('n_timesteps', 100000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 567),
args.yml CHANGED
@@ -2,7 +2,7 @@
2
  - - - algo
3
  - dqn
4
  - - conf_file
5
- - /content/SpaceInvadersNoFrameskip-v4.yml
6
  - - device
7
  - auto
8
  - - env
@@ -18,7 +18,7 @@
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
- - .
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 1709877418
58
  - - storage
59
  - null
60
  - - study_name
 
2
  - - - algo
3
  - dqn
4
  - - conf_file
5
+ - /content/SpaceInvadersNoFrameskip-v4:.yml
6
  - - device
7
  - auto
8
  - - env
 
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
+ - logs/
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2075307157
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 1000000
20
  - - n_timesteps
21
- - 10000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 1000000
20
  - - n_timesteps
21
+ - 100000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7c1695f1e600b6517cb4a19a8e94b0001296a6a06620c367242c65b30f18e7d
3
- size 13711597
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cfdca5d89032017117ab7e14763f5b32462ce25e1a4d1decb9bc8344fa8df3c
3
+ size 13714993
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74b4ffc263872dfb879cb378f63c1b622525709b05bfb210969f3eef62230479
3
  size 13505370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb77bd4626ffe6019b8549af7c7f337d606227ac8aceec708250c4ade2beabd6
3
  size 13505370
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38a799ac9657faeb813344ec56ae265d381f35a430091e2c90337e271719a9db
3
- size 278674
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5147b26aa099360ec73d0e546302fdd669f5d6e2f70fb0e91ed838ed4ff94afd
3
+ size 290486
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 268.5, "std_reward": 78.16808811785025, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-11-20T16:56:47.300137"}
 
1
+ {"mean_reward": 14.5, "std_reward": 16.948451256678293, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-11-20T18:33:27.474767"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07d195d22b0720c8fbfee8437fe6b4f126a46f69c1d103952bcf7b1601bde8cf
3
- size 591
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c41d69ea7971dd228e57d29eab440959b845fd65ba0c86d18886086669053563
3
+ size 5728