paicup09 committed on
Commit
a47d1d2
·
1 Parent(s): f79768a

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 542.00 +/- 152.14
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -57,20 +57,20 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
57
 
58
  ## Hyperparameters
59
  ```python
60
- OrderedDict([('batch_size', 64),
61
- ('buffer_size', 120000),
62
  ('env_wrapper',
63
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
64
  ('exploration_final_eps', 0.01),
65
  ('exploration_fraction', 0.1),
66
  ('frame_stack', 4),
67
  ('gradient_steps', 1),
68
- ('learning_rate', 7e-05),
69
  ('learning_starts', 100000),
70
- ('n_timesteps', 900000.0),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
- ('target_update_interval', 900),
74
  ('train_freq', 4),
75
  ('normalize', False)])
76
  ```
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 607.00 +/- 170.22
20
  name: mean_reward
21
  verified: false
22
  ---
 
57
 
58
  ## Hyperparameters
59
  ```python
60
+ OrderedDict([('batch_size', 128),
61
+ ('buffer_size', 130000),
62
  ('env_wrapper',
63
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
64
  ('exploration_final_eps', 0.01),
65
  ('exploration_fraction', 0.1),
66
  ('frame_stack', 4),
67
  ('gradient_steps', 1),
68
+ ('learning_rate', 8e-05),
69
  ('learning_starts', 100000),
70
+ ('n_timesteps', 2000000.0),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
+ ('target_update_interval', 980),
74
  ('train_freq', 4),
75
  ('normalize', False)])
76
  ```
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2699922974
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2190085864
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -1,8 +1,8 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 64
4
  - - buffer_size
5
- - 120000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
@@ -14,16 +14,16 @@
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
- - 7.0e-05
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 900000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
25
  - CnnPolicy
26
  - - target_update_interval
27
- - 900
28
  - - train_freq
29
  - 4
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 128
4
  - - buffer_size
5
+ - 130000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
 
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
+ - 8.0e-05
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 2000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
25
  - CnnPolicy
26
  - - target_update_interval
27
+ - 980
28
  - - train_freq
29
  - 4
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b5dcee4abc1be008b849b801877de0231a0fd40c3579f59102f3340bfc2d3bb
3
- size 27224790
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f4cecc0366bcc0be0fd795a3900894be5d7939d5906baa0595005a663f566d1
3
+ size 27224794
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1083c25fd1e80e1f96ae86cb63b80c6ed3e6dfb085404724c2c3484a4376b05
3
  size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3346f1dce4922633d8cd79da133b71843fa4abf251ac90904f050e992b54b1f8
3
  size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9afb9fc4ab5f1ec30d02fe9dbc4e900bef9230476ed54fbcbd8d830998828ac
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb075ce9f561a250c7c7d21617d26ec2c8e983c651bb5d374dae3784f79c17b5
3
  size 13504937
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:373cf67558da5b74e3054e99f006e9c50eabce3d834756ea670fd10532c989f9
3
- size 197209
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cef49b39f18b35b9738ebb38a966a841853746b32b159740f2ef103c8ae0464d
3
+ size 195721
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 542.0, "std_reward": 152.1380951635717, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-29T15:36:12.285870"}
 
1
+ {"mean_reward": 607.0, "std_reward": 170.2233826476257, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-30T13:01:28.879243"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7dd11f7dc9329365aecafdfbe5bd322f48dd202bf8dbd788d9a020cec3b19c3
3
- size 34949
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e64baf8f7d995312d22faf3a009535a097f2124802636eff3cda96b9d4b94396
3
+ size 67396