nivaldoho committed on
Commit
4972f84
1 Parent(s): 9ca0f80

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 217.50 +/- 61.98
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,23 +62,22 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
62
 
63
  ## Hyperparameters
64
  ```python
65
- OrderedDict([('batch_size', 32),
66
- ('buffer_size', 10000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
- ('exploration_final_eps', 0.05),
70
- ('exploration_fraction', 0.1),
71
  ('frame_stack', 4),
72
- ('gamma', 0.8),
73
  ('gradient_steps', 1),
74
- ('learning_rate', 0.0001),
75
- ('learning_starts', 10000),
76
  ('n_timesteps', 100000.0),
77
- ('optimize_memory_usage', False),
78
  ('policy', 'CnnPolicy'),
79
- ('target_update_interval', 1000),
80
- ('train_freq', 4),
81
- ('normalize', False)])
82
  ```
83
 
84
  # Environment Arguments
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 390.50 +/- 145.92
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
 
63
  ## Hyperparameters
64
  ```python
65
+ OrderedDict([('batch_size', 64),
66
+ ('buffer_size', 1000000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
+ ('exploration_final_eps', 0.01),
70
+ ('exploration_fraction', 0.025),
71
  ('frame_stack', 4),
72
+ ('gamma', 0.99),
73
  ('gradient_steps', 1),
74
+ ('learning_rate', 5e-05),
75
+ ('learning_starts', 50000),
76
  ('n_timesteps', 100000.0),
77
+ ('normalize', False),
78
  ('policy', 'CnnPolicy'),
79
+ ('target_update_interval', 10000),
80
+ ('train_freq', 4)])
 
81
  ```
82
 
83
  # Environment Arguments
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 1458835778
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2957842650
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -1,31 +1,31 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 32
4
  - - buffer_size
5
- - 10000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
9
- - 0.05
10
  - - exploration_fraction
11
- - 0.1
12
  - - frame_stack
13
  - 4
14
  - - gamma
15
- - 0.8
16
  - - gradient_steps
17
  - 1
18
  - - learning_rate
19
- - 0.0001
20
  - - learning_starts
21
- - 10000
22
  - - n_timesteps
23
  - 100000.0
24
- - - optimize_memory_usage
25
  - false
26
  - - policy
27
  - CnnPolicy
28
  - - target_update_interval
29
- - 1000
30
  - - train_freq
31
  - 4
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 64
4
  - - buffer_size
5
+ - 1000000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
9
+ - 0.01
10
  - - exploration_fraction
11
+ - 0.025
12
  - - frame_stack
13
  - 4
14
  - - gamma
15
+ - 0.99
16
  - - gradient_steps
17
  - 1
18
  - - learning_rate
19
+ - 5.0e-05
20
  - - learning_starts
21
+ - 50000
22
  - - n_timesteps
23
  - 100000.0
24
+ - - normalize
25
  - false
26
  - - policy
27
  - CnnPolicy
28
  - - target_update_interval
29
+ - 10000
30
  - - train_freq
31
  - 4
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dd869026b133ba1328f43820b459e6ff24b85a2a878ddb1f6d23dd5642985bf
3
- size 27220125
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38d005501e227a0f29d2655e0fbc99ed1bb0667086241662842a33f51074c39c
3
+ size 27220129
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56b15d0749d2cc7f9b993b38022fadd10069037b5210e64f83c893678eb70b3a
3
  size 13506236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db2e3b8c2168aa9ea8430b472d56db222b82461c9a8182eead1c057309a19bb
3
  size 13506236
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c496751a1fd0205fb387c07ce76116add5145cc906136b07f856473beb6af800
3
  size 13505370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14cb70e22cd28ab4c9c6d60aa9439f46666e95a3479c04910dd3d3933a753560
3
  size 13505370
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c82371d6bc7d1b89389e744d5f8fb8669450fe263a6fe4132c1ab3cb9664d8c9
3
- size 264302
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:668f5267ab783777567b8c7f33c27b372a8b413e0a52bd31f23ecc08b00dba5e
3
+ size 257293
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 217.5, "std_reward": 61.97781861279082, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-01T02:13:36.609591"}
 
1
+ {"mean_reward": 390.5, "std_reward": 145.91864171516949, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-01T16:41:16.100047"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41fefb8aa27a36c423cdccfe4c42383c31be9fa93caabf02a80e83e27c43605d
3
- size 5275
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22f2ae568f607e7d6d4aea704e318b1f5c7221fc4b47bec5c9e0e5208fe4249f
3
+ size 5374