YarramsettiNaresh committed on
Commit
4d65a5b
1 Parent(s): 7570b03

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 162.50 +/- 94.74
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,19 +62,19 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
62
 
63
  ## Hyperparameters
64
  ```python
65
- OrderedDict([('batch_size', 128),
66
- ('buffer_size', 1000000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.01),
70
  ('exploration_fraction', 0.1),
71
  ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
- ('learning_rate', 1e-06),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 10000000.0),
76
  ('optimize_memory_usage', False),
77
- ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
79
  ('train_freq', 4),
80
  ('normalize', False)])
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 319.00 +/- 125.73
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
 
63
  ## Hyperparameters
64
  ```python
65
+ OrderedDict([('batch_size', 16),
66
+ ('buffer_size', 50000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.01),
70
  ('exploration_fraction', 0.1),
71
  ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
+ ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
+ ('policy', 'MlpPolicy'),
78
  ('target_update_interval', 1000),
79
  ('train_freq', 4),
80
  ('normalize', False)])
args.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
- - logs6/
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 3305755252
58
  - - storage
59
  - null
60
  - - study_name
 
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
+ - logs7/
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 270929130
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -1,8 +1,8 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 128
4
  - - buffer_size
5
- - 1000000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
@@ -14,15 +14,15 @@
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
- - 1.0e-06
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 10000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
25
- - CnnPolicy
26
  - - target_update_interval
27
  - 1000
28
  - - train_freq
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 16
4
  - - buffer_size
5
+ - 50000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
 
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
+ - 0.0001
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
25
+ - MlpPolicy
26
  - - target_update_interval
27
  - 1000
28
  - - train_freq
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0fc8c87806d4c68d49289814aa79a636065d27f9c78728f5abd2896e9bcc176
3
- size 27218054
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:904521a0ed48b661412f6fe9965b5dc1ef4544a432fb62d9adf3c7ef6a952f51
3
+ size 29192260
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1384fb70056808fd49020e21dd1c48eaa4ebdc1223d9bcf300d22ab998385d9e
3
- size 13505419
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44de05d5d2ae57d78fbee4ee2b0dc266bc850f6efe27842b03c97abc6da4b712
3
+ size 14492399
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e51c0e845ccdaf52e921edbef01d7244ae8a0773777fd10b5ac4c490c0be8d5
3
- size 13504745
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cfae794674f7b4cc055afa73e53ce8c528dd608a47f5019317cad5dc9de88e6
3
+ size 14491521
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:459eb5214cce8826056ab0d83fbf902fc3e352ab3ebb64a2dbf41afc7dab5f77
3
- size 264242
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8844acf903ec50ff6390ef5cf264eb4433418c5bcd7a256635242a718636974d
3
+ size 240647
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 162.5, "std_reward": 94.74307362546351, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-07-27T03:50:18.254345"}
 
1
+ {"mean_reward": 319.0, "std_reward": 125.73384588089239, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-07-27T09:05:03.377842"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ac1a6cfdd9fb8e9e40f67e8692da1c60b777adb0e30ae7fd85af2556a94ff28
3
- size 28732
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:922f003a28eed0e06c39318a20a57e5be0c163aad32b2552a8c7ca7ed60c2088
3
+ size 43152