iiserkbikram committed on
Commit
e6c7e76
1 Parent(s): d4e41b3

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 274.50 +/- 31.50
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,20 +62,20 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
62
 
63
  ## Hyperparameters
64
  ```python
65
- OrderedDict([('batch_size', 64),
66
- ('buffer_size', 100000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
- ('exploration_final_eps', 0.01),
70
- ('exploration_fraction', 0.25),
71
  ('frame_stack', 4),
72
- ('gradient_steps', 2),
73
- ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 100000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
79
- ('train_freq', 8),
80
  ('normalize', False)])
81
  ```
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 261.50 +/- 41.42
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
 
63
  ## Hyperparameters
64
  ```python
65
+ OrderedDict([('batch_size', 16),
66
+ ('buffer_size', 10000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
+ ('exploration_final_eps', 0.02),
70
+ ('exploration_fraction', 0.1),
71
  ('frame_stack', 4),
72
+ ('gradient_steps', 1),
73
+ ('learning_rate', 0.001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
79
+ ('train_freq', 4),
80
  ('normalize', False)])
81
  ```
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 1380014744
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 3090249662
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -1,24 +1,24 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 64
4
  - - buffer_size
5
- - 100000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
9
- - 0.01
10
  - - exploration_fraction
11
- - 0.25
12
  - - frame_stack
13
  - 4
14
  - - gradient_steps
15
- - 2
16
  - - learning_rate
17
- - 0.0001
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 100000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
@@ -26,4 +26,4 @@
26
  - - target_update_interval
27
  - 1000
28
  - - train_freq
29
- - 8
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 16
4
  - - buffer_size
5
+ - 10000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
9
+ - 0.02
10
  - - exploration_fraction
11
+ - 0.1
12
  - - frame_stack
13
  - 4
14
  - - gradient_steps
15
+ - 1
16
  - - learning_rate
17
+ - 0.001
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
26
  - - target_update_interval
27
  - 1000
28
  - - train_freq
29
+ - 4
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca880fa3efba07161dc058a306329e0ac3e4b89fb728c0bef4b50da026094914
3
- size 13719757
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d885e48cdc50aca7c8b020d05c8e5bb5c858b51dd0f77e006a6d8eb571cea2be
3
+ size 27224402
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1e067afe9912f3dd1b7925918b8cbe439229f6008e572c9c7e431ae731419f1
3
- size 687
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12d532259f6f95e095f87f47597cc9c81ec8447d5cb62f9b812476da748ecf8c
3
+ size 13505419
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24514105126a149636622f02550979a5ea7d74c27de67f1760dd68ee6c30b6c9
3
- size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c407119b70d4f9af5a8b3c95880361b767fe6d393f05982607a821c357ba9e26
3
+ size 13504745
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -2,6 +2,6 @@
2
  - Python: 3.9.16
3
  - Stable-Baselines3: 1.8.0a9
4
  - PyTorch: 1.13.1+cu116
5
- - GPU Enabled: True
6
- - Numpy: 1.22.4
7
  - Gym: 0.21.0
 
2
  - Python: 3.9.16
3
  - Stable-Baselines3: 1.8.0a9
4
  - PyTorch: 1.13.1+cu116
5
+ - GPU Enabled: False
6
+ - Numpy: 1.24.2
7
  - Gym: 0.21.0
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fba2ab7031f7061f065c3d5bc1de3dcfb9536d40b9bccd2413c48c7909f59ea3
3
- size 261744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7267eeb72f97d23e26e79a38f73024988ea5fc5381f7fcd55c0ef651ef4e38d
3
+ size 263544
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 274.5, "std_reward": 31.5, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-03-20T11:06:20.310249"}
 
1
+ {"mean_reward": 261.5, "std_reward": 41.415576779757636, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-03-20T18:58:35.003220"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:211b9f56f9962bf7e6f95cef3b8bf226e37ef74dcf6d0cbfbb4fe7b478b7df62
3
- size 5803
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06cd0586a1c94455c3309573b64159908ea1052d32e60858b86602fdc6fbafd9
3
+ size 41552