YarramsettiNaresh committed on
Commit
002c870
1 Parent(s): 4d65a5b

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 319.00 +/- 125.73
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,8 +62,8 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
62
 
63
  ## Hyperparameters
64
  ```python
65
- OrderedDict([('batch_size', 16),
66
- ('buffer_size', 50000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.01),
@@ -72,9 +72,9 @@ OrderedDict([('batch_size', 16),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
- ('policy', 'MlpPolicy'),
78
  ('target_update_interval', 1000),
79
  ('train_freq', 4),
80
  ('normalize', False)])
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 851.50 +/- 275.82
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
 
63
  ## Hyperparameters
64
  ```python
65
+ OrderedDict([('batch_size', 32),
66
+ ('buffer_size', 100000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.01),
 
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 10000000.0),
76
  ('optimize_memory_usage', False),
77
+ ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
79
  ('train_freq', 4),
80
  ('normalize', False)])
args.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
- - logs7/
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 270929130
58
  - - storage
59
  - null
60
  - - study_name
 
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
+ - logs5/
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 429927090
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -1,8 +1,8 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 16
4
  - - buffer_size
5
- - 50000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
@@ -18,11 +18,11 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
25
- - MlpPolicy
26
  - - target_update_interval
27
  - 1000
28
  - - train_freq
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 32
4
  - - buffer_size
5
+ - 100000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 10000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
25
+ - CnnPolicy
26
  - - target_update_interval
27
  - 1000
28
  - - train_freq
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:904521a0ed48b661412f6fe9965b5dc1ef4544a432fb62d9adf3c7ef6a952f51
3
- size 29192260
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3163d2b05b45150250ae6b9d67e4bcabb405ac5876d5f5e298512881f6d927df
3
+ size 27215583
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44de05d5d2ae57d78fbee4ee2b0dc266bc850f6efe27842b03c97abc6da4b712
3
- size 14492399
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbb7f209e445a93699fab0a850a09274e4551090af88655e9def9f0aedcbc229
3
+ size 13502953
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cfae794674f7b4cc055afa73e53ce8c528dd608a47f5019317cad5dc9de88e6
3
- size 14491521
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc5ed37177ee7376f5e65591125b7a47170bc0bbbe25ca99405f56182aac4215
3
+ size 13504745
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -1,9 +1,9 @@
1
- - OS: Linux-5.15.0-1039-oracle-x86_64-with-glibc2.35 # 45-Ubuntu SMP Thu Jul 13 19:37:23 UTC 2023
2
- - Python: 3.10.6
3
  - Stable-Baselines3: 2.0.0
4
- - PyTorch: 2.0.1+cu117
5
  - GPU Enabled: False
6
- - Numpy: 1.25.1
7
  - Cloudpickle: 2.2.1
8
  - Gymnasium: 0.28.1
9
  - OpenAI Gym: 0.26.2
 
1
+ - OS: Linux-5.15.0-1038-oracle-x86_64-with-glibc2.31 # 44~20.04.1-Ubuntu SMP Thu Jun 22 16:36:07 UTC 2023
2
+ - Python: 3.9.17
3
  - Stable-Baselines3: 2.0.0
4
+ - PyTorch: 1.11.0+cu102
5
  - GPU Enabled: False
6
+ - Numpy: 1.21.2
7
  - Cloudpickle: 2.2.1
8
  - Gymnasium: 0.28.1
9
  - OpenAI Gym: 0.26.2
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8844acf903ec50ff6390ef5cf264eb4433418c5bcd7a256635242a718636974d
3
- size 240647
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d38caf32749738c5aff1cd187080caa787c003bb5d151b2508441c7dd9c190c1
3
+ size 205711
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 319.0, "std_reward": 125.73384588089239, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-07-27T09:05:03.377842"}
 
1
+ {"mean_reward": 851.5, "std_reward": 275.81742149472717, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-07-28T03:28:54.201893"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:922f003a28eed0e06c39318a20a57e5be0c163aad32b2552a8c7ca7ed60c2088
3
- size 43152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77cae0c0b68ea162037f18c93c4114918fdcdf8f7240f63b377df8d22f2bdbcc
3
+ size 276708