Initial commit

Files changed (12)

README.md CHANGED Viewed

@@ -16,7 +16,7 @@ model-index:
       type: SpaceInvadersNoFrameskip-v4
     metrics:
     - type: mean_reward
-      value: 374.00 +/- 214.89
       name: mean_reward
       verified: false
 ---
@@ -57,15 +57,15 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
 ## Hyperparameters
 ```python
-OrderedDict([('batch_size', 16),
              ('buffer_size', 100000),
              ('env_wrapper',
               ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
              ('exploration_final_eps', 0.01),
-             ('exploration_fraction', 0.1),
-             ('frame_stack', 4),
              ('gradient_steps', 1),
-             ('learning_rate', 0.001),
              ('learning_starts', 100000),
              ('n_timesteps', 1000000.0),
              ('optimize_memory_usage', False),

       type: SpaceInvadersNoFrameskip-v4
     metrics:
     - type: mean_reward
+      value: 527.00 +/- 220.46
       name: mean_reward
       verified: false
 ---
 ## Hyperparameters
 ```python
+OrderedDict([('batch_size', 32),
              ('buffer_size', 100000),
              ('env_wrapper',
               ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
              ('exploration_final_eps', 0.01),
+             ('exploration_fraction', 0.025),
+             ('frame_stack', 3),
              ('gradient_steps', 1),
+             ('learning_rate', 0.0001),
              ('learning_starts', 100000),
              ('n_timesteps', 1000000.0),
              ('optimize_memory_usage', False),

args.yml CHANGED Viewed

@@ -54,7 +54,7 @@
   - - save_replay_buffer
     - false
   - - seed
-    - 1069349440
   - - storage
     - null
   - - study_name

   - - save_replay_buffer
     - false
   - - seed
+    - 2989382765
   - - storage
     - null
   - - study_name

config.yml CHANGED Viewed

@@ -1,6 +1,6 @@
 !!python/object/apply:collections.OrderedDict
 - - - batch_size
-    - 16
   - - buffer_size
     - 100000
   - - env_wrapper
@@ -8,13 +8,13 @@
   - - exploration_final_eps
     - 0.01
   - - exploration_fraction
-    - 0.1
   - - frame_stack
-    - 4
   - - gradient_steps
     - 1
   - - learning_rate
-    - 0.001
   - - learning_starts
     - 100000
   - - n_timesteps

 !!python/object/apply:collections.OrderedDict
 - - - batch_size
+    - 32
   - - buffer_size
     - 100000
   - - env_wrapper
   - - exploration_final_eps
     - 0.01
   - - exploration_fraction
+    - 0.025
   - - frame_stack
+    - 3
   - - gradient_steps
     - 1
   - - learning_rate
+    - 0.0001
   - - learning_starts
     - 100000
   - - n_timesteps

dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0ceaa737a7114cbb5f1191c306bbed863daa9ae826b938d5a5b3846cb59f4638
-size 27224788

 version https://git-lfs.github.com/spec/v1
+oid sha256:21fe42182f075450c7abd138b7c7486bf603bddb8be5cb0ff731d0e9ba1590aa
+size 27144084

dqn-SpaceInvadersNoFrameskip-v4/_stable_baselines3_version CHANGED Viewed

	@@ -1 +1 @@
1	- 1.6.2


1	+ 1.7.0a10

dqn-SpaceInvadersNoFrameskip-v4/data CHANGED Viewed

The diff for this file is too large to render. See raw diff

dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:375b860e110b7be2f9da38da3f0fe7bcc503a5d007cf2e7ae753dcaf3cf8ec9f
-size 13505739

 version https://git-lfs.github.com/spec/v1
+oid sha256:7e0127f09bfebbfab6e0e95edf5f429d07a073f85d68dcaa3edfd9a8f686c9e6
+size 13489355

dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:de3b4f8a1ec2a36d84f01ff7b9e0b6fbfb52154b65ccf7b0fcc1c0be80c200e3
-size 13504937

 version https://git-lfs.github.com/spec/v1
+oid sha256:5a1168910a71d949e5cdb418d34d1df1a8139a74c55208d9954845dfe9015d0b
+size 13488553

dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED Viewed

@@ -1,6 +1,6 @@
 OS: Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022
 Python: 3.8.16
-Stable-Baselines3: 1.6.2
 PyTorch: 1.13.0+cu116
 GPU Enabled: True
 Numpy: 1.21.6

 OS: Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022
 Python: 3.8.16
+Stable-Baselines3: 1.7.0a10
 PyTorch: 1.13.0+cu116
 GPU Enabled: True
 Numpy: 1.21.6

replay.mp4 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0b231c3e33922a65189db4066e7414df0b5a66d5fa35017253dc63dd0d43b457
-size 233415

 version https://git-lfs.github.com/spec/v1
+oid sha256:34b8dcd7b098e3d17dd6c7206b1795abba5236bd96bcdd4b089c6f3fd51a9d9b
+size 206858

results.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"mean_reward": 374.0, "std_reward": 214.89299662855464, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-19T22:14:07.643212"}


1	+ {"mean_reward": 527.0, "std_reward": 220.45634488487738, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-29T16:43:44.510264"}

train_eval_metrics.zip CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:25471be8f6630682b10afbad6ed662f144cdf126f6abdb4bed4cb6d88dc2fea9
-size 40539

 version https://git-lfs.github.com/spec/v1
+oid sha256:c34df2d496212e4d9c3c0b3170fa533b4177dda3d0a8e74b530ca10c28af7129
+size 38596