reachrkr committed on
Commit
6d2b8ae
1 Parent(s): a6eb7c0

2nd commit

Browse files
.gitattributes CHANGED
@@ -2,11 +2,13 @@
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
 
5
  *.ftz filter=lfs diff=lfs merge=lfs -text
6
  *.gz filter=lfs diff=lfs merge=lfs -text
7
  *.h5 filter=lfs diff=lfs merge=lfs -text
8
  *.joblib filter=lfs diff=lfs merge=lfs -text
9
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
 
10
  *.model filter=lfs diff=lfs merge=lfs -text
11
  *.msgpack filter=lfs diff=lfs merge=lfs -text
12
  *.npy filter=lfs diff=lfs merge=lfs -text
@@ -20,6 +22,7 @@
20
  *.pt filter=lfs diff=lfs merge=lfs -text
21
  *.pth filter=lfs diff=lfs merge=lfs -text
22
  *.rar filter=lfs diff=lfs merge=lfs -text
 
23
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
24
  *.tar.* filter=lfs diff=lfs merge=lfs -text
25
  *.tflite filter=lfs diff=lfs merge=lfs -text
@@ -27,6 +30,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.wasm filter=lfs diff=lfs merge=lfs -text
28
  *.xz filter=lfs diff=lfs merge=lfs -text
29
  *.zip filter=lfs diff=lfs merge=lfs -text
30
- *.zstandard filter=lfs diff=lfs merge=lfs -text
31
  *tfevents* filter=lfs diff=lfs merge=lfs -text
32
  *.mp4 filter=lfs diff=lfs merge=lfs -text
 
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
10
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
  *.model filter=lfs diff=lfs merge=lfs -text
13
  *.msgpack filter=lfs diff=lfs merge=lfs -text
14
  *.npy filter=lfs diff=lfs merge=lfs -text
 
22
  *.pt filter=lfs diff=lfs merge=lfs -text
23
  *.pth filter=lfs diff=lfs merge=lfs -text
24
  *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
28
  *.tflite filter=lfs diff=lfs merge=lfs -text
 
30
  *.wasm filter=lfs diff=lfs merge=lfs -text
31
  *.xz filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
  *.mp4 filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 210.00 +/- 145.89
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -43,13 +43,13 @@ pip install rl_zoo3
43
 
44
  ```
45
  # Download model and save it into the logs/ folder
46
- python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga reachrkr -f logs/
47
  python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
48
  ```
49
 
50
  If you installed the RL Zoo3 via pip (`pip install rl_zoo3`), from anywhere you can do:
51
  ```
52
- python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga reachrkr -f logs/
53
  python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
54
  ```
55
 
@@ -57,7 +57,7 @@ python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
57
  ```
58
  python -m rl_zoo3.train --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
59
  # Upload the model and generate video (when possible)
60
- python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/ -orga reachrkr
61
  ```
62
 
63
  ## Hyperparameters
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 32),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 100000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 562.00 +/- 92.42
20
  name: mean_reward
21
  verified: false
22
  ---
 
43
 
44
  ```
45
  # Download model and save it into the logs/ folder
46
+ python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga dineshresearch -f logs/
47
  python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
48
  ```
49
 
50
  If you installed the RL Zoo3 via pip (`pip install rl_zoo3`), from anywhere you can do:
51
  ```
52
+ python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga dineshresearch -f logs/
53
  python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
54
  ```
55
 
 
57
  ```
58
  python -m rl_zoo3.train --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
59
  # Upload the model and generate video (when possible)
60
+ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/ -orga dineshresearch
61
  ```
62
 
63
  ## Hyperparameters
 
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2794116141
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2115956098
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 100000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5d698f7e0387732d291f05a32b81ac651d1a68f2693feb3d88fc75e596425c5
3
- size 13719746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:717a588e45d5ceb619a3a3734a0a26e967f2566e839a4b9fdec01ef72bf9b383
3
+ size 27224807
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1e067afe9912f3dd1b7925918b8cbe439229f6008e572c9c7e431ae731419f1
3
- size 687
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7c1b37b19a251e7770eb0c75e9e073fc174219b7fd47bda8bad73c04a80f635
3
+ size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9cfcd9e1766805f72358e8889b276d0318eca05e35400bbf4bdc770bb354005
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76fedabee2addf0f00776109d73599f94d39390b0d268384b25ba245d0e7a53a
3
  size 13504937
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -3,5 +3,5 @@
3
  - Stable-Baselines3: 1.8.0a2
4
  - PyTorch: 1.13.1+cu116
5
  - GPU Enabled: True
6
- - Numpy: 1.21.6
7
  - Gym: 0.21.0
 
3
  - Stable-Baselines3: 1.8.0a2
4
  - PyTorch: 1.13.1+cu116
5
  - GPU Enabled: True
6
+ - Numpy: 1.22.4
7
  - Gym: 0.21.0
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e38cee50b413c4b8cdda5a1434709b6fd57234bbadab18c33a59a732db44e643
3
- size 255939
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a3f07c5303853d0728e0684857b05e17920782cdcb5361567ac8927489c34fa
3
+ size 202273
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 210.0, "std_reward": 145.89379698945393, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-29T22:38:26.926819"}
 
1
+ {"mean_reward": 562.0, "std_reward": 92.41753080449618, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-03-08T16:28:49.763824"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa0570b193c78251d11188d295befaabb70a340db45aaf1effcd1fd2aa78d91b
3
- size 5845
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ce75a56fdd4d63757460939e069ffb167df6ca3faed071e26eac01c9c48df6a
3
+ size 36758