Push to Hub
Browse files- README.md +1 -1
- args.yml +7 -7
- dqn-BreakoutNoFrameskip-v4.zip +2 -2
- dqn-BreakoutNoFrameskip-v4/data +0 -0
- dqn-BreakoutNoFrameskip-v4/policy.optimizer.pth +2 -2
- dqn-BreakoutNoFrameskip-v4/policy.pth +2 -2
- dqn-BreakoutNoFrameskip-v4/system_info.txt +6 -6
- replay.mp4 +2 -2
- results.json +1 -1
- train_eval_metrics.zip +2 -2
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: BreakoutNoFrameskip-v4
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: BreakoutNoFrameskip-v4
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 42.80 +/- 16.37
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
args.yml
CHANGED
@@ -12,7 +12,7 @@
|
|
12 |
- - eval_episodes
|
13 |
- 10
|
14 |
- - eval_freq
|
15 |
-
-
|
16 |
- - gym_packages
|
17 |
- []
|
18 |
- - hyperparams
|
@@ -20,7 +20,7 @@
|
|
20 |
- - log_folder
|
21 |
- logs/6_c/rlzoo3/
|
22 |
- - log_interval
|
23 |
-
-
|
24 |
- - max_total_trials
|
25 |
- null
|
26 |
- - n_eval_envs
|
@@ -32,7 +32,7 @@
|
|
32 |
- - n_startup_trials
|
33 |
- 10
|
34 |
- - n_timesteps
|
35 |
-
-
|
36 |
- - n_trials
|
37 |
- 500
|
38 |
- - no_optim_plots
|
@@ -50,17 +50,17 @@
|
|
50 |
- - sampler
|
51 |
- tpe
|
52 |
- - save_freq
|
53 |
-
-
|
54 |
- - save_replay_buffer
|
55 |
- false
|
56 |
- - seed
|
57 |
-
-
|
58 |
- - storage
|
59 |
- null
|
60 |
- - study_name
|
61 |
- null
|
62 |
- - tensorboard_log
|
63 |
-
- runs/BreakoutNoFrameskip-
|
64 |
- - track
|
65 |
- true
|
66 |
- - trained_agent
|
@@ -76,6 +76,6 @@
|
|
76 |
- - wandb_entity
|
77 |
- null
|
78 |
- - wandb_project_name
|
79 |
-
- dqn-breakout
|
80 |
- - wandb_tags
|
81 |
- []
|
|
|
12 |
- - eval_episodes
|
13 |
- 10
|
14 |
- - eval_freq
|
15 |
+
- 10000
|
16 |
- - gym_packages
|
17 |
- []
|
18 |
- - hyperparams
|
|
|
20 |
- - log_folder
|
21 |
- logs/6_c/rlzoo3/
|
22 |
- - log_interval
|
23 |
+
- 400
|
24 |
- - max_total_trials
|
25 |
- null
|
26 |
- - n_eval_envs
|
|
|
32 |
- - n_startup_trials
|
33 |
- 10
|
34 |
- - n_timesteps
|
35 |
+
- 500000
|
36 |
- - n_trials
|
37 |
- 500
|
38 |
- - no_optim_plots
|
|
|
50 |
- - sampler
|
51 |
- tpe
|
52 |
- - save_freq
|
53 |
+
- 10000
|
54 |
- - save_replay_buffer
|
55 |
- false
|
56 |
- - seed
|
57 |
+
- 2363843725
|
58 |
- - storage
|
59 |
- null
|
60 |
- - study_name
|
61 |
- null
|
62 |
- - tensorboard_log
|
63 |
+
- runs/BreakoutNoFrameskip-v4__dqn__2363843725__1713097209
|
64 |
- - track
|
65 |
- true
|
66 |
- - trained_agent
|
|
|
76 |
- - wandb_entity
|
77 |
- null
|
78 |
- - wandb_project_name
|
79 |
+
- dqn-breakout
|
80 |
- - wandb_tags
|
81 |
- []
|
dqn-BreakoutNoFrameskip-v4.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18fb29212f83b706f1894da623327c0da8abfb5c36611b65c13f8a312c3d616b
|
3 |
+
size 27203195
|
dqn-BreakoutNoFrameskip-v4/data
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
dqn-BreakoutNoFrameskip-v4/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0145c4ec10d38d4959aa379c5ad4ea0fb68771fb3d6f6c06b1e9b7221a36e076
|
3 |
+
size 13497660
|
dqn-BreakoutNoFrameskip-v4/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d42692dca5516497d5ab50165f41419c4b9409ac9ca31c0fe6f1f199048d1cf7
|
3 |
+
size 13496986
|
dqn-BreakoutNoFrameskip-v4/system_info.txt
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
-
- OS: Linux-
|
2 |
-
- Python: 3.
|
3 |
- Stable-Baselines3: 2.1.0
|
4 |
-
- PyTorch: 2.
|
5 |
-
- GPU Enabled:
|
6 |
-
- Numpy: 1.
|
7 |
-
- Cloudpickle:
|
8 |
- Gymnasium: 0.29.1
|
9 |
- OpenAI Gym: 0.26.2
|
|
|
1 |
+
- OS: Linux-5.15.146.1-microsoft-standard-WSL2-x86_64-with-glibc2.35 # 1 SMP Thu Jan 11 04:09:03 UTC 2024
|
2 |
+
- Python: 3.9.18
|
3 |
- Stable-Baselines3: 2.1.0
|
4 |
+
- PyTorch: 2.1.0+cpu
|
5 |
+
- GPU Enabled: False
|
6 |
+
- Numpy: 1.26.1
|
7 |
+
- Cloudpickle: 3.0.0
|
8 |
- Gymnasium: 0.29.1
|
9 |
- OpenAI Gym: 0.26.2
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57af4c35b302181eb2b6cc7a8b52df379d2738019e0a22c1c8079f5ec976cfa8
|
3 |
+
size 73180
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 42.8, "std_reward": 16.36948380371232, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-04-14T19:45:56.555308"}
|
train_eval_metrics.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d588a8292d999fc90fa65f33f6b364c901d2e2bd16e8a560742025cb5e0c082
|
3 |
+
size 40084
|