Upload folder using huggingface_hub
Browse files
.summary/0/events.out.tfevents.1704458512.bd4e88014723
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0ee1637da859992af8c7d0cfd98f6b5dcccde56b754c7de50493571673a45b3
|
3 |
+
size 2164694
|
README.md
CHANGED
@@ -15,7 +15,7 @@ model-index:
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
-
value:
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
@@ -38,19 +38,19 @@ python -m sample_factory.huggingface.load_from_hub -r gchindemi/appo-vizdoom_hea
|
|
38 |
|
39 |
To run the model after download, use the `enjoy` script corresponding to this environment:
|
40 |
```
|
41 |
-
python -m .
|
42 |
```
|
43 |
|
44 |
|
45 |
You can also upload models to the Hugging Face Hub using the same script with the `--push_to_hub` flag.
|
46 |
See https://www.samplefactory.dev/10-huggingface/huggingface/ for more details
|
47 |
-
|
48 |
## Training with this model
|
49 |
|
50 |
To continue training with this model, use the `train` script corresponding to this environment:
|
51 |
```
|
52 |
-
python -m .
|
53 |
```
|
54 |
|
55 |
Note, you may have to adjust `--train_for_env_steps` to a suitably high number as the experiment will resume at the number of steps it concluded at.
|
56 |
-
|
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
+
value: 10.05 +/- 5.52
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
|
|
38 |
|
39 |
To run the model after download, use the `enjoy` script corresponding to this environment:
|
40 |
```
|
41 |
+
python -m <path.to.enjoy.module> --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=appo-vizdoom_health_gathering_supreme
|
42 |
```
|
43 |
|
44 |
|
45 |
You can also upload models to the Hugging Face Hub using the same script with the `--push_to_hub` flag.
|
46 |
See https://www.samplefactory.dev/10-huggingface/huggingface/ for more details
|
47 |
+
|
48 |
## Training with this model
|
49 |
|
50 |
To continue training with this model, use the `train` script corresponding to this environment:
|
51 |
```
|
52 |
+
python -m <path.to.train.module> --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=appo-vizdoom_health_gathering_supreme --restart_behavior=resume --train_for_env_steps=10000000000
|
53 |
```
|
54 |
|
55 |
Note, you may have to adjust `--train_for_env_steps` to a suitably high number as the experiment will resume at the number of steps it concluded at.
|
56 |
+
|
checkpoint_p0/best_000002374_9723904_reward_31.566.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c4cfd3c27c3062c7492438a8d6ac9e688f8ccbd0e8667ca6cb0431dcd6f7298
|
3 |
+
size 34929051
|
checkpoint_p0/checkpoint_000002361_9670656.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:454e3595bc4134cb418e36a70a48032620a46b3d6dede2e8174624a803a6f171
|
3 |
+
size 34929477
|
checkpoint_p0/checkpoint_000002443_10006528.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:860095e3b2bd68985a7a38f88abd26a19bc80ed23bfd60177d7aa0abb22458f9
|
3 |
+
size 34929541
|
config.json
CHANGED
@@ -46,6 +46,8 @@
|
|
46 |
"learning_rate": 0.0001,
|
47 |
"lr_schedule": "constant",
|
48 |
"lr_schedule_kl_threshold": 0.008,
|
|
|
|
|
49 |
"obs_subtract_mean": 0.0,
|
50 |
"obs_scale": 255.0,
|
51 |
"normalize_input": true,
|
@@ -63,7 +65,7 @@
|
|
63 |
"summaries_use_frameskip": true,
|
64 |
"heartbeat_interval": 20,
|
65 |
"heartbeat_reporting_interval": 600,
|
66 |
-
"train_for_env_steps":
|
67 |
"train_for_seconds": 10000000000,
|
68 |
"save_every_sec": 120,
|
69 |
"keep_checkpoints": 2,
|
@@ -128,14 +130,13 @@
|
|
128 |
"wide_aspect_ratio": false,
|
129 |
"eval_env_frameskip": 1,
|
130 |
"fps": 35,
|
131 |
-
"command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=
|
132 |
"cli_args": {
|
133 |
"env": "doom_health_gathering_supreme",
|
134 |
"num_workers": 8,
|
135 |
"num_envs_per_worker": 4,
|
136 |
-
"train_for_env_steps":
|
137 |
},
|
138 |
"git_hash": "unknown",
|
139 |
-
"git_repo_name": "not a git repository"
|
140 |
-
"train_script": ".usr.local.lib.python3.10.dist-packages.colab_kernel_launcher"
|
141 |
}
|
|
|
46 |
"learning_rate": 0.0001,
|
47 |
"lr_schedule": "constant",
|
48 |
"lr_schedule_kl_threshold": 0.008,
|
49 |
+
"lr_adaptive_min": 1e-06,
|
50 |
+
"lr_adaptive_max": 0.01,
|
51 |
"obs_subtract_mean": 0.0,
|
52 |
"obs_scale": 255.0,
|
53 |
"normalize_input": true,
|
|
|
65 |
"summaries_use_frameskip": true,
|
66 |
"heartbeat_interval": 20,
|
67 |
"heartbeat_reporting_interval": 600,
|
68 |
+
"train_for_env_steps": 10000000,
|
69 |
"train_for_seconds": 10000000000,
|
70 |
"save_every_sec": 120,
|
71 |
"keep_checkpoints": 2,
|
|
|
130 |
"wide_aspect_ratio": false,
|
131 |
"eval_env_frameskip": 1,
|
132 |
"fps": 35,
|
133 |
+
"command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=10_000_000",
|
134 |
"cli_args": {
|
135 |
"env": "doom_health_gathering_supreme",
|
136 |
"num_workers": 8,
|
137 |
"num_envs_per_worker": 4,
|
138 |
+
"train_for_env_steps": 10000000
|
139 |
},
|
140 |
"git_hash": "unknown",
|
141 |
+
"git_repo_name": "not a git repository"
|
|
|
142 |
}
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec9914a6f5ce460610e03957d37966d71e027a8aa02fb818975dc73d99e1c4c3
|
3 |
+
size 19675353
|
sf_log.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|