gchindemi committed on
Commit
4eff597
1 Parent(s): f0a58ae

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1704458512.bd4e88014723 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0ee1637da859992af8c7d0cfd98f6b5dcccde56b754c7de50493571673a45b3
3
+ size 2164694
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 9.31 +/- 4.55
19
  name: mean_reward
20
  verified: false
21
  ---
@@ -38,19 +38,19 @@ python -m sample_factory.huggingface.load_from_hub -r gchindemi/appo-vizdoom_hea
38
 
39
  To run the model after download, use the `enjoy` script corresponding to this environment:
40
  ```
41
- python -m .usr.local.lib.python3.10.dist-packages.colab_kernel_launcher --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=appo-vizdoom_health_gathering_supreme
42
  ```
43
 
44
 
45
  You can also upload models to the Hugging Face Hub using the same script with the `--push_to_hub` flag.
46
  See https://www.samplefactory.dev/10-huggingface/huggingface/ for more details
47
-
48
  ## Training with this model
49
 
50
  To continue training with this model, use the `train` script corresponding to this environment:
51
  ```
52
- python -m .usr.local.lib.python3.10.dist-packages.colab_kernel_launcher --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=appo-vizdoom_health_gathering_supreme --restart_behavior=resume --train_for_env_steps=10000000000
53
  ```
54
 
55
  Note, you may have to adjust `--train_for_env_steps` to a suitably high number as the experiment will resume at the number of steps it concluded at.
56
-
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 10.05 +/- 5.52
19
  name: mean_reward
20
  verified: false
21
  ---
 
38
 
39
  To run the model after download, use the `enjoy` script corresponding to this environment:
40
  ```
41
+ python -m <path.to.enjoy.module> --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=appo-vizdoom_health_gathering_supreme
42
  ```
43
 
44
 
45
  You can also upload models to the Hugging Face Hub using the same script with the `--push_to_hub` flag.
46
  See https://www.samplefactory.dev/10-huggingface/huggingface/ for more details
47
+
48
  ## Training with this model
49
 
50
  To continue training with this model, use the `train` script corresponding to this environment:
51
  ```
52
+ python -m <path.to.train.module> --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=appo-vizdoom_health_gathering_supreme --restart_behavior=resume --train_for_env_steps=10000000000
53
  ```
54
 
55
  Note, you may have to adjust `--train_for_env_steps` to a suitably high number as the experiment will resume at the number of steps it concluded at.
56
+
checkpoint_p0/best_000002374_9723904_reward_31.566.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c4cfd3c27c3062c7492438a8d6ac9e688f8ccbd0e8667ca6cb0431dcd6f7298
3
+ size 34929051
checkpoint_p0/checkpoint_000002361_9670656.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:454e3595bc4134cb418e36a70a48032620a46b3d6dede2e8174624a803a6f171
3
+ size 34929477
checkpoint_p0/checkpoint_000002443_10006528.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:860095e3b2bd68985a7a38f88abd26a19bc80ed23bfd60177d7aa0abb22458f9
3
+ size 34929541
config.json CHANGED
@@ -46,6 +46,8 @@
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
 
 
49
  "obs_subtract_mean": 0.0,
50
  "obs_scale": 255.0,
51
  "normalize_input": true,
@@ -63,7 +65,7 @@
63
  "summaries_use_frameskip": true,
64
  "heartbeat_interval": 20,
65
  "heartbeat_reporting_interval": 600,
66
- "train_for_env_steps": 4000000,
67
  "train_for_seconds": 10000000000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
@@ -128,14 +130,13 @@
128
  "wide_aspect_ratio": false,
129
  "eval_env_frameskip": 1,
130
  "fps": 35,
131
- "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000",
132
  "cli_args": {
133
  "env": "doom_health_gathering_supreme",
134
  "num_workers": 8,
135
  "num_envs_per_worker": 4,
136
- "train_for_env_steps": 4000000
137
  },
138
  "git_hash": "unknown",
139
- "git_repo_name": "not a git repository",
140
- "train_script": ".usr.local.lib.python3.10.dist-packages.colab_kernel_launcher"
141
  }
 
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
49
+ "lr_adaptive_min": 1e-06,
50
+ "lr_adaptive_max": 0.01,
51
  "obs_subtract_mean": 0.0,
52
  "obs_scale": 255.0,
53
  "normalize_input": true,
 
65
  "summaries_use_frameskip": true,
66
  "heartbeat_interval": 20,
67
  "heartbeat_reporting_interval": 600,
68
+ "train_for_env_steps": 10000000,
69
  "train_for_seconds": 10000000000,
70
  "save_every_sec": 120,
71
  "keep_checkpoints": 2,
 
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
+ "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=10_000_000",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
136
  "num_workers": 8,
137
  "num_envs_per_worker": 4,
138
+ "train_for_env_steps": 10000000
139
  },
140
  "git_hash": "unknown",
141
+ "git_repo_name": "not a git repository"
 
142
  }
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93249e065e6b3ca58e1312d0ba76b1fafc67ccd6be73871b293c910200ce8dc4
3
- size 17744257
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec9914a6f5ce460610e03957d37966d71e027a8aa02fb818975dc73d99e1c4c3
3
+ size 19675353
sf_log.txt ADDED
The diff for this file is too large to render. See raw diff