alidenewade committed on
Commit
5f048cb
·
verified ·
1 Parent(s): 23ef735

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1731062261.54cd0c9040da ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:929302b80ec8dd6692657a325d2d3c05d6c3e5a320e1c0e14835752297598de0
3
+ size 727083
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 4.06 +/- 0.41
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 11.41 +/- 4.52
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000000895_3665920_reward_23.358.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e90f42a33e006c942fb16e7ea24adb325f3843ecbfb55a8345dda3a68e7200e
3
+ size 34929051
checkpoint_p0/checkpoint_000000910_3727360.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2508e11890f5d65c94f9da1ce0ba9ed60ea7cbb7ad6496fd081359b97c4b1560
3
+ size 34929477
checkpoint_p0/checkpoint_000000978_4005888.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fa99455ba1fbe585942b03f43eed7d14008e65fbb6cd2b891c4be9c3ccb7825
3
+ size 34929477
config.json CHANGED
@@ -3,7 +3,7 @@
3
  "algo": "APPO",
4
  "env": "doom_health_gathering_supreme",
5
  "experiment": "default_experiment",
6
- "train_dir": "/root/hfRL/ml/LunarLander-v2/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
  "seed": null,
@@ -16,7 +16,7 @@
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 8,
19
- "num_envs_per_worker": 4,
20
  "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
@@ -130,11 +130,13 @@
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
- "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
136
  "num_workers": 8,
137
- "num_envs_per_worker": 4,
 
 
138
  "train_for_env_steps": 4000000
139
  },
140
  "git_hash": "unknown",
 
3
  "algo": "APPO",
4
  "env": "doom_health_gathering_supreme",
5
  "experiment": "default_experiment",
6
+ "train_dir": "/content/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
  "seed": null,
 
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 8,
19
+ "num_envs_per_worker": 16,
20
  "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
 
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
+ "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000 --learning_rate=0.0001 --batch_size=1024 --num_envs=16",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
136
  "num_workers": 8,
137
+ "num_envs_per_worker": 16,
138
+ "batch_size": 1024,
139
+ "learning_rate": 0.0001,
140
  "train_for_env_steps": 4000000
141
  },
142
  "git_hash": "unknown",
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ddf3c95fa679fc9ffc32521921710e4073367088ae805f5e334d6d5fe2e37f8d
3
- size 6040020
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4ed78c785cd0df2285dd3f6ddb9c575870fd08a36d041831c63254bbee305ba
3
+ size 21865704
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff