chqmatteo committed on
Commit
c45c0f9
1 Parent(s): 01f2c8c

Upload . with huggingface_hub

Browse files
.summary/0/events.out.tfevents.1677225358.pop-os ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e40ea1910c6acde0638d1fc813a791448b39c2eae3638f55d1e4d876c17855a4
3
+ size 72788
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 3.94 +/- 0.20
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 5.12 +/- 1.18
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000000254_1040384_reward_6.010.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67af5682ef46f0d3035627fb356f41ef1b12bae5c1a510362ccef50bdf78939a
3
+ size 34928614
checkpoint_p0/checkpoint_000000268_1097728.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d38433749271bdb5c4c181d735cd77648786687a528baa8c3d3ee8903f10abd
3
+ size 34929028
config.json CHANGED
@@ -3,7 +3,7 @@
3
  "algo": "APPO",
4
  "env": "doom_health_gathering_supreme",
5
  "experiment": "default_experiment",
6
- "train_dir": "/mnt/c/Users/chqma/projects/ai/deep-rl-class/notebooks/unit8/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
  "seed": null,
@@ -65,7 +65,7 @@
65
  "summaries_use_frameskip": true,
66
  "heartbeat_interval": 20,
67
  "heartbeat_reporting_interval": 600,
68
- "train_for_env_steps": 40000000,
69
  "train_for_seconds": 10000000000,
70
  "save_every_sec": 120,
71
  "keep_checkpoints": 2,
@@ -137,6 +137,6 @@
137
  "num_envs_per_worker": 4,
138
  "train_for_env_steps": 4000000
139
  },
140
- "git_hash": "372eb1042c1a2a82a2684e1795d47eaa26c046f7",
141
  "git_repo_name": "https://github.com/huggingface/deep-rl-class.git"
142
  }
 
3
  "algo": "APPO",
4
  "env": "doom_health_gathering_supreme",
5
  "experiment": "default_experiment",
6
+ "train_dir": "/mnt/chqma/data-ssd-01/dataset/oss/RWKV-LM/deep-rl-class/notebooks/unit8/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
  "seed": null,
 
65
  "summaries_use_frameskip": true,
66
  "heartbeat_interval": 20,
67
  "heartbeat_reporting_interval": 600,
68
+ "train_for_env_steps": 4000000,
69
  "train_for_seconds": 10000000000,
70
  "save_every_sec": 120,
71
  "keep_checkpoints": 2,
 
137
  "num_envs_per_worker": 4,
138
  "train_for_env_steps": 4000000
139
  },
140
+ "git_hash": "1a2374cbd09490752b14aee6fdecfe64db411550",
141
  "git_repo_name": "https://github.com/huggingface/deep-rl-class.git"
142
  }
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff