knight9114
committed on
Commit
•
e8e1a20
1
Parent(s):
0b0e31f
Upload config.json with huggingface_hub
Browse files
- config.json +13 -21
config.json
CHANGED
@@ -4,7 +4,7 @@
|
|
4 |
"env": "doom_health_gathering_supreme",
|
5 |
"experiment": "default_experiment",
|
6 |
"train_dir": "/home/knight/github/huggingface-deep-rl-course/unit8/train_dir",
|
7 |
-
"restart_behavior": "restart",
|
8 |
"device": "gpu",
|
9 |
"seed": null,
|
10 |
"num_policies": 1,
|
@@ -16,7 +16,7 @@
|
|
16 |
"policy_workers_per_policy": 1,
|
17 |
"max_policy_lag": 1000,
|
18 |
"num_workers": 8,
|
19 |
-
"num_envs_per_worker":
|
20 |
"batch_size": 1024,
|
21 |
"num_batches_per_epoch": 1,
|
22 |
"num_epochs": 1,
|
@@ -39,11 +39,11 @@
|
|
39 |
"vtrace_rho": 1.0,
|
40 |
"vtrace_c": 1.0,
|
41 |
"optimizer": "adam",
|
42 |
-
"adam_eps": 1e-
|
43 |
-
"adam_beta1": 0.5,
|
44 |
-
"adam_beta2": 0.9,
|
45 |
-
"max_grad_norm": 0.5,
|
46 |
-
"learning_rate": 3e-05,
|
47 |
"lr_schedule": "constant",
|
48 |
"lr_schedule_kl_threshold": 0.008,
|
49 |
"obs_subtract_mean": 0.0,
|
@@ -63,7 +63,7 @@
|
|
63 |
"summaries_use_frameskip": true,
|
64 |
"heartbeat_interval": 20,
|
65 |
"heartbeat_reporting_interval": 600,
|
66 |
-
"train_for_env_steps": 10000000,
|
67 |
"train_for_seconds": 10000000000,
|
68 |
"save_every_sec": 120,
|
69 |
"keep_checkpoints": 2,
|
@@ -81,7 +81,7 @@
|
|
81 |
"encoder_conv_mlp_layers": [
|
82 |
512
|
83 |
],
|
84 |
-
"use_rnn": false,
|
85 |
"rnn_size": 512,
|
86 |
"rnn_type": "gru",
|
87 |
"rnn_num_layers": 1,
|
@@ -89,7 +89,7 @@
|
|
89 |
"nonlinearity": "elu",
|
90 |
"policy_initialization": "orthogonal",
|
91 |
"policy_init_gain": 1.0,
|
92 |
-
"actor_critic_share_weights": false,
|
93 |
"adaptive_stddev": true,
|
94 |
"continuous_tanh_scale": 0.0,
|
95 |
"initial_stddev": 1.0,
|
@@ -128,20 +128,12 @@
|
|
128 |
"wide_aspect_ratio": false,
|
129 |
"eval_env_frameskip": 1,
|
130 |
"fps": 35,
|
131 |
-
"command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=
|
132 |
"cli_args": {
|
133 |
"env": "doom_health_gathering_supreme",
|
134 |
-
"restart_behavior": "restart",
|
135 |
"num_workers": 8,
|
136 |
-
"num_envs_per_worker":
|
137 |
-
"
|
138 |
-
"adam_beta1": 0.5,
|
139 |
-
"adam_beta2": 0.9,
|
140 |
-
"max_grad_norm": 0.5,
|
141 |
-
"learning_rate": 3e-05,
|
142 |
-
"train_for_env_steps": 10000000,
|
143 |
-
"use_rnn": false,
|
144 |
-
"actor_critic_share_weights": false
|
145 |
},
|
146 |
"git_hash": "unknown",
|
147 |
"git_repo_name": "not a git repository",
|
|
|
4 |
"env": "doom_health_gathering_supreme",
|
5 |
"experiment": "default_experiment",
|
6 |
"train_dir": "/home/knight/github/huggingface-deep-rl-course/unit8/train_dir",
|
7 |
+
"restart_behavior": "resume",
|
8 |
"device": "gpu",
|
9 |
"seed": null,
|
10 |
"num_policies": 1,
|
|
|
16 |
"policy_workers_per_policy": 1,
|
17 |
"max_policy_lag": 1000,
|
18 |
"num_workers": 8,
|
19 |
+
"num_envs_per_worker": 4,
|
20 |
"batch_size": 1024,
|
21 |
"num_batches_per_epoch": 1,
|
22 |
"num_epochs": 1,
|
|
|
39 |
"vtrace_rho": 1.0,
|
40 |
"vtrace_c": 1.0,
|
41 |
"optimizer": "adam",
|
42 |
+
"adam_eps": 1e-06,
|
43 |
+
"adam_beta1": 0.9,
|
44 |
+
"adam_beta2": 0.999,
|
45 |
+
"max_grad_norm": 4.0,
|
46 |
+
"learning_rate": 0.0001,
|
47 |
"lr_schedule": "constant",
|
48 |
"lr_schedule_kl_threshold": 0.008,
|
49 |
"obs_subtract_mean": 0.0,
|
|
|
63 |
"summaries_use_frameskip": true,
|
64 |
"heartbeat_interval": 20,
|
65 |
"heartbeat_reporting_interval": 600,
|
66 |
+
"train_for_env_steps": 4000000,
|
67 |
"train_for_seconds": 10000000000,
|
68 |
"save_every_sec": 120,
|
69 |
"keep_checkpoints": 2,
|
|
|
81 |
"encoder_conv_mlp_layers": [
|
82 |
512
|
83 |
],
|
84 |
+
"use_rnn": true,
|
85 |
"rnn_size": 512,
|
86 |
"rnn_type": "gru",
|
87 |
"rnn_num_layers": 1,
|
|
|
89 |
"nonlinearity": "elu",
|
90 |
"policy_initialization": "orthogonal",
|
91 |
"policy_init_gain": 1.0,
|
92 |
+
"actor_critic_share_weights": true,
|
93 |
"adaptive_stddev": true,
|
94 |
"continuous_tanh_scale": 0.0,
|
95 |
"initial_stddev": 1.0,
|
|
|
128 |
"wide_aspect_ratio": false,
|
129 |
"eval_env_frameskip": 1,
|
130 |
"fps": 35,
|
131 |
+
"command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000",
|
132 |
"cli_args": {
|
133 |
"env": "doom_health_gathering_supreme",
|
|
|
134 |
"num_workers": 8,
|
135 |
+
"num_envs_per_worker": 4,
|
136 |
+
"train_for_env_steps": 4000000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
137 |
},
|
138 |
"git_hash": "unknown",
|
139 |
"git_repo_name": "not a git repository",
|