labicquette
committed on
Commit
·
f8fa1aa
1
Parent(s):
091baba
Upload config.json with huggingface_hub
Browse files - config.json +17 -15
config.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"help": false,
|
3 |
"algo": "APPO",
|
4 |
"env": "doom_health_gathering_supreme",
|
5 |
-
"experiment": "
|
6 |
"train_dir": "/home/labicquette/wip/hugRL/train_dir",
|
7 |
"restart_behavior": "resume",
|
8 |
"device": "gpu",
|
@@ -16,7 +16,7 @@
|
|
16 |
"policy_workers_per_policy": 1,
|
17 |
"max_policy_lag": 1000,
|
18 |
"num_workers": 12,
|
19 |
-
"num_envs_per_worker":
|
20 |
"batch_size": 2048,
|
21 |
"num_batches_per_epoch": 1,
|
22 |
"num_epochs": 1,
|
@@ -42,7 +42,7 @@
|
|
42 |
"adam_eps": 1e-06,
|
43 |
"adam_beta1": 0.9,
|
44 |
"adam_beta2": 0.999,
|
45 |
-
"max_grad_norm":
|
46 |
"learning_rate": 0.0001,
|
47 |
"lr_schedule": "constant",
|
48 |
"lr_schedule_kl_threshold": 0.008,
|
@@ -61,8 +61,8 @@
|
|
61 |
"flush_summaries_interval": 30,
|
62 |
"stats_avg": 100,
|
63 |
"summaries_use_frameskip": true,
|
64 |
-
"heartbeat_interval":
|
65 |
-
"heartbeat_reporting_interval":
|
66 |
"train_for_env_steps": 10000000,
|
67 |
"train_for_seconds": 10000000000,
|
68 |
"save_every_sec": 120,
|
@@ -83,10 +83,10 @@
|
|
83 |
],
|
84 |
"use_rnn": true,
|
85 |
"rnn_size": 512,
|
86 |
-
"rnn_type": "
|
87 |
"rnn_num_layers": 1,
|
88 |
"decoder_mlp_layers": [],
|
89 |
-
"nonlinearity": "
|
90 |
"policy_initialization": "orthogonal",
|
91 |
"policy_init_gain": 1.0,
|
92 |
"actor_critic_share_weights": true,
|
@@ -95,7 +95,7 @@
|
|
95 |
"initial_stddev": 1.0,
|
96 |
"use_env_info_cache": false,
|
97 |
"env_gpu_actions": false,
|
98 |
-
"env_gpu_observations":
|
99 |
"env_frameskip": 4,
|
100 |
"env_framestack": 1,
|
101 |
"pixel_format": "CHW",
|
@@ -128,20 +128,22 @@
|
|
128 |
"wide_aspect_ratio": false,
|
129 |
"eval_env_frameskip": 1,
|
130 |
"fps": 35,
|
131 |
-
"command_line": "--env=doom_health_gathering_supreme --experiment=
|
132 |
"cli_args": {
|
133 |
"env": "doom_health_gathering_supreme",
|
134 |
-
"experiment": "
|
135 |
"seed": 2222,
|
136 |
"num_workers": 12,
|
137 |
-
"num_envs_per_worker":
|
138 |
"batch_size": 2048,
|
139 |
-
"max_grad_norm":
|
140 |
"decorrelate_experience_max_seconds": 1,
|
|
|
|
|
141 |
"train_for_env_steps": 10000000,
|
142 |
-
"rnn_type": "
|
143 |
-
"nonlinearity": "
|
144 |
-
"env_gpu_observations":
|
145 |
},
|
146 |
"git_hash": "unknown",
|
147 |
"git_repo_name": "not a git repository",
|
|
|
2 |
"help": false,
|
3 |
"algo": "APPO",
|
4 |
"env": "doom_health_gathering_supreme",
|
5 |
+
"experiment": "vizdoom_doom_health_gathering_supreme_lstm_2222_3_decorrelate_10M",
|
6 |
"train_dir": "/home/labicquette/wip/hugRL/train_dir",
|
7 |
"restart_behavior": "resume",
|
8 |
"device": "gpu",
|
|
|
16 |
"policy_workers_per_policy": 1,
|
17 |
"max_policy_lag": 1000,
|
18 |
"num_workers": 12,
|
19 |
+
"num_envs_per_worker": 12,
|
20 |
"batch_size": 2048,
|
21 |
"num_batches_per_epoch": 1,
|
22 |
"num_epochs": 1,
|
|
|
42 |
"adam_eps": 1e-06,
|
43 |
"adam_beta1": 0.9,
|
44 |
"adam_beta2": 0.999,
|
45 |
+
"max_grad_norm": 0.0,
|
46 |
"learning_rate": 0.0001,
|
47 |
"lr_schedule": "constant",
|
48 |
"lr_schedule_kl_threshold": 0.008,
|
|
|
61 |
"flush_summaries_interval": 30,
|
62 |
"stats_avg": 100,
|
63 |
"summaries_use_frameskip": true,
|
64 |
+
"heartbeat_interval": 10,
|
65 |
+
"heartbeat_reporting_interval": 300,
|
66 |
"train_for_env_steps": 10000000,
|
67 |
"train_for_seconds": 10000000000,
|
68 |
"save_every_sec": 120,
|
|
|
83 |
],
|
84 |
"use_rnn": true,
|
85 |
"rnn_size": 512,
|
86 |
+
"rnn_type": "lstm",
|
87 |
"rnn_num_layers": 1,
|
88 |
"decoder_mlp_layers": [],
|
89 |
+
"nonlinearity": "relu",
|
90 |
"policy_initialization": "orthogonal",
|
91 |
"policy_init_gain": 1.0,
|
92 |
"actor_critic_share_weights": true,
|
|
|
95 |
"initial_stddev": 1.0,
|
96 |
"use_env_info_cache": false,
|
97 |
"env_gpu_actions": false,
|
98 |
+
"env_gpu_observations": true,
|
99 |
"env_frameskip": 4,
|
100 |
"env_framestack": 1,
|
101 |
"pixel_format": "CHW",
|
|
|
128 |
"wide_aspect_ratio": false,
|
129 |
"eval_env_frameskip": 1,
|
130 |
"fps": 35,
|
131 |
+
"command_line": "--env=doom_health_gathering_supreme --experiment=vizdoom_doom_health_gathering_supreme_lstm_2222_3_decorrelate_10M --num_workers=12 --num_envs_per_worker=12 --train_for_env_steps=10000000 --batch_size=2048 --max_grad_norm=0.0 --nonlinearity=relu --rnn_type=lstm --decorrelate_experience_max_seconds=1 --env_gpu_observations=true --seed=2222 --heartbeat_interval=10 --heartbeat_reporting_interval=300",
|
132 |
"cli_args": {
|
133 |
"env": "doom_health_gathering_supreme",
|
134 |
+
"experiment": "vizdoom_doom_health_gathering_supreme_lstm_2222_3_decorrelate_10M",
|
135 |
"seed": 2222,
|
136 |
"num_workers": 12,
|
137 |
+
"num_envs_per_worker": 12,
|
138 |
"batch_size": 2048,
|
139 |
+
"max_grad_norm": 0.0,
|
140 |
"decorrelate_experience_max_seconds": 1,
|
141 |
+
"heartbeat_interval": 10,
|
142 |
+
"heartbeat_reporting_interval": 300,
|
143 |
"train_for_env_steps": 10000000,
|
144 |
+
"rnn_type": "lstm",
|
145 |
+
"nonlinearity": "relu",
|
146 |
+
"env_gpu_observations": true
|
147 |
},
|
148 |
"git_hash": "unknown",
|
149 |
"git_repo_name": "not a git repository",
|