labicquette committed on
Commit
f8fa1aa
·
1 Parent(s): 091baba

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +17 -15
config.json CHANGED
@@ -2,7 +2,7 @@
2
  "help": false,
3
  "algo": "APPO",
4
  "env": "doom_health_gathering_supreme",
5
- "experiment": "vizdoom_doom_health_gathering_supreme_gru_2222_1_decorrelate_10M",
6
  "train_dir": "/home/labicquette/wip/hugRL/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
@@ -16,7 +16,7 @@
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 12,
19
- "num_envs_per_worker": 8,
20
  "batch_size": 2048,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
@@ -42,7 +42,7 @@
42
  "adam_eps": 1e-06,
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
- "max_grad_norm": 4.0,
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
@@ -61,8 +61,8 @@
61
  "flush_summaries_interval": 30,
62
  "stats_avg": 100,
63
  "summaries_use_frameskip": true,
64
- "heartbeat_interval": 20,
65
- "heartbeat_reporting_interval": 600,
66
  "train_for_env_steps": 10000000,
67
  "train_for_seconds": 10000000000,
68
  "save_every_sec": 120,
@@ -83,10 +83,10 @@
83
  ],
84
  "use_rnn": true,
85
  "rnn_size": 512,
86
- "rnn_type": "gru",
87
  "rnn_num_layers": 1,
88
  "decoder_mlp_layers": [],
89
- "nonlinearity": "elu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
  "actor_critic_share_weights": true,
@@ -95,7 +95,7 @@
95
  "initial_stddev": 1.0,
96
  "use_env_info_cache": false,
97
  "env_gpu_actions": false,
98
- "env_gpu_observations": false,
99
  "env_frameskip": 4,
100
  "env_framestack": 1,
101
  "pixel_format": "CHW",
@@ -128,20 +128,22 @@
128
  "wide_aspect_ratio": false,
129
  "eval_env_frameskip": 1,
130
  "fps": 35,
131
- "command_line": "--env=doom_health_gathering_supreme --experiment=vizdoom_doom_health_gathering_supreme_gru_2222_1_decorrelate_10M --num_workers=12 --num_envs_per_worker=8 --train_for_env_steps=10000000 --batch_size=2048 --max_grad_norm=4.0 --nonlinearity=elu --rnn_type=gru --decorrelate_experience_max_seconds=1 --env_gpu_observations=false --seed=2222",
132
  "cli_args": {
133
  "env": "doom_health_gathering_supreme",
134
- "experiment": "vizdoom_doom_health_gathering_supreme_gru_2222_1_decorrelate_10M",
135
  "seed": 2222,
136
  "num_workers": 12,
137
- "num_envs_per_worker": 8,
138
  "batch_size": 2048,
139
- "max_grad_norm": 4.0,
140
  "decorrelate_experience_max_seconds": 1,
 
 
141
  "train_for_env_steps": 10000000,
142
- "rnn_type": "gru",
143
- "nonlinearity": "elu",
144
- "env_gpu_observations": false
145
  },
146
  "git_hash": "unknown",
147
  "git_repo_name": "not a git repository",
 
2
  "help": false,
3
  "algo": "APPO",
4
  "env": "doom_health_gathering_supreme",
5
+ "experiment": "vizdoom_doom_health_gathering_supreme_lstm_2222_3_decorrelate_10M",
6
  "train_dir": "/home/labicquette/wip/hugRL/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
 
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 12,
19
+ "num_envs_per_worker": 12,
20
  "batch_size": 2048,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
 
42
  "adam_eps": 1e-06,
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
+ "max_grad_norm": 0.0,
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
 
61
  "flush_summaries_interval": 30,
62
  "stats_avg": 100,
63
  "summaries_use_frameskip": true,
64
+ "heartbeat_interval": 10,
65
+ "heartbeat_reporting_interval": 300,
66
  "train_for_env_steps": 10000000,
67
  "train_for_seconds": 10000000000,
68
  "save_every_sec": 120,
 
83
  ],
84
  "use_rnn": true,
85
  "rnn_size": 512,
86
+ "rnn_type": "lstm",
87
  "rnn_num_layers": 1,
88
  "decoder_mlp_layers": [],
89
+ "nonlinearity": "relu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
  "actor_critic_share_weights": true,
 
95
  "initial_stddev": 1.0,
96
  "use_env_info_cache": false,
97
  "env_gpu_actions": false,
98
+ "env_gpu_observations": true,
99
  "env_frameskip": 4,
100
  "env_framestack": 1,
101
  "pixel_format": "CHW",
 
128
  "wide_aspect_ratio": false,
129
  "eval_env_frameskip": 1,
130
  "fps": 35,
131
+ "command_line": "--env=doom_health_gathering_supreme --experiment=vizdoom_doom_health_gathering_supreme_lstm_2222_3_decorrelate_10M --num_workers=12 --num_envs_per_worker=12 --train_for_env_steps=10000000 --batch_size=2048 --max_grad_norm=0.0 --nonlinearity=relu --rnn_type=lstm --decorrelate_experience_max_seconds=1 --env_gpu_observations=true --seed=2222 --heartbeat_interval=10 --heartbeat_reporting_interval=300",
132
  "cli_args": {
133
  "env": "doom_health_gathering_supreme",
134
+ "experiment": "vizdoom_doom_health_gathering_supreme_lstm_2222_3_decorrelate_10M",
135
  "seed": 2222,
136
  "num_workers": 12,
137
+ "num_envs_per_worker": 12,
138
  "batch_size": 2048,
139
+ "max_grad_norm": 0.0,
140
  "decorrelate_experience_max_seconds": 1,
141
+ "heartbeat_interval": 10,
142
+ "heartbeat_reporting_interval": 300,
143
  "train_for_env_steps": 10000000,
144
+ "rnn_type": "lstm",
145
+ "nonlinearity": "relu",
146
+ "env_gpu_observations": true
147
  },
148
  "git_hash": "unknown",
149
  "git_repo_name": "not a git repository",