knight9114 committed on
Commit
e8e1a20
1 Parent(s): 0b0e31f

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +13 -21
config.json CHANGED
@@ -4,7 +4,7 @@
4
  "env": "doom_health_gathering_supreme",
5
  "experiment": "default_experiment",
6
  "train_dir": "/home/knight/github/huggingface-deep-rl-course/unit8/train_dir",
7
- "restart_behavior": "restart",
8
  "device": "gpu",
9
  "seed": null,
10
  "num_policies": 1,
@@ -16,7 +16,7 @@
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 8,
19
- "num_envs_per_worker": 8,
20
  "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
@@ -39,11 +39,11 @@
39
  "vtrace_rho": 1.0,
40
  "vtrace_c": 1.0,
41
  "optimizer": "adam",
42
- "adam_eps": 1e-05,
43
- "adam_beta1": 0.5,
44
- "adam_beta2": 0.9,
45
- "max_grad_norm": 0.5,
46
- "learning_rate": 3e-05,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
49
  "obs_subtract_mean": 0.0,
@@ -63,7 +63,7 @@
63
  "summaries_use_frameskip": true,
64
  "heartbeat_interval": 20,
65
  "heartbeat_reporting_interval": 600,
66
- "train_for_env_steps": 10000000,
67
  "train_for_seconds": 10000000000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
@@ -81,7 +81,7 @@
81
  "encoder_conv_mlp_layers": [
82
  512
83
  ],
84
- "use_rnn": false,
85
  "rnn_size": 512,
86
  "rnn_type": "gru",
87
  "rnn_num_layers": 1,
@@ -89,7 +89,7 @@
89
  "nonlinearity": "elu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
- "actor_critic_share_weights": false,
93
  "adaptive_stddev": true,
94
  "continuous_tanh_scale": 0.0,
95
  "initial_stddev": 1.0,
@@ -128,20 +128,12 @@
128
  "wide_aspect_ratio": false,
129
  "eval_env_frameskip": 1,
130
  "fps": 35,
131
- "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=8 --train_for_env_steps=10000000 --restart_behavior=restart --max_grad_norm=0.5 --adam_eps=1e-5 --adam_beta1=0.5 --adam_beta2=0.9 --learning_rate=0.00003 --use_rnn=False --actor_critic_share_weights=False",
132
  "cli_args": {
133
  "env": "doom_health_gathering_supreme",
134
- "restart_behavior": "restart",
135
  "num_workers": 8,
136
- "num_envs_per_worker": 8,
137
- "adam_eps": 1e-05,
138
- "adam_beta1": 0.5,
139
- "adam_beta2": 0.9,
140
- "max_grad_norm": 0.5,
141
- "learning_rate": 3e-05,
142
- "train_for_env_steps": 10000000,
143
- "use_rnn": false,
144
- "actor_critic_share_weights": false
145
  },
146
  "git_hash": "unknown",
147
  "git_repo_name": "not a git repository",
 
4
  "env": "doom_health_gathering_supreme",
5
  "experiment": "default_experiment",
6
  "train_dir": "/home/knight/github/huggingface-deep-rl-course/unit8/train_dir",
7
+ "restart_behavior": "resume",
8
  "device": "gpu",
9
  "seed": null,
10
  "num_policies": 1,
 
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 8,
19
+ "num_envs_per_worker": 4,
20
  "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
 
39
  "vtrace_rho": 1.0,
40
  "vtrace_c": 1.0,
41
  "optimizer": "adam",
42
+ "adam_eps": 1e-06,
43
+ "adam_beta1": 0.9,
44
+ "adam_beta2": 0.999,
45
+ "max_grad_norm": 4.0,
46
+ "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
49
  "obs_subtract_mean": 0.0,
 
63
  "summaries_use_frameskip": true,
64
  "heartbeat_interval": 20,
65
  "heartbeat_reporting_interval": 600,
66
+ "train_for_env_steps": 4000000,
67
  "train_for_seconds": 10000000000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
 
81
  "encoder_conv_mlp_layers": [
82
  512
83
  ],
84
+ "use_rnn": true,
85
  "rnn_size": 512,
86
  "rnn_type": "gru",
87
  "rnn_num_layers": 1,
 
89
  "nonlinearity": "elu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
+ "actor_critic_share_weights": true,
93
  "adaptive_stddev": true,
94
  "continuous_tanh_scale": 0.0,
95
  "initial_stddev": 1.0,
 
128
  "wide_aspect_ratio": false,
129
  "eval_env_frameskip": 1,
130
  "fps": 35,
131
+ "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000",
132
  "cli_args": {
133
  "env": "doom_health_gathering_supreme",
 
134
  "num_workers": 8,
135
+ "num_envs_per_worker": 4,
136
+ "train_for_env_steps": 4000000
 
 
 
 
 
 
 
137
  },
138
  "git_hash": "unknown",
139
  "git_repo_name": "not a git repository",