Lorius2 commited on
Commit
e2e44ba
1 Parent(s): 610b2b4

First Push

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18d24a27f9ca998a26fce59e884615d7d5adae049b9d78b8388875fda0ac553c
3
  size 1764633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfa4e657c1f0d9f19eb01072e258b3a96ebfc9385c738eca8f929ab26a459da0
3
  size 1764633
SoccerTwos/SoccerTwos-1200138.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfa4e657c1f0d9f19eb01072e258b3a96ebfc9385c738eca8f929ab26a459da0
3
+ size 1764633
SoccerTwos/SoccerTwos-1200138.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34c4451c24392d87e1f15bc461d130440913ac02b65dddd82dda8babfb526e97
3
+ size 28422481
SoccerTwos/SoccerTwos-999491.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:184780fe9f9d6f0f72a6cc3faee031e161ccddff2e232be4369fec8cf73cba57
3
+ size 1764633
SoccerTwos/SoccerTwos-999491.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7351fede99366b78eb139acd54c81d112b7d9a25edc05f5919c4254d530c61c1
3
+ size 28422481
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d34843140369db345028a839431952bde94a27b0dc87a1df92f8300bb9fe9f6c
3
  size 28422481
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34c4451c24392d87e1f15bc461d130440913ac02b65dddd82dda8babfb526e97
3
  size 28422481
SoccerTwos/events.out.tfevents.1684022101.pytorch-1-13-gpu-py-ml-g4dn-xlarge-527e33c924f34a0c20ebf51c5b64.1151.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c960750f06b5e3c3d41064187d62123eb1803aa227774ab00dac764fe43b347d
3
+ size 616744
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "constant", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 600000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 100000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/SoccerTwos/SoccerTwos.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "constant", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 1200000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 100000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/SoccerTwos/SoccerTwos.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -37,7 +37,7 @@ behaviors:
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
- max_steps: 600000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
 
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
+ max_steps: 1200000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
run_logs/Player-0.log CHANGED
@@ -31,7 +31,7 @@ ALSA lib pcm.c:2666:(snd_pcm_open_noupdate) Unknown PCM default
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
- - Completed reload, in 0.300 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -56,16 +56,39 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
56
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
57
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
58
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
59
- UnloadTime: 0.662147 ms
60
  Registered Communicator in Agent.
61
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
62
  requesting resize 84 x 84
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  Setting up 2 worker threads for Enlighten.
64
  Memory Statistics:
65
  [ALLOC_TEMP_TLS] TLS Allocator
66
  StackAllocators :
67
  [ALLOC_TEMP_MAIN]
68
- Peak usage frame count: [2.0 MB-4.0 MB]: 1 frames
69
  Initial Block Size 4.0 MB
70
  Current Block Size 4.0 MB
71
  Peak Allocated Bytes 2.1 MB
@@ -197,16 +220,16 @@ Memory Statistics:
197
  Used Block count 1
198
  Peak Allocated bytes 1.0 MB
199
  [ALLOC_DEFAULT_MAIN]
200
- Peak usage frame count: [4.0 MB-8.0 MB]: 1 frames
201
  Requested Block Size 16.0 MB
202
  Peak Block count 1
203
- Peak Allocated memory 4.7 MB
204
  Peak Large allocation bytes 0 B
205
  [ALLOC_DEFAULT_THREAD]
206
- Peak usage frame count: [16.0 MB-32.0 MB]: 1 frames
207
  Requested Block Size 16.0 MB
208
  Peak Block count 1
209
- Peak Allocated memory 17.5 MB
210
  Peak Large allocation bytes 16.0 MB
211
  [ALLOC_TEMP_JOB_1_FRAME]
212
  Initial Block Size 2.0 MB
@@ -220,7 +243,7 @@ Memory Statistics:
220
  Overflow Count (full) 0
221
  [ALLOC_TEMP_JOB_4_FRAMES (JobTemp)]
222
  Initial Block Size 2.0 MB
223
- Used Block Count 1
224
  Overflow Count (too large) 0
225
  Overflow Count (full) 0
226
  [ALLOC_TEMP_JOB_ASYNC (Background)]
@@ -235,13 +258,13 @@ Memory Statistics:
235
  Used Block count 1
236
  Peak Allocated bytes 1.0 MB
237
  [ALLOC_GFX_MAIN]
238
- Peak usage frame count: [64.0 KB-128.0 KB]: 1 frames
239
  Requested Block Size 16.0 MB
240
  Peak Block count 1
241
  Peak Allocated memory 65.6 KB
242
  Peak Large allocation bytes 0 B
243
  [ALLOC_GFX_THREAD]
244
- Peak usage frame count: [128.0 KB-256.0 KB]: 1 frames
245
  Requested Block Size 16.0 MB
246
  Peak Block count 1
247
  Peak Allocated memory 173.5 KB
@@ -253,13 +276,13 @@ Memory Statistics:
253
  Used Block count 1
254
  Peak Allocated bytes 1.0 MB
255
  [ALLOC_CACHEOBJECTS_MAIN]
256
- Peak usage frame count: [0.5 MB-1.0 MB]: 1 frames
257
  Requested Block Size 4.0 MB
258
  Peak Block count 1
259
  Peak Allocated memory 0.6 MB
260
  Peak Large allocation bytes 0 B
261
  [ALLOC_CACHEOBJECTS_THREAD]
262
- Peak usage frame count: [4.0 MB-8.0 MB]: 1 frames
263
  Requested Block Size 4.0 MB
264
  Peak Block count 2
265
  Peak Allocated memory 4.4 MB
@@ -271,13 +294,13 @@ Memory Statistics:
271
  Used Block count 1
272
  Peak Allocated bytes 1.0 MB
273
  [ALLOC_TYPETREE_MAIN]
274
- Peak usage frame count: [0-1.0 KB]: 1 frames
275
  Requested Block Size 2.0 MB
276
  Peak Block count 1
277
  Peak Allocated memory 1.0 KB
278
  Peak Large allocation bytes 0 B
279
  [ALLOC_TYPETREE_THREAD]
280
- Peak usage frame count: [2.0 KB-4.0 KB]: 1 frames
281
  Requested Block Size 2.0 MB
282
  Peak Block count 1
283
  Peak Allocated memory 2.2 KB
 
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
+ - Completed reload, in 0.304 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
56
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
57
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
58
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
59
+ UnloadTime: 0.611657 ms
60
  Registered Communicator in Agent.
61
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
62
  requesting resize 84 x 84
63
+ TOO LONG
64
+ TOO LONG
65
+ TOO LONG
66
+ TOO LONG
67
+ TOO LONG
68
+ TOO LONG
69
+ TOO LONG
70
+ TOO LONG
71
+ TOO LONG
72
+ TOO LONG
73
+ TOO LONG
74
+ TOO LONG
75
+ TOO LONG
76
+ TOO LONG
77
+ TOO LONG
78
+ TOO LONG
79
+ TOO LONG
80
+ TOO LONG
81
+ TOO LONG
82
+ TOO LONG
83
+ TOO LONG
84
+ TOO LONG
85
+ TOO LONG
86
  Setting up 2 worker threads for Enlighten.
87
  Memory Statistics:
88
  [ALLOC_TEMP_TLS] TLS Allocator
89
  StackAllocators :
90
  [ALLOC_TEMP_MAIN]
91
+ Peak usage frame count: [8.0 KB-16.0 KB]: 11539 frames, [2.0 MB-4.0 MB]: 1 frames
92
  Initial Block Size 4.0 MB
93
  Current Block Size 4.0 MB
94
  Peak Allocated Bytes 2.1 MB
 
220
  Used Block count 1
221
  Peak Allocated bytes 1.0 MB
222
  [ALLOC_DEFAULT_MAIN]
223
+ Peak usage frame count: [4.0 MB-8.0 MB]: 11540 frames
224
  Requested Block Size 16.0 MB
225
  Peak Block count 1
226
+ Peak Allocated memory 4.9 MB
227
  Peak Large allocation bytes 0 B
228
  [ALLOC_DEFAULT_THREAD]
229
+ Peak usage frame count: [16.0 MB-32.0 MB]: 11540 frames
230
  Requested Block Size 16.0 MB
231
  Peak Block count 1
232
+ Peak Allocated memory 17.3 MB
233
  Peak Large allocation bytes 16.0 MB
234
  [ALLOC_TEMP_JOB_1_FRAME]
235
  Initial Block Size 2.0 MB
 
243
  Overflow Count (full) 0
244
  [ALLOC_TEMP_JOB_4_FRAMES (JobTemp)]
245
  Initial Block Size 2.0 MB
246
+ Used Block Count 2
247
  Overflow Count (too large) 0
248
  Overflow Count (full) 0
249
  [ALLOC_TEMP_JOB_ASYNC (Background)]
 
258
  Used Block count 1
259
  Peak Allocated bytes 1.0 MB
260
  [ALLOC_GFX_MAIN]
261
+ Peak usage frame count: [32.0 KB-64.0 KB]: 11539 frames, [64.0 KB-128.0 KB]: 1 frames
262
  Requested Block Size 16.0 MB
263
  Peak Block count 1
264
  Peak Allocated memory 65.6 KB
265
  Peak Large allocation bytes 0 B
266
  [ALLOC_GFX_THREAD]
267
+ Peak usage frame count: [128.0 KB-256.0 KB]: 11540 frames
268
  Requested Block Size 16.0 MB
269
  Peak Block count 1
270
  Peak Allocated memory 173.5 KB
 
276
  Used Block count 1
277
  Peak Allocated bytes 1.0 MB
278
  [ALLOC_CACHEOBJECTS_MAIN]
279
+ Peak usage frame count: [0.5 MB-1.0 MB]: 11540 frames
280
  Requested Block Size 4.0 MB
281
  Peak Block count 1
282
  Peak Allocated memory 0.6 MB
283
  Peak Large allocation bytes 0 B
284
  [ALLOC_CACHEOBJECTS_THREAD]
285
+ Peak usage frame count: [0.5 MB-1.0 MB]: 11539 frames, [4.0 MB-8.0 MB]: 1 frames
286
  Requested Block Size 4.0 MB
287
  Peak Block count 2
288
  Peak Allocated memory 4.4 MB
 
294
  Used Block count 1
295
  Peak Allocated bytes 1.0 MB
296
  [ALLOC_TYPETREE_MAIN]
297
+ Peak usage frame count: [0-1.0 KB]: 11540 frames
298
  Requested Block Size 2.0 MB
299
  Peak Block count 1
300
  Peak Allocated memory 1.0 KB
301
  Peak Large allocation bytes 0 B
302
  [ALLOC_TYPETREE_THREAD]
303
+ Peak usage frame count: [1.0 KB-2.0 KB]: 11539 frames, [2.0 KB-4.0 KB]: 1 frames
304
  Requested Block Size 2.0 MB
305
  Peak Block count 1
306
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -1,8 +1,202 @@
1
  {
2
  "name": "root",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "metadata": {
4
  "timer_format_version": "0.1.0",
5
- "start_time_seconds": "1684021312",
6
  "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:39:03) \n[GCC 11.3.0]",
7
  "command_line_arguments": "/opt/conda/bin/mlagents-learn ./config_file_soccer_twos/config_soccer_twos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
8
  "mlagents_version": "0.31.0.dev0",
@@ -10,41 +204,217 @@
10
  "communication_protocol_version": "1.5.0",
11
  "pytorch_version": "1.11.0+cu102",
12
  "numpy_version": "1.21.2",
13
- "end_time_seconds": "1684021317"
14
  },
15
- "total": 5.203121796999767,
16
  "count": 1,
17
- "self": 0.39114949900067586,
18
  "children": {
19
  "run_training.setup": {
20
- "total": 0.07265499399909459,
21
  "count": 1,
22
- "self": 0.07265499399909459
23
  },
24
  "TrainerController.start_learning": {
25
- "total": 4.7393173039999965,
26
  "count": 1,
27
- "self": 0.00010848599958990235,
28
  "children": {
29
  "TrainerController._reset_env": {
30
- "total": 4.050190531001135,
31
- "count": 1,
32
- "self": 4.050190531001135
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  },
34
  "trainer_threads": {
35
- "total": 1.3959997886558995e-06,
36
  "count": 1,
37
- "self": 1.3959997886558995e-06
38
  },
39
  "TrainerController._save_models": {
40
- "total": 0.6890168909994827,
41
  "count": 1,
42
- "self": 0.054944899000474834,
43
  "children": {
44
  "RLTrainer._checkpoint": {
45
- "total": 0.6340719919990079,
46
  "count": 1,
47
- "self": 0.6340719919990079
48
  }
49
  }
50
  }
 
1
  {
2
  "name": "root",
3
+ "gauges": {
4
+ "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 2.733802556991577,
6
+ "min": 2.733802556991577,
7
+ "max": 3.1146745681762695,
8
+ "count": 60
9
+ },
10
+ "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 54676.05078125,
12
+ "min": 39622.75,
13
+ "max": 92614.453125,
14
+ "count": 60
15
+ },
16
+ "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 82.61016949152543,
18
+ "min": 69.67605633802818,
19
+ "max": 382.84615384615387,
20
+ "count": 60
21
+ },
22
+ "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 19496.0,
24
+ "min": 16932.0,
25
+ "max": 23032.0,
26
+ "count": 60
27
+ },
28
+ "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1294.8368885711739,
30
+ "min": 1229.6291367571866,
31
+ "max": 1296.6227957304347,
32
+ "count": 60
33
+ },
34
+ "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 152790.75285139852,
36
+ "min": 27249.504481312182,
37
+ "max": 181303.85226480005,
38
+ "count": 60
39
+ },
40
+ "SoccerTwos.Step.mean": {
41
+ "value": 1199974.0,
42
+ "min": 609553.0,
43
+ "max": 1199974.0,
44
+ "count": 60
45
+ },
46
+ "SoccerTwos.Step.sum": {
47
+ "value": 1199974.0,
48
+ "min": 609553.0,
49
+ "max": 1199974.0,
50
+ "count": 60
51
+ },
52
+ "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": -0.006674866657704115,
54
+ "min": -0.04357234388589859,
55
+ "max": 0.07854899019002914,
56
+ "count": 60
57
+ },
58
+ "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": -0.7876342535018921,
60
+ "min": -4.531523704528809,
61
+ "max": 8.404742240905762,
62
+ "count": 60
63
+ },
64
+ "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": -0.008247418329119682,
66
+ "min": -0.041314251720905304,
67
+ "max": 0.08966611325740814,
68
+ "count": 60
69
+ },
70
+ "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": -0.9731953144073486,
72
+ "min": -4.296682357788086,
73
+ "max": 8.482354164123535,
74
+ "count": 60
75
+ },
76
+ "SoccerTwos.Environment.CumulativeReward.mean": {
77
+ "value": 0.0,
78
+ "min": 0.0,
79
+ "max": 0.0,
80
+ "count": 60
81
+ },
82
+ "SoccerTwos.Environment.CumulativeReward.sum": {
83
+ "value": 0.0,
84
+ "min": 0.0,
85
+ "max": 0.0,
86
+ "count": 60
87
+ },
88
+ "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
+ "value": -0.24403559454416823,
90
+ "min": -0.6071574459684655,
91
+ "max": 0.3048800006508827,
92
+ "count": 60
93
+ },
94
+ "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
+ "value": -28.796200156211853,
96
+ "min": -28.796200156211853,
97
+ "max": 20.276399731636047,
98
+ "count": 60
99
+ },
100
+ "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
+ "value": -0.24403559454416823,
102
+ "min": -0.6071574459684655,
103
+ "max": 0.3048800006508827,
104
+ "count": 60
105
+ },
106
+ "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
+ "value": -28.796200156211853,
108
+ "min": -28.796200156211853,
109
+ "max": 20.276399731636047,
110
+ "count": 60
111
+ },
112
+ "SoccerTwos.IsTraining.mean": {
113
+ "value": 1.0,
114
+ "min": 1.0,
115
+ "max": 1.0,
116
+ "count": 60
117
+ },
118
+ "SoccerTwos.IsTraining.sum": {
119
+ "value": 1.0,
120
+ "min": 1.0,
121
+ "max": 1.0,
122
+ "count": 60
123
+ },
124
+ "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.021856299584032967,
126
+ "min": 0.012633150363884245,
127
+ "max": 0.022237880590061345,
128
+ "count": 28
129
+ },
130
+ "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.021856299584032967,
132
+ "min": 0.012633150363884245,
133
+ "max": 0.022237880590061345,
134
+ "count": 28
135
+ },
136
+ "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.054838288699587186,
138
+ "min": 0.01981707736849785,
139
+ "max": 0.05926394251485666,
140
+ "count": 28
141
+ },
142
+ "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.054838288699587186,
144
+ "min": 0.01981707736849785,
145
+ "max": 0.05926394251485666,
146
+ "count": 28
147
+ },
148
+ "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.056269766638676326,
150
+ "min": 0.020496825998028118,
151
+ "max": 0.061689524973432226,
152
+ "count": 28
153
+ },
154
+ "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.056269766638676326,
156
+ "min": 0.020496825998028118,
157
+ "max": 0.061689524973432226,
158
+ "count": 28
159
+ },
160
+ "SoccerTwos.Policy.LearningRate.mean": {
161
+ "value": 0.0003,
162
+ "min": 0.0003,
163
+ "max": 0.0003,
164
+ "count": 28
165
+ },
166
+ "SoccerTwos.Policy.LearningRate.sum": {
167
+ "value": 0.0003,
168
+ "min": 0.0003,
169
+ "max": 0.0003,
170
+ "count": 28
171
+ },
172
+ "SoccerTwos.Policy.Epsilon.mean": {
173
+ "value": 0.20000000000000007,
174
+ "min": 0.20000000000000007,
175
+ "max": 0.20000000000000007,
176
+ "count": 28
177
+ },
178
+ "SoccerTwos.Policy.Epsilon.sum": {
179
+ "value": 0.20000000000000007,
180
+ "min": 0.20000000000000007,
181
+ "max": 0.20000000000000007,
182
+ "count": 28
183
+ },
184
+ "SoccerTwos.Policy.Beta.mean": {
185
+ "value": 0.005000000000000001,
186
+ "min": 0.005000000000000001,
187
+ "max": 0.005000000000000001,
188
+ "count": 28
189
+ },
190
+ "SoccerTwos.Policy.Beta.sum": {
191
+ "value": 0.005000000000000001,
192
+ "min": 0.005000000000000001,
193
+ "max": 0.005000000000000001,
194
+ "count": 28
195
+ }
196
+ },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1684022100",
200
  "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:39:03) \n[GCC 11.3.0]",
201
  "command_line_arguments": "/opt/conda/bin/mlagents-learn ./config_file_soccer_twos/config_soccer_twos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
202
  "mlagents_version": "0.31.0.dev0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0+cu102",
206
  "numpy_version": "1.21.2",
207
+ "end_time_seconds": "1684023102"
208
  },
209
+ "total": 1001.5571157470004,
210
  "count": 1,
211
+ "self": 0.3420637059989531,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.07226520600124786,
215
  "count": 1,
216
+ "self": 0.07226520600124786
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 1001.1427868350002,
220
  "count": 1,
221
+ "self": 0.7613444388116477,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 4.240916573002323,
225
+ "count": 7,
226
+ "self": 4.240916573002323
227
+ },
228
+ "TrainerController.advance": {
229
+ "total": 995.5049644211849,
230
+ "count": 40161,
231
+ "self": 0.8210167502202239,
232
+ "children": {
233
+ "env_step": {
234
+ "total": 762.4870510351793,
235
+ "count": 40161,
236
+ "self": 598.2191287610458,
237
+ "children": {
238
+ "SubprocessEnvManager._take_step": {
239
+ "total": 163.81086692280587,
240
+ "count": 40161,
241
+ "self": 5.853933413649429,
242
+ "children": {
243
+ "TorchPolicy.evaluate": {
244
+ "total": 157.95693350915644,
245
+ "count": 76930,
246
+ "self": 157.95693350915644
247
+ }
248
+ }
249
+ },
250
+ "workers": {
251
+ "total": 0.4570553513276536,
252
+ "count": 40161,
253
+ "self": 0.0,
254
+ "children": {
255
+ "worker_root": {
256
+ "total": 998.9299083149399,
257
+ "count": 40161,
258
+ "is_parallel": true,
259
+ "self": 496.6829484137961,
260
+ "children": {
261
+ "run_training.setup": {
262
+ "total": 0.0,
263
+ "count": 0,
264
+ "is_parallel": true,
265
+ "self": 0.0,
266
+ "children": {
267
+ "steps_from_proto": {
268
+ "total": 0.002802859000439639,
269
+ "count": 2,
270
+ "is_parallel": true,
271
+ "self": 0.0007083620021148818,
272
+ "children": {
273
+ "_process_rank_one_or_two_observation": {
274
+ "total": 0.0020944969983247574,
275
+ "count": 8,
276
+ "is_parallel": true,
277
+ "self": 0.0020944969983247574
278
+ }
279
+ }
280
+ },
281
+ "UnityEnvironment.step": {
282
+ "total": 0.03400731399960932,
283
+ "count": 1,
284
+ "is_parallel": true,
285
+ "self": 0.0011763070015149424,
286
+ "children": {
287
+ "UnityEnvironment._generate_step_input": {
288
+ "total": 0.0004787719990417827,
289
+ "count": 1,
290
+ "is_parallel": true,
291
+ "self": 0.0004787719990417827
292
+ },
293
+ "communicator.exchange": {
294
+ "total": 0.028489536000051885,
295
+ "count": 1,
296
+ "is_parallel": true,
297
+ "self": 0.028489536000051885
298
+ },
299
+ "steps_from_proto": {
300
+ "total": 0.0038626989990007132,
301
+ "count": 2,
302
+ "is_parallel": true,
303
+ "self": 0.0007088879956427263,
304
+ "children": {
305
+ "_process_rank_one_or_two_observation": {
306
+ "total": 0.003153811003357987,
307
+ "count": 8,
308
+ "is_parallel": true,
309
+ "self": 0.003153811003357987
310
+ }
311
+ }
312
+ }
313
+ }
314
+ }
315
+ }
316
+ },
317
+ "steps_from_proto": {
318
+ "total": 0.012707542000498506,
319
+ "count": 12,
320
+ "is_parallel": true,
321
+ "self": 0.002516350001315004,
322
+ "children": {
323
+ "_process_rank_one_or_two_observation": {
324
+ "total": 0.010191191999183502,
325
+ "count": 48,
326
+ "is_parallel": true,
327
+ "self": 0.010191191999183502
328
+ }
329
+ }
330
+ },
331
+ "UnityEnvironment.step": {
332
+ "total": 502.2342523591433,
333
+ "count": 40160,
334
+ "is_parallel": true,
335
+ "self": 27.97795652955938,
336
+ "children": {
337
+ "UnityEnvironment._generate_step_input": {
338
+ "total": 17.989639229994282,
339
+ "count": 40160,
340
+ "is_parallel": true,
341
+ "self": 17.989639229994282
342
+ },
343
+ "communicator.exchange": {
344
+ "total": 366.7374251978308,
345
+ "count": 40160,
346
+ "is_parallel": true,
347
+ "self": 366.7374251978308
348
+ },
349
+ "steps_from_proto": {
350
+ "total": 89.5292314017588,
351
+ "count": 80320,
352
+ "is_parallel": true,
353
+ "self": 16.533958772148253,
354
+ "children": {
355
+ "_process_rank_one_or_two_observation": {
356
+ "total": 72.99527262961055,
357
+ "count": 321280,
358
+ "is_parallel": true,
359
+ "self": 72.99527262961055
360
+ }
361
+ }
362
+ }
363
+ }
364
+ }
365
+ }
366
+ }
367
+ }
368
+ }
369
+ }
370
+ },
371
+ "trainer_advance": {
372
+ "total": 232.19689663578538,
373
+ "count": 40161,
374
+ "self": 6.532605739683277,
375
+ "children": {
376
+ "process_trajectory": {
377
+ "total": 75.352097508101,
378
+ "count": 40161,
379
+ "self": 74.74050682209963,
380
+ "children": {
381
+ "RLTrainer._checkpoint": {
382
+ "total": 0.6115906860013638,
383
+ "count": 1,
384
+ "self": 0.6115906860013638
385
+ }
386
+ }
387
+ },
388
+ "_update_policy": {
389
+ "total": 150.3121933880011,
390
+ "count": 28,
391
+ "self": 92.59276351401058,
392
+ "children": {
393
+ "TorchPOCAOptimizer.update": {
394
+ "total": 57.71942987399052,
395
+ "count": 840,
396
+ "self": 57.71942987399052
397
+ }
398
+ }
399
+ }
400
+ }
401
+ }
402
+ }
403
  },
404
  "trainer_threads": {
405
+ "total": 9.29001544136554e-07,
406
  "count": 1,
407
+ "self": 9.29001544136554e-07
408
  },
409
  "TrainerController._save_models": {
410
+ "total": 0.635560472999714,
411
  "count": 1,
412
+ "self": 0.057611300000644405,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
+ "total": 0.5779491729990696,
416
  "count": 1,
417
+ "self": 0.5779491729990696
418
  }
419
  }
420
  }
run_logs/training_status.json CHANGED
@@ -27,16 +27,34 @@
27
  "auxillary_file_paths": [
28
  "results/SoccerTwos/SoccerTwos/SoccerTwos-600788.pt"
29
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
30
  }
31
  ],
32
- "elo": 1237.2060690468327,
33
  "final_checkpoint": {
34
- "steps": 600788,
35
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
36
- "reward": null,
37
- "creation_time": 1684021317.5136611,
38
  "auxillary_file_paths": [
39
- "results/SoccerTwos/SoccerTwos/SoccerTwos-600788.pt"
40
  ]
41
  }
42
  },
 
27
  "auxillary_file_paths": [
28
  "results/SoccerTwos/SoccerTwos/SoccerTwos-600788.pt"
29
  ]
30
+ },
31
+ {
32
+ "steps": 999491,
33
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-999491.onnx",
34
+ "reward": 0.0,
35
+ "creation_time": 1684022771.5567825,
36
+ "auxillary_file_paths": [
37
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-999491.pt"
38
+ ]
39
+ },
40
+ {
41
+ "steps": 1200138,
42
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-1200138.onnx",
43
+ "reward": 0.0,
44
+ "creation_time": 1684023102.0223331,
45
+ "auxillary_file_paths": [
46
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-1200138.pt"
47
+ ]
48
  }
49
  ],
50
+ "elo": 1292.2213924352507,
51
  "final_checkpoint": {
52
+ "steps": 1200138,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
+ "reward": 0.0,
55
+ "creation_time": 1684023102.0223331,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-1200138.pt"
58
  ]
59
  }
60
  },