felixdae commited on
Commit
37b6d51
1 Parent(s): 97eb276

First Push

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a33abf63337f2ed65dd7e39237a8b2c4e25b2d5e182933577c9d174e30b9bf69
3
  size 1764633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e75e17c630eb15700d03b89761624b07eafd3e65504fd8ddea492326c8c8011f
3
  size 1764633
SoccerTwos/SoccerTwos-2794.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e75e17c630eb15700d03b89761624b07eafd3e65504fd8ddea492326c8c8011f
3
+ size 1764633
SoccerTwos/SoccerTwos-2794.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a33ed152196abb0ac1e7422fa71300bacb7bcebc4d85484d46fbe5140d9dee6e
3
+ size 9478265
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a239fb80d7d4091d1581183ede1c9e245c99bd3a13abe3882dab5f8d6f9c91aa
3
- size 28421137
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a33ed152196abb0ac1e7422fa71300bacb7bcebc4d85484d46fbe5140d9dee6e
3
+ size 9478265
SoccerTwos/events.out.tfevents.1686748708.d37089838a3f.6889.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2725adab92e59e7bfc546cb5e461117961ce54d42e7062f013a33c9651a72316
3
+ size 1240
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "constant", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 50000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 200000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/SoccerTwos.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "constant", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 5000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 200000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/SoccerTwos.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -37,7 +37,7 @@ behaviors:
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
- max_steps: 50000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
 
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
+ max_steps: 5000000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
run_logs/Player-0.log CHANGED
@@ -31,7 +31,7 @@ ALSA lib pcm.c:2642:(snd_pcm_open_noupdate) Unknown PCM default
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
- - Completed reload, in 0.719 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -56,36 +56,16 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
56
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
57
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
58
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
59
- UnloadTime: 1.110830 ms
60
  Registered Communicator in Agent.
61
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
62
  requesting resize 84 x 84
63
- TOO LONG
64
- TOO LONG
65
- TOO LONG
66
- TOO LONG
67
- TOO LONG
68
- TOO LONG
69
- TOO LONG
70
- TOO LONG
71
- TOO LONG
72
- TOO LONG
73
- TOO LONG
74
- TOO LONG
75
- TOO LONG
76
- TOO LONG
77
- TOO LONG
78
- TOO LONG
79
- TOO LONG
80
- TOO LONG
81
- TOO LONG
82
- TOO LONG
83
  Setting up 1 worker threads for Enlighten.
84
  Memory Statistics:
85
  [ALLOC_TEMP_TLS] TLS Allocator
86
  StackAllocators :
87
  [ALLOC_TEMP_MAIN]
88
- Peak usage frame count: [8.0 KB-16.0 KB]: 1153 frames, [2.0 MB-4.0 MB]: 1 frames
89
  Initial Block Size 4.0 MB
90
  Current Block Size 4.0 MB
91
  Peak Allocated Bytes 2.1 MB
@@ -207,16 +187,16 @@ Memory Statistics:
207
  Used Block count 1
208
  Peak Allocated bytes 1.0 MB
209
  [ALLOC_DEFAULT_MAIN]
210
- Peak usage frame count: [4.0 MB-8.0 MB]: 1154 frames
211
  Requested Block Size 16.0 MB
212
  Peak Block count 1
213
- Peak Allocated memory 4.7 MB
214
  Peak Large allocation bytes 0 B
215
  [ALLOC_DEFAULT_THREAD]
216
- Peak usage frame count: [16.0 MB-32.0 MB]: 1154 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
- Peak Allocated memory 17.5 MB
220
  Peak Large allocation bytes 16.0 MB
221
  [ALLOC_TEMP_JOB_1_FRAME]
222
  Initial Block Size 2.0 MB
@@ -245,13 +225,13 @@ Memory Statistics:
245
  Used Block count 1
246
  Peak Allocated bytes 1.0 MB
247
  [ALLOC_GFX_MAIN]
248
- Peak usage frame count: [32.0 KB-64.0 KB]: 1153 frames, [64.0 KB-128.0 KB]: 1 frames
249
  Requested Block Size 16.0 MB
250
  Peak Block count 1
251
  Peak Allocated memory 65.6 KB
252
  Peak Large allocation bytes 0 B
253
  [ALLOC_GFX_THREAD]
254
- Peak usage frame count: [128.0 KB-256.0 KB]: 1154 frames
255
  Requested Block Size 16.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 173.5 KB
@@ -263,16 +243,16 @@ Memory Statistics:
263
  Used Block count 1
264
  Peak Allocated bytes 1.0 MB
265
  [ALLOC_CACHEOBJECTS_MAIN]
266
- Peak usage frame count: [0.5 MB-1.0 MB]: 1154 frames
267
  Requested Block Size 4.0 MB
268
  Peak Block count 1
269
  Peak Allocated memory 0.6 MB
270
  Peak Large allocation bytes 0 B
271
  [ALLOC_CACHEOBJECTS_THREAD]
272
- Peak usage frame count: [0.5 MB-1.0 MB]: 1153 frames, [2.0 MB-4.0 MB]: 1 frames
273
  Requested Block Size 4.0 MB
274
- Peak Block count 1
275
- Peak Allocated memory 4.0 MB
276
  Peak Large allocation bytes 0 B
277
  [ALLOC_TYPETREE] Dual Thread Allocator
278
  Peak main deferred allocation count 0
@@ -281,13 +261,13 @@ Memory Statistics:
281
  Used Block count 1
282
  Peak Allocated bytes 1.0 MB
283
  [ALLOC_TYPETREE_MAIN]
284
- Peak usage frame count: [0-1.0 KB]: 1154 frames
285
  Requested Block Size 2.0 MB
286
  Peak Block count 1
287
  Peak Allocated memory 1.0 KB
288
  Peak Large allocation bytes 0 B
289
  [ALLOC_TYPETREE_THREAD]
290
- Peak usage frame count: [1.0 KB-2.0 KB]: 1153 frames, [2.0 KB-4.0 KB]: 1 frames
291
  Requested Block Size 2.0 MB
292
  Peak Block count 1
293
  Peak Allocated memory 2.2 KB
 
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
+ - Completed reload, in 0.874 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
56
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
57
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
58
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
59
+ UnloadTime: 0.896118 ms
60
  Registered Communicator in Agent.
61
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
62
  requesting resize 84 x 84
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  Setting up 1 worker threads for Enlighten.
64
  Memory Statistics:
65
  [ALLOC_TEMP_TLS] TLS Allocator
66
  StackAllocators :
67
  [ALLOC_TEMP_MAIN]
68
+ Peak usage frame count: [8.0 KB-16.0 KB]: 235 frames, [2.0 MB-4.0 MB]: 1 frames
69
  Initial Block Size 4.0 MB
70
  Current Block Size 4.0 MB
71
  Peak Allocated Bytes 2.1 MB
 
187
  Used Block count 1
188
  Peak Allocated bytes 1.0 MB
189
  [ALLOC_DEFAULT_MAIN]
190
+ Peak usage frame count: [4.0 MB-8.0 MB]: 236 frames
191
  Requested Block Size 16.0 MB
192
  Peak Block count 1
193
+ Peak Allocated memory 5.0 MB
194
  Peak Large allocation bytes 0 B
195
  [ALLOC_DEFAULT_THREAD]
196
+ Peak usage frame count: [16.0 MB-32.0 MB]: 236 frames
197
  Requested Block Size 16.0 MB
198
  Peak Block count 1
199
+ Peak Allocated memory 17.2 MB
200
  Peak Large allocation bytes 16.0 MB
201
  [ALLOC_TEMP_JOB_1_FRAME]
202
  Initial Block Size 2.0 MB
 
225
  Used Block count 1
226
  Peak Allocated bytes 1.0 MB
227
  [ALLOC_GFX_MAIN]
228
+ Peak usage frame count: [32.0 KB-64.0 KB]: 235 frames, [64.0 KB-128.0 KB]: 1 frames
229
  Requested Block Size 16.0 MB
230
  Peak Block count 1
231
  Peak Allocated memory 65.6 KB
232
  Peak Large allocation bytes 0 B
233
  [ALLOC_GFX_THREAD]
234
+ Peak usage frame count: [128.0 KB-256.0 KB]: 236 frames
235
  Requested Block Size 16.0 MB
236
  Peak Block count 1
237
  Peak Allocated memory 173.5 KB
 
243
  Used Block count 1
244
  Peak Allocated bytes 1.0 MB
245
  [ALLOC_CACHEOBJECTS_MAIN]
246
+ Peak usage frame count: [0.5 MB-1.0 MB]: 236 frames
247
  Requested Block Size 4.0 MB
248
  Peak Block count 1
249
  Peak Allocated memory 0.6 MB
250
  Peak Large allocation bytes 0 B
251
  [ALLOC_CACHEOBJECTS_THREAD]
252
+ Peak usage frame count: [0.5 MB-1.0 MB]: 235 frames, [4.0 MB-8.0 MB]: 1 frames
253
  Requested Block Size 4.0 MB
254
+ Peak Block count 2
255
+ Peak Allocated memory 4.5 MB
256
  Peak Large allocation bytes 0 B
257
  [ALLOC_TYPETREE] Dual Thread Allocator
258
  Peak main deferred allocation count 0
 
261
  Used Block count 1
262
  Peak Allocated bytes 1.0 MB
263
  [ALLOC_TYPETREE_MAIN]
264
+ Peak usage frame count: [0-1.0 KB]: 236 frames
265
  Requested Block Size 2.0 MB
266
  Peak Block count 1
267
  Peak Allocated memory 1.0 KB
268
  Peak Large allocation bytes 0 B
269
  [ALLOC_TYPETREE_THREAD]
270
+ Peak usage frame count: [1.0 KB-2.0 KB]: 235 frames, [2.0 KB-4.0 KB]: 1 frames
271
  Requested Block Size 2.0 MB
272
  Peak Block count 1
273
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -1,202 +1,8 @@
1
  {
2
  "name": "root",
3
- "gauges": {
4
- "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 3.28265643119812,
6
- "min": 3.28265643119812,
7
- "max": 3.295696258544922,
8
- "count": 5
9
- },
10
- "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 88763.03125,
12
- "min": 29053.037109375,
13
- "max": 105462.21875,
14
- "count": 5
15
- },
16
- "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 754.6666666666666,
18
- "min": 668.3333333333334,
19
- "max": 820.1666666666666,
20
- "count": 5
21
- },
22
- "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 18112.0,
24
- "min": 16040.0,
25
- "max": 25180.0,
26
- "count": 5
27
- },
28
- "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1198.3874877821277,
30
- "min": 1198.0911687838272,
31
- "max": 1201.004267761486,
32
- "count": 5
33
- },
34
- "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 4793.549951128511,
36
- "min": 4793.549951128511,
37
- "max": 9608.034142091888,
38
- "count": 5
39
- },
40
- "SoccerTwos.Step.mean": {
41
- "value": 49926.0,
42
- "min": 9608.0,
43
- "max": 49926.0,
44
- "count": 5
45
- },
46
- "SoccerTwos.Step.sum": {
47
- "value": 49926.0,
48
- "min": 9608.0,
49
- "max": 49926.0,
50
- "count": 5
51
- },
52
- "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": 0.06536506116390228,
54
- "min": 0.06536506116390228,
55
- "max": 0.10138500481843948,
56
- "count": 5
57
- },
58
- "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": 0.8497458100318909,
60
- "min": 0.8497458100318909,
61
- "max": 1.5207037925720215,
62
- "count": 5
63
- },
64
- "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": 0.06429646909236908,
66
- "min": 0.06429646909236908,
67
- "max": 0.10138337314128876,
68
- "count": 5
69
- },
70
- "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": 0.8358541131019592,
72
- "min": 0.8358541131019592,
73
- "max": 1.520679235458374,
74
- "count": 5
75
- },
76
- "SoccerTwos.Environment.CumulativeReward.mean": {
77
- "value": 0.0,
78
- "min": 0.0,
79
- "max": 0.0,
80
- "count": 5
81
- },
82
- "SoccerTwos.Environment.CumulativeReward.sum": {
83
- "value": 0.0,
84
- "min": 0.0,
85
- "max": 0.0,
86
- "count": 5
87
- },
88
- "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": -0.04378461837768555,
90
- "min": -0.25,
91
- "max": -0.04378461837768555,
92
- "count": 5
93
- },
94
- "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": -0.5692000389099121,
96
- "min": -3.0648000240325928,
97
- "max": -0.5692000389099121,
98
- "count": 5
99
- },
100
- "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": -0.04378461837768555,
102
- "min": -0.25,
103
- "max": -0.04378461837768555,
104
- "count": 5
105
- },
106
- "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": -0.5692000389099121,
108
- "min": -3.0648000240325928,
109
- "max": -0.5692000389099121,
110
- "count": 5
111
- },
112
- "SoccerTwos.IsTraining.mean": {
113
- "value": 1.0,
114
- "min": 1.0,
115
- "max": 1.0,
116
- "count": 5
117
- },
118
- "SoccerTwos.IsTraining.sum": {
119
- "value": 1.0,
120
- "min": 1.0,
121
- "max": 1.0,
122
- "count": 5
123
- },
124
- "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.018575048559190083,
126
- "min": 0.018208359370085723,
127
- "max": 0.018575048559190083,
128
- "count": 2
129
- },
130
- "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.018575048559190083,
132
- "min": 0.018208359370085723,
133
- "max": 0.018575048559190083,
134
- "count": 2
135
- },
136
- "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.004095277213491499,
138
- "min": 0.004095277213491499,
139
- "max": 0.005249080806970596,
140
- "count": 2
141
- },
142
- "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.004095277213491499,
144
- "min": 0.004095277213491499,
145
- "max": 0.005249080806970596,
146
- "count": 2
147
- },
148
- "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.0041288621801262105,
150
- "min": 0.0041288621801262105,
151
- "max": 0.004664750932715833,
152
- "count": 2
153
- },
154
- "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.0041288621801262105,
156
- "min": 0.0041288621801262105,
157
- "max": 0.004664750932715833,
158
- "count": 2
159
- },
160
- "SoccerTwos.Policy.LearningRate.mean": {
161
- "value": 0.0003,
162
- "min": 0.0003,
163
- "max": 0.0003,
164
- "count": 2
165
- },
166
- "SoccerTwos.Policy.LearningRate.sum": {
167
- "value": 0.0003,
168
- "min": 0.0003,
169
- "max": 0.0003,
170
- "count": 2
171
- },
172
- "SoccerTwos.Policy.Epsilon.mean": {
173
- "value": 0.20000000000000007,
174
- "min": 0.20000000000000007,
175
- "max": 0.20000000000000007,
176
- "count": 2
177
- },
178
- "SoccerTwos.Policy.Epsilon.sum": {
179
- "value": 0.20000000000000007,
180
- "min": 0.20000000000000007,
181
- "max": 0.20000000000000007,
182
- "count": 2
183
- },
184
- "SoccerTwos.Policy.Beta.mean": {
185
- "value": 0.005000000000000001,
186
- "min": 0.005000000000000001,
187
- "max": 0.005000000000000001,
188
- "count": 2
189
- },
190
- "SoccerTwos.Policy.Beta.sum": {
191
- "value": 0.005000000000000001,
192
- "min": 0.005000000000000001,
193
- "max": 0.005000000000000001,
194
- "count": 2
195
- }
196
- },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1686748280",
200
  "python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
201
  "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
202
  "mlagents_version": "0.31.0.dev0",
@@ -204,59 +10,59 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0+cu102",
206
  "numpy_version": "1.21.2",
207
- "end_time_seconds": "1686748587"
208
  },
209
- "total": 306.415053358,
210
  "count": 1,
211
- "self": 1.121778402000018,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.0938294400000359,
215
  "count": 1,
216
- "self": 0.0938294400000359
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 305.19944551599997,
220
  "count": 1,
221
- "self": 0.15516480800101817,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 2.553870785000072,
225
  "count": 1,
226
- "self": 2.553870785000072
227
  },
228
  "TrainerController.advance": {
229
- "total": 301.9086998829989,
230
- "count": 3860,
231
- "self": 0.16292576999762787,
232
  "children": {
233
  "env_step": {
234
- "total": 135.97904770200284,
235
- "count": 3860,
236
- "self": 111.68265270400366,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 24.206270759996187,
240
- "count": 3860,
241
- "self": 0.9830231650059886,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 23.223247594990198,
245
- "count": 7690,
246
- "self": 23.223247594990198
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 0.09012423800299985,
252
- "count": 3860,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 302.3054157560109,
257
- "count": 3860,
258
  "is_parallel": true,
259
- "self": 209.07813883900644,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
@@ -265,48 +71,48 @@
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
- "total": 0.004979842000011558,
269
  "count": 2,
270
  "is_parallel": true,
271
- "self": 0.001133596999807196,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
- "total": 0.0038462450002043624,
275
  "count": 8,
276
  "is_parallel": true,
277
- "self": 0.0038462450002043624
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
- "total": 0.07906042300010085,
283
  "count": 1,
284
  "is_parallel": true,
285
- "self": 0.0013764720001745445,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
- "total": 0.0010573090000889351,
289
  "count": 1,
290
  "is_parallel": true,
291
- "self": 0.0010573090000889351
292
  },
293
  "communicator.exchange": {
294
- "total": 0.07225851399994099,
295
  "count": 1,
296
  "is_parallel": true,
297
- "self": 0.07225851399994099
298
  },
299
  "steps_from_proto": {
300
- "total": 0.004368127999896387,
301
  "count": 2,
302
  "is_parallel": true,
303
- "self": 0.0008362700000361656,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
- "total": 0.0035318579998602218,
307
  "count": 8,
308
  "is_parallel": true,
309
- "self": 0.0035318579998602218
310
  }
311
  }
312
  }
@@ -315,34 +121,34 @@
315
  }
316
  },
317
  "UnityEnvironment.step": {
318
- "total": 93.22727691700447,
319
- "count": 3859,
320
  "is_parallel": true,
321
- "self": 5.486070685996538,
322
  "children": {
323
  "UnityEnvironment._generate_step_input": {
324
- "total": 2.933011493001686,
325
- "count": 3859,
326
  "is_parallel": true,
327
- "self": 2.933011493001686
328
  },
329
  "communicator.exchange": {
330
- "total": 67.80359328600025,
331
- "count": 3859,
332
  "is_parallel": true,
333
- "self": 67.80359328600025
334
  },
335
  "steps_from_proto": {
336
- "total": 17.004601452006,
337
- "count": 7718,
338
  "is_parallel": true,
339
- "self": 3.028566120012556,
340
  "children": {
341
  "_process_rank_one_or_two_observation": {
342
- "total": 13.976035331993444,
343
- "count": 30872,
344
  "is_parallel": true,
345
- "self": 13.976035331993444
346
  }
347
  }
348
  }
@@ -355,45 +161,33 @@
355
  }
356
  },
357
  "trainer_advance": {
358
- "total": 165.76672641099844,
359
- "count": 3860,
360
- "self": 0.9075624519957728,
361
  "children": {
362
  "process_trajectory": {
363
- "total": 22.190596382002468,
364
- "count": 3860,
365
- "self": 22.190596382002468
366
- },
367
- "_update_policy": {
368
- "total": 142.6685675770002,
369
- "count": 2,
370
- "self": 10.168901357000323,
371
- "children": {
372
- "TorchPOCAOptimizer.update": {
373
- "total": 132.49966621999988,
374
- "count": 60,
375
- "self": 132.49966621999988
376
- }
377
- }
378
  }
379
  }
380
  }
381
  }
382
  },
383
  "trainer_threads": {
384
- "total": 1.6999999843392288e-06,
385
  "count": 1,
386
- "self": 1.6999999843392288e-06
387
  },
388
  "TrainerController._save_models": {
389
- "total": 0.5817083399999774,
390
  "count": 1,
391
- "self": 0.01770135299989306,
392
  "children": {
393
  "RLTrainer._checkpoint": {
394
- "total": 0.5640069870000843,
395
  "count": 1,
396
- "self": 0.5640069870000843
397
  }
398
  }
399
  }
 
1
  {
2
  "name": "root",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "metadata": {
4
  "timer_format_version": "0.1.0",
5
+ "start_time_seconds": "1686748705",
6
  "python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
7
  "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
8
  "mlagents_version": "0.31.0.dev0",
 
10
  "communication_protocol_version": "1.5.0",
11
  "pytorch_version": "1.11.0+cu102",
12
  "numpy_version": "1.21.2",
13
+ "end_time_seconds": "1686748738"
14
  },
15
+ "total": 33.052970894000055,
16
  "count": 1,
17
+ "self": 0.33947862600007284,
18
  "children": {
19
  "run_training.setup": {
20
+ "total": 0.06832204300008016,
21
  "count": 1,
22
+ "self": 0.06832204300008016
23
  },
24
  "TrainerController.start_learning": {
25
+ "total": 32.6451702249999,
26
  "count": 1,
27
+ "self": 0.030823673994973433,
28
  "children": {
29
  "TrainerController._reset_env": {
30
+ "total": 2.2724867280001035,
31
  "count": 1,
32
+ "self": 2.2724867280001035
33
  },
34
  "TrainerController.advance": {
35
+ "total": 29.596817908004823,
36
+ "count": 786,
37
+ "self": 0.03293174200621252,
38
  "children": {
39
  "env_step": {
40
+ "total": 27.952460072998974,
41
+ "count": 786,
42
+ "self": 23.146774284001367,
43
  "children": {
44
  "SubprocessEnvManager._take_step": {
45
+ "total": 4.788731201000019,
46
+ "count": 786,
47
+ "self": 0.2026699519972226,
48
  "children": {
49
  "TorchPolicy.evaluate": {
50
+ "total": 4.586061249002796,
51
+ "count": 1568,
52
+ "self": 4.586061249002796
53
  }
54
  }
55
  },
56
  "workers": {
57
+ "total": 0.016954587997588533,
58
+ "count": 785,
59
  "self": 0.0,
60
  "children": {
61
  "worker_root": {
62
+ "total": 31.7358276460011,
63
+ "count": 785,
64
  "is_parallel": true,
65
+ "self": 12.433781939002301,
66
  "children": {
67
  "run_training.setup": {
68
  "total": 0.0,
 
71
  "self": 0.0,
72
  "children": {
73
  "steps_from_proto": {
74
+ "total": 0.004423301000088031,
75
  "count": 2,
76
  "is_parallel": true,
77
+ "self": 0.0011540060006609565,
78
  "children": {
79
  "_process_rank_one_or_two_observation": {
80
+ "total": 0.003269294999427075,
81
  "count": 8,
82
  "is_parallel": true,
83
+ "self": 0.003269294999427075
84
  }
85
  }
86
  },
87
  "UnityEnvironment.step": {
88
+ "total": 0.05084969499989711,
89
  "count": 1,
90
  "is_parallel": true,
91
+ "self": 0.0013758599998254795,
92
  "children": {
93
  "UnityEnvironment._generate_step_input": {
94
+ "total": 0.0011552159999155265,
95
  "count": 1,
96
  "is_parallel": true,
97
+ "self": 0.0011552159999155265
98
  },
99
  "communicator.exchange": {
100
+ "total": 0.04405214700000215,
101
  "count": 1,
102
  "is_parallel": true,
103
+ "self": 0.04405214700000215
104
  },
105
  "steps_from_proto": {
106
+ "total": 0.0042664720001539536,
107
  "count": 2,
108
  "is_parallel": true,
109
+ "self": 0.0008813620002001699,
110
  "children": {
111
  "_process_rank_one_or_two_observation": {
112
+ "total": 0.0033851099999537837,
113
  "count": 8,
114
  "is_parallel": true,
115
+ "self": 0.0033851099999537837
116
  }
117
  }
118
  }
 
121
  }
122
  },
123
  "UnityEnvironment.step": {
124
+ "total": 19.302045706998797,
125
+ "count": 784,
126
  "is_parallel": true,
127
+ "self": 1.1347571000064818,
128
  "children": {
129
  "UnityEnvironment._generate_step_input": {
130
+ "total": 0.6015711309985363,
131
+ "count": 784,
132
  "is_parallel": true,
133
+ "self": 0.6015711309985363
134
  },
135
  "communicator.exchange": {
136
+ "total": 13.988910074998785,
137
+ "count": 784,
138
  "is_parallel": true,
139
+ "self": 13.988910074998785
140
  },
141
  "steps_from_proto": {
142
+ "total": 3.576807400994994,
143
+ "count": 1568,
144
  "is_parallel": true,
145
+ "self": 0.6389004019983986,
146
  "children": {
147
  "_process_rank_one_or_two_observation": {
148
+ "total": 2.9379069989965956,
149
+ "count": 6272,
150
  "is_parallel": true,
151
+ "self": 2.9379069989965956
152
  }
153
  }
154
  }
 
161
  }
162
  },
163
  "trainer_advance": {
164
+ "total": 1.6114260929996362,
165
+ "count": 785,
166
+ "self": 0.10081051099723481,
167
  "children": {
168
  "process_trajectory": {
169
+ "total": 1.5106155820024014,
170
+ "count": 785,
171
+ "self": 1.5106155820024014
 
 
 
 
 
 
 
 
 
 
 
 
172
  }
173
  }
174
  }
175
  }
176
  },
177
  "trainer_threads": {
178
+ "total": 1.94700010069937e-06,
179
  "count": 1,
180
+ "self": 1.94700010069937e-06
181
  },
182
  "TrainerController._save_models": {
183
+ "total": 0.7450399679999009,
184
  "count": 1,
185
+ "self": 0.02608699899997191,
186
  "children": {
187
  "RLTrainer._checkpoint": {
188
+ "total": 0.718952968999929,
189
  "count": 1,
190
+ "self": 0.718952968999929
191
  }
192
  }
193
  }
run_logs/training_status.json CHANGED
@@ -1,24 +1,24 @@
1
  {
2
  "SoccerTwos": {
3
- "elo": 1199.0185606756888,
4
  "checkpoints": [
5
  {
6
- "steps": 51926,
7
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-51926.onnx",
8
  "reward": 0.0,
9
- "creation_time": 1686748585.8895307,
10
  "auxillary_file_paths": [
11
- "results/SoccerTwos/SoccerTwos/SoccerTwos-51926.pt"
12
  ]
13
  }
14
  ],
15
  "final_checkpoint": {
16
- "steps": 51926,
17
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
18
  "reward": 0.0,
19
- "creation_time": 1686748585.8895307,
20
  "auxillary_file_paths": [
21
- "results/SoccerTwos/SoccerTwos/SoccerTwos-51926.pt"
22
  ]
23
  }
24
  },
 
1
  {
2
  "SoccerTwos": {
3
+ "elo": 1200.9928540150988,
4
  "checkpoints": [
5
  {
6
+ "steps": 2794,
7
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-2794.onnx",
8
  "reward": 0.0,
9
+ "creation_time": 1686748738.4783692,
10
  "auxillary_file_paths": [
11
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-2794.pt"
12
  ]
13
  }
14
  ],
15
  "final_checkpoint": {
16
+ "steps": 2794,
17
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
18
  "reward": 0.0,
19
+ "creation_time": 1686748738.4783692,
20
  "auxillary_file_paths": [
21
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-2794.pt"
22
  ]
23
  }
24
  },