giovannidispoto commited on
Commit
9db8030
1 Parent(s): 4b62b3d

First Push`

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70506f8cee310950c62ab165bf7ebe724d52a1128a883c02b70f912fa671cdec
3
  size 1764633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6687d7b93488beaa3a2711f6f03563e8a0f6b77fab174bdc7e45d35b36101c20
3
  size 1764633
SoccerTwos/SoccerTwos-2934422.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6687d7b93488beaa3a2711f6f03563e8a0f6b77fab174bdc7e45d35b36101c20
3
+ size 1764633
SoccerTwos/SoccerTwos-2934422.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d67d3af86811aaa17d02763d901139d2e2c20e2970766669775c00e9f4bf14b2
3
+ size 28421201
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15283d56cd77101e66587ac8b1b8c709476a8bc1d03bc14efa34fec302849a1a
3
  size 28421201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d67d3af86811aaa17d02763d901139d2e2c20e2970766669775c00e9f4bf14b2
3
  size 28421201
SoccerTwos/events.out.tfevents.1689930706.MBP-di-Giovanni.homenet.telecomitalia.it.8723.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d048b1053efe34ed0664661eb03b21cee8984edf774b0cdb86c4b6430b52754
3
- size 1241
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d7aab6ba08161b8ac5c1ad308864c3050db68d9d155c0d403111d831f7a2e8b
3
+ size 335348
run_logs/Player-0.log CHANGED
@@ -38,3 +38,297 @@ WARNING: Shader If subshaders removal was intentional, you may have forgotten tu
38
  UnloadTime: 0.256916 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  UnloadTime: 0.256916 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
+ TOO LONG
42
+ TOO LONG
43
+ TOO LONG
44
+ TOO LONG
45
+ TOO LONG
46
+ TOO LONG
47
+ TOO LONG
48
+ TOO LONG
49
+ TOO LONG
50
+ TOO LONG
51
+ TOO LONG
52
+ TOO LONG
53
+ TOO LONG
54
+ TOO LONG
55
+ TOO LONG
56
+ TOO LONG
57
+ TOO LONG
58
+ TOO LONG
59
+ TOO LONG
60
+ TOO LONG
61
+ TOO LONG
62
+ TOO LONG
63
+ TOO LONG
64
+ TOO LONG
65
+ TOO LONG
66
+ TOO LONG
67
+ TOO LONG
68
+ TOO LONG
69
+ TOO LONG
70
+ TOO LONG
71
+ TOO LONG
72
+ TOO LONG
73
+ TOO LONG
74
+ TOO LONG
75
+ TOO LONG
76
+ TOO LONG
77
+ TOO LONG
78
+ TOO LONG
79
+ TOO LONG
80
+ TOO LONG
81
+ TOO LONG
82
+ TOO LONG
83
+ TOO LONG
84
+ TOO LONG
85
+ TOO LONG
86
+ GRPC Exception: Status(StatusCode=Unknown, Detail="Exception calling application: [Errno 32] Broken pipe"). Disconnecting from trainer.
87
+ Thread 0x17131f000 may have been prematurely finalized
88
+ Setting up 4 worker threads for Enlighten.
89
+ Memory Statistics:
90
+ [ALLOC_TEMP_TLS] TLS Allocator
91
+ StackAllocators :
92
+ [ALLOC_TEMP_MAIN]
93
+ Peak usage frame count: [2.0 KB-4.0 KB]: 1 frames, [8.0 KB-16.0 KB]: 6297 frames, [2.0 MB-4.0 MB]: 1 frames
94
+ Initial Block Size 4.0 MB
95
+ Current Block Size 4.0 MB
96
+ Peak Allocated Bytes 2.1 MB
97
+ Overflow Count 0
98
+ [ALLOC_TEMP_Loading.AsyncRead]
99
+ Initial Block Size 64.0 KB
100
+ Current Block Size 64.0 KB
101
+ Peak Allocated Bytes 141 B
102
+ Overflow Count 0
103
+ [ALLOC_TEMP_Loading.PreloadManager]
104
+ Initial Block Size 256.0 KB
105
+ Current Block Size 256.0 KB
106
+ Peak Allocated Bytes 78.8 KB
107
+ Overflow Count 4
108
+ [ALLOC_TEMP_Background Job.Worker 8]
109
+ Initial Block Size 32.0 KB
110
+ Current Block Size 32.0 KB
111
+ Peak Allocated Bytes 0 B
112
+ Overflow Count 0
113
+ [ALLOC_TEMP_Job.Worker 6]
114
+ Initial Block Size 256.0 KB
115
+ Current Block Size 256.0 KB
116
+ Peak Allocated Bytes 0 B
117
+ Overflow Count 0
118
+ [ALLOC_TEMP_Job.Worker 0]
119
+ Initial Block Size 256.0 KB
120
+ Current Block Size 256.0 KB
121
+ Peak Allocated Bytes 0.7 KB
122
+ Overflow Count 0
123
+ [ALLOC_TEMP_Background Job.Worker 10]
124
+ Initial Block Size 32.0 KB
125
+ Current Block Size 32.0 KB
126
+ Peak Allocated Bytes 0 B
127
+ Overflow Count 0
128
+ [ALLOC_TEMP_Background Job.Worker 9]
129
+ Initial Block Size 32.0 KB
130
+ Current Block Size 32.0 KB
131
+ Peak Allocated Bytes 0 B
132
+ Overflow Count 0
133
+ [ALLOC_TEMP_Job.Worker 5]
134
+ Initial Block Size 256.0 KB
135
+ Current Block Size 256.0 KB
136
+ Peak Allocated Bytes 0 B
137
+ Overflow Count 0
138
+ [ALLOC_TEMP_Background Job.Worker 14]
139
+ Initial Block Size 32.0 KB
140
+ Current Block Size 32.0 KB
141
+ Peak Allocated Bytes 0 B
142
+ Overflow Count 0
143
+ [ALLOC_TEMP_Background Job.Worker 6]
144
+ Initial Block Size 32.0 KB
145
+ Current Block Size 32.0 KB
146
+ Peak Allocated Bytes 0 B
147
+ Overflow Count 0
148
+ [ALLOC_TEMP_Job.Worker 4]
149
+ Initial Block Size 256.0 KB
150
+ Current Block Size 256.0 KB
151
+ Peak Allocated Bytes 0 B
152
+ Overflow Count 0
153
+ [ALLOC_TEMP_Job.Worker 3]
154
+ Initial Block Size 256.0 KB
155
+ Current Block Size 256.0 KB
156
+ Peak Allocated Bytes 0 B
157
+ Overflow Count 0
158
+ [ALLOC_TEMP_Background Job.Worker 12]
159
+ Initial Block Size 32.0 KB
160
+ Current Block Size 32.0 KB
161
+ Peak Allocated Bytes 0 B
162
+ Overflow Count 0
163
+ [ALLOC_TEMP_EnlightenWorker] x 4
164
+ Initial Block Size 64.0 KB
165
+ Current Block Size 64.0 KB
166
+ Peak Allocated Bytes 0 B
167
+ Overflow Count 0
168
+ [ALLOC_TEMP_Background Job.Worker 15]
169
+ Initial Block Size 32.0 KB
170
+ Current Block Size 32.0 KB
171
+ Peak Allocated Bytes 0 B
172
+ Overflow Count 0
173
+ [ALLOC_TEMP_Background Job.Worker 1]
174
+ Initial Block Size 32.0 KB
175
+ Current Block Size 32.0 KB
176
+ Peak Allocated Bytes 0 B
177
+ Overflow Count 0
178
+ [ALLOC_TEMP_Background Job.Worker 2]
179
+ Initial Block Size 32.0 KB
180
+ Current Block Size 32.0 KB
181
+ Peak Allocated Bytes 0 B
182
+ Overflow Count 0
183
+ [ALLOC_TEMP_Background Job.Worker 7]
184
+ Initial Block Size 32.0 KB
185
+ Current Block Size 32.0 KB
186
+ Peak Allocated Bytes 0 B
187
+ Overflow Count 0
188
+ [ALLOC_TEMP_AssetGarbageCollectorHelper] x 7
189
+ Initial Block Size 64.0 KB
190
+ Current Block Size 64.0 KB
191
+ Peak Allocated Bytes 0 B
192
+ Overflow Count 0
193
+ [ALLOC_TEMP_Background Job.Worker 5]
194
+ Initial Block Size 32.0 KB
195
+ Current Block Size 32.0 KB
196
+ Peak Allocated Bytes 0 B
197
+ Overflow Count 0
198
+ [ALLOC_TEMP_Background Job.Worker 13]
199
+ Initial Block Size 32.0 KB
200
+ Current Block Size 32.0 KB
201
+ Peak Allocated Bytes 0 B
202
+ Overflow Count 0
203
+ [ALLOC_TEMP_OSX HID Input]
204
+ Initial Block Size 64.0 KB
205
+ Current Block Size 64.0 KB
206
+ Peak Allocated Bytes 0 B
207
+ Overflow Count 0
208
+ [ALLOC_TEMP_Job.Worker 1]
209
+ Initial Block Size 256.0 KB
210
+ Current Block Size 256.0 KB
211
+ Peak Allocated Bytes 0 B
212
+ Overflow Count 0
213
+ [ALLOC_TEMP_Job.Worker 2]
214
+ Initial Block Size 256.0 KB
215
+ Current Block Size 256.0 KB
216
+ Peak Allocated Bytes 0 B
217
+ Overflow Count 0
218
+ [ALLOC_TEMP_Background Job.Worker 3]
219
+ Initial Block Size 32.0 KB
220
+ Current Block Size 32.0 KB
221
+ Peak Allocated Bytes 0 B
222
+ Overflow Count 0
223
+ [ALLOC_TEMP_Background Job.Worker 11]
224
+ Initial Block Size 32.0 KB
225
+ Current Block Size 32.0 KB
226
+ Peak Allocated Bytes 0 B
227
+ Overflow Count 0
228
+ [ALLOC_TEMP_Background Job.Worker 0]
229
+ Initial Block Size 32.0 KB
230
+ Current Block Size 32.0 KB
231
+ Peak Allocated Bytes 0 B
232
+ Overflow Count 0
233
+ [ALLOC_TEMP_Background Job.Worker 4]
234
+ Initial Block Size 32.0 KB
235
+ Current Block Size 32.0 KB
236
+ Peak Allocated Bytes 0 B
237
+ Overflow Count 0
238
+ [ALLOC_TEMP_BatchDeleteObjects]
239
+ Initial Block Size 64.0 KB
240
+ Current Block Size 64.0 KB
241
+ Peak Allocated Bytes 0 B
242
+ Overflow Count 0
243
+ [ALLOC_DEFAULT] Dual Thread Allocator
244
+ Peak main deferred allocation count 8
245
+ [ALLOC_BUCKET]
246
+ Large Block size 4.0 MB
247
+ Used Block count 1
248
+ Peak Allocated bytes 1.0 MB
249
+ [ALLOC_DEFAULT_MAIN]
250
+ Peak usage frame count: [4.0 MB-8.0 MB]: 6299 frames
251
+ Requested Block Size 16.0 MB
252
+ Peak Block count 1
253
+ Peak Allocated memory 5.0 MB
254
+ Peak Large allocation bytes 0 B
255
+ [ALLOC_DEFAULT_THREAD]
256
+ Peak usage frame count: [16.0 MB-32.0 MB]: 6299 frames
257
+ Requested Block Size 16.0 MB
258
+ Peak Block count 1
259
+ Peak Allocated memory 17.4 MB
260
+ Peak Large allocation bytes 16.0 MB
261
+ [ALLOC_TEMP_JOB_1_FRAME]
262
+ Initial Block Size 2.0 MB
263
+ Used Block Count 1
264
+ Overflow Count (too large) 0
265
+ Overflow Count (full) 0
266
+ [ALLOC_TEMP_JOB_2_FRAMES]
267
+ Initial Block Size 2.0 MB
268
+ Used Block Count 1
269
+ Overflow Count (too large) 0
270
+ Overflow Count (full) 0
271
+ [ALLOC_TEMP_JOB_4_FRAMES (JobTemp)]
272
+ Initial Block Size 2.0 MB
273
+ Used Block Count 2
274
+ Overflow Count (too large) 0
275
+ Overflow Count (full) 0
276
+ [ALLOC_TEMP_JOB_ASYNC (Background)]
277
+ Initial Block Size 1.0 MB
278
+ Used Block Count 3
279
+ Overflow Count (too large) 0
280
+ Overflow Count (full) 0
281
+ [ALLOC_GFX] Dual Thread Allocator
282
+ Peak main deferred allocation count 0
283
+ [ALLOC_BUCKET]
284
+ Large Block size 4.0 MB
285
+ Used Block count 1
286
+ Peak Allocated bytes 1.0 MB
287
+ [ALLOC_GFX_MAIN]
288
+ Peak usage frame count: [32.0 KB-64.0 KB]: 6298 frames, [64.0 KB-128.0 KB]: 1 frames
289
+ Requested Block Size 16.0 MB
290
+ Peak Block count 1
291
+ Peak Allocated memory 65.6 KB
292
+ Peak Large allocation bytes 0 B
293
+ [ALLOC_GFX_THREAD]
294
+ Peak usage frame count: [128.0 KB-256.0 KB]: 6299 frames
295
+ Requested Block Size 16.0 MB
296
+ Peak Block count 1
297
+ Peak Allocated memory 173.5 KB
298
+ Peak Large allocation bytes 0 B
299
+ [ALLOC_CACHEOBJECTS] Dual Thread Allocator
300
+ Peak main deferred allocation count 0
301
+ [ALLOC_BUCKET]
302
+ Large Block size 4.0 MB
303
+ Used Block count 1
304
+ Peak Allocated bytes 1.0 MB
305
+ [ALLOC_CACHEOBJECTS_MAIN]
306
+ Peak usage frame count: [0.5 MB-1.0 MB]: 6299 frames
307
+ Requested Block Size 4.0 MB
308
+ Peak Block count 1
309
+ Peak Allocated memory 0.6 MB
310
+ Peak Large allocation bytes 0 B
311
+ [ALLOC_CACHEOBJECTS_THREAD]
312
+ Peak usage frame count: [0.5 MB-1.0 MB]: 6298 frames, [2.0 MB-4.0 MB]: 1 frames
313
+ Requested Block Size 4.0 MB
314
+ Peak Block count 1
315
+ Peak Allocated memory 3.4 MB
316
+ Peak Large allocation bytes 0 B
317
+ [ALLOC_TYPETREE] Dual Thread Allocator
318
+ Peak main deferred allocation count 0
319
+ [ALLOC_BUCKET]
320
+ Large Block size 4.0 MB
321
+ Used Block count 1
322
+ Peak Allocated bytes 1.0 MB
323
+ [ALLOC_TYPETREE_MAIN]
324
+ Peak usage frame count: [0-1.0 KB]: 6299 frames
325
+ Requested Block Size 2.0 MB
326
+ Peak Block count 1
327
+ Peak Allocated memory 1.0 KB
328
+ Peak Large allocation bytes 0 B
329
+ [ALLOC_TYPETREE_THREAD]
330
+ Peak usage frame count: [1.0 KB-2.0 KB]: 6298 frames, [2.0 KB-4.0 KB]: 1 frames
331
+ Requested Block Size 2.0 MB
332
+ Peak Block count 1
333
+ Peak Allocated memory 2.2 KB
334
+ Peak Large allocation bytes 0 B
run_logs/timers.json CHANGED
@@ -2,201 +2,201 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 3.0429799556732178,
6
- "min": 3.0280234813690186,
7
- "max": 3.191495418548584,
8
- "count": 161
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 55893.45703125,
12
- "min": 9785.7265625,
13
- "max": 110518.34375,
14
- "count": 161
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 573.5714285714286,
18
- "min": 95.0,
19
- "max": 999.0,
20
- "count": 161
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 16060.0,
24
- "min": 380.0,
25
- "max": 23704.0,
26
- "count": 161
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1253.5616176330443,
30
- "min": 1198.1748449658994,
31
- "max": 1255.1449382701196,
32
- "count": 153
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 12535.616176330443,
36
- "min": 2396.349689931799,
37
- "max": 45056.64592682517,
38
- "count": 153
39
- },
40
- "SoccerTwos.IsTraining.mean": {
41
- "value": 1.0,
42
- "min": 1.0,
43
- "max": 1.0,
44
- "count": 161
45
- },
46
- "SoccerTwos.IsTraining.sum": {
47
- "value": 1.0,
48
- "min": 1.0,
49
- "max": 1.0,
50
- "count": 161
51
  },
52
  "SoccerTwos.Step.mean": {
53
- "value": 2599727.0,
54
- "min": 1009454.0,
55
- "max": 2599727.0,
56
- "count": 160
57
  },
58
  "SoccerTwos.Step.sum": {
59
- "value": 2599727.0,
60
- "min": 1009454.0,
61
- "max": 2599727.0,
62
- "count": 160
63
  },
64
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
65
- "value": -0.015503649599850178,
66
- "min": -0.04074995219707489,
67
- "max": 0.03584587574005127,
68
- "count": 160
69
  },
70
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
71
- "value": -0.23255474865436554,
72
- "min": -0.6843217611312866,
73
- "max": 1.254599928855896,
74
- "count": 160
75
  },
76
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
77
- "value": -0.015258976258337498,
78
- "min": -0.039837684482336044,
79
- "max": 0.03866251930594444,
80
- "count": 160
81
  },
82
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
83
- "value": -0.22888463735580444,
84
- "min": -0.6837544441223145,
85
- "max": 1.353188157081604,
86
- "count": 160
87
  },
88
  "SoccerTwos.Environment.CumulativeReward.mean": {
89
  "value": 0.0,
90
  "min": 0.0,
91
  "max": 0.0,
92
- "count": 160
93
  },
94
  "SoccerTwos.Environment.CumulativeReward.sum": {
95
  "value": 0.0,
96
  "min": 0.0,
97
  "max": 0.0,
98
- "count": 160
99
  },
100
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
101
- "value": -0.2710533301035563,
102
- "min": -0.7474956512451172,
103
- "max": 0.46924210222143875,
104
- "count": 160
105
  },
106
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
107
- "value": -4.065799951553345,
108
- "min": -17.192399978637695,
109
- "max": 9.174400091171265,
110
- "count": 160
111
  },
112
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
113
- "value": -0.2710533301035563,
114
- "min": -0.7474956512451172,
115
- "max": 0.46924210222143875,
116
- "count": 160
117
  },
118
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
119
- "value": -4.065799951553345,
120
- "min": -17.192399978637695,
121
- "max": 9.174400091171265,
122
- "count": 160
 
 
 
 
 
 
 
 
 
 
 
 
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.01552068288049971,
126
- "min": 0.012524987536016852,
127
- "max": 0.022274984690981606,
128
- "count": 75
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.01552068288049971,
132
- "min": 0.012524987536016852,
133
- "max": 0.022274984690981606,
134
- "count": 75
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.012713205628097057,
138
- "min": 0.0005046518689293104,
139
- "max": 0.015418903343379498,
140
- "count": 75
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.012713205628097057,
144
- "min": 0.0005046518689293104,
145
- "max": 0.015418903343379498,
146
- "count": 75
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.01291948426514864,
150
- "min": 0.000504054954944877,
151
- "max": 0.01562350361297528,
152
- "count": 75
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.01291948426514864,
156
- "min": 0.000504054954944877,
157
- "max": 0.01562350361297528,
158
- "count": 75
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.0003,
162
  "min": 0.0003,
163
  "max": 0.0003,
164
- "count": 75
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.0003,
168
  "min": 0.0003,
169
  "max": 0.0003,
170
- "count": 75
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
  "value": 0.20000000000000007,
174
  "min": 0.20000000000000007,
175
  "max": 0.20000000000000007,
176
- "count": 75
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
  "value": 0.20000000000000007,
180
  "min": 0.20000000000000007,
181
  "max": 0.20000000000000007,
182
- "count": 75
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
  "value": 0.005000000000000001,
186
  "min": 0.005000000000000001,
187
  "max": 0.005000000000000001,
188
- "count": 75
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
  "value": 0.005000000000000001,
192
  "min": 0.005000000000000001,
193
  "max": 0.005000000000000001,
194
- "count": 75
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1689924786",
200
  "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:38:11) \n[Clang 14.0.6 ]",
201
  "command_line_arguments": "/Users/giovannidispoto/miniforge3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env training-envs-executables/linux/SoccerTwos/SoccerTwos --run-id =SoccerTwos training --no-graphics --resume",
202
  "mlagents_version": "0.31.0.dev0",
@@ -204,103 +204,103 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0",
206
  "numpy_version": "1.21.2",
207
- "end_time_seconds": "1689930698"
208
  },
209
- "total": 5911.306915667001,
210
  "count": 1,
211
- "self": 0.20646262500122248,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.056267874999999856,
215
  "count": 1,
216
- "self": 0.056267874999999856
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 5911.044185166999,
220
  "count": 1,
221
- "self": 1.1270955429890819,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 2.8766715400011753,
225
- "count": 10,
226
- "self": 2.8766715400011753
227
  },
228
  "TrainerController.advance": {
229
- "total": 5906.894979584009,
230
- "count": 104383,
231
- "self": 1.0448963620874565,
232
  "children": {
233
  "env_step": {
234
- "total": 4601.6896993350165,
235
- "count": 104383,
236
- "self": 4409.8189295159245,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 191.10761183097588,
240
- "count": 104383,
241
- "self": 5.378499134121967,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 185.72911269685392,
245
- "count": 206502,
246
- "self": 185.72911269685392
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 0.7631579881156241,
252
- "count": 104382,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 5906.829998433097,
257
- "count": 104382,
258
  "is_parallel": true,
259
- "self": 1679.6308405951095,
260
  "children": {
261
  "steps_from_proto": {
262
- "total": 0.013667627000538918,
263
- "count": 20,
264
  "is_parallel": true,
265
- "self": 0.0020639220016827053,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
- "total": 0.011603704998856212,
269
- "count": 80,
270
  "is_parallel": true,
271
- "self": 0.011603704998856212
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
- "total": 4227.185490210987,
277
- "count": 104382,
278
  "is_parallel": true,
279
- "self": 11.35144842086902,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
- "total": 66.85198158409172,
283
- "count": 104382,
284
  "is_parallel": true,
285
- "self": 66.85198158409172
286
  },
287
  "communicator.exchange": {
288
- "total": 4017.812950275919,
289
- "count": 104382,
290
  "is_parallel": true,
291
- "self": 4017.812950275919
292
  },
293
  "steps_from_proto": {
294
- "total": 131.16910993010734,
295
- "count": 208764,
296
  "is_parallel": true,
297
- "self": 17.862625829338057,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
- "total": 113.30648410076928,
301
- "count": 835056,
302
  "is_parallel": true,
303
- "self": 113.30648410076928
304
  }
305
  }
306
  }
@@ -313,31 +313,24 @@
313
  }
314
  },
315
  "trainer_advance": {
316
- "total": 1304.1603838869046,
317
- "count": 104382,
318
- "self": 9.110193707981125,
319
  "children": {
320
  "process_trajectory": {
321
- "total": 190.7648718849274,
322
- "count": 104382,
323
- "self": 190.26279075992727,
324
- "children": {
325
- "RLTrainer._checkpoint": {
326
- "total": 0.5020811250001316,
327
- "count": 4,
328
- "self": 0.5020811250001316
329
- }
330
- }
331
  },
332
  "_update_policy": {
333
- "total": 1104.2853182939962,
334
- "count": 75,
335
- "self": 136.70639390800068,
336
  "children": {
337
  "TorchPOCAOptimizer.update": {
338
- "total": 967.5789243859955,
339
- "count": 2250,
340
- "self": 967.5789243859955
341
  }
342
  }
343
  }
@@ -351,14 +344,14 @@
351
  "self": 5.000001692678779e-07
352
  },
353
  "TrainerController._save_models": {
354
- "total": 0.1454379999995581,
355
  "count": 1,
356
- "self": 0.003915333999430004,
357
  "children": {
358
  "RLTrainer._checkpoint": {
359
- "total": 0.14152266600012808,
360
  "count": 1,
361
- "self": 0.14152266600012808
362
  }
363
  }
364
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 2.918834924697876,
6
+ "min": 2.8833391666412354,
7
+ "max": 3.0236945152282715,
8
+ "count": 33
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 78271.4765625,
12
+ "min": 39830.37109375,
13
+ "max": 84569.7890625,
14
+ "count": 33
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 230.95652173913044,
18
+ "min": 124.25714285714285,
19
+ "max": 623.625,
20
+ "count": 33
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 21248.0,
24
+ "min": 9680.0,
25
+ "max": 22600.0,
26
+ "count": 33
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1282.0056355876839,
30
+ "min": 1253.013989211454,
31
+ "max": 1282.0056355876839,
32
+ "count": 33
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 58972.25923703346,
36
+ "min": 12559.079803129456,
37
+ "max": 101548.60181663197,
38
+ "count": 33
 
 
 
 
 
 
 
 
 
 
 
 
39
  },
40
  "SoccerTwos.Step.mean": {
41
+ "value": 2929962.0,
42
+ "min": 2609928.0,
43
+ "max": 2929962.0,
44
+ "count": 33
45
  },
46
  "SoccerTwos.Step.sum": {
47
+ "value": 2929962.0,
48
+ "min": 2609928.0,
49
+ "max": 2929962.0,
50
+ "count": 33
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": 0.03823350369930267,
54
+ "min": -0.049646422266960144,
55
+ "max": 0.052216753363609314,
56
+ "count": 33
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": 1.7205077409744263,
60
+ "min": -2.035503387451172,
61
+ "max": 2.2943410873413086,
62
+ "count": 33
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": 0.03543571010231972,
66
+ "min": -0.05077830329537392,
67
+ "max": 0.05149360001087189,
68
+ "count": 33
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": 1.594606876373291,
72
+ "min": -2.0819103717803955,
73
+ "max": 2.4051408767700195,
74
+ "count": 33
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
+ "count": 33
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
+ "count": 33
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
+ "value": 0.12317777209811741,
90
+ "min": -0.563066663164081,
91
+ "max": 0.48426666997727896,
92
+ "count": 33
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
+ "value": 5.542999744415283,
96
+ "min": -18.581199884414673,
97
+ "max": 12.681599855422974,
98
+ "count": 33
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
+ "value": 0.12317777209811741,
102
+ "min": -0.563066663164081,
103
+ "max": 0.48426666997727896,
104
+ "count": 33
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
+ "value": 5.542999744415283,
108
+ "min": -18.581199884414673,
109
+ "max": 12.681599855422974,
110
+ "count": 33
111
+ },
112
+ "SoccerTwos.IsTraining.mean": {
113
+ "value": 1.0,
114
+ "min": 1.0,
115
+ "max": 1.0,
116
+ "count": 33
117
+ },
118
+ "SoccerTwos.IsTraining.sum": {
119
+ "value": 1.0,
120
+ "min": 1.0,
121
+ "max": 1.0,
122
+ "count": 33
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.015882109101706496,
126
+ "min": 0.010916591945958013,
127
+ "max": 0.02235342748463154,
128
+ "count": 15
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.015882109101706496,
132
+ "min": 0.010916591945958013,
133
+ "max": 0.02235342748463154,
134
+ "count": 15
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.032553153360883394,
138
+ "min": 0.008785408766319355,
139
+ "max": 0.032553153360883394,
140
+ "count": 15
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.032553153360883394,
144
+ "min": 0.008785408766319355,
145
+ "max": 0.032553153360883394,
146
+ "count": 15
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.03331315269072851,
150
+ "min": 0.008910710799197356,
151
+ "max": 0.03331315269072851,
152
+ "count": 15
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.03331315269072851,
156
+ "min": 0.008910710799197356,
157
+ "max": 0.03331315269072851,
158
+ "count": 15
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.0003,
162
  "min": 0.0003,
163
  "max": 0.0003,
164
+ "count": 15
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.0003,
168
  "min": 0.0003,
169
  "max": 0.0003,
170
+ "count": 15
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
  "value": 0.20000000000000007,
174
  "min": 0.20000000000000007,
175
  "max": 0.20000000000000007,
176
+ "count": 15
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
  "value": 0.20000000000000007,
180
  "min": 0.20000000000000007,
181
  "max": 0.20000000000000007,
182
+ "count": 15
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
  "value": 0.005000000000000001,
186
  "min": 0.005000000000000001,
187
  "max": 0.005000000000000001,
188
+ "count": 15
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
  "value": 0.005000000000000001,
192
  "min": 0.005000000000000001,
193
  "max": 0.005000000000000001,
194
+ "count": 15
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1689930704",
200
  "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:38:11) \n[Clang 14.0.6 ]",
201
  "command_line_arguments": "/Users/giovannidispoto/miniforge3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env training-envs-executables/linux/SoccerTwos/SoccerTwos --run-id =SoccerTwos training --no-graphics --resume",
202
  "mlagents_version": "0.31.0.dev0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0",
206
  "numpy_version": "1.21.2",
207
+ "end_time_seconds": "1689931918"
208
  },
209
+ "total": 1213.220998792,
210
  "count": 1,
211
+ "self": 0.19836883399989347,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.0146809160000001,
215
  "count": 1,
216
+ "self": 0.0146809160000001
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 1213.007949042,
220
  "count": 1,
221
+ "self": 0.256065019000971,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 1.6167403750000064,
225
+ "count": 3,
226
+ "self": 1.6167403750000064
227
  },
228
  "TrainerController.advance": {
229
+ "total": 1210.9198496889987,
230
+ "count": 21467,
231
+ "self": 0.2263428089916033,
232
  "children": {
233
  "env_step": {
234
+ "total": 935.021241669002,
235
+ "count": 21467,
236
+ "self": 896.3483562050126,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 38.50613126399476,
240
+ "count": 21467,
241
+ "self": 1.2515383709973094,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 37.25459289299745,
245
+ "count": 41986,
246
+ "self": 37.25459289299745
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 0.16675419999469066,
252
+ "count": 21466,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 1210.8783447740025,
257
+ "count": 21466,
258
  "is_parallel": true,
259
+ "self": 348.50981015801983,
260
  "children": {
261
  "steps_from_proto": {
262
+ "total": 0.004010457999933603,
263
+ "count": 6,
264
  "is_parallel": true,
265
+ "self": 0.0006119609999728493,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
+ "total": 0.003398496999960754,
269
+ "count": 24,
270
  "is_parallel": true,
271
+ "self": 0.003398496999960754
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
+ "total": 862.3645241579827,
277
+ "count": 21466,
278
  "is_parallel": true,
279
+ "self": 2.4730160429826356,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
+ "total": 14.117127869999308,
283
+ "count": 21466,
284
  "is_parallel": true,
285
+ "self": 14.117127869999308
286
  },
287
  "communicator.exchange": {
288
+ "total": 818.327291241,
289
+ "count": 21466,
290
  "is_parallel": true,
291
+ "self": 818.327291241
292
  },
293
  "steps_from_proto": {
294
+ "total": 27.447089004000716,
295
+ "count": 42932,
296
  "is_parallel": true,
297
+ "self": 3.8421029960153845,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
+ "total": 23.60498600798533,
301
+ "count": 171728,
302
  "is_parallel": true,
303
+ "self": 23.60498600798533
304
  }
305
  }
306
  }
 
313
  }
314
  },
315
  "trainer_advance": {
316
+ "total": 275.67226521100497,
317
+ "count": 21466,
318
+ "self": 2.0925505520029333,
319
  "children": {
320
  "process_trajectory": {
321
+ "total": 41.71501174500203,
322
+ "count": 21466,
323
+ "self": 41.71501174500203
 
 
 
 
 
 
 
324
  },
325
  "_update_policy": {
326
+ "total": 231.86470291400002,
327
+ "count": 15,
328
+ "self": 27.459560829000736,
329
  "children": {
330
  "TorchPOCAOptimizer.update": {
331
+ "total": 204.40514208499928,
332
+ "count": 450,
333
+ "self": 204.40514208499928
334
  }
335
  }
336
  }
 
344
  "self": 5.000001692678779e-07
345
  },
346
  "TrainerController._save_models": {
347
+ "total": 0.2152934590001223,
348
  "count": 1,
349
+ "self": 0.0022526249999827996,
350
  "children": {
351
  "RLTrainer._checkpoint": {
352
+ "total": 0.2130408340001395,
353
  "count": 1,
354
+ "self": 0.2130408340001395
355
  }
356
  }
357
  }
run_logs/training_status.json CHANGED
@@ -1,16 +1,7 @@
1
  {
2
  "SoccerTwos": {
3
- "elo": 1253.7885927395525,
4
  "checkpoints": [
5
- {
6
- "steps": 999938,
7
- "file_path": "results/=SoccerTwos training/SoccerTwos/SoccerTwos-999938.onnx",
8
- "reward": null,
9
- "creation_time": 1689924793.830441,
10
- "auxillary_file_paths": [
11
- "results/=SoccerTwos training/SoccerTwos/SoccerTwos-999938.pt"
12
- ]
13
- },
14
  {
15
  "steps": 1499744,
16
  "file_path": "results/=SoccerTwos training/SoccerTwos/SoccerTwos-1499744.onnx",
@@ -46,15 +37,24 @@
46
  "auxillary_file_paths": [
47
  "results/=SoccerTwos training/SoccerTwos/SoccerTwos-2606308.pt"
48
  ]
 
 
 
 
 
 
 
 
 
49
  }
50
  ],
51
  "final_checkpoint": {
52
- "steps": 2606308,
53
  "file_path": "results/=SoccerTwos training/SoccerTwos.onnx",
54
  "reward": 0.0,
55
- "creation_time": 1689930697.907537,
56
  "auxillary_file_paths": [
57
- "results/=SoccerTwos training/SoccerTwos/SoccerTwos-2606308.pt"
58
  ]
59
  }
60
  },
 
1
  {
2
  "SoccerTwos": {
3
+ "elo": 1279.794658723823,
4
  "checkpoints": [
 
 
 
 
 
 
 
 
 
5
  {
6
  "steps": 1499744,
7
  "file_path": "results/=SoccerTwos training/SoccerTwos/SoccerTwos-1499744.onnx",
 
37
  "auxillary_file_paths": [
38
  "results/=SoccerTwos training/SoccerTwos/SoccerTwos-2606308.pt"
39
  ]
40
+ },
41
+ {
42
+ "steps": 2934422,
43
+ "file_path": "results/=SoccerTwos training/SoccerTwos/SoccerTwos-2934422.onnx",
44
+ "reward": 0.0,
45
+ "creation_time": 1689931918.062052,
46
+ "auxillary_file_paths": [
47
+ "results/=SoccerTwos training/SoccerTwos/SoccerTwos-2934422.pt"
48
+ ]
49
  }
50
  ],
51
  "final_checkpoint": {
52
+ "steps": 2934422,
53
  "file_path": "results/=SoccerTwos training/SoccerTwos.onnx",
54
  "reward": 0.0,
55
+ "creation_time": 1689931918.062052,
56
  "auxillary_file_paths": [
57
+ "results/=SoccerTwos training/SoccerTwos/SoccerTwos-2934422.pt"
58
  ]
59
  }
60
  },