alexdavey committed on
Commit
e9c1989
•
1 Parent(s): 37ffa3a

Trained to 1572 ELO

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d4a9963b708711b8d0f37052735023837f265e2bf871eb4232b39373434fa72
3
  size 1764633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4771129c8ad26e11f4a8f34d439ffd480fda48f628b3a4463a3855402dd40e61
3
  size 1764633
SoccerTwos/{SoccerTwos-1499957.onnx → SoccerTwos-12999992.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17849b03ce92d7f808ab07541dcc22f9ab9d54057b98c612760d74d629ac0526
3
  size 1764633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:549ec281a17e285442320a181b6f29cafc6c71b6a2997ae9ed344cbb1be97131
3
  size 1764633
SoccerTwos/{SoccerTwos-2499998.pt → SoccerTwos-12999992.pt} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4e46423801fbc8a107aaeed651a052cbbcc5e8817e90921f2e7cede75780d13
3
  size 28421201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f378e49f6f0dfbb9626c0ee6fd4b4bf4472a6c5751adfeaa32e92fe15b8e06f4
3
  size 28421201
SoccerTwos/{SoccerTwos-2499998.onnx → SoccerTwos-13499996.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5dbd0a8fcac33356903e66186153832a53a69b5c897223288d6442feae5e2c9
3
  size 1764633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35fbeece95d61c2a676ddd81318a156e5b334d2cbbac08bb47a369f3c88b8125
3
  size 1764633
SoccerTwos/{SoccerTwos-1499957.pt → SoccerTwos-13499996.pt} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e0a0277b9585311022860bab13799c67751d94f73417d8a155f024f68408ef2
3
  size 28421201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35487969f33bf4d77ab8ebc796d9cd44ff8dabcf5fccf7d69a8f2956ad08407b
3
  size 28421201
SoccerTwos/{SoccerTwos-1999940.onnx → SoccerTwos-13999972.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76195e8ecab17b427d7ad7d0198b9d486e294ad8bcf0965785daaf0a7921beff
3
  size 1764633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ec3b2634dadae5dc0c77aea3a6f191cc7fe1cf14c505e52504ad2a9cbbc3315
3
  size 1764633
SoccerTwos/{SoccerTwos-2511370.pt → SoccerTwos-13999972.pt} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7de37f76bf5b58fde322b34cac14392d9b060f77049e8547cf74f84bed339674
3
  size 28421201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0d46d00ccdab26b10a786a0be140b2aea0ba49f54afcc4600bd9e9161281072
3
  size 28421201
SoccerTwos/{SoccerTwos-2511370.onnx → SoccerTwos-14499964.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5dbd0a8fcac33356903e66186153832a53a69b5c897223288d6442feae5e2c9
3
  size 1764633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ea20a8f9f342fb1b1a411dfe762e252fb0eb5f462cee5cb344ea36ec572644d
3
  size 1764633
SoccerTwos/{SoccerTwos-1999940.pt → SoccerTwos-14499964.pt} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85d54743662785f6d785c86d443c5514dcecc742a9c0ceb5618b914c16a436e3
3
  size 28421201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a112afa1aa0635ad8088c218164e7afc59985592e82b423a6108d92258f3074
3
  size 28421201
SoccerTwos/SoccerTwos-14666438.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4771129c8ad26e11f4a8f34d439ffd480fda48f628b3a4463a3855402dd40e61
3
+ size 1764633
SoccerTwos/SoccerTwos-14666438.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1351a2d6da08221790798f89ea322523251190099fbfe542d3e6a2df530c139c
3
+ size 28421201
SoccerTwos/SoccerTwos-2644140.onnx DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d4a9963b708711b8d0f37052735023837f265e2bf871eb4232b39373434fa72
3
- size 1764633
 
 
 
 
SoccerTwos/SoccerTwos-2644140.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b860b3e78cbb02b69ee5d0844c690eecc9165e058d997731aa87f70d196805d8
3
- size 28421201
 
 
 
 
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b860b3e78cbb02b69ee5d0844c690eecc9165e058d997731aa87f70d196805d8
3
  size 28421201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1351a2d6da08221790798f89ea322523251190099fbfe542d3e6a2df530c139c
3
  size 28421201
SoccerTwos/events.out.tfevents.1680912512.Alexs-MacBook-Pro-M2.local.2360.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7680e2f4e83b48cd71014dcdd2846a31f2342359f073b72f59842ad8fcbe985
3
+ size 12355179
run_logs/Player-0.log CHANGED
@@ -10,7 +10,7 @@ NullGfxDevice:
10
  Renderer: Null Device
11
  Vendor: Unity Technologies
12
  Begin MonoManager ReloadAssembly
13
- - Completed reload, in 0.062 seconds
14
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
15
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -35,16 +35,16 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
35
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
36
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
37
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
38
- UnloadTime: 0.341458 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
- Thread 0x170b77000 may have been prematurely finalized
42
  Setting up 5 worker threads for Enlighten.
43
  Memory Statistics:
44
  [ALLOC_TEMP_TLS] TLS Allocator
45
  StackAllocators :
46
  [ALLOC_TEMP_MAIN]
47
- Peak usage frame count: [8.0 KB-16.0 KB]: 2498 frames, [2.0 MB-4.0 MB]: 1 frames
48
  Initial Block Size 4.0 MB
49
  Current Block Size 4.0 MB
50
  Peak Allocated Bytes 2.1 MB
@@ -67,12 +67,12 @@ Memory Statistics:
67
  [ALLOC_TEMP_Job.Worker 6]
68
  Initial Block Size 256.0 KB
69
  Current Block Size 256.0 KB
70
- Peak Allocated Bytes 0 B
71
  Overflow Count 0
72
  [ALLOC_TEMP_Job.Worker 0]
73
  Initial Block Size 256.0 KB
74
  Current Block Size 256.0 KB
75
- Peak Allocated Bytes 0.7 KB
76
  Overflow Count 0
77
  [ALLOC_TEMP_Background Job.Worker 10]
78
  Initial Block Size 32.0 KB
@@ -205,22 +205,22 @@ Memory Statistics:
205
  Peak Allocated Bytes 0 B
206
  Overflow Count 0
207
  [ALLOC_DEFAULT] Dual Thread Allocator
208
- Peak main deferred allocation count 3
209
  [ALLOC_BUCKET]
210
  Large Block size 4.0 MB
211
  Used Block count 1
212
  Peak Allocated bytes 1.0 MB
213
  [ALLOC_DEFAULT_MAIN]
214
- Peak usage frame count: [4.0 MB-8.0 MB]: 2499 frames
215
  Requested Block Size 16.0 MB
216
  Peak Block count 1
217
- Peak Allocated memory 4.9 MB
218
  Peak Large allocation bytes 0 B
219
  [ALLOC_DEFAULT_THREAD]
220
- Peak usage frame count: [16.0 MB-32.0 MB]: 2499 frames
221
  Requested Block Size 16.0 MB
222
  Peak Block count 1
223
- Peak Allocated memory 17.4 MB
224
  Peak Large allocation bytes 16.0 MB
225
  [ALLOC_TEMP_JOB_1_FRAME]
226
  Initial Block Size 2.0 MB
@@ -249,13 +249,13 @@ Memory Statistics:
249
  Used Block count 1
250
  Peak Allocated bytes 1.0 MB
251
  [ALLOC_GFX_MAIN]
252
- Peak usage frame count: [32.0 KB-64.0 KB]: 2498 frames, [64.0 KB-128.0 KB]: 1 frames
253
  Requested Block Size 16.0 MB
254
  Peak Block count 1
255
  Peak Allocated memory 65.6 KB
256
  Peak Large allocation bytes 0 B
257
  [ALLOC_GFX_THREAD]
258
- Peak usage frame count: [128.0 KB-256.0 KB]: 2499 frames
259
  Requested Block Size 16.0 MB
260
  Peak Block count 1
261
  Peak Allocated memory 173.5 KB
@@ -267,13 +267,13 @@ Memory Statistics:
267
  Used Block count 1
268
  Peak Allocated bytes 1.0 MB
269
  [ALLOC_CACHEOBJECTS_MAIN]
270
- Peak usage frame count: [0.5 MB-1.0 MB]: 2499 frames
271
  Requested Block Size 4.0 MB
272
  Peak Block count 1
273
  Peak Allocated memory 0.6 MB
274
  Peak Large allocation bytes 0 B
275
  [ALLOC_CACHEOBJECTS_THREAD]
276
- Peak usage frame count: [0.5 MB-1.0 MB]: 2498 frames, [2.0 MB-4.0 MB]: 1 frames
277
  Requested Block Size 4.0 MB
278
  Peak Block count 1
279
  Peak Allocated memory 3.4 MB
@@ -285,13 +285,13 @@ Memory Statistics:
285
  Used Block count 1
286
  Peak Allocated bytes 1.0 MB
287
  [ALLOC_TYPETREE_MAIN]
288
- Peak usage frame count: [0-1.0 KB]: 2499 frames
289
  Requested Block Size 2.0 MB
290
  Peak Block count 1
291
  Peak Allocated memory 1.0 KB
292
  Peak Large allocation bytes 0 B
293
  [ALLOC_TYPETREE_THREAD]
294
- Peak usage frame count: [1.0 KB-2.0 KB]: 2498 frames, [2.0 KB-4.0 KB]: 1 frames
295
  Requested Block Size 2.0 MB
296
  Peak Block count 1
297
  Peak Allocated memory 2.2 KB
 
10
  Renderer: Null Device
11
  Vendor: Unity Technologies
12
  Begin MonoManager ReloadAssembly
13
+ - Completed reload, in 0.037 seconds
14
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
15
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
35
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
36
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
37
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
38
+ UnloadTime: 0.250541 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
+ Thread 0x171177000 may have been prematurely finalized
42
  Setting up 5 worker threads for Enlighten.
43
  Memory Statistics:
44
  [ALLOC_TEMP_TLS] TLS Allocator
45
  StackAllocators :
46
  [ALLOC_TEMP_MAIN]
47
+ Peak usage frame count: [8.0 KB-16.0 KB]: 226341 frames, [2.0 MB-4.0 MB]: 1 frames
48
  Initial Block Size 4.0 MB
49
  Current Block Size 4.0 MB
50
  Peak Allocated Bytes 2.1 MB
 
67
  [ALLOC_TEMP_Job.Worker 6]
68
  Initial Block Size 256.0 KB
69
  Current Block Size 256.0 KB
70
+ Peak Allocated Bytes 0.7 KB
71
  Overflow Count 0
72
  [ALLOC_TEMP_Job.Worker 0]
73
  Initial Block Size 256.0 KB
74
  Current Block Size 256.0 KB
75
+ Peak Allocated Bytes 0 B
76
  Overflow Count 0
77
  [ALLOC_TEMP_Background Job.Worker 10]
78
  Initial Block Size 32.0 KB
 
205
  Peak Allocated Bytes 0 B
206
  Overflow Count 0
207
  [ALLOC_DEFAULT] Dual Thread Allocator
208
+ Peak main deferred allocation count 4
209
  [ALLOC_BUCKET]
210
  Large Block size 4.0 MB
211
  Used Block count 1
212
  Peak Allocated bytes 1.0 MB
213
  [ALLOC_DEFAULT_MAIN]
214
+ Peak usage frame count: [4.0 MB-8.0 MB]: 226342 frames
215
  Requested Block Size 16.0 MB
216
  Peak Block count 1
217
+ Peak Allocated memory 4.8 MB
218
  Peak Large allocation bytes 0 B
219
  [ALLOC_DEFAULT_THREAD]
220
+ Peak usage frame count: [16.0 MB-32.0 MB]: 226342 frames
221
  Requested Block Size 16.0 MB
222
  Peak Block count 1
223
+ Peak Allocated memory 17.6 MB
224
  Peak Large allocation bytes 16.0 MB
225
  [ALLOC_TEMP_JOB_1_FRAME]
226
  Initial Block Size 2.0 MB
 
249
  Used Block count 1
250
  Peak Allocated bytes 1.0 MB
251
  [ALLOC_GFX_MAIN]
252
+ Peak usage frame count: [32.0 KB-64.0 KB]: 226341 frames, [64.0 KB-128.0 KB]: 1 frames
253
  Requested Block Size 16.0 MB
254
  Peak Block count 1
255
  Peak Allocated memory 65.6 KB
256
  Peak Large allocation bytes 0 B
257
  [ALLOC_GFX_THREAD]
258
+ Peak usage frame count: [128.0 KB-256.0 KB]: 226342 frames
259
  Requested Block Size 16.0 MB
260
  Peak Block count 1
261
  Peak Allocated memory 173.5 KB
 
267
  Used Block count 1
268
  Peak Allocated bytes 1.0 MB
269
  [ALLOC_CACHEOBJECTS_MAIN]
270
+ Peak usage frame count: [0.5 MB-1.0 MB]: 226342 frames
271
  Requested Block Size 4.0 MB
272
  Peak Block count 1
273
  Peak Allocated memory 0.6 MB
274
  Peak Large allocation bytes 0 B
275
  [ALLOC_CACHEOBJECTS_THREAD]
276
+ Peak usage frame count: [0.5 MB-1.0 MB]: 226341 frames, [2.0 MB-4.0 MB]: 1 frames
277
  Requested Block Size 4.0 MB
278
  Peak Block count 1
279
  Peak Allocated memory 3.4 MB
 
285
  Used Block count 1
286
  Peak Allocated bytes 1.0 MB
287
  [ALLOC_TYPETREE_MAIN]
288
+ Peak usage frame count: [0-1.0 KB]: 226342 frames
289
  Requested Block Size 2.0 MB
290
  Peak Block count 1
291
  Peak Allocated memory 1.0 KB
292
  Peak Large allocation bytes 0 B
293
  [ALLOC_TYPETREE_THREAD]
294
+ Peak usage frame count: [1.0 KB-2.0 KB]: 226341 frames, [2.0 KB-4.0 KB]: 1 frames
295
  Requested Block Size 2.0 MB
296
  Peak Block count 1
297
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,201 +2,201 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 2.2829747200012207,
6
- "min": 2.2494966983795166,
7
- "max": 2.297738790512085,
8
- "count": 13
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 45367.2734375,
12
- "min": 42737.79296875,
13
- "max": 47082.828125,
14
- "count": 13
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 56.18181818181818,
18
- "min": 48.87,
19
- "max": 64.94666666666667,
20
- "count": 13
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 19776.0,
24
- "min": 17412.0,
25
- "max": 20064.0,
26
- "count": 13
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1410.9445802488876,
30
- "min": 1395.780553139902,
31
- "max": 1412.1593855697279,
32
- "count": 13
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 248326.24612380422,
36
- "min": 205213.6227782548,
37
- "max": 281546.1329652176,
38
- "count": 13
39
  },
40
  "SoccerTwos.Step.mean": {
41
- "value": 2639936.0,
42
- "min": 2519904.0,
43
- "max": 2639936.0,
44
- "count": 13
45
  },
46
  "SoccerTwos.Step.sum": {
47
- "value": 2639936.0,
48
- "min": 2519904.0,
49
- "max": 2639936.0,
50
- "count": 13
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": -0.06163661554455757,
54
- "min": -0.07923465222120285,
55
- "max": -0.009704259224236012,
56
- "count": 13
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": -10.786407470703125,
60
- "min": -14.10390853881836,
61
- "max": -1.9505560398101807,
62
- "count": 13
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": -0.06483850628137589,
66
- "min": -0.08182556927204132,
67
- "max": -0.01359673123806715,
68
- "count": 13
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": -11.346738815307617,
72
- "min": -14.012410163879395,
73
- "max": -2.732943058013916,
74
- "count": 13
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
- "count": 13
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
- "count": 13
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": -0.004626287051609584,
90
- "min": -0.3000333309173584,
91
- "max": 0.05962978842410636,
92
- "count": 13
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": -0.8096002340316772,
96
- "min": -43.20479965209961,
97
- "max": 11.438199996948242,
98
- "count": 13
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": -0.004626287051609584,
102
- "min": -0.3000333309173584,
103
- "max": 0.05962978842410636,
104
- "count": 13
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": -0.8096002340316772,
108
- "min": -43.20479965209961,
109
- "max": 11.438199996948242,
110
- "count": 13
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
- "count": 13
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
- "count": 13
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.013498812660327531,
126
- "min": 0.013476709986571222,
127
- "max": 0.020637649172567763,
128
- "count": 6
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.013498812660327531,
132
- "min": 0.013476709986571222,
133
- "max": 0.020637649172567763,
134
- "count": 6
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.09673845395445824,
138
- "min": 0.09279797971248627,
139
- "max": 0.10791213264067968,
140
- "count": 6
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.09673845395445824,
144
- "min": 0.09279797971248627,
145
- "max": 0.10791213264067968,
146
- "count": 6
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.09819150865077972,
150
- "min": 0.09445200115442276,
151
- "max": 0.10951845124363899,
152
- "count": 6
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.09819150865077972,
156
- "min": 0.09445200115442276,
157
- "max": 0.10951845124363899,
158
- "count": 6
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.0003,
162
  "min": 0.0003,
163
  "max": 0.0003,
164
- "count": 6
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.0003,
168
  "min": 0.0003,
169
  "max": 0.0003,
170
- "count": 6
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
  "value": 0.20000000000000007,
174
  "min": 0.20000000000000007,
175
  "max": 0.20000000000000007,
176
- "count": 6
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
  "value": 0.20000000000000007,
180
  "min": 0.20000000000000007,
181
  "max": 0.20000000000000007,
182
- "count": 6
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
  "value": 0.005000000000000001,
186
  "min": 0.005000000000000001,
187
  "max": 0.005000000000000001,
188
- "count": 6
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
  "value": 0.005000000000000001,
192
  "min": 0.005000000000000001,
193
  "max": 0.005000000000000001,
194
- "count": 6
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1680911678",
200
  "python_version": "3.9.16 (main, Mar 8 2023, 04:29:24) \n[Clang 14.0.6 ]",
201
  "command_line_arguments": "/opt/homebrew/Caskroom/miniconda/base/envs/deep-rl-class/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics --resume",
202
  "mlagents_version": "0.31.0.dev0",
@@ -204,103 +204,103 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0",
206
  "numpy_version": "1.21.2",
207
- "end_time_seconds": "1680912104"
208
  },
209
- "total": 426.626813167,
210
  "count": 1,
211
- "self": 0.07740695900002947,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.025569500000000023,
215
  "count": 1,
216
- "self": 0.025569500000000023
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 426.523836708,
220
  "count": 1,
221
- "self": 0.09378716900090467,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 1.3233759999999997,
225
- "count": 2,
226
- "self": 1.3233759999999997
227
  },
228
  "TrainerController.advance": {
229
- "total": 425.00220607999904,
230
- "count": 9232,
231
- "self": 0.07757942499415549,
232
  "children": {
233
  "env_step": {
234
- "total": 336.9465781640031,
235
- "count": 9232,
236
- "self": 323.98379543200366,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 12.904846605999973,
240
- "count": 9232,
241
- "self": 0.3862697700014124,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 12.51857683599856,
245
- "count": 16654,
246
- "self": 12.51857683599856
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 0.05793612599943909,
252
- "count": 9231,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 425.0197629289996,
257
- "count": 9231,
258
  "is_parallel": true,
259
- "self": 113.68635206200298,
260
  "children": {
261
  "steps_from_proto": {
262
- "total": 0.0028477499999997047,
263
- "count": 4,
264
  "is_parallel": true,
265
- "self": 0.00037816600000017964,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
- "total": 0.002469583999999525,
269
- "count": 16,
270
  "is_parallel": true,
271
- "self": 0.002469583999999525
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
- "total": 311.33056311699664,
277
- "count": 9231,
278
  "is_parallel": true,
279
- "self": 0.8630629969991901,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
- "total": 5.481860843001171,
283
- "count": 9231,
284
  "is_parallel": true,
285
- "self": 5.481860843001171
286
  },
287
  "communicator.exchange": {
288
- "total": 293.425782295001,
289
- "count": 9231,
290
  "is_parallel": true,
291
- "self": 293.425782295001
292
  },
293
  "steps_from_proto": {
294
- "total": 11.559856981995265,
295
- "count": 18462,
296
  "is_parallel": true,
297
- "self": 1.2888407609985109,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
- "total": 10.271016220996755,
301
- "count": 73848,
302
  "is_parallel": true,
303
- "self": 10.271016220996755
304
  }
305
  }
306
  }
@@ -313,24 +313,31 @@
313
  }
314
  },
315
  "trainer_advance": {
316
- "total": 87.97804849100183,
317
- "count": 9231,
318
- "self": 0.7175479140037737,
319
  "children": {
320
  "process_trajectory": {
321
- "total": 25.909726616998064,
322
- "count": 9231,
323
- "self": 25.909726616998064
 
 
 
 
 
 
 
324
  },
325
  "_update_policy": {
326
- "total": 61.35077396,
327
- "count": 6,
328
- "self": 7.930714580999755,
329
  "children": {
330
  "TorchPOCAOptimizer.update": {
331
- "total": 53.42005937900024,
332
- "count": 180,
333
- "self": 53.42005937900024
334
  }
335
  }
336
  }
@@ -339,19 +346,19 @@
339
  }
340
  },
341
  "trainer_threads": {
342
- "total": 4.1700002384459367e-07,
343
  "count": 1,
344
- "self": 4.1700002384459367e-07
345
  },
346
  "TrainerController._save_models": {
347
- "total": 0.10446704200001022,
348
  "count": 1,
349
- "self": 0.0008785420000094746,
350
  "children": {
351
  "RLTrainer._checkpoint": {
352
- "total": 0.10358850000000075,
353
  "count": 1,
354
- "self": 0.10358850000000075
355
  }
356
  }
357
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 1.5082602500915527,
6
+ "min": 1.4549720287322998,
7
+ "max": 2.265712022781372,
8
+ "count": 1202
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 33398.9140625,
12
+ "min": 25996.87109375,
13
+ "max": 47126.80859375,
14
+ "count": 1202
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 53.064516129032256,
18
+ "min": 39.63934426229508,
19
+ "max": 85.66666666666667,
20
+ "count": 1202
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 19740.0,
24
+ "min": 11676.0,
25
+ "max": 21748.0,
26
+ "count": 1202
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1572.202049157151,
30
+ "min": 1403.3055570745742,
31
+ "max": 1610.9957334443245,
32
+ "count": 1202
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 292429.5811432301,
36
+ "min": 173663.35595911706,
37
+ "max": 380185.3125300383,
38
+ "count": 1202
39
  },
40
  "SoccerTwos.Step.mean": {
41
+ "value": 14659958.0,
42
+ "min": 2649975.0,
43
+ "max": 14659958.0,
44
+ "count": 1202
45
  },
46
  "SoccerTwos.Step.sum": {
47
+ "value": 14659958.0,
48
+ "min": 2649975.0,
49
+ "max": 14659958.0,
50
+ "count": 1202
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": -0.04047131538391113,
54
+ "min": -0.12949728965759277,
55
+ "max": 0.10559314489364624,
56
+ "count": 1202
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": -7.568136215209961,
60
+ "min": -24.920269012451172,
61
+ "max": 19.74591827392578,
62
+ "count": 1202
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": -0.038699373602867126,
66
+ "min": -0.1304614245891571,
67
+ "max": 0.10752364993095398,
68
+ "count": 1202
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": -7.236783027648926,
72
+ "min": -25.15608787536621,
73
+ "max": 20.106922149658203,
74
+ "count": 1202
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
+ "count": 1202
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
+ "count": 1202
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
+ "value": -0.07591336710567781,
90
+ "min": -0.3485661543332613,
91
+ "max": 0.3920156877804426,
92
+ "count": 1202
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
+ "value": -14.19579964876175,
96
+ "min": -73.85320019721985,
97
+ "max": 59.978400230407715,
98
+ "count": 1202
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
+ "value": -0.07591336710567781,
102
+ "min": -0.3485661543332613,
103
+ "max": 0.3920156877804426,
104
+ "count": 1202
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
+ "value": -14.19579964876175,
108
+ "min": -73.85320019721985,
109
+ "max": 59.978400230407715,
110
+ "count": 1202
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
+ "count": 1202
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
+ "count": 1202
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.016982776935522755,
126
+ "min": 0.010868341186627125,
127
+ "max": 0.02667792578189013,
128
+ "count": 583
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.016982776935522755,
132
+ "min": 0.010868341186627125,
133
+ "max": 0.02667792578189013,
134
+ "count": 583
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.11821085462967555,
138
+ "min": 0.08800648426016172,
139
+ "max": 0.12883232111732165,
140
+ "count": 583
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.11821085462967555,
144
+ "min": 0.08800648426016172,
145
+ "max": 0.12883232111732165,
146
+ "count": 583
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.11980451295773188,
150
+ "min": 0.08937925597031911,
151
+ "max": 0.13096312458316486,
152
+ "count": 583
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.11980451295773188,
156
+ "min": 0.08937925597031911,
157
+ "max": 0.13096312458316486,
158
+ "count": 583
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.0003,
162
  "min": 0.0003,
163
  "max": 0.0003,
164
+ "count": 583
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.0003,
168
  "min": 0.0003,
169
  "max": 0.0003,
170
+ "count": 583
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
  "value": 0.20000000000000007,
174
  "min": 0.20000000000000007,
175
  "max": 0.20000000000000007,
176
+ "count": 583
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
  "value": 0.20000000000000007,
180
  "min": 0.20000000000000007,
181
  "max": 0.20000000000000007,
182
+ "count": 583
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
  "value": 0.005000000000000001,
186
  "min": 0.005000000000000001,
187
  "max": 0.005000000000000001,
188
+ "count": 583
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
  "value": 0.005000000000000001,
192
  "min": 0.005000000000000001,
193
  "max": 0.005000000000000001,
194
+ "count": 583
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1680912511",
200
  "python_version": "3.9.16 (main, Mar 8 2023, 04:29:24) \n[Clang 14.0.6 ]",
201
  "command_line_arguments": "/opt/homebrew/Caskroom/miniconda/base/envs/deep-rl-class/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics --resume",
202
  "mlagents_version": "0.31.0.dev0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0",
206
  "numpy_version": "1.21.2",
207
+ "end_time_seconds": "1680951275"
208
  },
209
+ "total": 38764.087656417,
210
  "count": 1,
211
+ "self": 0.09442195900192019,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.009670666999999966,
215
  "count": 1,
216
+ "self": 0.009670666999999966
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 38763.983563791,
220
  "count": 1,
221
+ "self": 9.121081361445249,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 3.2734744629951806,
225
+ "count": 62,
226
+ "self": 3.2734744629951806
227
  },
228
  "TrainerController.advance": {
229
+ "total": 38751.51397613357,
230
+ "count": 840821,
231
+ "self": 7.283000948016706,
232
  "children": {
233
  "env_step": {
234
+ "total": 30646.677439031813,
235
+ "count": 840821,
236
+ "self": 29467.50711357281,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 1173.7110879960755,
240
+ "count": 840821,
241
+ "self": 30.728198681857293,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 1142.9828893142183,
245
+ "count": 1508960,
246
+ "self": 1142.9828893142183
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 5.4592374629280425,
252
+ "count": 840821,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 38741.549223342096,
257
+ "count": 840821,
258
  "is_parallel": true,
259
+ "self": 10345.48275503689,
260
  "children": {
261
  "steps_from_proto": {
262
+ "total": 0.08496799695775925,
263
+ "count": 124,
264
  "is_parallel": true,
265
+ "self": 0.009829328961364903,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
+ "total": 0.07513866799639435,
269
+ "count": 496,
270
  "is_parallel": true,
271
+ "self": 0.07513866799639435
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
+ "total": 28395.981500308248,
277
+ "count": 840821,
278
  "is_parallel": true,
279
+ "self": 78.5241393496326,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
+ "total": 499.6481334747981,
283
+ "count": 840821,
284
  "is_parallel": true,
285
+ "self": 499.6481334747981
286
  },
287
  "communicator.exchange": {
288
+ "total": 26759.368367345356,
289
+ "count": 840821,
290
  "is_parallel": true,
291
+ "self": 26759.368367345356
292
  },
293
  "steps_from_proto": {
294
+ "total": 1058.4408601384594,
295
+ "count": 1681642,
296
  "is_parallel": true,
297
+ "self": 115.98925291435125,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
+ "total": 942.4516072241081,
301
+ "count": 6726568,
302
  "is_parallel": true,
303
+ "self": 942.4516072241081
304
  }
305
  }
306
  }
 
313
  }
314
  },
315
  "trainer_advance": {
316
+ "total": 8097.553536153739,
317
+ "count": 840821,
318
+ "self": 64.9191855755953,
319
  "children": {
320
  "process_trajectory": {
321
+ "total": 2104.6275479220776,
322
+ "count": 840821,
323
+ "self": 2102.9520721740782,
324
+ "children": {
325
+ "RLTrainer._checkpoint": {
326
+ "total": 1.6754757479993714,
327
+ "count": 24,
328
+ "self": 1.6754757479993714
329
+ }
330
+ }
331
  },
332
  "_update_policy": {
333
+ "total": 5928.006802656066,
334
+ "count": 584,
335
+ "self": 775.4999598093327,
336
  "children": {
337
  "TorchPOCAOptimizer.update": {
338
+ "total": 5152.506842846733,
339
+ "count": 17512,
340
+ "self": 5152.506842846733
341
  }
342
  }
343
  }
 
346
  }
347
  },
348
  "trainer_threads": {
349
+ "total": 9.57996235229075e-07,
350
  "count": 1,
351
+ "self": 9.57996235229075e-07
352
  },
353
  "TrainerController._save_models": {
354
+ "total": 0.07503087499935646,
355
  "count": 1,
356
+ "self": 0.0011619170036283322,
357
  "children": {
358
  "RLTrainer._checkpoint": {
359
+ "total": 0.07386895799572812,
360
  "count": 1,
361
+ "self": 0.07386895799572812
362
  }
363
  }
364
  }
run_logs/training_status.json CHANGED
@@ -2,59 +2,59 @@
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
- "steps": 1499957,
6
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-1499957.onnx",
7
  "reward": 0.0,
8
- "creation_time": 1680907382.099221,
9
  "auxillary_file_paths": [
10
- "results/SoccerTwos/SoccerTwos/SoccerTwos-1499957.pt"
11
  ]
12
  },
13
  {
14
- "steps": 1999940,
15
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-1999940.onnx",
16
  "reward": 0.0,
17
- "creation_time": 1680909181.6373088,
18
  "auxillary_file_paths": [
19
- "results/SoccerTwos/SoccerTwos/SoccerTwos-1999940.pt"
20
  ]
21
  },
22
  {
23
- "steps": 2499998,
24
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-2499998.onnx",
25
- "reward": null,
26
- "creation_time": 1680911028.430613,
27
  "auxillary_file_paths": [
28
- "results/SoccerTwos/SoccerTwos/SoccerTwos-2499998.pt"
29
  ]
30
  },
31
  {
32
- "steps": 2511370,
33
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-2511370.onnx",
34
  "reward": 0.0,
35
- "creation_time": 1680911062.556363,
36
  "auxillary_file_paths": [
37
- "results/SoccerTwos/SoccerTwos/SoccerTwos-2511370.pt"
38
  ]
39
  },
40
  {
41
- "steps": 2644140,
42
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-2644140.onnx",
43
- "reward": 0.0,
44
- "creation_time": 1680912104.708426,
45
  "auxillary_file_paths": [
46
- "results/SoccerTwos/SoccerTwos/SoccerTwos-2644140.pt"
47
  ]
48
  }
49
  ],
50
- "elo": 1421.0773299193036,
51
  "final_checkpoint": {
52
- "steps": 2644140,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
- "reward": 0.0,
55
- "creation_time": 1680912104.708426,
56
  "auxillary_file_paths": [
57
- "results/SoccerTwos/SoccerTwos/SoccerTwos-2644140.pt"
58
  ]
59
  }
60
  },
 
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
+ "steps": 12999992,
6
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-12999992.onnx",
7
  "reward": 0.0,
8
+ "creation_time": 1680946042.883106,
9
  "auxillary_file_paths": [
10
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-12999992.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 13499996,
15
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-13499996.onnx",
16
  "reward": 0.0,
17
+ "creation_time": 1680947614.062955,
18
  "auxillary_file_paths": [
19
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-13499996.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 13999972,
24
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-13999972.onnx",
25
+ "reward": 0.0,
26
+ "creation_time": 1680949178.047651,
27
  "auxillary_file_paths": [
28
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-13999972.pt"
29
  ]
30
  },
31
  {
32
+ "steps": 14499964,
33
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-14499964.onnx",
34
  "reward": 0.0,
35
+ "creation_time": 1680950744.0797691,
36
  "auxillary_file_paths": [
37
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-14499964.pt"
38
  ]
39
  },
40
  {
41
+ "steps": 14666438,
42
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-14666438.onnx",
43
+ "reward": null,
44
+ "creation_time": 1680951275.4068632,
45
  "auxillary_file_paths": [
46
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-14666438.pt"
47
  ]
48
  }
49
  ],
50
+ "elo": 1571.7671539228909,
51
  "final_checkpoint": {
52
+ "steps": 14666438,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
+ "reward": null,
55
+ "creation_time": 1680951275.4068632,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-14666438.pt"
58
  ]
59
  }
60
  },