ahmadsyy commited on
Commit
9cf8a4e
·
verified ·
1 Parent(s): 04fd40f

First Push`

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69f0e6e2805958cda451132abcf52ab3631a28c39f2429d2fd4c9901d668c4b1
3
  size 1768747
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d47cac1be56645cf0167844a39f11276b31723456ba56ba75e3f6b090f31a07
3
  size 1768747
SoccerTwos/SoccerTwos-3999950.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bfedf48bffd46536865c9a20ad9317675a2377fc2936cc20536c31dd5d01758
3
+ size 1768747
SoccerTwos/SoccerTwos-3999950.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c2e84c1d9bf0e31d8038cce8eb42ff48eef2000faff364542e337dd097297ef
3
+ size 28430358
SoccerTwos/SoccerTwos-4499944.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc0cc24322ea2c951ad614d62a75c7ad0e159325336b740a974a9f430aab3c92
3
+ size 1768747
SoccerTwos/SoccerTwos-4499944.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f7be7887c57b0088fe7857fe45df15017303aa885e7497149bb2a66debce971
3
+ size 28430358
SoccerTwos/SoccerTwos-4999939.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ccc01d4cf6ae864c63c19c7e1f887cb8644296cb8884a16661d2322456a2add
3
+ size 1768747
SoccerTwos/SoccerTwos-4999939.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4483725e01e95c359b647e9d5a36d6fc2c6b178b74ba149440afeff428bed9a
3
+ size 28430358
SoccerTwos/SoccerTwos-5499963.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa94fb32932a9585f2d2f2633b1ce360a4db02cadd5596f3b8dc77dc4ad74b17
3
+ size 1768747
SoccerTwos/SoccerTwos-5499963.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f718c13d10f19434e5c00e96789f019fcce24a69ca1501bb457df71d541028e
3
+ size 28430358
SoccerTwos/SoccerTwos-5533130.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d47cac1be56645cf0167844a39f11276b31723456ba56ba75e3f6b090f31a07
3
+ size 1768747
SoccerTwos/SoccerTwos-5533130.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2307f933faef0cc39251b5fcd0820217273b6fb3539aa0ee505af2acc5c5b349
3
+ size 28430358
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cfd81fc578e9a14e3509037c8685eca53447114b61e48d25d46cc3da937ff8d
3
  size 28429366
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4713dbad866b6ba9b07a1674c30ad5232d7b1ba6155cf2e2bbca3adacd7f37f
3
  size 28429366
SoccerTwos/events.out.tfevents.1732091344.DESKTOP-BQV6K1N.23044.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1b440e846129a9c2681e1e2df7cddacca6293a37506a7937cb17d09cc4f5cf1
3
+ size 1003633
SoccerTwos/events.out.tfevents.1732095108.DESKTOP-BQV6K1N.30732.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52b420db8fd06f0c4f19c75f34e942c3f6fe6976aa4e217e165525ccb9b5b797
3
+ size 2069107
run_logs/Player-0.log CHANGED
@@ -9,7 +9,7 @@ NullGfxDevice:
9
  Renderer: Null Device
10
  Vendor: Unity Technologies
11
  Begin MonoManager ReloadAssembly
12
- - Completed reload, in 0.345 seconds
13
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
14
  Microsoft Media Foundation video decoding to texture disabled: graphics device is Null, only Direct3D 11 and Direct3D 12 (only on desktop) are supported for hardware-accelerated video decoding.
15
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -35,7 +35,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
35
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
36
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
37
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
38
- UnloadTime: 0.728800 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
  Setting up 4 worker threads for Enlighten.
@@ -43,7 +43,7 @@ Memory Statistics:
43
  [ALLOC_TEMP_TLS] TLS Allocator
44
  StackAllocators :
45
  [ALLOC_TEMP_MAIN]
46
- Peak usage frame count: [8.0 KB-16.0 KB]: 3029 frames, [2.0 MB-4.0 MB]: 1 frames
47
  Initial Block Size 4.0 MB
48
  Current Block Size 4.0 MB
49
  Peak Allocated Bytes 2.0 MB
@@ -86,7 +86,7 @@ Memory Statistics:
86
  [ALLOC_TEMP_Job.Worker 5]
87
  Initial Block Size 256.0 KB
88
  Current Block Size 256.0 KB
89
- Peak Allocated Bytes 0 B
90
  Overflow Count 0
91
  [ALLOC_TEMP_Background Job.Worker 14]
92
  Initial Block Size 32.0 KB
@@ -161,7 +161,7 @@ Memory Statistics:
161
  [ALLOC_TEMP_Job.Worker 2]
162
  Initial Block Size 256.0 KB
163
  Current Block Size 256.0 KB
164
- Peak Allocated Bytes 0.8 KB
165
  Overflow Count 0
166
  [ALLOC_TEMP_Background Job.Worker 3]
167
  Initial Block Size 32.0 KB
@@ -195,13 +195,13 @@ Memory Statistics:
195
  Used Block count 1
196
  Peak Allocated bytes 0.9 MB
197
  [ALLOC_DEFAULT_MAIN]
198
- Peak usage frame count: [4.0 MB-8.0 MB]: 3030 frames
199
  Requested Block Size 16.0 MB
200
  Peak Block count 1
201
  Peak Allocated memory 5.0 MB
202
  Peak Large allocation bytes 0 B
203
  [ALLOC_DEFAULT_THREAD]
204
- Peak usage frame count: [16.0 MB-32.0 MB]: 3030 frames
205
  Requested Block Size 16.0 MB
206
  Peak Block count 1
207
  Peak Allocated memory 17.3 MB
@@ -233,13 +233,13 @@ Memory Statistics:
233
  Used Block count 1
234
  Peak Allocated bytes 0.9 MB
235
  [ALLOC_GFX_MAIN]
236
- Peak usage frame count: [32.0 KB-64.0 KB]: 3029 frames, [64.0 KB-128.0 KB]: 1 frames
237
  Requested Block Size 16.0 MB
238
  Peak Block count 1
239
  Peak Allocated memory 65.6 KB
240
  Peak Large allocation bytes 0 B
241
  [ALLOC_GFX_THREAD]
242
- Peak usage frame count: [128.0 KB-256.0 KB]: 3030 frames
243
  Requested Block Size 16.0 MB
244
  Peak Block count 1
245
  Peak Allocated memory 173.6 KB
@@ -251,13 +251,13 @@ Memory Statistics:
251
  Used Block count 1
252
  Peak Allocated bytes 0.9 MB
253
  [ALLOC_CACHEOBJECTS_MAIN]
254
- Peak usage frame count: [0.5 MB-1.0 MB]: 3030 frames
255
  Requested Block Size 4.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 0.6 MB
258
  Peak Large allocation bytes 0 B
259
  [ALLOC_CACHEOBJECTS_THREAD]
260
- Peak usage frame count: [0.5 MB-1.0 MB]: 3029 frames, [2.0 MB-4.0 MB]: 1 frames
261
  Requested Block Size 4.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 3.2 MB
@@ -269,13 +269,13 @@ Memory Statistics:
269
  Used Block count 1
270
  Peak Allocated bytes 0.9 MB
271
  [ALLOC_TYPETREE_MAIN]
272
- Peak usage frame count: [0-1.0 KB]: 3030 frames
273
  Requested Block Size 2.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 1.0 KB
276
  Peak Large allocation bytes 0 B
277
  [ALLOC_TYPETREE_THREAD]
278
- Peak usage frame count: [1.0 KB-2.0 KB]: 3029 frames, [2.0 KB-4.0 KB]: 1 frames
279
  Requested Block Size 2.0 MB
280
  Peak Block count 1
281
  Peak Allocated memory 2.2 KB
 
9
  Renderer: Null Device
10
  Vendor: Unity Technologies
11
  Begin MonoManager ReloadAssembly
12
+ - Completed reload, in 0.096 seconds
13
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
14
  Microsoft Media Foundation video decoding to texture disabled: graphics device is Null, only Direct3D 11 and Direct3D 12 (only on desktop) are supported for hardware-accelerated video decoding.
15
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
35
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
36
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
37
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
38
+ UnloadTime: 0.682800 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
  Setting up 4 worker threads for Enlighten.
 
43
  [ALLOC_TEMP_TLS] TLS Allocator
44
  StackAllocators :
45
  [ALLOC_TEMP_MAIN]
46
+ Peak usage frame count: [8.0 KB-16.0 KB]: 37256 frames, [2.0 MB-4.0 MB]: 1 frames
47
  Initial Block Size 4.0 MB
48
  Current Block Size 4.0 MB
49
  Peak Allocated Bytes 2.0 MB
 
86
  [ALLOC_TEMP_Job.Worker 5]
87
  Initial Block Size 256.0 KB
88
  Current Block Size 256.0 KB
89
+ Peak Allocated Bytes 0.8 KB
90
  Overflow Count 0
91
  [ALLOC_TEMP_Background Job.Worker 14]
92
  Initial Block Size 32.0 KB
 
161
  [ALLOC_TEMP_Job.Worker 2]
162
  Initial Block Size 256.0 KB
163
  Current Block Size 256.0 KB
164
+ Peak Allocated Bytes 0 B
165
  Overflow Count 0
166
  [ALLOC_TEMP_Background Job.Worker 3]
167
  Initial Block Size 32.0 KB
 
195
  Used Block count 1
196
  Peak Allocated bytes 0.9 MB
197
  [ALLOC_DEFAULT_MAIN]
198
+ Peak usage frame count: [4.0 MB-8.0 MB]: 37257 frames
199
  Requested Block Size 16.0 MB
200
  Peak Block count 1
201
  Peak Allocated memory 5.0 MB
202
  Peak Large allocation bytes 0 B
203
  [ALLOC_DEFAULT_THREAD]
204
+ Peak usage frame count: [16.0 MB-32.0 MB]: 37257 frames
205
  Requested Block Size 16.0 MB
206
  Peak Block count 1
207
  Peak Allocated memory 17.3 MB
 
233
  Used Block count 1
234
  Peak Allocated bytes 0.9 MB
235
  [ALLOC_GFX_MAIN]
236
+ Peak usage frame count: [32.0 KB-64.0 KB]: 37256 frames, [64.0 KB-128.0 KB]: 1 frames
237
  Requested Block Size 16.0 MB
238
  Peak Block count 1
239
  Peak Allocated memory 65.6 KB
240
  Peak Large allocation bytes 0 B
241
  [ALLOC_GFX_THREAD]
242
+ Peak usage frame count: [128.0 KB-256.0 KB]: 37257 frames
243
  Requested Block Size 16.0 MB
244
  Peak Block count 1
245
  Peak Allocated memory 173.6 KB
 
251
  Used Block count 1
252
  Peak Allocated bytes 0.9 MB
253
  [ALLOC_CACHEOBJECTS_MAIN]
254
+ Peak usage frame count: [0.5 MB-1.0 MB]: 37257 frames
255
  Requested Block Size 4.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 0.6 MB
258
  Peak Large allocation bytes 0 B
259
  [ALLOC_CACHEOBJECTS_THREAD]
260
+ Peak usage frame count: [0.5 MB-1.0 MB]: 37256 frames, [2.0 MB-4.0 MB]: 1 frames
261
  Requested Block Size 4.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 3.2 MB
 
269
  Used Block count 1
270
  Peak Allocated bytes 0.9 MB
271
  [ALLOC_TYPETREE_MAIN]
272
+ Peak usage frame count: [0-1.0 KB]: 37257 frames
273
  Requested Block Size 2.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 1.0 KB
276
  Peak Large allocation bytes 0 B
277
  [ALLOC_TYPETREE_THREAD]
278
+ Peak usage frame count: [1.0 KB-2.0 KB]: 37256 frames, [2.0 KB-4.0 KB]: 1 frames
279
  Requested Block Size 2.0 MB
280
  Peak Block count 1
281
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,201 +2,201 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 2.1043341159820557,
6
- "min": 2.0979535579681396,
7
- "max": 2.1590776443481445,
8
- "count": 16
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 43972.1640625,
12
- "min": 26032.80859375,
13
- "max": 45091.49609375,
14
- "count": 16
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 59.036144578313255,
18
- "min": 43.96875,
19
- "max": 80.04838709677419,
20
- "count": 16
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 19600.0,
24
- "min": 11256.0,
25
- "max": 20152.0,
26
- "count": 16
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1371.4343926038857,
30
- "min": 1351.258794107496,
31
- "max": 1376.8250075552155,
32
- "count": 16
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 227658.10917224502,
36
- "min": 168379.3515789552,
37
- "max": 295067.20596112404,
38
- "count": 16
39
  },
40
  "SoccerTwos.Step.mean": {
41
- "value": 2589954.0,
42
- "min": 2439951.0,
43
- "max": 2589954.0,
44
- "count": 16
45
  },
46
  "SoccerTwos.Step.sum": {
47
- "value": 2589954.0,
48
- "min": 2439951.0,
49
- "max": 2589954.0,
50
- "count": 16
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": -0.0010260975686833262,
54
- "min": -0.042237937450408936,
55
- "max": 0.05772840976715088,
56
- "count": 16
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": -0.1703321933746338,
60
- "min": -7.180449485778809,
61
- "max": 10.557044982910156,
62
- "count": 16
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": -0.0008884711423888803,
66
- "min": -0.0447610504925251,
67
- "max": 0.06113218888640404,
68
- "count": 16
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": -0.14748620986938477,
72
- "min": -7.609378337860107,
73
- "max": 10.162272453308105,
74
- "count": 16
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
- "count": 16
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
- "count": 16
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": -0.08471084287367671,
90
- "min": -0.16729411903549643,
91
- "max": 0.12818064516590488,
92
- "count": 16
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": -14.061999917030334,
96
- "min": -28.440000236034393,
97
- "max": 20.809599995613098,
98
- "count": 16
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": -0.08471084287367671,
102
- "min": -0.16729411903549643,
103
- "max": 0.12818064516590488,
104
- "count": 16
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": -14.061999917030334,
108
- "min": -28.440000236034393,
109
- "max": 20.809599995613098,
110
- "count": 16
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
- "count": 16
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
- "count": 16
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.022567808740185918,
126
- "min": 0.019185953977284953,
127
- "max": 0.027850079436407046,
128
- "count": 15
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.022567808740185918,
132
- "min": 0.019185953977284953,
133
- "max": 0.027850079436407046,
134
- "count": 15
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.09001306472001253,
138
- "min": 0.08273657162984212,
139
- "max": 0.11319424932201703,
140
- "count": 15
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.09001306472001253,
144
- "min": 0.08273657162984212,
145
- "max": 0.11319424932201703,
146
- "count": 15
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.09164557605981827,
150
- "min": 0.0842846728861332,
151
- "max": 0.11616631199916204,
152
- "count": 15
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.09164557605981827,
156
- "min": 0.0842846728861332,
157
- "max": 0.11616631199916204,
158
- "count": 15
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.0003,
162
  "min": 0.0003,
163
  "max": 0.0003,
164
- "count": 15
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.0003,
168
  "min": 0.0003,
169
  "max": 0.0003,
170
- "count": 15
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
- "value": 0.20000000000000004,
174
- "min": 0.20000000000000004,
175
  "max": 0.20000000000000007,
176
- "count": 15
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
- "value": 0.20000000000000004,
180
- "min": 0.20000000000000004,
181
  "max": 0.20000000000000007,
182
- "count": 15
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
- "value": 0.005,
186
  "min": 0.005,
187
  "max": 0.005000000000000001,
188
- "count": 15
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
- "value": 0.005,
192
  "min": 0.005,
193
  "max": 0.005000000000000001,
194
- "count": 15
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1732088289",
200
  "python_version": "3.10.4 (tags/v3.10.4:9d38120, Mar 23 2022, 23:13:41) [MSC v.1929 64 bit (AMD64)]",
201
  "command_line_arguments": "D:\\python projects\\ml-agents\\venv\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --resume",
202
  "mlagents_version": "1.1.0",
@@ -204,103 +204,103 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.5.1+cpu",
206
  "numpy_version": "1.23.5",
207
- "end_time_seconds": "1732088761"
208
  },
209
- "total": 471.954658200033,
210
  "count": 1,
211
- "self": 4.281521999975666,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.3720814000116661,
215
  "count": 1,
216
- "self": 0.3720814000116661
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 467.3010548000457,
220
  "count": 1,
221
- "self": 0.2854381112847477,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 8.18414569995366,
225
- "count": 2,
226
- "self": 8.18414569995366
227
  },
228
  "TrainerController.advance": {
229
- "total": 458.6811532888096,
230
- "count": 11195,
231
- "self": 0.2861784966662526,
232
  "children": {
233
  "env_step": {
234
- "total": 207.8955141028855,
235
- "count": 11195,
236
- "self": 162.24072081502527,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 45.47821909491904,
240
- "count": 11195,
241
- "self": 1.5987130993744358,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 43.879505995544605,
245
- "count": 20198,
246
- "self": 43.879505995544605
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 0.1765741929411888,
252
- "count": 11194,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 461.4469671078259,
257
- "count": 11194,
258
  "is_parallel": true,
259
- "self": 330.1103191067232,
260
  "children": {
261
  "steps_from_proto": {
262
- "total": 0.002890500007197261,
263
- "count": 4,
264
  "is_parallel": true,
265
- "self": 0.0005716999294236302,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
- "total": 0.0023188000777736306,
269
- "count": 16,
270
  "is_parallel": true,
271
- "self": 0.0023188000777736306
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
- "total": 131.33375750109553,
277
- "count": 11194,
278
  "is_parallel": true,
279
- "self": 6.943547705188394,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
- "total": 5.550321500981227,
283
- "count": 11194,
284
  "is_parallel": true,
285
- "self": 5.550321500981227
286
  },
287
  "communicator.exchange": {
288
- "total": 98.2395213979762,
289
- "count": 11194,
290
  "is_parallel": true,
291
- "self": 98.2395213979762
292
  },
293
  "steps_from_proto": {
294
- "total": 20.60036689694971,
295
- "count": 22388,
296
  "is_parallel": true,
297
- "self": 4.042497379472479,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
- "total": 16.55786951747723,
301
- "count": 89552,
302
  "is_parallel": true,
303
- "self": 16.55786951747723
304
  }
305
  }
306
  }
@@ -313,31 +313,31 @@
313
  }
314
  },
315
  "trainer_advance": {
316
- "total": 250.49946068925783,
317
- "count": 11194,
318
- "self": 1.9064420951763168,
319
  "children": {
320
  "process_trajectory": {
321
- "total": 49.97855669434648,
322
- "count": 11194,
323
- "self": 49.55093809426762,
324
  "children": {
325
  "RLTrainer._checkpoint": {
326
- "total": 0.42761860007885844,
327
- "count": 1,
328
- "self": 0.42761860007885844
329
  }
330
  }
331
  },
332
  "_update_policy": {
333
- "total": 198.61446189973503,
334
- "count": 15,
335
- "self": 20.9438984983135,
336
  "children": {
337
  "TorchPOCAOptimizer.update": {
338
- "total": 177.67056340142153,
339
- "count": 438,
340
- "self": 177.67056340142153
341
  }
342
  }
343
  }
@@ -346,19 +346,19 @@
346
  }
347
  },
348
  "trainer_threads": {
349
- "total": 1.800013706088066e-06,
350
  "count": 1,
351
- "self": 1.800013706088066e-06
352
  },
353
  "TrainerController._save_models": {
354
- "total": 0.15031589998397976,
355
  "count": 1,
356
- "self": 0.002495500026270747,
357
  "children": {
358
  "RLTrainer._checkpoint": {
359
- "total": 0.14782039995770901,
360
  "count": 1,
361
- "self": 0.14782039995770901
362
  }
363
  }
364
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 1.5660171508789062,
6
+ "min": 1.5396820306777954,
7
+ "max": 1.880081295967102,
8
+ "count": 198
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 31320.34375,
12
+ "min": 29534.00390625,
13
+ "max": 41144.2421875,
14
+ "count": 198
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 63.835443037974684,
18
+ "min": 42.70175438596491,
19
+ "max": 84.71666666666667,
20
+ "count": 198
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 20172.0,
24
+ "min": 16128.0,
25
+ "max": 20528.0,
26
+ "count": 198
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1417.6097296242715,
30
+ "min": 1380.403699591196,
31
+ "max": 1456.4866303781612,
32
+ "count": 198
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 223982.3372806349,
36
+ "min": 167199.51708247018,
37
+ "max": 323254.78982444253,
38
+ "count": 198
39
  },
40
  "SoccerTwos.Step.mean": {
41
+ "value": 5529938.0,
42
+ "min": 3559972.0,
43
+ "max": 5529938.0,
44
+ "count": 198
45
  },
46
  "SoccerTwos.Step.sum": {
47
+ "value": 5529938.0,
48
+ "min": 3559972.0,
49
+ "max": 5529938.0,
50
+ "count": 198
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": -0.051855020225048065,
54
+ "min": -0.14628547430038452,
55
+ "max": 0.0822330117225647,
56
+ "count": 198
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": -8.193093299865723,
60
+ "min": -28.37938117980957,
61
+ "max": 16.035436630249023,
62
+ "count": 198
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": -0.042027898132801056,
66
+ "min": -0.1427212804555893,
67
+ "max": 0.08749193698167801,
68
+ "count": 198
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": -6.640408039093018,
72
+ "min": -27.68792724609375,
73
+ "max": 17.060928344726562,
74
+ "count": 198
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
+ "count": 198
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
+ "count": 198
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
+ "value": -0.09168860882143431,
90
+ "min": -0.3312575988769531,
91
+ "max": 0.3173333341425115,
92
+ "count": 198
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
+ "value": -14.486800193786621,
96
+ "min": -54.38579994440079,
97
+ "max": 52.360000133514404,
98
+ "count": 198
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
+ "value": -0.09168860882143431,
102
+ "min": -0.3312575988769531,
103
+ "max": 0.3173333341425115,
104
+ "count": 198
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
+ "value": -14.486800193786621,
108
+ "min": -54.38579994440079,
109
+ "max": 52.360000133514404,
110
+ "count": 198
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
+ "count": 198
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
+ "count": 198
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.026255231936617444,
126
+ "min": 0.01627497440543569,
127
+ "max": 0.03656857611301045,
128
+ "count": 191
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.026255231936617444,
132
+ "min": 0.01627497440543569,
133
+ "max": 0.03656857611301045,
134
+ "count": 191
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.09653884669144948,
138
+ "min": 0.07564474120736123,
139
+ "max": 0.12114908628993565,
140
+ "count": 191
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.09653884669144948,
144
+ "min": 0.07564474120736123,
145
+ "max": 0.12114908628993565,
146
+ "count": 191
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.10025102198123932,
150
+ "min": 0.07619098275899887,
151
+ "max": 0.1247354370576364,
152
+ "count": 191
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.10025102198123932,
156
+ "min": 0.07619098275899887,
157
+ "max": 0.1247354370576364,
158
+ "count": 191
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.0003,
162
  "min": 0.0003,
163
  "max": 0.0003,
164
+ "count": 191
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.0003,
168
  "min": 0.0003,
169
  "max": 0.0003,
170
+ "count": 191
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
+ "value": 0.20000000000000007,
174
+ "min": 0.2,
175
  "max": 0.20000000000000007,
176
+ "count": 191
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
+ "value": 0.20000000000000007,
180
+ "min": 0.2,
181
  "max": 0.20000000000000007,
182
+ "count": 191
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
+ "value": 0.005000000000000001,
186
  "min": 0.005,
187
  "max": 0.005000000000000001,
188
+ "count": 191
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
+ "value": 0.005000000000000001,
192
  "min": 0.005,
193
  "max": 0.005000000000000001,
194
+ "count": 191
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1732095102",
200
  "python_version": "3.10.4 (tags/v3.10.4:9d38120, Mar 23 2022, 23:13:41) [MSC v.1929 64 bit (AMD64)]",
201
  "command_line_arguments": "D:\\python projects\\ml-agents\\venv\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --resume",
202
  "mlagents_version": "1.1.0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.5.1+cpu",
206
  "numpy_version": "1.23.5",
207
+ "end_time_seconds": "1732101370"
208
  },
209
+ "total": 6268.3186942000175,
210
  "count": 1,
211
+ "self": 10.264327400014736,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.3097142999758944,
215
  "count": 1,
216
+ "self": 0.3097142999758944
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 6257.744652500027,
220
  "count": 1,
221
+ "self": 3.813153204973787,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 11.315755600109696,
225
+ "count": 11,
226
+ "self": 11.315755600109696
227
  },
228
  "TrainerController.advance": {
229
+ "total": 6242.059609094984,
230
+ "count": 137126,
231
+ "self": 3.7370750026311725,
232
  "children": {
233
  "env_step": {
234
+ "total": 2836.0991703160107,
235
+ "count": 137126,
236
+ "self": 2218.9756366901565,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 614.819088418386,
240
+ "count": 137126,
241
+ "self": 22.754441584693268,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 592.0646468336927,
245
+ "count": 248380,
246
+ "self": 592.0646468336927
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 2.304445207468234,
252
+ "count": 137125,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 6246.121647206368,
257
+ "count": 137125,
258
  "is_parallel": true,
259
+ "self": 4446.1522600069875,
260
  "children": {
261
  "steps_from_proto": {
262
+ "total": 0.020320799783803523,
263
+ "count": 22,
264
  "is_parallel": true,
265
+ "self": 0.0038775004213675857,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
+ "total": 0.016443299362435937,
269
+ "count": 88,
270
  "is_parallel": true,
271
+ "self": 0.016443299362435937
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
+ "total": 1799.9490663995966,
277
+ "count": 137125,
278
  "is_parallel": true,
279
+ "self": 95.17972115217708,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
+ "total": 73.22999456862453,
283
+ "count": 137125,
284
  "is_parallel": true,
285
+ "self": 73.22999456862453
286
  },
287
  "communicator.exchange": {
288
+ "total": 1345.3410510788672,
289
+ "count": 137125,
290
  "is_parallel": true,
291
+ "self": 1345.3410510788672
292
  },
293
  "steps_from_proto": {
294
+ "total": 286.19829959992785,
295
+ "count": 274250,
296
  "is_parallel": true,
297
+ "self": 55.273062570835464,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
+ "total": 230.9252370290924,
301
+ "count": 1097000,
302
  "is_parallel": true,
303
+ "self": 230.9252370290924
304
  }
305
  }
306
  }
 
313
  }
314
  },
315
  "trainer_advance": {
316
+ "total": 3402.223363776342,
317
+ "count": 137125,
318
+ "self": 25.176138061331585,
319
  "children": {
320
  "process_trajectory": {
321
+ "total": 673.8780544148758,
322
+ "count": 137125,
323
+ "self": 669.0686950148083,
324
  "children": {
325
  "RLTrainer._checkpoint": {
326
+ "total": 4.809359400067478,
327
+ "count": 4,
328
+ "self": 4.809359400067478
329
  }
330
  }
331
  },
332
  "_update_policy": {
333
+ "total": 2703.1691713001346,
334
+ "count": 191,
335
+ "self": 285.2503954063868,
336
  "children": {
337
  "TorchPOCAOptimizer.update": {
338
+ "total": 2417.918775893748,
339
+ "count": 5562,
340
+ "self": 2417.918775893748
341
  }
342
  }
343
  }
 
346
  }
347
  },
348
  "trainer_threads": {
349
+ "total": 1.200009137392044e-06,
350
  "count": 1,
351
+ "self": 1.200009137392044e-06
352
  },
353
  "TrainerController._save_models": {
354
+ "total": 0.5561333999503404,
355
  "count": 1,
356
+ "self": 0.2464682999998331,
357
  "children": {
358
  "RLTrainer._checkpoint": {
359
+ "total": 0.3096650999505073,
360
  "count": 1,
361
+ "self": 0.3096650999505073
362
  }
363
  }
364
  }
run_logs/training_status.json CHANGED
@@ -2,59 +2,59 @@
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
- "steps": 1500254,
6
- "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-1500254.onnx",
7
  "reward": 0.0,
8
- "creation_time": 1732083936.7681327,
9
  "auxillary_file_paths": [
10
- "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-1500254.pt"
11
  ]
12
  },
13
  {
14
- "steps": 1999918,
15
- "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-1999918.onnx",
16
  "reward": 0.0,
17
- "creation_time": 1732086538.8482232,
18
  "auxillary_file_paths": [
19
- "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-1999918.pt"
20
  ]
21
  },
22
  {
23
- "steps": 2434288,
24
- "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-2434288.onnx",
25
  "reward": 0.0,
26
- "creation_time": 1732087816.7232904,
27
  "auxillary_file_paths": [
28
- "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-2434288.pt"
29
  ]
30
  },
31
  {
32
- "steps": 2499994,
33
- "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-2499994.onnx",
34
  "reward": 0.0,
35
- "creation_time": 1732088478.368934,
36
  "auxillary_file_paths": [
37
- "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-2499994.pt"
38
  ]
39
  },
40
  {
41
- "steps": 2595280,
42
- "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-2595280.onnx",
43
  "reward": 0.0,
44
- "creation_time": 1732088757.6685371,
45
  "auxillary_file_paths": [
46
- "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-2595280.pt"
47
  ]
48
  }
49
  ],
50
- "elo": 1379.7441604815701,
51
  "final_checkpoint": {
52
- "steps": 2595280,
53
  "file_path": "results\\SoccerTwos\\SoccerTwos.onnx",
54
  "reward": 0.0,
55
- "creation_time": 1732088757.6685371,
56
  "auxillary_file_paths": [
57
- "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-2595280.pt"
58
  ]
59
  }
60
  },
 
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
+ "steps": 3999950,
6
+ "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-3999950.onnx",
7
  "reward": 0.0,
8
+ "creation_time": 1732096457.436601,
9
  "auxillary_file_paths": [
10
+ "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-3999950.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 4499944,
15
+ "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-4499944.onnx",
16
  "reward": 0.0,
17
+ "creation_time": 1732098011.4361103,
18
  "auxillary_file_paths": [
19
+ "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-4499944.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 4999939,
24
+ "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-4999939.onnx",
25
  "reward": 0.0,
26
+ "creation_time": 1732099649.0932033,
27
  "auxillary_file_paths": [
28
+ "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-4999939.pt"
29
  ]
30
  },
31
  {
32
+ "steps": 5499963,
33
+ "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-5499963.onnx",
34
  "reward": 0.0,
35
+ "creation_time": 1732101248.257919,
36
  "auxillary_file_paths": [
37
+ "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-5499963.pt"
38
  ]
39
  },
40
  {
41
+ "steps": 5533130,
42
+ "file_path": "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-5533130.onnx",
43
  "reward": 0.0,
44
+ "creation_time": 1732101360.1694858,
45
  "auxillary_file_paths": [
46
+ "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-5533130.pt"
47
  ]
48
  }
49
  ],
50
+ "elo": 1419.6992312865282,
51
  "final_checkpoint": {
52
+ "steps": 5533130,
53
  "file_path": "results\\SoccerTwos\\SoccerTwos.onnx",
54
  "reward": 0.0,
55
+ "creation_time": 1732101360.1694858,
56
  "auxillary_file_paths": [
57
+ "results\\SoccerTwos\\SoccerTwos\\SoccerTwos-5533130.pt"
58
  ]
59
  }
60
  },