duwi commited on
Commit
8066690
1 Parent(s): 22a5723

Second Push

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:077b92580214921e33c0632df5e9c0817aad84a947e12b8541a357fcd811df57
3
  size 1768746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc7a64b8b21374afcf71770bc32fb58f76e3b7fb9e71dafbf7aed2dd0aea5c50
3
  size 1768746
SoccerTwos/SoccerTwos-499576.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8505d98fffca9bd17b6d2ba85fb4b8ea7164758215ecc7d15bc25edf334010ad
3
+ size 1768746
SoccerTwos/SoccerTwos-499576.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be24ab8cf993523eed32bc6570d879856a72ec5e704f94e458e54d2b5c0d6ba1
3
+ size 28429781
SoccerTwos/SoccerTwos-601382.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc7a64b8b21374afcf71770bc32fb58f76e3b7fb9e71dafbf7aed2dd0aea5c50
3
+ size 1768746
SoccerTwos/SoccerTwos-601382.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e734da90a745f46935e55dec6d6e0c1a58c951fed71d8f562904b6b8e24c3602
3
+ size 28429781
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb343c5fd0dbf092d11958eeddf723ae17b2d9d462eebe032183e173cb9fa66a
3
  size 28428927
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c95dafcf7241ff671c4dfef898bf79c2c15a7886a99b1d52e7880bfc5c58cf16
3
  size 28428927
SoccerTwos/events.out.tfevents.1696602836.adf406a794a6.23505.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a26f87354ce1c93b579da12322d6e01109c259ab36d9debe82b7e87f2e89b71
3
+ size 435576
SoccerTwos/events.out.tfevents.1696606415.adf406a794a6.37829.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:909058cd1ef25c38238089552bb07bf4ae30c28ea906faaf74f90c1d84ec0b6d
3
+ size 1239
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "constant", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 50000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 200000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SoccerTwos.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "constant", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 600000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 200000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SoccerTwos.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -37,7 +37,7 @@ behaviors:
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
- max_steps: 50000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
@@ -72,8 +72,8 @@ checkpoint_settings:
72
  run_id: SoccerTwos
73
  initialize_from: null
74
  load_model: false
75
- resume: false
76
- force: true
77
  train_model: false
78
  inference: false
79
  results_dir: results
 
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
+ max_steps: 600000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
 
72
  run_id: SoccerTwos
73
  initialize_from: null
74
  load_model: false
75
+ resume: true
76
+ force: false
77
  train_model: false
78
  inference: false
79
  results_dir: results
run_logs/Player-0.log CHANGED
@@ -31,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
- - Completed reload, in 0.154 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -56,38 +56,16 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
56
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
57
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
58
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
59
- UnloadTime: 1.138678 ms
60
  Registered Communicator in Agent.
61
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
62
  requesting resize 84 x 84
63
- TOO LONG
64
- TOO LONG
65
- TOO LONG
66
- TOO LONG
67
- TOO LONG
68
- TOO LONG
69
- TOO LONG
70
- TOO LONG
71
- TOO LONG
72
- TOO LONG
73
- TOO LONG
74
- TOO LONG
75
- TOO LONG
76
- TOO LONG
77
- TOO LONG
78
- TOO LONG
79
- TOO LONG
80
- TOO LONG
81
- TOO LONG
82
- TOO LONG
83
- TOO LONG
84
- TOO LONG
85
  Setting up 1 worker threads for Enlighten.
86
  Memory Statistics:
87
  [ALLOC_TEMP_TLS] TLS Allocator
88
  StackAllocators :
89
  [ALLOC_TEMP_MAIN]
90
- Peak usage frame count: [8.0 KB-16.0 KB]: 1054 frames, [2.0 MB-4.0 MB]: 1 frames
91
  Initial Block Size 4.0 MB
92
  Current Block Size 4.0 MB
93
  Peak Allocated Bytes 2.1 MB
@@ -209,13 +187,13 @@ Memory Statistics:
209
  Used Block count 1
210
  Peak Allocated bytes 1.0 MB
211
  [ALLOC_DEFAULT_MAIN]
212
- Peak usage frame count: [4.0 MB-8.0 MB]: 1055 frames
213
  Requested Block Size 16.0 MB
214
  Peak Block count 1
215
- Peak Allocated memory 4.6 MB
216
  Peak Large allocation bytes 0 B
217
  [ALLOC_DEFAULT_THREAD]
218
- Peak usage frame count: [16.0 MB-32.0 MB]: 1055 frames
219
  Requested Block Size 16.0 MB
220
  Peak Block count 1
221
  Peak Allocated memory 17.6 MB
@@ -232,7 +210,7 @@ Memory Statistics:
232
  Overflow Count (full) 0
233
  [ALLOC_TEMP_JOB_4_FRAMES (JobTemp)]
234
  Initial Block Size 2.0 MB
235
- Used Block Count 2
236
  Overflow Count (too large) 0
237
  Overflow Count (full) 0
238
  [ALLOC_TEMP_JOB_ASYNC (Background)]
@@ -247,13 +225,13 @@ Memory Statistics:
247
  Used Block count 1
248
  Peak Allocated bytes 1.0 MB
249
  [ALLOC_GFX_MAIN]
250
- Peak usage frame count: [32.0 KB-64.0 KB]: 1054 frames, [64.0 KB-128.0 KB]: 1 frames
251
  Requested Block Size 16.0 MB
252
  Peak Block count 1
253
  Peak Allocated memory 65.6 KB
254
  Peak Large allocation bytes 0 B
255
  [ALLOC_GFX_THREAD]
256
- Peak usage frame count: [128.0 KB-256.0 KB]: 1055 frames
257
  Requested Block Size 16.0 MB
258
  Peak Block count 1
259
  Peak Allocated memory 173.5 KB
@@ -265,16 +243,16 @@ Memory Statistics:
265
  Used Block count 1
266
  Peak Allocated bytes 1.0 MB
267
  [ALLOC_CACHEOBJECTS_MAIN]
268
- Peak usage frame count: [0.5 MB-1.0 MB]: 1055 frames
269
  Requested Block Size 4.0 MB
270
  Peak Block count 1
271
  Peak Allocated memory 0.6 MB
272
  Peak Large allocation bytes 0 B
273
  [ALLOC_CACHEOBJECTS_THREAD]
274
- Peak usage frame count: [0.5 MB-1.0 MB]: 1054 frames, [4.0 MB-8.0 MB]: 1 frames
275
  Requested Block Size 4.0 MB
276
  Peak Block count 2
277
- Peak Allocated memory 4.5 MB
278
  Peak Large allocation bytes 0 B
279
  [ALLOC_TYPETREE] Dual Thread Allocator
280
  Peak main deferred allocation count 0
@@ -283,13 +261,13 @@ Memory Statistics:
283
  Used Block count 1
284
  Peak Allocated bytes 1.0 MB
285
  [ALLOC_TYPETREE_MAIN]
286
- Peak usage frame count: [0-1.0 KB]: 1055 frames
287
  Requested Block Size 2.0 MB
288
  Peak Block count 1
289
  Peak Allocated memory 1.0 KB
290
  Peak Large allocation bytes 0 B
291
  [ALLOC_TYPETREE_THREAD]
292
- Peak usage frame count: [1.0 KB-2.0 KB]: 1054 frames, [2.0 KB-4.0 KB]: 1 frames
293
  Requested Block Size 2.0 MB
294
  Peak Block count 1
295
  Peak Allocated memory 2.2 KB
 
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
+ - Completed reload, in 0.099 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
56
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
57
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
58
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
59
+ UnloadTime: 1.055459 ms
60
  Registered Communicator in Agent.
61
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
62
  requesting resize 84 x 84
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  Setting up 1 worker threads for Enlighten.
64
  Memory Statistics:
65
  [ALLOC_TEMP_TLS] TLS Allocator
66
  StackAllocators :
67
  [ALLOC_TEMP_MAIN]
68
+ Peak usage frame count: [2.0 MB-4.0 MB]: 1 frames
69
  Initial Block Size 4.0 MB
70
  Current Block Size 4.0 MB
71
  Peak Allocated Bytes 2.1 MB
 
187
  Used Block count 1
188
  Peak Allocated bytes 1.0 MB
189
  [ALLOC_DEFAULT_MAIN]
190
+ Peak usage frame count: [4.0 MB-8.0 MB]: 1 frames
191
  Requested Block Size 16.0 MB
192
  Peak Block count 1
193
+ Peak Allocated memory 4.5 MB
194
  Peak Large allocation bytes 0 B
195
  [ALLOC_DEFAULT_THREAD]
196
+ Peak usage frame count: [16.0 MB-32.0 MB]: 1 frames
197
  Requested Block Size 16.0 MB
198
  Peak Block count 1
199
  Peak Allocated memory 17.6 MB
 
210
  Overflow Count (full) 0
211
  [ALLOC_TEMP_JOB_4_FRAMES (JobTemp)]
212
  Initial Block Size 2.0 MB
213
+ Used Block Count 1
214
  Overflow Count (too large) 0
215
  Overflow Count (full) 0
216
  [ALLOC_TEMP_JOB_ASYNC (Background)]
 
225
  Used Block count 1
226
  Peak Allocated bytes 1.0 MB
227
  [ALLOC_GFX_MAIN]
228
+ Peak usage frame count: [64.0 KB-128.0 KB]: 1 frames
229
  Requested Block Size 16.0 MB
230
  Peak Block count 1
231
  Peak Allocated memory 65.6 KB
232
  Peak Large allocation bytes 0 B
233
  [ALLOC_GFX_THREAD]
234
+ Peak usage frame count: [128.0 KB-256.0 KB]: 1 frames
235
  Requested Block Size 16.0 MB
236
  Peak Block count 1
237
  Peak Allocated memory 173.5 KB
 
243
  Used Block count 1
244
  Peak Allocated bytes 1.0 MB
245
  [ALLOC_CACHEOBJECTS_MAIN]
246
+ Peak usage frame count: [0.5 MB-1.0 MB]: 1 frames
247
  Requested Block Size 4.0 MB
248
  Peak Block count 1
249
  Peak Allocated memory 0.6 MB
250
  Peak Large allocation bytes 0 B
251
  [ALLOC_CACHEOBJECTS_THREAD]
252
+ Peak usage frame count: [4.0 MB-8.0 MB]: 1 frames
253
  Requested Block Size 4.0 MB
254
  Peak Block count 2
255
+ Peak Allocated memory 4.0 MB
256
  Peak Large allocation bytes 0 B
257
  [ALLOC_TYPETREE] Dual Thread Allocator
258
  Peak main deferred allocation count 0
 
261
  Used Block count 1
262
  Peak Allocated bytes 1.0 MB
263
  [ALLOC_TYPETREE_MAIN]
264
+ Peak usage frame count: [0-1.0 KB]: 1 frames
265
  Requested Block Size 2.0 MB
266
  Peak Block count 1
267
  Peak Allocated memory 1.0 KB
268
  Peak Large allocation bytes 0 B
269
  [ALLOC_TYPETREE_THREAD]
270
+ Peak usage frame count: [2.0 KB-4.0 KB]: 1 frames
271
  Requested Block Size 2.0 MB
272
  Peak Block count 1
273
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -1,399 +1,50 @@
1
  {
2
  "name": "root",
3
- "gauges": {
4
- "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 3.2849185466766357,
6
- "min": 3.2822699546813965,
7
- "max": 3.2957403659820557,
8
- "count": 5
9
- },
10
- "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 54345.69140625,
12
- "min": 36568.9921875,
13
- "max": 120650.375,
14
- "count": 5
15
- },
16
- "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 629.3333333333334,
18
- "min": 629.3333333333334,
19
- "max": 999.0,
20
- "count": 5
21
- },
22
- "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 15104.0,
24
- "min": 11988.0,
25
- "max": 27384.0,
26
- "count": 5
27
- },
28
- "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1199.970800819546,
30
- "min": 1198.139685214751,
31
- "max": 1199.970800819546,
32
- "count": 4
33
- },
34
- "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 7199.824804917276,
36
- "min": 2399.6008352755034,
37
- "max": 9585.117481718007,
38
- "count": 4
39
- },
40
- "SoccerTwos.Step.mean": {
41
- "value": 49613.0,
42
- "min": 9926.0,
43
- "max": 49613.0,
44
- "count": 5
45
- },
46
- "SoccerTwos.Step.sum": {
47
- "value": 49613.0,
48
- "min": 9926.0,
49
- "max": 49613.0,
50
- "count": 5
51
- },
52
- "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": 0.07776747643947601,
54
- "min": 0.07776747643947601,
55
- "max": 0.10341869294643402,
56
- "count": 5
57
- },
58
- "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": 1.0887446403503418,
60
- "min": 0.8938918709754944,
61
- "max": 1.6546990871429443,
62
- "count": 5
63
- },
64
- "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": 0.07662778347730637,
66
- "min": 0.07662778347730637,
67
- "max": 0.10339052230119705,
68
- "count": 5
69
- },
70
- "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": 1.072788953781128,
72
- "min": 0.8882986903190613,
73
- "max": 1.6542176008224487,
74
- "count": 5
75
- },
76
- "SoccerTwos.Environment.CumulativeReward.mean": {
77
- "value": 0.0,
78
- "min": 0.0,
79
- "max": 0.0,
80
- "count": 5
81
- },
82
- "SoccerTwos.Environment.CumulativeReward.sum": {
83
- "value": 0.0,
84
- "min": 0.0,
85
- "max": 0.0,
86
- "count": 5
87
- },
88
- "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": -0.0006142897265298026,
90
- "min": -0.29465000331401825,
91
- "max": 0.10069090669805353,
92
- "count": 5
93
- },
94
- "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": -0.008600056171417236,
96
- "min": -4.714400053024292,
97
- "max": 1.1075999736785889,
98
- "count": 5
99
- },
100
- "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": -0.0006142897265298026,
102
- "min": -0.29465000331401825,
103
- "max": 0.10069090669805353,
104
- "count": 5
105
- },
106
- "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": -0.008600056171417236,
108
- "min": -4.714400053024292,
109
- "max": 1.1075999736785889,
110
- "count": 5
111
- },
112
- "SoccerTwos.IsTraining.mean": {
113
- "value": 1.0,
114
- "min": 1.0,
115
- "max": 1.0,
116
- "count": 5
117
- },
118
- "SoccerTwos.IsTraining.sum": {
119
- "value": 1.0,
120
- "min": 1.0,
121
- "max": 1.0,
122
- "count": 5
123
- },
124
- "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.01827663181272025,
126
- "min": 0.01827663181272025,
127
- "max": 0.018535127410561673,
128
- "count": 2
129
- },
130
- "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.01827663181272025,
132
- "min": 0.01827663181272025,
133
- "max": 0.018535127410561673,
134
- "count": 2
135
- },
136
- "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.0014572304925726106,
138
- "min": 0.0014572304925726106,
139
- "max": 0.004968332605332964,
140
- "count": 2
141
- },
142
- "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.0014572304925726106,
144
- "min": 0.0014572304925726106,
145
- "max": 0.004968332605332964,
146
- "count": 2
147
- },
148
- "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.001462098511789615,
150
- "min": 0.001462098511789615,
151
- "max": 0.004616912305613773,
152
- "count": 2
153
- },
154
- "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.001462098511789615,
156
- "min": 0.001462098511789615,
157
- "max": 0.004616912305613773,
158
- "count": 2
159
- },
160
- "SoccerTwos.Policy.LearningRate.mean": {
161
- "value": 0.0003,
162
- "min": 0.0003,
163
- "max": 0.0003,
164
- "count": 2
165
- },
166
- "SoccerTwos.Policy.LearningRate.sum": {
167
- "value": 0.0003,
168
- "min": 0.0003,
169
- "max": 0.0003,
170
- "count": 2
171
- },
172
- "SoccerTwos.Policy.Epsilon.mean": {
173
- "value": 0.20000000000000007,
174
- "min": 0.20000000000000004,
175
- "max": 0.20000000000000007,
176
- "count": 2
177
- },
178
- "SoccerTwos.Policy.Epsilon.sum": {
179
- "value": 0.20000000000000007,
180
- "min": 0.20000000000000004,
181
- "max": 0.20000000000000007,
182
- "count": 2
183
- },
184
- "SoccerTwos.Policy.Beta.mean": {
185
- "value": 0.005000000000000001,
186
- "min": 0.005000000000000001,
187
- "max": 0.005000000000000001,
188
- "count": 2
189
- },
190
- "SoccerTwos.Policy.Beta.sum": {
191
- "value": 0.005000000000000001,
192
- "min": 0.005000000000000001,
193
- "max": 0.005000000000000001,
194
- "count": 2
195
- }
196
- },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1696601341",
200
  "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
201
- "command_line_arguments": "/usr/local/bin/mlagents-learn ./SoccerTwos.yaml --env=./training-envs-executables/linux/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
202
  "mlagents_version": "0.31.0.dev0",
203
  "mlagents_envs_version": "0.31.0.dev0",
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.0.1+cu118",
206
  "numpy_version": "1.21.2",
207
- "end_time_seconds": "1696601675"
208
  },
209
- "total": 333.77662798599977,
210
  "count": 1,
211
- "self": 0.4779327979995287,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.09646322800017515,
215
  "count": 1,
216
- "self": 0.09646322800017515
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 333.20223196000006,
220
  "count": 1,
221
- "self": 0.16315604495594016,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 1.379666351999731,
225
  "count": 1,
226
- "self": 1.379666351999731
227
- },
228
- "TrainerController.advance": {
229
- "total": 331.4088556190445,
230
- "count": 3536,
231
- "self": 0.20539585004735272,
232
- "children": {
233
- "env_step": {
234
- "total": 142.37804969698027,
235
- "count": 3536,
236
- "self": 114.59354260094551,
237
- "children": {
238
- "SubprocessEnvManager._take_step": {
239
- "total": 27.685866596002597,
240
- "count": 3536,
241
- "self": 1.316916077021233,
242
- "children": {
243
- "TorchPolicy.evaluate": {
244
- "total": 26.368950518981364,
245
- "count": 7034,
246
- "self": 26.368950518981364
247
- }
248
- }
249
- },
250
- "workers": {
251
- "total": 0.09864050003216107,
252
- "count": 3536,
253
- "self": 0.0,
254
- "children": {
255
- "worker_root": {
256
- "total": 331.7274617339681,
257
- "count": 3536,
258
- "is_parallel": true,
259
- "self": 237.67229141499047,
260
- "children": {
261
- "run_training.setup": {
262
- "total": 0.0,
263
- "count": 0,
264
- "is_parallel": true,
265
- "self": 0.0,
266
- "children": {
267
- "steps_from_proto": {
268
- "total": 0.006192820000251231,
269
- "count": 2,
270
- "is_parallel": true,
271
- "self": 0.001473469999837107,
272
- "children": {
273
- "_process_rank_one_or_two_observation": {
274
- "total": 0.004719350000414124,
275
- "count": 8,
276
- "is_parallel": true,
277
- "self": 0.004719350000414124
278
- }
279
- }
280
- },
281
- "UnityEnvironment.step": {
282
- "total": 0.11690096400070615,
283
- "count": 1,
284
- "is_parallel": true,
285
- "self": 0.0015231720008159755,
286
- "children": {
287
- "UnityEnvironment._generate_step_input": {
288
- "total": 0.0010221030006505316,
289
- "count": 1,
290
- "is_parallel": true,
291
- "self": 0.0010221030006505316
292
- },
293
- "communicator.exchange": {
294
- "total": 0.10395117400003073,
295
- "count": 1,
296
- "is_parallel": true,
297
- "self": 0.10395117400003073
298
- },
299
- "steps_from_proto": {
300
- "total": 0.010404514999208914,
301
- "count": 2,
302
- "is_parallel": true,
303
- "self": 0.003400746999432158,
304
- "children": {
305
- "_process_rank_one_or_two_observation": {
306
- "total": 0.0070037679997767555,
307
- "count": 8,
308
- "is_parallel": true,
309
- "self": 0.0070037679997767555
310
- }
311
- }
312
- }
313
- }
314
- }
315
- }
316
- },
317
- "UnityEnvironment.step": {
318
- "total": 94.05517031897762,
319
- "count": 3535,
320
- "is_parallel": true,
321
- "self": 6.599305579941756,
322
- "children": {
323
- "UnityEnvironment._generate_step_input": {
324
- "total": 3.2360494990043662,
325
- "count": 3535,
326
- "is_parallel": true,
327
- "self": 3.2360494990043662
328
- },
329
- "communicator.exchange": {
330
- "total": 65.80380868402062,
331
- "count": 3535,
332
- "is_parallel": true,
333
- "self": 65.80380868402062
334
- },
335
- "steps_from_proto": {
336
- "total": 18.41600655601087,
337
- "count": 7070,
338
- "is_parallel": true,
339
- "self": 3.534552065990283,
340
- "children": {
341
- "_process_rank_one_or_two_observation": {
342
- "total": 14.881454490020587,
343
- "count": 28280,
344
- "is_parallel": true,
345
- "self": 14.881454490020587
346
- }
347
- }
348
- }
349
- }
350
- }
351
- }
352
- }
353
- }
354
- }
355
- }
356
- },
357
- "trainer_advance": {
358
- "total": 188.8254100720169,
359
- "count": 3536,
360
- "self": 1.1613369650240202,
361
- "children": {
362
- "process_trajectory": {
363
- "total": 25.060931144992537,
364
- "count": 3536,
365
- "self": 25.060931144992537
366
- },
367
- "_update_policy": {
368
- "total": 162.60314196200034,
369
- "count": 2,
370
- "self": 14.102124521005862,
371
- "children": {
372
- "TorchPOCAOptimizer.update": {
373
- "total": 148.50101744099447,
374
- "count": 66,
375
- "self": 148.50101744099447
376
- }
377
- }
378
- }
379
- }
380
- }
381
- }
382
  },
383
  "trainer_threads": {
384
- "total": 1.2900000001536682e-06,
385
  "count": 1,
386
- "self": 1.2900000001536682e-06
387
  },
388
  "TrainerController._save_models": {
389
- "total": 0.2505526539998755,
390
  "count": 1,
391
- "self": 0.002800123999804782,
392
  "children": {
393
  "RLTrainer._checkpoint": {
394
- "total": 0.2477525300000707,
395
  "count": 1,
396
- "self": 0.2477525300000707
397
  }
398
  }
399
  }
 
1
  {
2
  "name": "root",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "metadata": {
4
  "timer_format_version": "0.1.0",
5
+ "start_time_seconds": "1696606414",
6
  "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
7
+ "command_line_arguments": "/usr/local/bin/mlagents-learn ./SoccerTwos.yaml --env=./training-envs-executables/linux/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
8
  "mlagents_version": "0.31.0.dev0",
9
  "mlagents_envs_version": "0.31.0.dev0",
10
  "communication_protocol_version": "1.5.0",
11
  "pytorch_version": "2.0.1+cu118",
12
  "numpy_version": "1.21.2",
13
+ "end_time_seconds": "1696606417"
14
  },
15
+ "total": 3.1464899069997045,
16
  "count": 1,
17
+ "self": 1.3063794559984672,
18
  "children": {
19
  "run_training.setup": {
20
+ "total": 0.0578642470009072,
21
  "count": 1,
22
+ "self": 0.0578642470009072
23
  },
24
  "TrainerController.start_learning": {
25
+ "total": 1.7822462040003302,
26
  "count": 1,
27
+ "self": 0.0002163680001103785,
28
  "children": {
29
  "TrainerController._reset_env": {
30
+ "total": 1.3604172539999126,
31
  "count": 1,
32
+ "self": 1.3604172539999126
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  },
34
  "trainer_threads": {
35
+ "total": 1.9889994291588664e-06,
36
  "count": 1,
37
+ "self": 1.9889994291588664e-06
38
  },
39
  "TrainerController._save_models": {
40
+ "total": 0.421610593000878,
41
  "count": 1,
42
+ "self": 0.003257940001276438,
43
  "children": {
44
  "RLTrainer._checkpoint": {
45
+ "total": 0.41835265299960156,
46
  "count": 1,
47
+ "self": 0.41835265299960156
48
  }
49
  }
50
  }
run_logs/training_status.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "SoccerTwos": {
3
- "elo": 1201.0544577894468,
4
  "checkpoints": [
5
  {
6
  "steps": 50092,
@@ -10,15 +10,42 @@
10
  "auxillary_file_paths": [
11
  "results/SoccerTwos/SoccerTwos/SoccerTwos-50092.pt"
12
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  }
14
  ],
15
  "final_checkpoint": {
16
- "steps": 50092,
17
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
18
- "reward": 0.0,
19
- "creation_time": 1696601674.8342452,
20
  "auxillary_file_paths": [
21
- "results/SoccerTwos/SoccerTwos/SoccerTwos-50092.pt"
22
  ]
23
  }
24
  },
 
1
  {
2
  "SoccerTwos": {
3
+ "elo": 1224.542007813142,
4
  "checkpoints": [
5
  {
6
  "steps": 50092,
 
10
  "auxillary_file_paths": [
11
  "results/SoccerTwos/SoccerTwos/SoccerTwos-50092.pt"
12
  ]
13
+ },
14
+ {
15
+ "steps": 499576,
16
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-499576.onnx",
17
+ "reward": 0.0,
18
+ "creation_time": 1696605803.2668495,
19
+ "auxillary_file_paths": [
20
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-499576.pt"
21
+ ]
22
+ },
23
+ {
24
+ "steps": 601382,
25
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-601382.onnx",
26
+ "reward": 0.0,
27
+ "creation_time": 1696606405.8739417,
28
+ "auxillary_file_paths": [
29
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-601382.pt"
30
+ ]
31
+ },
32
+ {
33
+ "steps": 601382,
34
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-601382.onnx",
35
+ "reward": null,
36
+ "creation_time": 1696606416.505571,
37
+ "auxillary_file_paths": [
38
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-601382.pt"
39
+ ]
40
  }
41
  ],
42
  "final_checkpoint": {
43
+ "steps": 601382,
44
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
45
+ "reward": null,
46
+ "creation_time": 1696606416.505571,
47
  "auxillary_file_paths": [
48
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-601382.pt"
49
  ]
50
  }
51
  },