Statos6 committed on
Commit
f5c5d35
1 Parent(s): 3c53f01

Retrained to 10M steps with a higher play_against_latest_model_ratio (0.75 instead of approximately 0.24). This helped the model learn to play defense better.

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c574606e5c1839061cdb7dc9b76863444295b5b91caccfc413a1ed077ee8c3f
3
  size 895526
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b6d608c4248e0b310070b2af2b4ea2275b174aeed4ae07c4b7ff7524ee580d5
3
  size 895526
SoccerTwos/SoccerTwos-10000046.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b6d608c4248e0b310070b2af2b4ea2275b174aeed4ae07c4b7ff7524ee580d5
3
+ size 895526
SoccerTwos/SoccerTwos-10000046.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7da542e5ed006a647545f746b09a40c9006d9b32927ef30a3ab22b48f7c7775c
3
+ size 10325290
SoccerTwos/SoccerTwos-8499978.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6c0ccf92cff2ea1b32b49e95f6a42b5d63affc6f5ee79e658cd79776696d523
3
+ size 895526
SoccerTwos/SoccerTwos-8499978.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eecdb844b9847844a5be6db79e351f3711605e9c42b7cc03ab11b57b62e7522f
3
+ size 10325138
SoccerTwos/SoccerTwos-8999988.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19f45f7b592496e18ff616e19a9a276b8269eba93055ddb4f2a1d24b6e414b20
3
+ size 895526
SoccerTwos/SoccerTwos-8999988.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cde9c9d152dc7cce4fe5a93171548d2a7f8103247bc932b061a6e0c7faf43c7
3
+ size 10325138
SoccerTwos/SoccerTwos-9499993.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b6772ba57d0dda936a1b86cfe6c1d0da4bff2be72cdf1a8289ac94f43aaa77f
3
+ size 895526
SoccerTwos/SoccerTwos-9499993.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:811ca51769e17fef7d09824811d17d0e7b4823ff3e3459cf4dcdd9fa5753c134
3
+ size 10325138
SoccerTwos/SoccerTwos-9999982.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ae6b4d8b9bce2651e6142580cdc5b4625eb01736ba52eb9ab6a952a964b862c
3
+ size 895526
SoccerTwos/SoccerTwos-9999982.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5a6a4d7f4080efe31a06dc37491f39b98ca4223b9ab7f31f785bfefb6ccfb1f
3
+ size 10325138
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:008145e1e808608cc93b4d650ceaa479d23cc271324dee6c3b01906b96fa84f6
3
  size 10323922
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37854fa1cf62607fbcf6e1fa3522fdc3890a2084987edc894f3955253d66549d
3
  size 10323922
SoccerTwos/events.out.tfevents.1710341962.stephan-ms7c02.29905.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4328e8cf67a012d3b679ca03e83f9101e4827d554072a1d9dde86d2717a0992a
3
+ size 661583
SoccerTwos/events.out.tfevents.1710343832.stephan-ms7c02.33144.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97512bb4824eae2e636aac4106b752ef6109d681e20d6fc75355ec92b3a0529f
3
+ size 3405815
SoccerTwos_orig/SoccerTwos-4999994.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be96c3872475cc25d67472685bc2fee156427488a3c08e79bd28cf6c98213a94
3
+ size 895526
SoccerTwos_orig/SoccerTwos-4999994.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71e54f36b571a60d1bd3474e5ee403ddc02aa6aafcd1c007e1272b0fa33cbfd8
3
+ size 10325138
SoccerTwos_orig/SoccerTwos-5000026.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23416b67a78fe350c105debeb7be130b546d1ca99633a6d58b7b2ab627bdac15
3
+ size 895526
SoccerTwos_orig/SoccerTwos-5000026.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef0aa7a1f48d9f4164990361bc247cd36df0a533121533f0cdf22a25adfb7189
3
+ size 10325138
SoccerTwos_orig/SoccerTwos-5499990.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ee5c6c1bdaa2e03dd5acac35279c5a077f98827615be82d01ca79d646f2847f
3
+ size 895526
SoccerTwos_orig/SoccerTwos-5499990.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1b631e6e474edfbd6397a6a173d3a36a447960b4e996fe4f72efd68936a6196
3
+ size 10325138
SoccerTwos_orig/SoccerTwos-5999976.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56acb86e98bacbe50d2c8305c10c4bcb279131ff4c1359ef6245cccfed56cd97
3
+ size 895526
SoccerTwos_orig/SoccerTwos-5999976.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c17aec0f05d051f9f1c6ca2db48529936e5c49c6978ab68abb2f1a5a9dbc004a
3
+ size 10325138
SoccerTwos_orig/SoccerTwos-6000104.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c574606e5c1839061cdb7dc9b76863444295b5b91caccfc413a1ed077ee8c3f
3
+ size 895526
SoccerTwos_orig/SoccerTwos-6000104.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccaa39ff525af5de7c6578077964314fe8b52d503f9fd6cb8fa52b144355b61b
3
+ size 10325138
SoccerTwos_orig/checkpoint.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:008145e1e808608cc93b4d650ceaa479d23cc271324dee6c3b01906b96fa84f6
3
+ size 10323922
SoccerTwos_orig/events.out.tfevents.1710290777.stephan-ms7c02.14283.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:921364813e102c784e2b1fe10a218e4108aaf0c18241e88faad09085f782460c
3
+ size 4854988
SoccerTwos_orig/events.out.tfevents.1710333085.stephan-ms7c02.24579.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cd4e31cb3abbb0f4426bddd18591f073816db885a8bc2560ff7951c70d47284
3
+ size 1017522
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 4096, "buffer_size": 65536, "learning_rate": 0.0004345843188705317, "beta": 0.00019215097636640332, "epsilon": 0.15831928707038231, "lambd": 0.9467147291117369, "num_epoch": 5, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 256, "num_layers": 3, "vis_encode_type": "fully_connected", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.9608227414353802, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 6000000, "time_horizon": 32, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 60000, "team_change": 589998, "swap_steps": 70000, "window": 25, "play_against_latest_model_ratio": 0.2427456302841774, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./ml-agents/training-envs-executables/SoccerTwos.exe", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 1280, "height": 720, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": false, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos-read-deal", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 4096, "buffer_size": 65536, "learning_rate": 0.0004345843188705317, "beta": 0.00019215097636640332, "epsilon": 0.15831928707038231, "lambd": 0.9467147291117369, "num_epoch": 5, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 256, "num_layers": 3, "vis_encode_type": "fully_connected", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.9608227414353802, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 10000000, "time_horizon": 32, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 60000, "team_change": 589998, "swap_steps": 70000, "window": 25, "play_against_latest_model_ratio": 0.75, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./ml-agents/training-envs-executables/SoccerTwos.exe", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 1280, "height": 720, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": false, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos-read-deal", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -37,7 +37,7 @@ behaviors:
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
- max_steps: 6000000
41
  time_horizon: 32
42
  summary_freq: 10000
43
  threaded: false
@@ -46,7 +46,7 @@ behaviors:
46
  team_change: 589998
47
  swap_steps: 70000
48
  window: 25
49
- play_against_latest_model_ratio: 0.2427456302841774
50
  initial_elo: 1200.0
51
  behavioral_cloning: null
52
  env_settings:
 
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
+ max_steps: 10000000
41
  time_horizon: 32
42
  summary_freq: 10000
43
  threaded: false
 
46
  team_change: 589998
47
  swap_steps: 70000
48
  window: 25
49
+ play_against_latest_model_ratio: 0.75
50
  initial_elo: 1200.0
51
  behavioral_cloning: null
52
  env_settings:
run_logs/Player-0.log CHANGED
@@ -19,14 +19,14 @@ ns GL_ARB_stencil_texturing GL_ARB_sync GL_ARB_tessellation_shader GL_ARB_textur
19
  _buffer_object GL_ARB_vertex_shader GL_ARB_vertex_type_10f_11f_11f_rev GL_ARB_vertex_type_2_10_10_10_rev GL_ARB_viewport_array GL_ATI_blend_equation_separate GL_ATI_meminfo GL_ATI_texture_float GL_ATI_texture_mirror_once GL_EXT_EGL_image_storage GL_EXT_EGL_sync GL_EXT_abgr GL_EXT_blend_equation_separate GL_EXT_debug_label GL_EXT_demote_to_helper_invocation GL_EXT_depth_bounds_test GL_EXT_draw_buffers2 GL_EXT_draw_instanced GL_EXT_framebuffer_blit GL_EXT_framebuffer_multisample GL_EXT_framebuffer_multisample_blit_scaled GL_EXT_framebuffer_object GL_EXT_framebuffer_sRGB GL_EXT_memory_object GL_EXT_memory_object_fd GL_EXT_packed_depth_stencil GL_EXT_packed_float GL_EXT_pixel_buffer_object GL_EXT_polygon_offset_clamp GL_EXT_provoking_vertex GL_EXT_semaphore GL_EXT_semaphore_fd GL_EXT_shader_image_load_formatted GL_EXT_shader_image_load_store GL_EXT_shader_integer_mix GL_EXT_shader_samples_identical GL_EXT_texture_array GL_EXT_texture_compression_dxt1 GL_EXT_texture_compression_rgtc GL_EXT_texture_compression_s3t
20
  c GL_EXT_texture_filter_anisotropic GL_EXT_texture_integer GL_EXT_texture_mirror_clamp GL_EXT_texture_sRGB GL_EXT_texture_sRGB_R8 GL_EXT_texture_sRGB_decode GL_EXT_texture_shadow_lod GL_EXT_texture_shared_exponent GL_EXT_texture_snorm GL_EXT_texture_swizzle GL_EXT_timer_query GL_EXT_transform_feedback GL_EXT_vertex_array_bgra GL_EXT_vertex_attrib_64bit GL_EXT_window_rectangles GL_IBM_multimode_draw_arrays GL_INTEL_blackhole_render GL_KHR_blend_equation_advanced GL_KHR_context_flush_control GL_KHR_debug GL_KHR_no_error GL_KHR_parallel_shader_compile GL_KHR_robust_buffer_access_behavior GL_KHR_robustness GL_KHR_texture_compression_astc_ldr GL_KHR_texture_compression_astc_sliced_3d GL_MESA_framebuffer_flip_y GL_MESA_pack_invert GL_MESA_shader_integer_functions GL_MESA_texture_const_bandwidth GL_MESA_texture_signed_rgba GL_NVX_gpu_memory_info GL_NV_alpha_to_coverage_dither_control GL_NV_compute_shader_derivatives GL_NV_conditional_render GL_NV_copy_image GL_NV_depth_clamp GL_NV_packed_depth_stencil GL_NV_shader_
21
  atomic_int64 GL_NV_texture_barrier GL_NV_vdpau_interop GL_OES_EGL_image GL_S3_s3tc
22
- OPENGL LOG: Creating OpenGL 4.6 graphics device ; Context level <OpenGL 4.5> ; Context handle 16352240
23
  Begin MonoManager ReloadAssembly
24
- - Completed reload, in 0.083 seconds
25
  Default vsync count 1
26
  requesting resize 1280 x 720
27
  resizing window to 1280 x 720
28
  Desktop is 1920 x 1080 @ 60 Hz
29
- UnloadTime: 0.827430 ms
30
  Registered Communicator in Agent.
31
  Setting up 6 worker threads for Enlighten.
32
  requesting resize 1280 x 720
@@ -36,7 +36,7 @@ Memory Statistics:
36
  [ALLOC_TEMP_TLS] TLS Allocator
37
  StackAllocators :
38
  [ALLOC_TEMP_MAIN]
39
- Peak usage frame count: [8.0 KB-16.0 KB]: 18758 frames, [2.0 MB-4.0 MB]: 1 frames
40
  Initial Block Size 4.0 MB
41
  Current Block Size 4.0 MB
42
  Peak Allocated Bytes 2.1 MB
@@ -211,18 +211,18 @@ Memory Statistics:
211
  [ALLOC_BUCKET]
212
  Large Block size 4.0 MB
213
  Used Block count 1
214
- Peak Allocated bytes 2.0 MB
215
  [ALLOC_DEFAULT_MAIN]
216
- Peak usage frame count: [8.0 MB-16.0 MB]: 18759 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
  Peak Allocated memory 13.0 MB
220
  Peak Large allocation bytes 0 B
221
  [ALLOC_DEFAULT_THREAD]
222
- Peak usage frame count: [16.0 MB-32.0 MB]: 18759 frames
223
  Requested Block Size 16.0 MB
224
  Peak Block count 1
225
- Peak Allocated memory 29.1 MB
226
  Peak Large allocation bytes 16.0 MB
227
  [ALLOC_TEMP_JOB_1_FRAME]
228
  Initial Block Size 2.0 MB
@@ -249,15 +249,15 @@ Memory Statistics:
249
  [ALLOC_BUCKET]
250
  Large Block size 4.0 MB
251
  Used Block count 1
252
- Peak Allocated bytes 2.0 MB
253
  [ALLOC_GFX_MAIN]
254
- Peak usage frame count: [32.0 KB-64.0 KB]: 18758 frames, [2.0 MB-4.0 MB]: 1 frames
255
  Requested Block Size 16.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 2.7 MB
258
  Peak Large allocation bytes 0 B
259
  [ALLOC_GFX_THREAD]
260
- Peak usage frame count: [128.0 KB-256.0 KB]: 18759 frames
261
  Requested Block Size 16.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 174.7 KB
@@ -267,15 +267,15 @@ Memory Statistics:
267
  [ALLOC_BUCKET]
268
  Large Block size 4.0 MB
269
  Used Block count 1
270
- Peak Allocated bytes 2.0 MB
271
  [ALLOC_CACHEOBJECTS_MAIN]
272
- Peak usage frame count: [0.5 MB-1.0 MB]: 18758 frames, [1.0 MB-2.0 MB]: 1 frames
273
  Requested Block Size 4.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 1.2 MB
276
  Peak Large allocation bytes 0 B
277
  [ALLOC_CACHEOBJECTS_THREAD]
278
- Peak usage frame count: [4.0 MB-8.0 MB]: 18759 frames
279
  Requested Block Size 4.0 MB
280
  Peak Block count 2
281
  Peak Allocated memory 7.8 MB
@@ -285,15 +285,15 @@ Memory Statistics:
285
  [ALLOC_BUCKET]
286
  Large Block size 4.0 MB
287
  Used Block count 1
288
- Peak Allocated bytes 2.0 MB
289
  [ALLOC_TYPETREE_MAIN]
290
- Peak usage frame count: [0-1.0 KB]: 18759 frames
291
  Requested Block Size 2.0 MB
292
  Peak Block count 1
293
  Peak Allocated memory 1.0 KB
294
  Peak Large allocation bytes 0 B
295
  [ALLOC_TYPETREE_THREAD]
296
- Peak usage frame count: [1.0 KB-2.0 KB]: 18758 frames, [2.0 KB-4.0 KB]: 1 frames
297
  Requested Block Size 2.0 MB
298
  Peak Block count 1
299
  Peak Allocated memory 2.2 KB
 
19
  _buffer_object GL_ARB_vertex_shader GL_ARB_vertex_type_10f_11f_11f_rev GL_ARB_vertex_type_2_10_10_10_rev GL_ARB_viewport_array GL_ATI_blend_equation_separate GL_ATI_meminfo GL_ATI_texture_float GL_ATI_texture_mirror_once GL_EXT_EGL_image_storage GL_EXT_EGL_sync GL_EXT_abgr GL_EXT_blend_equation_separate GL_EXT_debug_label GL_EXT_demote_to_helper_invocation GL_EXT_depth_bounds_test GL_EXT_draw_buffers2 GL_EXT_draw_instanced GL_EXT_framebuffer_blit GL_EXT_framebuffer_multisample GL_EXT_framebuffer_multisample_blit_scaled GL_EXT_framebuffer_object GL_EXT_framebuffer_sRGB GL_EXT_memory_object GL_EXT_memory_object_fd GL_EXT_packed_depth_stencil GL_EXT_packed_float GL_EXT_pixel_buffer_object GL_EXT_polygon_offset_clamp GL_EXT_provoking_vertex GL_EXT_semaphore GL_EXT_semaphore_fd GL_EXT_shader_image_load_formatted GL_EXT_shader_image_load_store GL_EXT_shader_integer_mix GL_EXT_shader_samples_identical GL_EXT_texture_array GL_EXT_texture_compression_dxt1 GL_EXT_texture_compression_rgtc GL_EXT_texture_compression_s3t
20
  c GL_EXT_texture_filter_anisotropic GL_EXT_texture_integer GL_EXT_texture_mirror_clamp GL_EXT_texture_sRGB GL_EXT_texture_sRGB_R8 GL_EXT_texture_sRGB_decode GL_EXT_texture_shadow_lod GL_EXT_texture_shared_exponent GL_EXT_texture_snorm GL_EXT_texture_swizzle GL_EXT_timer_query GL_EXT_transform_feedback GL_EXT_vertex_array_bgra GL_EXT_vertex_attrib_64bit GL_EXT_window_rectangles GL_IBM_multimode_draw_arrays GL_INTEL_blackhole_render GL_KHR_blend_equation_advanced GL_KHR_context_flush_control GL_KHR_debug GL_KHR_no_error GL_KHR_parallel_shader_compile GL_KHR_robust_buffer_access_behavior GL_KHR_robustness GL_KHR_texture_compression_astc_ldr GL_KHR_texture_compression_astc_sliced_3d GL_MESA_framebuffer_flip_y GL_MESA_pack_invert GL_MESA_shader_integer_functions GL_MESA_texture_const_bandwidth GL_MESA_texture_signed_rgba GL_NVX_gpu_memory_info GL_NV_alpha_to_coverage_dither_control GL_NV_compute_shader_derivatives GL_NV_conditional_render GL_NV_copy_image GL_NV_depth_clamp GL_NV_packed_depth_stencil GL_NV_shader_
21
  atomic_int64 GL_NV_texture_barrier GL_NV_vdpau_interop GL_OES_EGL_image GL_S3_s3tc
22
+ OPENGL LOG: Creating OpenGL 4.6 graphics device ; Context level <OpenGL 4.5> ; Context handle 22053744
23
  Begin MonoManager ReloadAssembly
24
+ - Completed reload, in 0.092 seconds
25
  Default vsync count 1
26
  requesting resize 1280 x 720
27
  resizing window to 1280 x 720
28
  Desktop is 1920 x 1080 @ 60 Hz
29
+ UnloadTime: 0.807040 ms
30
  Registered Communicator in Agent.
31
  Setting up 6 worker threads for Enlighten.
32
  requesting resize 1280 x 720
 
36
  [ALLOC_TEMP_TLS] TLS Allocator
37
  StackAllocators :
38
  [ALLOC_TEMP_MAIN]
39
+ Peak usage frame count: [8.0 KB-16.0 KB]: 62727 frames, [2.0 MB-4.0 MB]: 1 frames
40
  Initial Block Size 4.0 MB
41
  Current Block Size 4.0 MB
42
  Peak Allocated Bytes 2.1 MB
 
211
  [ALLOC_BUCKET]
212
  Large Block size 4.0 MB
213
  Used Block count 1
214
+ Peak Allocated bytes 1.9 MB
215
  [ALLOC_DEFAULT_MAIN]
216
+ Peak usage frame count: [8.0 MB-16.0 MB]: 62728 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
  Peak Allocated memory 13.0 MB
220
  Peak Large allocation bytes 0 B
221
  [ALLOC_DEFAULT_THREAD]
222
+ Peak usage frame count: [16.0 MB-32.0 MB]: 62728 frames
223
  Requested Block Size 16.0 MB
224
  Peak Block count 1
225
+ Peak Allocated memory 28.7 MB
226
  Peak Large allocation bytes 16.0 MB
227
  [ALLOC_TEMP_JOB_1_FRAME]
228
  Initial Block Size 2.0 MB
 
249
  [ALLOC_BUCKET]
250
  Large Block size 4.0 MB
251
  Used Block count 1
252
+ Peak Allocated bytes 1.9 MB
253
  [ALLOC_GFX_MAIN]
254
+ Peak usage frame count: [32.0 KB-64.0 KB]: 62727 frames, [2.0 MB-4.0 MB]: 1 frames
255
  Requested Block Size 16.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 2.7 MB
258
  Peak Large allocation bytes 0 B
259
  [ALLOC_GFX_THREAD]
260
+ Peak usage frame count: [128.0 KB-256.0 KB]: 62728 frames
261
  Requested Block Size 16.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 174.7 KB
 
267
  [ALLOC_BUCKET]
268
  Large Block size 4.0 MB
269
  Used Block count 1
270
+ Peak Allocated bytes 1.9 MB
271
  [ALLOC_CACHEOBJECTS_MAIN]
272
+ Peak usage frame count: [0.5 MB-1.0 MB]: 62727 frames, [1.0 MB-2.0 MB]: 1 frames
273
  Requested Block Size 4.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 1.2 MB
276
  Peak Large allocation bytes 0 B
277
  [ALLOC_CACHEOBJECTS_THREAD]
278
+ Peak usage frame count: [4.0 MB-8.0 MB]: 62728 frames
279
  Requested Block Size 4.0 MB
280
  Peak Block count 2
281
  Peak Allocated memory 7.8 MB
 
285
  [ALLOC_BUCKET]
286
  Large Block size 4.0 MB
287
  Used Block count 1
288
+ Peak Allocated bytes 1.9 MB
289
  [ALLOC_TYPETREE_MAIN]
290
+ Peak usage frame count: [0-1.0 KB]: 62728 frames
291
  Requested Block Size 2.0 MB
292
  Peak Block count 1
293
  Peak Allocated memory 1.0 KB
294
  Peak Large allocation bytes 0 B
295
  [ALLOC_TYPETREE_THREAD]
296
+ Peak usage frame count: [1.0 KB-2.0 KB]: 62727 frames, [2.0 KB-4.0 KB]: 1 frames
297
  Requested Block Size 2.0 MB
298
  Peak Block count 1
299
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,201 +2,201 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 1.778828501701355,
6
- "min": 1.7496646642684937,
7
- "max": 1.904069185256958,
8
- "count": 100
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 35690.4140625,
12
- "min": 34937.3046875,
13
- "max": 38751.6171875,
14
- "count": 100
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 43.51754385964912,
18
- "min": 38.792,
19
- "max": 53.82022471910113,
20
- "count": 100
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 19844.0,
24
- "min": 18336.0,
25
- "max": 20936.0,
26
- "count": 100
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1561.460064375993,
30
- "min": 1519.7251303553944,
31
- "max": 1561.4942652168481,
32
- "count": 100
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 356012.8946777264,
36
- "min": 273814.30154407705,
37
- "max": 390373.566304212,
38
- "count": 100
39
  },
40
  "SoccerTwos.Step.mean": {
41
- "value": 5999976.0,
42
- "min": 5009984.0,
43
- "max": 5999976.0,
44
- "count": 100
45
  },
46
  "SoccerTwos.Step.sum": {
47
- "value": 5999976.0,
48
- "min": 5009984.0,
49
- "max": 5999976.0,
50
- "count": 100
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": 0.036884572356939316,
54
- "min": -0.06633567065000534,
55
- "max": 0.09457974880933762,
56
- "count": 100
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": 15.380867004394531,
60
- "min": -27.06495475769043,
61
- "max": 38.872276306152344,
62
- "count": 100
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": 0.03724776208400726,
66
- "min": -0.06787735223770142,
67
- "max": 0.09511835128068924,
68
- "count": 100
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": 15.532317161560059,
72
- "min": -27.693960189819336,
73
- "max": 39.09364318847656,
74
- "count": 100
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
- "count": 100
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
- "count": 100
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": 0.04650350934580753,
90
- "min": -0.2562914263634455,
91
- "max": 0.2151981968063492,
92
- "count": 100
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": 10.602800130844116,
96
- "min": -53.82119953632355,
97
- "max": 47.77399969100952,
98
- "count": 100
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": 0.04650350934580753,
102
- "min": -0.2562914263634455,
103
- "max": 0.2151981968063492,
104
- "count": 100
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": 10.602800130844116,
108
- "min": -53.82119953632355,
109
- "max": 47.77399969100952,
110
- "count": 100
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
- "count": 100
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
- "count": 100
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.014634914088446749,
126
- "min": 0.010371605570253451,
127
- "max": 0.014634914088446749,
128
- "count": 15
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.014634914088446749,
132
- "min": 0.010371605570253451,
133
- "max": 0.014634914088446749,
134
- "count": 15
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.051349658705294135,
138
- "min": 0.048586570238694546,
139
- "max": 0.05451308977790177,
140
- "count": 15
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.051349658705294135,
144
- "min": 0.048586570238694546,
145
- "max": 0.05451308977790177,
146
- "count": 15
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.0515909023117274,
150
- "min": 0.04938719081692398,
151
- "max": 0.054688979778438805,
152
- "count": 15
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.0515909023117274,
156
- "min": 0.04938719081692398,
157
- "max": 0.054688979778438805,
158
- "count": 15
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
- "value": 1.1853560262662174e-06,
162
- "min": 1.1853560262662174e-06,
163
- "max": 6.767456859236319e-05,
164
- "count": 15
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
- "value": 1.1853560262662174e-06,
168
- "min": 1.1853560262662174e-06,
169
- "max": 6.767456859236319e-05,
170
- "count": 15
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
- "value": 0.1001590561356033,
174
- "min": 0.1001590561356033,
175
- "max": 0.10908161546093645,
176
- "count": 15
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
- "value": 0.1001590561356033,
180
- "min": 0.1001590561356033,
181
- "max": 0.10908161546093645,
182
- "count": 15
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
- "value": 1.04967864295433e-05,
186
- "min": 1.04967864295433e-05,
187
- "max": 3.8364975058721184e-05,
188
- "count": 15
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
- "value": 1.04967864295433e-05,
192
- "min": 1.04967864295433e-05,
193
- "max": 3.8364975058721184e-05,
194
- "count": 15
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1710333081",
200
  "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
201
  "command_line_arguments": "/home/stephan/.conda/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos-read-deal --width=1280 --height=720 --resume",
202
  "mlagents_version": "1.1.0.dev0",
@@ -204,59 +204,59 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.2.1+cu121",
206
  "numpy_version": "1.23.5",
207
- "end_time_seconds": "1710335865"
208
  },
209
- "total": 2783.08172296299,
210
  "count": 1,
211
- "self": 0.3221229049813701,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.017381374011165462,
215
  "count": 1,
216
- "self": 0.017381374011165462
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 2782.7422186839976,
220
  "count": 1,
221
- "self": 1.4529281045834068,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 4.399289562992635,
225
- "count": 3,
226
- "self": 4.399289562992635
227
  },
228
  "TrainerController.advance": {
229
- "total": 2776.7682698464196,
230
- "count": 71154,
231
- "self": 1.2270896326372167,
232
  "children": {
233
  "env_step": {
234
- "total": 1269.4150066098955,
235
- "count": 71154,
236
- "self": 1077.1618315594678,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 191.40557155759598,
240
- "count": 71154,
241
- "self": 5.71247391810175,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 185.69309763949423,
245
- "count": 125058,
246
- "self": 185.69309763949423
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 0.8476034928316949,
252
- "count": 71154,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 2780.0714288110757,
257
- "count": 71154,
258
  "is_parallel": true,
259
- "self": 1856.7726158039295,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
@@ -265,48 +265,48 @@
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
- "total": 0.06613134100916795,
269
  "count": 2,
270
  "is_parallel": true,
271
- "self": 0.00047555101627949625,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
- "total": 0.06565578999288846,
275
  "count": 8,
276
  "is_parallel": true,
277
- "self": 0.06565578999288846
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
- "total": 0.031780133009306155,
283
  "count": 1,
284
  "is_parallel": true,
285
- "self": 0.0006475910049630329,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
- "total": 0.0005751600110670552,
289
  "count": 1,
290
  "is_parallel": true,
291
- "self": 0.0005751600110670552
292
  },
293
  "communicator.exchange": {
294
- "total": 0.02851476900104899,
295
  "count": 1,
296
  "is_parallel": true,
297
- "self": 0.02851476900104899
298
  },
299
  "steps_from_proto": {
300
- "total": 0.0020426129922270775,
301
  "count": 2,
302
  "is_parallel": true,
303
- "self": 0.0004071999865118414,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
- "total": 0.001635413005715236,
307
  "count": 8,
308
  "is_parallel": true,
309
- "self": 0.001635413005715236
310
  }
311
  }
312
  }
@@ -315,48 +315,48 @@
315
  }
316
  },
317
  "steps_from_proto": {
318
- "total": 0.003298083000117913,
319
- "count": 4,
320
  "is_parallel": true,
321
- "self": 0.0005663799965986982,
322
  "children": {
323
  "_process_rank_one_or_two_observation": {
324
- "total": 0.0027317030035192147,
325
- "count": 16,
326
  "is_parallel": true,
327
- "self": 0.0027317030035192147
328
  }
329
  }
330
  },
331
  "UnityEnvironment.step": {
332
- "total": 923.2955149241461,
333
- "count": 71153,
334
  "is_parallel": true,
335
- "self": 50.94944198477606,
336
  "children": {
337
  "UnityEnvironment._generate_step_input": {
338
- "total": 31.86183314715163,
339
- "count": 71153,
340
  "is_parallel": true,
341
- "self": 31.86183314715163
342
  },
343
  "communicator.exchange": {
344
- "total": 713.6419240085379,
345
- "count": 71153,
346
  "is_parallel": true,
347
- "self": 713.6419240085379
348
  },
349
  "steps_from_proto": {
350
- "total": 126.84231578368053,
351
- "count": 142306,
352
  "is_parallel": true,
353
- "self": 22.54734104256204,
354
  "children": {
355
  "_process_rank_one_or_two_observation": {
356
- "total": 104.2949747411185,
357
- "count": 569224,
358
  "is_parallel": true,
359
- "self": 104.2949747411185
360
  }
361
  }
362
  }
@@ -369,31 +369,31 @@
369
  }
370
  },
371
  "trainer_advance": {
372
- "total": 1506.1261736038869,
373
- "count": 71154,
374
- "self": 8.044354920290061,
375
  "children": {
376
  "process_trajectory": {
377
- "total": 323.5915293196158,
378
- "count": 71154,
379
- "self": 323.3412643446063,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
- "total": 0.2502649750094861,
383
- "count": 2,
384
- "self": 0.2502649750094861
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
- "total": 1174.490289363981,
390
- "count": 15,
391
- "self": 185.54603042497183,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
- "total": 988.9442589390092,
395
- "count": 1200,
396
- "self": 988.9442589390092
397
  }
398
  }
399
  }
@@ -402,19 +402,19 @@
402
  }
403
  },
404
  "trainer_threads": {
405
- "total": 8.600036380812526e-07,
406
  "count": 1,
407
- "self": 8.600036380812526e-07
408
  },
409
  "TrainerController._save_models": {
410
- "total": 0.12173030999838375,
411
  "count": 1,
412
- "self": 0.002498182002454996,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
- "total": 0.11923212799592875,
416
  "count": 1,
417
- "self": 0.11923212799592875
418
  }
419
  }
420
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 1.4048619270324707,
6
+ "min": 1.3750499486923218,
7
+ "max": 1.7051565647125244,
8
+ "count": 335
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 28277.060546875,
12
+ "min": 14701.9814453125,
13
+ "max": 34322.671875,
14
+ "count": 335
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 45.06422018348624,
18
+ "min": 35.125,
19
+ "max": 53.40425531914894,
20
+ "count": 335
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 19648.0,
24
+ "min": 8072.0,
25
+ "max": 20960.0,
26
+ "count": 335
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1607.9046472284606,
30
+ "min": 1555.6832652825399,
31
+ "max": 1613.038356436412,
32
+ "count": 335
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 350523.2130958044,
36
+ "min": 163654.2453609866,
37
+ "max": 434134.2547516843,
38
+ "count": 335
39
  },
40
  "SoccerTwos.Step.mean": {
41
+ "value": 9999982.0,
42
+ "min": 6659988.0,
43
+ "max": 9999982.0,
44
+ "count": 335
45
  },
46
  "SoccerTwos.Step.sum": {
47
+ "value": 9999982.0,
48
+ "min": 6659988.0,
49
+ "max": 9999982.0,
50
+ "count": 335
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": 0.03223046660423279,
54
+ "min": -0.11106479167938232,
55
+ "max": 0.10332842171192169,
56
+ "count": 335
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": 13.246722221374512,
60
+ "min": -46.31401824951172,
61
+ "max": 44.017906188964844,
62
+ "count": 335
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": 0.031953852623701096,
66
+ "min": -0.11250180751085281,
67
+ "max": 0.10477326810359955,
68
+ "count": 335
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": 13.133033752441406,
72
+ "min": -46.91325378417969,
73
+ "max": 44.6334114074707,
74
+ "count": 335
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
+ "count": 335
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
+ "count": 335
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
+ "value": 0.09531192604554903,
90
+ "min": -0.381275439994377,
91
+ "max": 0.26663347656634745,
92
+ "count": 335
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
+ "value": 20.777999877929688,
96
+ "min": -86.93080031871796,
97
+ "max": 62.125600039958954,
98
+ "count": 335
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
+ "value": 0.09531192604554903,
102
+ "min": -0.381275439994377,
103
+ "max": 0.26663347656634745,
104
+ "count": 335
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
+ "value": 20.777999877929688,
108
+ "min": -86.93080031871796,
109
+ "max": 62.125600039958954,
110
+ "count": 335
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
+ "count": 335
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
+ "count": 335
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.01046212162455049,
126
+ "min": 0.009879295097471185,
127
+ "max": 0.014559235423075734,
128
+ "count": 51
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.01046212162455049,
132
+ "min": 0.009879295097471185,
133
+ "max": 0.014559235423075734,
134
+ "count": 51
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.05891079842112958,
138
+ "min": 0.04971672408282757,
139
+ "max": 0.05918900854885578,
140
+ "count": 51
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.05891079842112958,
144
+ "min": 0.04971672408282757,
145
+ "max": 0.05918900854885578,
146
+ "count": 51
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.05924153439700604,
150
+ "min": 0.051102403877303006,
151
+ "max": 0.05954511137679219,
152
+ "count": 51
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.05924153439700604,
156
+ "min": 0.051102403877303006,
157
+ "max": 0.05954511137679219,
158
+ "count": 51
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
+ "value": 6.4449295954992225e-09,
162
+ "min": 6.4449295954992225e-09,
163
+ "max": 0.00014248644558948728,
164
+ "count": 51
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
+ "value": 6.4449295954992225e-09,
168
+ "min": 6.4449295954992225e-09,
169
+ "max": 0.00014248644558948728,
170
+ "count": 51
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
+ "value": 0.10000085146159124,
174
+ "min": 0.10000085146159124,
175
+ "max": 0.11912103967704953,
176
+ "count": 51
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
+ "value": 0.10000085146159124,
180
+ "min": 0.10000085146159124,
181
+ "max": 0.11912103967704953,
182
+ "count": 51
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
+ "value": 1.0002659404254946e-05,
186
+ "min": 1.0002659404254946e-05,
187
+ "max": 6.972151274949521e-05,
188
+ "count": 51
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
+ "value": 1.0002659404254946e-05,
192
+ "min": 1.0002659404254946e-05,
193
+ "max": 6.972151274949521e-05,
194
+ "count": 51
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1710343829",
200
  "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
201
  "command_line_arguments": "/home/stephan/.conda/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos-read-deal --width=1280 --height=720 --resume",
202
  "mlagents_version": "1.1.0.dev0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.2.1+cu121",
206
  "numpy_version": "1.23.5",
207
+ "end_time_seconds": "1710353568"
208
  },
209
+ "total": 9739.254863360999,
210
  "count": 1,
211
+ "self": 0.270132729987381,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.018506341002648696,
215
  "count": 1,
216
+ "self": 0.018506341002648696
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 9738.966224290009,
220
  "count": 1,
221
+ "self": 4.652608350283117,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 4.244304390012985,
225
+ "count": 7,
226
+ "self": 4.244304390012985
227
  },
228
  "TrainerController.advance": {
229
+ "total": 9729.947026144713,
230
+ "count": 239073,
231
+ "self": 4.148107524248189,
232
  "children": {
233
  "env_step": {
234
+ "total": 4354.3673745146225,
235
+ "count": 239073,
236
+ "self": 3721.0493522615725,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 630.4299217515072,
240
+ "count": 239073,
241
+ "self": 19.02124206413282,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 611.4086796873744,
245
+ "count": 418182,
246
+ "self": 611.4086796873744
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 2.8881005015427945,
252
+ "count": 239073,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 9731.739510110943,
257
+ "count": 239073,
258
  "is_parallel": true,
259
+ "self": 6533.360267171403,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
 
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
+ "total": 0.06389564499841072,
269
  "count": 2,
270
  "is_parallel": true,
271
+ "self": 0.000593470991589129,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
+ "total": 0.06330217400682159,
275
  "count": 8,
276
  "is_parallel": true,
277
+ "self": 0.06330217400682159
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
+ "total": 0.02612613000383135,
283
  "count": 1,
284
  "is_parallel": true,
285
+ "self": 0.000600070008658804,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
+ "total": 0.00040655999328009784,
289
  "count": 1,
290
  "is_parallel": true,
291
+ "self": 0.00040655999328009784
292
  },
293
  "communicator.exchange": {
294
+ "total": 0.02343449799809605,
295
  "count": 1,
296
  "is_parallel": true,
297
+ "self": 0.02343449799809605
298
  },
299
  "steps_from_proto": {
300
+ "total": 0.0016850020037963986,
301
  "count": 2,
302
  "is_parallel": true,
303
+ "self": 0.0003057300054933876,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
+ "total": 0.001379271998303011,
307
  "count": 8,
308
  "is_parallel": true,
309
+ "self": 0.001379271998303011
310
  }
311
  }
312
  }
 
315
  }
316
  },
317
  "steps_from_proto": {
318
+ "total": 0.012151043978519738,
319
+ "count": 12,
320
  "is_parallel": true,
321
+ "self": 0.002059131977148354,
322
  "children": {
323
  "_process_rank_one_or_two_observation": {
324
+ "total": 0.010091912001371384,
325
+ "count": 48,
326
  "is_parallel": true,
327
+ "self": 0.010091912001371384
328
  }
329
  }
330
  },
331
  "UnityEnvironment.step": {
332
+ "total": 3198.3670918955613,
333
+ "count": 239072,
334
  "is_parallel": true,
335
+ "self": 175.16570653802773,
336
  "children": {
337
  "UnityEnvironment._generate_step_input": {
338
+ "total": 110.43290661888022,
339
+ "count": 239072,
340
  "is_parallel": true,
341
+ "self": 110.43290661888022
342
  },
343
  "communicator.exchange": {
344
+ "total": 2470.8126502879313,
345
+ "count": 239072,
346
  "is_parallel": true,
347
+ "self": 2470.8126502879313
348
  },
349
  "steps_from_proto": {
350
+ "total": 441.95582845072204,
351
+ "count": 478144,
352
  "is_parallel": true,
353
+ "self": 78.3687699053844,
354
  "children": {
355
  "_process_rank_one_or_two_observation": {
356
+ "total": 363.58705854533764,
357
+ "count": 1912576,
358
  "is_parallel": true,
359
+ "self": 363.58705854533764
360
  }
361
  }
362
  }
 
369
  }
370
  },
371
  "trainer_advance": {
372
+ "total": 5371.4315441058425,
373
+ "count": 239073,
374
+ "self": 26.83088273082103,
375
  "children": {
376
  "process_trajectory": {
377
+ "total": 1094.2377518599678,
378
+ "count": 239073,
379
+ "self": 1093.3974272879568,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
+ "total": 0.8403245720110135,
383
+ "count": 7,
384
+ "self": 0.8403245720110135
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
+ "total": 4250.362909515054,
390
+ "count": 51,
391
+ "self": 652.032682771809,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
+ "total": 3598.3302267432446,
395
+ "count": 4080,
396
+ "self": 3598.3302267432446
397
  }
398
  }
399
  }
 
402
  }
403
  },
404
  "trainer_threads": {
405
+ "total": 9.200011845678091e-07,
406
  "count": 1,
407
+ "self": 9.200011845678091e-07
408
  },
409
  "TrainerController._save_models": {
410
+ "total": 0.12228448499809019,
411
  "count": 1,
412
+ "self": 0.0026952329935738817,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
+ "total": 0.11958925200451631,
416
  "count": 1,
417
+ "self": 0.11958925200451631
418
  }
419
  }
420
  }
run_logs/training_status.json CHANGED
@@ -2,59 +2,59 @@
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
- "steps": 4999994,
6
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-4999994.onnx",
7
  "reward": 0.0,
8
- "creation_time": 1710305448.3632262,
9
  "auxillary_file_paths": [
10
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-4999994.pt"
11
  ]
12
  },
13
  {
14
- "steps": 5000026,
15
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-5000026.onnx",
16
  "reward": 0.0,
17
- "creation_time": 1710305448.48951,
18
  "auxillary_file_paths": [
19
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-5000026.pt"
20
  ]
21
  },
22
  {
23
- "steps": 5499990,
24
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-5499990.onnx",
25
  "reward": 0.0,
26
- "creation_time": 1710334432.864333,
27
  "auxillary_file_paths": [
28
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-5499990.pt"
29
  ]
30
  },
31
  {
32
- "steps": 5999976,
33
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-5999976.onnx",
34
- "reward": 0.0,
35
- "creation_time": 1710335864.5550687,
36
  "auxillary_file_paths": [
37
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-5999976.pt"
38
  ]
39
  },
40
  {
41
- "steps": 6000104,
42
- "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-6000104.onnx",
43
- "reward": 0.0,
44
- "creation_time": 1710335864.7100072,
45
  "auxillary_file_paths": [
46
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-6000104.pt"
47
  ]
48
  }
49
  ],
50
- "elo": 1561.4600643759927,
51
  "final_checkpoint": {
52
- "steps": 6000104,
53
  "file_path": "results/SoccerTwos-read-deal/SoccerTwos.onnx",
54
- "reward": 0.0,
55
- "creation_time": 1710335864.7100072,
56
  "auxillary_file_paths": [
57
- "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-6000104.pt"
58
  ]
59
  }
60
  },
 
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
+ "steps": 8499978,
6
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8499978.onnx",
7
  "reward": 0.0,
8
+ "creation_time": 1710349255.752344,
9
  "auxillary_file_paths": [
10
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8499978.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 8999988,
15
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8999988.onnx",
16
  "reward": 0.0,
17
+ "creation_time": 1710350638.0742688,
18
  "auxillary_file_paths": [
19
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8999988.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 9499993,
24
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9499993.onnx",
25
  "reward": 0.0,
26
+ "creation_time": 1710352100.153916,
27
  "auxillary_file_paths": [
28
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9499993.pt"
29
  ]
30
  },
31
  {
32
+ "steps": 9999982,
33
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9999982.onnx",
34
+ "reward": null,
35
+ "creation_time": 1710353568.109763,
36
  "auxillary_file_paths": [
37
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9999982.pt"
38
  ]
39
  },
40
  {
41
+ "steps": 10000046,
42
+ "file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.onnx",
43
+ "reward": null,
44
+ "creation_time": 1710353568.2486105,
45
  "auxillary_file_paths": [
46
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.pt"
47
  ]
48
  }
49
  ],
50
+ "elo": 1607.9046472284606,
51
  "final_checkpoint": {
52
+ "steps": 10000046,
53
  "file_path": "results/SoccerTwos-read-deal/SoccerTwos.onnx",
54
+ "reward": null,
55
+ "creation_time": 1710353568.2486105,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.pt"
58
  ]
59
  }
60
  },