Retrained to 10M steps with a higher play_against_latest_model_ratio (0.75 instead of 0.25); this helped the model learn to play defense better.
Browse files
- SoccerTwos.onnx +1 -1
- SoccerTwos/SoccerTwos-10000046.onnx +3 -0
- SoccerTwos/SoccerTwos-10000046.pt +3 -0
- SoccerTwos/SoccerTwos-8499978.onnx +3 -0
- SoccerTwos/SoccerTwos-8499978.pt +3 -0
- SoccerTwos/SoccerTwos-8999988.onnx +3 -0
- SoccerTwos/SoccerTwos-8999988.pt +3 -0
- SoccerTwos/SoccerTwos-9499993.onnx +3 -0
- SoccerTwos/SoccerTwos-9499993.pt +3 -0
- SoccerTwos/SoccerTwos-9999982.onnx +3 -0
- SoccerTwos/SoccerTwos-9999982.pt +3 -0
- SoccerTwos/checkpoint.pt +1 -1
- SoccerTwos/events.out.tfevents.1710341962.stephan-ms7c02.29905.0 +3 -0
- SoccerTwos/events.out.tfevents.1710343832.stephan-ms7c02.33144.0 +3 -0
- SoccerTwos_orig/SoccerTwos-4999994.onnx +3 -0
- SoccerTwos_orig/SoccerTwos-4999994.pt +3 -0
- SoccerTwos_orig/SoccerTwos-5000026.onnx +3 -0
- SoccerTwos_orig/SoccerTwos-5000026.pt +3 -0
- SoccerTwos_orig/SoccerTwos-5499990.onnx +3 -0
- SoccerTwos_orig/SoccerTwos-5499990.pt +3 -0
- SoccerTwos_orig/SoccerTwos-5999976.onnx +3 -0
- SoccerTwos_orig/SoccerTwos-5999976.pt +3 -0
- SoccerTwos_orig/SoccerTwos-6000104.onnx +3 -0
- SoccerTwos_orig/SoccerTwos-6000104.pt +3 -0
- SoccerTwos_orig/checkpoint.pt +3 -0
- SoccerTwos_orig/events.out.tfevents.1710290777.stephan-ms7c02.14283.0 +3 -0
- SoccerTwos_orig/events.out.tfevents.1710333085.stephan-ms7c02.24579.0 +3 -0
- config.json +1 -1
- configuration.yaml +2 -2
- run_logs/Player-0.log +17 -17
- run_logs/timers.json +200 -200
- run_logs/training_status.json +27 -27
SoccerTwos.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 895526
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b6d608c4248e0b310070b2af2b4ea2275b174aeed4ae07c4b7ff7524ee580d5
|
3 |
size 895526
|
SoccerTwos/SoccerTwos-10000046.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b6d608c4248e0b310070b2af2b4ea2275b174aeed4ae07c4b7ff7524ee580d5
|
3 |
+
size 895526
|
SoccerTwos/SoccerTwos-10000046.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7da542e5ed006a647545f746b09a40c9006d9b32927ef30a3ab22b48f7c7775c
|
3 |
+
size 10325290
|
SoccerTwos/SoccerTwos-8499978.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6c0ccf92cff2ea1b32b49e95f6a42b5d63affc6f5ee79e658cd79776696d523
|
3 |
+
size 895526
|
SoccerTwos/SoccerTwos-8499978.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eecdb844b9847844a5be6db79e351f3711605e9c42b7cc03ab11b57b62e7522f
|
3 |
+
size 10325138
|
SoccerTwos/SoccerTwos-8999988.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19f45f7b592496e18ff616e19a9a276b8269eba93055ddb4f2a1d24b6e414b20
|
3 |
+
size 895526
|
SoccerTwos/SoccerTwos-8999988.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cde9c9d152dc7cce4fe5a93171548d2a7f8103247bc932b061a6e0c7faf43c7
|
3 |
+
size 10325138
|
SoccerTwos/SoccerTwos-9499993.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b6772ba57d0dda936a1b86cfe6c1d0da4bff2be72cdf1a8289ac94f43aaa77f
|
3 |
+
size 895526
|
SoccerTwos/SoccerTwos-9499993.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:811ca51769e17fef7d09824811d17d0e7b4823ff3e3459cf4dcdd9fa5753c134
|
3 |
+
size 10325138
|
SoccerTwos/SoccerTwos-9999982.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ae6b4d8b9bce2651e6142580cdc5b4625eb01736ba52eb9ab6a952a964b862c
|
3 |
+
size 895526
|
SoccerTwos/SoccerTwos-9999982.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5a6a4d7f4080efe31a06dc37491f39b98ca4223b9ab7f31f785bfefb6ccfb1f
|
3 |
+
size 10325138
|
SoccerTwos/checkpoint.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 10323922
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37854fa1cf62607fbcf6e1fa3522fdc3890a2084987edc894f3955253d66549d
|
3 |
size 10323922
|
SoccerTwos/events.out.tfevents.1710341962.stephan-ms7c02.29905.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4328e8cf67a012d3b679ca03e83f9101e4827d554072a1d9dde86d2717a0992a
|
3 |
+
size 661583
|
SoccerTwos/events.out.tfevents.1710343832.stephan-ms7c02.33144.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97512bb4824eae2e636aac4106b752ef6109d681e20d6fc75355ec92b3a0529f
|
3 |
+
size 3405815
|
SoccerTwos_orig/SoccerTwos-4999994.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be96c3872475cc25d67472685bc2fee156427488a3c08e79bd28cf6c98213a94
|
3 |
+
size 895526
|
SoccerTwos_orig/SoccerTwos-4999994.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71e54f36b571a60d1bd3474e5ee403ddc02aa6aafcd1c007e1272b0fa33cbfd8
|
3 |
+
size 10325138
|
SoccerTwos_orig/SoccerTwos-5000026.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23416b67a78fe350c105debeb7be130b546d1ca99633a6d58b7b2ab627bdac15
|
3 |
+
size 895526
|
SoccerTwos_orig/SoccerTwos-5000026.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef0aa7a1f48d9f4164990361bc247cd36df0a533121533f0cdf22a25adfb7189
|
3 |
+
size 10325138
|
SoccerTwos_orig/SoccerTwos-5499990.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ee5c6c1bdaa2e03dd5acac35279c5a077f98827615be82d01ca79d646f2847f
|
3 |
+
size 895526
|
SoccerTwos_orig/SoccerTwos-5499990.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1b631e6e474edfbd6397a6a173d3a36a447960b4e996fe4f72efd68936a6196
|
3 |
+
size 10325138
|
SoccerTwos_orig/SoccerTwos-5999976.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56acb86e98bacbe50d2c8305c10c4bcb279131ff4c1359ef6245cccfed56cd97
|
3 |
+
size 895526
|
SoccerTwos_orig/SoccerTwos-5999976.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c17aec0f05d051f9f1c6ca2db48529936e5c49c6978ab68abb2f1a5a9dbc004a
|
3 |
+
size 10325138
|
SoccerTwos_orig/SoccerTwos-6000104.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c574606e5c1839061cdb7dc9b76863444295b5b91caccfc413a1ed077ee8c3f
|
3 |
+
size 895526
|
SoccerTwos_orig/SoccerTwos-6000104.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccaa39ff525af5de7c6578077964314fe8b52d503f9fd6cb8fa52b144355b61b
|
3 |
+
size 10325138
|
SoccerTwos_orig/checkpoint.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:008145e1e808608cc93b4d650ceaa479d23cc271324dee6c3b01906b96fa84f6
|
3 |
+
size 10323922
|
SoccerTwos_orig/events.out.tfevents.1710290777.stephan-ms7c02.14283.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:921364813e102c784e2b1fe10a218e4108aaf0c18241e88faad09085f782460c
|
3 |
+
size 4854988
|
SoccerTwos_orig/events.out.tfevents.1710333085.stephan-ms7c02.24579.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cd4e31cb3abbb0f4426bddd18591f073816db885a8bc2560ff7951c70d47284
|
3 |
+
size 1017522
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 4096, "buffer_size": 65536, "learning_rate": 0.0004345843188705317, "beta": 0.00019215097636640332, "epsilon": 0.15831928707038231, "lambd": 0.9467147291117369, "num_epoch": 5, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 256, "num_layers": 3, "vis_encode_type": "fully_connected", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.9608227414353802, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps":
|
|
|
1 |
+
{"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 4096, "buffer_size": 65536, "learning_rate": 0.0004345843188705317, "beta": 0.00019215097636640332, "epsilon": 0.15831928707038231, "lambd": 0.9467147291117369, "num_epoch": 5, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 256, "num_layers": 3, "vis_encode_type": "fully_connected", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.9608227414353802, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 10000000, "time_horizon": 32, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 60000, "team_change": 589998, "swap_steps": 70000, "window": 25, "play_against_latest_model_ratio": 0.75, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./ml-agents/training-envs-executables/SoccerTwos.exe", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 1280, "height": 720, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": false, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos-read-deal", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
|
configuration.yaml
CHANGED
@@ -37,7 +37,7 @@ behaviors:
|
|
37 |
init_path: null
|
38 |
keep_checkpoints: 5
|
39 |
even_checkpoints: false
|
40 |
-
max_steps:
|
41 |
time_horizon: 32
|
42 |
summary_freq: 10000
|
43 |
threaded: false
|
@@ -46,7 +46,7 @@ behaviors:
|
|
46 |
team_change: 589998
|
47 |
swap_steps: 70000
|
48 |
window: 25
|
49 |
-
play_against_latest_model_ratio: 0.
|
50 |
initial_elo: 1200.0
|
51 |
behavioral_cloning: null
|
52 |
env_settings:
|
|
|
37 |
init_path: null
|
38 |
keep_checkpoints: 5
|
39 |
even_checkpoints: false
|
40 |
+
max_steps: 10000000
|
41 |
time_horizon: 32
|
42 |
summary_freq: 10000
|
43 |
threaded: false
|
|
|
46 |
team_change: 589998
|
47 |
swap_steps: 70000
|
48 |
window: 25
|
49 |
+
play_against_latest_model_ratio: 0.75
|
50 |
initial_elo: 1200.0
|
51 |
behavioral_cloning: null
|
52 |
env_settings:
|
run_logs/Player-0.log
CHANGED
@@ -19,14 +19,14 @@ ns GL_ARB_stencil_texturing GL_ARB_sync GL_ARB_tessellation_shader GL_ARB_textur
|
|
19 |
_buffer_object GL_ARB_vertex_shader GL_ARB_vertex_type_10f_11f_11f_rev GL_ARB_vertex_type_2_10_10_10_rev GL_ARB_viewport_array GL_ATI_blend_equation_separate GL_ATI_meminfo GL_ATI_texture_float GL_ATI_texture_mirror_once GL_EXT_EGL_image_storage GL_EXT_EGL_sync GL_EXT_abgr GL_EXT_blend_equation_separate GL_EXT_debug_label GL_EXT_demote_to_helper_invocation GL_EXT_depth_bounds_test GL_EXT_draw_buffers2 GL_EXT_draw_instanced GL_EXT_framebuffer_blit GL_EXT_framebuffer_multisample GL_EXT_framebuffer_multisample_blit_scaled GL_EXT_framebuffer_object GL_EXT_framebuffer_sRGB GL_EXT_memory_object GL_EXT_memory_object_fd GL_EXT_packed_depth_stencil GL_EXT_packed_float GL_EXT_pixel_buffer_object GL_EXT_polygon_offset_clamp GL_EXT_provoking_vertex GL_EXT_semaphore GL_EXT_semaphore_fd GL_EXT_shader_image_load_formatted GL_EXT_shader_image_load_store GL_EXT_shader_integer_mix GL_EXT_shader_samples_identical GL_EXT_texture_array GL_EXT_texture_compression_dxt1 GL_EXT_texture_compression_rgtc GL_EXT_texture_compression_s3t
|
20 |
c GL_EXT_texture_filter_anisotropic GL_EXT_texture_integer GL_EXT_texture_mirror_clamp GL_EXT_texture_sRGB GL_EXT_texture_sRGB_R8 GL_EXT_texture_sRGB_decode GL_EXT_texture_shadow_lod GL_EXT_texture_shared_exponent GL_EXT_texture_snorm GL_EXT_texture_swizzle GL_EXT_timer_query GL_EXT_transform_feedback GL_EXT_vertex_array_bgra GL_EXT_vertex_attrib_64bit GL_EXT_window_rectangles GL_IBM_multimode_draw_arrays GL_INTEL_blackhole_render GL_KHR_blend_equation_advanced GL_KHR_context_flush_control GL_KHR_debug GL_KHR_no_error GL_KHR_parallel_shader_compile GL_KHR_robust_buffer_access_behavior GL_KHR_robustness GL_KHR_texture_compression_astc_ldr GL_KHR_texture_compression_astc_sliced_3d GL_MESA_framebuffer_flip_y GL_MESA_pack_invert GL_MESA_shader_integer_functions GL_MESA_texture_const_bandwidth GL_MESA_texture_signed_rgba GL_NVX_gpu_memory_info GL_NV_alpha_to_coverage_dither_control GL_NV_compute_shader_derivatives GL_NV_conditional_render GL_NV_copy_image GL_NV_depth_clamp GL_NV_packed_depth_stencil GL_NV_shader_
|
21 |
atomic_int64 GL_NV_texture_barrier GL_NV_vdpau_interop GL_OES_EGL_image GL_S3_s3tc
|
22 |
-
OPENGL LOG: Creating OpenGL 4.6 graphics device ; Context level <OpenGL 4.5> ; Context handle
|
23 |
Begin MonoManager ReloadAssembly
|
24 |
-
- Completed reload, in 0.
|
25 |
Default vsync count 1
|
26 |
requesting resize 1280 x 720
|
27 |
resizing window to 1280 x 720
|
28 |
Desktop is 1920 x 1080 @ 60 Hz
|
29 |
-
UnloadTime: 0.
|
30 |
Registered Communicator in Agent.
|
31 |
Setting up 6 worker threads for Enlighten.
|
32 |
requesting resize 1280 x 720
|
@@ -36,7 +36,7 @@ Memory Statistics:
|
|
36 |
[ALLOC_TEMP_TLS] TLS Allocator
|
37 |
StackAllocators :
|
38 |
[ALLOC_TEMP_MAIN]
|
39 |
-
Peak usage frame count: [8.0 KB-16.0 KB]:
|
40 |
Initial Block Size 4.0 MB
|
41 |
Current Block Size 4.0 MB
|
42 |
Peak Allocated Bytes 2.1 MB
|
@@ -211,18 +211,18 @@ Memory Statistics:
|
|
211 |
[ALLOC_BUCKET]
|
212 |
Large Block size 4.0 MB
|
213 |
Used Block count 1
|
214 |
-
Peak Allocated bytes
|
215 |
[ALLOC_DEFAULT_MAIN]
|
216 |
-
Peak usage frame count: [8.0 MB-16.0 MB]:
|
217 |
Requested Block Size 16.0 MB
|
218 |
Peak Block count 1
|
219 |
Peak Allocated memory 13.0 MB
|
220 |
Peak Large allocation bytes 0 B
|
221 |
[ALLOC_DEFAULT_THREAD]
|
222 |
-
Peak usage frame count: [16.0 MB-32.0 MB]:
|
223 |
Requested Block Size 16.0 MB
|
224 |
Peak Block count 1
|
225 |
-
Peak Allocated memory
|
226 |
Peak Large allocation bytes 16.0 MB
|
227 |
[ALLOC_TEMP_JOB_1_FRAME]
|
228 |
Initial Block Size 2.0 MB
|
@@ -249,15 +249,15 @@ Memory Statistics:
|
|
249 |
[ALLOC_BUCKET]
|
250 |
Large Block size 4.0 MB
|
251 |
Used Block count 1
|
252 |
-
Peak Allocated bytes
|
253 |
[ALLOC_GFX_MAIN]
|
254 |
-
Peak usage frame count: [32.0 KB-64.0 KB]:
|
255 |
Requested Block Size 16.0 MB
|
256 |
Peak Block count 1
|
257 |
Peak Allocated memory 2.7 MB
|
258 |
Peak Large allocation bytes 0 B
|
259 |
[ALLOC_GFX_THREAD]
|
260 |
-
Peak usage frame count: [128.0 KB-256.0 KB]:
|
261 |
Requested Block Size 16.0 MB
|
262 |
Peak Block count 1
|
263 |
Peak Allocated memory 174.7 KB
|
@@ -267,15 +267,15 @@ Memory Statistics:
|
|
267 |
[ALLOC_BUCKET]
|
268 |
Large Block size 4.0 MB
|
269 |
Used Block count 1
|
270 |
-
Peak Allocated bytes
|
271 |
[ALLOC_CACHEOBJECTS_MAIN]
|
272 |
-
Peak usage frame count: [0.5 MB-1.0 MB]:
|
273 |
Requested Block Size 4.0 MB
|
274 |
Peak Block count 1
|
275 |
Peak Allocated memory 1.2 MB
|
276 |
Peak Large allocation bytes 0 B
|
277 |
[ALLOC_CACHEOBJECTS_THREAD]
|
278 |
-
Peak usage frame count: [4.0 MB-8.0 MB]:
|
279 |
Requested Block Size 4.0 MB
|
280 |
Peak Block count 2
|
281 |
Peak Allocated memory 7.8 MB
|
@@ -285,15 +285,15 @@ Memory Statistics:
|
|
285 |
[ALLOC_BUCKET]
|
286 |
Large Block size 4.0 MB
|
287 |
Used Block count 1
|
288 |
-
Peak Allocated bytes
|
289 |
[ALLOC_TYPETREE_MAIN]
|
290 |
-
Peak usage frame count: [0-1.0 KB]:
|
291 |
Requested Block Size 2.0 MB
|
292 |
Peak Block count 1
|
293 |
Peak Allocated memory 1.0 KB
|
294 |
Peak Large allocation bytes 0 B
|
295 |
[ALLOC_TYPETREE_THREAD]
|
296 |
-
Peak usage frame count: [1.0 KB-2.0 KB]:
|
297 |
Requested Block Size 2.0 MB
|
298 |
Peak Block count 1
|
299 |
Peak Allocated memory 2.2 KB
|
|
|
19 |
_buffer_object GL_ARB_vertex_shader GL_ARB_vertex_type_10f_11f_11f_rev GL_ARB_vertex_type_2_10_10_10_rev GL_ARB_viewport_array GL_ATI_blend_equation_separate GL_ATI_meminfo GL_ATI_texture_float GL_ATI_texture_mirror_once GL_EXT_EGL_image_storage GL_EXT_EGL_sync GL_EXT_abgr GL_EXT_blend_equation_separate GL_EXT_debug_label GL_EXT_demote_to_helper_invocation GL_EXT_depth_bounds_test GL_EXT_draw_buffers2 GL_EXT_draw_instanced GL_EXT_framebuffer_blit GL_EXT_framebuffer_multisample GL_EXT_framebuffer_multisample_blit_scaled GL_EXT_framebuffer_object GL_EXT_framebuffer_sRGB GL_EXT_memory_object GL_EXT_memory_object_fd GL_EXT_packed_depth_stencil GL_EXT_packed_float GL_EXT_pixel_buffer_object GL_EXT_polygon_offset_clamp GL_EXT_provoking_vertex GL_EXT_semaphore GL_EXT_semaphore_fd GL_EXT_shader_image_load_formatted GL_EXT_shader_image_load_store GL_EXT_shader_integer_mix GL_EXT_shader_samples_identical GL_EXT_texture_array GL_EXT_texture_compression_dxt1 GL_EXT_texture_compression_rgtc GL_EXT_texture_compression_s3t
|
20 |
c GL_EXT_texture_filter_anisotropic GL_EXT_texture_integer GL_EXT_texture_mirror_clamp GL_EXT_texture_sRGB GL_EXT_texture_sRGB_R8 GL_EXT_texture_sRGB_decode GL_EXT_texture_shadow_lod GL_EXT_texture_shared_exponent GL_EXT_texture_snorm GL_EXT_texture_swizzle GL_EXT_timer_query GL_EXT_transform_feedback GL_EXT_vertex_array_bgra GL_EXT_vertex_attrib_64bit GL_EXT_window_rectangles GL_IBM_multimode_draw_arrays GL_INTEL_blackhole_render GL_KHR_blend_equation_advanced GL_KHR_context_flush_control GL_KHR_debug GL_KHR_no_error GL_KHR_parallel_shader_compile GL_KHR_robust_buffer_access_behavior GL_KHR_robustness GL_KHR_texture_compression_astc_ldr GL_KHR_texture_compression_astc_sliced_3d GL_MESA_framebuffer_flip_y GL_MESA_pack_invert GL_MESA_shader_integer_functions GL_MESA_texture_const_bandwidth GL_MESA_texture_signed_rgba GL_NVX_gpu_memory_info GL_NV_alpha_to_coverage_dither_control GL_NV_compute_shader_derivatives GL_NV_conditional_render GL_NV_copy_image GL_NV_depth_clamp GL_NV_packed_depth_stencil GL_NV_shader_
|
21 |
atomic_int64 GL_NV_texture_barrier GL_NV_vdpau_interop GL_OES_EGL_image GL_S3_s3tc
|
22 |
+
OPENGL LOG: Creating OpenGL 4.6 graphics device ; Context level <OpenGL 4.5> ; Context handle 22053744
|
23 |
Begin MonoManager ReloadAssembly
|
24 |
+
- Completed reload, in 0.092 seconds
|
25 |
Default vsync count 1
|
26 |
requesting resize 1280 x 720
|
27 |
resizing window to 1280 x 720
|
28 |
Desktop is 1920 x 1080 @ 60 Hz
|
29 |
+
UnloadTime: 0.807040 ms
|
30 |
Registered Communicator in Agent.
|
31 |
Setting up 6 worker threads for Enlighten.
|
32 |
requesting resize 1280 x 720
|
|
|
36 |
[ALLOC_TEMP_TLS] TLS Allocator
|
37 |
StackAllocators :
|
38 |
[ALLOC_TEMP_MAIN]
|
39 |
+
Peak usage frame count: [8.0 KB-16.0 KB]: 62727 frames, [2.0 MB-4.0 MB]: 1 frames
|
40 |
Initial Block Size 4.0 MB
|
41 |
Current Block Size 4.0 MB
|
42 |
Peak Allocated Bytes 2.1 MB
|
|
|
211 |
[ALLOC_BUCKET]
|
212 |
Large Block size 4.0 MB
|
213 |
Used Block count 1
|
214 |
+
Peak Allocated bytes 1.9 MB
|
215 |
[ALLOC_DEFAULT_MAIN]
|
216 |
+
Peak usage frame count: [8.0 MB-16.0 MB]: 62728 frames
|
217 |
Requested Block Size 16.0 MB
|
218 |
Peak Block count 1
|
219 |
Peak Allocated memory 13.0 MB
|
220 |
Peak Large allocation bytes 0 B
|
221 |
[ALLOC_DEFAULT_THREAD]
|
222 |
+
Peak usage frame count: [16.0 MB-32.0 MB]: 62728 frames
|
223 |
Requested Block Size 16.0 MB
|
224 |
Peak Block count 1
|
225 |
+
Peak Allocated memory 28.7 MB
|
226 |
Peak Large allocation bytes 16.0 MB
|
227 |
[ALLOC_TEMP_JOB_1_FRAME]
|
228 |
Initial Block Size 2.0 MB
|
|
|
249 |
[ALLOC_BUCKET]
|
250 |
Large Block size 4.0 MB
|
251 |
Used Block count 1
|
252 |
+
Peak Allocated bytes 1.9 MB
|
253 |
[ALLOC_GFX_MAIN]
|
254 |
+
Peak usage frame count: [32.0 KB-64.0 KB]: 62727 frames, [2.0 MB-4.0 MB]: 1 frames
|
255 |
Requested Block Size 16.0 MB
|
256 |
Peak Block count 1
|
257 |
Peak Allocated memory 2.7 MB
|
258 |
Peak Large allocation bytes 0 B
|
259 |
[ALLOC_GFX_THREAD]
|
260 |
+
Peak usage frame count: [128.0 KB-256.0 KB]: 62728 frames
|
261 |
Requested Block Size 16.0 MB
|
262 |
Peak Block count 1
|
263 |
Peak Allocated memory 174.7 KB
|
|
|
267 |
[ALLOC_BUCKET]
|
268 |
Large Block size 4.0 MB
|
269 |
Used Block count 1
|
270 |
+
Peak Allocated bytes 1.9 MB
|
271 |
[ALLOC_CACHEOBJECTS_MAIN]
|
272 |
+
Peak usage frame count: [0.5 MB-1.0 MB]: 62727 frames, [1.0 MB-2.0 MB]: 1 frames
|
273 |
Requested Block Size 4.0 MB
|
274 |
Peak Block count 1
|
275 |
Peak Allocated memory 1.2 MB
|
276 |
Peak Large allocation bytes 0 B
|
277 |
[ALLOC_CACHEOBJECTS_THREAD]
|
278 |
+
Peak usage frame count: [4.0 MB-8.0 MB]: 62728 frames
|
279 |
Requested Block Size 4.0 MB
|
280 |
Peak Block count 2
|
281 |
Peak Allocated memory 7.8 MB
|
|
|
285 |
[ALLOC_BUCKET]
|
286 |
Large Block size 4.0 MB
|
287 |
Used Block count 1
|
288 |
+
Peak Allocated bytes 1.9 MB
|
289 |
[ALLOC_TYPETREE_MAIN]
|
290 |
+
Peak usage frame count: [0-1.0 KB]: 62728 frames
|
291 |
Requested Block Size 2.0 MB
|
292 |
Peak Block count 1
|
293 |
Peak Allocated memory 1.0 KB
|
294 |
Peak Large allocation bytes 0 B
|
295 |
[ALLOC_TYPETREE_THREAD]
|
296 |
+
Peak usage frame count: [1.0 KB-2.0 KB]: 62727 frames, [2.0 KB-4.0 KB]: 1 frames
|
297 |
Requested Block Size 2.0 MB
|
298 |
Peak Block count 1
|
299 |
Peak Allocated memory 2.2 KB
|
run_logs/timers.json
CHANGED
@@ -2,201 +2,201 @@
|
|
2 |
"name": "root",
|
3 |
"gauges": {
|
4 |
"SoccerTwos.Policy.Entropy.mean": {
|
5 |
-
"value": 1.
|
6 |
-
"min": 1.
|
7 |
-
"max": 1.
|
8 |
-
"count":
|
9 |
},
|
10 |
"SoccerTwos.Policy.Entropy.sum": {
|
11 |
-
"value":
|
12 |
-
"min":
|
13 |
-
"max":
|
14 |
-
"count":
|
15 |
},
|
16 |
"SoccerTwos.Environment.EpisodeLength.mean": {
|
17 |
-
"value":
|
18 |
-
"min":
|
19 |
-
"max": 53.
|
20 |
-
"count":
|
21 |
},
|
22 |
"SoccerTwos.Environment.EpisodeLength.sum": {
|
23 |
-
"value":
|
24 |
-
"min":
|
25 |
-
"max":
|
26 |
-
"count":
|
27 |
},
|
28 |
"SoccerTwos.Self-play.ELO.mean": {
|
29 |
-
"value":
|
30 |
-
"min":
|
31 |
-
"max":
|
32 |
-
"count":
|
33 |
},
|
34 |
"SoccerTwos.Self-play.ELO.sum": {
|
35 |
-
"value":
|
36 |
-
"min":
|
37 |
-
"max":
|
38 |
-
"count":
|
39 |
},
|
40 |
"SoccerTwos.Step.mean": {
|
41 |
-
"value":
|
42 |
-
"min":
|
43 |
-
"max":
|
44 |
-
"count":
|
45 |
},
|
46 |
"SoccerTwos.Step.sum": {
|
47 |
-
"value":
|
48 |
-
"min":
|
49 |
-
"max":
|
50 |
-
"count":
|
51 |
},
|
52 |
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
|
53 |
-
"value": 0.
|
54 |
-
"min": -0.
|
55 |
-
"max": 0.
|
56 |
-
"count":
|
57 |
},
|
58 |
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
|
59 |
-
"value":
|
60 |
-
"min": -
|
61 |
-
"max":
|
62 |
-
"count":
|
63 |
},
|
64 |
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
|
65 |
-
"value": 0.
|
66 |
-
"min": -0.
|
67 |
-
"max": 0.
|
68 |
-
"count":
|
69 |
},
|
70 |
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
|
71 |
-
"value":
|
72 |
-
"min": -
|
73 |
-
"max":
|
74 |
-
"count":
|
75 |
},
|
76 |
"SoccerTwos.Environment.CumulativeReward.mean": {
|
77 |
"value": 0.0,
|
78 |
"min": 0.0,
|
79 |
"max": 0.0,
|
80 |
-
"count":
|
81 |
},
|
82 |
"SoccerTwos.Environment.CumulativeReward.sum": {
|
83 |
"value": 0.0,
|
84 |
"min": 0.0,
|
85 |
"max": 0.0,
|
86 |
-
"count":
|
87 |
},
|
88 |
"SoccerTwos.Policy.ExtrinsicReward.mean": {
|
89 |
-
"value": 0.
|
90 |
-
"min": -0.
|
91 |
-
"max": 0.
|
92 |
-
"count":
|
93 |
},
|
94 |
"SoccerTwos.Policy.ExtrinsicReward.sum": {
|
95 |
-
"value":
|
96 |
-
"min": -
|
97 |
-
"max":
|
98 |
-
"count":
|
99 |
},
|
100 |
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
|
101 |
-
"value": 0.
|
102 |
-
"min": -0.
|
103 |
-
"max": 0.
|
104 |
-
"count":
|
105 |
},
|
106 |
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
|
107 |
-
"value":
|
108 |
-
"min": -
|
109 |
-
"max":
|
110 |
-
"count":
|
111 |
},
|
112 |
"SoccerTwos.IsTraining.mean": {
|
113 |
"value": 1.0,
|
114 |
"min": 1.0,
|
115 |
"max": 1.0,
|
116 |
-
"count":
|
117 |
},
|
118 |
"SoccerTwos.IsTraining.sum": {
|
119 |
"value": 1.0,
|
120 |
"min": 1.0,
|
121 |
"max": 1.0,
|
122 |
-
"count":
|
123 |
},
|
124 |
"SoccerTwos.Losses.PolicyLoss.mean": {
|
125 |
-
"value": 0.
|
126 |
-
"min": 0.
|
127 |
-
"max": 0.
|
128 |
-
"count":
|
129 |
},
|
130 |
"SoccerTwos.Losses.PolicyLoss.sum": {
|
131 |
-
"value": 0.
|
132 |
-
"min": 0.
|
133 |
-
"max": 0.
|
134 |
-
"count":
|
135 |
},
|
136 |
"SoccerTwos.Losses.ValueLoss.mean": {
|
137 |
-
"value": 0.
|
138 |
-
"min": 0.
|
139 |
-
"max": 0.
|
140 |
-
"count":
|
141 |
},
|
142 |
"SoccerTwos.Losses.ValueLoss.sum": {
|
143 |
-
"value": 0.
|
144 |
-
"min": 0.
|
145 |
-
"max": 0.
|
146 |
-
"count":
|
147 |
},
|
148 |
"SoccerTwos.Losses.BaselineLoss.mean": {
|
149 |
-
"value": 0.
|
150 |
-
"min": 0.
|
151 |
-
"max": 0.
|
152 |
-
"count":
|
153 |
},
|
154 |
"SoccerTwos.Losses.BaselineLoss.sum": {
|
155 |
-
"value": 0.
|
156 |
-
"min": 0.
|
157 |
-
"max": 0.
|
158 |
-
"count":
|
159 |
},
|
160 |
"SoccerTwos.Policy.LearningRate.mean": {
|
161 |
-
"value":
|
162 |
-
"min":
|
163 |
-
"max":
|
164 |
-
"count":
|
165 |
},
|
166 |
"SoccerTwos.Policy.LearningRate.sum": {
|
167 |
-
"value":
|
168 |
-
"min":
|
169 |
-
"max":
|
170 |
-
"count":
|
171 |
},
|
172 |
"SoccerTwos.Policy.Epsilon.mean": {
|
173 |
-
"value": 0.
|
174 |
-
"min": 0.
|
175 |
-
"max": 0.
|
176 |
-
"count":
|
177 |
},
|
178 |
"SoccerTwos.Policy.Epsilon.sum": {
|
179 |
-
"value": 0.
|
180 |
-
"min": 0.
|
181 |
-
"max": 0.
|
182 |
-
"count":
|
183 |
},
|
184 |
"SoccerTwos.Policy.Beta.mean": {
|
185 |
-
"value": 1.
|
186 |
-
"min": 1.
|
187 |
-
"max":
|
188 |
-
"count":
|
189 |
},
|
190 |
"SoccerTwos.Policy.Beta.sum": {
|
191 |
-
"value": 1.
|
192 |
-
"min": 1.
|
193 |
-
"max":
|
194 |
-
"count":
|
195 |
}
|
196 |
},
|
197 |
"metadata": {
|
198 |
"timer_format_version": "0.1.0",
|
199 |
-
"start_time_seconds": "
|
200 |
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
|
201 |
"command_line_arguments": "/home/stephan/.conda/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos-read-deal --width=1280 --height=720 --resume",
|
202 |
"mlagents_version": "1.1.0.dev0",
|
@@ -204,59 +204,59 @@
|
|
204 |
"communication_protocol_version": "1.5.0",
|
205 |
"pytorch_version": "2.2.1+cu121",
|
206 |
"numpy_version": "1.23.5",
|
207 |
-
"end_time_seconds": "
|
208 |
},
|
209 |
-
"total":
|
210 |
"count": 1,
|
211 |
-
"self": 0.
|
212 |
"children": {
|
213 |
"run_training.setup": {
|
214 |
-
"total": 0.
|
215 |
"count": 1,
|
216 |
-
"self": 0.
|
217 |
},
|
218 |
"TrainerController.start_learning": {
|
219 |
-
"total":
|
220 |
"count": 1,
|
221 |
-
"self":
|
222 |
"children": {
|
223 |
"TrainerController._reset_env": {
|
224 |
-
"total": 4.
|
225 |
-
"count":
|
226 |
-
"self": 4.
|
227 |
},
|
228 |
"TrainerController.advance": {
|
229 |
-
"total":
|
230 |
-
"count":
|
231 |
-
"self":
|
232 |
"children": {
|
233 |
"env_step": {
|
234 |
-
"total":
|
235 |
-
"count":
|
236 |
-
"self":
|
237 |
"children": {
|
238 |
"SubprocessEnvManager._take_step": {
|
239 |
-
"total":
|
240 |
-
"count":
|
241 |
-
"self":
|
242 |
"children": {
|
243 |
"TorchPolicy.evaluate": {
|
244 |
-
"total":
|
245 |
-
"count":
|
246 |
-
"self":
|
247 |
}
|
248 |
}
|
249 |
},
|
250 |
"workers": {
|
251 |
-
"total":
|
252 |
-
"count":
|
253 |
"self": 0.0,
|
254 |
"children": {
|
255 |
"worker_root": {
|
256 |
-
"total":
|
257 |
-
"count":
|
258 |
"is_parallel": true,
|
259 |
-
"self":
|
260 |
"children": {
|
261 |
"run_training.setup": {
|
262 |
"total": 0.0,
|
@@ -265,48 +265,48 @@
|
|
265 |
"self": 0.0,
|
266 |
"children": {
|
267 |
"steps_from_proto": {
|
268 |
-
"total": 0.
|
269 |
"count": 2,
|
270 |
"is_parallel": true,
|
271 |
-
"self": 0.
|
272 |
"children": {
|
273 |
"_process_rank_one_or_two_observation": {
|
274 |
-
"total": 0.
|
275 |
"count": 8,
|
276 |
"is_parallel": true,
|
277 |
-
"self": 0.
|
278 |
}
|
279 |
}
|
280 |
},
|
281 |
"UnityEnvironment.step": {
|
282 |
-
"total": 0.
|
283 |
"count": 1,
|
284 |
"is_parallel": true,
|
285 |
-
"self": 0.
|
286 |
"children": {
|
287 |
"UnityEnvironment._generate_step_input": {
|
288 |
-
"total": 0.
|
289 |
"count": 1,
|
290 |
"is_parallel": true,
|
291 |
-
"self": 0.
|
292 |
},
|
293 |
"communicator.exchange": {
|
294 |
-
"total": 0.
|
295 |
"count": 1,
|
296 |
"is_parallel": true,
|
297 |
-
"self": 0.
|
298 |
},
|
299 |
"steps_from_proto": {
|
300 |
-
"total": 0.
|
301 |
"count": 2,
|
302 |
"is_parallel": true,
|
303 |
-
"self": 0.
|
304 |
"children": {
|
305 |
"_process_rank_one_or_two_observation": {
|
306 |
-
"total": 0.
|
307 |
"count": 8,
|
308 |
"is_parallel": true,
|
309 |
-
"self": 0.
|
310 |
}
|
311 |
}
|
312 |
}
|
@@ -315,48 +315,48 @@
|
|
315 |
}
|
316 |
},
|
317 |
"steps_from_proto": {
|
318 |
-
"total": 0.
|
319 |
-
"count":
|
320 |
"is_parallel": true,
|
321 |
-
"self": 0.
|
322 |
"children": {
|
323 |
"_process_rank_one_or_two_observation": {
|
324 |
-
"total": 0.
|
325 |
-
"count":
|
326 |
"is_parallel": true,
|
327 |
-
"self": 0.
|
328 |
}
|
329 |
}
|
330 |
},
|
331 |
"UnityEnvironment.step": {
|
332 |
-
"total":
|
333 |
-
"count":
|
334 |
"is_parallel": true,
|
335 |
-
"self":
|
336 |
"children": {
|
337 |
"UnityEnvironment._generate_step_input": {
|
338 |
-
"total":
|
339 |
-
"count":
|
340 |
"is_parallel": true,
|
341 |
-
"self":
|
342 |
},
|
343 |
"communicator.exchange": {
|
344 |
-
"total":
|
345 |
-
"count":
|
346 |
"is_parallel": true,
|
347 |
-
"self":
|
348 |
},
|
349 |
"steps_from_proto": {
|
350 |
-
"total":
|
351 |
-
"count":
|
352 |
"is_parallel": true,
|
353 |
-
"self":
|
354 |
"children": {
|
355 |
"_process_rank_one_or_two_observation": {
|
356 |
-
"total":
|
357 |
-
"count":
|
358 |
"is_parallel": true,
|
359 |
-
"self":
|
360 |
}
|
361 |
}
|
362 |
}
|
@@ -369,31 +369,31 @@
|
|
369 |
}
|
370 |
},
|
371 |
"trainer_advance": {
|
372 |
-
"total":
|
373 |
-
"count":
|
374 |
-
"self":
|
375 |
"children": {
|
376 |
"process_trajectory": {
|
377 |
-
"total":
|
378 |
-
"count":
|
379 |
-
"self":
|
380 |
"children": {
|
381 |
"RLTrainer._checkpoint": {
|
382 |
-
"total": 0.
|
383 |
-
"count":
|
384 |
-
"self": 0.
|
385 |
}
|
386 |
}
|
387 |
},
|
388 |
"_update_policy": {
|
389 |
-
"total":
|
390 |
-
"count":
|
391 |
-
"self":
|
392 |
"children": {
|
393 |
"TorchPOCAOptimizer.update": {
|
394 |
-
"total":
|
395 |
-
"count":
|
396 |
-
"self":
|
397 |
}
|
398 |
}
|
399 |
}
|
@@ -402,19 +402,19 @@
|
|
402 |
}
|
403 |
},
|
404 |
"trainer_threads": {
|
405 |
-
"total":
|
406 |
"count": 1,
|
407 |
-
"self":
|
408 |
},
|
409 |
"TrainerController._save_models": {
|
410 |
-
"total": 0.
|
411 |
"count": 1,
|
412 |
-
"self": 0.
|
413 |
"children": {
|
414 |
"RLTrainer._checkpoint": {
|
415 |
-
"total": 0.
|
416 |
"count": 1,
|
417 |
-
"self": 0.
|
418 |
}
|
419 |
}
|
420 |
}
|
|
|
2 |
"name": "root",
|
3 |
"gauges": {
|
4 |
"SoccerTwos.Policy.Entropy.mean": {
|
5 |
+
"value": 1.4048619270324707,
|
6 |
+
"min": 1.3750499486923218,
|
7 |
+
"max": 1.7051565647125244,
|
8 |
+
"count": 335
|
9 |
},
|
10 |
"SoccerTwos.Policy.Entropy.sum": {
|
11 |
+
"value": 28277.060546875,
|
12 |
+
"min": 14701.9814453125,
|
13 |
+
"max": 34322.671875,
|
14 |
+
"count": 335
|
15 |
},
|
16 |
"SoccerTwos.Environment.EpisodeLength.mean": {
|
17 |
+
"value": 45.06422018348624,
|
18 |
+
"min": 35.125,
|
19 |
+
"max": 53.40425531914894,
|
20 |
+
"count": 335
|
21 |
},
|
22 |
"SoccerTwos.Environment.EpisodeLength.sum": {
|
23 |
+
"value": 19648.0,
|
24 |
+
"min": 8072.0,
|
25 |
+
"max": 20960.0,
|
26 |
+
"count": 335
|
27 |
},
|
28 |
"SoccerTwos.Self-play.ELO.mean": {
|
29 |
+
"value": 1607.9046472284606,
|
30 |
+
"min": 1555.6832652825399,
|
31 |
+
"max": 1613.038356436412,
|
32 |
+
"count": 335
|
33 |
},
|
34 |
"SoccerTwos.Self-play.ELO.sum": {
|
35 |
+
"value": 350523.2130958044,
|
36 |
+
"min": 163654.2453609866,
|
37 |
+
"max": 434134.2547516843,
|
38 |
+
"count": 335
|
39 |
},
|
40 |
"SoccerTwos.Step.mean": {
|
41 |
+
"value": 9999982.0,
|
42 |
+
"min": 6659988.0,
|
43 |
+
"max": 9999982.0,
|
44 |
+
"count": 335
|
45 |
},
|
46 |
"SoccerTwos.Step.sum": {
|
47 |
+
"value": 9999982.0,
|
48 |
+
"min": 6659988.0,
|
49 |
+
"max": 9999982.0,
|
50 |
+
"count": 335
|
51 |
},
|
52 |
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
|
53 |
+
"value": 0.03223046660423279,
|
54 |
+
"min": -0.11106479167938232,
|
55 |
+
"max": 0.10332842171192169,
|
56 |
+
"count": 335
|
57 |
},
|
58 |
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
|
59 |
+
"value": 13.246722221374512,
|
60 |
+
"min": -46.31401824951172,
|
61 |
+
"max": 44.017906188964844,
|
62 |
+
"count": 335
|
63 |
},
|
64 |
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
|
65 |
+
"value": 0.031953852623701096,
|
66 |
+
"min": -0.11250180751085281,
|
67 |
+
"max": 0.10477326810359955,
|
68 |
+
"count": 335
|
69 |
},
|
70 |
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
|
71 |
+
"value": 13.133033752441406,
|
72 |
+
"min": -46.91325378417969,
|
73 |
+
"max": 44.6334114074707,
|
74 |
+
"count": 335
|
75 |
},
|
76 |
"SoccerTwos.Environment.CumulativeReward.mean": {
|
77 |
"value": 0.0,
|
78 |
"min": 0.0,
|
79 |
"max": 0.0,
|
80 |
+
"count": 335
|
81 |
},
|
82 |
"SoccerTwos.Environment.CumulativeReward.sum": {
|
83 |
"value": 0.0,
|
84 |
"min": 0.0,
|
85 |
"max": 0.0,
|
86 |
+
"count": 335
|
87 |
},
|
88 |
"SoccerTwos.Policy.ExtrinsicReward.mean": {
|
89 |
+
"value": 0.09531192604554903,
|
90 |
+
"min": -0.381275439994377,
|
91 |
+
"max": 0.26663347656634745,
|
92 |
+
"count": 335
|
93 |
},
|
94 |
"SoccerTwos.Policy.ExtrinsicReward.sum": {
|
95 |
+
"value": 20.777999877929688,
|
96 |
+
"min": -86.93080031871796,
|
97 |
+
"max": 62.125600039958954,
|
98 |
+
"count": 335
|
99 |
},
|
100 |
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
|
101 |
+
"value": 0.09531192604554903,
|
102 |
+
"min": -0.381275439994377,
|
103 |
+
"max": 0.26663347656634745,
|
104 |
+
"count": 335
|
105 |
},
|
106 |
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
|
107 |
+
"value": 20.777999877929688,
|
108 |
+
"min": -86.93080031871796,
|
109 |
+
"max": 62.125600039958954,
|
110 |
+
"count": 335
|
111 |
},
|
112 |
"SoccerTwos.IsTraining.mean": {
|
113 |
"value": 1.0,
|
114 |
"min": 1.0,
|
115 |
"max": 1.0,
|
116 |
+
"count": 335
|
117 |
},
|
118 |
"SoccerTwos.IsTraining.sum": {
|
119 |
"value": 1.0,
|
120 |
"min": 1.0,
|
121 |
"max": 1.0,
|
122 |
+
"count": 335
|
123 |
},
|
124 |
"SoccerTwos.Losses.PolicyLoss.mean": {
|
125 |
+
"value": 0.01046212162455049,
|
126 |
+
"min": 0.009879295097471185,
|
127 |
+
"max": 0.014559235423075734,
|
128 |
+
"count": 51
|
129 |
},
|
130 |
"SoccerTwos.Losses.PolicyLoss.sum": {
|
131 |
+
"value": 0.01046212162455049,
|
132 |
+
"min": 0.009879295097471185,
|
133 |
+
"max": 0.014559235423075734,
|
134 |
+
"count": 51
|
135 |
},
|
136 |
"SoccerTwos.Losses.ValueLoss.mean": {
|
137 |
+
"value": 0.05891079842112958,
|
138 |
+
"min": 0.04971672408282757,
|
139 |
+
"max": 0.05918900854885578,
|
140 |
+
"count": 51
|
141 |
},
|
142 |
"SoccerTwos.Losses.ValueLoss.sum": {
|
143 |
+
"value": 0.05891079842112958,
|
144 |
+
"min": 0.04971672408282757,
|
145 |
+
"max": 0.05918900854885578,
|
146 |
+
"count": 51
|
147 |
},
|
148 |
"SoccerTwos.Losses.BaselineLoss.mean": {
|
149 |
+
"value": 0.05924153439700604,
|
150 |
+
"min": 0.051102403877303006,
|
151 |
+
"max": 0.05954511137679219,
|
152 |
+
"count": 51
|
153 |
},
|
154 |
"SoccerTwos.Losses.BaselineLoss.sum": {
|
155 |
+
"value": 0.05924153439700604,
|
156 |
+
"min": 0.051102403877303006,
|
157 |
+
"max": 0.05954511137679219,
|
158 |
+
"count": 51
|
159 |
},
|
160 |
"SoccerTwos.Policy.LearningRate.mean": {
|
161 |
+
"value": 6.4449295954992225e-09,
|
162 |
+
"min": 6.4449295954992225e-09,
|
163 |
+
"max": 0.00014248644558948728,
|
164 |
+
"count": 51
|
165 |
},
|
166 |
"SoccerTwos.Policy.LearningRate.sum": {
|
167 |
+
"value": 6.4449295954992225e-09,
|
168 |
+
"min": 6.4449295954992225e-09,
|
169 |
+
"max": 0.00014248644558948728,
|
170 |
+
"count": 51
|
171 |
},
|
172 |
"SoccerTwos.Policy.Epsilon.mean": {
|
173 |
+
"value": 0.10000085146159124,
|
174 |
+
"min": 0.10000085146159124,
|
175 |
+
"max": 0.11912103967704953,
|
176 |
+
"count": 51
|
177 |
},
|
178 |
"SoccerTwos.Policy.Epsilon.sum": {
|
179 |
+
"value": 0.10000085146159124,
|
180 |
+
"min": 0.10000085146159124,
|
181 |
+
"max": 0.11912103967704953,
|
182 |
+
"count": 51
|
183 |
},
|
184 |
"SoccerTwos.Policy.Beta.mean": {
|
185 |
+
"value": 1.0002659404254946e-05,
|
186 |
+
"min": 1.0002659404254946e-05,
|
187 |
+
"max": 6.972151274949521e-05,
|
188 |
+
"count": 51
|
189 |
},
|
190 |
"SoccerTwos.Policy.Beta.sum": {
|
191 |
+
"value": 1.0002659404254946e-05,
|
192 |
+
"min": 1.0002659404254946e-05,
|
193 |
+
"max": 6.972151274949521e-05,
|
194 |
+
"count": 51
|
195 |
}
|
196 |
},
|
197 |
"metadata": {
|
198 |
"timer_format_version": "0.1.0",
|
199 |
+
"start_time_seconds": "1710343829",
|
200 |
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
|
201 |
"command_line_arguments": "/home/stephan/.conda/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos-read-deal --width=1280 --height=720 --resume",
|
202 |
"mlagents_version": "1.1.0.dev0",
|
|
|
204 |
"communication_protocol_version": "1.5.0",
|
205 |
"pytorch_version": "2.2.1+cu121",
|
206 |
"numpy_version": "1.23.5",
|
207 |
+
"end_time_seconds": "1710353568"
|
208 |
},
|
209 |
+
"total": 9739.254863360999,
|
210 |
"count": 1,
|
211 |
+
"self": 0.270132729987381,
|
212 |
"children": {
|
213 |
"run_training.setup": {
|
214 |
+
"total": 0.018506341002648696,
|
215 |
"count": 1,
|
216 |
+
"self": 0.018506341002648696
|
217 |
},
|
218 |
"TrainerController.start_learning": {
|
219 |
+
"total": 9738.966224290009,
|
220 |
"count": 1,
|
221 |
+
"self": 4.652608350283117,
|
222 |
"children": {
|
223 |
"TrainerController._reset_env": {
|
224 |
+
"total": 4.244304390012985,
|
225 |
+
"count": 7,
|
226 |
+
"self": 4.244304390012985
|
227 |
},
|
228 |
"TrainerController.advance": {
|
229 |
+
"total": 9729.947026144713,
|
230 |
+
"count": 239073,
|
231 |
+
"self": 4.148107524248189,
|
232 |
"children": {
|
233 |
"env_step": {
|
234 |
+
"total": 4354.3673745146225,
|
235 |
+
"count": 239073,
|
236 |
+
"self": 3721.0493522615725,
|
237 |
"children": {
|
238 |
"SubprocessEnvManager._take_step": {
|
239 |
+
"total": 630.4299217515072,
|
240 |
+
"count": 239073,
|
241 |
+
"self": 19.02124206413282,
|
242 |
"children": {
|
243 |
"TorchPolicy.evaluate": {
|
244 |
+
"total": 611.4086796873744,
|
245 |
+
"count": 418182,
|
246 |
+
"self": 611.4086796873744
|
247 |
}
|
248 |
}
|
249 |
},
|
250 |
"workers": {
|
251 |
+
"total": 2.8881005015427945,
|
252 |
+
"count": 239073,
|
253 |
"self": 0.0,
|
254 |
"children": {
|
255 |
"worker_root": {
|
256 |
+
"total": 9731.739510110943,
|
257 |
+
"count": 239073,
|
258 |
"is_parallel": true,
|
259 |
+
"self": 6533.360267171403,
|
260 |
"children": {
|
261 |
"run_training.setup": {
|
262 |
"total": 0.0,
|
|
|
265 |
"self": 0.0,
|
266 |
"children": {
|
267 |
"steps_from_proto": {
|
268 |
+
"total": 0.06389564499841072,
|
269 |
"count": 2,
|
270 |
"is_parallel": true,
|
271 |
+
"self": 0.000593470991589129,
|
272 |
"children": {
|
273 |
"_process_rank_one_or_two_observation": {
|
274 |
+
"total": 0.06330217400682159,
|
275 |
"count": 8,
|
276 |
"is_parallel": true,
|
277 |
+
"self": 0.06330217400682159
|
278 |
}
|
279 |
}
|
280 |
},
|
281 |
"UnityEnvironment.step": {
|
282 |
+
"total": 0.02612613000383135,
|
283 |
"count": 1,
|
284 |
"is_parallel": true,
|
285 |
+
"self": 0.000600070008658804,
|
286 |
"children": {
|
287 |
"UnityEnvironment._generate_step_input": {
|
288 |
+
"total": 0.00040655999328009784,
|
289 |
"count": 1,
|
290 |
"is_parallel": true,
|
291 |
+
"self": 0.00040655999328009784
|
292 |
},
|
293 |
"communicator.exchange": {
|
294 |
+
"total": 0.02343449799809605,
|
295 |
"count": 1,
|
296 |
"is_parallel": true,
|
297 |
+
"self": 0.02343449799809605
|
298 |
},
|
299 |
"steps_from_proto": {
|
300 |
+
"total": 0.0016850020037963986,
|
301 |
"count": 2,
|
302 |
"is_parallel": true,
|
303 |
+
"self": 0.0003057300054933876,
|
304 |
"children": {
|
305 |
"_process_rank_one_or_two_observation": {
|
306 |
+
"total": 0.001379271998303011,
|
307 |
"count": 8,
|
308 |
"is_parallel": true,
|
309 |
+
"self": 0.001379271998303011
|
310 |
}
|
311 |
}
|
312 |
}
|
|
|
315 |
}
|
316 |
},
|
317 |
"steps_from_proto": {
|
318 |
+
"total": 0.012151043978519738,
|
319 |
+
"count": 12,
|
320 |
"is_parallel": true,
|
321 |
+
"self": 0.002059131977148354,
|
322 |
"children": {
|
323 |
"_process_rank_one_or_two_observation": {
|
324 |
+
"total": 0.010091912001371384,
|
325 |
+
"count": 48,
|
326 |
"is_parallel": true,
|
327 |
+
"self": 0.010091912001371384
|
328 |
}
|
329 |
}
|
330 |
},
|
331 |
"UnityEnvironment.step": {
|
332 |
+
"total": 3198.3670918955613,
|
333 |
+
"count": 239072,
|
334 |
"is_parallel": true,
|
335 |
+
"self": 175.16570653802773,
|
336 |
"children": {
|
337 |
"UnityEnvironment._generate_step_input": {
|
338 |
+
"total": 110.43290661888022,
|
339 |
+
"count": 239072,
|
340 |
"is_parallel": true,
|
341 |
+
"self": 110.43290661888022
|
342 |
},
|
343 |
"communicator.exchange": {
|
344 |
+
"total": 2470.8126502879313,
|
345 |
+
"count": 239072,
|
346 |
"is_parallel": true,
|
347 |
+
"self": 2470.8126502879313
|
348 |
},
|
349 |
"steps_from_proto": {
|
350 |
+
"total": 441.95582845072204,
|
351 |
+
"count": 478144,
|
352 |
"is_parallel": true,
|
353 |
+
"self": 78.3687699053844,
|
354 |
"children": {
|
355 |
"_process_rank_one_or_two_observation": {
|
356 |
+
"total": 363.58705854533764,
|
357 |
+
"count": 1912576,
|
358 |
"is_parallel": true,
|
359 |
+
"self": 363.58705854533764
|
360 |
}
|
361 |
}
|
362 |
}
|
|
|
369 |
}
|
370 |
},
|
371 |
"trainer_advance": {
|
372 |
+
"total": 5371.4315441058425,
|
373 |
+
"count": 239073,
|
374 |
+
"self": 26.83088273082103,
|
375 |
"children": {
|
376 |
"process_trajectory": {
|
377 |
+
"total": 1094.2377518599678,
|
378 |
+
"count": 239073,
|
379 |
+
"self": 1093.3974272879568,
|
380 |
"children": {
|
381 |
"RLTrainer._checkpoint": {
|
382 |
+
"total": 0.8403245720110135,
|
383 |
+
"count": 7,
|
384 |
+
"self": 0.8403245720110135
|
385 |
}
|
386 |
}
|
387 |
},
|
388 |
"_update_policy": {
|
389 |
+
"total": 4250.362909515054,
|
390 |
+
"count": 51,
|
391 |
+
"self": 652.032682771809,
|
392 |
"children": {
|
393 |
"TorchPOCAOptimizer.update": {
|
394 |
+
"total": 3598.3302267432446,
|
395 |
+
"count": 4080,
|
396 |
+
"self": 3598.3302267432446
|
397 |
}
|
398 |
}
|
399 |
}
|
|
|
402 |
}
|
403 |
},
|
404 |
"trainer_threads": {
|
405 |
+
"total": 9.200011845678091e-07,
|
406 |
"count": 1,
|
407 |
+
"self": 9.200011845678091e-07
|
408 |
},
|
409 |
"TrainerController._save_models": {
|
410 |
+
"total": 0.12228448499809019,
|
411 |
"count": 1,
|
412 |
+
"self": 0.0026952329935738817,
|
413 |
"children": {
|
414 |
"RLTrainer._checkpoint": {
|
415 |
+
"total": 0.11958925200451631,
|
416 |
"count": 1,
|
417 |
+
"self": 0.11958925200451631
|
418 |
}
|
419 |
}
|
420 |
}
|
run_logs/training_status.json
CHANGED
@@ -2,59 +2,59 @@
|
|
2 |
"SoccerTwos": {
|
3 |
"checkpoints": [
|
4 |
{
|
5 |
-
"steps":
|
6 |
-
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
7 |
"reward": 0.0,
|
8 |
-
"creation_time":
|
9 |
"auxillary_file_paths": [
|
10 |
-
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
11 |
]
|
12 |
},
|
13 |
{
|
14 |
-
"steps":
|
15 |
-
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
16 |
"reward": 0.0,
|
17 |
-
"creation_time":
|
18 |
"auxillary_file_paths": [
|
19 |
-
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
20 |
]
|
21 |
},
|
22 |
{
|
23 |
-
"steps":
|
24 |
-
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
25 |
"reward": 0.0,
|
26 |
-
"creation_time":
|
27 |
"auxillary_file_paths": [
|
28 |
-
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
29 |
]
|
30 |
},
|
31 |
{
|
32 |
-
"steps":
|
33 |
-
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
34 |
-
"reward":
|
35 |
-
"creation_time":
|
36 |
"auxillary_file_paths": [
|
37 |
-
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
38 |
]
|
39 |
},
|
40 |
{
|
41 |
-
"steps":
|
42 |
-
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
43 |
-
"reward":
|
44 |
-
"creation_time":
|
45 |
"auxillary_file_paths": [
|
46 |
-
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
47 |
]
|
48 |
}
|
49 |
],
|
50 |
-
"elo":
|
51 |
"final_checkpoint": {
|
52 |
-
"steps":
|
53 |
"file_path": "results/SoccerTwos-read-deal/SoccerTwos.onnx",
|
54 |
-
"reward":
|
55 |
-
"creation_time":
|
56 |
"auxillary_file_paths": [
|
57 |
-
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-
|
58 |
]
|
59 |
}
|
60 |
},
|
|
|
2 |
"SoccerTwos": {
|
3 |
"checkpoints": [
|
4 |
{
|
5 |
+
"steps": 8499978,
|
6 |
+
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8499978.onnx",
|
7 |
"reward": 0.0,
|
8 |
+
"creation_time": 1710349255.752344,
|
9 |
"auxillary_file_paths": [
|
10 |
+
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8499978.pt"
|
11 |
]
|
12 |
},
|
13 |
{
|
14 |
+
"steps": 8999988,
|
15 |
+
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8999988.onnx",
|
16 |
"reward": 0.0,
|
17 |
+
"creation_time": 1710350638.0742688,
|
18 |
"auxillary_file_paths": [
|
19 |
+
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-8999988.pt"
|
20 |
]
|
21 |
},
|
22 |
{
|
23 |
+
"steps": 9499993,
|
24 |
+
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9499993.onnx",
|
25 |
"reward": 0.0,
|
26 |
+
"creation_time": 1710352100.153916,
|
27 |
"auxillary_file_paths": [
|
28 |
+
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9499993.pt"
|
29 |
]
|
30 |
},
|
31 |
{
|
32 |
+
"steps": 9999982,
|
33 |
+
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9999982.onnx",
|
34 |
+
"reward": null,
|
35 |
+
"creation_time": 1710353568.109763,
|
36 |
"auxillary_file_paths": [
|
37 |
+
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-9999982.pt"
|
38 |
]
|
39 |
},
|
40 |
{
|
41 |
+
"steps": 10000046,
|
42 |
+
"file_path": "results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.onnx",
|
43 |
+
"reward": null,
|
44 |
+
"creation_time": 1710353568.2486105,
|
45 |
"auxillary_file_paths": [
|
46 |
+
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.pt"
|
47 |
]
|
48 |
}
|
49 |
],
|
50 |
+
"elo": 1607.9046472284606,
|
51 |
"final_checkpoint": {
|
52 |
+
"steps": 10000046,
|
53 |
"file_path": "results/SoccerTwos-read-deal/SoccerTwos.onnx",
|
54 |
+
"reward": null,
|
55 |
+
"creation_time": 1710353568.2486105,
|
56 |
"auxillary_file_paths": [
|
57 |
+
"results/SoccerTwos-read-deal/SoccerTwos/SoccerTwos-10000046.pt"
|
58 |
]
|
59 |
}
|
60 |
},
|