ralphkalweit commited on
Commit
af19fb7
1 Parent(s): 1172dd1
SnowballTarget.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:805e29e0dea258fbd8c62872a54af02145490c17f9184fab00b1741ec6db6703
3
- size 1814028
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:739867ba7af7748404f94c816b00d286afa7e11d7cd9f1ebed05fadeb7f12a43
3
+ size 1815958
SnowballTarget/SnowballTarget-149960.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55af2d7d6ae2a3f78dad67044b2439c23833600a3eb4666e3a3cdf461e47a554
3
+ size 1815958
SnowballTarget/SnowballTarget-149960.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcd077db07ffd06478179c7cdf690360cfedbcf52f0fd854479a36c54deb641e
3
+ size 10820443
SnowballTarget/SnowballTarget-199920.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:592efa674896e88c882d6746192ef76d65899f3eed065ac55fecda7766d66799
3
+ size 1815958
SnowballTarget/SnowballTarget-199920.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6db8bddd751d09abd4249f553f79f76e55a03d73f0f690154c3f01eeee4e2200
3
+ size 10820443
SnowballTarget/SnowballTarget-249936.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8924c5496f256cc76f5cce8bf3caa9fef1e23d0dc5b8a1ffeb9cec87749f392
3
+ size 1815958
SnowballTarget/SnowballTarget-249936.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e0c6f559fa3ed5d24bdd42b2e817133eea5479e728a06007020df6adaf18f8d
3
+ size 10820443
SnowballTarget/SnowballTarget-299960.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:739867ba7af7748404f94c816b00d286afa7e11d7cd9f1ebed05fadeb7f12a43
3
+ size 1815958
SnowballTarget/SnowballTarget-299960.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1319ffe0ee9795eae2024ab20b3d0491544ec2d0d82e33181efc1fb239c2397b
3
+ size 10820443
SnowballTarget/SnowballTarget-300104.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:739867ba7af7748404f94c816b00d286afa7e11d7cd9f1ebed05fadeb7f12a43
3
+ size 1815958
SnowballTarget/SnowballTarget-300104.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bb3e089c9c1356722dd5fc36b2b28bca88387f7f5f51d363830049edb3728cc
3
+ size 10820443
SnowballTarget/SnowballTarget-49936.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6ce0767b17bc1279f52e7a88f4198ef9df37230bb5286a461701972e12b80af
3
+ size 1815958
SnowballTarget/SnowballTarget-49936.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15e9da38f5d2984bf5ad6f7d916b95ad52dec7fc9b98f33db7df32c77f857328
3
+ size 10820368
SnowballTarget/SnowballTarget-65208.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54702bcc3faf852f8d2458bb78c1c597e798b64e234cd62fe87c261b012402e0
3
+ size 1815958
SnowballTarget/SnowballTarget-65208.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85e663874e57e193a2bdb19cbeecc618cd7a7b89b888f389b79684ca607e5659
3
+ size 10820368
SnowballTarget/SnowballTarget-99976.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6e990377f6720a7f221ac05634e39a4c010283a5f91ac29f9ca08568964882b
3
+ size 1815958
SnowballTarget/SnowballTarget-99976.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fed0bceb406c744f44ca476dbde64fefc11a99b90589ac3d187afdb05f1186db
3
+ size 10820368
SnowballTarget/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c621c2632c09f83f09e139e60c0c3c9f0f79fe73e945535d315ae0179bbe6556
3
- size 3609442
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae597bb36e897b39e227449638d7353c978ed00c48b77139b6b7b73002ded789
3
+ size 10819618
SnowballTarget/events.out.tfevents.1720249336.c27fe8d53be1.6080.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d46cddf19726e5ce3f477f3a4ad93c50358f2dacd22f7957bbe237877c2a827d
3
+ size 25937
SnowballTarget/events.out.tfevents.1720249498.c27fe8d53be1.6821.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:223f8baa20bbd277f6daa66ae2f5343512fa7fca94648bf02feabc72fdc165ee
3
+ size 27266
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 256, "buffer_size": 10240, "learning_rate": 0.0002, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 220000, "time_horizon": 128, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 256, "buffer_size": 10240, "learning_rate": 0.0002, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 300000, "time_horizon": 128, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -38,7 +38,7 @@ behaviors:
38
  init_path: null
39
  keep_checkpoints: 10
40
  even_checkpoints: false
41
- max_steps: 220000
42
  time_horizon: 128
43
  summary_freq: 10000
44
  threaded: true
@@ -69,7 +69,7 @@ checkpoint_settings:
69
  run_id: SnowballTarget1
70
  initialize_from: null
71
  load_model: false
72
- resume: false
73
  force: false
74
  train_model: false
75
  inference: false
 
38
  init_path: null
39
  keep_checkpoints: 10
40
  even_checkpoints: false
41
+ max_steps: 300000
42
  time_horizon: 128
43
  summary_freq: 10000
44
  threaded: true
 
69
  run_id: SnowballTarget1
70
  initialize_from: null
71
  load_model: false
72
+ resume: true
73
  force: false
74
  train_model: false
75
  inference: false
run_logs/Player-0.log CHANGED
@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarge
2
  Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
3
  Preloaded 'lib_burst_generated.so'
4
  Preloaded 'libgrpc_csharp_ext.x64.so'
5
- PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
6
- PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
7
- Unable to load player prefs
8
  Initialize engine version: 2021.3.14f1 (eee1884e7226)
9
  [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
10
  Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
34
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
35
  FMOD initialized on nosound output
36
  Begin MonoManager ReloadAssembly
37
- - Completed reload, in 0.091 seconds
38
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
39
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
40
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
45
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
46
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
47
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
48
- UnloadTime: 0.853906 ms
49
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
50
  requesting resize 84 x 84
51
  Setting up 1 worker threads for Enlighten.
@@ -53,7 +50,7 @@ Memory Statistics:
53
  [ALLOC_TEMP_TLS] TLS Allocator
54
  StackAllocators :
55
  [ALLOC_TEMP_MAIN]
56
- Peak usage frame count: [8.0 KB-16.0 KB]: 159 frames, [16.0 KB-32.0 KB]: 2 frames, [2.0 MB-4.0 MB]: 1 frames
57
  Initial Block Size 4.0 MB
58
  Current Block Size 4.0 MB
59
  Peak Allocated Bytes 2.0 MB
@@ -169,19 +166,19 @@ Memory Statistics:
169
  Peak Allocated Bytes 0 B
170
  Overflow Count 0
171
  [ALLOC_DEFAULT] Dual Thread Allocator
172
- Peak main deferred allocation count 36
173
  [ALLOC_BUCKET]
174
  Large Block size 4.0 MB
175
  Used Block count 1
176
  Peak Allocated bytes 1.0 MB
177
  [ALLOC_DEFAULT_MAIN]
178
- Peak usage frame count: [4.0 MB-8.0 MB]: 162 frames
179
  Requested Block Size 16.0 MB
180
  Peak Block count 1
181
- Peak Allocated memory 5.2 MB
182
  Peak Large allocation bytes 0 B
183
  [ALLOC_DEFAULT_THREAD]
184
- Peak usage frame count: [16.0 MB-32.0 MB]: 162 frames
185
  Requested Block Size 16.0 MB
186
  Peak Block count 1
187
  Peak Allocated memory 17.8 MB
@@ -213,13 +210,13 @@ Memory Statistics:
213
  Used Block count 1
214
  Peak Allocated bytes 1.0 MB
215
  [ALLOC_GFX_MAIN]
216
- Peak usage frame count: [32.0 KB-64.0 KB]: 152 frames, [64.0 KB-128.0 KB]: 10 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
- Peak Allocated memory 65.6 KB
220
  Peak Large allocation bytes 0 B
221
  [ALLOC_GFX_THREAD]
222
- Peak usage frame count: [32.0 KB-64.0 KB]: 162 frames
223
  Requested Block Size 16.0 MB
224
  Peak Block count 1
225
  Peak Allocated memory 39.6 KB
@@ -231,13 +228,13 @@ Memory Statistics:
231
  Used Block count 1
232
  Peak Allocated bytes 1.0 MB
233
  [ALLOC_CACHEOBJECTS_MAIN]
234
- Peak usage frame count: [0.5 MB-1.0 MB]: 162 frames
235
  Requested Block Size 4.0 MB
236
  Peak Block count 1
237
  Peak Allocated memory 0.6 MB
238
  Peak Large allocation bytes 0 B
239
  [ALLOC_CACHEOBJECTS_THREAD]
240
- Peak usage frame count: [0.5 MB-1.0 MB]: 161 frames, [2.0 MB-4.0 MB]: 1 frames
241
  Requested Block Size 4.0 MB
242
  Peak Block count 1
243
  Peak Allocated memory 2.2 MB
@@ -249,13 +246,13 @@ Memory Statistics:
249
  Used Block count 1
250
  Peak Allocated bytes 1.0 MB
251
  [ALLOC_TYPETREE_MAIN]
252
- Peak usage frame count: [0-1.0 KB]: 162 frames
253
  Requested Block Size 2.0 MB
254
  Peak Block count 1
255
  Peak Allocated memory 1.0 KB
256
  Peak Large allocation bytes 0 B
257
  [ALLOC_TYPETREE_THREAD]
258
- Peak usage frame count: [1.0 KB-2.0 KB]: 162 frames
259
  Requested Block Size 2.0 MB
260
  Peak Block count 1
261
  Peak Allocated memory 1.7 KB
 
2
  Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
3
  Preloaded 'lib_burst_generated.so'
4
  Preloaded 'libgrpc_csharp_ext.x64.so'
 
 
 
5
  Initialize engine version: 2021.3.14f1 (eee1884e7226)
6
  [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
7
  Forcing GfxDevice: Null
 
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
+ - Completed reload, in 0.090 seconds
35
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
42
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
43
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
44
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
45
+ UnloadTime: 0.659639 ms
46
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
47
  requesting resize 84 x 84
48
  Setting up 1 worker threads for Enlighten.
 
50
  [ALLOC_TEMP_TLS] TLS Allocator
51
  StackAllocators :
52
  [ALLOC_TEMP_MAIN]
53
+ Peak usage frame count: [8.0 KB-16.0 KB]: 6315 frames, [16.0 KB-32.0 KB]: 107 frames, [2.0 MB-4.0 MB]: 1 frames
54
  Initial Block Size 4.0 MB
55
  Current Block Size 4.0 MB
56
  Peak Allocated Bytes 2.0 MB
 
166
  Peak Allocated Bytes 0 B
167
  Overflow Count 0
168
  [ALLOC_DEFAULT] Dual Thread Allocator
169
+ Peak main deferred allocation count 44
170
  [ALLOC_BUCKET]
171
  Large Block size 4.0 MB
172
  Used Block count 1
173
  Peak Allocated bytes 1.0 MB
174
  [ALLOC_DEFAULT_MAIN]
175
+ Peak usage frame count: [4.0 MB-8.0 MB]: 6423 frames
176
  Requested Block Size 16.0 MB
177
  Peak Block count 1
178
+ Peak Allocated memory 7.0 MB
179
  Peak Large allocation bytes 0 B
180
  [ALLOC_DEFAULT_THREAD]
181
+ Peak usage frame count: [16.0 MB-32.0 MB]: 6423 frames
182
  Requested Block Size 16.0 MB
183
  Peak Block count 1
184
  Peak Allocated memory 17.8 MB
 
210
  Used Block count 1
211
  Peak Allocated bytes 1.0 MB
212
  [ALLOC_GFX_MAIN]
213
+ Peak usage frame count: [32.0 KB-64.0 KB]: 5024 frames, [64.0 KB-128.0 KB]: 1399 frames
214
  Requested Block Size 16.0 MB
215
  Peak Block count 1
216
+ Peak Allocated memory 66.8 KB
217
  Peak Large allocation bytes 0 B
218
  [ALLOC_GFX_THREAD]
219
+ Peak usage frame count: [32.0 KB-64.0 KB]: 6423 frames
220
  Requested Block Size 16.0 MB
221
  Peak Block count 1
222
  Peak Allocated memory 39.6 KB
 
228
  Used Block count 1
229
  Peak Allocated bytes 1.0 MB
230
  [ALLOC_CACHEOBJECTS_MAIN]
231
+ Peak usage frame count: [0.5 MB-1.0 MB]: 6423 frames
232
  Requested Block Size 4.0 MB
233
  Peak Block count 1
234
  Peak Allocated memory 0.6 MB
235
  Peak Large allocation bytes 0 B
236
  [ALLOC_CACHEOBJECTS_THREAD]
237
+ Peak usage frame count: [0.5 MB-1.0 MB]: 6422 frames, [2.0 MB-4.0 MB]: 1 frames
238
  Requested Block Size 4.0 MB
239
  Peak Block count 1
240
  Peak Allocated memory 2.2 MB
 
246
  Used Block count 1
247
  Peak Allocated bytes 1.0 MB
248
  [ALLOC_TYPETREE_MAIN]
249
+ Peak usage frame count: [0-1.0 KB]: 6423 frames
250
  Requested Block Size 2.0 MB
251
  Peak Block count 1
252
  Peak Allocated memory 1.0 KB
253
  Peak Large allocation bytes 0 B
254
  [ALLOC_TYPETREE_THREAD]
255
+ Peak usage frame count: [1.0 KB-2.0 KB]: 6423 frames
256
  Requested Block Size 2.0 MB
257
  Peak Block count 1
258
  Peak Allocated memory 1.7 KB
run_logs/timers.json CHANGED
@@ -1,68 +1,214 @@
1
  {
2
  "name": "root",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "metadata": {
4
  "timer_format_version": "0.1.0",
5
- "start_time_seconds": "1720249254",
6
  "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
7
- "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
8
  "mlagents_version": "1.1.0.dev0",
9
  "mlagents_envs_version": "1.1.0.dev0",
10
  "communication_protocol_version": "1.5.0",
11
  "pytorch_version": "2.3.0+cu121",
12
  "numpy_version": "1.23.5",
13
- "end_time_seconds": "1720249270"
14
  },
15
- "total": 16.25279369099985,
16
  "count": 1,
17
- "self": 0.14720840399991175,
18
  "children": {
19
  "run_training.setup": {
20
- "total": 0.05964862199994059,
21
  "count": 1,
22
- "self": 0.05964862199994059
23
  },
24
  "TrainerController.start_learning": {
25
- "total": 16.045936665,
26
  "count": 1,
27
- "self": 0.01878256399845668,
28
  "children": {
29
  "TrainerController._reset_env": {
30
- "total": 2.8109563699999853,
31
  "count": 1,
32
- "self": 2.8109563699999853
33
  },
34
  "TrainerController.advance": {
35
- "total": 12.917836443001534,
36
- "count": 540,
37
- "self": 0.008619109001074321,
38
  "children": {
39
  "env_step": {
40
- "total": 12.90921733400046,
41
- "count": 540,
42
- "self": 8.603649299005383,
43
  "children": {
44
  "SubprocessEnvManager._take_step": {
45
- "total": 4.296834380997325,
46
- "count": 540,
47
- "self": 0.04560909600172636,
48
  "children": {
49
  "TorchPolicy.evaluate": {
50
- "total": 4.2512252849955985,
51
- "count": 540,
52
- "self": 4.2512252849955985
53
  }
54
  }
55
  },
56
  "workers": {
57
- "total": 0.00873365399775139,
58
- "count": 539,
59
  "self": 0.0,
60
  "children": {
61
  "worker_root": {
62
- "total": 15.742622637999375,
63
- "count": 539,
64
  "is_parallel": true,
65
- "self": 8.727718367001216,
66
  "children": {
67
  "run_training.setup": {
68
  "total": 0.0,
@@ -71,48 +217,48 @@
71
  "self": 0.0,
72
  "children": {
73
  "steps_from_proto": {
74
- "total": 0.00549071799991907,
75
  "count": 1,
76
  "is_parallel": true,
77
- "self": 0.0039051780001955194,
78
  "children": {
79
  "_process_rank_one_or_two_observation": {
80
- "total": 0.0015855399997235509,
81
  "count": 10,
82
  "is_parallel": true,
83
- "self": 0.0015855399997235509
84
  }
85
  }
86
  },
87
  "UnityEnvironment.step": {
88
- "total": 0.06512434399996891,
89
  "count": 1,
90
  "is_parallel": true,
91
- "self": 0.0006391009999333619,
92
  "children": {
93
  "UnityEnvironment._generate_step_input": {
94
- "total": 0.0003716569999596686,
95
  "count": 1,
96
  "is_parallel": true,
97
- "self": 0.0003716569999596686
98
  },
99
  "communicator.exchange": {
100
- "total": 0.06223896100004822,
101
  "count": 1,
102
  "is_parallel": true,
103
- "self": 0.06223896100004822
104
  },
105
  "steps_from_proto": {
106
- "total": 0.0018746250000276632,
107
  "count": 1,
108
  "is_parallel": true,
109
- "self": 0.0003390939998553222,
110
  "children": {
111
  "_process_rank_one_or_two_observation": {
112
- "total": 0.001535531000172341,
113
  "count": 10,
114
  "is_parallel": true,
115
- "self": 0.001535531000172341
116
  }
117
  }
118
  }
@@ -121,34 +267,34 @@
121
  }
122
  },
123
  "UnityEnvironment.step": {
124
- "total": 7.014904270998159,
125
- "count": 538,
126
  "is_parallel": true,
127
- "self": 0.3154182389998823,
128
  "children": {
129
  "UnityEnvironment._generate_step_input": {
130
- "total": 0.1720740619987282,
131
- "count": 538,
132
  "is_parallel": true,
133
- "self": 0.1720740619987282
134
  },
135
  "communicator.exchange": {
136
- "total": 5.432349116000751,
137
- "count": 538,
138
  "is_parallel": true,
139
- "self": 5.432349116000751
140
  },
141
  "steps_from_proto": {
142
- "total": 1.0950628539987974,
143
- "count": 538,
144
  "is_parallel": true,
145
- "self": 0.21312870899510017,
146
  "children": {
147
  "_process_rank_one_or_two_observation": {
148
- "total": 0.8819341450036973,
149
- "count": 5380,
150
  "is_parallel": true,
151
- "self": 0.8819341450036973
152
  }
153
  }
154
  }
@@ -163,9 +309,9 @@
163
  }
164
  },
165
  "trainer_threads": {
166
- "total": 2.2120000039649312e-05,
167
  "count": 1,
168
- "self": 2.2120000039649312e-05,
169
  "children": {
170
  "thread_root": {
171
  "total": 0.0,
@@ -174,16 +320,38 @@
174
  "self": 0.0,
175
  "children": {
176
  "trainer_advance": {
177
- "total": 12.58680932998277,
178
- "count": 38900,
179
  "is_parallel": true,
180
- "self": 0.7406553219732359,
181
  "children": {
182
  "process_trajectory": {
183
- "total": 11.846154008009535,
184
- "count": 38900,
185
  "is_parallel": true,
186
- "self": 11.846154008009535
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
187
  }
188
  }
189
  }
@@ -192,14 +360,14 @@
192
  }
193
  },
194
  "TrainerController._save_models": {
195
- "total": 0.29833916799998406,
196
  "count": 1,
197
- "self": 0.002305101999809267,
198
  "children": {
199
  "RLTrainer._checkpoint": {
200
- "total": 0.2960340660001748,
201
  "count": 1,
202
- "self": 0.2960340660001748
203
  }
204
  }
205
  }
 
1
  {
2
  "name": "root",
3
+ "gauges": {
4
+ "SnowballTarget.Policy.Entropy.mean": {
5
+ "value": 1.8118195533752441,
6
+ "min": 1.8118195533752441,
7
+ "max": 2.771235704421997,
8
+ "count": 24
9
+ },
10
+ "SnowballTarget.Policy.Entropy.sum": {
11
+ "value": 17378.97265625,
12
+ "min": 16125.8203125,
13
+ "max": 27430.41796875,
14
+ "count": 24
15
+ },
16
+ "SnowballTarget.Step.mean": {
17
+ "value": 299960.0,
18
+ "min": 69992.0,
19
+ "max": 299960.0,
20
+ "count": 24
21
+ },
22
+ "SnowballTarget.Step.sum": {
23
+ "value": 299960.0,
24
+ "min": 69992.0,
25
+ "max": 299960.0,
26
+ "count": 24
27
+ },
28
+ "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
29
+ "value": 8.524247169494629,
30
+ "min": 1.3393324613571167,
31
+ "max": 8.524247169494629,
32
+ "count": 24
33
+ },
34
+ "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
35
+ "value": 835.376220703125,
36
+ "min": 62.94862747192383,
37
+ "max": 854.62353515625,
38
+ "count": 24
39
+ },
40
+ "SnowballTarget.Environment.EpisodeLength.mean": {
41
+ "value": 199.0,
42
+ "min": 199.0,
43
+ "max": 199.0,
44
+ "count": 24
45
+ },
46
+ "SnowballTarget.Environment.EpisodeLength.sum": {
47
+ "value": 10945.0,
48
+ "min": 4378.0,
49
+ "max": 10945.0,
50
+ "count": 24
51
+ },
52
+ "SnowballTarget.Environment.CumulativeReward.mean": {
53
+ "value": 19.608695652173914,
54
+ "min": 7.2727272727272725,
55
+ "max": 20.5,
56
+ "count": 24
57
+ },
58
+ "SnowballTarget.Environment.CumulativeReward.sum": {
59
+ "value": 902.0,
60
+ "min": 160.0,
61
+ "max": 1069.0,
62
+ "count": 24
63
+ },
64
+ "SnowballTarget.Policy.ExtrinsicReward.mean": {
65
+ "value": 19.608695652173914,
66
+ "min": 7.2727272727272725,
67
+ "max": 20.5,
68
+ "count": 24
69
+ },
70
+ "SnowballTarget.Policy.ExtrinsicReward.sum": {
71
+ "value": 902.0,
72
+ "min": 160.0,
73
+ "max": 1069.0,
74
+ "count": 24
75
+ },
76
+ "SnowballTarget.IsTraining.mean": {
77
+ "value": 1.0,
78
+ "min": 1.0,
79
+ "max": 1.0,
80
+ "count": 24
81
+ },
82
+ "SnowballTarget.IsTraining.sum": {
83
+ "value": 1.0,
84
+ "min": 1.0,
85
+ "max": 1.0,
86
+ "count": 24
87
+ },
88
+ "SnowballTarget.Losses.PolicyLoss.mean": {
89
+ "value": 0.046152475377773894,
90
+ "min": 0.045261845252724246,
91
+ "max": 0.05613040942273709,
92
+ "count": 21
93
+ },
94
+ "SnowballTarget.Losses.PolicyLoss.sum": {
95
+ "value": 0.046152475377773894,
96
+ "min": 0.045261845252724246,
97
+ "max": 0.05613040942273709,
98
+ "count": 21
99
+ },
100
+ "SnowballTarget.Losses.ValueLoss.mean": {
101
+ "value": 0.2707705969611804,
102
+ "min": 0.2489233562161052,
103
+ "max": 0.31760141750176746,
104
+ "count": 21
105
+ },
106
+ "SnowballTarget.Losses.ValueLoss.sum": {
107
+ "value": 0.2707705969611804,
108
+ "min": 0.2489233562161052,
109
+ "max": 0.31760141750176746,
110
+ "count": 21
111
+ },
112
+ "SnowballTarget.Policy.LearningRate.mean": {
113
+ "value": 3.056098471999992e-06,
114
+ "min": 3.056098471999992e-06,
115
+ "max": 0.00014962669185333328,
116
+ "count": 21
117
+ },
118
+ "SnowballTarget.Policy.LearningRate.sum": {
119
+ "value": 3.056098471999992e-06,
120
+ "min": 3.056098471999992e-06,
121
+ "max": 0.00014962669185333328,
122
+ "count": 21
123
+ },
124
+ "SnowballTarget.Policy.Epsilon.mean": {
125
+ "value": 0.10152800000000005,
126
+ "min": 0.10152800000000005,
127
+ "max": 0.1748133333333333,
128
+ "count": 21
129
+ },
130
+ "SnowballTarget.Policy.Epsilon.sum": {
131
+ "value": 0.10152800000000005,
132
+ "min": 0.10152800000000005,
133
+ "max": 0.1748133333333333,
134
+ "count": 21
135
+ },
136
+ "SnowballTarget.Policy.Beta.mean": {
137
+ "value": 0.00016264719999999966,
138
+ "min": 0.00016264719999999966,
139
+ "max": 0.007483852,
140
+ "count": 21
141
+ },
142
+ "SnowballTarget.Policy.Beta.sum": {
143
+ "value": 0.00016264719999999966,
144
+ "min": 0.00016264719999999966,
145
+ "max": 0.007483852,
146
+ "count": 21
147
+ }
148
+ },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
+ "start_time_seconds": "1720249497",
152
  "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
153
+ "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --resume",
154
  "mlagents_version": "1.1.0.dev0",
155
  "mlagents_envs_version": "1.1.0.dev0",
156
  "communication_protocol_version": "1.5.0",
157
  "pytorch_version": "2.3.0+cu121",
158
  "numpy_version": "1.23.5",
159
+ "end_time_seconds": "1720250049"
160
  },
161
+ "total": 552.2202583549999,
162
  "count": 1,
163
+ "self": 0.42978697499984264,
164
  "children": {
165
  "run_training.setup": {
166
+ "total": 0.05920954599992001,
167
  "count": 1,
168
+ "self": 0.05920954599992001
169
  },
170
  "TrainerController.start_learning": {
171
+ "total": 551.7312618340002,
172
  "count": 1,
173
+ "self": 0.7641373830313114,
174
  "children": {
175
  "TrainerController._reset_env": {
176
+ "total": 2.0999622650001584,
177
  "count": 1,
178
+ "self": 2.0999622650001584
179
  },
180
  "TrainerController.advance": {
181
+ "total": 548.7307076829686,
182
+ "count": 21407,
183
+ "self": 0.3434664609551419,
184
  "children": {
185
  "env_step": {
186
+ "total": 548.3872412220135,
187
+ "count": 21407,
188
+ "self": 357.6078869710309,
189
  "children": {
190
  "SubprocessEnvManager._take_step": {
191
+ "total": 190.41055164898262,
192
+ "count": 21407,
193
+ "self": 1.8487056709798253,
194
  "children": {
195
  "TorchPolicy.evaluate": {
196
+ "total": 188.5618459780028,
197
+ "count": 21407,
198
+ "self": 188.5618459780028
199
  }
200
  }
201
  },
202
  "workers": {
203
+ "total": 0.36880260199995973,
204
+ "count": 21407,
205
  "self": 0.0,
206
  "children": {
207
  "worker_root": {
208
+ "total": 550.1251846769994,
209
+ "count": 21407,
210
  "is_parallel": true,
211
+ "self": 269.83681195401164,
212
  "children": {
213
  "run_training.setup": {
214
  "total": 0.0,
 
217
  "self": 0.0,
218
  "children": {
219
  "steps_from_proto": {
220
+ "total": 0.0026616340001055505,
221
  "count": 1,
222
  "is_parallel": true,
223
+ "self": 0.0008052370003497344,
224
  "children": {
225
  "_process_rank_one_or_two_observation": {
226
+ "total": 0.001856396999755816,
227
  "count": 10,
228
  "is_parallel": true,
229
+ "self": 0.001856396999755816
230
  }
231
  }
232
  },
233
  "UnityEnvironment.step": {
234
+ "total": 0.045671846000004734,
235
  "count": 1,
236
  "is_parallel": true,
237
+ "self": 0.000765755999736939,
238
  "children": {
239
  "UnityEnvironment._generate_step_input": {
240
+ "total": 0.000451747000170144,
241
  "count": 1,
242
  "is_parallel": true,
243
+ "self": 0.000451747000170144
244
  },
245
  "communicator.exchange": {
246
+ "total": 0.04220969600009994,
247
  "count": 1,
248
  "is_parallel": true,
249
+ "self": 0.04220969600009994
250
  },
251
  "steps_from_proto": {
252
+ "total": 0.0022446469999977126,
253
  "count": 1,
254
  "is_parallel": true,
255
+ "self": 0.0004208880002352089,
256
  "children": {
257
  "_process_rank_one_or_two_observation": {
258
+ "total": 0.0018237589997625037,
259
  "count": 10,
260
  "is_parallel": true,
261
+ "self": 0.0018237589997625037
262
  }
263
  }
264
  }
 
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
+ "total": 280.2883727229878,
271
+ "count": 21406,
272
  "is_parallel": true,
273
+ "self": 12.630060233967242,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
+ "total": 6.792817600001172,
277
+ "count": 21406,
278
  "is_parallel": true,
279
+ "self": 6.792817600001172
280
  },
281
  "communicator.exchange": {
282
+ "total": 218.07006982201506,
283
+ "count": 21406,
284
  "is_parallel": true,
285
+ "self": 218.07006982201506
286
  },
287
  "steps_from_proto": {
288
+ "total": 42.79542506700432,
289
+ "count": 21406,
290
  "is_parallel": true,
291
+ "self": 8.107294056017963,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
+ "total": 34.68813101098635,
295
+ "count": 214060,
296
  "is_parallel": true,
297
+ "self": 34.68813101098635
298
  }
299
  }
300
  }
 
309
  }
310
  },
311
  "trainer_threads": {
312
+ "total": 0.00023989800001800177,
313
  "count": 1,
314
+ "self": 0.00023989800001800177,
315
  "children": {
316
  "thread_root": {
317
  "total": 0.0,
 
320
  "self": 0.0,
321
  "children": {
322
  "trainer_advance": {
323
+ "total": 539.1018590201095,
324
+ "count": 1085599,
325
  "is_parallel": true,
326
+ "self": 24.56119199611271,
327
  "children": {
328
  "process_trajectory": {
329
+ "total": 362.60708646899616,
330
+ "count": 1085599,
331
  "is_parallel": true,
332
+ "self": 361.4931656489964,
333
+ "children": {
334
+ "RLTrainer._checkpoint": {
335
+ "total": 1.1139208199997483,
336
+ "count": 5,
337
+ "is_parallel": true,
338
+ "self": 1.1139208199997483
339
+ }
340
+ }
341
+ },
342
+ "_update_policy": {
343
+ "total": 151.93358055500062,
344
+ "count": 21,
345
+ "is_parallel": true,
346
+ "self": 69.69792452899833,
347
+ "children": {
348
+ "TorchPPOOptimizer.update": {
349
+ "total": 82.23565602600229,
350
+ "count": 2640,
351
+ "is_parallel": true,
352
+ "self": 82.23565602600229
353
+ }
354
+ }
355
  }
356
  }
357
  }
 
360
  }
361
  },
362
  "TrainerController._save_models": {
363
+ "total": 0.13621460500007743,
364
  "count": 1,
365
+ "self": 0.0026471169999240374,
366
  "children": {
367
  "RLTrainer._checkpoint": {
368
+ "total": 0.1335674880001534,
369
  "count": 1,
370
+ "self": 0.1335674880001534
371
  }
372
  }
373
  }
run_logs/training_status.json CHANGED
@@ -9,15 +9,87 @@
9
  "auxillary_file_paths": [
10
  "results/SnowballTarget1/SnowballTarget/SnowballTarget-5808.pt"
11
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  }
13
  ],
14
  "final_checkpoint": {
15
- "steps": 5808,
16
  "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
17
- "reward": 3.227272727272727,
18
- "creation_time": 1720249270.666838,
19
  "auxillary_file_paths": [
20
- "results/SnowballTarget1/SnowballTarget/SnowballTarget-5808.pt"
21
  ]
22
  }
23
  },
 
9
  "auxillary_file_paths": [
10
  "results/SnowballTarget1/SnowballTarget/SnowballTarget-5808.pt"
11
  ]
12
+ },
13
+ {
14
+ "steps": 49936,
15
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
16
+ "reward": 6.636363636363637,
17
+ "creation_time": 1720249445.0350823,
18
+ "auxillary_file_paths": [
19
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
20
+ ]
21
+ },
22
+ {
23
+ "steps": 65208,
24
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-65208.onnx",
25
+ "reward": 6.606060606060606,
26
+ "creation_time": 1720249477.8707228,
27
+ "auxillary_file_paths": [
28
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-65208.pt"
29
+ ]
30
+ },
31
+ {
32
+ "steps": 99976,
33
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99976.onnx",
34
+ "reward": 9.1875,
35
+ "creation_time": 1720249581.9225633,
36
+ "auxillary_file_paths": [
37
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-99976.pt"
38
+ ]
39
+ },
40
+ {
41
+ "steps": 149960,
42
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149960.onnx",
43
+ "reward": 13.295454545454545,
44
+ "creation_time": 1720249696.0399718,
45
+ "auxillary_file_paths": [
46
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-149960.pt"
47
+ ]
48
+ },
49
+ {
50
+ "steps": 199920,
51
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199920.onnx",
52
+ "reward": 16.5,
53
+ "creation_time": 1720249815.2746449,
54
+ "auxillary_file_paths": [
55
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-199920.pt"
56
+ ]
57
+ },
58
+ {
59
+ "steps": 249936,
60
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-249936.onnx",
61
+ "reward": 18.51851851851852,
62
+ "creation_time": 1720249928.8175292,
63
+ "auxillary_file_paths": [
64
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-249936.pt"
65
+ ]
66
+ },
67
+ {
68
+ "steps": 299960,
69
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-299960.onnx",
70
+ "reward": 19.75,
71
+ "creation_time": 1720250049.0235999,
72
+ "auxillary_file_paths": [
73
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-299960.pt"
74
+ ]
75
+ },
76
+ {
77
+ "steps": 300104,
78
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-300104.onnx",
79
+ "reward": 19.576923076923077,
80
+ "creation_time": 1720250049.1946568,
81
+ "auxillary_file_paths": [
82
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-300104.pt"
83
+ ]
84
  }
85
  ],
86
  "final_checkpoint": {
87
+ "steps": 300104,
88
  "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
89
+ "reward": 19.576923076923077,
90
+ "creation_time": 1720250049.1946568,
91
  "auxillary_file_paths": [
92
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-300104.pt"
93
  ]
94
  }
95
  },