adhisetiawan committed on Mar 27, 2023

Commit

3ee64fc

•

1 Parent(s): bdbd567

change number of layers

Browse files

Files changed (18) hide show

SnowballTarget.onnx +2 -2
SnowballTarget/SnowballTarget-149984.onnx +2 -2
SnowballTarget/SnowballTarget-149984.pt +2 -2
SnowballTarget/SnowballTarget-199984.onnx +2 -2
SnowballTarget/SnowballTarget-199984.pt +2 -2
SnowballTarget/SnowballTarget-200112.onnx +2 -2
SnowballTarget/SnowballTarget-200112.pt +2 -2
SnowballTarget/SnowballTarget-49936.onnx +2 -2
SnowballTarget/SnowballTarget-49936.pt +2 -2
SnowballTarget/SnowballTarget-99960.onnx +2 -2
SnowballTarget/SnowballTarget-99960.pt +2 -2
SnowballTarget/checkpoint.pt +2 -2
SnowballTarget/{events.out.tfevents.1679902715.efb1629e622b.2657.0 → events.out.tfevents.1679908425.efb1629e622b.26805.0} +2 -2
config.json +1 -1
configuration.yaml +2 -2
run_logs/Player-0.log +12 -15
run_logs/timers.json +111 -111
run_logs/training_status.json +12 -12

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d7e2c5d3bd5a7b681a7452c45a6330d1923dded42f78f3d54f109b838eadc3e5
-size 646532

 version https://git-lfs.github.com/spec/v1
+oid sha256:510fffc23a002d6bc4c199621b6f673a1ed128eed7f99a2a3a4f4194a723e173
+size 910131

SnowballTarget/SnowballTarget-149984.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2cb42f8d4c0886137a71f8212e60fea4e163330ba0274a45b3d1223915bd4946
-size 646532

 version https://git-lfs.github.com/spec/v1
+oid sha256:fbca599c83610ecdad2c6f9d8a66442440a2840c24aa0c33b3f20cd6d9031ccd
+size 910131

SnowballTarget/SnowballTarget-149984.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d00dc1534137383652074b3ef6ef78bb79f12a2215816e432b898ba4a030eac3
-size 3843968

 version https://git-lfs.github.com/spec/v1
+oid sha256:c2f085bd423c674e2558e9c02b3e195d97608821a937c1e3c1de22c6cb01b2d7
+size 5426908

SnowballTarget/SnowballTarget-199984.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d7e2c5d3bd5a7b681a7452c45a6330d1923dded42f78f3d54f109b838eadc3e5
-size 646532

 version https://git-lfs.github.com/spec/v1
+oid sha256:510fffc23a002d6bc4c199621b6f673a1ed128eed7f99a2a3a4f4194a723e173
+size 910131

SnowballTarget/SnowballTarget-199984.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:db09a26a9d209ff31a03d4d95352e2a3151141ed9e0c2dc5edb43b052022a889
-size 3843968

 version https://git-lfs.github.com/spec/v1
+oid sha256:41ce224edaf67a70520a025f68c2be3a3c7c0a6d7ee46f38489058191817b78b
+size 5426908

SnowballTarget/SnowballTarget-200112.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d7e2c5d3bd5a7b681a7452c45a6330d1923dded42f78f3d54f109b838eadc3e5
-size 646532

 version https://git-lfs.github.com/spec/v1
+oid sha256:510fffc23a002d6bc4c199621b6f673a1ed128eed7f99a2a3a4f4194a723e173
+size 910131

SnowballTarget/SnowballTarget-200112.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f160aaa60e9e1272e249e32e757a6cf4c08efb8fd6be98b9d61683dcb9417dc0
-size 3843968

 version https://git-lfs.github.com/spec/v1
+oid sha256:da66ee1bddfded35b863053faaed30ae4d70826e2e4b3eafbf0e073fac71638e
+size 5426908

SnowballTarget/SnowballTarget-49936.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2f95aaec83d4aa6c3a740903c7e27882f499df754a2affb5d692e2fc5c4f8827
-size 646532

 version https://git-lfs.github.com/spec/v1
+oid sha256:13eb0df36312a46fdd37125cf03bc8395537f1a17eeab36b9382829a9404a6b3
+size 910131

SnowballTarget/SnowballTarget-49936.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:964b4c29ac96e4b711da3d56aea89191ab20c7bceac794004ebced0802af55c0
-size 3843968

 version https://git-lfs.github.com/spec/v1
+oid sha256:52d5bf107be74b3091fcb1c34699b02b05a60f39b7a1ccb4ada03b33339c1805
+size 5426908

SnowballTarget/SnowballTarget-99960.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a1818687e11dc5c49876c6421c88362ce1caff9ee0f96539e3f5ed23d8aad885
-size 646532

 version https://git-lfs.github.com/spec/v1
+oid sha256:6e9dbc35d4da555d203f2ee0d0c46db73d3af5f7d6a40b2729da683b7e57c003
+size 910131

SnowballTarget/SnowballTarget-99960.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc3f831cc339ee1131d2e4cd167a3d8348a7c00dad344aafbcb66b40e5cc1b7b
-size 3843968

 version https://git-lfs.github.com/spec/v1
+oid sha256:f37db3c05a9a0fb9f370ef6070cc91e468c84f888231660312afc032b8a2e60b
+size 5426908

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f160aaa60e9e1272e249e32e757a6cf4c08efb8fd6be98b9d61683dcb9417dc0
-size 3843968

 version https://git-lfs.github.com/spec/v1
+oid sha256:da66ee1bddfded35b863053faaed30ae4d70826e2e4b3eafbf0e073fac71638e
+size 5426908

SnowballTarget/{events.out.tfevents.1679902715.efb1629e622b.2657.0 → events.out.tfevents.1679908425.efb1629e622b.26805.0} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8d68530243d31cde090f9635a27f3df293140b8b3fa932b5c5977bce972389fa
-size 23702

 version https://git-lfs.github.com/spec/v1
+oid sha256:5ca596d92751d486ddd019de384f3d3f165ab6bda1de02a51c33eaa0e3ce28f8
+size 23489

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -18,7 +18,7 @@ behaviors:
     network_settings:
       normalize: false
       hidden_units: 256
-      num_layers: 2
       vis_encode_type: simple
       memory: null
       goal_conditioning_type: hyper
@@ -68,7 +68,7 @@ checkpoint_settings:
   initialize_from: null
   load_model: false
   resume: false
-  force: false
   train_model: false
   inference: false
   results_dir: results

     network_settings:
       normalize: false
       hidden_units: 256
+      num_layers: 3
       vis_encode_type: simple
       memory: null
       goal_conditioning_type: hyper
   initialize_from: null
   load_model: false
   resume: false
+  force: true
   train_model: false
   inference: false
   results_dir: results

run_logs/Player-0.log CHANGED Viewed

@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarge
 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
-Unable to load player prefs
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2642:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.091 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.666829 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -53,7 +50,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 5369 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -169,19 +166,19 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 41
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 6.7 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 17.8 MB
@@ -213,13 +210,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5017 frames, [64.0 KB-128.0 KB]: 444 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 66.8 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -231,13 +228,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5461 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5460 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -249,13 +246,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 5461 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 5461 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.080 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.649644 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 5374 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 42
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 5466 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 6.7 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 5466 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 17.8 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 4388 frames, [64.0 KB-128.0 KB]: 1078 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 66.8 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5466 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5466 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5465 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 5466 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 5466 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,15 +2,15 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 0.94545978307724,
-            "min": 0.916050374507904,
-            "max": 2.867387533187866,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 9027.25,
-            "min": 8837.1376953125,
-            "max": 29396.45703125,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
@@ -26,15 +26,15 @@
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 13.051465034484863,
-            "min": 0.27961480617523193,
-            "max": 13.051465034484863,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2545.03564453125,
-            "min": 54.245269775390625,
-            "max": 2638.4033203125,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
@@ -50,27 +50,27 @@
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.07293560138314918,
-            "min": 0.0596467264406052,
-            "max": 0.07503485352122773,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.2917424055325967,
-            "min": 0.2597963432598786,
-            "max": 0.37517426760613865,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.1870236031199787,
-            "min": 0.10796726512432774,
-            "max": 0.2893612817806356,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.7480944124799148,
-            "min": 0.43186906049731094,
-            "max": 1.446806408903178,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
@@ -110,27 +110,27 @@
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 25.545454545454547,
-            "min": 2.9318181818181817,
-            "max": 25.727272727272727,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1124.0,
-            "min": 129.0,
-            "max": 1415.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 25.545454545454547,
-            "min": 2.9318181818181817,
-            "max": 25.727272727272727,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 1124.0,
-            "min": 129.0,
-            "max": 1415.0,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
@@ -148,67 +148,67 @@
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1679902709",
         "python_version": "3.9.16 (main, Dec  7 2022, 01:11:51) \n[GCC 9.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "0.31.0.dev0",
         "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.11.0+cu102",
         "numpy_version": "1.21.2",
-        "end_time_seconds": "1679903171"
     },
-    "total": 462.34764825699983,
     "count": 1,
-    "self": 0.43356318499991175,
     "children": {
         "run_training.setup": {
-            "total": 0.11549864999994952,
             "count": 1,
-            "self": 0.11549864999994952
         },
         "TrainerController.start_learning": {
-            "total": 461.79858642199997,
             "count": 1,
-            "self": 0.5018591850098346,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 10.100400470000068,
                     "count": 1,
-                    "self": 10.100400470000068
                 },
                 "TrainerController.advance": {
-                    "total": 451.0666685519898,
-                    "count": 18202,
-                    "self": 0.26017733399521603,
                     "children": {
                         "env_step": {
-                            "total": 450.80649121799456,
-                            "count": 18202,
-                            "self": 326.2002793959772,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 124.34499847501093,
-                                    "count": 18202,
-                                    "self": 2.645034317017007,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 121.69996415799392,
-                                            "count": 18202,
-                                            "self": 121.69996415799392
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.2612133470064464,
-                                    "count": 18202,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 460.47195434199557,
-                                            "count": 18202,
                                             "is_parallel": true,
-                                            "self": 223.98804554998026,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.0056975500000362445,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.004164137999964623,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.0015334120000716212,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0015334120000716212
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.12132309499997973,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0006008689998679984,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00043788599998606514,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00043788599998606514
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.11834234600007676,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.11834234600007676
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.0019419940000489078,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00039704700009224325,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0015449469999566645,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0015449469999566645
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 236.4839087920153,
-                                                    "count": 18201,
                                                     "is_parallel": true,
-                                                    "self": 9.50358736703356,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 5.196618792003733,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 5.196618792003733
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 191.09818791898738,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 191.09818791898738
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 30.685514713990642,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 5.897759952005572,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 24.78775476198507,
-                                                                    "count": 182010,
                                                                     "is_parallel": true,
-                                                                    "self": 24.78775476198507
                                                                 }
                                                             }
                                                         }
@@ -309,9 +309,9 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 0.00012075600011485221,
                     "count": 1,
-                    "self": 0.00012075600011485221,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
@@ -320,36 +320,36 @@
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
-                                    "total": 447.64375773002325,
-                                    "count": 395087,
                                     "is_parallel": true,
-                                    "self": 9.728361957030529,
                                     "children": {
                                         "process_trajectory": {
-                                            "total": 245.96384885199188,
-                                            "count": 395087,
                                             "is_parallel": true,
-                                            "self": 245.08376061799197,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
-                                                    "total": 0.8800882339999134,
                                                     "count": 4,
                                                     "is_parallel": true,
-                                                    "self": 0.8800882339999134
                                                 }
                                             }
                                         },
                                         "_update_policy": {
-                                            "total": 191.95154692100084,
                                             "count": 90,
                                             "is_parallel": true,
-                                            "self": 73.56837819000191,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
-                                                    "total": 118.38316873099893,
                                                     "count": 4587,
                                                     "is_parallel": true,
-                                                    "self": 118.38316873099893
                                                 }
                                             }
                                         }
@@ -360,14 +360,14 @@
                     }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.12953745900017566,
                     "count": 1,
-                    "self": 0.0008388180001475121,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.12869864100002815,
                             "count": 1,
-                            "self": 0.12869864100002815
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 0.9946820735931396,
+            "min": 0.9946820735931396,
+            "max": 2.8663761615753174,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 9530.048828125,
+            "min": 9530.048828125,
+            "max": 29480.677734375,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 12.850577354431152,
+            "min": 0.4389503598213196,
+            "max": 12.850577354431152,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 2505.862548828125,
+            "min": 85.1563720703125,
+            "max": 2582.72509765625,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.07140613051103406,
+            "min": 0.06089604495951505,
+            "max": 0.07297919158322744,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.28562452204413624,
+            "min": 0.25895955315568514,
+            "max": 0.3648959579161372,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.21466431233520603,
+            "min": 0.12085397768418725,
+            "max": 0.29286830470550296,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.8586572493408241,
+            "min": 0.483415910736749,
+            "max": 1.3729174195551404,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 25.613636363636363,
+            "min": 3.3863636363636362,
+            "max": 25.613636363636363,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1127.0,
+            "min": 149.0,
+            "max": 1394.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 25.613636363636363,
+            "min": 3.3863636363636362,
+            "max": 25.613636363636363,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 1127.0,
+            "min": 149.0,
+            "max": 1394.0,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1679908422",
         "python_version": "3.9.16 (main, Dec  7 2022, 01:11:51) \n[GCC 9.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --force",
         "mlagents_version": "0.31.0.dev0",
         "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.11.0+cu102",
         "numpy_version": "1.21.2",
+        "end_time_seconds": "1679908882"
     },
+    "total": 460.14895640899977,
     "count": 1,
+    "self": 0.7895674730007158,
     "children": {
         "run_training.setup": {
+            "total": 0.10292876199946477,
             "count": 1,
+            "self": 0.10292876199946477
         },
         "TrainerController.start_learning": {
+            "total": 459.2564601739996,
             "count": 1,
+            "self": 0.49016623697934847,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 5.846241936000297,
                     "count": 1,
+                    "self": 5.846241936000297
                 },
                 "TrainerController.advance": {
+                    "total": 452.6829718790186,
+                    "count": 18217,
+                    "self": 0.263493961050699,
                     "children": {
                         "env_step": {
+                            "total": 452.4194779179679,
+                            "count": 18217,
+                            "self": 329.18339330596154,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 122.98751471001287,
+                                    "count": 18217,
+                                    "self": 1.8901296979720428,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 121.09738501204083,
+                                            "count": 18217,
+                                            "self": 121.09738501204083
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.24856990199350548,
+                                    "count": 18217,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 457.74583978990995,
+                                            "count": 18217,
                                             "is_parallel": true,
+                                            "self": 223.41518318488306,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.002092693000122381,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0006417580016204738,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.001450934998501907,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.001450934998501907
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.034367600999758,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.00047767500018380815,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.0003021359998456319,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0003021359998456319
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.032102486999974644,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.032102486999974644
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0014853029997539124,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0003237099999751081,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0011615929997788044,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0011615929997788044
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 234.3306566050269,
+                                                    "count": 18216,
                                                     "is_parallel": true,
+                                                    "self": 9.466481910018956,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 5.099213578037052,
+                                                            "count": 18216,
                                                             "is_parallel": true,
+                                                            "self": 5.099213578037052
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 189.53019968192984,
+                                                            "count": 18216,
                                                             "is_parallel": true,
+                                                            "self": 189.53019968192984
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 30.234761435041037,
+                                                            "count": 18216,
                                                             "is_parallel": true,
+                                                            "self": 5.846674117066868,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 24.38808731797417,
+                                                                    "count": 182160,
                                                                     "is_parallel": true,
+                                                                    "self": 24.38808731797417
                                                                 }
                                                             }
                                                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 8.636000075057382e-05,
                     "count": 1,
+                    "self": 8.636000075057382e-05,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
+                                    "total": 449.5033354977977,
+                                    "count": 385886,
                                     "is_parallel": true,
+                                    "self": 9.206752954598414,
                                     "children": {
                                         "process_trajectory": {
+                                            "total": 244.94867293820062,
+                                            "count": 385886,
                                             "is_parallel": true,
+                                            "self": 243.48391041620016,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
+                                                    "total": 1.4647625220004556,
                                                     "count": 4,
                                                     "is_parallel": true,
+                                                    "self": 1.4647625220004556
                                                 }
                                             }
                                         },
                                         "_update_policy": {
+                                            "total": 195.34790960499868,
                                             "count": 90,
                                             "is_parallel": true,
+                                            "self": 75.03490625402355,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
+                                                    "total": 120.31300335097512,
                                                     "count": 4587,
                                                     "is_parallel": true,
+                                                    "self": 120.31300335097512
                                                 }
                                             }
                                         }
                     }
                 },
                 "TrainerController._save_models": {
+                    "total": 0.23699376200056577,
                     "count": 1,
+                    "self": 0.002571512000031362,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.2344222500005344,
                             "count": 1,
+                            "self": 0.2344222500005344
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -4,8 +4,8 @@
             {
                 "steps": 49936,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
-                "reward": 14.181818181818182,
-                "creation_time": 1679902833.8099377,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
                 ]
@@ -13,8 +13,8 @@
             {
                 "steps": 99960,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
-                "reward": 22.727272727272727,
-                "creation_time": 1679902946.4722717,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
                 ]
@@ -22,8 +22,8 @@
             {
                 "steps": 149984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
-                "reward": 24.636363636363637,
-                "creation_time": 1679903058.3628073,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
                 ]
@@ -31,8 +31,8 @@
             {
                 "steps": 199984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
-                "reward": 26.181818181818183,
-                "creation_time": 1679903171.278404,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
                 ]
@@ -40,8 +40,8 @@
             {
                 "steps": 200112,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
-                "reward": 26.181818181818183,
-                "creation_time": 1679903171.431922,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
@@ -50,8 +50,8 @@
         "final_checkpoint": {
             "steps": 200112,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 26.181818181818183,
-            "creation_time": 1679903171.431922,
             "auxillary_file_paths": [
                 "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
             ]

             {
                 "steps": 49936,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
+                "reward": 13.909090909090908,
+                "creation_time": 1679908542.6574535,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
                 ]
             {
                 "steps": 99960,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
+                "reward": 21.727272727272727,
+                "creation_time": 1679908655.6292062,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
                 ]
             {
                 "steps": 149984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
+                "reward": 23.90909090909091,
+                "creation_time": 1679908769.2580125,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             {
                 "steps": 199984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
+                "reward": 26.545454545454547,
+                "creation_time": 1679908881.3867598,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             {
                 "steps": 200112,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
+                "reward": 26.545454545454547,
+                "creation_time": 1679908881.6471078,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
         "final_checkpoint": {
             "steps": 200112,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
+            "reward": 26.545454545454547,
+            "creation_time": 1679908881.6471078,
             "auxillary_file_paths": [
                 "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
             ]