| { |
| "name": "root", |
| "gauges": { |
| "SnowballTarget.Policy.Entropy.mean": { |
| "value": 1.1493377685546875, |
| "min": 1.1493377685546875, |
| "max": 2.864180564880371, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.Entropy.sum": { |
| "value": 57347.35546875, |
| "min": 57347.35546875, |
| "max": 144675.484375, |
| "count": 10 |
| }, |
| "SnowballTarget.Step.mean": { |
| "value": 499976.0, |
| "min": 49936.0, |
| "max": 499976.0, |
| "count": 10 |
| }, |
| "SnowballTarget.Step.sum": { |
| "value": 499976.0, |
| "min": 49936.0, |
| "max": 499976.0, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 12.845760345458984, |
| "min": 0.3540566861629486, |
| "max": 12.845760345458984, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 12884.2978515625, |
| "min": 351.2242431640625, |
| "max": 12884.2978515625, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.CuriosityValueEstimate.mean": { |
| "value": 0.8443097472190857, |
| "min": 0.21610280871391296, |
| "max": 1.0515366792678833, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.CuriosityValueEstimate.sum": { |
| "value": 846.8426513671875, |
| "min": 214.37399291992188, |
| "max": 1044.1759033203125, |
| "count": 10 |
| }, |
| "SnowballTarget.Environment.EpisodeLength.mean": { |
| "value": 199.0, |
| "min": 199.0, |
| "max": 199.0, |
| "count": 10 |
| }, |
| "SnowballTarget.Environment.EpisodeLength.sum": { |
| "value": 50347.0, |
| "min": 48158.0, |
| "max": 50347.0, |
| "count": 10 |
| }, |
| "SnowballTarget.Environment.CumulativeReward.mean": { |
| "value": 25.893280632411066, |
| "min": 3.855371900826446, |
| "max": 25.893280632411066, |
| "count": 10 |
| }, |
| "SnowballTarget.Environment.CumulativeReward.sum": { |
| "value": 6551.0, |
| "min": 933.0, |
| "max": 6551.0, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.ExtrinsicReward.mean": { |
| "value": 25.893280632411066, |
| "min": 3.855371900826446, |
| "max": 25.893280632411066, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.ExtrinsicReward.sum": { |
| "value": 6551.0, |
| "min": 933.0, |
| "max": 6551.0, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.CuriosityReward.mean": { |
| "value": 1.624363026246723, |
| "min": 1.624363026246723, |
| "max": 2.892317029639832, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.CuriosityReward.sum": { |
| "value": 410.9638456404209, |
| "min": 410.9638456404209, |
| "max": 699.9407211728394, |
| "count": 10 |
| }, |
| "SnowballTarget.Losses.PolicyLoss.mean": { |
| "value": 0.022228808685273785, |
| "min": 0.0222080560298006, |
| "max": 0.026353130527180232, |
| "count": 10 |
| }, |
| "SnowballTarget.Losses.PolicyLoss.sum": { |
| "value": 0.08891523474109514, |
| "min": 0.08891523474109514, |
| "max": 0.12910080968249532, |
| "count": 10 |
| }, |
| "SnowballTarget.Losses.ValueLoss.mean": { |
| "value": 0.13977829820166032, |
| "min": 0.07806220607211192, |
| "max": 0.19508210450410843, |
| "count": 10 |
| }, |
| "SnowballTarget.Losses.ValueLoss.sum": { |
| "value": 0.5591131928066413, |
| "min": 0.3122488242884477, |
| "max": 0.9754105225205422, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.LearningRate.mean": { |
| "value": 1.4576495141199999e-05, |
| "min": 1.4576495141199999e-05, |
| "max": 0.0002841864052712, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.LearningRate.sum": { |
| "value": 5.8305980564799996e-05, |
| "min": 5.8305980564799996e-05, |
| "max": 0.0012797184734271998, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.Epsilon.mean": { |
| "value": 0.1048588, |
| "min": 0.1048588, |
| "max": 0.19472879999999998, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.Epsilon.sum": { |
| "value": 0.4194352, |
| "min": 0.4194352, |
| "max": 0.9265728000000001, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.Beta.mean": { |
| "value": 0.00025245412000000005, |
| "min": 0.00025245412000000005, |
| "max": 0.004736967120000001, |
| "count": 10 |
| }, |
| "SnowballTarget.Policy.Beta.sum": { |
| "value": 0.0010098164800000002, |
| "min": 0.0010098164800000002, |
| "max": 0.02133598272, |
| "count": 10 |
| }, |
| "SnowballTarget.Losses.CuriosityForwardLoss.mean": { |
| "value": 0.04066641284152865, |
| "min": 0.04066641284152865, |
| "max": 0.15649448223412038, |
| "count": 10 |
| }, |
| "SnowballTarget.Losses.CuriosityForwardLoss.sum": { |
| "value": 0.1626656513661146, |
| "min": 0.1626656513661146, |
| "max": 0.6259779289364815, |
| "count": 10 |
| }, |
| "SnowballTarget.Losses.CuriosityInverseLoss.mean": { |
| "value": 1.054714846611023, |
| "min": 1.054714846611023, |
| "max": 2.801060312986374, |
| "count": 10 |
| }, |
| "SnowballTarget.Losses.CuriosityInverseLoss.sum": { |
| "value": 4.218859386444092, |
| "min": 4.218859386444092, |
| "max": 12.449160003662112, |
| "count": 10 |
| }, |
| "SnowballTarget.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 10 |
| }, |
| "SnowballTarget.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 10 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1711530713", |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget3 --no-graphics", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.2.1+cu121", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1711531767" |
| }, |
| "total": 1053.6621658160002, |
| "count": 1, |
| "self": 0.42601278500069384, |
| "children": { |
| "run_training.setup": { |
| "total": 0.06015482199973121, |
| "count": 1, |
| "self": 0.06015482199973121 |
| }, |
| "TrainerController.start_learning": { |
| "total": 1053.1759982089998, |
| "count": 1, |
| "self": 0.8691430139365366, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.0402573049996136, |
| "count": 1, |
| "self": 2.0402573049996136 |
| }, |
| "TrainerController.advance": { |
| "total": 1050.1352405880639, |
| "count": 45464, |
| "self": 0.9238774870291309, |
| "children": { |
| "env_step": { |
| "total": 752.7561935750673, |
| "count": 45464, |
| "self": 584.8651935689213, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 167.33226991003266, |
| "count": 45464, |
| "self": 3.134988525036988, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 164.19728138499568, |
| "count": 45464, |
| "self": 164.19728138499568 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.5587300961133224, |
| "count": 45464, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 1049.6666539140938, |
| "count": 45464, |
| "is_parallel": true, |
| "self": 537.8826951320802, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0022327749998112267, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006461329994635889, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0015866420003476378, |
| "count": 10, |
| "is_parallel": true, |
| "self": 0.0015866420003476378 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.034909802000129275, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006885730003887147, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.000443045999872993, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.000443045999872993 |
| }, |
| "communicator.exchange": { |
| "total": 0.03193026799999643, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.03193026799999643 |
| }, |
| "steps_from_proto": { |
| "total": 0.0018479149998711364, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.000360121000539948, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0014877939993311884, |
| "count": 10, |
| "is_parallel": true, |
| "self": 0.0014877939993311884 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 511.78395878201354, |
| "count": 45463, |
| "is_parallel": true, |
| "self": 25.870365160052643, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 13.876963266005987, |
| "count": 45463, |
| "is_parallel": true, |
| "self": 13.876963266005987 |
| }, |
| "communicator.exchange": { |
| "total": 390.81473614399374, |
| "count": 45463, |
| "is_parallel": true, |
| "self": 390.81473614399374 |
| }, |
| "steps_from_proto": { |
| "total": 81.22189421196117, |
| "count": 45463, |
| "is_parallel": true, |
| "self": 14.647346818277128, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 66.57454739368404, |
| "count": 454630, |
| "is_parallel": true, |
| "self": 66.57454739368404 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 296.45516952596745, |
| "count": 45464, |
| "self": 1.0763309329308868, |
| "children": { |
| "process_trajectory": { |
| "total": 119.15690446203689, |
| "count": 45464, |
| "self": 119.00658910103766, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.1503153609992296, |
| "count": 1, |
| "self": 0.1503153609992296 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 176.22193413099967, |
| "count": 47, |
| "self": 146.0050128549974, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 30.216921276002267, |
| "count": 1410, |
| "self": 30.216921276002267 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 8.010001693037339e-07, |
| "count": 1, |
| "self": 8.010001693037339e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.13135650099957275, |
| "count": 1, |
| "self": 0.0007333689991355641, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.13062313200043718, |
| "count": 1, |
| "self": 0.13062313200043718 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |