{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.14292973279953003, "min": 0.11940550804138184, "max": 1.4193896055221558, "count": 100 }, "Pyramids.Policy.Entropy.sum": { "value": 4287.89208984375, "min": 3571.55322265625, "max": 43058.6015625, "count": 100 }, "Pyramids.Step.mean": { "value": 2999956.0, "min": 29952.0, "max": 2999956.0, "count": 100 }, "Pyramids.Step.sum": { "value": 2999956.0, "min": 29952.0, "max": 2999956.0, "count": 100 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.7337890267372131, "min": -0.0974569022655487, "max": 0.8745170831680298, "count": 100 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 218.66912841796875, "min": -23.38965606689453, "max": 267.60223388671875, "count": 100 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.00890808179974556, "min": 0.005811864510178566, "max": 0.35619595646858215, "count": 100 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 2.6546082496643066, "min": 1.6854406595230103, "max": 84.41844177246094, "count": 100 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06833154014635107, "min": 0.06399497415978692, "max": 0.07514426053461587, "count": 100 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 1.024973102195266, "min": 0.4874997344426677, "max": 1.0692854776017495, "count": 100 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.017900132499764573, "min": 0.00010899150240232841, "max": 0.017900132499764573, "count": 100 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.2685019874964686, "min": 0.0010899150240232841, "max": 0.2685019874964686, "count": 100 }, "Pyramids.Policy.LearningRate.mean": { "value": 1.493559502180004e-06, "min": 1.493559502180004e-06, "max": 0.00029838354339596195, "count": 100 }, "Pyramids.Policy.LearningRate.sum": { "value": 2.2403392532700062e-05, "min": 2.2403392532700062e-05, "max": 0.0037593076468974995, "count": 100 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10049782, "min": 0.10049782, "max": 0.19946118095238097, "count": 100 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.5074673, "min": 1.3897045333333333, "max": 2.7375006, "count": 100 }, "Pyramids.Policy.Beta.mean": { "value": 5.973221800000014e-05, "min": 5.973221800000014e-05, "max": 0.009946171977142856, "count": 100 }, "Pyramids.Policy.Beta.sum": { "value": 0.0008959832700000021, "min": 0.0008959832700000021, "max": 0.12532493975, "count": 100 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.010917965322732925, "min": 0.010454429313540459, "max": 0.412590354681015, "count": 100 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.16376948356628418, "min": 0.14636200666427612, "max": 2.8881325721740723, "count": 100 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 239.45454545454547, "min": 200.07333333333332, "max": 999.0, "count": 100 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 31608.0, "min": 15984.0, "max": 32626.0, "count": 100 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.6677419668390552, "min": -1.0000000521540642, "max": 1.8003873107298998, "count": 100 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 218.4741976559162, "min": -32.000001668930054, "max": 269.9889975488186, "count": 100 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.6677419668390552, "min": -1.0000000521540642, "max": 1.8003873107298998, "count": 100 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 218.4741976559162, "min": -32.000001668930054, "max": 269.9889975488186, "count": 100 }, "Pyramids.Policy.RndReward.mean": { "value": 0.027038944790824956, "min": 0.022283377670889972, "max": 7.986746062524617, "count": 100 }, "Pyramids.Policy.RndReward.sum": { "value": 3.5421017675980693, "min": 3.1401077657646965, "max": 127.78793700039387, "count": 100 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 100 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 100 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1673618390", "python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1673625632" }, "total": 7242.3605654210005, "count": 1, "self": 0.4372184270014259, "children": { "run_training.setup": { "total": 0.105973203999838, "count": 1, "self": 0.105973203999838 }, "TrainerController.start_learning": { "total": 7241.81737379, "count": 1, "self": 4.579230756133256, "children": { "TrainerController._reset_env": { "total": 6.543547028000148, "count": 1, "self": 6.543547028000148 }, "TrainerController.advance": { "total": 7230.586427100864, "count": 195016, "self": 4.490833558803388, "children": { "env_step": { "total": 5159.303983696915, "count": 195016, "self": 4810.334707433127, "children": { "SubprocessEnvManager._take_step": { "total": 346.29557439382916, "count": 195016, "self": 13.882790613081852, "children": { "TorchPolicy.evaluate": { "total": 332.4127837807473, "count": 187550, "self": 111.8615250430737, "children": { "TorchPolicy.sample_actions": { "total": 220.5512587376736, "count": 187550, "self": 220.5512587376736 } } } } }, "workers": { "total": 2.6737018699591317, "count": 195016, "self": 0.0, "children": { "worker_root": { "total": 7226.187007238168, "count": 195016, "is_parallel": true, "self": 2751.6561048512895, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0020136030000230676, "count": 1, "is_parallel": true, "self": 0.0007262540002557216, "children": { "_process_rank_one_or_two_observation": { "total": 0.001287348999767346, "count": 8, "is_parallel": true, "self": 0.001287348999767346 } } }, "UnityEnvironment.step": { "total": 0.05069685099988419, "count": 1, "is_parallel": true, "self": 0.0005426359998637054, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0005443689999538037, "count": 1, "is_parallel": true, "self": 0.0005443689999538037 }, "communicator.exchange": { "total": 0.04759826800000155, "count": 1, "is_parallel": true, "self": 0.04759826800000155 }, "steps_from_proto": { "total": 0.0020115780000651284, "count": 1, "is_parallel": true, "self": 0.0005427880003026075, "children": { "_process_rank_one_or_two_observation": { "total": 0.001468789999762521, "count": 8, "is_parallel": true, "self": 0.001468789999762521 } } } } } } }, "UnityEnvironment.step": { "total": 4474.530902386879, "count": 195015, "is_parallel": true, "self": 91.20027822259453, "children": { "UnityEnvironment._generate_step_input": { "total": 75.49031692596441, "count": 195015, "is_parallel": true, "self": 75.49031692596441 }, "communicator.exchange": { "total": 3963.4243047810323, "count": 195015, "is_parallel": true, "self": 3963.4243047810323 }, "steps_from_proto": { "total": 344.4160024572873, "count": 195015, "is_parallel": true, "self": 76.94733183536914, "children": { "_process_rank_one_or_two_observation": { "total": 267.46867062191814, "count": 1560120, "is_parallel": true, "self": 267.46867062191814 } } } } } } } } } } }, "trainer_advance": { "total": 2066.7916098451456, "count": 195016, "self": 8.21757212244438, "children": { "process_trajectory": { "total": 481.03133866070357, "count": 195016, "self": 480.4249248987021, "children": { "RLTrainer._checkpoint": { "total": 0.6064137620014662, "count": 6, "self": 0.6064137620014662 } } }, "_update_policy": { "total": 1577.5426990619974, "count": 1378, "self": 598.4271979679559, "children": { "TorchPPOOptimizer.update": { "total": 979.1155010940415, "count": 68439, "self": 979.1155010940415 } } } } } } }, "trainer_threads": { "total": 8.470015018247068e-07, "count": 1, "self": 8.470015018247068e-07 }, "TrainerController._save_models": { "total": 0.10816805800095608, "count": 1, "self": 0.0015202980011963518, "children": { "RLTrainer._checkpoint": { "total": 0.10664775999975973, "count": 1, "self": 0.10664775999975973 } } } } } } }