{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.4383755624294281, "min": 0.4383755624294281, "max": 1.5862054824829102, "count": 67 }, "Pyramids.Policy.Entropy.sum": { "value": 12996.958984375, "min": 12996.958984375, "max": 65935.390625, "count": 67 }, "Pyramids.Step.mean": { "value": 2009877.0, "min": 29952.0, "max": 2009877.0, "count": 67 }, "Pyramids.Step.sum": { "value": 2009877.0, "min": 29952.0, "max": 2009877.0, "count": 67 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.8164554834365845, "min": -0.09642726927995682, "max": 0.8519212603569031, "count": 67 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 240.0379180908203, "min": -24.01038932800293, "max": 261.5398254394531, "count": 67 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.010017666034400463, "min": -0.009136217646300793, "max": 0.3027942478656769, "count": 67 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 2.9451937675476074, "min": -2.5215959548950195, "max": 70.85385131835938, "count": 67 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.07075320851397394, "min": 0.06568519165940508, "max": 0.07565438236626529, "count": 67 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.9905449191956353, "min": 0.4734425738764306, "max": 1.050996414263741, "count": 67 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.013001791703104204, "min": 0.0003456554292742117, "max": 0.01566592345678793, "count": 67 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.18202508384345886, "min": 0.0027652434341936937, "max": 0.21932292839503098, "count": 67 }, "Pyramids.Policy.LearningRate.mean": { "value": 0.00010061087360592142, "min": 0.00010061087360592142, "max": 0.00029836160054613336, "count": 67 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.0014085522304828999, "min": 0.0014085522304828999, "max": 0.003464173045275733, "count": 67 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.13353693571428574, "min": 0.13353693571428574, "max": 0.1994538666666667, "count": 67 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.8695171000000004, "min": 1.3827968, "max": 2.5547242666666667, "count": 67 }, "Pyramids.Policy.Beta.mean": { "value": 0.0033603398778571437, "min": 0.0033603398778571437, "max": 0.00994544128, "count": 67 }, "Pyramids.Policy.Beta.sum": { "value": 0.04704475829000001, "min": 0.04704475829000001, "max": 0.11549695423999998, "count": 67 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.00899757631123066, "min": 0.00899757631123066, "max": 0.3189292848110199, "count": 67 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.12596607208251953, "min": 0.12251792103052139, "max": 2.2325050830841064, "count": 67 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 67 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 67 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 230.68376068376068, "min": 220.4724409448819, "max": 997.1625, "count": 64 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 26990.0, "min": 926.0, "max": 79773.0, "count": 64 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.735117936427267, "min": -0.9731500518508256, "max": 1.779565872956616, "count": 64 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 203.00879856199026, "min": -77.85200414806604, "max": 248.7059983983636, "count": 64 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.735117936427267, "min": -0.9731500518508256, "max": 1.779565872956616, "count": 64 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 203.00879856199026, "min": -77.85200414806604, "max": 248.7059983983636, "count": 64 }, "Pyramids.Policy.RndReward.mean": { "value": 0.021515196687780704, "min": 0.021181808893123006, "max": 3.3438625559210777, "count": 64 }, "Pyramids.Policy.RndReward.sum": { "value": 2.517278012470342, "min": 2.517278012470342, "max": 156.16331193596125, "count": 64 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1674138899", "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --num-envs=10 --run-id=Pyramids Training --no-graphics --force", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1674142245" }, "total": 3346.5197448459994, "count": 1, "self": 1.5104933649990926, "children": { "run_training.setup": { "total": 0.22388053600002422, "count": 1, "self": 0.22388053600002422 }, "TrainerController.start_learning": { "total": 3344.785370945, "count": 1, "self": 2.191321581034117, "children": { "TrainerController._reset_env": { "total": 11.036381419999998, "count": 1, "self": 11.036381419999998 }, "TrainerController.advance": { "total": 3330.519638434966, "count": 23321, "self": 2.14965534799785, "children": { "env_step": { "total": 1781.5993759870178, "count": 23321, "self": 963.0564049740243, "children": { "SubprocessEnvManager._take_step": { "total": 814.5518747129988, "count": 130766, "self": 29.430823052086566, "children": { "TorchPolicy.evaluate": { "total": 785.1210516609123, "count": 126498, "self": 224.14092069291928, "children": { "TorchPolicy.sample_actions": { "total": 560.980130967993, "count": 126498, "self": 560.980130967993 } } } } }, "workers": { "total": 3.9910962999946378, "count": 23321, "self": 0.0, "children": { "worker_root": { "total": 33402.44909967305, "count": 130759, "is_parallel": true, "self": 25763.64540756009, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.046783416000039324, "count": 10, "is_parallel": true, "self": 0.008720006000885405, "children": { "_process_rank_one_or_two_observation": { "total": 0.03806340999915392, "count": 80, "is_parallel": true, "self": 0.03806340999915392 } } }, "UnityEnvironment.step": { "total": 2.3285360760000913, "count": 10, "is_parallel": true, "self": 0.004722976000380186, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0036794169999438964, "count": 10, "is_parallel": true, "self": 0.0036794169999438964 }, "communicator.exchange": { "total": 2.297539016999849, "count": 10, "is_parallel": true, "self": 2.297539016999849 }, "steps_from_proto": { "total": 0.022594665999918107, "count": 10, "is_parallel": true, "self": 0.010956463999946209, "children": { "_process_rank_one_or_two_observation": { "total": 0.011638201999971898, "count": 80, "is_parallel": true, "self": 0.011638201999971898 } } } } } } }, "UnityEnvironment.step": { "total": 7638.803692112964, "count": 130749, "is_parallel": true, "self": 72.15934311896217, "children": { "UnityEnvironment._generate_step_input": { "total": 45.65303698401249, "count": 130749, "is_parallel": true, "self": 45.65303698401249 }, "communicator.exchange": { "total": 7282.672770433042, "count": 130749, "is_parallel": true, "self": 7282.672770433042 }, "steps_from_proto": { "total": 238.3185415769467, "count": 130749, "is_parallel": true, "self": 65.68012743502061, "children": { "_process_rank_one_or_two_observation": { "total": 172.6384141419261, "count": 1045992, "is_parallel": true, "self": 172.6384141419261 } } } } } } } } } } }, "trainer_advance": { "total": 1546.7706070999502, "count": 23320, "self": 4.446033568937764, "children": { "process_trajectory": { "total": 463.3108352430115, "count": 23320, "self": 462.8958884420117, "children": { "RLTrainer._checkpoint": { "total": 0.4149468009998145, "count": 4, "self": 0.4149468009998145 } } }, "_update_policy": { "total": 1079.013738288001, "count": 869, "self": 400.01942840705453, "children": { "TorchPPOOptimizer.update": { "total": 678.9943098809464, "count": 46083, "self": 678.9943098809464 } } } } } } }, "trainer_threads": { "total": 1.7120000848080963e-06, "count": 1, "self": 1.7120000848080963e-06 }, "TrainerController._save_models": { "total": 1.0380277969998133, "count": 1, "self": 0.003971679999267508, "children": { "RLTrainer._checkpoint": { "total": 1.0340561170005458, "count": 1, "self": 1.0340561170005458 } } } } } } }