{ "name": "root", "gauges": { "Huggy.Policy.Entropy.mean": { "value": 1.272360920906067, "min": 1.272360920906067, "max": 1.4177839756011963, "count": 40 }, "Huggy.Policy.Entropy.sum": { "value": 63418.28515625, "min": 63117.1328125, "max": 77316.015625, "count": 40 }, "Huggy.Environment.EpisodeLength.mean": { "value": 58.789725209080046, "min": 57.79882352941176, "max": 411.12295081967216, "count": 40 }, "Huggy.Environment.EpisodeLength.sum": { "value": 49207.0, "min": 49082.0, "max": 50157.0, "count": 40 }, "Huggy.Step.mean": { "value": 1999951.0, "min": 49761.0, "max": 1999951.0, "count": 40 }, "Huggy.Step.sum": { "value": 1999951.0, "min": 49761.0, "max": 1999951.0, "count": 40 }, "Huggy.Policy.ExtrinsicValueEstimate.mean": { "value": 2.3403899669647217, "min": -0.06675603240728378, "max": 2.3693079948425293, "count": 40 }, "Huggy.Policy.ExtrinsicValueEstimate.sum": { "value": 1958.906494140625, "min": -8.07748031616211, "max": 1983.164306640625, "count": 40 }, "Huggy.Environment.CumulativeReward.mean": { "value": 4.022737948982804, "min": 1.7483754448654238, "max": 4.088219650154528, "count": 40 }, "Huggy.Environment.CumulativeReward.sum": { "value": 3367.031663298607, "min": 211.55342882871628, "max": 3412.0298920869827, "count": 40 }, "Huggy.Policy.ExtrinsicReward.mean": { "value": 4.022737948982804, "min": 1.7483754448654238, "max": 4.088219650154528, "count": 40 }, "Huggy.Policy.ExtrinsicReward.sum": { "value": 3367.031663298607, "min": 211.55342882871628, "max": 3412.0298920869827, "count": 40 }, "Huggy.Losses.PolicyLoss.mean": { "value": 0.0158508474686793, "min": 0.01572813392713821, "max": 0.020096193913777826, "count": 40 }, "Huggy.Losses.PolicyLoss.sum": { "value": 0.0475525424060379, "min": 0.03188362865243107, "max": 0.060288581741333475, "count": 40 }, "Huggy.Losses.ValueLoss.mean": { "value": 0.0381449685121576, "min": 0.011993605922907592, "max": 0.0381449685121576, "count": 40 }, "Huggy.Losses.ValueLoss.sum": { "value": 0.1144349055364728, "min": 0.023987211845815183, "max": 0.1144349055364728, "count": 40 }, "Huggy.Policy.LearningRate.mean": { "value": 6.770515312583334e-06, "min": 6.770515312583334e-06, "max": 0.0004922375015525, "count": 40 }, "Huggy.Policy.LearningRate.sum": { "value": 2.0311545937750003e-05, "min": 2.0311545937750003e-05, "max": 0.0014064560187087996, "count": 40 }, "Huggy.Policy.Epsilon.mean": { "value": 0.10135408333333333, "min": 0.10135408333333333, "max": 0.1984475, "count": 40 }, "Huggy.Policy.Epsilon.sum": { "value": 0.30406225, "min": 0.2078454, "max": 0.5812912000000001, "count": 40 }, "Huggy.Policy.Beta.mean": { "value": 0.00011819125833333336, "min": 0.00011819125833333336, "max": 0.007875955250000002, "count": 40 }, "Huggy.Policy.Beta.sum": { "value": 0.00035457377500000006, "min": 0.00035457377500000006, "max": 0.022505166880000003, "count": 40 }, "Huggy.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 40 }, "Huggy.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 40 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1681893135", "python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy --no-graphics", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1681895694" }, "total": 2559.166976126, "count": 1, "self": 0.8097139050005353, "children": { "run_training.setup": { "total": 0.1145879649999415, "count": 1, "self": 0.1145879649999415 }, "TrainerController.start_learning": { "total": 2558.2426742559996, "count": 1, "self": 4.292987405986878, "children": { "TrainerController._reset_env": { "total": 3.8401997849999816, "count": 1, "self": 3.8401997849999816 }, "TrainerController.advance": { "total": 2549.9153827610126, "count": 235628, "self": 4.582706898178458, "children": { "env_step": { "total": 1793.2137557689534, "count": 235628, "self": 1523.892993927895, "children": { "SubprocessEnvManager._take_step": { "total": 266.5616282730939, "count": 235628, "self": 15.944396015038024, "children": { "TorchPolicy.evaluate": { "total": 250.61723225805588, "count": 222988, "self": 250.61723225805588 } } }, "workers": { "total": 2.759133567964568, "count": 235628, "self": 0.0, "children": { "worker_root": { "total": 2550.215545113937, "count": 235628, "is_parallel": true, "self": 1300.1728753009625, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.001100021999945966, "count": 1, "is_parallel": true, "self": 0.00034278800001175114, "children": { "_process_rank_one_or_two_observation": { "total": 0.0007572339999342148, "count": 2, "is_parallel": true, "self": 0.0007572339999342148 } } }, "UnityEnvironment.step": { "total": 0.02952216899996074, "count": 1, "is_parallel": true, "self": 0.00031085800003438635, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0002153719999569148, "count": 1, "is_parallel": true, "self": 0.0002153719999569148 }, "communicator.exchange": { "total": 0.02825725799993961, "count": 1, "is_parallel": true, "self": 0.02825725799993961 }, "steps_from_proto": { "total": 0.0007386810000298283, "count": 1, "is_parallel": true, "self": 0.00020744400001149188, "children": { "_process_rank_one_or_two_observation": { "total": 0.0005312370000183364, "count": 2, "is_parallel": true, "self": 0.0005312370000183364 } } } } } } }, "UnityEnvironment.step": { "total": 1250.0426698129745, "count": 235627, "is_parallel": true, "self": 37.46319541107414, "children": { "UnityEnvironment._generate_step_input": { "total": 79.0649567230356, "count": 235627, "is_parallel": true, "self": 79.0649567230356 }, "communicator.exchange": { "total": 1045.048376449951, "count": 235627, "is_parallel": true, "self": 1045.048376449951 }, "steps_from_proto": { "total": 88.46614122891378, "count": 235627, "is_parallel": true, "self": 33.590727534969915, "children": { "_process_rank_one_or_two_observation": { "total": 54.87541369394387, "count": 471254, "is_parallel": true, "self": 54.87541369394387 } } } } } } } } } } }, "trainer_advance": { "total": 752.1189200938807, "count": 235628, "self": 6.150655554905825, "children": { "process_trajectory": { "total": 140.74624189097608, "count": 235628, "self": 139.4328579379761, "children": { "RLTrainer._checkpoint": { "total": 1.3133839529999705, "count": 10, "self": 1.3133839529999705 } } }, "_update_policy": { "total": 605.2220226479988, "count": 97, "self": 509.0342657289798, "children": { "TorchPPOOptimizer.update": { "total": 96.18775691901897, "count": 4850, "self": 96.18775691901897 } } } } } } }, "trainer_threads": { "total": 1.3349999790079892e-06, "count": 1, "self": 1.3349999790079892e-06 }, "TrainerController._save_models": { "total": 0.19410296900014146, "count": 1, "self": 0.003124358000150096, "children": { "RLTrainer._checkpoint": { "total": 0.19097861099999136, "count": 1, "self": 0.19097861099999136 } } } } } } }