| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.31657862663269043, |
| "min": 0.31657862663269043, |
| "max": 1.4554413557052612, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 9477.09765625, |
| "min": 9477.09765625, |
| "max": 44152.26953125, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989980.0, |
| "min": 29952.0, |
| "max": 989980.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989980.0, |
| "min": 29952.0, |
| "max": 989980.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.6274967193603516, |
| "min": -0.11481665819883347, |
| "max": 0.6775597333908081, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 176.3265838623047, |
| "min": -27.670814514160156, |
| "max": 193.6967010498047, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.007007249165326357, |
| "min": 0.0015687725972384214, |
| "max": 0.2707160711288452, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 1.9690370559692383, |
| "min": 0.3968994617462158, |
| "max": 64.97185516357422, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06876534378738904, |
| "min": 0.0638591812139133, |
| "max": 0.07539782882806667, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 1.0314801568108356, |
| "min": 0.4858075592386865, |
| "max": 1.0861022743920332, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.015090243930276331, |
| "min": 0.0014578654519899834, |
| "max": 0.01636559136651446, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.22635365895414497, |
| "min": 0.014578654519899835, |
| "max": 0.23666382780841863, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.471197509633331e-06, |
| "min": 7.471197509633331e-06, |
| "max": 0.00029515063018788575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00011206796264449996, |
| "min": 0.00011206796264449996, |
| "max": 0.003633119888960099, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10249036666666664, |
| "min": 0.10249036666666664, |
| "max": 0.19838354285714285, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.5373554999999997, |
| "min": 1.3886848, |
| "max": 2.6177872000000004, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.00025878762999999994, |
| "min": 0.00025878762999999994, |
| "max": 0.00983851593142857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.003881814449999999, |
| "min": 0.003881814449999999, |
| "max": 0.12112288601000001, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.013059018179774284, |
| "min": 0.013059018179774284, |
| "max": 0.3602496087551117, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.19588527083396912, |
| "min": 0.18780364096164703, |
| "max": 2.521747350692749, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 294.9072164948454, |
| "min": 273.9259259259259, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 28606.0, |
| "min": 15984.0, |
| "max": 33199.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.6638412233634092, |
| "min": -1.0000000521540642, |
| "max": 1.7112599892914295, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 161.3925986662507, |
| "min": -30.58620174229145, |
| "max": 184.41499803215265, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.6638412233634092, |
| "min": -1.0000000521540642, |
| "max": 1.7112599892914295, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 161.3925986662507, |
| "min": -30.58620174229145, |
| "max": 184.41499803215265, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.03977758732813977, |
| "min": 0.038694411753331895, |
| "max": 5.93458700645715, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 3.8584259708295576, |
| "min": 3.8584259708295576, |
| "max": 94.9533921033144, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1707503277", |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids_Training_2 --no-graphics", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.2.0+cu121", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1707505522" |
| }, |
| "total": 2245.319947405, |
| "count": 1, |
| "self": 0.5272818630000984, |
| "children": { |
| "run_training.setup": { |
| "total": 0.045931434000067384, |
| "count": 1, |
| "self": 0.045931434000067384 |
| }, |
| "TrainerController.start_learning": { |
| "total": 2244.746734108, |
| "count": 1, |
| "self": 1.3551528949469684, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.591978273999757, |
| "count": 1, |
| "self": 2.591978273999757 |
| }, |
| "TrainerController.advance": { |
| "total": 2240.715435246053, |
| "count": 64307, |
| "self": 1.3556013230345343, |
| "children": { |
| "env_step": { |
| "total": 1622.8087104969645, |
| "count": 64307, |
| "self": 1495.0211759589215, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 126.96520265190884, |
| "count": 64307, |
| "self": 4.483194459915467, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 122.48200819199337, |
| "count": 62551, |
| "self": 122.48200819199337 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.8223318861341795, |
| "count": 64307, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 2239.8021957169412, |
| "count": 64307, |
| "is_parallel": true, |
| "self": 856.1966301607363, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.002120863000072859, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0007098269993548456, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0014110360007180134, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0014110360007180134 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.07481945000017731, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005770530005975161, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00048371000002589426, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00048371000002589426 |
| }, |
| "communicator.exchange": { |
| "total": 0.07214259699958347, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.07214259699958347 |
| }, |
| "steps_from_proto": { |
| "total": 0.001616089999970427, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003722429996741994, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0012438470002962276, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0012438470002962276 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1383.605565556205, |
| "count": 64306, |
| "is_parallel": true, |
| "self": 34.697032933224364, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 23.583619527958035, |
| "count": 64306, |
| "is_parallel": true, |
| "self": 23.583619527958035 |
| }, |
| "communicator.exchange": { |
| "total": 1228.2680790799955, |
| "count": 64306, |
| "is_parallel": true, |
| "self": 1228.2680790799955 |
| }, |
| "steps_from_proto": { |
| "total": 97.0568340150271, |
| "count": 64306, |
| "is_parallel": true, |
| "self": 18.96307213379896, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 78.09376188122815, |
| "count": 514448, |
| "is_parallel": true, |
| "self": 78.09376188122815 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 616.5511234260539, |
| "count": 64307, |
| "self": 2.6369264381287394, |
| "children": { |
| "process_trajectory": { |
| "total": 123.49490136293343, |
| "count": 64307, |
| "self": 123.29177375393328, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.20312760900014837, |
| "count": 2, |
| "self": 0.20312760900014837 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 490.4192956249917, |
| "count": 451, |
| "self": 285.5619166979768, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 204.8573789270149, |
| "count": 22755, |
| "self": 204.8573789270149 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 9.55000359681435e-07, |
| "count": 1, |
| "self": 9.55000359681435e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.08416673800002172, |
| "count": 1, |
| "self": 0.0013754459996562218, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.0827912920003655, |
| "count": 1, |
| "self": 0.0827912920003655 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |