{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.5025023818016052, "min": 0.4954706132411957, "max": 1.4921729564666748, "count": 33 }, "Pyramids.Policy.Entropy.sum": { "value": 15067.03125, "min": 15014.7412109375, "max": 45266.55859375, "count": 33 }, "Pyramids.Step.mean": { "value": 989957.0, "min": 29952.0, "max": 989957.0, "count": 33 }, "Pyramids.Step.sum": { "value": 989957.0, "min": 29952.0, "max": 989957.0, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.43156328797340393, "min": -0.11121068894863129, "max": 0.5647807717323303, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 114.79583740234375, "min": -26.35693359375, "max": 156.44427490234375, "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": -0.027206676080822945, "min": -0.2914373576641083, "max": 0.37699419260025024, "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": -7.23697566986084, "min": -78.97952270507812, "max": 89.34762573242188, "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06745950118610858, "min": 0.06591277108689873, "max": 0.0718440967154845, "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.94443301660552, "min": 0.4886386653467954, "max": 1.0732553767607613, "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.016013090989526104, "min": 0.00030833215952521045, "max": 0.023195202232418218, "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.22418327385336548, "min": 0.004008318073827736, "max": 0.32473283125385505, "count": 33 }, "Pyramids.Policy.LearningRate.mean": { "value": 7.710247429950002e-06, "min": 7.710247429950002e-06, "max": 0.00029515063018788575, "count": 33 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.00010794346401930003, "min": 0.00010794346401930003, "max": 0.0033820256726582003, "count": 33 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10257005, "min": 0.10257005, "max": 0.19838354285714285, "count": 33 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4359807, "min": 1.3886848, "max": 2.5273418000000003, "count": 33 }, "Pyramids.Policy.Beta.mean": { "value": 0.0002667479950000001, "min": 0.0002667479950000001, "max": 0.00983851593142857, "count": 33 }, "Pyramids.Policy.Beta.sum": { "value": 0.003734471930000001, "min": 0.003734471930000001, "max": 0.11276144581999999, "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.00880816113203764, "min": 0.008608461357653141, "max": 0.37863412499427795, "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.1233142539858818, "min": 0.12051846086978912, "max": 2.6504387855529785, "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 427.8378378378378, "min": 374.32, "max": 999.0, "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 31660.0, "min": 15984.0, "max": 33911.0, "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.436016415079979, "min": -1.0000000521540642, "max": 1.577045217777292, "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 104.82919830083847, "min": -31.996001660823822, "max": 132.47179829329252, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.436016415079979, "min": -1.0000000521540642, "max": 1.577045217777292, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 104.82919830083847, "min": -31.996001660823822, "max": 132.47179829329252, "count": 33 }, "Pyramids.Policy.RndReward.mean": { "value": 0.0390342784605359, "min": 0.0335061490811876, "max": 7.762439802289009, "count": 33 }, "Pyramids.Policy.RndReward.sum": { "value": 2.8495023276191205, "min": 2.618655948404921, "max": 124.19903683662415, "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1656146094", "python_version": "3.7.13 (default, Apr 24 2022, 01:04:09) \n[GCC 7.5.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn /content/ml-agents/config/ppo/PyramidsRND.yaml --env=/content/ml-agents/trained-envs-executables/linux/Pyramids/Pyramids --run-id=First Training --force --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1656149187" }, "total": 3093.621723573, "count": 1, "self": 0.5792813749994821, "children": { "run_training.setup": { "total": 0.06636839900011182, "count": 1, "self": 0.06636839900011182 }, "TrainerController.start_learning": { "total": 3092.9760737990005, "count": 1, "self": 2.4741103200740326, "children": { "TrainerController._reset_env": { "total": 8.725167850000162, "count": 1, "self": 8.725167850000162 }, "TrainerController.advance": { "total": 3081.6708474279267, "count": 63671, "self": 2.552840573861886, "children": { "env_step": { "total": 1832.180661930931, "count": 63671, "self": 1681.7573832998764, "children": { "SubprocessEnvManager._take_step": { "total": 148.88740735094643, "count": 63671, "self": 7.053575330899093, "children": { "TorchPolicy.evaluate": { "total": 141.83383202004734, "count": 62563, "self": 31.184050374058643, "children": { "TorchPolicy.sample_actions": { "total": 110.6497816459887, "count": 62563, "self": 110.6497816459887 } } } } }, "workers": { "total": 1.53587128010804, "count": 63671, "self": 0.0, "children": { "worker_root": { "total": 3086.7966180901794, "count": 63671, "is_parallel": true, "self": 1576.42598972627, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.007325150000269787, "count": 1, "is_parallel": true, "self": 0.005629217000659992, "children": { "_process_rank_one_or_two_observation": { "total": 0.001695932999609795, "count": 8, "is_parallel": true, "self": 0.001695932999609795 } } }, "UnityEnvironment.step": { "total": 0.07035671099993124, "count": 1, "is_parallel": true, "self": 0.000710478999735642, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0006465070000558626, "count": 1, "is_parallel": true, "self": 0.0006465070000558626 }, "communicator.exchange": { "total": 0.06669388599993908, "count": 1, "is_parallel": true, "self": 0.06669388599993908 }, "steps_from_proto": { "total": 0.002305839000200649, "count": 1, "is_parallel": true, "self": 0.0006614260000787908, "children": { "_process_rank_one_or_two_observation": { "total": 0.0016444130001218582, "count": 8, "is_parallel": true, "self": 0.0016444130001218582 } } } } } } }, "UnityEnvironment.step": { "total": 1510.3706283639094, "count": 63670, "is_parallel": true, "self": 40.86527133974096, "children": { "UnityEnvironment._generate_step_input": { "total": 26.713646200000767, "count": 63670, "is_parallel": true, "self": 26.713646200000767 }, "communicator.exchange": { "total": 1296.5562163450732, "count": 63670, "is_parallel": true, "self": 1296.5562163450732 }, "steps_from_proto": { "total": 146.23549447909454, "count": 63670, "is_parallel": true, "self": 40.840835090034034, "children": { "_process_rank_one_or_two_observation": { "total": 105.39465938906051, "count": 509360, "is_parallel": true, "self": 105.39465938906051 } } } } } } } } } } }, "trainer_advance": { "total": 1246.9373449231339, "count": 63671, "self": 4.858867588176508, "children": { "process_trajectory": { "total": 224.24579585895845, "count": 63671, "self": 224.01144094195843, "children": { "RLTrainer._checkpoint": { "total": 0.23435491700001876, "count": 2, "self": 0.23435491700001876 } } }, "_update_policy": { "total": 1017.8326814759989, "count": 446, "self": 280.58072937801626, "children": { "TorchPPOOptimizer.update": { "total": 737.2519520979827, "count": 22812, "self": 737.2519520979827 } } } } } } }, "trainer_threads": { "total": 1.4399993233382702e-06, "count": 1, "self": 1.4399993233382702e-06 }, "TrainerController._save_models": { "total": 0.10594676100026845, "count": 1, "self": 0.0021927860007053823, "children": { "RLTrainer._checkpoint": { "total": 0.10375397499956307, "count": 1, "self": 0.10375397499956307 } } } } } } }