| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.39427027106285095, | |
| "min": 0.39427027106285095, | |
| "max": 1.503057599067688, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 11727.1748046875, | |
| "min": 11727.1748046875, | |
| "max": 45596.75390625, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989983.0, | |
| "min": 29952.0, | |
| "max": 989983.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989983.0, | |
| "min": 29952.0, | |
| "max": 989983.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.4405461549758911, | |
| "min": -0.16041484475135803, | |
| "max": 0.47715598344802856, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 120.26910400390625, | |
| "min": -38.01831817626953, | |
| "max": 130.26358032226562, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.06472254544496536, | |
| "min": 0.005800291895866394, | |
| "max": 0.3595026135444641, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 17.669254302978516, | |
| "min": 1.5776793956756592, | |
| "max": 85.20211791992188, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06988046964294933, | |
| "min": 0.06550643272866082, | |
| "max": 0.07200131401237467, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 1.04820704464424, | |
| "min": 0.5040091980866227, | |
| "max": 1.0646780332431707, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.015888691466515486, | |
| "min": 0.00015085834189976672, | |
| "max": 0.015888691466515486, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.2383303719977323, | |
| "min": 0.002112016786596734, | |
| "max": 0.2383303719977323, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.421617526160003e-06, | |
| "min": 7.421617526160003e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00011132426289240005, | |
| "min": 0.00011132426289240005, | |
| "max": 0.0035089430303524, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10247384000000002, | |
| "min": 0.10247384000000002, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.5371076000000004, | |
| "min": 1.3886848, | |
| "max": 2.5696476000000006, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0002571366160000002, | |
| "min": 0.0002571366160000002, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0038570492400000025, | |
| "min": 0.0038570492400000025, | |
| "max": 0.11698779524000001, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.011800948530435562, | |
| "min": 0.011800948530435562, | |
| "max": 0.5517892241477966, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.17701423168182373, | |
| "min": 0.17513614892959595, | |
| "max": 3.8625245094299316, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 391.68, | |
| "min": 377.2368421052632, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29376.0, | |
| "min": 15984.0, | |
| "max": 32413.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.4749413097898165, | |
| "min": -1.0000000521540642, | |
| "max": 1.4948524727486074, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 110.62059823423624, | |
| "min": -31.991201624274254, | |
| "max": 119.58819781988859, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.4749413097898165, | |
| "min": -1.0000000521540642, | |
| "max": 1.4948524727486074, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 110.62059823423624, | |
| "min": -31.991201624274254, | |
| "max": 119.58819781988859, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.04701650693003709, | |
| "min": 0.04701650693003709, | |
| "max": 12.144991533830762, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 3.526238019752782, | |
| "min": 3.526238019752782, | |
| "max": 194.3198645412922, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1706764846", | |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.2.0+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1706766850" | |
| }, | |
| "total": 2003.6855430330002, | |
| "count": 1, | |
| "self": 0.4784587050007758, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.045315219999793044, | |
| "count": 1, | |
| "self": 0.045315219999793044 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2003.1617691079996, | |
| "count": 1, | |
| "self": 1.2035995239743897, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.304946627999925, | |
| "count": 1, | |
| "self": 2.304946627999925 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 1999.5667290440251, | |
| "count": 63610, | |
| "self": 1.289900200961256, | |
| "children": { | |
| "env_step": { | |
| "total": 1388.6125022690344, | |
| "count": 63610, | |
| "self": 1266.7464263020975, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 121.1312562029866, | |
| "count": 63610, | |
| "self": 4.464040634106368, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 116.66721556888024, | |
| "count": 62556, | |
| "self": 116.66721556888024 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.7348197639503269, | |
| "count": 63610, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 1998.3162297030844, | |
| "count": 63610, | |
| "is_parallel": true, | |
| "self": 839.5699807410365, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0020450080000955495, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.000602087000515894, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0014429209995796555, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0014429209995796555 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.04878286700022727, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006065019997549825, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005665480002789991, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005665480002789991 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.045886881000114954, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.045886881000114954 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0017229360000783345, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00044658600018010475, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012763499998982297, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012763499998982297 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1158.746248962048, | |
| "count": 63609, | |
| "is_parallel": true, | |
| "self": 33.89405494105995, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 23.267558004025886, | |
| "count": 63609, | |
| "is_parallel": true, | |
| "self": 23.267558004025886 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1006.7537877148643, | |
| "count": 63609, | |
| "is_parallel": true, | |
| "self": 1006.7537877148643 | |
| }, | |
| "steps_from_proto": { | |
| "total": 94.83084830209782, | |
| "count": 63609, | |
| "is_parallel": true, | |
| "self": 18.473791196097864, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 76.35705710599996, | |
| "count": 508872, | |
| "is_parallel": true, | |
| "self": 76.35705710599996 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 609.6643265740295, | |
| "count": 63610, | |
| "self": 2.3415845629647265, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 118.32200545906699, | |
| "count": 63610, | |
| "self": 118.1322458300674, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.18975962899958176, | |
| "count": 2, | |
| "self": 0.18975962899958176 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 489.00073655199776, | |
| "count": 453, | |
| "self": 287.4265515640459, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 201.57418498795187, | |
| "count": 22785, | |
| "self": 201.57418498795187 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.1140000424347818e-06, | |
| "count": 1, | |
| "self": 1.1140000424347818e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.08649279800010845, | |
| "count": 1, | |
| "self": 0.0015377529998659156, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.08495504500024254, | |
| "count": 1, | |
| "self": 0.08495504500024254 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |