|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.4975653886795044, |
|
"min": 0.47961491346359253, |
|
"max": 1.3951681852340698, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 14847.3515625, |
|
"min": 14350.078125, |
|
"max": 42323.8203125, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989894.0, |
|
"min": 29952.0, |
|
"max": 989894.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989894.0, |
|
"min": 29952.0, |
|
"max": 989894.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.4085873067378998, |
|
"min": -0.08974519371986389, |
|
"max": 0.4677356481552124, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 108.275634765625, |
|
"min": -21.449100494384766, |
|
"max": 127.2240982055664, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.014104614965617657, |
|
"min": -0.005268337205052376, |
|
"max": 0.25343790650367737, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 3.737722873687744, |
|
"min": -1.4066460132598877, |
|
"max": 60.064781188964844, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06710505671061397, |
|
"min": 0.06500589805137781, |
|
"max": 0.07254626382824657, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9394707939485956, |
|
"min": 0.5075860991809736, |
|
"max": 1.0320246177531465, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01582775835001793, |
|
"min": 0.0003489376471918086, |
|
"max": 0.01644820867449097, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.221588616900251, |
|
"min": 0.004885127060685321, |
|
"max": 0.24672313011736455, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.363468974114286e-06, |
|
"min": 7.363468974114286e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.0001030885656376, |
|
"min": 0.0001030885656376, |
|
"max": 0.0036331561889480003, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10245445714285714, |
|
"min": 0.10245445714285714, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4343624, |
|
"min": 1.3886848, |
|
"max": 2.6110519999999995, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00025520026857142863, |
|
"min": 0.00025520026857142863, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.003572803760000001, |
|
"min": 0.003572803760000001, |
|
"max": 0.12112409480000001, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.009822138585150242, |
|
"min": 0.009822138585150242, |
|
"max": 0.4139936566352844, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.13750994205474854, |
|
"min": 0.13750994205474854, |
|
"max": 2.8979556560516357, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 389.09859154929575, |
|
"min": 389.09859154929575, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 27626.0, |
|
"min": 15984.0, |
|
"max": 32785.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.4136591310232458, |
|
"min": -1.0000000521540642, |
|
"max": 1.5503628332700048, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 100.36979830265045, |
|
"min": -29.89840167760849, |
|
"max": 108.52539832890034, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.4136591310232458, |
|
"min": -1.0000000521540642, |
|
"max": 1.5503628332700048, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 100.36979830265045, |
|
"min": -29.89840167760849, |
|
"max": 108.52539832890034, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.03946737707309707, |
|
"min": 0.03946737707309707, |
|
"max": 8.436937988270074, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.802183772189892, |
|
"min": 2.802183772189892, |
|
"max": 134.9910078123212, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1679827432", |
|
"python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids-Training-01 --no-graphics", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1679829642" |
|
}, |
|
"total": 2209.582941508, |
|
"count": 1, |
|
"self": 0.48784612800000104, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.11024874600002477, |
|
"count": 1, |
|
"self": 0.11024874600002477 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2208.984846634, |
|
"count": 1, |
|
"self": 1.6394397359608774, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.252175113000021, |
|
"count": 1, |
|
"self": 6.252175113000021 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2200.9970362320387, |
|
"count": 63574, |
|
"self": 1.7514847370725874, |
|
"children": { |
|
"env_step": { |
|
"total": 1559.8176929829783, |
|
"count": 63574, |
|
"self": 1442.1477295419309, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 116.75630156701459, |
|
"count": 63574, |
|
"self": 4.92620027300444, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 111.83010129401015, |
|
"count": 62556, |
|
"self": 111.83010129401015 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.9136618740329823, |
|
"count": 63574, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2203.9800220379916, |
|
"count": 63574, |
|
"is_parallel": true, |
|
"self": 886.5983430489539, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.001865398000006735, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005853390000538639, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001280058999952871, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001280058999952871 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.08041903200000888, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005801249999421998, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0004834540000047127, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004834540000047127 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.07765766700003951, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.07765766700003951 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.001697786000022461, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004786699998930999, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001219116000129361, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001219116000129361 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1317.3816789890377, |
|
"count": 63573, |
|
"is_parallel": true, |
|
"self": 32.843421338983035, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 23.393729668981848, |
|
"count": 63573, |
|
"is_parallel": true, |
|
"self": 23.393729668981848 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1164.2905567070488, |
|
"count": 63573, |
|
"is_parallel": true, |
|
"self": 1164.2905567070488 |
|
}, |
|
"steps_from_proto": { |
|
"total": 96.85397127402388, |
|
"count": 63573, |
|
"is_parallel": true, |
|
"self": 20.916294354970887, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 75.93767691905299, |
|
"count": 508584, |
|
"is_parallel": true, |
|
"self": 75.93767691905299 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 639.427858511988, |
|
"count": 63574, |
|
"self": 2.9213153139994574, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 119.87786565599055, |
|
"count": 63574, |
|
"self": 119.61185070899074, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.2660149469998032, |
|
"count": 2, |
|
"self": 0.2660149469998032 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 516.6286775419981, |
|
"count": 452, |
|
"self": 327.54881674702926, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 189.0798607949688, |
|
"count": 22830, |
|
"self": 189.0798607949688 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.0280000424245372e-06, |
|
"count": 1, |
|
"self": 1.0280000424245372e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.09619452500010084, |
|
"count": 1, |
|
"self": 0.001404715000262513, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.09478980999983833, |
|
"count": 1, |
|
"self": 0.09478980999983833 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |