|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.4197154641151428, |
|
"min": 0.272203266620636, |
|
"max": 1.5045830011367798, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 12625.041015625, |
|
"min": 8148.67724609375, |
|
"max": 45643.03125, |
|
"count": 377 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 11309921.0, |
|
"min": 29952.0, |
|
"max": 11309921.0, |
|
"count": 377 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 11309921.0, |
|
"min": 29952.0, |
|
"max": 11309921.0, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.7003707885742188, |
|
"min": -0.19950847327709198, |
|
"max": 0.7662648558616638, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 197.5045623779297, |
|
"min": -47.28350830078125, |
|
"max": 224.49522399902344, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.003947226796299219, |
|
"min": -0.05940214917063713, |
|
"max": 0.3908889889717102, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 1.1131179332733154, |
|
"min": -16.513797760009766, |
|
"max": 93.8133544921875, |
|
"count": 377 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.05026319106469773, |
|
"min": 0.04300903675833806, |
|
"max": 0.09981689124556614, |
|
"count": 377 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.3518423374528841, |
|
"min": 0.2035083431895173, |
|
"max": 0.698718238718963, |
|
"count": 377 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01388661854296169, |
|
"min": 0.00031933543865666705, |
|
"max": 9.80639659676568, |
|
"count": 377 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.09720632980073182, |
|
"min": 0.0022353480705966694, |
|
"max": 68.64477617735976, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 0.002322299456875733, |
|
"min": 0.002322299456875733, |
|
"max": 0.0029990899200303357, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.01625609619813013, |
|
"min": 0.011996359680121343, |
|
"max": 0.02384890956503635, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.17740998114285714, |
|
"min": 0.17740998114285714, |
|
"max": 0.19996966400000002, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.241869868, |
|
"min": 0.7998786560000001, |
|
"max": 1.5949636520000001, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.007743257116171428, |
|
"min": 0.007743257116171428, |
|
"max": 0.0099969694336, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.054202799813199996, |
|
"min": 0.0399878777344, |
|
"max": 0.0794968688348, |
|
"count": 377 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.0034704941790550947, |
|
"min": 0.0034704941790550947, |
|
"max": 0.6667643785476685, |
|
"count": 377 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.024293459951877594, |
|
"min": 0.024293459951877594, |
|
"max": 2.667057514190674, |
|
"count": 377 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 316.0, |
|
"min": 237.55371900826447, |
|
"max": 999.0, |
|
"count": 377 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 30968.0, |
|
"min": 15984.0, |
|
"max": 35843.0, |
|
"count": 377 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.644698966482673, |
|
"min": -1.0000000521540642, |
|
"max": 1.7624462644669636, |
|
"count": 377 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 162.82519768178463, |
|
"min": -29.995001636445522, |
|
"max": 218.6787971407175, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.644698966482673, |
|
"min": -1.0000000521540642, |
|
"max": 1.7624462644669636, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 162.82519768178463, |
|
"min": -29.995001636445522, |
|
"max": 218.6787971407175, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.011586302707398475, |
|
"min": 0.009915739200480927, |
|
"max": 11.432586884126067, |
|
"count": 377 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 1.147043968032449, |
|
"min": 1.0746353828071733, |
|
"max": 182.92139014601707, |
|
"count": 377 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 377 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 377 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1689757960", |
|
"python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]", |
|
"command_line_arguments": "/home/arran/.local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --force", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1689767774" |
|
}, |
|
"total": 9813.438060935005, |
|
"count": 1, |
|
"self": 0.14997585001401603, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.009300467994762585, |
|
"count": 1, |
|
"self": 0.009300467994762585 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 9813.278784616996, |
|
"count": 1, |
|
"self": 9.232576190959662, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.422013842005981, |
|
"count": 1, |
|
"self": 2.422013842005981 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 9801.555481683026, |
|
"count": 732625, |
|
"self": 8.413826392206829, |
|
"children": { |
|
"env_step": { |
|
"total": 6327.068002251006, |
|
"count": 732625, |
|
"self": 5318.326892920915, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 1003.0577777927683, |
|
"count": 732625, |
|
"self": 25.714818801294314, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 977.342958991474, |
|
"count": 707201, |
|
"self": 977.342958991474 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 5.683331537322374, |
|
"count": 732624, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 9801.626357703004, |
|
"count": 732624, |
|
"is_parallel": true, |
|
"self": 5066.491318356275, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0007869589899200946, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00021948496578261256, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.000567474024137482, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.000567474024137482 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.01652249798644334, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00017548198229633272, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00020307398517616093, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00020307398517616093 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.015603690000716597, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.015603690000716597 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0005402520182542503, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00013721000868827105, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.00040304200956597924, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.00040304200956597924 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 4735.135039346729, |
|
"count": 732623, |
|
"is_parallel": true, |
|
"self": 148.83361234873882, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 108.86860577567131, |
|
"count": 732623, |
|
"is_parallel": true, |
|
"self": 108.86860577567131 |
|
}, |
|
"communicator.exchange": { |
|
"total": 4039.3383600350353, |
|
"count": 732623, |
|
"is_parallel": true, |
|
"self": 4039.3383600350353 |
|
}, |
|
"steps_from_proto": { |
|
"total": 438.09446118728374, |
|
"count": 732623, |
|
"is_parallel": true, |
|
"self": 100.58675679168664, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 337.5077043955971, |
|
"count": 5860984, |
|
"is_parallel": true, |
|
"self": 337.5077043955971 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 3466.0736530398135, |
|
"count": 732624, |
|
"self": 16.990142274677055, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 817.632784697169, |
|
"count": 732624, |
|
"self": 816.1766611461062, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 1.456123551062774, |
|
"count": 22, |
|
"self": 1.456123551062774 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 2631.4507260679675, |
|
"count": 2712, |
|
"self": 1861.5610947568202, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 769.8896313111472, |
|
"count": 130515, |
|
"self": 769.8896313111472 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 6.709888111799955e-07, |
|
"count": 1, |
|
"self": 6.709888111799955e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.06871223001508042, |
|
"count": 1, |
|
"self": 0.0009454120299778879, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.06776681798510253, |
|
"count": 1, |
|
"self": 0.06776681798510253 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |