|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.32218632102012634, |
|
"min": 0.32218632102012634, |
|
"max": 1.417680025100708, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 9598.5751953125, |
|
"min": 9598.5751953125, |
|
"max": 43006.7421875, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989967.0, |
|
"min": 29925.0, |
|
"max": 989967.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989967.0, |
|
"min": 29925.0, |
|
"max": 989967.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.48654529452323914, |
|
"min": -0.10096907615661621, |
|
"max": 0.6211122274398804, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 133.79995727539062, |
|
"min": -24.253517150878906, |
|
"max": 174.53253173828125, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.023541927337646484, |
|
"min": -0.0011328005930408835, |
|
"max": 0.3510272204875946, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 6.474030017852783, |
|
"min": -0.29792654514312744, |
|
"max": 83.19345092773438, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.0695969604644781, |
|
"min": 0.06443182451363802, |
|
"max": 0.07345597657314058, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9743574465026933, |
|
"min": 0.4958543585895711, |
|
"max": 1.0447592619953758, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.016993682267506614, |
|
"min": 0.000713795746494557, |
|
"max": 0.017529804446981177, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.23791155174509257, |
|
"min": 0.007851753211440127, |
|
"max": 0.2454172622577365, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.638976025135713e-06, |
|
"min": 7.638976025135713e-06, |
|
"max": 0.0002952340730172143, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010694566435189998, |
|
"min": 0.00010694566435189998, |
|
"max": 0.0032548496150501998, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10254629285714287, |
|
"min": 0.10254629285714287, |
|
"max": 0.19841135714285715, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4356481, |
|
"min": 1.3888795, |
|
"max": 2.4826161, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00026437465642857144, |
|
"min": 0.00026437465642857144, |
|
"max": 0.009841294578571427, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0037012451900000003, |
|
"min": 0.0037012451900000003, |
|
"max": 0.10851648502, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.016000542789697647, |
|
"min": 0.016000542789697647, |
|
"max": 0.4562482237815857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.22400760650634766, |
|
"min": 0.22400760650634766, |
|
"max": 3.193737506866455, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 344.3370786516854, |
|
"min": 323.82022471910113, |
|
"max": 996.5806451612904, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 30646.0, |
|
"min": 16596.0, |
|
"max": 32642.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.5855636105618693, |
|
"min": -0.9330065036492963, |
|
"max": 1.6537011029680124, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 139.5295977294445, |
|
"min": -30.626201704144478, |
|
"max": 147.1793981641531, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.5855636105618693, |
|
"min": -0.9330065036492963, |
|
"max": 1.6537011029680124, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 139.5295977294445, |
|
"min": -30.626201704144478, |
|
"max": 147.1793981641531, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.05686455532552579, |
|
"min": 0.05686455532552579, |
|
"max": 8.655580476802939, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 5.00408086864627, |
|
"min": 5.00408086864627, |
|
"max": 147.14486810564995, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1674132593", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1674134692" |
|
}, |
|
"total": 2099.230538492, |
|
"count": 1, |
|
"self": 0.4243024410002363, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.10984147299996039, |
|
"count": 1, |
|
"self": 0.10984147299996039 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2098.696394578, |
|
"count": 1, |
|
"self": 1.2625659520158479, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.117145030000074, |
|
"count": 1, |
|
"self": 6.117145030000074 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2091.2296980779834, |
|
"count": 63912, |
|
"self": 1.2819954649921783, |
|
"children": { |
|
"env_step": { |
|
"total": 1425.4749036940316, |
|
"count": 63912, |
|
"self": 1317.3880180700214, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 107.26816299203801, |
|
"count": 63912, |
|
"self": 4.4487346080372845, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 102.81942838400073, |
|
"count": 62561, |
|
"self": 34.71087786992098, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 68.10855051407975, |
|
"count": 62561, |
|
"self": 68.10855051407975 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.8187226319721503, |
|
"count": 63912, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2093.959562874037, |
|
"count": 63912, |
|
"is_parallel": true, |
|
"self": 879.2294356219936, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0017212289999406494, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006590159998722811, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0010622130000683683, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0010622130000683683 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04934523400015678, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005252009998457652, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00044360000015331025, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00044360000015331025 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04644157699999596, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04644157699999596 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0019348560001617443, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00044470200009527616, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0014901540000664681, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0014901540000664681 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1214.7301272520435, |
|
"count": 63911, |
|
"is_parallel": true, |
|
"self": 28.141131763056592, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 23.962738398002784, |
|
"count": 63911, |
|
"is_parallel": true, |
|
"self": 23.962738398002784 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1058.0187053659834, |
|
"count": 63911, |
|
"is_parallel": true, |
|
"self": 1058.0187053659834 |
|
}, |
|
"steps_from_proto": { |
|
"total": 104.6075517250008, |
|
"count": 63911, |
|
"is_parallel": true, |
|
"self": 23.2369245229263, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 81.3706272020745, |
|
"count": 511288, |
|
"is_parallel": true, |
|
"self": 81.3706272020745 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 664.4727989189596, |
|
"count": 63912, |
|
"self": 2.3066455699427024, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 148.80680335001898, |
|
"count": 63912, |
|
"self": 148.6195796840184, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.18722366600059104, |
|
"count": 2, |
|
"self": 0.18722366600059104 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 513.3593499989979, |
|
"count": 448, |
|
"self": 197.59070913301753, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 315.7686408659804, |
|
"count": 22818, |
|
"self": 315.7686408659804 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.890000001178123e-07, |
|
"count": 1, |
|
"self": 9.890000001178123e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.08698452900034681, |
|
"count": 1, |
|
"self": 0.0012948880003023078, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.0856896410000445, |
|
"count": 1, |
|
"self": 0.0856896410000445 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |