|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.2816214859485626, |
|
"min": 0.27325060963630676, |
|
"max": 1.447108507156372, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 8484.6923828125, |
|
"min": 8193.3017578125, |
|
"max": 43899.484375, |
|
"count": 40 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 1199944.0, |
|
"min": 29952.0, |
|
"max": 1199944.0, |
|
"count": 40 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 1199944.0, |
|
"min": 29952.0, |
|
"max": 1199944.0, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.641365110874176, |
|
"min": -0.11645389348268509, |
|
"max": 0.6860062479972839, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 182.14768981933594, |
|
"min": -28.065387725830078, |
|
"max": 196.8837890625, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.0178033709526062, |
|
"min": -0.00929284654557705, |
|
"max": 0.225004643201828, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 5.056157112121582, |
|
"min": -2.5927042961120605, |
|
"max": 54.22611999511719, |
|
"count": 40 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06766902339932997, |
|
"min": 0.0650183567001174, |
|
"max": 0.07413154792794516, |
|
"count": 40 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9473663275906196, |
|
"min": 0.4989679115433005, |
|
"max": 1.0472376360654987, |
|
"count": 40 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01697522836426894, |
|
"min": 0.0006247077437635777, |
|
"max": 0.01713264944976092, |
|
"count": 40 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.23765319709976515, |
|
"min": 0.00812120066892651, |
|
"max": 0.2569897417464138, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 3.7445451804226198e-06, |
|
"min": 3.7445451804226198e-06, |
|
"max": 0.0002959588584899048, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 5.242363252591668e-05, |
|
"min": 5.242363252591668e-05, |
|
"max": 0.0036226571924476664, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10124814880952382, |
|
"min": 0.10124814880952382, |
|
"max": 0.1986529523809524, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4174740833333335, |
|
"min": 1.3905706666666668, |
|
"max": 2.6075523333333335, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00013469006607142857, |
|
"min": 0.00013469006607142857, |
|
"max": 0.00986542994285714, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0018856609250000001, |
|
"min": 0.0018856609250000001, |
|
"max": 0.12077447809999999, |
|
"count": 40 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.007941853255033493, |
|
"min": 0.007908061146736145, |
|
"max": 0.415669709444046, |
|
"count": 40 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.1111859455704689, |
|
"min": 0.11071285605430603, |
|
"max": 2.9096879959106445, |
|
"count": 40 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 294.36893203883494, |
|
"min": 274.6509433962264, |
|
"max": 999.0, |
|
"count": 40 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 30320.0, |
|
"min": 15984.0, |
|
"max": 33038.0, |
|
"count": 40 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.686211634174134, |
|
"min": -1.0000000521540642, |
|
"max": 1.7018968920732283, |
|
"count": 40 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 173.6797983199358, |
|
"min": -29.898201644420624, |
|
"max": 184.77499793469906, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.686211634174134, |
|
"min": -1.0000000521540642, |
|
"max": 1.7018968920732283, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 173.6797983199358, |
|
"min": -29.898201644420624, |
|
"max": 184.77499793469906, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.024442765250286647, |
|
"min": 0.022999434261846374, |
|
"max": 9.523486039601266, |
|
"count": 40 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.5176048207795247, |
|
"min": 2.381915781501448, |
|
"max": 152.37577663362026, |
|
"count": 40 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 40 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 40 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1674325890", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1674328335" |
|
}, |
|
"total": 2444.817424825, |
|
"count": 1, |
|
"self": 0.4274704730000849, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.11824862000003122, |
|
"count": 1, |
|
"self": 0.11824862000003122 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2444.271705732, |
|
"count": 1, |
|
"self": 1.424217562974718, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.8738629819999915, |
|
"count": 1, |
|
"self": 6.8738629819999915 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2435.8780134030258, |
|
"count": 76972, |
|
"self": 1.4874208402252407, |
|
"children": { |
|
"env_step": { |
|
"total": 1673.3590310878744, |
|
"count": 76972, |
|
"self": 1556.884214595943, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 115.61947711898802, |
|
"count": 76972, |
|
"self": 4.774968489137791, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 110.84450862985022, |
|
"count": 75059, |
|
"self": 37.589818540806846, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 73.25469008904338, |
|
"count": 75059, |
|
"self": 73.25469008904338 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.8553393729434902, |
|
"count": 76972, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2439.99166084691, |
|
"count": 76972, |
|
"is_parallel": true, |
|
"self": 993.0030073088096, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0016060819998529041, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005645320002258813, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0010415499996270228, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0010415499996270228 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.0458810490003998, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005086400001346192, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0005010350000702601, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005010350000702601 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04316214900018167, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04316214900018167 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.001709225000013248, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004373009996925248, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0012719240003207233, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0012719240003207233 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1446.9886535381002, |
|
"count": 76971, |
|
"is_parallel": true, |
|
"self": 31.65827170807006, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 25.12121521501558, |
|
"count": 76971, |
|
"is_parallel": true, |
|
"self": 25.12121521501558 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1277.6611165719955, |
|
"count": 76971, |
|
"is_parallel": true, |
|
"self": 1277.6611165719955 |
|
}, |
|
"steps_from_proto": { |
|
"total": 112.54805004301897, |
|
"count": 76971, |
|
"is_parallel": true, |
|
"self": 24.446230012097203, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 88.10182003092177, |
|
"count": 615768, |
|
"is_parallel": true, |
|
"self": 88.10182003092177 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 761.0315614749261, |
|
"count": 76972, |
|
"self": 2.6816516639114525, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 167.05535639602613, |
|
"count": 76972, |
|
"self": 166.77351540902646, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.28184098699966853, |
|
"count": 2, |
|
"self": 0.28184098699966853 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 591.2945534149885, |
|
"count": 546, |
|
"self": 226.89345218001654, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 364.401101234972, |
|
"count": 27321, |
|
"self": 364.401101234972 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.0310004654456861e-06, |
|
"count": 1, |
|
"self": 1.0310004654456861e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.0956107529991641, |
|
"count": 1, |
|
"self": 0.001357368999379105, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.094253383999785, |
|
"count": 1, |
|
"self": 0.094253383999785 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |