|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.4373374283313751, |
|
"min": 0.4373374283313751, |
|
"max": 1.3828552961349487, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 13246.076171875, |
|
"min": 13246.076171875, |
|
"max": 41950.296875, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989883.0, |
|
"min": 29999.0, |
|
"max": 989883.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989883.0, |
|
"min": 29999.0, |
|
"max": 989883.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.4891029894351959, |
|
"min": -0.09020061045885086, |
|
"max": 0.6365716457366943, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 130.1013946533203, |
|
"min": -21.828548431396484, |
|
"max": 183.3326416015625, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": -0.048941098153591156, |
|
"min": -0.048941098153591156, |
|
"max": 0.37877002358436584, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": -13.018332481384277, |
|
"min": -13.018332481384277, |
|
"max": 90.14726257324219, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06822469798914556, |
|
"min": 0.06464895404449233, |
|
"max": 0.07416838001158864, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9551457718480378, |
|
"min": 0.5869756277689735, |
|
"max": 1.0502334930968251, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.014525838625905592, |
|
"min": 0.0011728096766552994, |
|
"max": 0.016486373742823378, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.2033617407626783, |
|
"min": 0.01641933547317419, |
|
"max": 0.23160827474202964, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.481861791792858e-06, |
|
"min": 7.481861791792858e-06, |
|
"max": 0.00029476297674567496, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.0001047460650851, |
|
"min": 0.0001047460650851, |
|
"max": 0.0036343006885665, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10249392142857146, |
|
"min": 0.10249392142857146, |
|
"max": 0.198254325, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4349149000000003, |
|
"min": 1.4349149000000003, |
|
"max": 2.6114335, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0002591427507142858, |
|
"min": 0.0002591427507142858, |
|
"max": 0.009825607067499999, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.003627998510000001, |
|
"min": 0.003627998510000001, |
|
"max": 0.12116220665, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.008063855580985546, |
|
"min": 0.008063855580985546, |
|
"max": 0.406576007604599, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.1128939762711525, |
|
"min": 0.1128939762711525, |
|
"max": 3.252608060836792, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 397.1333333333333, |
|
"min": 294.7113402061856, |
|
"max": 988.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29785.0, |
|
"min": 17437.0, |
|
"max": 32910.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.3894666435321172, |
|
"min": -0.8614437992218882, |
|
"max": 1.6561379090979182, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 104.20999826490879, |
|
"min": -27.566201575100422, |
|
"max": 160.54179845750332, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.3894666435321172, |
|
"min": -0.8614437992218882, |
|
"max": 1.6561379090979182, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 104.20999826490879, |
|
"min": -27.566201575100422, |
|
"max": 160.54179845750332, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.03451023576237882, |
|
"min": 0.027286063975949144, |
|
"max": 7.722050276895364, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.5882676821784116, |
|
"min": 2.527639201070997, |
|
"max": 138.99690498411655, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1674034331", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1674036519" |
|
}, |
|
"total": 2188.7614649880006, |
|
"count": 1, |
|
"self": 0.4432769940003709, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.12702667200005635, |
|
"count": 1, |
|
"self": 0.12702667200005635 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2188.191161322, |
|
"count": 1, |
|
"self": 1.202378460966429, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.287917343000117, |
|
"count": 1, |
|
"self": 6.287917343000117 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2180.615527025033, |
|
"count": 63910, |
|
"self": 1.2253711531620866, |
|
"children": { |
|
"env_step": { |
|
"total": 1508.8387061199205, |
|
"count": 63910, |
|
"self": 1407.0341820169178, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 101.0686858690151, |
|
"count": 63910, |
|
"self": 4.217618594031137, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 96.85106727498396, |
|
"count": 62561, |
|
"self": 32.782131168993146, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 64.06893610599082, |
|
"count": 62561, |
|
"self": 64.06893610599082 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.7358382339875789, |
|
"count": 63910, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2183.722967143883, |
|
"count": 63910, |
|
"is_parallel": true, |
|
"self": 873.2771783049241, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0018528010000409267, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006990250001308596, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011537759999100672, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011537759999100672 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.046326847000045746, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00050268099994355, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0004745530000036524, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004745530000036524 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.043726396000010936, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.043726396000010936 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0016232170000876067, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0003801480004312907, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001243068999656316, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001243068999656316 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1310.445788838959, |
|
"count": 63909, |
|
"is_parallel": true, |
|
"self": 28.151701304915377, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 22.246336114978703, |
|
"count": 63909, |
|
"is_parallel": true, |
|
"self": 22.246336114978703 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1161.9887209290075, |
|
"count": 63909, |
|
"is_parallel": true, |
|
"self": 1161.9887209290075 |
|
}, |
|
"steps_from_proto": { |
|
"total": 98.05903049005747, |
|
"count": 63909, |
|
"is_parallel": true, |
|
"self": 21.388863524164208, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 76.67016696589326, |
|
"count": 511272, |
|
"is_parallel": true, |
|
"self": 76.67016696589326 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 670.5514497519505, |
|
"count": 63910, |
|
"self": 2.2265912289567495, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 147.30195031299968, |
|
"count": 63910, |
|
"self": 147.11662121099903, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.1853291020006509, |
|
"count": 2, |
|
"self": 0.1853291020006509 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 521.0229082099941, |
|
"count": 459, |
|
"self": 198.27613544599762, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 322.74677276399643, |
|
"count": 22734, |
|
"self": 322.74677276399643 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.190007403958589e-07, |
|
"count": 1, |
|
"self": 9.190007403958589e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.08533757399982278, |
|
"count": 1, |
|
"self": 0.0014087740000832127, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.08392879999973957, |
|
"count": 1, |
|
"self": 0.08392879999973957 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |