|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.34867730736732483, |
|
"min": 0.34867730736732483, |
|
"max": 1.388346552848816, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 10477.0556640625, |
|
"min": 10477.0556640625, |
|
"max": 42116.8828125, |
|
"count": 34 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 1019966.0, |
|
"min": 29952.0, |
|
"max": 1019966.0, |
|
"count": 34 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 1019966.0, |
|
"min": 29952.0, |
|
"max": 1019966.0, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.593503475189209, |
|
"min": -0.09624023735523224, |
|
"max": 0.6029665470123291, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 161.43295288085938, |
|
"min": -23.290138244628906, |
|
"max": 168.83062744140625, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.026628784835338593, |
|
"min": 0.019439801573753357, |
|
"max": 0.3245362639427185, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 7.243029594421387, |
|
"min": 5.287626266479492, |
|
"max": 78.21324157714844, |
|
"count": 34 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.0726065815991203, |
|
"min": 0.06518121377733067, |
|
"max": 0.0738082705479396, |
|
"count": 34 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 1.0164921423876843, |
|
"min": 0.4951569713843148, |
|
"max": 1.0532709674056, |
|
"count": 34 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.013795891233837442, |
|
"min": 0.00022016958157364307, |
|
"max": 0.016662508809246242, |
|
"count": 34 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.1931424772737242, |
|
"min": 0.002642034978883717, |
|
"max": 0.2332751233294474, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 0.00019953571205953572, |
|
"min": 0.00019953571205953572, |
|
"max": 0.00029838354339596195, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.0027934999688335, |
|
"min": 0.0020886848037717336, |
|
"max": 0.004072620342459933, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.16651189285714288, |
|
"min": 0.16651189285714288, |
|
"max": 0.19946118095238097, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 2.3311665, |
|
"min": 1.3962282666666668, |
|
"max": 2.857540066666667, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.006654538096428571, |
|
"min": 0.006654538096428571, |
|
"max": 0.009946171977142856, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.09316353335, |
|
"min": 0.06962320384, |
|
"max": 0.13576825266, |
|
"count": 34 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.021514538675546646, |
|
"min": 0.019645169377326965, |
|
"max": 0.45205339789390564, |
|
"count": 34 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.30120354890823364, |
|
"min": 0.2750323712825775, |
|
"max": 3.1643738746643066, |
|
"count": 34 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 363.6125, |
|
"min": 321.8510638297872, |
|
"max": 999.0, |
|
"count": 34 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29089.0, |
|
"min": 15984.0, |
|
"max": 32456.0, |
|
"count": 34 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.5113474772311748, |
|
"min": -1.0000000521540642, |
|
"max": 1.6568701980595892, |
|
"count": 34 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 120.90779817849398, |
|
"min": -31.998001664876938, |
|
"max": 155.7457986176014, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.5113474772311748, |
|
"min": -1.0000000521540642, |
|
"max": 1.6568701980595892, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 120.90779817849398, |
|
"min": -31.998001664876938, |
|
"max": 155.7457986176014, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.08085155892549664, |
|
"min": 0.0660823707253502, |
|
"max": 9.158712689764798, |
|
"count": 34 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 6.468124714039732, |
|
"min": 5.902974153170362, |
|
"max": 146.53940303623676, |
|
"count": 34 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 34 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 34 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1711912175", |
|
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.2.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1711916143" |
|
}, |
|
"total": 3967.928722861, |
|
"count": 1, |
|
"self": 0.5304992470000798, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0689880190002441, |
|
"count": 1, |
|
"self": 0.0689880190002441 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 3967.329235595, |
|
"count": 1, |
|
"self": 2.783447556980718, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.9833197799998743, |
|
"count": 1, |
|
"self": 2.9833197799998743 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 3961.4013934760187, |
|
"count": 65943, |
|
"self": 3.0230258670521835, |
|
"children": { |
|
"env_step": { |
|
"total": 2676.8190595849724, |
|
"count": 65943, |
|
"self": 2471.335659888868, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 203.7215361380886, |
|
"count": 65943, |
|
"self": 8.738868755081512, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 194.98266738300708, |
|
"count": 64487, |
|
"self": 194.98266738300708 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 1.7618635580156479, |
|
"count": 65942, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 3959.3801244119204, |
|
"count": 65942, |
|
"is_parallel": true, |
|
"self": 1717.3903096018576, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0035716060001504957, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0010753879996627802, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0024962180004877155, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0024962180004877155 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.07145232299990312, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0007847249994483718, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00033339300034640473, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00033339300034640473 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.06824412100013433, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.06824412100013433 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.002090083999974013, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004403819998515246, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0016497020001224882, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0016497020001224882 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 2241.989814810063, |
|
"count": 65941, |
|
"is_parallel": true, |
|
"self": 60.44033313942464, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 32.60185797985423, |
|
"count": 65941, |
|
"is_parallel": true, |
|
"self": 32.60185797985423 |
|
}, |
|
"communicator.exchange": { |
|
"total": 2000.7793568549287, |
|
"count": 65941, |
|
"is_parallel": true, |
|
"self": 2000.7793568549287 |
|
}, |
|
"steps_from_proto": { |
|
"total": 148.16826683585532, |
|
"count": 65941, |
|
"is_parallel": true, |
|
"self": 33.26586393802609, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 114.90240289782923, |
|
"count": 527528, |
|
"is_parallel": true, |
|
"self": 114.90240289782923 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1281.5593080239942, |
|
"count": 65942, |
|
"self": 6.257364301982307, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 203.62035893600614, |
|
"count": 65942, |
|
"self": 203.41450901600683, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.20584991999930935, |
|
"count": 2, |
|
"self": 0.20584991999930935 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 1071.6815847860057, |
|
"count": 464, |
|
"self": 415.06280488803486, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 656.6187798979709, |
|
"count": 23553, |
|
"self": 656.6187798979709 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.965000592463184e-06, |
|
"count": 1, |
|
"self": 1.965000592463184e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.16107281699987652, |
|
"count": 1, |
|
"self": 0.004031147000205237, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.15704166999967129, |
|
"count": 1, |
|
"self": 0.15704166999967129 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |