|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.14446556568145752, |
|
"min": 0.14446556568145752, |
|
"max": 1.444345235824585, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 4329.34423828125, |
|
"min": 4329.34423828125, |
|
"max": 43815.65625, |
|
"count": 100 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 2999995.0, |
|
"min": 29952.0, |
|
"max": 2999995.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 2999995.0, |
|
"min": 29952.0, |
|
"max": 2999995.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.7704235315322876, |
|
"min": -0.10181490331888199, |
|
"max": 0.8655116558074951, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 228.8157958984375, |
|
"min": -24.537391662597656, |
|
"max": 263.11553955078125, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.016733018681406975, |
|
"min": 0.0011387375416234136, |
|
"max": 0.555656373500824, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 4.9697065353393555, |
|
"min": 0.3108753561973572, |
|
"max": 131.69056701660156, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06988161647585038, |
|
"min": 0.06204224426050851, |
|
"max": 0.07483950753770285, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9783426306619054, |
|
"min": 0.4822765194875156, |
|
"max": 1.0786946713342331, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01392988887444629, |
|
"min": 0.00039698107112373356, |
|
"max": 0.02598050595420415, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.19501844424224804, |
|
"min": 0.00555773499573227, |
|
"max": 0.26956557048833935, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 1.5683637629595244e-06, |
|
"min": 1.5683637629595244e-06, |
|
"max": 0.00029838354339596195, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 2.1957092681433342e-05, |
|
"min": 2.1957092681433342e-05, |
|
"max": 0.0039275268908244, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10052275476190477, |
|
"min": 0.10052275476190477, |
|
"max": 0.19946118095238097, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4073185666666668, |
|
"min": 1.3897045333333333, |
|
"max": 2.7973922, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 6.222320071428574e-05, |
|
"min": 6.222320071428574e-05, |
|
"max": 0.009946171977142856, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0008711248100000005, |
|
"min": 0.0008711248100000005, |
|
"max": 0.13092664244000002, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.008425016887485981, |
|
"min": 0.008099747821688652, |
|
"max": 0.6463526487350464, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.11795023083686829, |
|
"min": 0.11600933969020844, |
|
"max": 4.524468421936035, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 222.0597014925373, |
|
"min": 207.645390070922, |
|
"max": 999.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29756.0, |
|
"min": 15984.0, |
|
"max": 32511.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.761954872175715, |
|
"min": -1.0000000521540642, |
|
"max": 1.7871785570468222, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 234.3399979993701, |
|
"min": -32.000001668930054, |
|
"max": 251.8519984483719, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.761954872175715, |
|
"min": -1.0000000521540642, |
|
"max": 1.7871785570468222, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 234.3399979993701, |
|
"min": -32.000001668930054, |
|
"max": 251.8519984483719, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.019676849928105082, |
|
"min": 0.017501125833372988, |
|
"max": 15.005290312692523, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.617021040437976, |
|
"min": 2.4676587425055914, |
|
"max": 240.08464500308037, |
|
"count": 100 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1712438014", |
|
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
|
"command_line_arguments": "/home/joeny/.local/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=trained-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.2.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1712441530" |
|
}, |
|
"total": 3516.1791991659993, |
|
"count": 1, |
|
"self": 0.2688839359998383, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.03330624399950466, |
|
"count": 1, |
|
"self": 0.03330624399950466 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 3515.877008986, |
|
"count": 1, |
|
"self": 3.147021408013643, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 1.5705331240005762, |
|
"count": 1, |
|
"self": 1.5705331240005762 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 3511.0439016629844, |
|
"count": 194833, |
|
"self": 3.0325700815346863, |
|
"children": { |
|
"env_step": { |
|
"total": 2382.5480493187533, |
|
"count": 194833, |
|
"self": 2118.9429423037627, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 261.4096492479948, |
|
"count": 194833, |
|
"self": 8.231087012253738, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 253.17856223574108, |
|
"count": 187554, |
|
"self": 253.17856223574108 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 2.195457766995787, |
|
"count": 194833, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 3511.8801136623697, |
|
"count": 194833, |
|
"is_parallel": true, |
|
"self": 1610.1382468191578, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0011475289993541082, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000341423000463692, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0008061059988904162, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0008061059988904162 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.0254131720002988, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005840149988216581, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00019179200080543524, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00019179200080543524 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.023148442000092473, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.023148442000092473 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0014889230005792342, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0002428700017844676, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0012460529987947666, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0012460529987947666 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1901.741866843212, |
|
"count": 194832, |
|
"is_parallel": true, |
|
"self": 61.07512853609114, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 32.398689086351624, |
|
"count": 194832, |
|
"is_parallel": true, |
|
"self": 32.398689086351624 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1653.8236376497634, |
|
"count": 194832, |
|
"is_parallel": true, |
|
"self": 1653.8236376497634 |
|
}, |
|
"steps_from_proto": { |
|
"total": 154.44441157100573, |
|
"count": 194832, |
|
"is_parallel": true, |
|
"self": 31.70061374753186, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 122.74379782347387, |
|
"count": 1558656, |
|
"is_parallel": true, |
|
"self": 122.74379782347387 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1125.4632822626963, |
|
"count": 194833, |
|
"self": 5.892573370757418, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 220.0148202569244, |
|
"count": 194833, |
|
"self": 219.5871394479209, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.4276808090035047, |
|
"count": 6, |
|
"self": 0.4276808090035047 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 899.5558886350145, |
|
"count": 1392, |
|
"self": 520.4894827230446, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 379.0664059119699, |
|
"count": 68403, |
|
"self": 379.0664059119699 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 5.830006557516754e-07, |
|
"count": 1, |
|
"self": 5.830006557516754e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.11555220800073585, |
|
"count": 1, |
|
"self": 0.0009456030020373873, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.11460660499869846, |
|
"count": 1, |
|
"self": 0.11460660499869846 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |