|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.4935741126537323, |
|
"min": 0.4935741126537323, |
|
"max": 1.467158317565918, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 14751.943359375, |
|
"min": 14751.943359375, |
|
"max": 44507.71484375, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989927.0, |
|
"min": 29952.0, |
|
"max": 989927.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989927.0, |
|
"min": 29952.0, |
|
"max": 989927.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.5647760033607483, |
|
"min": -0.08042053878307343, |
|
"max": 0.5647760033607483, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 156.4429473876953, |
|
"min": -19.381349563598633, |
|
"max": 156.4429473876953, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": -0.07561420649290085, |
|
"min": -0.07561420649290085, |
|
"max": 0.2936772406101227, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": -20.94513511657715, |
|
"min": -20.94513511657715, |
|
"max": 70.48253631591797, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.070965174417602, |
|
"min": 0.06495135207531146, |
|
"max": 0.07382341051771718, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.993512441846428, |
|
"min": 0.47700984054445766, |
|
"max": 1.1073511577657578, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.025176059511664295, |
|
"min": 0.0008474972185009295, |
|
"max": 0.025176059511664295, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.35246483316330013, |
|
"min": 0.005932480529506507, |
|
"max": 0.35246483316330013, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.28480471462143e-06, |
|
"min": 7.28480471462143e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010198726600470002, |
|
"min": 0.00010198726600470002, |
|
"max": 0.0035070968309678, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10242823571428572, |
|
"min": 0.10242823571428572, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4339953, |
|
"min": 1.3691136000000002, |
|
"max": 2.5690322000000005, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00025258074785714294, |
|
"min": 0.00025258074785714294, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0035361304700000013, |
|
"min": 0.0035361304700000013, |
|
"max": 0.11692631678000001, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.008750544860959053, |
|
"min": 0.00849044881761074, |
|
"max": 0.5230200290679932, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.12250763177871704, |
|
"min": 0.11886627972126007, |
|
"max": 3.661140203475952, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 329.40697674418607, |
|
"min": 329.40697674418607, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 28329.0, |
|
"min": 15984.0, |
|
"max": 33568.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.6722823395448572, |
|
"min": -1.0000000521540642, |
|
"max": 1.6722823395448572, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 142.14399886131287, |
|
"min": -32.000001668930054, |
|
"max": 142.14399886131287, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.6722823395448572, |
|
"min": -1.0000000521540642, |
|
"max": 1.6722823395448572, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 142.14399886131287, |
|
"min": -32.000001668930054, |
|
"max": 142.14399886131287, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.030229675734538913, |
|
"min": 0.030229675734538913, |
|
"max": 11.100240192376077, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.5695224374358077, |
|
"min": 2.5695224374358077, |
|
"max": 177.60384307801723, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1701516215", |
|
"python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]", |
|
"command_line_arguments": "/opt/conda/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.1.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1701518720" |
|
}, |
|
"total": 2505.304226058, |
|
"count": 1, |
|
"self": 0.38100207599973146, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.09773542300013105, |
|
"count": 1, |
|
"self": 0.09773542300013105 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2504.825488559, |
|
"count": 1, |
|
"self": 1.636165807953148, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.750886860999799, |
|
"count": 1, |
|
"self": 2.750886860999799 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2500.364389289047, |
|
"count": 63677, |
|
"self": 1.694592466064023, |
|
"children": { |
|
"env_step": { |
|
"total": 1609.357019011958, |
|
"count": 63677, |
|
"self": 1483.6055631649015, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 124.72657889706738, |
|
"count": 63677, |
|
"self": 5.280796016091472, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 119.44578288097591, |
|
"count": 62557, |
|
"self": 119.44578288097591 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 1.0248769499892205, |
|
"count": 63677, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2502.1594690359657, |
|
"count": 63677, |
|
"is_parallel": true, |
|
"self": 1148.875177171908, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.002381091999950513, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0007242210006097594, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0016568709993407538, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0016568709993407538 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.03902450999999019, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00042446399993423256, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0004501749999690219, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004501749999690219 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.03670142200007831, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.03670142200007831 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0014484490000086225, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00031598000009580574, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011324689999128168, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011324689999128168 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1353.2842918640576, |
|
"count": 63676, |
|
"is_parallel": true, |
|
"self": 29.068680306120996, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 24.68096147993151, |
|
"count": 63676, |
|
"is_parallel": true, |
|
"self": 24.68096147993151 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1199.4893243349823, |
|
"count": 63676, |
|
"is_parallel": true, |
|
"self": 1199.4893243349823 |
|
}, |
|
"steps_from_proto": { |
|
"total": 100.04532574302289, |
|
"count": 63676, |
|
"is_parallel": true, |
|
"self": 20.499260584999774, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 79.54606515802311, |
|
"count": 509408, |
|
"is_parallel": true, |
|
"self": 79.54606515802311 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 889.3127778110247, |
|
"count": 63677, |
|
"self": 3.186108067023497, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 155.82249490900745, |
|
"count": 63677, |
|
"self": 155.6665104930073, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.15598441600013757, |
|
"count": 2, |
|
"self": 0.15598441600013757 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 730.3041748349938, |
|
"count": 449, |
|
"self": 446.9584316469975, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 283.3457431879963, |
|
"count": 22848, |
|
"self": 283.3457431879963 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.1830002222268376e-06, |
|
"count": 1, |
|
"self": 1.1830002222268376e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.07404541799996878, |
|
"count": 1, |
|
"self": 0.0015703580002082163, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.07247505999976056, |
|
"count": 1, |
|
"self": 0.07247505999976056 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |