First Push

e4de8b7 verified over 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.41336187720298767,
	"min": 0.41336187720298767,
	"max": 1.4649927616119385,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 12381.0146484375,
	"min": 12381.0146484375,
	"max": 44442.01953125,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989987.0,
	"min": 29909.0,
	"max": 989987.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989987.0,
	"min": 29909.0,
	"max": 989987.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.4611879289150238,
	"min": -0.08653777837753296,
	"max": 0.5208510756492615,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 127.2878646850586,
	"min": -21.115217208862305,
	"max": 144.27574157714844,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.0827915370464325,
	"min": -0.020135240629315376,
	"max": 0.2369966059923172,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 22.8504638671875,
	"min": -5.456650257110596,
	"max": 57.116180419921875,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06954284608310302,
	"min": 0.06541757567417032,
	"max": 0.07559310506136778,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9735998451634422,
	"min": 0.5782482939776992,
	"max": 1.058303470859149,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01547441167993496,
	"min": 0.0006549689626029119,
	"max": 0.016060077420358237,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.21664176351908943,
	"min": 0.009169565476440766,
	"max": 0.2248410838850153,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.481947506049992e-06,
	"min": 7.481947506049992e-06,
	"max": 0.0002947665392444875,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.0001047472650846999,
	"min": 0.0001047472650846999,
	"max": 0.0036331999889333997,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10249395000000001,
	"min": 0.10249395000000001,
	"max": 0.1982555125,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4349153000000001,
	"min": 1.4349153000000001,
	"max": 2.611066600000001,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00025914560499999976,
	"min": 0.00025914560499999976,
	"max": 0.00982572569875,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003628038469999997,
	"min": 0.003628038469999997,
	"max": 0.12112555333999998,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.014167736284434795,
	"min": 0.014167736284434795,
	"max": 0.3874890208244324,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.19834831357002258,
	"min": 0.19834831357002258,
	"max": 3.099912166595459,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 409.88461538461536,
	"min": 366.975,
	"max": 990.2666666666667,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 31971.0,
	"min": 17475.0,
	"max": 33463.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.458477897303445,
	"min": -0.9246250505093485,
	"max": 1.5830149767920374,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 112.30279809236526,
	"min": -29.588001616299152,
	"max": 129.21399794518948,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.458477897303445,
	"min": -0.9246250505093485,
	"max": 1.5830149767920374,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 112.30279809236526,
	"min": -29.588001616299152,
	"max": 129.21399794518948,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.060503237912894,
	"min": 0.0541872761779814,
	"max": 7.393877701212962,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 4.658749319292838,
	"min": 4.309561093163211,
	"max": 133.08979862183332,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1737039256",
	"python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.5.1+cu124",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1737041473"
	},
	"total": 2217.250903149,
	"count": 1,
	"self": 0.6431621699998686,
	"children": {
	"run_training.setup": {
	"total": 0.02193374899997025,
	"count": 1,
	"self": 0.02193374899997025
	},
	"TrainerController.start_learning": {
	"total": 2216.5858072300002,
	"count": 1,
	"self": 1.4333999779391888,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.036220076999996,
	"count": 1,
	"self": 3.036220076999996
	},
	"TrainerController.advance": {
	"total": 2212.027598170061,
	"count": 63806,
	"self": 1.5035490330851644,
	"children": {
	"env_step": {
	"total": 1513.254193532992,
	"count": 63806,
	"self": 1356.5088433809983,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 155.8851694540142,
	"count": 63806,
	"self": 4.693354754020561,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 151.19181469999364,
	"count": 62564,
	"self": 151.19181469999364
	}
	}
	},
	"workers": {
	"total": 0.8601806979794446,
	"count": 63806,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2211.2968053100417,
	"count": 63806,
	"is_parallel": true,
	"self": 968.987262491059,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.005746649000002435,
	"count": 1,
	"is_parallel": true,
	"self": 0.004351683000095363,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013949659999070718,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013949659999070718
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.047842519000028005,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005632550000882475,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004649149999522706,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004649149999522706
	},
	"communicator.exchange": {
	"total": 0.045036253000034776,
	"count": 1,
	"is_parallel": true,
	"self": 0.045036253000034776
	},
	"steps_from_proto": {
	"total": 0.0017780959999527113,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005030499997928928,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012750460001598185,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012750460001598185
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1242.3095428189827,
	"count": 63805,
	"is_parallel": true,
	"self": 32.21548038704668,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 22.983295438992513,
	"count": 63805,
	"is_parallel": true,
	"self": 22.983295438992513
	},
	"communicator.exchange": {
	"total": 1090.358355256982,
	"count": 63805,
	"is_parallel": true,
	"self": 1090.358355256982
	},
	"steps_from_proto": {
	"total": 96.75241173596157,
	"count": 63805,
	"is_parallel": true,
	"self": 19.48196411892627,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 77.2704476170353,
	"count": 510440,
	"is_parallel": true,
	"self": 77.2704476170353
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 697.269855603984,
	"count": 63806,
	"self": 2.728400674074919,
	"children": {
	"process_trajectory": {
	"total": 129.63196941690978,
	"count": 63806,
	"self": 129.37337858891,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2585908279997966,
	"count": 2,
	"self": 0.2585908279997966
	}
	}
	},
	"_update_policy": {
	"total": 564.9094855129993,
	"count": 459,
	"self": 314.3957293169875,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 250.51375619601174,
	"count": 22791,
	"self": 250.51375619601174
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.219999472203199e-07,
	"count": 1,
	"self": 8.219999472203199e-07
	},
	"TrainerController._save_models": {
	"total": 0.08858818299995619,
	"count": 1,
	"self": 0.0015602419998685946,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0870279410000876,
	"count": 1,
	"self": 0.0870279410000876
	}
	}
	}
	}
	}
	}
	}