joen2010

First Push

3cd3080 verified 7 months ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.14446556568145752,
	"min": 0.14446556568145752,
	"max": 1.444345235824585,
	"count": 100
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 4329.34423828125,
	"min": 4329.34423828125,
	"max": 43815.65625,
	"count": 100
	},
	"Pyramids.Step.mean": {
	"value": 2999995.0,
	"min": 29952.0,
	"max": 2999995.0,
	"count": 100
	},
	"Pyramids.Step.sum": {
	"value": 2999995.0,
	"min": 29952.0,
	"max": 2999995.0,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.7704235315322876,
	"min": -0.10181490331888199,
	"max": 0.8655116558074951,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 228.8157958984375,
	"min": -24.537391662597656,
	"max": 263.11553955078125,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.016733018681406975,
	"min": 0.0011387375416234136,
	"max": 0.555656373500824,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 4.9697065353393555,
	"min": 0.3108753561973572,
	"max": 131.69056701660156,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06988161647585038,
	"min": 0.06204224426050851,
	"max": 0.07483950753770285,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9783426306619054,
	"min": 0.4822765194875156,
	"max": 1.0786946713342331,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01392988887444629,
	"min": 0.00039698107112373356,
	"max": 0.02598050595420415,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.19501844424224804,
	"min": 0.00555773499573227,
	"max": 0.26956557048833935,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.5683637629595244e-06,
	"min": 1.5683637629595244e-06,
	"max": 0.00029838354339596195,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 2.1957092681433342e-05,
	"min": 2.1957092681433342e-05,
	"max": 0.0039275268908244,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10052275476190477,
	"min": 0.10052275476190477,
	"max": 0.19946118095238097,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4073185666666668,
	"min": 1.3897045333333333,
	"max": 2.7973922,
	"count": 100
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 6.222320071428574e-05,
	"min": 6.222320071428574e-05,
	"max": 0.009946171977142856,
	"count": 100
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0008711248100000005,
	"min": 0.0008711248100000005,
	"max": 0.13092664244000002,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.008425016887485981,
	"min": 0.008099747821688652,
	"max": 0.6463526487350464,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.11795023083686829,
	"min": 0.11600933969020844,
	"max": 4.524468421936035,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 222.0597014925373,
	"min": 207.645390070922,
	"max": 999.0,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29756.0,
	"min": 15984.0,
	"max": 32511.0,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.761954872175715,
	"min": -1.0000000521540642,
	"max": 1.7871785570468222,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 234.3399979993701,
	"min": -32.000001668930054,
	"max": 251.8519984483719,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.761954872175715,
	"min": -1.0000000521540642,
	"max": 1.7871785570468222,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 234.3399979993701,
	"min": -32.000001668930054,
	"max": 251.8519984483719,
	"count": 100
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.019676849928105082,
	"min": 0.017501125833372988,
	"max": 15.005290312692523,
	"count": 100
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.617021040437976,
	"min": 2.4676587425055914,
	"max": 240.08464500308037,
	"count": 100
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1712438014",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/home/joeny/.local/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=trained-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1712441530"
	},
	"total": 3516.1791991659993,
	"count": 1,
	"self": 0.2688839359998383,
	"children": {
	"run_training.setup": {
	"total": 0.03330624399950466,
	"count": 1,
	"self": 0.03330624399950466
	},
	"TrainerController.start_learning": {
	"total": 3515.877008986,
	"count": 1,
	"self": 3.147021408013643,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.5705331240005762,
	"count": 1,
	"self": 1.5705331240005762
	},
	"TrainerController.advance": {
	"total": 3511.0439016629844,
	"count": 194833,
	"self": 3.0325700815346863,
	"children": {
	"env_step": {
	"total": 2382.5480493187533,
	"count": 194833,
	"self": 2118.9429423037627,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 261.4096492479948,
	"count": 194833,
	"self": 8.231087012253738,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 253.17856223574108,
	"count": 187554,
	"self": 253.17856223574108
	}
	}
	},
	"workers": {
	"total": 2.195457766995787,
	"count": 194833,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3511.8801136623697,
	"count": 194833,
	"is_parallel": true,
	"self": 1610.1382468191578,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0011475289993541082,
	"count": 1,
	"is_parallel": true,
	"self": 0.000341423000463692,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0008061059988904162,
	"count": 8,
	"is_parallel": true,
	"self": 0.0008061059988904162
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.0254131720002988,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005840149988216581,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00019179200080543524,
	"count": 1,
	"is_parallel": true,
	"self": 0.00019179200080543524
	},
	"communicator.exchange": {
	"total": 0.023148442000092473,
	"count": 1,
	"is_parallel": true,
	"self": 0.023148442000092473
	},
	"steps_from_proto": {
	"total": 0.0014889230005792342,
	"count": 1,
	"is_parallel": true,
	"self": 0.0002428700017844676,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012460529987947666,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012460529987947666
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1901.741866843212,
	"count": 194832,
	"is_parallel": true,
	"self": 61.07512853609114,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 32.398689086351624,
	"count": 194832,
	"is_parallel": true,
	"self": 32.398689086351624
	},
	"communicator.exchange": {
	"total": 1653.8236376497634,
	"count": 194832,
	"is_parallel": true,
	"self": 1653.8236376497634
	},
	"steps_from_proto": {
	"total": 154.44441157100573,
	"count": 194832,
	"is_parallel": true,
	"self": 31.70061374753186,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 122.74379782347387,
	"count": 1558656,
	"is_parallel": true,
	"self": 122.74379782347387
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1125.4632822626963,
	"count": 194833,
	"self": 5.892573370757418,
	"children": {
	"process_trajectory": {
	"total": 220.0148202569244,
	"count": 194833,
	"self": 219.5871394479209,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.4276808090035047,
	"count": 6,
	"self": 0.4276808090035047
	}
	}
	},
	"_update_policy": {
	"total": 899.5558886350145,
	"count": 1392,
	"self": 520.4894827230446,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 379.0664059119699,
	"count": 68403,
	"self": 379.0664059119699
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 5.830006557516754e-07,
	"count": 1,
	"self": 5.830006557516754e-07
	},
	"TrainerController._save_models": {
	"total": 0.11555220800073585,
	"count": 1,
	"self": 0.0009456030020373873,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.11460660499869846,
	"count": 1,
	"self": 0.11460660499869846
	}
	}
	}
	}
	}
	}
	}