First Push

e90ba5c verified 5 months ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.6198543310165405,
	"min": 0.6181684136390686,
	"max": 1.4397516250610352,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 18704.724609375,
	"min": 18426.36328125,
	"max": 43676.3046875,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989919.0,
	"min": 29952.0,
	"max": 989919.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989919.0,
	"min": 29952.0,
	"max": 989919.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.20321184396743774,
	"min": -0.1136462390422821,
	"max": 0.2698386013507843,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 51.615806579589844,
	"min": -27.275096893310547,
	"max": 69.61836242675781,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.3597458302974701,
	"min": -0.3597458302974701,
	"max": 0.2695969045162201,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -91.37544250488281,
	"min": -91.37544250488281,
	"max": 64.70325469970703,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.0710423098076024,
	"min": 0.06481601432117969,
	"max": 0.07412011613098765,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9945923373064336,
	"min": 0.47087696331905077,
	"max": 1.0567155789912623,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.039052608103832306,
	"min": 0.00016720261613035686,
	"max": 0.039052608103832306,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.5467365134536523,
	"min": 0.002340836625824996,
	"max": 0.5467365134536523,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.65005459287143e-06,
	"min": 7.65005459287143e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010710076430020003,
	"min": 0.00010710076430020003,
	"max": 0.003507054230982,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10254998571428572,
	"min": 0.10254998571428572,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4356998,
	"min": 1.3691136000000002,
	"max": 2.5690179999999994,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.000264743572857143,
	"min": 0.000264743572857143,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0037064100200000023,
	"min": 0.0037064100200000023,
	"max": 0.1169248982,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.010702558793127537,
	"min": 0.010649963282048702,
	"max": 0.4051334857940674,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.14983582496643066,
	"min": 0.14983582496643066,
	"max": 2.8359344005584717,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 590.7021276595744,
	"min": 557.08,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 27763.0,
	"min": 15984.0,
	"max": 33052.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.026191457313426,
	"min": -1.0000000521540642,
	"max": 1.082807960063219,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 48.23099849373102,
	"min": -32.000001668930054,
	"max": 54.14039800316095,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.026191457313426,
	"min": -1.0000000521540642,
	"max": 1.082807960063219,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 48.23099849373102,
	"min": -32.000001668930054,
	"max": 54.14039800316095,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.06640417896585163,
	"min": 0.06490983254687828,
	"max": 7.933333176188171,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 3.1209964113950264,
	"min": 3.1209964113950264,
	"max": 126.93333081901073,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1719354078",
	"python_version": "3.10.12 (main, Jun 25 2024, 18:12:47) [GCC 14.1.1 20240522]",
	"command_line_arguments": "/home/matt/docs/howTo/ai/u5/hf-env/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=PyramidsTraining1 --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.3.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1719354850"
	},
	"total": 772.2147408680012,
	"count": 1,
	"self": 0.21933395199994266,
	"children": {
	"run_training.setup": {
	"total": 0.00818785800038313,
	"count": 1,
	"self": 0.00818785800038313
	},
	"TrainerController.start_learning": {
	"total": 771.9872190580008,
	"count": 1,
	"self": 0.7863086638917594,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.1219685710002523,
	"count": 1,
	"self": 1.1219685710002523
	},
	"TrainerController.advance": {
	"total": 770.0380192641078,
	"count": 63306,
	"self": 0.7409733681888611,
	"children": {
	"env_step": {
	"total": 494.03147631499996,
	"count": 63306,
	"self": 436.92875950705275,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 56.58980958004031,
	"count": 63306,
	"self": 2.445062810993477,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 54.14474676904683,
	"count": 62559,
	"self": 54.14474676904683
	}
	}
	},
	"workers": {
	"total": 0.5129072279069078,
	"count": 63306,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 770.9131181956782,
	"count": 63306,
	"is_parallel": true,
	"self": 389.37936747566346,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.001608086000487674,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005663340034516295,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0010417519970360445,
	"count": 8,
	"is_parallel": true,
	"self": 0.0010417519970360445
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.019292205000965623,
	"count": 1,
	"is_parallel": true,
	"self": 0.00030818700179224834,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0002608859995234525,
	"count": 1,
	"is_parallel": true,
	"self": 0.0002608859995234525
	},
	"communicator.exchange": {
	"total": 0.017637499000557,
	"count": 1,
	"is_parallel": true,
	"self": 0.017637499000557
	},
	"steps_from_proto": {
	"total": 0.0010856329990929225,
	"count": 1,
	"is_parallel": true,
	"self": 0.00025549399651936255,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.00083013900257356,
	"count": 8,
	"is_parallel": true,
	"self": 0.00083013900257356
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 381.5337507200147,
	"count": 63305,
	"is_parallel": true,
	"self": 10.501863388253696,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 7.007109749909432,
	"count": 63305,
	"is_parallel": true,
	"self": 7.007109749909432
	},
	"communicator.exchange": {
	"total": 332.8179504499112,
	"count": 63305,
	"is_parallel": true,
	"self": 332.8179504499112
	},
	"steps_from_proto": {
	"total": 31.206827131940372,
	"count": 63305,
	"is_parallel": true,
	"self": 6.654570320828498,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 24.552256811111874,
	"count": 506440,
	"is_parallel": true,
	"self": 24.552256811111874
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 275.26556958091896,
	"count": 63306,
	"self": 1.3477594488267641,
	"children": {
	"process_trajectory": {
	"total": 56.49142784509422,
	"count": 63306,
	"self": 56.40052474509321,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09090310000101454,
	"count": 2,
	"self": 0.09090310000101454
	}
	}
	},
	"_update_policy": {
	"total": 217.42638228699798,
	"count": 442,
	"self": 141.62483508419973,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 75.80154720279825,
	"count": 22779,
	"self": 75.80154720279825
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 5.150013748789206e-07,
	"count": 1,
	"self": 5.150013748789206e-07
	},
	"TrainerController._save_models": {
	"total": 0.04092204399967159,
	"count": 1,
	"self": 0.00048346999938075896,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.04043857400029083,
	"count": 1,
	"self": 0.04043857400029083
	}
	}
	}
	}
	}
	}
	}