{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.354724258184433,
"min": 0.354724258184433,
"max": 1.4311972856521606,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 10607.673828125,
"min": 10607.673828125,
"max": 43416.80078125,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989909.0,
"min": 29942.0,
"max": 989909.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989909.0,
"min": 29942.0,
"max": 989909.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.3551175892353058,
"min": -0.1156456395983696,
"max": 0.4024066925048828,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 92.33057403564453,
"min": -27.754953384399414,
"max": 105.43054962158203,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.030001625418663025,
"min": 0.013187402859330177,
"max": 0.357007771730423,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 7.800422668457031,
"min": 3.4814743995666504,
"max": 84.61083984375,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06602441271598865,
"min": 0.06491788623717208,
"max": 0.07224542644852275,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9903661907398297,
"min": 0.5057179851396593,
"max": 1.038277832228535,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.013510492222849278,
"min": 0.0002837238385301293,
"max": 0.016081601046261357,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.20265738334273917,
"min": 0.003688409900891681,
"max": 0.225142414647659,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.596837467753329e-06,
"min": 7.596837467753329e-06,
"max": 0.0002952333444460286,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00011395256201629994,
"min": 0.00011395256201629994,
"max": 0.0036082053972648995,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10253224666666667,
"min": 0.10253224666666667,
"max": 0.19841111428571429,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.5379837,
"min": 1.3888778,
"max": 2.5277187,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0002629714419999999,
"min": 0.0002629714419999999,
"max": 0.009841270317142856,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003944571629999998,
"min": 0.003944571629999998,
"max": 0.12028323649000001,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.017204105854034424,
"min": 0.017204105854034424,
"max": 0.5529566407203674,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.25806158781051636,
"min": 0.24432560801506042,
"max": 3.870696544647217,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 510.1694915254237,
"min": 434.72463768115944,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30100.0,
"min": 16613.0,
"max": 32937.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.1887699672331413,
"min": -0.9999097292461703,
"max": 1.4830738237270942,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 71.32619803398848,
"min": -31.99640165269375,
"max": 96.39979854226112,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.1887699672331413,
"min": -0.9999097292461703,
"max": 1.4830738237270942,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 71.32619803398848,
"min": -31.99640165269375,
"max": 96.39979854226112,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.09074038836988621,
"min": 0.0801951661689099,
"max": 10.70980906661819,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 5.444423302193172,
"min": 5.183203927415889,
"max": 182.06675413250923,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1673452018",
"python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.6",
"end_time_seconds": "1673454411"
},
"total": 2393.1668312819997,
"count": 1,
"self": 0.47755716700021367,
"children": {
"run_training.setup": {
"total": 0.11762555299992528,
"count": 1,
"self": 0.11762555299992528
},
"TrainerController.start_learning": {
"total": 2392.5716485619996,
"count": 1,
"self": 1.5854257429091376,
"children": {
"TrainerController._reset_env": {
"total": 6.8362330350000775,
"count": 1,
"self": 6.8362330350000775
},
"TrainerController.advance": {
"total": 2384.0418137450906,
"count": 63621,
"self": 1.616192863044489,
"children": {
"env_step": {
"total": 1661.473924934033,
"count": 63621,
"self": 1538.4197854910983,
"children": {
"SubprocessEnvManager._take_step": {
"total": 122.06969735695066,
"count": 63621,
"self": 5.009102428891538,
"children": {
"TorchPolicy.evaluate": {
"total": 117.06059492805912,
"count": 62564,
"self": 39.53905387709028,
"children": {
"TorchPolicy.sample_actions": {
"total": 77.52154105096884,
"count": 62564,
"self": 77.52154105096884
}
}
}
}
},
"workers": {
"total": 0.9844420859840284,
"count": 63621,
"self": 0.0,
"children": {
"worker_root": {
"total": 2387.6302787020186,
"count": 63621,
"is_parallel": true,
"self": 969.392527242966,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.002011108000033346,
"count": 1,
"is_parallel": true,
"self": 0.0007641249999323918,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001246983000100954,
"count": 8,
"is_parallel": true,
"self": 0.001246983000100954
}
}
},
"UnityEnvironment.step": {
"total": 0.05306404899988593,
"count": 1,
"is_parallel": true,
"self": 0.0006155969999781519,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004808159999356576,
"count": 1,
"is_parallel": true,
"self": 0.0004808159999356576
},
"communicator.exchange": {
"total": 0.0501046409999617,
"count": 1,
"is_parallel": true,
"self": 0.0501046409999617
},
"steps_from_proto": {
"total": 0.0018629950000104145,
"count": 1,
"is_parallel": true,
"self": 0.0004884800002855627,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013745149997248518,
"count": 8,
"is_parallel": true,
"self": 0.0013745149997248518
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1418.2377514590526,
"count": 63620,
"is_parallel": true,
"self": 31.6984673098882,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 27.314615026037245,
"count": 63620,
"is_parallel": true,
"self": 27.314615026037245
},
"communicator.exchange": {
"total": 1247.6935183621076,
"count": 63620,
"is_parallel": true,
"self": 1247.6935183621076
},
"steps_from_proto": {
"total": 111.53115076101949,
"count": 63620,
"is_parallel": true,
"self": 26.628848834943028,
"children": {
"_process_rank_one_or_two_observation": {
"total": 84.90230192607646,
"count": 508960,
"is_parallel": true,
"self": 84.90230192607646
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 720.9516959480134,
"count": 63621,
"self": 2.9347500919830054,
"children": {
"process_trajectory": {
"total": 164.10474770702876,
"count": 63621,
"self": 163.83715446802898,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2675932389997797,
"count": 2,
"self": 0.2675932389997797
}
}
},
"_update_policy": {
"total": 553.9121981490016,
"count": 457,
"self": 216.4857368529856,
"children": {
"TorchPPOOptimizer.update": {
"total": 337.426461296016,
"count": 22833,
"self": 337.426461296016
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.436999809811823e-06,
"count": 1,
"self": 1.436999809811823e-06
},
"TrainerController._save_models": {
"total": 0.10817460199996276,
"count": 1,
"self": 0.0016312939997078502,
"children": {
"RLTrainer._checkpoint": {
"total": 0.10654330800025491,
"count": 1,
"self": 0.10654330800025491
}
}
}
}
}
}
}