Training 1

6cad639 over 1 year ago

No virus

19.2 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.4205172061920166,
	"min": 0.4205172061920166,
	"max": 1.178979754447937,
	"count": 31
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 12689.52734375,
	"min": 12689.52734375,
	"max": 34186.8125,
	"count": 31
	},
	"Pyramids.Step.mean": {
	"value": 989915.0,
	"min": 89998.0,
	"max": 989915.0,
	"count": 31
	},
	"Pyramids.Step.sum": {
	"value": 989915.0,
	"min": 89998.0,
	"max": 989915.0,
	"count": 31
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.578375518321991,
	"min": -0.09325366467237473,
	"max": 0.6088351607322693,
	"count": 31
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 160.21002197265625,
	"min": -22.38088035583496,
	"max": 171.08267211914062,
	"count": 31
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.15920183062553406,
	"min": -0.15920183062553406,
	"max": 0.12669534981250763,
	"count": 31
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -44.098907470703125,
	"min": -44.098907470703125,
	"max": 25.567962646484375,
	"count": 31
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06781885955909578,
	"min": 0.06377447864118342,
	"max": 0.07362295601892078,
	"count": 31
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 1.0172828933864366,
	"min": 0.14013763737845392,
	"max": 1.1043443402838118,
	"count": 31
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.020172474435659955,
	"min": 0.0003241572943200784,
	"max": 0.020172474435659955,
	"count": 31
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.30258711653489934,
	"min": 0.0006483145886401568,
	"max": 0.30258711653489934,
	"count": 31
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.5422774859400034e-06,
	"min": 7.5422774859400034e-06,
	"max": 0.00027422940859020005,
	"count": 31
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00011313416228910005,
	"min": 0.00011313416228910005,
	"max": 0.0031372469542511002,
	"count": 31
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10251405999999999,
	"min": 0.10251405999999999,
	"max": 0.19140980000000005,
	"count": 31
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.5377108999999998,
	"min": 0.3828196000000001,
	"max": 2.4437612,
	"count": 31
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002611545940000001,
	"min": 0.0002611545940000001,
	"max": 0.00914183902,
	"count": 31
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003917318910000002,
	"min": 0.003917318910000002,
	"max": 0.10460031511,
	"count": 31
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.008740575052797794,
	"min": 0.008740575052797794,
	"max": 0.09000152349472046,
	"count": 31
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.1311086267232895,
	"min": 0.12701763212680817,
	"max": 0.6430901288986206,
	"count": 31
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 31
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 31
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 326.6923076923077,
	"min": 312.42105263157896,
	"max": 999.0,
	"count": 30
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29729.0,
	"min": 25036.0,
	"max": 33299.0,
	"count": 30
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.6293362414280137,
	"min": -0.9999806977087452,
	"max": 1.6875789339605132,
	"count": 30
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 148.26959796994925,
	"min": -30.9994016289711,
	"max": 160.31999872624874,
	"count": 30
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.6293362414280137,
	"min": -0.9999806977087452,
	"max": 1.6875789339605132,
	"count": 30
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 148.26959796994925,
	"min": -30.9994016289711,
	"max": 160.31999872624874,
	"count": 30
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.02928505246373978,
	"min": 0.02928505246373978,
	"max": 0.7404885896591141,
	"count": 30
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.6649397742003202,
	"min": 2.6649397742003202,
	"max": 25.17661204840988,
	"count": 30
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1677351631",
	"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume",
	"mlagents_version": "0.29.0.dev0",
	"mlagents_envs_version": "0.29.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.22.4",
	"end_time_seconds": "1677353799"
	},
	"total": 2168.03837705,
	"count": 1,
	"self": 0.5264525419997881,
	"children": {
	"run_training.setup": {
	"total": 0.11523128399994675,
	"count": 1,
	"self": 0.11523128399994675
	},
	"TrainerController.start_learning": {
	"total": 2167.396693224,
	"count": 1,
	"self": 1.281207674162033,
	"children": {
	"TrainerController._reset_env": {
	"total": 7.431841023999823,
	"count": 1,
	"self": 7.431841023999823
	},
	"TrainerController.advance": {
	"total": 2158.5916747428387,
	"count": 58930,
	"self": 1.4100693748250706,
	"children": {
	"env_step": {
	"total": 1451.608715427868,
	"count": 58930,
	"self": 1345.1334192078716,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 105.7063820859039,
	"count": 58930,
	"self": 4.455333714709013,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 101.25104837119488,
	"count": 57563,
	"self": 34.654481669223514,
	"children": {
	"TorchPolicy.sample_actions": {
	"total": 66.59656670197137,
	"count": 57563,
	"self": 66.59656670197137
	}
	}
	}
	}
	},
	"workers": {
	"total": 0.7689141340924834,
	"count": 58930,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2162.7388273921424,
	"count": 58930,
	"is_parallel": true,
	"self": 925.3624172811874,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0027587790000325185,
	"count": 1,
	"is_parallel": true,
	"self": 0.0009597249995749735,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001799054000457545,
	"count": 8,
	"is_parallel": true,
	"self": 0.001799054000457545
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.048602867999761656,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005728439996346424,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005117810001138423,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005117810001138423
	},
	"communicator.exchange": {
	"total": 0.045841995000046154,
	"count": 1,
	"is_parallel": true,
	"self": 0.045841995000046154
	},
	"steps_from_proto": {
	"total": 0.0016762479999670177,
	"count": 1,
	"is_parallel": true,
	"self": 0.00043473300047480734,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012415149994922103,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012415149994922103
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1237.376410110955,
	"count": 58929,
	"is_parallel": true,
	"self": 29.76034144775622,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 22.040904430164574,
	"count": 58929,
	"is_parallel": true,
	"self": 22.040904430164574
	},
	"communicator.exchange": {
	"total": 1098.0368322140225,
	"count": 58929,
	"is_parallel": true,
	"self": 1098.0368322140225
	},
	"steps_from_proto": {
	"total": 87.5383320190117,
	"count": 58929,
	"is_parallel": true,
	"self": 20.82721406836481,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 66.7111179506469,
	"count": 471432,
	"is_parallel": true,
	"self": 66.7111179506469
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 705.5728899401456,
	"count": 58930,
	"self": 2.4748141240802397,
	"children": {
	"process_trajectory": {
	"total": 157.126547701062,
	"count": 58930,
	"self": 156.86858836006286,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2579593409991503,
	"count": 2,
	"self": 0.2579593409991503
	}
	}
	},
	"_update_policy": {
	"total": 545.9715281150034,
	"count": 421,
	"self": 212.2055353260048,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 333.7659927889986,
	"count": 20955,
	"self": 333.7659927889986
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0199992175330408e-06,
	"count": 1,
	"self": 1.0199992175330408e-06
	},
	"TrainerController._save_models": {
	"total": 0.09196876300029544,
	"count": 1,
	"self": 0.0019856570006595575,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08998310599963588,
	"count": 1,
	"self": 0.08998310599963588
	}
	}
	}
	}
	}
	}
	}