{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.2071920931339264,
"min": 0.201755091547966,
"max": 1.4341418743133545,
"count": 66
},
"Pyramids.Policy.Entropy.sum": {
"value": 6232.33837890625,
"min": 6030.05615234375,
"max": 43506.12890625,
"count": 66
},
"Pyramids.Step.mean": {
"value": 1979889.0,
"min": 29952.0,
"max": 1979889.0,
"count": 66
},
"Pyramids.Step.sum": {
"value": 1979889.0,
"min": 29952.0,
"max": 1979889.0,
"count": 66
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.8243393301963806,
"min": -0.09622462093830109,
"max": 0.9279937148094177,
"count": 66
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 248.9504852294922,
"min": -23.190134048461914,
"max": 290.4620361328125,
"count": 66
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.011662246659398079,
"min": -0.07439544796943665,
"max": 0.31239381432533264,
"count": 66
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 3.521998405456543,
"min": -21.42588996887207,
"max": 75.28691101074219,
"count": 66
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06858035875068577,
"min": 0.06510530802738725,
"max": 0.07328678109514018,
"count": 66
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9601250225096009,
"min": 0.5068921602656262,
"max": 1.0789347016446604,
"count": 66
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.016518163341624176,
"min": 0.000323967105224438,
"max": 0.017910530448879643,
"count": 66
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.23125428678273846,
"min": 0.002915703947019942,
"max": 0.250747426284315,
"count": 66
},
"Pyramids.Policy.LearningRate.mean": {
"value": 5.334291079078573e-06,
"min": 5.334291079078573e-06,
"max": 0.0002975753150939428,
"count": 66
},
"Pyramids.Policy.LearningRate.sum": {
"value": 7.468007510710002e-05,
"min": 7.468007510710002e-05,
"max": 0.0037903268865577496,
"count": 66
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.1017780642857143,
"min": 0.1017780642857143,
"max": 0.19919177142857142,
"count": 66
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4248929000000001,
"min": 1.3943424,
"max": 2.6634422500000006,
"count": 66
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00018762862214285718,
"min": 0.00018762862214285718,
"max": 0.009919257965714285,
"count": 66
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0026268007100000005,
"min": 0.0026268007100000005,
"max": 0.12635788077500001,
"count": 66
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.008229024708271027,
"min": 0.007826493121683598,
"max": 0.4388757348060608,
"count": 66
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.11520634591579437,
"min": 0.10957090556621552,
"max": 3.0721302032470703,
"count": 66
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 220.4962962962963,
"min": 203.6993006993007,
"max": 999.0,
"count": 66
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29767.0,
"min": 15984.0,
"max": 33082.0,
"count": 66
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7795036924106102,
"min": -1.0000000521540642,
"max": 1.7966783059226883,
"count": 66
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 240.2329984754324,
"min": -31.998801663517952,
"max": 267.112998560071,
"count": 66
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7795036924106102,
"min": -1.0000000521540642,
"max": 1.7966783059226883,
"count": 66
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 240.2329984754324,
"min": -31.998801663517952,
"max": 267.112998560071,
"count": 66
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.01889126900124312,
"min": 0.01764048443792935,
"max": 9.110685833729804,
"count": 66
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.550321315167821,
"min": 2.4585653777612606,
"max": 145.77097333967686,
"count": 66
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 66
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 66
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1673620315",
"python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.6",
"end_time_seconds": "1673624710"
},
"total": 4395.093876395001,
"count": 1,
"self": 0.4241593910010124,
"children": {
"run_training.setup": {
"total": 0.11400399699999753,
"count": 1,
"self": 0.11400399699999753
},
"TrainerController.start_learning": {
"total": 4394.555713007,
"count": 1,
"self": 2.4842224960120802,
"children": {
"TrainerController._reset_env": {
"total": 9.521725463999985,
"count": 1,
"self": 9.521725463999985
},
"TrainerController.advance": {
"total": 4382.457732749988,
"count": 129598,
"self": 2.6425799711014406,
"children": {
"env_step": {
"total": 3061.4848862749936,
"count": 129598,
"self": 2858.441981782051,
"children": {
"SubprocessEnvManager._take_step": {
"total": 201.47308610696194,
"count": 129598,
"self": 8.28559791601623,
"children": {
"TorchPolicy.evaluate": {
"total": 193.18748819094571,
"count": 125056,
"self": 65.43051573290359,
"children": {
"TorchPolicy.sample_actions": {
"total": 127.75697245804213,
"count": 125056,
"self": 127.75697245804213
}
}
}
}
},
"workers": {
"total": 1.5698183859809092,
"count": 129598,
"self": 0.0,
"children": {
"worker_root": {
"total": 4386.382064792113,
"count": 129598,
"is_parallel": true,
"self": 1720.7778098162344,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.005104625999990731,
"count": 1,
"is_parallel": true,
"self": 0.0029805739999915204,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0021240519999992102,
"count": 8,
"is_parallel": true,
"self": 0.0021240519999992102
}
}
},
"UnityEnvironment.step": {
"total": 0.043102734999990844,
"count": 1,
"is_parallel": true,
"self": 0.0004890889999842329,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004396570000153588,
"count": 1,
"is_parallel": true,
"self": 0.0004396570000153588
},
"communicator.exchange": {
"total": 0.04056606300002841,
"count": 1,
"is_parallel": true,
"self": 0.04056606300002841
},
"steps_from_proto": {
"total": 0.0016079259999628448,
"count": 1,
"is_parallel": true,
"self": 0.00040968699994436975,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001198239000018475,
"count": 8,
"is_parallel": true,
"self": 0.001198239000018475
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 2665.6042549758786,
"count": 129597,
"is_parallel": true,
"self": 55.36691782582648,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 42.91561223704417,
"count": 129597,
"is_parallel": true,
"self": 42.91561223704417
},
"communicator.exchange": {
"total": 2367.501065414963,
"count": 129597,
"is_parallel": true,
"self": 2367.501065414963
},
"steps_from_proto": {
"total": 199.82065949804507,
"count": 129597,
"is_parallel": true,
"self": 43.54814323008969,
"children": {
"_process_rank_one_or_two_observation": {
"total": 156.27251626795538,
"count": 1036776,
"is_parallel": true,
"self": 156.27251626795538
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1318.3302665038937,
"count": 129598,
"self": 4.844167717961227,
"children": {
"process_trajectory": {
"total": 292.83526258293523,
"count": 129598,
"self": 292.46484278993603,
"children": {
"RLTrainer._checkpoint": {
"total": 0.3704197929992006,
"count": 4,
"self": 0.3704197929992006
}
}
},
"_update_policy": {
"total": 1020.6508362029972,
"count": 917,
"self": 392.9678273220085,
"children": {
"TorchPPOOptimizer.update": {
"total": 627.6830088809887,
"count": 45675,
"self": 627.6830088809887
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.609995347796939e-07,
"count": 1,
"self": 8.609995347796939e-07
},
"TrainerController._save_models": {
"total": 0.09203143600007024,
"count": 1,
"self": 0.0015091730001586257,
"children": {
"RLTrainer._checkpoint": {
"total": 0.09052226299991162,
"count": 1,
"self": 0.09052226299991162
}
}
}
}
}
}
}