Genis

First Commit

766d45f over 1 year ago

20.3 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.6801722049713135,
	"min": 1.6689929962158203,
	"max": 3.295753240585327,
	"count": 522
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 31345.29296875,
	"min": 16059.88671875,
	"max": 117480.875,
	"count": 522
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 47.85436893203884,
	"min": 37.19402985074627,
	"max": 999.0,
	"count": 522
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19716.0,
	"min": 12776.0,
	"max": 28128.0,
	"count": 522
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1512.3841506926258,
	"min": 1182.721040420331,
	"max": 1520.1387888025301,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 311551.1350426809,
	"min": 2365.575166765614,
	"max": 402909.03120493336,
	"count": 500
	},
	"SoccerTwos.Step.mean": {
	"value": 5219984.0,
	"min": 9082.0,
	"max": 5219984.0,
	"count": 522
	},
	"SoccerTwos.Step.sum": {
	"value": 5219984.0,
	"min": 9082.0,
	"max": 5219984.0,
	"count": 522
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.017524413764476776,
	"min": -0.12234243750572205,
	"max": 0.30277761816978455,
	"count": 522
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -3.5925049781799316,
	"min": -24.590829849243164,
	"max": 32.93498611450195,
	"count": 522
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.01664070226252079,
	"min": -0.12715943157672882,
	"max": 0.2870791554450989,
	"count": 522
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -3.411344051361084,
	"min": -25.559045791625977,
	"max": 31.987327575683594,
	"count": 522
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 522
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 522
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.1805639040179369,
	"min": -0.5964551711904591,
	"max": 0.48996875062584877,
	"count": 522
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -37.01560032367706,
	"min": -56.88379991054535,
	"max": 51.32639992237091,
	"count": 522
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.1805639040179369,
	"min": -0.5964551711904591,
	"max": 0.48996875062584877,
	"count": 522
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -37.01560032367706,
	"min": -56.88379991054535,
	"max": 51.32639992237091,
	"count": 522
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 522
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 522
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.016975674087492128,
	"min": 0.011308841101708822,
	"max": 0.024441575802241763,
	"count": 250
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.016975674087492128,
	"min": 0.011308841101708822,
	"max": 0.024441575802241763,
	"count": 250
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.09598184923330942,
	"min": 1.3440602704880196e-06,
	"max": 0.10366184016068776,
	"count": 250
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.09598184923330942,
	"min": 1.3440602704880196e-06,
	"max": 0.10366184016068776,
	"count": 250
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.09921732048193614,
	"min": 4.471496655848265e-06,
	"max": 0.10685077408949534,
	"count": 250
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.09921732048193614,
	"min": 4.471496655848265e-06,
	"max": 0.10685077408949534,
	"count": 250
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0005000000000000001,
	"min": 0.0005000000000000001,
	"max": 0.0005000000000000001,
	"count": 250
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0005000000000000001,
	"min": 0.0005000000000000001,
	"max": 0.0005000000000000001,
	"count": 250
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 250
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 250
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 250
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 250
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1692717082",
	"python_version": "3.9.17 (main, Jul 5 2023, 20:41:20) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/genis/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1692734710"
	},
	"total": 17627.666772411998,
	"count": 1,
	"self": 0.09028954200039152,
	"children": {
	"run_training.setup": {
	"total": 0.008287695000035455,
	"count": 1,
	"self": 0.008287695000035455
	},
	"TrainerController.start_learning": {
	"total": 17627.568195174998,
	"count": 1,
	"self": 7.836454700638569,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.0494618500052866,
	"count": 21,
	"self": 2.0494618500052866
	},
	"TrainerController.advance": {
	"total": 17617.451557357355,
	"count": 355657,
	"self": 7.943129163682897,
	"children": {
	"env_step": {
	"total": 5259.7881734208,
	"count": 355657,
	"self": 4268.029192443379,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 987.002381628069,
	"count": 355657,
	"self": 38.885623749441834,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 948.1167578786271,
	"count": 659920,
	"self": 948.1167578786271
	}
	}
	},
	"workers": {
	"total": 4.756599349352882,
	"count": 355656,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 17616.246501720587,
	"count": 355656,
	"is_parallel": true,
	"self": 14199.876406307758,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002839553000058004,
	"count": 2,
	"is_parallel": true,
	"self": 0.0013376410003047567,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001501911999753247,
	"count": 8,
	"is_parallel": true,
	"self": 0.001501911999753247
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.019501769000044078,
	"count": 1,
	"is_parallel": true,
	"self": 0.00047463800001423806,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00035923199993703747,
	"count": 1,
	"is_parallel": true,
	"self": 0.00035923199993703747
	},
	"communicator.exchange": {
	"total": 0.017162689000087994,
	"count": 1,
	"is_parallel": true,
	"self": 0.017162689000087994
	},
	"steps_from_proto": {
	"total": 0.0015052100000048085,
	"count": 2,
	"is_parallel": true,
	"self": 0.00028915600000800623,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012160539999968023,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012160539999968023
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 3416.3324846668224,
	"count": 355655,
	"is_parallel": true,
	"self": 192.92021787136537,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 129.56033859774914,
	"count": 355655,
	"is_parallel": true,
	"self": 129.56033859774914
	},
	"communicator.exchange": {
	"total": 2474.453554164158,
	"count": 355655,
	"is_parallel": true,
	"self": 2474.453554164158
	},
	"steps_from_proto": {
	"total": 619.3983740335495,
	"count": 711310,
	"is_parallel": true,
	"self": 122.86005064013443,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 496.5383233934151,
	"count": 2845240,
	"is_parallel": true,
	"self": 496.5383233934151
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.03761074600720349,
	"count": 40,
	"is_parallel": true,
	"self": 0.0073545120210383175,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.03025623398616517,
	"count": 160,
	"is_parallel": true,
	"self": 0.03025623398616517
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 12349.720254772872,
	"count": 355656,
	"self": 53.74877238922272,
	"children": {
	"process_trajectory": {
	"total": 1201.6411975316382,
	"count": 355656,
	"self": 1198.943791865635,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.6974056660033057,
	"count": 10,
	"self": 2.6974056660033057
	}
	}
	},
	"_update_policy": {
	"total": 11094.33028485201,
	"count": 251,
	"self": 778.9787935760087,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 10315.351491276002,
	"count": 7530,
	"self": 10315.351491276002
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0909971024375409e-06,
	"count": 1,
	"self": 1.0909971024375409e-06
	},
	"TrainerController._save_models": {
	"total": 0.23072017600134131,
	"count": 1,
	"self": 0.0015350430003309157,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2291851330010104,
	"count": 1,
	"self": 0.2291851330010104
	}
	}
	}
	}
	}
	}
	}