{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.9531906843185425,
"min": 1.9333367347717285,
"max": 3.2957451343536377,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 42313.921875,
"min": 20685.5234375,
"max": 110978.8046875,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 57.89411764705882,
"min": 45.570093457943926,
"max": 999.0,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19684.0,
"min": 9304.0,
"max": 31968.0,
"count": 500
},
"SoccerTwos.Step.mean": {
"value": 4999918.0,
"min": 9000.0,
"max": 4999918.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 4999918.0,
"min": 9000.0,
"max": 4999918.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.06822053343057632,
"min": -0.13340337574481964,
"max": 0.17353291809558868,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 11.597490310668945,
"min": -22.678573608398438,
"max": 27.418201446533203,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.06983315944671631,
"min": -0.12757983803749084,
"max": 0.16391581296920776,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 11.871637344360352,
"min": -21.68857192993164,
"max": 25.898698806762695,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.09850823598749497,
"min": -0.5384615384615384,
"max": 0.487155556678772,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 16.746400117874146,
"min": -65.81360006332397,
"max": 48.89580023288727,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.09850823598749497,
"min": -0.5384615384615384,
"max": 0.487155556678772,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 16.746400117874146,
"min": -65.81360006332397,
"max": 48.89580023288727,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1516.2468810022674,
"min": 1192.28374816736,
"max": 1522.8103071340324,
"count": 414
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 257761.96977038548,
"min": 2385.845780844732,
"max": 310656.77838486026,
"count": 414
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.014279249346388193,
"min": 0.01140843817035299,
"max": 0.025414117853021403,
"count": 237
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.014279249346388193,
"min": 0.01140843817035299,
"max": 0.025414117853021403,
"count": 237
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.08459945817788442,
"min": 3.708402582939622e-07,
"max": 0.1083966962993145,
"count": 237
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.08459945817788442,
"min": 3.708402582939622e-07,
"max": 0.1083966962993145,
"count": 237
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.0862138512233893,
"min": 5.9369759431623e-07,
"max": 0.11099762643376986,
"count": 237
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.0862138512233893,
"min": 5.9369759431623e-07,
"max": 0.11099762643376986,
"count": 237
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 237
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 237
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 237
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 237
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 237
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 237
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1675613821",
"python_version": "3.9.16 (main, Jan 11 2023, 16:16:36) [MSC v.1916 64 bit (AMD64)]",
"command_line_arguments": "C:\\Users\\Francisco\\anaconda3\\envs\\rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.13.1+cpu",
"numpy_version": "1.21.2",
"end_time_seconds": "1675632219"
},
"total": 18398.338030699997,
"count": 1,
"self": 0.44735779999609804,
"children": {
"run_training.setup": {
"total": 0.12766220000000006,
"count": 1,
"self": 0.12766220000000006
},
"TrainerController.start_learning": {
"total": 18397.7630107,
"count": 1,
"self": 10.556686000109039,
"children": {
"TrainerController._reset_env": {
"total": 6.009154099999812,
"count": 25,
"self": 6.009154099999812
},
"TrainerController.advance": {
"total": 18381.032313799893,
"count": 336211,
"self": 10.097430798919959,
"children": {
"env_step": {
"total": 7878.255441100767,
"count": 336211,
"self": 6209.0573362012565,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1662.1884631005626,
"count": 336211,
"self": 60.01698679983224,
"children": {
"TorchPolicy.evaluate": {
"total": 1602.1714763007303,
"count": 635166,
"self": 1602.1714763007303
}
}
},
"workers": {
"total": 7.009641798948309,
"count": 336211,
"self": 0.0,
"children": {
"worker_root": {
"total": 18377.433205799953,
"count": 336211,
"is_parallel": true,
"self": 13398.232135199562,
"children": {
"steps_from_proto": {
"total": 0.05499650000088252,
"count": 50,
"is_parallel": true,
"self": 0.012067300012920334,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.042929199987962186,
"count": 200,
"is_parallel": true,
"self": 0.042929199987962186
}
}
},
"UnityEnvironment.step": {
"total": 4979.14607410039,
"count": 336211,
"is_parallel": true,
"self": 240.76061850083715,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 205.50819700051986,
"count": 336211,
"is_parallel": true,
"self": 205.50819700051986
},
"communicator.exchange": {
"total": 3728.012818700003,
"count": 336211,
"is_parallel": true,
"self": 3728.012818700003
},
"steps_from_proto": {
"total": 804.86443989903,
"count": 672422,
"is_parallel": true,
"self": 168.9518741989816,
"children": {
"_process_rank_one_or_two_observation": {
"total": 635.9125657000484,
"count": 2689688,
"is_parallel": true,
"self": 635.9125657000484
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 10492.679441900207,
"count": 336211,
"self": 76.79321610071383,
"children": {
"process_trajectory": {
"total": 1569.9522774994998,
"count": 336211,
"self": 1568.0727003995046,
"children": {
"RLTrainer._checkpoint": {
"total": 1.879577099995231,
"count": 10,
"self": 1.879577099995231
}
}
},
"_update_policy": {
"total": 8845.933948299993,
"count": 237,
"self": 920.2543032999702,
"children": {
"TorchPOCAOptimizer.update": {
"total": 7925.679645000023,
"count": 7110,
"self": 7925.679645000023
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.6999983927235007e-06,
"count": 1,
"self": 1.6999983927235007e-06
},
"TrainerController._save_models": {
"total": 0.1648550999998406,
"count": 1,
"self": 0.0038491999985126313,
"children": {
"RLTrainer._checkpoint": {
"total": 0.16100590000132797,
"count": 1,
"self": 0.16100590000132797
}
}
}
}
}
}
}