poca-SoccerTwos / run_logs / timers.json
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.4070029258728027,
"min": 1.364182472229004,
"max": 3.2957570552825928,
"count": 2251
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 27824.890625,
"min": 14507.8642578125,
"max": 105464.2265625,
"count": 2251
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 49.7979797979798,
"min": 40.31147540983606,
"max": 999.0,
"count": 2251
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19720.0,
"min": 13332.0,
"max": 28468.0,
"count": 2251
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1550.0245450575744,
"min": 1190.0487814065316,
"max": 1641.0483088367112,
"count": 2246
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 306904.85992139974,
"min": 2385.9431164520465,
"max": 388701.1363259206,
"count": 2246
},
"SoccerTwos.Step.mean": {
"value": 22509878.0,
"min": 9250.0,
"max": 22509878.0,
"count": 2251
},
"SoccerTwos.Step.sum": {
"value": 22509878.0,
"min": 9250.0,
"max": 22509878.0,
"count": 2251
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.028588376939296722,
"min": -0.14516468346118927,
"max": 0.22160297632217407,
"count": 2251
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 5.66049861907959,
"min": -26.064918518066406,
"max": 33.42010498046875,
"count": 2251
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.02912515588104725,
"min": -0.14482811093330383,
"max": 0.21980521082878113,
"count": 2251
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 5.766780853271484,
"min": -27.210805892944336,
"max": 34.05256652832031,
"count": 2251
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2251
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2251
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.1643575755032626,
"min": -0.6405809518127215,
"max": 0.5064571443058196,
"count": 2251
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 32.542799949645996,
"min": -65.78759974241257,
"max": 66.88839983940125,
"count": 2251
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.1643575755032626,
"min": -0.6405809518127215,
"max": 0.5064571443058196,
"count": 2251
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 32.542799949645996,
"min": -65.78759974241257,
"max": 66.88839983940125,
"count": 2251
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2251
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2251
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01851427239695719,
"min": 0.010531172272749245,
"max": 0.02492763645859668,
"count": 1091
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01851427239695719,
"min": 0.010531172272749245,
"max": 0.02492763645859668,
"count": 1091
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.10829064498345058,
"min": 0.0010078916025425618,
"max": 0.1292997161547343,
"count": 1091
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.10829064498345058,
"min": 0.0010078916025425618,
"max": 0.1292997161547343,
"count": 1091
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.11002712522943815,
"min": 0.0010057883948320523,
"max": 0.13142008284727733,
"count": 1091
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.11002712522943815,
"min": 0.0010057883948320523,
"max": 0.13142008284727733,
"count": 1091
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 1091
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 1091
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 1091
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 1091
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 1091
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 1091
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1675332665",
"python_version": "3.8.16 (default, Jan 17 2023, 23:13:24) \n[GCC 11.2.0]",
"command_line_arguments": "/home/antoine/anaconda3/envs/hf_drl_unit7/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos_1 --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1675364819"
},
"total": 32154.188953462,
"count": 1,
"self": 0.1803494279993174,
"children": {
"run_training.setup": {
"total": 0.00640905700129224,
"count": 1,
"self": 0.00640905700129224
},
"TrainerController.start_learning": {
"total": 32154.002194976998,
"count": 1,
"self": 22.474659589188377,
"children": {
"TrainerController._reset_env": {
"total": 4.29831169298086,
"count": 113,
"self": 4.29831169298086
},
"TrainerController.advance": {
"total": 32127.09101790282,
"count": 1562426,
"self": 20.422603639017325,
"children": {
"env_step": {
"total": 24643.542619113483,
"count": 1562426,
"self": 19942.420775126586,
"children": {
"SubprocessEnvManager._take_step": {
"total": 4686.904853418628,
"count": 1562426,
"self": 111.88414057251794,
"children": {
"TorchPolicy.evaluate": {
"total": 4575.02071284611,
"count": 2828472,
"self": 4575.02071284611
}
}
},
"workers": {
"total": 14.216990568267647,
"count": 1562425,
"self": 0.0,
"children": {
"worker_root": {
"total": 32115.610743571782,
"count": 1562425,
"is_parallel": true,
"self": 14869.433992172224,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0017130690011981642,
"count": 2,
"is_parallel": true,
"self": 0.00035320399911142886,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013598650020867353,
"count": 8,
"is_parallel": true,
"self": 0.0013598650020867353
}
}
},
"UnityEnvironment.step": {
"total": 0.020998721000069054,
"count": 1,
"is_parallel": true,
"self": 0.0009554309981467668,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0006709480003337376,
"count": 1,
"is_parallel": true,
"self": 0.0006709480003337376
},
"communicator.exchange": {
"total": 0.016712819000531454,
"count": 1,
"is_parallel": true,
"self": 0.016712819000531454
},
"steps_from_proto": {
"total": 0.002659523001057096,
"count": 2,
"is_parallel": true,
"self": 0.00043291599831718486,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.002226607002739911,
"count": 8,
"is_parallel": true,
"self": 0.002226607002739911
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 17245.90504891357,
"count": 1562424,
"is_parallel": true,
"self": 1198.7301085013478,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 786.7526528414492,
"count": 1562424,
"is_parallel": true,
"self": 786.7526528414492
},
"communicator.exchange": {
"total": 11804.459724711165,
"count": 1562424,
"is_parallel": true,
"self": 11804.459724711165
},
"steps_from_proto": {
"total": 3455.9625628596077,
"count": 3124848,
"is_parallel": true,
"self": 519.3835088980377,
"children": {
"_process_rank_one_or_two_observation": {
"total": 2936.57905396157,
"count": 12499392,
"is_parallel": true,
"self": 2936.57905396157
}
}
}
}
},
"steps_from_proto": {
"total": 0.27170248599031765,
"count": 224,
"is_parallel": true,
"self": 0.03974755697345245,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.2319549290168652,
"count": 896,
"is_parallel": true,
"self": 0.2319549290168652
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 7463.125795150323,
"count": 1562425,
"self": 156.0927741749765,
"children": {
"process_trajectory": {
"total": 3043.756003937433,
"count": 1562425,
"self": 3037.450239336422,
"children": {
"RLTrainer._checkpoint": {
"total": 6.305764601011106,
"count": 45,
"self": 6.305764601011106
}
}
},
"_update_policy": {
"total": 4263.2770170379135,
"count": 1092,
"self": 2639.284905304594,
"children": {
"TorchPOCAOptimizer.update": {
"total": 1623.9921117333197,
"count": 32763,
"self": 1623.9921117333197
}
}
}
}
}
}
},
"trainer_threads": {
"total": 6.400005077011883e-07,
"count": 1,
"self": 6.400005077011883e-07
},
"TrainerController._save_models": {
"total": 0.1382051520049572,
"count": 1,
"self": 0.0012712670068140142,
"children": {
"RLTrainer._checkpoint": {
"total": 0.13693388499814318,
"count": 1,
"self": 0.13693388499814318
}
}
}
}
}
}
}