candrews1971

50Million

1d4cb64 verified 7 months ago

20.3 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 0.9085261225700378,
	"min": 0.900277316570282,
	"max": 3.29008150100708,
	"count": 3700
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 17501.84765625,
	"min": 14925.09375,
	"max": 105282.609375,
	"count": 3700
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 72.75,
	"min": 50.422680412371136,
	"max": 999.0,
	"count": 3700
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19788.0,
	"min": 7992.0,
	"max": 31936.0,
	"count": 3700
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 3701
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 3701
	},
	"SoccerTwos.Step.mean": {
	"value": 49999990.0,
	"min": 13009988.0,
	"max": 49999990.0,
	"count": 3700
	},
	"SoccerTwos.Step.sum": {
	"value": 49999990.0,
	"min": 13009988.0,
	"max": 49999990.0,
	"count": 3700
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.020666854456067085,
	"min": -0.18262770771980286,
	"max": 0.3022185266017914,
	"count": 3700
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -2.810692310333252,
	"min": -23.04550552368164,
	"max": 30.200801849365234,
	"count": 3700
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.020067332312464714,
	"min": -0.18312671780586243,
	"max": 0.30087995529174805,
	"count": 3700
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -2.7291572093963623,
	"min": -22.754257202148438,
	"max": 30.499494552612305,
	"count": 3700
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 3700
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 3700
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.12077352842863869,
	"min": -0.4557133336861928,
	"max": 0.5597831369882607,
	"count": 3700
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -16.42519986629486,
	"min": -54.68560004234314,
	"max": 46.9363996386528,
	"count": 3700
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.12077352842863869,
	"min": -0.4557133336861928,
	"max": 0.5597831369882607,
	"count": 3700
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -16.42519986629486,
	"min": -54.68560004234314,
	"max": 46.9363996386528,
	"count": 3700
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1762.2704252584133,
	"min": 1199.9971506578554,
	"max": 1807.2337574364283,
	"count": 3697
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 239668.7778351442,
	"min": 2403.487199768784,
	"max": 345797.03797725256,
	"count": 3697
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.015397342308036362,
	"min": 0.011067466323099021,
	"max": 0.03322836385729412,
	"count": 1793
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.015397342308036362,
	"min": 0.011067466323099021,
	"max": 0.03322836385729412,
	"count": 1793
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.12179502000411352,
	"min": 0.0008780070677554856,
	"max": 0.1353025034070015,
	"count": 1793
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.12179502000411352,
	"min": 0.0008780070677554856,
	"max": 0.1353025034070015,
	"count": 1793
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.12190080806612968,
	"min": 0.0010242766661879917,
	"max": 0.13573680569728216,
	"count": 1793
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.12190080806612968,
	"min": 0.0010242766661879917,
	"max": 0.13573680569728216,
	"count": 1793
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 7.555998921999384e-08,
	"min": 7.555998921999384e-08,
	"max": 0.0005176344860522198,
	"count": 1793
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 7.555998921999384e-08,
	"min": 7.555998921999384e-08,
	"max": 0.0005176344860522198,
	"count": 1793
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.10001077999999998,
	"min": 0.10001077999999998,
	"max": 0.17394777999999997,
	"count": 1793
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.10001077999999998,
	"min": 0.10001077999999998,
	"max": 0.17394777999999997,
	"count": 1793
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 1.053792199999996e-05,
	"min": 1.053792199999996e-05,
	"max": 0.0036999942220000016,
	"count": 1793
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 1.053792199999996e-05,
	"min": 1.053792199999996e-05,
	"max": 0.0036999942220000016,
	"count": 1793
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1718202104",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/home/candrews/anaconda3/envs/rl/bin/mlagents-learn results/SoccerTwos/configuration.yaml --run-id=SoccerTwos --resume",
	"mlagents_version": "1.0.0",
	"mlagents_envs_version": "1.0.0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.3.1+cu121",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1718291544"
	},
	"total": 89439.655143559,
	"count": 1,
	"self": 0.12202233797870576,
	"children": {
	"run_training.setup": {
	"total": 0.016299434000757174,
	"count": 1,
	"self": 0.016299434000757174
	},
	"TrainerController.start_learning": {
	"total": 89439.51682178701,
	"count": 1,
	"self": 48.225265316374134,
	"children": {
	"TrainerController._reset_env": {
	"total": 5.392195741071191,
	"count": 186,
	"self": 5.392195741071191
	},
	"TrainerController.advance": {
	"total": 89385.65861405357,
	"count": 2504281,
	"self": 43.67091076684301,
	"children": {
	"env_step": {
	"total": 72551.5218888928,
	"count": 2504281,
	"self": 48862.6198433862,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 23658.219093947908,
	"count": 2504281,
	"self": 324.338922350933,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 23333.880171596975,
	"count": 4648782,
	"self": 23333.880171596975
	}
	}
	},
	"workers": {
	"total": 30.682951558695095,
	"count": 2504281,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 89322.32348160779,
	"count": 2504281,
	"is_parallel": true,
	"self": 45938.6905439756,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002996798999447492,
	"count": 2,
	"is_parallel": true,
	"self": 0.0012141010010964237,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0017826979983510682,
	"count": 8,
	"is_parallel": true,
	"self": 0.0017826979983510682
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.03301058000033663,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005553990004045772,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00037568999960058136,
	"count": 1,
	"is_parallel": true,
	"self": 0.00037568999960058136
	},
	"communicator.exchange": {
	"total": 0.030290142000012565,
	"count": 1,
	"is_parallel": true,
	"self": 0.030290142000012565
	},
	"steps_from_proto": {
	"total": 0.0017893490003189072,
	"count": 2,
	"is_parallel": true,
	"self": 0.00037193900061538443,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014174099997035228,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014174099997035228
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.3447280409091036,
	"count": 370,
	"is_parallel": true,
	"self": 0.06514130008235952,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.27958674082674406,
	"count": 1480,
	"is_parallel": true,
	"self": 0.27958674082674406
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 43383.28820959128,
	"count": 2504280,
	"is_parallel": true,
	"self": 1448.4682002114132,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 932.0408725699708,
	"count": 2504280,
	"is_parallel": true,
	"self": 932.0408725699708
	},
	"communicator.exchange": {
	"total": 36480.94365370879,
	"count": 2504280,
	"is_parallel": true,
	"self": 36480.94365370879
	},
	"steps_from_proto": {
	"total": 4521.83548310111,
	"count": 5008560,
	"is_parallel": true,
	"self": 864.9375246691716,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 3656.8979584319386,
	"count": 20034240,
	"is_parallel": true,
	"self": 3656.8979584319386
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 16790.465814393916,
	"count": 2504281,
	"self": 389.440108310886,
	"children": {
	"process_trajectory": {
	"total": 8186.032770570991,
	"count": 2504281,
	"self": 8163.696337590989,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 22.33643298000152,
	"count": 75,
	"self": 22.33643298000152
	}
	}
	},
	"_update_policy": {
	"total": 8214.99293551204,
	"count": 1793,
	"self": 5104.453318782099,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 3110.5396167299414,
	"count": 53796,
	"self": 3110.5396167299414
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 7.199996616691351e-07,
	"count": 1,
	"self": 7.199996616691351e-07
	},
	"TrainerController._save_models": {
	"total": 0.24074595600541215,
	"count": 1,
	"self": 0.0033287870028289035,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.23741716900258325,
	"count": 1,
	"self": 0.23741716900258325
	}
	}
	}
	}
	}
	}
	}