First Push

ab135a7 verified 3 months ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.0180764198303223,
	"min": 1.9686380624771118,
	"max": 3.29573130607605,
	"count": 500
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 40942.734375,
	"min": 23230.611328125,
	"max": 127156.0390625,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 57.773809523809526,
	"min": 46.25471698113208,
	"max": 999.0,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19412.0,
	"min": 16304.0,
	"max": 24372.0,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1606.7540705210154,
	"min": 1194.1876210015298,
	"max": 1606.7540705210154,
	"count": 483
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 269934.68384753057,
	"min": 2392.4361146861966,
	"max": 320537.73161546723,
	"count": 483
	},
	"SoccerTwos.Step.mean": {
	"value": 4999988.0,
	"min": 9206.0,
	"max": 4999988.0,
	"count": 500
	},
	"SoccerTwos.Step.sum": {
	"value": 4999988.0,
	"min": 9206.0,
	"max": 4999988.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.08221761882305145,
	"min": -0.16408230364322662,
	"max": 0.22671149671077728,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 13.812560081481934,
	"min": -29.04256820678711,
	"max": 28.614913940429688,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.081489697098732,
	"min": -0.16812725365161896,
	"max": 0.22300933301448822,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 13.690268516540527,
	"min": -29.75852394104004,
	"max": 29.2299747467041,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.17836428469135648,
	"min": -0.5160571421895709,
	"max": 0.5442823518725003,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 29.965199828147888,
	"min": -62.956199645996094,
	"max": 55.29199993610382,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.17836428469135648,
	"min": -0.5160571421895709,
	"max": 0.5442823518725003,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 29.965199828147888,
	"min": -62.956199645996094,
	"max": 55.29199993610382,
	"count": 500
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.018076893081888555,
	"min": 0.011601724340289365,
	"max": 0.02478181136199661,
	"count": 238
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.018076893081888555,
	"min": 0.011601724340289365,
	"max": 0.02478181136199661,
	"count": 238
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.09370621119936308,
	"min": 9.677321001314946e-06,
	"max": 0.10801337112983068,
	"count": 238
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.09370621119936308,
	"min": 9.677321001314946e-06,
	"max": 0.10801337112983068,
	"count": 238
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.09552678316831589,
	"min": 9.16501976462314e-06,
	"max": 0.11014168585340182,
	"count": 238
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.09552678316831589,
	"min": 9.16501976462314e-06,
	"max": 0.11014168585340182,
	"count": 238
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 238
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 238
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 238
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 238
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 238
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 238
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1726140025",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/home/ron/anaconda3/envs/rl/bin/mlagents-learn SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.4.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1726143333"
	},
	"total": 3307.778840974999,
	"count": 1,
	"self": 0.16651327399449656,
	"children": {
	"run_training.setup": {
	"total": 0.017641124002693687,
	"count": 1,
	"self": 0.017641124002693687
	},
	"TrainerController.start_learning": {
	"total": 3307.594686577002,
	"count": 1,
	"self": 2.944197011049255,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.430085665993829,
	"count": 25,
	"self": 1.430085665993829
	},
	"TrainerController.advance": {
	"total": 3303.1576436479554,
	"count": 335444,
	"self": 2.829188156807504,
	"children": {
	"env_step": {
	"total": 2603.5166298651347,
	"count": 335444,
	"self": 1883.2772055045607,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 718.1913456719631,
	"count": 335444,
	"self": 21.45619433902175,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 696.7351513329413,
	"count": 635164,
	"self": 696.7351513329413
	}
	}
	},
	"workers": {
	"total": 2.0480786886109854,
	"count": 335444,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3303.6074121928505,
	"count": 335444,
	"is_parallel": true,
	"self": 1771.8287012314358,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0010473849979462102,
	"count": 2,
	"is_parallel": true,
	"self": 0.00022717300089425407,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0008202119970519561,
	"count": 8,
	"is_parallel": true,
	"self": 0.0008202119970519561
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.011166587999468902,
	"count": 1,
	"is_parallel": true,
	"self": 0.00024985900017782114,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00019514900122885592,
	"count": 1,
	"is_parallel": true,
	"self": 0.00019514900122885592
	},
	"communicator.exchange": {
	"total": 0.010036065999884158,
	"count": 1,
	"is_parallel": true,
	"self": 0.010036065999884158
	},
	"steps_from_proto": {
	"total": 0.0006855139981780667,
	"count": 2,
	"is_parallel": true,
	"self": 0.0001331999992544297,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.000552313998923637,
	"count": 8,
	"is_parallel": true,
	"self": 0.000552313998923637
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1531.7615807343973,
	"count": 335443,
	"is_parallel": true,
	"self": 89.4693392949739,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 52.059525609489356,
	"count": 335443,
	"is_parallel": true,
	"self": 52.059525609489356
	},
	"communicator.exchange": {
	"total": 1156.2756498972412,
	"count": 335443,
	"is_parallel": true,
	"self": 1156.2756498972412
	},
	"steps_from_proto": {
	"total": 233.95706593269279,
	"count": 670886,
	"is_parallel": true,
	"self": 43.36958953709109,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 190.5874763956017,
	"count": 2683544,
	"is_parallel": true,
	"self": 190.5874763956017
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.0171302270173328,
	"count": 48,
	"is_parallel": true,
	"self": 0.003224001011403743,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.013906226005929057,
	"count": 192,
	"is_parallel": true,
	"self": 0.013906226005929057
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 696.8118256260132,
	"count": 335444,
	"self": 23.83871245248156,
	"children": {
	"process_trajectory": {
	"total": 295.05417500857584,
	"count": 335444,
	"self": 294.34056990057434,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.7136051080015022,
	"count": 10,
	"self": 0.7136051080015022
	}
	}
	},
	"_update_policy": {
	"total": 377.91893816495576,
	"count": 238,
	"self": 246.29837315572877,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 131.620565009227,
	"count": 7140,
	"self": 131.620565009227
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 4.3200270738452673e-07,
	"count": 1,
	"self": 4.3200270738452673e-07
	},
	"TrainerController._save_models": {
	"total": 0.06275982000079239,
	"count": 1,
	"self": 0.0005887779989279807,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.06217104200186441,
	"count": 1,
	"self": 0.06217104200186441
	}
	}
	}
	}
	}
	}
	}