First Commit

ec95d7b over 1 year ago

20.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.15842604637146,
	"min": 3.1336007118225098,
	"max": 3.2957088947296143,
	"count": 50
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 67312.375,
	"min": 45246.9375,
	"max": 132625.390625,
	"count": 50
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 884.3333333333334,
	"min": 236.71428571428572,
	"max": 999.0,
	"count": 50
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 21224.0,
	"min": 6628.0,
	"max": 30148.0,
	"count": 50
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1215.659811500077,
	"min": 1200.2435735709535,
	"max": 1215.659811500077,
	"count": 48
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 4862.639246000308,
	"min": 2400.487147141907,
	"max": 19407.802034341934,
	"count": 48
	},
	"SoccerTwos.Step.mean": {
	"value": 499660.0,
	"min": 9770.0,
	"max": 499660.0,
	"count": 50
	},
	"SoccerTwos.Step.sum": {
	"value": 499660.0,
	"min": 9770.0,
	"max": 499660.0,
	"count": 50
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.01406072173267603,
	"min": -0.04412545636296272,
	"max": 0.008145976811647415,
	"count": 50
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.16872866451740265,
	"min": -0.7728478908538818,
	"max": 0.14344337582588196,
	"count": 50
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.012719911523163319,
	"min": -0.044171370565891266,
	"max": 0.009948012419044971,
	"count": 50
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.15263894200325012,
	"min": -0.7974553108215332,
	"max": 0.16911621391773224,
	"count": 50
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 50
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 50
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.1884333292643229,
	"min": -0.42857142857142855,
	"max": 0.28112380845206125,
	"count": 50
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 2.261199951171875,
	"min": -6.481600046157837,
	"max": 5.914799869060516,
	"count": 50
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.1884333292643229,
	"min": -0.42857142857142855,
	"max": 0.28112380845206125,
	"count": 50
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 2.261199951171875,
	"min": -6.481600046157837,
	"max": 5.914799869060516,
	"count": 50
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 50
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 50
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.013158223312348127,
	"min": 0.013158223312348127,
	"max": 0.02181773379512985,
	"count": 23
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.013158223312348127,
	"min": 0.013158223312348127,
	"max": 0.02181773379512985,
	"count": 23
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.002371368452440947,
	"min": 0.001030550831152747,
	"max": 0.008068540676807364,
	"count": 23
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.002371368452440947,
	"min": 0.001030550831152747,
	"max": 0.008068540676807364,
	"count": 23
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.0023823169137661654,
	"min": 0.0010245292204975462,
	"max": 0.00846226663949589,
	"count": 23
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.0023823169137661654,
	"min": 0.0010245292204975462,
	"max": 0.00846226663949589,
	"count": 23
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 23
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 23
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000004,
	"max": 0.20000000000000007,
	"count": 23
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000004,
	"max": 0.20000000000000007,
	"count": 23
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 23
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 23
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1686155198",
	"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
	"command_line_arguments": "/root/anaconda3/envs/minerl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwosSmall --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1686157268"
	},
	"total": 2070.2178055,
	"count": 1,
	"self": 1.0250520999998116,
	"children": {
	"run_training.setup": {
	"total": 0.00976950000006127,
	"count": 1,
	"self": 0.00976950000006127
	},
	"TrainerController.start_learning": {
	"total": 2069.1829839,
	"count": 1,
	"self": 1.3087680999606164,
	"children": {
	"TrainerController._reset_env": {
	"total": 24.69935509999982,
	"count": 24,
	"self": 24.69935509999982
	},
	"TrainerController.advance": {
	"total": 2042.8906650000397,
	"count": 41247,
	"self": 1.531998200058979,
	"children": {
	"env_step": {
	"total": 1800.0333814000205,
	"count": 41247,
	"self": 1292.097474000071,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 507.09667869996053,
	"count": 41247,
	"self": 9.963009099907708,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 497.1336696000528,
	"count": 81874,
	"self": 497.1336696000528
	}
	}
	},
	"workers": {
	"total": 0.8392286999890075,
	"count": 41247,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2064.7671305000245,
	"count": 41247,
	"is_parallel": true,
	"self": 913.0688027000447,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.021959499999979926,
	"count": 2,
	"is_parallel": true,
	"self": 0.019849999999905776,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0021095000000741493,
	"count": 8,
	"is_parallel": true,
	"self": 0.0021095000000741493
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04585650000001351,
	"count": 1,
	"is_parallel": true,
	"self": 0.000559800000019095,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0010837999999466774,
	"count": 1,
	"is_parallel": true,
	"self": 0.0010837999999466774
	},
	"communicator.exchange": {
	"total": 0.0426003000000037,
	"count": 1,
	"is_parallel": true,
	"self": 0.0426003000000037
	},
	"steps_from_proto": {
	"total": 0.00161260000004404,
	"count": 2,
	"is_parallel": true,
	"self": 0.00036639999996168626,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012462000000823537,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012462000000823537
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1151.6590933999796,
	"count": 41246,
	"is_parallel": true,
	"self": 32.20160970006327,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 21.53810140003327,
	"count": 41246,
	"is_parallel": true,
	"self": 21.53810140003327
	},
	"communicator.exchange": {
	"total": 1000.0520061999762,
	"count": 41246,
	"is_parallel": true,
	"self": 1000.0520061999762
	},
	"steps_from_proto": {
	"total": 97.867376099907,
	"count": 82492,
	"is_parallel": true,
	"self": 20.509618399821647,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 77.35775770008536,
	"count": 329968,
	"is_parallel": true,
	"self": 77.35775770008536
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.03923440000005485,
	"count": 46,
	"is_parallel": true,
	"self": 0.008302300002924312,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.030932099997130535,
	"count": 184,
	"is_parallel": true,
	"self": 0.030932099997130535
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 241.3252853999603,
	"count": 41247,
	"self": 6.886319299973252,
	"children": {
	"process_trajectory": {
	"total": 61.18131969998774,
	"count": 41247,
	"self": 60.558825599988154,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.6224940999995852,
	"count": 1,
	"self": 0.6224940999995852
	}
	}
	},
	"_update_policy": {
	"total": 173.25764639999932,
	"count": 23,
	"self": 91.8774011999974,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 81.38024520000192,
	"count": 699,
	"self": 81.38024520000192
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.5999999050109182e-06,
	"count": 1,
	"self": 1.5999999050109182e-06
	},
	"TrainerController._save_models": {
	"total": 0.2841941000001498,
	"count": 1,
	"self": 0.001792300000488467,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2824017999996613,
	"count": 1,
	"self": 0.2824017999996613
	}
	}
	}
	}
	}
	}
	}