First Version

a8a8649 over 1 year ago

20.7 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.0931687355041504,
	"min": 3.0931687355041504,
	"max": 3.285083770751953,
	"count": 20
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 318126.21875,
	"min": 295396.78125,
	"max": 392512.96875,
	"count": 20
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 905.2142857142857,
	"min": 742.5151515151515,
	"max": 964.2692307692307,
	"count": 20
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 101384.0,
	"min": 96920.0,
	"max": 102956.0,
	"count": 20
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1200.794760242277,
	"min": 1200.4892579168904,
	"max": 1204.2571574161518,
	"count": 20
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 14409.537122907324,
	"min": 4814.783399651233,
	"max": 33639.309722443664,
	"count": 20
	},
	"SoccerTwos.Step.mean": {
	"value": 999776.0,
	"min": 49360.0,
	"max": 999776.0,
	"count": 20
	},
	"SoccerTwos.Step.sum": {
	"value": 999776.0,
	"min": 49360.0,
	"max": 999776.0,
	"count": 20
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.0016028030076995492,
	"min": -0.004264697432518005,
	"max": 0.08232221752405167,
	"count": 20
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.08975696563720703,
	"min": -0.2430877536535263,
	"max": 4.857010841369629,
	"count": 20
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.0017203426687046885,
	"min": -0.005274998489767313,
	"max": 0.08306208997964859,
	"count": 20
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.09633918851613998,
	"min": -0.3006749153137207,
	"max": 4.900663375854492,
	"count": 20
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 20
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 20
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.11030000022479466,
	"min": -0.12444178960216579,
	"max": 0.052999999236177514,
	"count": 20
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -6.176800012588501,
	"min": -8.337599903345108,
	"max": 2.861999958753586,
	"count": 20
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.11030000022479466,
	"min": -0.12444178960216579,
	"max": 0.052999999236177514,
	"count": 20
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -6.176800012588501,
	"min": -8.337599903345108,
	"max": 2.861999958753586,
	"count": 20
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.016466266225458336,
	"min": 0.015288337600468365,
	"max": 0.01968905675690621,
	"count": 20
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.049398798676375005,
	"min": 0.018511507396968746,
	"max": 0.05831768332718639,
	"count": 20
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.0008875883443094306,
	"min": 0.00012735439536484705,
	"max": 0.0018866164041780088,
	"count": 20
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.0026627650329282917,
	"min": 0.0002547087907296941,
	"max": 0.005659849212534027,
	"count": 20
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.0008889668918709504,
	"min": 0.00012729530923465406,
	"max": 0.0019485034459891415,
	"count": 20
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.002666900675612851,
	"min": 0.0002545906184693081,
	"max": 0.005845510337967425,
	"count": 20
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 1.3029764060733328e-05,
	"min": 1.3029764060733328e-05,
	"max": 0.0004852640029471997,
	"count": 20
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 3.908929218219998e-05,
	"min": 3.908929218219998e-05,
	"max": 0.001392970021406,
	"count": 20
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.10260593333333333,
	"min": 0.10260593333333333,
	"max": 0.19705279999999997,
	"count": 20
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.3078178,
	"min": 0.19705279999999997,
	"max": 0.578594,
	"count": 20
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.00016609540666666662,
	"min": 0.00016609540666666662,
	"max": 0.00582346272,
	"count": 20
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.0004982862199999999,
	"min": 0.0004982862199999999,
	"max": 0.016717780600000003,
	"count": 20
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 20
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 20
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1676309823",
	"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn /content/ml-agents/config/poca/SoccerTwos.yaml --env=/content/ml-agents/training-envs-executables/linux/SoccerTwos/SoccerTwos --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.29.0.dev0",
	"mlagents_envs_version": "0.29.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.21.6",
	"end_time_seconds": "1676312152"
	},
	"total": 2329.668662306,
	"count": 1,
	"self": 0.377563771000041,
	"children": {
	"run_training.setup": {
	"total": 0.1968287849999797,
	"count": 1,
	"self": 0.1968287849999797
	},
	"TrainerController.start_learning": {
	"total": 2329.09426975,
	"count": 1,
	"self": 1.3139922649606888,
	"children": {
	"TrainerController._reset_env": {
	"total": 6.492277372000331,
	"count": 5,
	"self": 6.492277372000331
	},
	"TrainerController.advance": {
	"total": 2320.937627842038,
	"count": 65137,
	"self": 1.6417428820550413,
	"children": {
	"env_step": {
	"total": 1704.1357154320035,
	"count": 65137,
	"self": 1291.5167122129455,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 411.75434580099125,
	"count": 65137,
	"self": 11.198707932950924,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 400.5556378680403,
	"count": 129396,
	"self": 73.7570395059746,
	"children": {
	"TorchPolicy.sample_actions": {
	"total": 326.7985983620657,
	"count": 129396,
	"self": 326.7985983620657
	}
	}
	}
	}
	},
	"workers": {
	"total": 0.8646574180665993,
	"count": 65137,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2324.302779778049,
	"count": 65137,
	"is_parallel": true,
	"self": 1236.861539408057,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002927940000063245,
	"count": 2,
	"is_parallel": true,
	"self": 0.0008689640001193766,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0020589759999438684,
	"count": 8,
	"is_parallel": true,
	"self": 0.0020589759999438684
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.03854192399990097,
	"count": 1,
	"is_parallel": true,
	"self": 0.0011098549998678209,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0008918969999740511,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008918969999740511
	},
	"communicator.exchange": {
	"total": 0.032974581999951624,
	"count": 1,
	"is_parallel": true,
	"self": 0.032974581999951624
	},
	"steps_from_proto": {
	"total": 0.003565590000107477,
	"count": 2,
	"is_parallel": true,
	"self": 0.0007971310000129961,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002768459000094481,
	"count": 8,
	"is_parallel": true,
	"self": 0.002768459000094481
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1087.4337666899917,
	"count": 65136,
	"is_parallel": true,
	"self": 64.38289495199456,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 50.44968356303423,
	"count": 65136,
	"is_parallel": true,
	"self": 50.44968356303423
	},
	"communicator.exchange": {
	"total": 763.7788883129964,
	"count": 65136,
	"is_parallel": true,
	"self": 763.7788883129964
	},
	"steps_from_proto": {
	"total": 208.82229986196648,
	"count": 130272,
	"is_parallel": true,
	"self": 42.197285519956154,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 166.62501434201033,
	"count": 521088,
	"is_parallel": true,
	"self": 166.62501434201033
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.0074736800004302495,
	"count": 8,
	"is_parallel": true,
	"self": 0.001717889000019568,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.005755791000410682,
	"count": 32,
	"is_parallel": true,
	"self": 0.005755791000410682
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 615.1601695279796,
	"count": 65137,
	"self": 11.888566690920243,
	"children": {
	"process_trajectory": {
	"total": 151.08626794405905,
	"count": 65137,
	"self": 150.48433769205917,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.6019302519998746,
	"count": 2,
	"self": 0.6019302519998746
	}
	}
	},
	"_update_policy": {
	"total": 452.18533489300034,
	"count": 46,
	"self": 269.0533900849837,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 183.13194480801667,
	"count": 2320,
	"self": 183.13194480801667
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.290003279398661e-07,
	"count": 1,
	"self": 8.290003279398661e-07
	},
	"TrainerController._save_models": {
	"total": 0.35037144200032344,
	"count": 1,
	"self": 0.003085347000251204,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.34728609500007224,
	"count": 1,
	"self": 0.34728609500007224
	}
	}
	}
	}
	}
	}
	}