{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.5919218063354492,
"min": 1.4956210851669312,
"max": 1.6350440979003906,
"count": 200
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 32093.142578125,
"min": 26902.1875,
"max": 38142.2578125,
"count": 200
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 46.96190476190476,
"min": 42.45217391304348,
"max": 79.375,
"count": 200
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19724.0,
"min": 18752.0,
"max": 20632.0,
"count": 200
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1624.790383699933,
"min": 1607.4711872889911,
"max": 1673.5935545049867,
"count": 200
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 341205.9805769859,
"min": 213452.26426934518,
"max": 374231.6138551592,
"count": 200
},
"SoccerTwos.Step.mean": {
"value": 11999992.0,
"min": 10009960.0,
"max": 11999992.0,
"count": 200
},
"SoccerTwos.Step.sum": {
"value": 11999992.0,
"min": 10009960.0,
"max": 11999992.0,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.03493068367242813,
"min": -0.12044847011566162,
"max": 0.06294773519039154,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -7.300512790679932,
"min": -21.56027603149414,
"max": 10.764062881469727,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.03292582184076309,
"min": -0.11908195167779922,
"max": 0.06389004737138748,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -6.881496429443359,
"min": -21.315670013427734,
"max": 10.92519760131836,
"count": 200
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 200
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.04784880528609718,
"min": -0.38507246539212653,
"max": 0.2724795910168667,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -10.000400304794312,
"min": -57.91599977016449,
"max": 53.40599983930588,
"count": 200
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.04784880528609718,
"min": -0.38507246539212653,
"max": 0.2724795910168667,
"count": 200
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -10.000400304794312,
"min": -57.91599977016449,
"max": 53.40599983930588,
"count": 200
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 200
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 200
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.0177549017011188,
"min": 0.009863875313506772,
"max": 0.023703478168075283,
"count": 97
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.0177549017011188,
"min": 0.009863875313506772,
"max": 0.023703478168075283,
"count": 97
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.11240861117839814,
"min": 0.08955958659450212,
"max": 0.12260147780179978,
"count": 97
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.11240861117839814,
"min": 0.08955958659450212,
"max": 0.12260147780179978,
"count": 97
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.1141607624789079,
"min": 0.09055832202235857,
"max": 0.12472489426533381,
"count": 97
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.1141607624789079,
"min": 0.09055832202235857,
"max": 0.12472489426533381,
"count": 97
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 97
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 97
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 97
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 97
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 97
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 97
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1675764874",
"python_version": "3.9.16 (main, Feb 6 2023, 20:06:40) \n[GCC 9.3.0]",
"command_line_arguments": "/usr/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1675772618"
},
"total": 7743.998904499982,
"count": 1,
"self": 0.32225789997028187,
"children": {
"run_training.setup": {
"total": 0.02660820001619868,
"count": 1,
"self": 0.02660820001619868
},
"TrainerController.start_learning": {
"total": 7743.6500383999955,
"count": 1,
"self": 4.668742704845499,
"children": {
"TrainerController._reset_env": {
"total": 1.0244025999563746,
"count": 11,
"self": 1.0244025999563746
},
"TrainerController.advance": {
"total": 7737.361320095166,
"count": 139159,
"self": 4.98392969116685,
"children": {
"env_step": {
"total": 4212.561896803614,
"count": 139159,
"self": 3654.098938797717,
"children": {
"SubprocessEnvManager._take_step": {
"total": 555.7198837042088,
"count": 139159,
"self": 23.844434808474034,
"children": {
"TorchPolicy.evaluate": {
"total": 531.8754488957347,
"count": 250862,
"self": 531.8754488957347
}
}
},
"workers": {
"total": 2.743074301688466,
"count": 139159,
"self": 0.0,
"children": {
"worker_root": {
"total": 7732.718036797887,
"count": 139159,
"is_parallel": true,
"self": 4541.120139499137,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0027423000137787312,
"count": 2,
"is_parallel": true,
"self": 0.0007940000214148313,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0019482999923639,
"count": 8,
"is_parallel": true,
"self": 0.0019482999923639
}
}
},
"UnityEnvironment.step": {
"total": 0.032378300005802885,
"count": 1,
"is_parallel": true,
"self": 0.0005550000059884042,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0003876000118907541,
"count": 1,
"is_parallel": true,
"self": 0.0003876000118907541
},
"communicator.exchange": {
"total": 0.02974900000845082,
"count": 1,
"is_parallel": true,
"self": 0.02974900000845082
},
"steps_from_proto": {
"total": 0.0016866999794729054,
"count": 2,
"is_parallel": true,
"self": 0.0003722999827004969,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013143999967724085,
"count": 8,
"is_parallel": true,
"self": 0.0013143999967724085
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.026429500081576407,
"count": 20,
"is_parallel": true,
"self": 0.005045899888500571,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.021383600193075836,
"count": 80,
"is_parallel": true,
"self": 0.021383600193075836
}
}
},
"UnityEnvironment.step": {
"total": 3191.571467798669,
"count": 139158,
"is_parallel": true,
"self": 104.29615609551547,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 82.30171659815824,
"count": 139158,
"is_parallel": true,
"self": 82.30171659815824
},
"communicator.exchange": {
"total": 2687.287804999505,
"count": 139158,
"is_parallel": true,
"self": 2687.287804999505
},
"steps_from_proto": {
"total": 317.68579010549,
"count": 278316,
"is_parallel": true,
"self": 69.9587420883181,
"children": {
"_process_rank_one_or_two_observation": {
"total": 247.7270480171719,
"count": 1113264,
"is_parallel": true,
"self": 247.7270480171719
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 3519.815493600385,
"count": 139159,
"self": 26.330489595391555,
"children": {
"process_trajectory": {
"total": 636.5708583049709,
"count": 139159,
"self": 635.6785552049405,
"children": {
"RLTrainer._checkpoint": {
"total": 0.8923031000304036,
"count": 4,
"self": 0.8923031000304036
}
}
},
"_update_policy": {
"total": 2856.9141457000223,
"count": 97,
"self": 363.9008511992288,
"children": {
"TorchPOCAOptimizer.update": {
"total": 2493.0132945007936,
"count": 2910,
"self": 2493.0132945007936
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.300009898841381e-06,
"count": 1,
"self": 1.300009898841381e-06
},
"TrainerController._save_models": {
"total": 0.5955717000178993,
"count": 1,
"self": 0.00163569999858737,
"children": {
"RLTrainer._checkpoint": {
"total": 0.5939360000193119,
"count": 1,
"self": 0.5939360000193119
}
}
}
}
}
}
}
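
The JSON above is an ML-Agents timer/gauge dump: each entry under "gauges" records the last logged value plus min, max, and sample count, and each timer node records inclusive "total" seconds, exclusive "self" seconds, a call "count", and nested "children". As a minimal sketch (not part of the training run), the snippet below shows one way this file could be inspected; the path "run_logs/timers.json" is an assumption based on the usual ML-Agents output layout, so adjust it to wherever the file actually lives.

import json

# Load the dump; the root object holds "gauges", "metadata", and the timer tree.
with open("run_logs/timers.json") as f:
    root = json.load(f)

# Gauges keep the last recorded value plus min/max and a sample count.
elo = root["gauges"]["SoccerTwos.Self-play.ELO.mean"]
print(f"Final ELO: {elo['value']:.1f} "
      f"(min {elo['min']:.1f}, max {elo['max']:.1f}, n={elo['count']})")

# Timer nodes carry "total" (inclusive seconds), "self" (exclusive seconds),
# "count", and nested "children"; walk the tree to find the biggest self-time sinks.
def walk(node, name="root"):
    yield name, node.get("self", 0.0)
    for child_name, child in node.get("children", {}).items():
        yield from walk(child, child_name)

for name, self_time in sorted(walk(root), key=lambda t: t[1], reverse=True)[:5]:
    print(f"{self_time:10.1f} s  {name}")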