Second Push

01c4fee about 1 year ago

No virus

20.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.134723663330078,
	"min": 3.134723663330078,
	"max": 3.295743703842163,
	"count": 200
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 69014.078125,
	"min": 23137.46484375,
	"max": 112792.7890625,
	"count": 200
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 670.1428571428571,
	"min": 418.1818181818182,
	"max": 999.0,
	"count": 200
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 18764.0,
	"min": 16544.0,
	"max": 23560.0,
	"count": 200
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1207.5592719658505,
	"min": 1190.3462539934706,
	"max": 1207.5592719658505,
	"count": 165
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 7245.355631795102,
	"min": 2381.9796513433785,
	"max": 21607.680104602616,
	"count": 165
	},
	"SoccerTwos.Step.mean": {
	"value": 1999164.0,
	"min": 9140.0,
	"max": 1999164.0,
	"count": 200
	},
	"SoccerTwos.Step.sum": {
	"value": 1999164.0,
	"min": 9140.0,
	"max": 1999164.0,
	"count": 200
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.013440868817269802,
	"min": -0.02255900204181671,
	"max": 0.07795070856809616,
	"count": 200
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.18817216157913208,
	"min": -0.3406982421875,
	"max": 1.5590142011642456,
	"count": 200
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.011447346769273281,
	"min": -0.02832871302962303,
	"max": 0.07786843925714493,
	"count": 200
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.1602628529071808,
	"min": -0.4602850675582886,
	"max": 1.5573687553405762,
	"count": 200
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 200
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 200
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.3288285732269287,
	"min": -0.6,
	"max": 0.375925000756979,
	"count": 200
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 4.603600025177002,
	"min": -7.7368000745773315,
	"max": 6.014800012111664,
	"count": 200
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.3288285732269287,
	"min": -0.6,
	"max": 0.375925000756979,
	"count": 200
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 4.603600025177002,
	"min": -7.7368000745773315,
	"max": 6.014800012111664,
	"count": 200
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 200
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 200
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.016989466220062848,
	"min": 0.011690640903058618,
	"max": 0.02217564850967998,
	"count": 93
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.016989466220062848,
	"min": 0.011690640903058618,
	"max": 0.02217564850967998,
	"count": 93
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.0025493189576081933,
	"min": 2.715861914263466e-06,
	"max": 0.01054837116971612,
	"count": 93
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.0025493189576081933,
	"min": 2.715861914263466e-06,
	"max": 0.01054837116971612,
	"count": 93
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.002578929966936509,
	"min": 2.2835658095724892e-06,
	"max": 0.010203083076824744,
	"count": 93
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.002578929966936509,
	"min": 2.2835658095724892e-06,
	"max": 0.010203083076824744,
	"count": 93
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 93
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 93
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.2,
	"max": 0.20000000000000007,
	"count": 93
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.2,
	"max": 0.20000000000000007,
	"count": 93
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 93
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 93
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1681562902",
	"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/aztleclan/training/moocs/huggingfaces/unit7/.conda/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env ./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1681566715"
	},
	"total": 3813.399794515999,
	"count": 1,
	"self": 0.3209155739987182,
	"children": {
	"run_training.setup": {
	"total": 0.012022582000099646,
	"count": 1,
	"self": 0.012022582000099646
	},
	"TrainerController.start_learning": {
	"total": 3813.06685636,
	"count": 1,
	"self": 2.9389210559420462,
	"children": {
	"TrainerController._reset_env": {
	"total": 5.7804522669994185,
	"count": 10,
	"self": 5.7804522669994185
	},
	"TrainerController.advance": {
	"total": 3804.0603381170595,
	"count": 130218,
	"self": 3.510101454347023,
	"children": {
	"env_step": {
	"total": 2834.846090115796,
	"count": 130218,
	"self": 2204.7434627477887,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 628.1614574820524,
	"count": 130218,
	"self": 23.233958940654702,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 604.9274985413977,
	"count": 258436,
	"self": 604.9274985413977
	}
	}
	},
	"workers": {
	"total": 1.9411698859548778,
	"count": 130218,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3807.1614705310885,
	"count": 130218,
	"is_parallel": true,
	"self": 1971.222390435908,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.005138307999914105,
	"count": 2,
	"is_parallel": true,
	"self": 0.001479011000810715,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0036592969991033897,
	"count": 8,
	"is_parallel": true,
	"self": 0.0036592969991033897
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.036166889000014635,
	"count": 1,
	"is_parallel": true,
	"self": 0.001194107000628719,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0007146540001485846,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007146540001485846
	},
	"communicator.exchange": {
	"total": 0.0314693599993916,
	"count": 1,
	"is_parallel": true,
	"self": 0.0314693599993916
	},
	"steps_from_proto": {
	"total": 0.0027887679998457315,
	"count": 2,
	"is_parallel": true,
	"self": 0.0005849069984833477,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002203861001362384,
	"count": 8,
	"is_parallel": true,
	"self": 0.002203861001362384
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1835.92103960018,
	"count": 130217,
	"is_parallel": true,
	"self": 109.5906046352602,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 64.5990994740423,
	"count": 130217,
	"is_parallel": true,
	"self": 64.5990994740423
	},
	"communicator.exchange": {
	"total": 1377.2451884587445,
	"count": 130217,
	"is_parallel": true,
	"self": 1377.2451884587445
	},
	"steps_from_proto": {
	"total": 284.486147032133,
	"count": 260434,
	"is_parallel": true,
	"self": 54.12488937899434,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 230.36125765313864,
	"count": 1041736,
	"is_parallel": true,
	"self": 230.36125765313864
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.018040495000605006,
	"count": 18,
	"is_parallel": true,
	"self": 0.0036618320027628215,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.014378662997842184,
	"count": 72,
	"is_parallel": true,
	"self": 0.014378662997842184
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 965.7041465469165,
	"count": 130218,
	"self": 21.454896582661604,
	"children": {
	"process_trajectory": {
	"total": 194.95743723825217,
	"count": 130218,
	"self": 193.74353206125124,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.2139051770009246,
	"count": 4,
	"self": 1.2139051770009246
	}
	}
	},
	"_update_policy": {
	"total": 749.2918127260027,
	"count": 93,
	"self": 335.0551875339879,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 414.2366251920148,
	"count": 2796,
	"self": 414.2366251920148
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.160004654200748e-07,
	"count": 1,
	"self": 8.160004654200748e-07
	},
	"TrainerController._save_models": {
	"total": 0.2871441039987985,
	"count": 1,
	"self": 0.002259959997900296,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.28488414400089823,
	"count": 1,
	"self": 0.28488414400089823
	}
	}
	}
	}
	}
	}
	}