poca-SoccerTwos / run_logs /timers.json
Genis
First Commit
766d45f
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.6801722049713135,
"min": 1.6689929962158203,
"max": 3.295753240585327,
"count": 522
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 31345.29296875,
"min": 16059.88671875,
"max": 117480.875,
"count": 522
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 47.85436893203884,
"min": 37.19402985074627,
"max": 999.0,
"count": 522
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19716.0,
"min": 12776.0,
"max": 28128.0,
"count": 522
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1512.3841506926258,
"min": 1182.721040420331,
"max": 1520.1387888025301,
"count": 500
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 311551.1350426809,
"min": 2365.575166765614,
"max": 402909.03120493336,
"count": 500
},
"SoccerTwos.Step.mean": {
"value": 5219984.0,
"min": 9082.0,
"max": 5219984.0,
"count": 522
},
"SoccerTwos.Step.sum": {
"value": 5219984.0,
"min": 9082.0,
"max": 5219984.0,
"count": 522
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.017524413764476776,
"min": -0.12234243750572205,
"max": 0.30277761816978455,
"count": 522
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -3.5925049781799316,
"min": -24.590829849243164,
"max": 32.93498611450195,
"count": 522
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.01664070226252079,
"min": -0.12715943157672882,
"max": 0.2870791554450989,
"count": 522
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -3.411344051361084,
"min": -25.559045791625977,
"max": 31.987327575683594,
"count": 522
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 522
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 522
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.1805639040179369,
"min": -0.5964551711904591,
"max": 0.48996875062584877,
"count": 522
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -37.01560032367706,
"min": -56.88379991054535,
"max": 51.32639992237091,
"count": 522
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.1805639040179369,
"min": -0.5964551711904591,
"max": 0.48996875062584877,
"count": 522
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -37.01560032367706,
"min": -56.88379991054535,
"max": 51.32639992237091,
"count": 522
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 522
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 522
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.016975674087492128,
"min": 0.011308841101708822,
"max": 0.024441575802241763,
"count": 250
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.016975674087492128,
"min": 0.011308841101708822,
"max": 0.024441575802241763,
"count": 250
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.09598184923330942,
"min": 1.3440602704880196e-06,
"max": 0.10366184016068776,
"count": 250
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.09598184923330942,
"min": 1.3440602704880196e-06,
"max": 0.10366184016068776,
"count": 250
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.09921732048193614,
"min": 4.471496655848265e-06,
"max": 0.10685077408949534,
"count": 250
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.09921732048193614,
"min": 4.471496655848265e-06,
"max": 0.10685077408949534,
"count": 250
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0005000000000000001,
"min": 0.0005000000000000001,
"max": 0.0005000000000000001,
"count": 250
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0005000000000000001,
"min": 0.0005000000000000001,
"max": 0.0005000000000000001,
"count": 250
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 250
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 250
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 250
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 250
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1692717082",
"python_version": "3.9.17 (main, Jul 5 2023, 20:41:20) \n[GCC 11.2.0]",
"command_line_arguments": "/home/genis/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1692734710"
},
"total": 17627.666772411998,
"count": 1,
"self": 0.09028954200039152,
"children": {
"run_training.setup": {
"total": 0.008287695000035455,
"count": 1,
"self": 0.008287695000035455
},
"TrainerController.start_learning": {
"total": 17627.568195174998,
"count": 1,
"self": 7.836454700638569,
"children": {
"TrainerController._reset_env": {
"total": 2.0494618500052866,
"count": 21,
"self": 2.0494618500052866
},
"TrainerController.advance": {
"total": 17617.451557357355,
"count": 355657,
"self": 7.943129163682897,
"children": {
"env_step": {
"total": 5259.7881734208,
"count": 355657,
"self": 4268.029192443379,
"children": {
"SubprocessEnvManager._take_step": {
"total": 987.002381628069,
"count": 355657,
"self": 38.885623749441834,
"children": {
"TorchPolicy.evaluate": {
"total": 948.1167578786271,
"count": 659920,
"self": 948.1167578786271
}
}
},
"workers": {
"total": 4.756599349352882,
"count": 355656,
"self": 0.0,
"children": {
"worker_root": {
"total": 17616.246501720587,
"count": 355656,
"is_parallel": true,
"self": 14199.876406307758,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.002839553000058004,
"count": 2,
"is_parallel": true,
"self": 0.0013376410003047567,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001501911999753247,
"count": 8,
"is_parallel": true,
"self": 0.001501911999753247
}
}
},
"UnityEnvironment.step": {
"total": 0.019501769000044078,
"count": 1,
"is_parallel": true,
"self": 0.00047463800001423806,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00035923199993703747,
"count": 1,
"is_parallel": true,
"self": 0.00035923199993703747
},
"communicator.exchange": {
"total": 0.017162689000087994,
"count": 1,
"is_parallel": true,
"self": 0.017162689000087994
},
"steps_from_proto": {
"total": 0.0015052100000048085,
"count": 2,
"is_parallel": true,
"self": 0.00028915600000800623,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012160539999968023,
"count": 8,
"is_parallel": true,
"self": 0.0012160539999968023
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 3416.3324846668224,
"count": 355655,
"is_parallel": true,
"self": 192.92021787136537,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 129.56033859774914,
"count": 355655,
"is_parallel": true,
"self": 129.56033859774914
},
"communicator.exchange": {
"total": 2474.453554164158,
"count": 355655,
"is_parallel": true,
"self": 2474.453554164158
},
"steps_from_proto": {
"total": 619.3983740335495,
"count": 711310,
"is_parallel": true,
"self": 122.86005064013443,
"children": {
"_process_rank_one_or_two_observation": {
"total": 496.5383233934151,
"count": 2845240,
"is_parallel": true,
"self": 496.5383233934151
}
}
}
}
},
"steps_from_proto": {
"total": 0.03761074600720349,
"count": 40,
"is_parallel": true,
"self": 0.0073545120210383175,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.03025623398616517,
"count": 160,
"is_parallel": true,
"self": 0.03025623398616517
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 12349.720254772872,
"count": 355656,
"self": 53.74877238922272,
"children": {
"process_trajectory": {
"total": 1201.6411975316382,
"count": 355656,
"self": 1198.943791865635,
"children": {
"RLTrainer._checkpoint": {
"total": 2.6974056660033057,
"count": 10,
"self": 2.6974056660033057
}
}
},
"_update_policy": {
"total": 11094.33028485201,
"count": 251,
"self": 778.9787935760087,
"children": {
"TorchPOCAOptimizer.update": {
"total": 10315.351491276002,
"count": 7530,
"self": 10315.351491276002
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.0909971024375409e-06,
"count": 1,
"self": 1.0909971024375409e-06
},
"TrainerController._save_models": {
"total": 0.23072017600134131,
"count": 1,
"self": 0.0015350430003309157,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2291851330010104,
"count": 1,
"self": 0.2291851330010104
}
}
}
}
}
}
}