nhiro3303's picture
Push 50M
790c485
raw
history blame contribute delete
No virus
20.2 kB
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.6343845129013062,
"min": 1.521212100982666,
"max": 1.9592007398605347,
"count": 2858
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 32060.0859375,
"min": 25845.744140625,
"max": 46363.984375,
"count": 2858
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 58.55952380952381,
"min": 38.872,
"max": 94.61538461538461,
"count": 2858
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19676.0,
"min": 17140.0,
"max": 21672.0,
"count": 2858
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1786.6314440923768,
"min": 1636.9452435120165,
"max": 1819.7730164239865,
"count": 2858
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 300154.0826075193,
"min": 173106.6109845909,
"max": 441662.6361849826,
"count": 2858
},
"SoccerTwos.Step.mean": {
"value": 49999913.0,
"min": 21429965.0,
"max": 49999913.0,
"count": 2858
},
"SoccerTwos.Step.sum": {
"value": 49999913.0,
"min": 21429965.0,
"max": 49999913.0,
"count": 2858
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.032919157296419144,
"min": -0.13656257092952728,
"max": 0.08040333539247513,
"count": 2858
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 5.563337326049805,
"min": -25.272960662841797,
"max": 13.092177391052246,
"count": 2858
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.03192002698779106,
"min": -0.13798409700393677,
"max": 0.08274845778942108,
"count": 2858
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 5.394484519958496,
"min": -26.078994750976562,
"max": 13.456812858581543,
"count": 2858
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2858
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2858
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.057566864250679695,
"min": -0.3954981365559264,
"max": 0.3420427487096714,
"count": 2858
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -9.728800058364868,
"min": -63.67519998550415,
"max": 59.30879986286163,
"count": 2858
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.057566864250679695,
"min": -0.3954981365559264,
"max": 0.3420427487096714,
"count": 2858
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -9.728800058364868,
"min": -63.67519998550415,
"max": 59.30879986286163,
"count": 2858
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2858
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2858
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.010540140032147368,
"min": 0.005118976589680339,
"max": 0.02047771094366908,
"count": 1387
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.010540140032147368,
"min": 0.005118976589680339,
"max": 0.02047771094366908,
"count": 1387
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.11124143153429031,
"min": 0.08768866906563441,
"max": 0.14099180499712627,
"count": 1387
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.11124143153429031,
"min": 0.08768866906563441,
"max": 0.14099180499712627,
"count": 1387
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.11151622086763383,
"min": 0.08805444538593292,
"max": 0.14152407348155976,
"count": 1387
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.11151622086763383,
"min": 0.08805444538593292,
"max": 0.14152407348155976,
"count": 1387
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.00029,
"min": 0.00029,
"max": 0.00029,
"count": 1387
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.00029,
"min": 0.00029,
"max": 0.00029,
"count": 1387
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.21,
"min": 0.21,
"max": 0.21,
"count": 1387
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.21,
"min": 0.21,
"max": 0.21,
"count": 1387
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005099999999999999,
"min": 0.005099999999999999,
"max": 0.005099999999999999,
"count": 1387
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005099999999999999,
"min": 0.005099999999999999,
"max": 0.005099999999999999,
"count": 1387
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1676425082",
"python_version": "3.9.9 (main, Feb 15 2023, 00:04:22) \n[GCC 11.3.0]",
"command_line_arguments": "/home/gpu/venv/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=../training-envs-executables/linux/SoccerTwos --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.13.1+cu117",
"numpy_version": "1.21.2",
"end_time_seconds": "1676472112"
},
"total": 47029.300314456006,
"count": 1,
"self": 0.22009283798979595,
"children": {
"run_training.setup": {
"total": 0.016478817007737234,
"count": 1,
"self": 0.016478817007737234
},
"TrainerController.start_learning": {
"total": 47029.06374280101,
"count": 1,
"self": 30.724192420369945,
"children": {
"TrainerController._reset_env": {
"total": 3.3332904600101756,
"count": 144,
"self": 3.3332904600101756
},
"TrainerController.advance": {
"total": 46994.85714822463,
"count": 1984230,
"self": 30.951789093989646,
"children": {
"env_step": {
"total": 35232.59208244787,
"count": 1984230,
"self": 22912.192437588354,
"children": {
"SubprocessEnvManager._take_step": {
"total": 12302.328775190283,
"count": 1984230,
"self": 179.16375628819515,
"children": {
"TorchPolicy.evaluate": {
"total": 12123.165018902087,
"count": 3586810,
"self": 12123.165018902087
}
}
},
"workers": {
"total": 18.070869669230888,
"count": 1984230,
"self": 0.0,
"children": {
"worker_root": {
"total": 46953.56185648771,
"count": 1984230,
"is_parallel": true,
"self": 27453.984898038718,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0015131039981497452,
"count": 2,
"is_parallel": true,
"self": 0.0003681899979710579,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011449140001786873,
"count": 8,
"is_parallel": true,
"self": 0.0011449140001786873
}
}
},
"UnityEnvironment.step": {
"total": 0.02039232499373611,
"count": 1,
"is_parallel": true,
"self": 0.0003975409781560302,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0003643910022219643,
"count": 1,
"is_parallel": true,
"self": 0.0003643910022219643
},
"communicator.exchange": {
"total": 0.01818073600588832,
"count": 1,
"is_parallel": true,
"self": 0.01818073600588832
},
"steps_from_proto": {
"total": 0.0014496570074697956,
"count": 2,
"is_parallel": true,
"self": 0.0003064430202357471,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011432139872340485,
"count": 8,
"is_parallel": true,
"self": 0.0011432139872340485
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.1750064150255639,
"count": 286,
"is_parallel": true,
"self": 0.03774280825746246,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.13726360676810145,
"count": 1144,
"is_parallel": true,
"self": 0.13726360676810145
}
}
},
"UnityEnvironment.step": {
"total": 19499.401952033964,
"count": 1984229,
"is_parallel": true,
"self": 728.384919047603,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 456.81114661268657,
"count": 1984229,
"is_parallel": true,
"self": 456.81114661268657
},
"communicator.exchange": {
"total": 16176.186887175107,
"count": 1984229,
"is_parallel": true,
"self": 16176.186887175107
},
"steps_from_proto": {
"total": 2138.018999198568,
"count": 3968458,
"is_parallel": true,
"self": 454.51436859848036,
"children": {
"_process_rank_one_or_two_observation": {
"total": 1683.5046306000877,
"count": 15873832,
"is_parallel": true,
"self": 1683.5046306000877
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 11731.313276682777,
"count": 1984230,
"self": 235.73383657041995,
"children": {
"process_trajectory": {
"total": 6023.283170795083,
"count": 1984230,
"self": 6015.277920442022,
"children": {
"RLTrainer._checkpoint": {
"total": 8.005250353060546,
"count": 58,
"self": 8.005250353060546
}
}
},
"_update_policy": {
"total": 5472.296269317274,
"count": 1387,
"self": 3599.156199294346,
"children": {
"TorchPOCAOptimizer.update": {
"total": 1873.1400700229278,
"count": 20805,
"self": 1873.1400700229278
}
}
}
}
}
}
},
"trainer_threads": {
"total": 7.199996616691351e-07,
"count": 1,
"self": 7.199996616691351e-07
},
"TrainerController._save_models": {
"total": 0.149110975995427,
"count": 1,
"self": 0.0018150979885831475,
"children": {
"RLTrainer._checkpoint": {
"total": 0.14729587800684385,
"count": 1,
"self": 0.14729587800684385
}
}
}
}
}
}
}