|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 3.2010748386383057, |
|
"min": 3.125300407409668, |
|
"max": 3.2930920124053955, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 307303.1875, |
|
"min": 282047.6875, |
|
"max": 380839.5, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 911.4814814814815, |
|
"min": 597.609756097561, |
|
"max": 997.12, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 98440.0, |
|
"min": 97228.0, |
|
"max": 103384.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1197.9982579271607, |
|
"min": 1195.9461036196167, |
|
"max": 1221.9759648492238, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 7187.989547562964, |
|
"min": 4815.290022352901, |
|
"max": 67659.85144552909, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 4999006.0, |
|
"min": 49298.0, |
|
"max": 4999006.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 4999006.0, |
|
"min": 49298.0, |
|
"max": 4999006.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.005989752244204283, |
|
"min": -0.020525911822915077, |
|
"max": 0.087294802069664, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -0.3234466314315796, |
|
"min": -1.4622992277145386, |
|
"max": 5.412277698516846, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.006024852395057678, |
|
"min": -0.02027856558561325, |
|
"max": 0.08779024332761765, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -0.3253420293331146, |
|
"min": -1.46644926071167, |
|
"max": 5.442995071411133, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.014903702117778637, |
|
"min": -0.3030208965290838, |
|
"max": 0.1328193553453011, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 0.8047999143600464, |
|
"min": -20.302400067448616, |
|
"max": 8.234800031408668, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.014903702117778637, |
|
"min": -0.3030208965290838, |
|
"max": 0.1328193553453011, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 0.8047999143600464, |
|
"min": -20.302400067448616, |
|
"max": 8.234800031408668, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.017588941159192475, |
|
"min": 0.01358264352408393, |
|
"max": 0.022225120673020782, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.03517788231838495, |
|
"min": 0.02716528704816786, |
|
"max": 0.06667536201906235, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 1.032043584814346e-06, |
|
"min": 1.032043584814346e-06, |
|
"max": 0.0063071357435546815, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 2.064087169628692e-06, |
|
"min": 2.064087169628692e-06, |
|
"max": 0.01644136217655614, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 1.0190511574137418e-06, |
|
"min": 1.0190511574137418e-06, |
|
"max": 0.006349796561213831, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 2.0381023148274836e-06, |
|
"min": 2.0381023148274836e-06, |
|
"max": 0.01644182266124214, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0005000000000000001, |
|
"min": 0.0005000000000000001, |
|
"max": 0.0005000000000000001, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0010000000000000002, |
|
"min": 0.0010000000000000002, |
|
"max": 0.0015000000000000005, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.40000000000000013, |
|
"min": 0.40000000000000013, |
|
"max": 0.6000000000000002, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.010000000000000002, |
|
"min": 0.010000000000000002, |
|
"max": 0.015000000000000003, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1685981895", |
|
"python_version": "3.10.6 (main, Mar 10 2023, 10:55:28) [GCC 11.3.0]", |
|
"command_line_arguments": "/home/jordi.casalsg@local.eurecat.org/Projects/huggingface_rl_course/.venv/bin/mlagents-learn ml-agents/config/poca/SoccerTwos.yaml --env=ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1685991256" |
|
}, |
|
"total": 9360.728360399, |
|
"count": 1, |
|
"self": 0.2698277909985336, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.009219612999913807, |
|
"count": 1, |
|
"self": 0.009219612999913807 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 9360.449312995, |
|
"count": 1, |
|
"self": 6.83880282789687, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.395111159999942, |
|
"count": 20, |
|
"self": 2.395111159999942 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 9351.069702443105, |
|
"count": 322600, |
|
"self": 6.7799339637513185, |
|
"children": { |
|
"env_step": { |
|
"total": 5966.13806850438, |
|
"count": 322600, |
|
"self": 5015.16742263604, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 946.5662092797893, |
|
"count": 322600, |
|
"self": 40.277690839007846, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 906.2885184407814, |
|
"count": 640360, |
|
"self": 906.2885184407814 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 4.4044365885501975, |
|
"count": 322600, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 9350.874216507473, |
|
"count": 322600, |
|
"is_parallel": true, |
|
"self": 5168.509147819968, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.001656623000599211, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0003833420005321386, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0012732810000670725, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0012732810000670725 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.018593669999972917, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004340109999247943, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00042529999973339727, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00042529999973339727 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.016364310999961162, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.016364310999961162 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0013700480003535631, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.00027673399836203316, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.00109331400199153, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.00109331400199153 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 4182.324120445506, |
|
"count": 322599, |
|
"is_parallel": true, |
|
"self": 226.06505653365912, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 182.2265820848761, |
|
"count": 322599, |
|
"is_parallel": true, |
|
"self": 182.2265820848761 |
|
}, |
|
"communicator.exchange": { |
|
"total": 3018.4676932755547, |
|
"count": 322599, |
|
"is_parallel": true, |
|
"self": 3018.4676932755547 |
|
}, |
|
"steps_from_proto": { |
|
"total": 755.5647885514163, |
|
"count": 645198, |
|
"is_parallel": true, |
|
"self": 140.88628420069745, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 614.6785043507189, |
|
"count": 2580792, |
|
"is_parallel": true, |
|
"self": 614.6785043507189 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.040948241998194135, |
|
"count": 38, |
|
"is_parallel": true, |
|
"self": 0.008140299991282518, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.03280794200691162, |
|
"count": 152, |
|
"is_parallel": true, |
|
"self": 0.03280794200691162 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 3378.151699974973, |
|
"count": 322600, |
|
"self": 52.74593217319125, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 504.36863245177483, |
|
"count": 322600, |
|
"self": 502.78837369577377, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 1.580258756001058, |
|
"count": 10, |
|
"self": 1.580258756001058 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 2821.037135350007, |
|
"count": 232, |
|
"self": 693.2836983750385, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 2127.7534369749683, |
|
"count": 6969, |
|
"self": 2127.7534369749683 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 8.150018402375281e-07, |
|
"count": 1, |
|
"self": 8.150018402375281e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.14569574899724103, |
|
"count": 1, |
|
"self": 0.0010777259994938504, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.14461802299774718, |
|
"count": 1, |
|
"self": 0.14461802299774718 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |