|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 2.9276041984558105, |
|
"min": 2.4052186012268066, |
|
"max": 3.2904653549194336, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 291074.125, |
|
"min": 238352.21875, |
|
"max": 387127.46875, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 209.0252100840336, |
|
"min": 209.0252100840336, |
|
"max": 999.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 99496.0, |
|
"min": 96476.0, |
|
"max": 103388.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1247.5067176617156, |
|
"min": 1191.821214563696, |
|
"max": 1247.5067176617156, |
|
"count": 97 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 291916.57193284144, |
|
"min": 2400.650068158895, |
|
"max": 291916.57193284144, |
|
"count": 97 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 4999609.0, |
|
"min": 49542.0, |
|
"max": 4999609.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 4999609.0, |
|
"min": 49542.0, |
|
"max": 4999609.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.03594151511788368, |
|
"min": -0.7357847094535828, |
|
"max": 0.025285867974162102, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -8.554080963134766, |
|
"min": -43.41129684448242, |
|
"max": 1.5930097103118896, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.03636329248547554, |
|
"min": -0.8936510682106018, |
|
"max": 0.017634503543376923, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -8.654463768005371, |
|
"min": -52.72541427612305, |
|
"max": 1.1109737157821655, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.10871008630184566, |
|
"min": -0.33413783843452866, |
|
"max": 0.13830344892781357, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -25.873000539839268, |
|
"min": -49.45240008831024, |
|
"max": 14.424399744719267, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.10871008630184566, |
|
"min": -0.33413783843452866, |
|
"max": 0.13830344892781357, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -25.873000539839268, |
|
"min": -49.45240008831024, |
|
"max": 14.424399744719267, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.015674322063245604, |
|
"min": 0.013229400619942074, |
|
"max": 0.020409159014040293, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.047022966189736816, |
|
"min": 0.026458801239884148, |
|
"max": 0.06077529178000987, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.03280250411480665, |
|
"min": 5.554975217592073e-07, |
|
"max": 2.004074016927431, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.09840751234441995, |
|
"min": 1.1109950435184146e-06, |
|
"max": 4.008148033854862, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.03239279271413883, |
|
"min": 5.764401040172136e-06, |
|
"max": 1.9272995501135788, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.09717837814241648, |
|
"min": 1.1528802080344273e-05, |
|
"max": 3.8545991002271576, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0009, |
|
"min": 0.0006, |
|
"max": 0.0009, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.6000000000000002, |
|
"min": 0.40000000000000013, |
|
"max": 0.6000000000000002, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.015000000000000003, |
|
"min": 0.010000000000000002, |
|
"max": 0.015000000000000003, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1684325861", |
|
"python_version": "3.9.16 (main, Mar 8 2023, 10:39:24) [MSC v.1916 64 bit (AMD64)]", |
|
"command_line_arguments": "C:\\Users\\Flooow\\.conda\\envs\\rl\\Scripts\\mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos-10M --no-graphics", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.0.1+cu117", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1684339219" |
|
}, |
|
"total": 13358.6668326, |
|
"count": 1, |
|
"self": 2.4185096000001067, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.38227429999999885, |
|
"count": 1, |
|
"self": 0.38227429999999885 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 13355.8660487, |
|
"count": 1, |
|
"self": 9.284362800175586, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 24.4538974000049, |
|
"count": 25, |
|
"self": 24.4538974000049 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 13321.34535139982, |
|
"count": 325072, |
|
"self": 10.613710400095442, |
|
"children": { |
|
"env_step": { |
|
"total": 9782.534153199958, |
|
"count": 325072, |
|
"self": 6388.8133864996325, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 3387.858826500375, |
|
"count": 325072, |
|
"self": 75.56248100037419, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 3312.296345500001, |
|
"count": 644422, |
|
"self": 3312.296345500001 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 5.861940199950787, |
|
"count": 325072, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 13320.95867869975, |
|
"count": 325072, |
|
"is_parallel": true, |
|
"self": 8095.300613399635, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.05063430000442537, |
|
"count": 50, |
|
"is_parallel": true, |
|
"self": 0.010809200011571818, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.03982509999285355, |
|
"count": 200, |
|
"is_parallel": true, |
|
"self": 0.03982509999285355 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 5225.60743100011, |
|
"count": 325072, |
|
"is_parallel": true, |
|
"self": 219.4212635013946, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 179.61969119948486, |
|
"count": 325072, |
|
"is_parallel": true, |
|
"self": 179.61969119948486 |
|
}, |
|
"communicator.exchange": { |
|
"total": 4111.38979529952, |
|
"count": 325072, |
|
"is_parallel": true, |
|
"self": 4111.38979529952 |
|
}, |
|
"steps_from_proto": { |
|
"total": 715.1766809997105, |
|
"count": 650144, |
|
"is_parallel": true, |
|
"self": 157.391692098381, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 557.7849889013295, |
|
"count": 2600576, |
|
"is_parallel": true, |
|
"self": 557.7849889013295 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 3528.1974877997654, |
|
"count": 325072, |
|
"self": 69.7983735997991, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 770.7547103999628, |
|
"count": 325072, |
|
"self": 764.2168591999585, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 6.537851200004297, |
|
"count": 10, |
|
"self": 6.537851200004297 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 2687.6444038000036, |
|
"count": 233, |
|
"self": 1091.2508814999412, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 1596.3935223000624, |
|
"count": 6990, |
|
"self": 1596.3935223000624 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.0000003385357559e-06, |
|
"count": 1, |
|
"self": 1.0000003385357559e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.7824361000002682, |
|
"count": 1, |
|
"self": 0.024627300001156982, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.7578087999991112, |
|
"count": 1, |
|
"self": 0.7578087999991112 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |