NoNameFound's picture
First Push
984ffc4
raw
history blame contribute delete
No virus
15.6 kB
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.8765040636062622,
"min": 1.7863812446594238,
"max": 3.2957403659820557,
"count": 1000
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 38130.5625,
"min": 26096.654296875,
"max": 124687.453125,
"count": 1000
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 56.81395348837209,
"min": 40.834782608695654,
"max": 999.0,
"count": 1000
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19544.0,
"min": 7524.0,
"max": 31968.0,
"count": 1000
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1708.697937470418,
"min": 1193.9183309788523,
"max": 1729.712270819381,
"count": 977
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 293896.0452449119,
"min": 2388.7747462231155,
"max": 409305.8691895164,
"count": 977
},
"SoccerTwos.Step.mean": {
"value": 9999972.0,
"min": 9522.0,
"max": 9999972.0,
"count": 1000
},
"SoccerTwos.Step.sum": {
"value": 9999972.0,
"min": 9522.0,
"max": 9999972.0,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.018940679728984833,
"min": -0.13247385621070862,
"max": 0.1722002923488617,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -3.2577970027923584,
"min": -31.263830184936523,
"max": 27.035446166992188,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.016107002273201942,
"min": -0.13530893623828888,
"max": 0.1711462438106537,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -2.77040433883667,
"min": -31.93290901184082,
"max": 26.86996078491211,
"count": 1000
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 1000
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.1569639527520468,
"min": -0.5523571435894284,
"max": 0.5504761849130902,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -26.99779987335205,
"min": -63.495600044727325,
"max": 68.06360018253326,
"count": 1000
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.1569639527520468,
"min": -0.5523571435894284,
"max": 0.5504761849130902,
"count": 1000
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -26.99779987335205,
"min": -63.495600044727325,
"max": 68.06360018253326,
"count": 1000
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 1000
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 1000
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01596075825897666,
"min": 0.009748829703312367,
"max": 0.02528138120736306,
"count": 482
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01596075825897666,
"min": 0.009748829703312367,
"max": 0.02528138120736306,
"count": 482
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.11302952369054159,
"min": 1.8284332175729407e-05,
"max": 0.12636658623814584,
"count": 482
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.11302952369054159,
"min": 1.8284332175729407e-05,
"max": 0.12636658623814584,
"count": 482
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.11423842584093412,
"min": 2.9556284274197728e-05,
"max": 0.12823313375314077,
"count": 482
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.11423842584093412,
"min": 2.9556284274197728e-05,
"max": 0.12823313375314077,
"count": 482
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 482
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 482
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 482
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 482
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 482
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 482
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1676205365",
"python_version": "3.8.16 (default, Jan 17 2023, 22:25:28) [MSC v.1916 64 bit (AMD64)]",
"command_line_arguments": "C:\\Users\\Kaush\\miniconda3\\envs\\rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=pocatrainergoal2 --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.13.1+cu117",
"numpy_version": "1.21.2",
"end_time_seconds": "1676224341"
},
"total": 18975.6975353,
"count": 1,
"self": 0.4365185000024212,
"children": {
"run_training.setup": {
"total": 0.10058610000000012,
"count": 1,
"self": 0.10058610000000012
},
"TrainerController.start_learning": {
"total": 18975.160430699998,
"count": 1,
"self": 16.110423399986757,
"children": {
"TrainerController._reset_env": {
"total": 7.637262500006049,
"count": 50,
"self": 7.637262500006049
},
"TrainerController.advance": {
"total": 18951.275029000004,
"count": 687399,
"self": 15.667838597910304,
"children": {
"env_step": {
"total": 13553.667134001029,
"count": 687399,
"self": 8593.320714800799,
"children": {
"SubprocessEnvManager._take_step": {
"total": 4950.316458399658,
"count": 687399,
"self": 88.2371188992447,
"children": {
"TorchPolicy.evaluate": {
"total": 4862.079339500413,
"count": 1259946,
"self": 4862.079339500413
}
}
},
"workers": {
"total": 10.02996080057262,
"count": 687399,
"self": 0.0,
"children": {
"worker_root": {
"total": 18951.255278000794,
"count": 687399,
"is_parallel": true,
"self": 12080.557430200377,
"children": {
"steps_from_proto": {
"total": 0.08635440000356454,
"count": 100,
"is_parallel": true,
"self": 0.019513299986659405,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.06684110001690513,
"count": 400,
"is_parallel": true,
"self": 0.06684110001690513
}
}
},
"UnityEnvironment.step": {
"total": 6870.611493400413,
"count": 687399,
"is_parallel": true,
"self": 299.2152722992032,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 302.0881656994367,
"count": 687399,
"is_parallel": true,
"self": 302.0881656994367
},
"communicator.exchange": {
"total": 5328.05041159995,
"count": 687399,
"is_parallel": true,
"self": 5328.05041159995
},
"steps_from_proto": {
"total": 941.2576438018222,
"count": 1374798,
"is_parallel": true,
"self": 204.96093240318282,
"children": {
"_process_rank_one_or_two_observation": {
"total": 736.2967113986393,
"count": 5499192,
"is_parallel": true,
"self": 736.2967113986393
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 5381.940056401063,
"count": 687399,
"self": 106.62313190166333,
"children": {
"process_trajectory": {
"total": 2449.901281399413,
"count": 687399,
"self": 2446.799516599416,
"children": {
"RLTrainer._checkpoint": {
"total": 3.101764799996772,
"count": 20,
"self": 3.101764799996772
}
}
},
"_update_policy": {
"total": 2825.4156430999865,
"count": 482,
"self": 1816.062887099934,
"children": {
"TorchPOCAOptimizer.update": {
"total": 1009.3527560000525,
"count": 14469,
"self": 1009.3527560000525
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.0000003385357559e-06,
"count": 1,
"self": 1.0000003385357559e-06
},
"TrainerController._save_models": {
"total": 0.1377147999992303,
"count": 1,
"self": 0.0013646000006701797,
"children": {
"RLTrainer._checkpoint": {
"total": 0.13635019999856013,
"count": 1,
"self": 0.13635019999856013
}
}
}
}
}
}
}