JuneV's picture
First Push`
266851f
raw
history blame contribute delete
No virus
15.6 kB
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 2.101550817489624,
"min": 2.0928046703338623,
"max": 3.2957100868225098,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 41493.01953125,
"min": 26863.70703125,
"max": 149262.984375,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 48.54545454545455,
"min": 40.601694915254235,
"max": 999.0,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19224.0,
"min": 15016.0,
"max": 27340.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1509.5384765334704,
"min": 1199.6849224996595,
"max": 1509.5384765334704,
"count": 455
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 298888.61835362716,
"min": 2399.8665656259614,
"max": 352915.36676651496,
"count": 455
},
"SoccerTwos.Step.mean": {
"value": 4999942.0,
"min": 9688.0,
"max": 4999942.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 4999942.0,
"min": 9688.0,
"max": 4999942.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.04167698323726654,
"min": -0.08756899833679199,
"max": 0.17874084413051605,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 8.252042770385742,
"min": -17.601367950439453,
"max": 29.46053695678711,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.041709285229444504,
"min": -0.091096431016922,
"max": 0.18130771815776825,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 8.258438110351562,
"min": -18.310382843017578,
"max": 30.195301055908203,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.08331515150840836,
"min": -0.5126210542297677,
"max": 0.49391250126063824,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 16.496399998664856,
"min": -46.68359994888306,
"max": 55.72399973869324,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.08331515150840836,
"min": -0.5126210542297677,
"max": 0.49391250126063824,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 16.496399998664856,
"min": -46.68359994888306,
"max": 55.72399973869324,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01637880486669019,
"min": 0.010827948125855377,
"max": 0.02561439787192891,
"count": 237
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01637880486669019,
"min": 0.010827948125855377,
"max": 0.02561439787192891,
"count": 237
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.09951823924978574,
"min": 1.838042171584675e-05,
"max": 0.11822265212734541,
"count": 237
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.09951823924978574,
"min": 1.838042171584675e-05,
"max": 0.11822265212734541,
"count": 237
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10291063313682874,
"min": 1.8114200580991262e-05,
"max": 0.12203358734647433,
"count": 237
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10291063313682874,
"min": 1.8114200580991262e-05,
"max": 0.12203358734647433,
"count": 237
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 237
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 237
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 237
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 237
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 237
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 237
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1700139533",
"python_version": "3.10.7 (tags/v3.10.7:6cc6b13, Sep 5 2022, 14:08:36) [MSC v.1933 64 bit (AMD64)]",
"command_line_arguments": "\\\\?\\C:\\Users\\lecom\\OneDrive\\Bureau\\unit7\\myenv\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.1.1+cpu",
"numpy_version": "1.23.5",
"end_time_seconds": "1700156926"
},
"total": 17393.02601479995,
"count": 1,
"self": 2.814582899911329,
"children": {
"run_training.setup": {
"total": 0.12561729992739856,
"count": 1,
"self": 0.12561729992739856
},
"TrainerController.start_learning": {
"total": 17390.085814600112,
"count": 1,
"self": 9.584603649331257,
"children": {
"TrainerController._reset_env": {
"total": 33.72335370001383,
"count": 25,
"self": 33.72335370001383
},
"TrainerController.advance": {
"total": 17346.615686350735,
"count": 335460,
"self": 9.713295564521104,
"children": {
"env_step": {
"total": 7467.404956086306,
"count": 335460,
"self": 5772.600437084911,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1688.5649934096728,
"count": 335460,
"self": 57.244869445450604,
"children": {
"TorchPolicy.evaluate": {
"total": 1631.3201239642221,
"count": 638264,
"self": 1631.3201239642221
}
}
},
"workers": {
"total": 6.239525591721758,
"count": 335460,
"self": 0.0,
"children": {
"worker_root": {
"total": 17344.003261046717,
"count": 335460,
"is_parallel": true,
"self": 12703.095018838532,
"children": {
"steps_from_proto": {
"total": 0.0538211006205529,
"count": 50,
"is_parallel": true,
"self": 0.010383699787780643,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.043437400832772255,
"count": 200,
"is_parallel": true,
"self": 0.043437400832772255
}
}
},
"UnityEnvironment.step": {
"total": 4640.854421107564,
"count": 335460,
"is_parallel": true,
"self": 253.85978173161857,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 197.41559677710757,
"count": 335460,
"is_parallel": true,
"self": 197.41559677710757
},
"communicator.exchange": {
"total": 3415.724447012879,
"count": 335460,
"is_parallel": true,
"self": 3415.724447012879
},
"steps_from_proto": {
"total": 773.854595585959,
"count": 670920,
"is_parallel": true,
"self": 145.52071978128515,
"children": {
"_process_rank_one_or_two_observation": {
"total": 628.3338758046739,
"count": 2683680,
"is_parallel": true,
"self": 628.3338758046739
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 9869.497434699908,
"count": 335460,
"self": 71.63206536625512,
"children": {
"process_trajectory": {
"total": 1440.7136191353202,
"count": 335460,
"self": 1438.7640956351534,
"children": {
"RLTrainer._checkpoint": {
"total": 1.9495235001668334,
"count": 10,
"self": 1.9495235001668334
}
}
},
"_update_policy": {
"total": 8357.151750198333,
"count": 237,
"self": 798.1456429066602,
"children": {
"TorchPOCAOptimizer.update": {
"total": 7559.006107291672,
"count": 7110,
"self": 7559.006107291672
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.00006091594696e-07,
"count": 1,
"self": 8.00006091594696e-07
},
"TrainerController._save_models": {
"total": 0.16217010002583265,
"count": 1,
"self": 0.011222600005567074,
"children": {
"RLTrainer._checkpoint": {
"total": 0.15094750002026558,
"count": 1,
"self": 0.15094750002026558
}
}
}
}
}
}
}