First Push`

266851f 11 months ago

No virus

15.6 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.101550817489624,
	"min": 2.0928046703338623,
	"max": 3.2957100868225098,
	"count": 500
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 41493.01953125,
	"min": 26863.70703125,
	"max": 149262.984375,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 48.54545454545455,
	"min": 40.601694915254235,
	"max": 999.0,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19224.0,
	"min": 15016.0,
	"max": 27340.0,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1509.5384765334704,
	"min": 1199.6849224996595,
	"max": 1509.5384765334704,
	"count": 455
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 298888.61835362716,
	"min": 2399.8665656259614,
	"max": 352915.36676651496,
	"count": 455
	},
	"SoccerTwos.Step.mean": {
	"value": 4999942.0,
	"min": 9688.0,
	"max": 4999942.0,
	"count": 500
	},
	"SoccerTwos.Step.sum": {
	"value": 4999942.0,
	"min": 9688.0,
	"max": 4999942.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.04167698323726654,
	"min": -0.08756899833679199,
	"max": 0.17874084413051605,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 8.252042770385742,
	"min": -17.601367950439453,
	"max": 29.46053695678711,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.041709285229444504,
	"min": -0.091096431016922,
	"max": 0.18130771815776825,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 8.258438110351562,
	"min": -18.310382843017578,
	"max": 30.195301055908203,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.08331515150840836,
	"min": -0.5126210542297677,
	"max": 0.49391250126063824,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 16.496399998664856,
	"min": -46.68359994888306,
	"max": 55.72399973869324,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.08331515150840836,
	"min": -0.5126210542297677,
	"max": 0.49391250126063824,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 16.496399998664856,
	"min": -46.68359994888306,
	"max": 55.72399973869324,
	"count": 500
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01637880486669019,
	"min": 0.010827948125855377,
	"max": 0.02561439787192891,
	"count": 237
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01637880486669019,
	"min": 0.010827948125855377,
	"max": 0.02561439787192891,
	"count": 237
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.09951823924978574,
	"min": 1.838042171584675e-05,
	"max": 0.11822265212734541,
	"count": 237
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.09951823924978574,
	"min": 1.838042171584675e-05,
	"max": 0.11822265212734541,
	"count": 237
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10291063313682874,
	"min": 1.8114200580991262e-05,
	"max": 0.12203358734647433,
	"count": 237
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10291063313682874,
	"min": 1.8114200580991262e-05,
	"max": 0.12203358734647433,
	"count": 237
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 237
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 237
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 237
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 237
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 237
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 237
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1700139533",
	"python_version": "3.10.7 (tags/v3.10.7:6cc6b13, Sep 5 2022, 14:08:36) [MSC v.1933 64 bit (AMD64)]",
	"command_line_arguments": "\\\\?\\C:\\Users\\lecom\\OneDrive\\Bureau\\unit7\\myenv\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.1.1+cpu",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1700156926"
	},
	"total": 17393.02601479995,
	"count": 1,
	"self": 2.814582899911329,
	"children": {
	"run_training.setup": {
	"total": 0.12561729992739856,
	"count": 1,
	"self": 0.12561729992739856
	},
	"TrainerController.start_learning": {
	"total": 17390.085814600112,
	"count": 1,
	"self": 9.584603649331257,
	"children": {
	"TrainerController._reset_env": {
	"total": 33.72335370001383,
	"count": 25,
	"self": 33.72335370001383
	},
	"TrainerController.advance": {
	"total": 17346.615686350735,
	"count": 335460,
	"self": 9.713295564521104,
	"children": {
	"env_step": {
	"total": 7467.404956086306,
	"count": 335460,
	"self": 5772.600437084911,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1688.5649934096728,
	"count": 335460,
	"self": 57.244869445450604,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1631.3201239642221,
	"count": 638264,
	"self": 1631.3201239642221
	}
	}
	},
	"workers": {
	"total": 6.239525591721758,
	"count": 335460,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 17344.003261046717,
	"count": 335460,
	"is_parallel": true,
	"self": 12703.095018838532,
	"children": {
	"steps_from_proto": {
	"total": 0.0538211006205529,
	"count": 50,
	"is_parallel": true,
	"self": 0.010383699787780643,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.043437400832772255,
	"count": 200,
	"is_parallel": true,
	"self": 0.043437400832772255
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 4640.854421107564,
	"count": 335460,
	"is_parallel": true,
	"self": 253.85978173161857,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 197.41559677710757,
	"count": 335460,
	"is_parallel": true,
	"self": 197.41559677710757
	},
	"communicator.exchange": {
	"total": 3415.724447012879,
	"count": 335460,
	"is_parallel": true,
	"self": 3415.724447012879
	},
	"steps_from_proto": {
	"total": 773.854595585959,
	"count": 670920,
	"is_parallel": true,
	"self": 145.52071978128515,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 628.3338758046739,
	"count": 2683680,
	"is_parallel": true,
	"self": 628.3338758046739
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 9869.497434699908,
	"count": 335460,
	"self": 71.63206536625512,
	"children": {
	"process_trajectory": {
	"total": 1440.7136191353202,
	"count": 335460,
	"self": 1438.7640956351534,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.9495235001668334,
	"count": 10,
	"self": 1.9495235001668334
	}
	}
	},
	"_update_policy": {
	"total": 8357.151750198333,
	"count": 237,
	"self": 798.1456429066602,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 7559.006107291672,
	"count": 7110,
	"self": 7559.006107291672
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.00006091594696e-07,
	"count": 1,
	"self": 8.00006091594696e-07
	},
	"TrainerController._save_models": {
	"total": 0.16217010002583265,
	"count": 1,
	"self": 0.011222600005567074,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.15094750002026558,
	"count": 1,
	"self": 0.15094750002026558
	}
	}
	}
	}
	}
	}
	}