First Push

1ea5c05 about 1 year ago

20.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.8989752531051636,
	"min": 1.874920129776001,
	"max": 3.295649528503418,
	"count": 503
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 36703.39453125,
	"min": 23047.001953125,
	"max": 149144.125,
	"count": 503
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 60.7037037037037,
	"min": 45.76851851851852,
	"max": 999.0,
	"count": 503
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19668.0,
	"min": 12040.0,
	"max": 29340.0,
	"count": 503
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1535.159289799666,
	"min": 1193.3844646799969,
	"max": 1576.6173982585622,
	"count": 498
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 248695.8049475459,
	"min": 2391.885550734001,
	"max": 338869.84806884336,
	"count": 498
	},
	"SoccerTwos.Step.mean": {
	"value": 5029966.0,
	"min": 9686.0,
	"max": 5029966.0,
	"count": 503
	},
	"SoccerTwos.Step.sum": {
	"value": 5029966.0,
	"min": 9686.0,
	"max": 5029966.0,
	"count": 503
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.05807129666209221,
	"min": -0.0826704278588295,
	"max": 0.16211707890033722,
	"count": 503
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -9.349478721618652,
	"min": -14.384654998779297,
	"max": 31.450714111328125,
	"count": 503
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.05922158807516098,
	"min": -0.07887663692235947,
	"max": 0.16130302846431732,
	"count": 503
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -9.534675598144531,
	"min": -13.72453498840332,
	"max": 31.292787551879883,
	"count": 503
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 503
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 503
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.2695354034441598,
	"min": -0.5384615384615384,
	"max": 0.44134400367736815,
	"count": 503
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -43.395199954509735,
	"min": -52.89300036430359,
	"max": 73.22740012407303,
	"count": 503
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.2695354034441598,
	"min": -0.5384615384615384,
	"max": 0.44134400367736815,
	"count": 503
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -43.395199954509735,
	"min": -52.89300036430359,
	"max": 73.22740012407303,
	"count": 503
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 503
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 503
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.014789016257661084,
	"min": 0.011286390731887272,
	"max": 0.023933018437431505,
	"count": 242
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.014789016257661084,
	"min": 0.011286390731887272,
	"max": 0.023933018437431505,
	"count": 242
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10319915811220805,
	"min": 4.78353564782689e-05,
	"max": 0.11067347327868143,
	"count": 242
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10319915811220805,
	"min": 4.78353564782689e-05,
	"max": 0.11067347327868143,
	"count": 242
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10465494121114413,
	"min": 4.857856535333364e-05,
	"max": 0.11234949777523677,
	"count": 242
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10465494121114413,
	"min": 4.857856535333364e-05,
	"max": 0.11234949777523677,
	"count": 242
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 242
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 242
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 242
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 242
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 242
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 242
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1688640495",
	"python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1688651519"
	},
	"total": 11024.467642585001,
	"count": 1,
	"self": 0.429065709000497,
	"children": {
	"run_training.setup": {
	"total": 0.0402406199999632,
	"count": 1,
	"self": 0.0402406199999632
	},
	"TrainerController.start_learning": {
	"total": 11023.998336256001,
	"count": 1,
	"self": 7.7194901102848235,
	"children": {
	"TrainerController._reset_env": {
	"total": 5.000056976002384,
	"count": 26,
	"self": 5.000056976002384
	},
	"TrainerController.advance": {
	"total": 11011.274762366715,
	"count": 343453,
	"self": 8.134539232027237,
	"children": {
	"env_step": {
	"total": 8407.070216991939,
	"count": 343453,
	"self": 6689.892364141599,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1712.5903909562267,
	"count": 343453,
	"self": 52.48040861892514,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1660.1099823373015,
	"count": 634724,
	"self": 1660.1099823373015
	}
	}
	},
	"workers": {
	"total": 4.587461894113403,
	"count": 343452,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 11004.388166637087,
	"count": 343452,
	"is_parallel": true,
	"self": 5317.457861080138,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.006125395000026401,
	"count": 2,
	"is_parallel": true,
	"self": 0.0038241940001171315,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0023012009999092697,
	"count": 8,
	"is_parallel": true,
	"self": 0.0023012009999092697
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.0403233069999942,
	"count": 1,
	"is_parallel": true,
	"self": 0.001106886000002305,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0009362990000454374,
	"count": 1,
	"is_parallel": true,
	"self": 0.0009362990000454374
	},
	"communicator.exchange": {
	"total": 0.034861199000033594,
	"count": 1,
	"is_parallel": true,
	"self": 0.034861199000033594
	},
	"steps_from_proto": {
	"total": 0.0034189229999128656,
	"count": 2,
	"is_parallel": true,
	"self": 0.0006124419999196107,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002806480999993255,
	"count": 8,
	"is_parallel": true,
	"self": 0.002806480999993255
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 5686.8759192669495,
	"count": 343451,
	"is_parallel": true,
	"self": 348.9488778605137,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 217.02216981993251,
	"count": 343451,
	"is_parallel": true,
	"self": 217.02216981993251
	},
	"communicator.exchange": {
	"total": 4029.27468528195,
	"count": 343451,
	"is_parallel": true,
	"self": 4029.27468528195
	},
	"steps_from_proto": {
	"total": 1091.6301863045542,
	"count": 686902,
	"is_parallel": true,
	"self": 183.29490319546403,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 908.3352831090901,
	"count": 2747608,
	"is_parallel": true,
	"self": 908.3352831090901
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.054386289999797555,
	"count": 50,
	"is_parallel": true,
	"self": 0.009579804985264673,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.04480648501453288,
	"count": 200,
	"is_parallel": true,
	"self": 0.04480648501453288
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 2596.070006142748,
	"count": 343452,
	"self": 64.25883360140915,
	"children": {
	"process_trajectory": {
	"total": 946.7535668233348,
	"count": 343452,
	"self": 943.8542154893336,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.899351334001267,
	"count": 10,
	"self": 2.899351334001267
	}
	}
	},
	"_update_policy": {
	"total": 1585.0576057180037,
	"count": 242,
	"self": 1003.065424554992,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 581.9921811630118,
	"count": 7260,
	"self": 581.9921811630118
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.1899992387043312e-06,
	"count": 1,
	"self": 1.1899992387043312e-06
	},
	"TrainerController._save_models": {
	"total": 0.004025612999612349,
	"count": 1,
	"self": 4.299700049159583e-05,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.003982615999120753,
	"count": 1,
	"self": 0.003982615999120753
	}
	}
	}
	}
	}
	}
	}