poca-SoccerTwos / run_logs /timers.json
jcnecio's picture
First Push
fd9458b
raw
history blame
20.1 kB
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 2.742280960083008,
"min": 2.6674821376800537,
"max": 3.295766830444336,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 58706.75,
"min": 14465.828125,
"max": 123279.390625,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 999.0,
"min": 471.9166666666667,
"max": 999.0,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19980.0,
"min": 8100.0,
"max": 27820.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1186.4485299524047,
"min": 1185.6992495082593,
"max": 1202.8828671100055,
"count": 265
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 2372.8970599048093,
"min": 2371.3984990165186,
"max": 14376.966472411987,
"count": 265
},
"SoccerTwos.Step.mean": {
"value": 4999230.0,
"min": 9810.0,
"max": 4999230.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 4999230.0,
"min": 9810.0,
"max": 4999230.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.0014187560882419348,
"min": -0.05105555057525635,
"max": 0.017309702932834625,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.014187561348080635,
"min": -0.7147754430770874,
"max": 0.29426494240760803,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.0010586295975372195,
"min": -0.05101824924349785,
"max": 0.028445616364479065,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.010586296208202839,
"min": -0.7142555117607117,
"max": 0.3413473963737488,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.0,
"min": -0.5505882343825172,
"max": 0.2721428530556815,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 0.0,
"min": -9.359999984502792,
"max": 3.809999942779541,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.0,
"min": -0.5505882343825172,
"max": 0.2721428530556815,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 0.0,
"min": -9.359999984502792,
"max": 3.809999942779541,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.015296474660378106,
"min": 0.01056568751616093,
"max": 0.024043762955504158,
"count": 230
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.015296474660378106,
"min": 0.01056568751616093,
"max": 0.024043762955504158,
"count": 230
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.000789181159537596,
"min": 1.0932025655089698e-08,
"max": 0.006812173780053854,
"count": 230
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.000789181159537596,
"min": 1.0932025655089698e-08,
"max": 0.006812173780053854,
"count": 230
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.0007970635478462403,
"min": 1.8385839517520708e-08,
"max": 0.00682806756036977,
"count": 230
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.0007970635478462403,
"min": 1.8385839517520708e-08,
"max": 0.00682806756036977,
"count": 230
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 230
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 230
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 230
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 230
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 230
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 230
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1687184424",
"python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu113",
"numpy_version": "1.21.2",
"end_time_seconds": "1687191992"
},
"total": 7567.887915133999,
"count": 1,
"self": 0.5864291879988741,
"children": {
"run_training.setup": {
"total": 0.024859550999735802,
"count": 1,
"self": 0.024859550999735802
},
"TrainerController.start_learning": {
"total": 7567.276626395001,
"count": 1,
"self": 5.294599101051972,
"children": {
"TrainerController._reset_env": {
"total": 10.024710350998703,
"count": 25,
"self": 10.024710350998703
},
"TrainerController.advance": {
"total": 7551.59609919995,
"count": 325166,
"self": 4.93967696013442,
"children": {
"env_step": {
"total": 5984.00752947861,
"count": 325166,
"self": 3709.9503396504083,
"children": {
"SubprocessEnvManager._take_step": {
"total": 2270.194662567987,
"count": 325166,
"self": 32.29232111299052,
"children": {
"TorchPolicy.evaluate": {
"total": 2237.9023414549965,
"count": 645734,
"self": 2237.9023414549965
}
}
},
"workers": {
"total": 3.862527260214847,
"count": 325166,
"self": 0.0,
"children": {
"worker_root": {
"total": 7553.082217968909,
"count": 325166,
"is_parallel": true,
"self": 4435.193045014867,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.003049627000109467,
"count": 2,
"is_parallel": true,
"self": 0.0009371020009893982,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.002112524999120069,
"count": 8,
"is_parallel": true,
"self": 0.002112524999120069
}
}
},
"UnityEnvironment.step": {
"total": 0.019160173000273062,
"count": 1,
"is_parallel": true,
"self": 0.0002981419997922785,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0003540580000844784,
"count": 1,
"is_parallel": true,
"self": 0.0003540580000844784
},
"communicator.exchange": {
"total": 0.0176085759999296,
"count": 1,
"is_parallel": true,
"self": 0.0176085759999296
},
"steps_from_proto": {
"total": 0.0008993970004667062,
"count": 2,
"is_parallel": true,
"self": 0.00020164799980193493,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0006977490006647713,
"count": 8,
"is_parallel": true,
"self": 0.0006977490006647713
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 3117.8669260360434,
"count": 325165,
"is_parallel": true,
"self": 93.6686693062502,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 59.86260627917227,
"count": 325165,
"is_parallel": true,
"self": 59.86260627917227
},
"communicator.exchange": {
"total": 2689.9867284767593,
"count": 325165,
"is_parallel": true,
"self": 2689.9867284767593
},
"steps_from_proto": {
"total": 274.3489219738617,
"count": 650330,
"is_parallel": true,
"self": 57.017932745248345,
"children": {
"_process_rank_one_or_two_observation": {
"total": 217.33098922861336,
"count": 2601320,
"is_parallel": true,
"self": 217.33098922861336
}
}
}
}
},
"steps_from_proto": {
"total": 0.02224691799892753,
"count": 48,
"is_parallel": true,
"self": 0.004810555998119526,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.017436362000808003,
"count": 192,
"is_parallel": true,
"self": 0.017436362000808003
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1562.6488927612058,
"count": 325166,
"self": 62.0224092779963,
"children": {
"process_trajectory": {
"total": 566.227498354217,
"count": 325166,
"self": 562.7573808262159,
"children": {
"RLTrainer._checkpoint": {
"total": 3.470117528001083,
"count": 10,
"self": 3.470117528001083
}
}
},
"_update_policy": {
"total": 934.3989851289925,
"count": 230,
"self": 501.877379921998,
"children": {
"TorchPOCAOptimizer.update": {
"total": 432.52160520699454,
"count": 6909,
"self": 432.52160520699454
}
}
}
}
}
}
},
"trainer_threads": {
"total": 5.990004865452647e-07,
"count": 1,
"self": 5.990004865452647e-07
},
"TrainerController._save_models": {
"total": 0.36121714399996563,
"count": 1,
"self": 0.039050487999702455,
"children": {
"RLTrainer._checkpoint": {
"total": 0.3221666560002632,
"count": 1,
"self": 0.3221666560002632
}
}
}
}
}
}
}