ppo-Pyramids / run_logs /timers.json
Jingwenwang's picture
First Push
610a335 verified
raw
history blame contribute delete
No virus
18.7 kB
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.7123656868934631,
"min": 0.6570796370506287,
"max": 1.428212285041809,
"count": 16
},
"Pyramids.Policy.Entropy.sum": {
"value": 21462.154296875,
"min": 19592.73828125,
"max": 43326.24609375,
"count": 16
},
"Pyramids.Step.mean": {
"value": 479926.0,
"min": 29975.0,
"max": 479926.0,
"count": 16
},
"Pyramids.Step.sum": {
"value": 479926.0,
"min": 29975.0,
"max": 479926.0,
"count": 16
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.08970457315444946,
"min": -0.09704577177762985,
"max": 0.08970457315444946,
"count": 16
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 22.246734619140625,
"min": -23.290985107421875,
"max": 22.246734619140625,
"count": 16
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.011859128251671791,
"min": 0.007869926281273365,
"max": 0.3850874602794647,
"count": 16
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 2.94106388092041,
"min": 1.904522180557251,
"max": 91.65081787109375,
"count": 16
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.066041112951805,
"min": 0.06540364939514,
"max": 0.07304739349894909,
"count": 16
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9245755813252698,
"min": 0.5493568023939963,
"max": 1.0620316853061975,
"count": 16
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.00849363308773877,
"min": 0.0010521916522333481,
"max": 0.00849363308773877,
"count": 16
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.11891086322834277,
"min": 0.009469724870100133,
"max": 0.11891086322834277,
"count": 16
},
"Pyramids.Policy.LearningRate.mean": {
"value": 2.1158192947300003e-05,
"min": 2.1158192947300003e-05,
"max": 0.00029001517832827497,
"count": 16
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00029621470126220005,
"min": 0.00029621470126220005,
"max": 0.00285423034859,
"count": 16
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10705270000000001,
"min": 0.10705270000000001,
"max": 0.19667172500000002,
"count": 16
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4987378000000002,
"min": 1.4987378000000002,
"max": 2.3386889999999996,
"count": 16
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0007145647300000002,
"min": 0.0007145647300000002,
"max": 0.0096675053275,
"count": 16
},
"Pyramids.Policy.Beta.sum": {
"value": 0.010003906220000002,
"min": 0.010003906220000002,
"max": 0.095175859,
"count": 16
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.01774653047323227,
"min": 0.017288541421294212,
"max": 0.3124820590019226,
"count": 16
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.24845142662525177,
"min": 0.24203957617282867,
"max": 2.499856472015381,
"count": 16
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 802.1621621621622,
"min": 802.1621621621622,
"max": 999.0,
"count": 16
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29680.0,
"min": 16261.0,
"max": 32296.0,
"count": 16
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 0.3867891382526707,
"min": -0.999987552408129,
"max": 0.3867891382526707,
"count": 16
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 14.311198115348816,
"min": -31.999601677060127,
"max": 14.311198115348816,
"count": 16
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 0.3867891382526707,
"min": -0.999987552408129,
"max": 0.3867891382526707,
"count": 16
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 14.311198115348816,
"min": -31.999601677060127,
"max": 14.311198115348816,
"count": 16
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.14845000534960245,
"min": 0.14590737862965544,
"max": 5.863223752213849,
"count": 16
},
"Pyramids.Policy.RndReward.sum": {
"value": 5.492650197935291,
"min": 5.398573009297252,
"max": 105.53802753984928,
"count": 16
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 16
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 16
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1714871472",
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=PyramidsTraining --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.2.1+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1714872500"
},
"total": 1028.622528084,
"count": 1,
"self": 0.8875892680000561,
"children": {
"run_training.setup": {
"total": 0.05201031299998249,
"count": 1,
"self": 0.05201031299998249
},
"TrainerController.start_learning": {
"total": 1027.6829285029999,
"count": 1,
"self": 0.685191689992962,
"children": {
"TrainerController._reset_env": {
"total": 2.4036292729999786,
"count": 1,
"self": 2.4036292729999786
},
"TrainerController.advance": {
"total": 1024.466851615007,
"count": 31565,
"self": 0.739460445024406,
"children": {
"env_step": {
"total": 705.335465500984,
"count": 31565,
"self": 638.238447736984,
"children": {
"SubprocessEnvManager._take_step": {
"total": 66.67324442501331,
"count": 31565,
"self": 2.351425785015522,
"children": {
"TorchPolicy.evaluate": {
"total": 64.32181863999779,
"count": 31310,
"self": 64.32181863999779
}
}
},
"workers": {
"total": 0.4237733389867344,
"count": 31565,
"self": 0.0,
"children": {
"worker_root": {
"total": 1024.9422049909845,
"count": 31565,
"is_parallel": true,
"self": 446.7417756769544,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.002068883999982063,
"count": 1,
"is_parallel": true,
"self": 0.0006114659997820127,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014574180002000503,
"count": 8,
"is_parallel": true,
"self": 0.0014574180002000503
}
}
},
"UnityEnvironment.step": {
"total": 0.09730432000003475,
"count": 1,
"is_parallel": true,
"self": 0.0006878179999603162,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00044245599997339013,
"count": 1,
"is_parallel": true,
"self": 0.00044245599997339013
},
"communicator.exchange": {
"total": 0.09450887100001637,
"count": 1,
"is_parallel": true,
"self": 0.09450887100001637
},
"steps_from_proto": {
"total": 0.0016651750000846732,
"count": 1,
"is_parallel": true,
"self": 0.00033464000000549277,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013305350000791805,
"count": 8,
"is_parallel": true,
"self": 0.0013305350000791805
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 578.2004293140301,
"count": 31564,
"is_parallel": true,
"self": 17.337495871061037,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 11.954495890984958,
"count": 31564,
"is_parallel": true,
"self": 11.954495890984958
},
"communicator.exchange": {
"total": 499.2348761090019,
"count": 31564,
"is_parallel": true,
"self": 499.2348761090019
},
"steps_from_proto": {
"total": 49.67356144298219,
"count": 31564,
"is_parallel": true,
"self": 9.907257139067724,
"children": {
"_process_rank_one_or_two_observation": {
"total": 39.76630430391447,
"count": 252512,
"is_parallel": true,
"self": 39.76630430391447
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 318.3919256689986,
"count": 31565,
"self": 1.1984411679775349,
"children": {
"process_trajectory": {
"total": 63.746216941020975,
"count": 31565,
"self": 63.582973349020904,
"children": {
"RLTrainer._checkpoint": {
"total": 0.16324359200007166,
"count": 1,
"self": 0.16324359200007166
}
}
},
"_update_policy": {
"total": 253.4472675600001,
"count": 215,
"self": 148.8158095870142,
"children": {
"TorchPPOOptimizer.update": {
"total": 104.63145797298591,
"count": 11436,
"self": 104.63145797298591
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.3059998309472576e-06,
"count": 1,
"self": 1.3059998309472576e-06
},
"TrainerController._save_models": {
"total": 0.1272546190000412,
"count": 1,
"self": 0.0022669290001431364,
"children": {
"RLTrainer._checkpoint": {
"total": 0.12498768999989807,
"count": 1,
"self": 0.12498768999989807
}
}
}
}
}
}
}