ppo-Pyramids / run_logs /timers.json
emmuzoo's picture
basic model
2e3f5ff
raw
history blame contribute delete
No virus
18.7 kB
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.4975653886795044,
"min": 0.47961491346359253,
"max": 1.3951681852340698,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 14847.3515625,
"min": 14350.078125,
"max": 42323.8203125,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989894.0,
"min": 29952.0,
"max": 989894.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989894.0,
"min": 29952.0,
"max": 989894.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.4085873067378998,
"min": -0.08974519371986389,
"max": 0.4677356481552124,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 108.275634765625,
"min": -21.449100494384766,
"max": 127.2240982055664,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.014104614965617657,
"min": -0.005268337205052376,
"max": 0.25343790650367737,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 3.737722873687744,
"min": -1.4066460132598877,
"max": 60.064781188964844,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06710505671061397,
"min": 0.06500589805137781,
"max": 0.07254626382824657,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9394707939485956,
"min": 0.5075860991809736,
"max": 1.0320246177531465,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.01582775835001793,
"min": 0.0003489376471918086,
"max": 0.01644820867449097,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.221588616900251,
"min": 0.004885127060685321,
"max": 0.24672313011736455,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.363468974114286e-06,
"min": 7.363468974114286e-06,
"max": 0.00029515063018788575,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.0001030885656376,
"min": 0.0001030885656376,
"max": 0.0036331561889480003,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10245445714285714,
"min": 0.10245445714285714,
"max": 0.19838354285714285,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4343624,
"min": 1.3886848,
"max": 2.6110519999999995,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00025520026857142863,
"min": 0.00025520026857142863,
"max": 0.00983851593142857,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003572803760000001,
"min": 0.003572803760000001,
"max": 0.12112409480000001,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.009822138585150242,
"min": 0.009822138585150242,
"max": 0.4139936566352844,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.13750994205474854,
"min": 0.13750994205474854,
"max": 2.8979556560516357,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 389.09859154929575,
"min": 389.09859154929575,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 27626.0,
"min": 15984.0,
"max": 32785.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.4136591310232458,
"min": -1.0000000521540642,
"max": 1.5503628332700048,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 100.36979830265045,
"min": -29.89840167760849,
"max": 108.52539832890034,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.4136591310232458,
"min": -1.0000000521540642,
"max": 1.5503628332700048,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 100.36979830265045,
"min": -29.89840167760849,
"max": 108.52539832890034,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.03946737707309707,
"min": 0.03946737707309707,
"max": 8.436937988270074,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.802183772189892,
"min": 2.802183772189892,
"max": 134.9910078123212,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1679827432",
"python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids-Training-01 --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1679829642"
},
"total": 2209.582941508,
"count": 1,
"self": 0.48784612800000104,
"children": {
"run_training.setup": {
"total": 0.11024874600002477,
"count": 1,
"self": 0.11024874600002477
},
"TrainerController.start_learning": {
"total": 2208.984846634,
"count": 1,
"self": 1.6394397359608774,
"children": {
"TrainerController._reset_env": {
"total": 6.252175113000021,
"count": 1,
"self": 6.252175113000021
},
"TrainerController.advance": {
"total": 2200.9970362320387,
"count": 63574,
"self": 1.7514847370725874,
"children": {
"env_step": {
"total": 1559.8176929829783,
"count": 63574,
"self": 1442.1477295419309,
"children": {
"SubprocessEnvManager._take_step": {
"total": 116.75630156701459,
"count": 63574,
"self": 4.92620027300444,
"children": {
"TorchPolicy.evaluate": {
"total": 111.83010129401015,
"count": 62556,
"self": 111.83010129401015
}
}
},
"workers": {
"total": 0.9136618740329823,
"count": 63574,
"self": 0.0,
"children": {
"worker_root": {
"total": 2203.9800220379916,
"count": 63574,
"is_parallel": true,
"self": 886.5983430489539,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.001865398000006735,
"count": 1,
"is_parallel": true,
"self": 0.0005853390000538639,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001280058999952871,
"count": 8,
"is_parallel": true,
"self": 0.001280058999952871
}
}
},
"UnityEnvironment.step": {
"total": 0.08041903200000888,
"count": 1,
"is_parallel": true,
"self": 0.0005801249999421998,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004834540000047127,
"count": 1,
"is_parallel": true,
"self": 0.0004834540000047127
},
"communicator.exchange": {
"total": 0.07765766700003951,
"count": 1,
"is_parallel": true,
"self": 0.07765766700003951
},
"steps_from_proto": {
"total": 0.001697786000022461,
"count": 1,
"is_parallel": true,
"self": 0.0004786699998930999,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001219116000129361,
"count": 8,
"is_parallel": true,
"self": 0.001219116000129361
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1317.3816789890377,
"count": 63573,
"is_parallel": true,
"self": 32.843421338983035,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 23.393729668981848,
"count": 63573,
"is_parallel": true,
"self": 23.393729668981848
},
"communicator.exchange": {
"total": 1164.2905567070488,
"count": 63573,
"is_parallel": true,
"self": 1164.2905567070488
},
"steps_from_proto": {
"total": 96.85397127402388,
"count": 63573,
"is_parallel": true,
"self": 20.916294354970887,
"children": {
"_process_rank_one_or_two_observation": {
"total": 75.93767691905299,
"count": 508584,
"is_parallel": true,
"self": 75.93767691905299
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 639.427858511988,
"count": 63574,
"self": 2.9213153139994574,
"children": {
"process_trajectory": {
"total": 119.87786565599055,
"count": 63574,
"self": 119.61185070899074,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2660149469998032,
"count": 2,
"self": 0.2660149469998032
}
}
},
"_update_policy": {
"total": 516.6286775419981,
"count": 452,
"self": 327.54881674702926,
"children": {
"TorchPPOOptimizer.update": {
"total": 189.0798607949688,
"count": 22830,
"self": 189.0798607949688
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.0280000424245372e-06,
"count": 1,
"self": 1.0280000424245372e-06
},
"TrainerController._save_models": {
"total": 0.09619452500010084,
"count": 1,
"self": 0.001404715000262513,
"children": {
"RLTrainer._checkpoint": {
"total": 0.09478980999983833,
"count": 1,
"self": 0.09478980999983833
}
}
}
}
}
}
}