|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.7123656868934631, |
|
"min": 0.6570796370506287, |
|
"max": 1.428212285041809, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 21462.154296875, |
|
"min": 19592.73828125, |
|
"max": 43326.24609375, |
|
"count": 16 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 479926.0, |
|
"min": 29975.0, |
|
"max": 479926.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 479926.0, |
|
"min": 29975.0, |
|
"max": 479926.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.08970457315444946, |
|
"min": -0.09704577177762985, |
|
"max": 0.08970457315444946, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 22.246734619140625, |
|
"min": -23.290985107421875, |
|
"max": 22.246734619140625, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.011859128251671791, |
|
"min": 0.007869926281273365, |
|
"max": 0.3850874602794647, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 2.94106388092041, |
|
"min": 1.904522180557251, |
|
"max": 91.65081787109375, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.066041112951805, |
|
"min": 0.06540364939514, |
|
"max": 0.07304739349894909, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9245755813252698, |
|
"min": 0.5493568023939963, |
|
"max": 1.0620316853061975, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.00849363308773877, |
|
"min": 0.0010521916522333481, |
|
"max": 0.00849363308773877, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.11891086322834277, |
|
"min": 0.009469724870100133, |
|
"max": 0.11891086322834277, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 2.1158192947300003e-05, |
|
"min": 2.1158192947300003e-05, |
|
"max": 0.00029001517832827497, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00029621470126220005, |
|
"min": 0.00029621470126220005, |
|
"max": 0.00285423034859, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10705270000000001, |
|
"min": 0.10705270000000001, |
|
"max": 0.19667172500000002, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4987378000000002, |
|
"min": 1.4987378000000002, |
|
"max": 2.3386889999999996, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0007145647300000002, |
|
"min": 0.0007145647300000002, |
|
"max": 0.0096675053275, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.010003906220000002, |
|
"min": 0.010003906220000002, |
|
"max": 0.095175859, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.01774653047323227, |
|
"min": 0.017288541421294212, |
|
"max": 0.3124820590019226, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.24845142662525177, |
|
"min": 0.24203957617282867, |
|
"max": 2.499856472015381, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 802.1621621621622, |
|
"min": 802.1621621621622, |
|
"max": 999.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29680.0, |
|
"min": 16261.0, |
|
"max": 32296.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 0.3867891382526707, |
|
"min": -0.999987552408129, |
|
"max": 0.3867891382526707, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 14.311198115348816, |
|
"min": -31.999601677060127, |
|
"max": 14.311198115348816, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 0.3867891382526707, |
|
"min": -0.999987552408129, |
|
"max": 0.3867891382526707, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 14.311198115348816, |
|
"min": -31.999601677060127, |
|
"max": 14.311198115348816, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.14845000534960245, |
|
"min": 0.14590737862965544, |
|
"max": 5.863223752213849, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 5.492650197935291, |
|
"min": 5.398573009297252, |
|
"max": 105.53802753984928, |
|
"count": 16 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 16 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1714871472", |
|
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=PyramidsTraining --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.2.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1714872500" |
|
}, |
|
"total": 1028.622528084, |
|
"count": 1, |
|
"self": 0.8875892680000561, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.05201031299998249, |
|
"count": 1, |
|
"self": 0.05201031299998249 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 1027.6829285029999, |
|
"count": 1, |
|
"self": 0.685191689992962, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.4036292729999786, |
|
"count": 1, |
|
"self": 2.4036292729999786 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 1024.466851615007, |
|
"count": 31565, |
|
"self": 0.739460445024406, |
|
"children": { |
|
"env_step": { |
|
"total": 705.335465500984, |
|
"count": 31565, |
|
"self": 638.238447736984, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 66.67324442501331, |
|
"count": 31565, |
|
"self": 2.351425785015522, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 64.32181863999779, |
|
"count": 31310, |
|
"self": 64.32181863999779 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.4237733389867344, |
|
"count": 31565, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1024.9422049909845, |
|
"count": 31565, |
|
"is_parallel": true, |
|
"self": 446.7417756769544, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.002068883999982063, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006114659997820127, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0014574180002000503, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0014574180002000503 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.09730432000003475, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006878179999603162, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00044245599997339013, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00044245599997339013 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.09450887100001637, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.09450887100001637 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0016651750000846732, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00033464000000549277, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0013305350000791805, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0013305350000791805 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 578.2004293140301, |
|
"count": 31564, |
|
"is_parallel": true, |
|
"self": 17.337495871061037, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 11.954495890984958, |
|
"count": 31564, |
|
"is_parallel": true, |
|
"self": 11.954495890984958 |
|
}, |
|
"communicator.exchange": { |
|
"total": 499.2348761090019, |
|
"count": 31564, |
|
"is_parallel": true, |
|
"self": 499.2348761090019 |
|
}, |
|
"steps_from_proto": { |
|
"total": 49.67356144298219, |
|
"count": 31564, |
|
"is_parallel": true, |
|
"self": 9.907257139067724, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 39.76630430391447, |
|
"count": 252512, |
|
"is_parallel": true, |
|
"self": 39.76630430391447 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 318.3919256689986, |
|
"count": 31565, |
|
"self": 1.1984411679775349, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 63.746216941020975, |
|
"count": 31565, |
|
"self": 63.582973349020904, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.16324359200007166, |
|
"count": 1, |
|
"self": 0.16324359200007166 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 253.4472675600001, |
|
"count": 215, |
|
"self": 148.8158095870142, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 104.63145797298591, |
|
"count": 11436, |
|
"self": 104.63145797298591 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.3059998309472576e-06, |
|
"count": 1, |
|
"self": 1.3059998309472576e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.1272546190000412, |
|
"count": 1, |
|
"self": 0.0022669290001431364, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.12498768999989807, |
|
"count": 1, |
|
"self": 0.12498768999989807 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |