|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.35815030336380005, |
|
"min": 0.35815030336380005, |
|
"max": 1.4520021677017212, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 10824.734375, |
|
"min": 10824.734375, |
|
"max": 44047.9375, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989939.0, |
|
"min": 29952.0, |
|
"max": 989939.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989939.0, |
|
"min": 29952.0, |
|
"max": 989939.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.6121128797531128, |
|
"min": -0.1827024668455124, |
|
"max": 0.6121128797531128, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 172.61582946777344, |
|
"min": -43.30048370361328, |
|
"max": 172.61582946777344, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.013274436816573143, |
|
"min": -0.009086871519684792, |
|
"max": 0.3750952482223511, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 3.743391275405884, |
|
"min": -2.444368362426758, |
|
"max": 88.89757537841797, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06830938380084088, |
|
"min": 0.06601005687526067, |
|
"max": 0.07532057773009085, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9563313732117724, |
|
"min": 0.4930694141885502, |
|
"max": 1.1146038370058582, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01529186453539989, |
|
"min": 0.0008389395629419968, |
|
"max": 0.017027024817902463, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.21408610349559845, |
|
"min": 0.010906214318245958, |
|
"max": 0.2473431952336493, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.751175987735717e-06, |
|
"min": 7.751175987735717e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010851646382830004, |
|
"min": 0.00010851646382830004, |
|
"max": 0.0033828704723766, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10258369285714286, |
|
"min": 0.10258369285714286, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4361717, |
|
"min": 1.3886848, |
|
"max": 2.5276234, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0002681109164285715, |
|
"min": 0.0002681109164285715, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.003753552830000001, |
|
"min": 0.003753552830000001, |
|
"max": 0.11278957766, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.015236700884997845, |
|
"min": 0.015236700884997845, |
|
"max": 0.5371481776237488, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.21331381797790527, |
|
"min": 0.21331381797790527, |
|
"max": 3.7600371837615967, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 299.4646464646465, |
|
"min": 299.4646464646465, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29647.0, |
|
"min": 15984.0, |
|
"max": 32726.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.680329275251639, |
|
"min": -1.0000000521540642, |
|
"max": 1.680329275251639, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 166.35259824991226, |
|
"min": -30.758001729846, |
|
"max": 166.35259824991226, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.680329275251639, |
|
"min": -1.0000000521540642, |
|
"max": 1.680329275251639, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 166.35259824991226, |
|
"min": -30.758001729846, |
|
"max": 166.35259824991226, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.04636865655096827, |
|
"min": 0.04636865655096827, |
|
"max": 11.21028440631926, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 4.590496998545859, |
|
"min": 4.590496998545859, |
|
"max": 179.36455050110817, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1674568861", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1674570925" |
|
}, |
|
"total": 2064.574758017, |
|
"count": 1, |
|
"self": 0.424947014999816, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.09823641299999508, |
|
"count": 1, |
|
"self": 0.09823641299999508 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2064.051574589, |
|
"count": 1, |
|
"self": 1.3470079159415036, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.138089829999899, |
|
"count": 1, |
|
"self": 6.138089829999899 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2056.4844117180587, |
|
"count": 63880, |
|
"self": 1.3352355231222646, |
|
"children": { |
|
"env_step": { |
|
"total": 1406.8985602949476, |
|
"count": 63880, |
|
"self": 1299.2532109139909, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 106.80935217499314, |
|
"count": 63880, |
|
"self": 4.291114738973647, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 102.51823743601949, |
|
"count": 62560, |
|
"self": 34.24112053006911, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 68.27711690595038, |
|
"count": 62560, |
|
"self": 68.27711690595038 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.835997205963622, |
|
"count": 63880, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2059.4141146049765, |
|
"count": 63880, |
|
"is_parallel": true, |
|
"self": 859.2655831909165, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.001798228000097879, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006853770000816439, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001112851000016235, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001112851000016235 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04578331000016078, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004628910000974429, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00043481900002007023, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00043481900002007023 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.043370157000026666, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.043370157000026666 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.001515443000016603, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00037851199977012584, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011369310002464772, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011369310002464772 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1200.14853141406, |
|
"count": 63879, |
|
"is_parallel": true, |
|
"self": 28.52736075418352, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 21.641051854971238, |
|
"count": 63879, |
|
"is_parallel": true, |
|
"self": 21.641051854971238 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1051.5371262079639, |
|
"count": 63879, |
|
"is_parallel": true, |
|
"self": 1051.5371262079639 |
|
}, |
|
"steps_from_proto": { |
|
"total": 98.4429925969414, |
|
"count": 63879, |
|
"is_parallel": true, |
|
"self": 21.90523671976007, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 76.53775587718133, |
|
"count": 511032, |
|
"is_parallel": true, |
|
"self": 76.53775587718133 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 648.250615899989, |
|
"count": 63880, |
|
"self": 2.587098024898978, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 141.44823388509235, |
|
"count": 63880, |
|
"self": 141.26757059909255, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.18066328599979897, |
|
"count": 2, |
|
"self": 0.18066328599979897 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 504.2152839899977, |
|
"count": 448, |
|
"self": 189.23464810899532, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 314.9806358810024, |
|
"count": 22794, |
|
"self": 314.9806358810024 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.069999578059651e-07, |
|
"count": 1, |
|
"self": 9.069999578059651e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.08206421800014141, |
|
"count": 1, |
|
"self": 0.0013815710003655113, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.0806826469997759, |
|
"count": 1, |
|
"self": 0.0806826469997759 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |