ppo-SnowballTarget / run_logs /timers.json

First Push

ecaa4bb about 1 year ago

18.4 kB

	{
	"name": "root",
	"gauges": {
	"SnowballTarget.Policy.Entropy.mean": {
	"value": 1.8527554273605347,
	"min": 1.8527554273605347,
	"max": 2.8140251636505127,
	"count": 9
	},
	"SnowballTarget.Policy.Entropy.sum": {
	"value": 18831.40625,
	"min": 18831.40625,
	"max": 28756.5234375,
	"count": 9
	},
	"SnowballTarget.Step.mean": {
	"value": 99936.0,
	"min": 19968.0,
	"max": 99936.0,
	"count": 9
	},
	"SnowballTarget.Step.sum": {
	"value": 99936.0,
	"min": 19968.0,
	"max": 99936.0,
	"count": 9
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
	"value": 7.591027736663818,
	"min": 1.1086370944976807,
	"max": 7.591027736663818,
	"count": 9
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
	"value": 1472.659423828125,
	"min": 211.74969482421875,
	"max": 1472.659423828125,
	"count": 9
	},
	"SnowballTarget.Environment.EpisodeLength.mean": {
	"value": 199.0,
	"min": 199.0,
	"max": 199.0,
	"count": 9
	},
	"SnowballTarget.Environment.EpisodeLength.sum": {
	"value": 8756.0,
	"min": 8756.0,
	"max": 10945.0,
	"count": 9
	},
	"SnowballTarget.Losses.PolicyLoss.mean": {
	"value": 0.06284199073550054,
	"min": 0.06284199073550054,
	"max": 0.07222230205068128,
	"count": 9
	},
	"SnowballTarget.Losses.PolicyLoss.sum": {
	"value": 0.25136796294200214,
	"min": 0.25136796294200214,
	"max": 0.3611115102534064,
	"count": 9
	},
	"SnowballTarget.Losses.ValueLoss.mean": {
	"value": 0.26206522405731913,
	"min": 0.18242232836143787,
	"max": 0.27795734469797095,
	"count": 9
	},
	"SnowballTarget.Losses.ValueLoss.sum": {
	"value": 1.0482608962292765,
	"min": 0.7296893134457515,
	"max": 1.3897867234898549,
	"count": 9
	},
	"SnowballTarget.Policy.LearningRate.mean": {
	"value": 1.5540094819999997e-05,
	"min": 1.5540094819999997e-05,
	"max": 0.00025314001562,
	"count": 9
	},
	"SnowballTarget.Policy.LearningRate.sum": {
	"value": 6.216037927999999e-05,
	"min": 6.216037927999999e-05,
	"max": 0.0011172001275999998,
	"count": 9
	},
	"SnowballTarget.Policy.Epsilon.mean": {
	"value": 0.10518000000000001,
	"min": 0.10518000000000001,
	"max": 0.18438000000000002,
	"count": 9
	},
	"SnowballTarget.Policy.Epsilon.sum": {
	"value": 0.42072000000000004,
	"min": 0.42072000000000004,
	"max": 0.8724,
	"count": 9
	},
	"SnowballTarget.Policy.Beta.mean": {
	"value": 0.00026848199999999995,
	"min": 0.00026848199999999995,
	"max": 0.004220562000000001,
	"count": 9
	},
	"SnowballTarget.Policy.Beta.sum": {
	"value": 0.0010739279999999998,
	"min": 0.0010739279999999998,
	"max": 0.018632759999999998,
	"count": 9
	},
	"SnowballTarget.Environment.CumulativeReward.mean": {
	"value": 16.5,
	"min": 4.795454545454546,
	"max": 16.5,
	"count": 9
	},
	"SnowballTarget.Environment.CumulativeReward.sum": {
	"value": 726.0,
	"min": 211.0,
	"max": 878.0,
	"count": 9
	},
	"SnowballTarget.Policy.ExtrinsicReward.mean": {
	"value": 16.5,
	"min": 4.795454545454546,
	"max": 16.5,
	"count": 9
	},
	"SnowballTarget.Policy.ExtrinsicReward.sum": {
	"value": 726.0,
	"min": 211.0,
	"max": 878.0,
	"count": 9
	},
	"SnowballTarget.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 9
	},
	"SnowballTarget.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 9
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1704445237",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --resume",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.1.2+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1704445449"
	},
	"total": 212.90651439500004,
	"count": 1,
	"self": 0.4380315000000792,
	"children": {
	"run_training.setup": {
	"total": 0.05446932199993171,
	"count": 1,
	"self": 0.05446932199993171
	},
	"TrainerController.start_learning": {
	"total": 212.41401357300003,
	"count": 1,
	"self": 0.29725998599644754,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.8716924619999418,
	"count": 1,
	"self": 1.8716924619999418
	},
	"TrainerController.advance": {
	"total": 210.15313940000362,
	"count": 8202,
	"self": 0.1263093730087803,
	"children": {
	"env_step": {
	"total": 210.02683002699484,
	"count": 8202,
	"self": 138.40515514498225,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 71.4880824670048,
	"count": 8202,
	"self": 0.6950981299992236,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 70.79298433700558,
	"count": 8202,
	"self": 70.79298433700558
	}
	}
	},
	"workers": {
	"total": 0.13359241500779717,
	"count": 8202,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 211.8185724749992,
	"count": 8202,
	"is_parallel": true,
	"self": 104.90280012300173,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0019655609999063017,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005625499995858263,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014030110003204754,
	"count": 10,
	"is_parallel": true,
	"self": 0.0014030110003204754
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.037417448999917724,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006318959998452556,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0003912250000439599,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003912250000439599
	},
	"communicator.exchange": {
	"total": 0.034376875000020846,
	"count": 1,
	"is_parallel": true,
	"self": 0.034376875000020846
	},
	"steps_from_proto": {
	"total": 0.002017453000007663,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003886959998453676,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016287570001622953,
	"count": 10,
	"is_parallel": true,
	"self": 0.0016287570001622953
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 106.91577235199748,
	"count": 8201,
	"is_parallel": true,
	"self": 4.986603081994986,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 2.566246203999526,
	"count": 8201,
	"is_parallel": true,
	"self": 2.566246203999526
	},
	"communicator.exchange": {
	"total": 83.20323664700811,
	"count": 8201,
	"is_parallel": true,
	"self": 83.20323664700811
	},
	"steps_from_proto": {
	"total": 16.159686418994852,
	"count": 8201,
	"is_parallel": true,
	"self": 3.009303545009857,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 13.150382873984995,
	"count": 82010,
	"is_parallel": true,
	"self": 13.150382873984995
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 0.0003014119999988907,
	"count": 1,
	"self": 0.0003014119999988907,
	"children": {
	"thread_root": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"trainer_advance": {
	"total": 207.43462478898982,
	"count": 315782,
	"is_parallel": true,
	"self": 6.784712976016294,
	"children": {
	"process_trajectory": {
	"total": 115.88779060297293,
	"count": 315782,
	"is_parallel": true,
	"self": 115.52272035497288,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.36507024800005183,
	"count": 2,
	"is_parallel": true,
	"self": 0.36507024800005183
	}
	}
	},
	"_update_policy": {
	"total": 84.7621212100006,
	"count": 40,
	"is_parallel": true,
	"self": 27.692921618999662,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 57.06919959100094,
	"count": 2037,
	"is_parallel": true,
	"self": 57.06919959100094
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"TrainerController._save_models": {
	"total": 0.09162031300002127,
	"count": 1,
	"self": 0.0016305279999642153,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08998978500005705,
	"count": 1,
	"self": 0.08998978500005705
	}
	}
	}
	}
	}
	}
	}