Duplicate from aj555/poca-SoccerTwos

0dc361f over 1 year ago

No virus

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.7445931434631348,
	"min": 1.6850866079330444,
	"max": 3.2957451343536377,
	"count": 563
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 34724.3828125,
	"min": 10711.3671875,
	"max": 105463.84375,
	"count": 563
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 46.542857142857144,
	"min": 37.18939393939394,
	"max": 861.1111111111111,
	"count": 563
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19548.0,
	"min": 8200.0,
	"max": 31000.0,
	"count": 563
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1572.6787625822285,
	"min": 1187.8306343789218,
	"max": 1572.6787625822285,
	"count": 563
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 330262.540142268,
	"min": 4761.159386812556,
	"max": 388381.16085913655,
	"count": 563
	},
	"SoccerTwos.Step.mean": {
	"value": 5629965.0,
	"min": 9686.0,
	"max": 5629965.0,
	"count": 563
	},
	"SoccerTwos.Step.sum": {
	"value": 5629965.0,
	"min": 9686.0,
	"max": 5629965.0,
	"count": 563
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.01401924155652523,
	"min": -0.10446890443563461,
	"max": 0.21584397554397583,
	"count": 563
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -2.9440407752990723,
	"min": -20.67490005493164,
	"max": 33.303619384765625,
	"count": 563
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.014381909742951393,
	"min": -0.10639803111553192,
	"max": 0.21651381254196167,
	"count": 563
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -3.0202009677886963,
	"min": -21.695873260498047,
	"max": 36.781734466552734,
	"count": 563
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 563
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 563
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.011637141874858311,
	"min": -0.6318666656812032,
	"max": 0.4154938047966071,
	"count": 563
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 2.4437997937202454,
	"min": -55.973999977111816,
	"max": 57.87480020523071,
	"count": 563
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.011637141874858311,
	"min": -0.6318666656812032,
	"max": 0.4154938047966071,
	"count": 563
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 2.4437997937202454,
	"min": -55.973999977111816,
	"max": 57.87480020523071,
	"count": 563
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 563
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 563
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01681263987751057,
	"min": 0.009970807051286102,
	"max": 0.023588940827175976,
	"count": 271
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01681263987751057,
	"min": 0.009970807051286102,
	"max": 0.023588940827175976,
	"count": 271
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.12133442386984825,
	"min": 0.0036122541014964762,
	"max": 0.13310990159710248,
	"count": 271
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.12133442386984825,
	"min": 0.0036122541014964762,
	"max": 0.13310990159710248,
	"count": 271
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.12454693143566449,
	"min": 0.003364604473925936,
	"max": 0.13591177513202032,
	"count": 271
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.12454693143566449,
	"min": 0.003364604473925936,
	"max": 0.13591177513202032,
	"count": 271
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 271
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 271
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000004,
	"max": 0.20000000000000007,
	"count": 271
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000004,
	"max": 0.20000000000000007,
	"count": 271
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 271
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 271
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1675496201",
	"python_version": "3.9.16 (main, Jan 11 2023, 16:05:54) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/aj/anaconda3/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.13.1+cu117",
	"numpy_version": "1.21.0",
	"end_time_seconds": "1675501882"
	},
	"total": 5681.631443330001,
	"count": 1,
	"self": 0.36721379100163176,
	"children": {
	"run_training.setup": {
	"total": 0.009893450000163284,
	"count": 1,
	"self": 0.009893450000163284
	},
	"TrainerController.start_learning": {
	"total": 5681.2543360889995,
	"count": 1,
	"self": 6.013943085377832,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.6326506650002557,
	"count": 29,
	"self": 1.6326506650002557
	},
	"TrainerController.advance": {
	"total": 5673.5077513796205,
	"count": 391656,
	"self": 5.791406961161556,
	"children": {
	"env_step": {
	"total": 4129.888640451547,
	"count": 391656,
	"self": 2977.331019370007,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1149.2225142639873,
	"count": 391656,
	"self": 29.32610332744298,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1119.8964109365443,
	"count": 708938,
	"self": 1119.8964109365443
	}
	}
	},
	"workers": {
	"total": 3.3351068175525143,
	"count": 391656,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 5672.611461594681,
	"count": 391656,
	"is_parallel": true,
	"self": 3284.0772732661026,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0014479720011877362,
	"count": 2,
	"is_parallel": true,
	"self": 0.0003768440037674736,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0010711279974202625,
	"count": 8,
	"is_parallel": true,
	"self": 0.0010711279974202625
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.015645661000235123,
	"count": 1,
	"is_parallel": true,
	"self": 0.00038880300053278916,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00029232899942144286,
	"count": 1,
	"is_parallel": true,
	"self": 0.00029232899942144286
	},
	"communicator.exchange": {
	"total": 0.013842027999999118,
	"count": 1,
	"is_parallel": true,
	"self": 0.013842027999999118
	},
	"steps_from_proto": {
	"total": 0.0011225010002817726,
	"count": 2,
	"is_parallel": true,
	"self": 0.00025512100182822905,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0008673799984535435,
	"count": 8,
	"is_parallel": true,
	"self": 0.0008673799984535435
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2388.50238450858,
	"count": 391655,
	"is_parallel": true,
	"self": 143.95996350808855,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 94.35225239944884,
	"count": 391655,
	"is_parallel": true,
	"self": 94.35225239944884
	},
	"communicator.exchange": {
	"total": 1740.7283542312416,
	"count": 391655,
	"is_parallel": true,
	"self": 1740.7283542312416
	},
	"steps_from_proto": {
	"total": 409.4618143698008,
	"count": 783310,
	"is_parallel": true,
	"self": 90.78960065160027,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 318.6722137182005,
	"count": 3133240,
	"is_parallel": true,
	"self": 318.6722137182005
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.031803819998458494,
	"count": 56,
	"is_parallel": true,
	"self": 0.007017880976491142,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.02478593902196735,
	"count": 224,
	"is_parallel": true,
	"self": 0.02478593902196735
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1537.827703966912,
	"count": 391656,
	"self": 36.89562855519216,
	"children": {
	"process_trajectory": {
	"total": 681.1944579387109,
	"count": 391656,
	"self": 680.1112748497108,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.0831830890001584,
	"count": 11,
	"self": 1.0831830890001584
	}
	}
	},
	"_update_policy": {
	"total": 819.7376174730089,
	"count": 272,
	"self": 533.5363305260798,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 286.20128694692903,
	"count": 8149,
	"self": 286.20128694692903
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.3709995982935652e-06,
	"count": 1,
	"self": 1.3709995982935652e-06
	},
	"TrainerController._save_models": {
	"total": 0.0999895880013355,
	"count": 1,
	"self": 0.0008468070009257644,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09914278100040974,
	"count": 1,
	"self": 0.09914278100040974
	}
	}
	}
	}
	}
	}
	}