{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 3.225499391555786, "min": 3.225499391555786, "max": 3.295750141143799, "count": 20 }, "SoccerTwos.Policy.Entropy.sum": { "value": 50059.75, "min": 39080.6796875, "max": 105463.953125, "count": 20 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 711.125, "min": 480.6, "max": 999.0, "count": 20 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 22756.0, "min": 9612.0, "max": 31968.0, "count": 20 }, "SoccerTwos.Step.mean": { "value": 199906.0, "min": 9000.0, "max": 199906.0, "count": 20 }, "SoccerTwos.Step.sum": { "value": 199906.0, "min": 9000.0, "max": 199906.0, "count": 20 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": 0.006868079304695129, "min": 0.0025794401299208403, "max": 0.05935068428516388, "count": 20 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": 0.10302118957042694, "min": 0.02579440176486969, "max": 0.8902602791786194, "count": 20 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": 0.005543396808207035, "min": 0.003897703718394041, "max": 0.05932831019163132, "count": 20 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": 0.0831509530544281, "min": 0.038977038115262985, "max": 0.8898614645004272, "count": 20 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 20 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 20 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": -0.3805066665013631, "min": -0.4716333324710528, "max": 0.15730908783999356, "count": 20 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": -5.707599997520447, "min": -5.953600000590086, "max": 1.866799920797348, "count": 20 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": -0.3805066665013631, "min": -0.4716333324710528, "max": 0.15730908783999356, "count": 20 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": -5.707599997520447, "min": -5.953600000590086, "max": 1.866799920797348, "count": 20 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 20 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 20 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1201.9106226384604, "min": 1199.5773275140164, "max": 1202.724322432375, "count": 17 }, "SoccerTwos.Self-play.ELO.sum": { "value": 9615.284981107683, "min": 2400.3573839874066, "max": 14394.927930168196, "count": 17 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.01857729412149638, "min": 0.014567442450061207, "max": 0.020088891692770023, "count": 9 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.01857729412149638, "min": 0.014567442450061207, "max": 0.020088891692770023, "count": 9 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.002594919844220082, "min": 0.0013332608408139397, "max": 0.0058968229762588935, "count": 9 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.002594919844220082, "min": 0.0013332608408139397, "max": 0.0058968229762588935, "count": 9 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.002838954865001142, "min": 0.0013385032245423645, "max": 0.005983704778676231, "count": 9 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.002838954865001142, "min": 0.0013385032245423645, "max": 0.005983704778676231, "count": 9 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 9 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 9 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 9 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 9 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 9 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 9 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1690756233", "python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1690757353" }, "total": 1120.0687148419997, "count": 1, "self": 0.47720929899969633, "children": { "run_training.setup": { "total": 0.051612099000067246, "count": 1, "self": 0.051612099000067246 }, "TrainerController.start_learning": { "total": 1119.539893444, "count": 1, "self": 0.5211385340030574, "children": { "TrainerController._reset_env": { "total": 1.3276582359999338, "count": 2, "self": 1.3276582359999338 }, "TrainerController.advance": { "total": 1117.310266320997, "count": 13004, "self": 0.5846488979882452, "children": { "env_step": { "total": 463.09313726402934, "count": 13004, "self": 385.1266148120558, "children": { "SubprocessEnvManager._take_step": { "total": 77.64545934097714, "count": 13004, "self": 3.2261185269453563, "children": { "TorchPolicy.evaluate": { "total": 74.41934081403178, "count": 25804, "self": 74.41934081403178 } } }, "workers": { "total": 0.3210631109964197, "count": 13004, "self": 0.0, "children": { "worker_root": { "total": 1113.3584529080376, "count": 13004, "is_parallel": true, "self": 795.2097868370365, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.003293229000064457, "count": 2, "is_parallel": true, "self": 0.0008891030001905165, "children": { "_process_rank_one_or_two_observation": { "total": 0.0024041259998739406, "count": 8, "is_parallel": true, "self": 0.0024041259998739406 } } }, "UnityEnvironment.step": { "total": 0.04919334899977912, "count": 1, "is_parallel": true, "self": 0.00137288299993088, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0010131489998457255, "count": 1, "is_parallel": true, "self": 0.0010131489998457255 }, "communicator.exchange": { "total": 0.042369884999970964, "count": 1, "is_parallel": true, "self": 0.042369884999970964 }, "steps_from_proto": { "total": 0.004437432000031549, "count": 2, "is_parallel": true, "self": 0.000773127999764256, "children": { "_process_rank_one_or_two_observation": { "total": 0.0036643040002672933, "count": 8, "is_parallel": true, "self": 0.0036643040002672933 } } } } } } }, "UnityEnvironment.step": { "total": 318.1486660710011, "count": 13003, "is_parallel": true, "self": 19.211716871955105, "children": { "UnityEnvironment._generate_step_input": { "total": 10.209771232014646, "count": 13003, "is_parallel": true, "self": 10.209771232014646 }, "communicator.exchange": { "total": 227.49514436899062, "count": 13003, "is_parallel": true, "self": 227.49514436899062 }, "steps_from_proto": { "total": 61.23203359804074, "count": 26006, "is_parallel": true, "self": 11.028131147965269, "children": { "_process_rank_one_or_two_observation": { "total": 50.203902450075475, "count": 104024, "is_parallel": true, "self": 50.203902450075475 } } } } } } } } } } }, "trainer_advance": { "total": 653.6324801589794, "count": 13004, "self": 3.9507516069775193, "children": { "process_trajectory": { "total": 80.739217611002, "count": 13004, "self": 80.739217611002 }, "_update_policy": { "total": 568.9425109409999, "count": 9, "self": 51.49464241700025, "children": { "TorchPOCAOptimizer.update": { "total": 517.4478685239997, "count": 270, "self": 517.4478685239997 } } } } } } }, "trainer_threads": { "total": 1.204999989568023e-06, "count": 1, "self": 1.204999989568023e-06 }, "TrainerController._save_models": { "total": 0.38082914799997525, "count": 1, "self": 0.0028527250001388893, "children": { "RLTrainer._checkpoint": { "total": 0.37797642299983636, "count": 1, "self": 0.37797642299983636 } } } } } } }