{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 0.9073097109794617, "min": 0.8696509003639221, "max": 3.295811414718628, "count": 2200 }, "SoccerTwos.Policy.Entropy.sum": { "value": 35856.87890625, "min": 21059.609375, "max": 1019961.375, "count": 2200 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 24.602040816326532, "min": 17.152416356877325, "max": 392.75, "count": 2200 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19288.0, "min": 17756.0, "max": 21412.0, "count": 2200 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1533.4588753226842, "min": 1200.328406833094, "max": 1579.4606048764724, "count": 2200 }, "SoccerTwos.Self-play.ELO.sum": { "value": 601115.8791264922, "min": 2409.9434577136913, "max": 781900.3774073822, "count": 2200 }, "SoccerTwos.Step.mean": { "value": 21999994.0, "min": 9958.0, "max": 21999994.0, "count": 2200 }, "SoccerTwos.Step.sum": { "value": 21999994.0, "min": 9958.0, "max": 21999994.0, "count": 2200 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": 0.0006931066163815558, "min": -0.11423704773187637, "max": 0.23437894880771637, "count": 2200 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": 0.27100467681884766, "min": -49.42055130004883, "max": 68.4496078491211, "count": 2200 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": 0.0009028149652294815, "min": -0.11388174444437027, "max": 0.21143116056919098, "count": 2200 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": 0.3530006408691406, "min": -50.347877502441406, "max": 67.15494537353516, "count": 2200 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 2200 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 2200 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.052163681105884444, "min": -0.3903066684802373, "max": 0.5489372896440958, "count": 2200 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 20.395999312400818, "min": -103.09040009975433, "max": 141.59099984169006, "count": 2200 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.052163681105884444, "min": -0.3903066684802373, "max": 0.5489372896440958, "count": 2200 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 20.395999312400818, "min": -103.09040009975433, "max": 141.59099984169006, "count": 2200 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 2200 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 2200 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.016792847060908875, "min": 0.01056482947509115, "max": 0.024503496209702765, "count": 1065 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.016792847060908875, "min": 0.01056482947509115, "max": 0.024503496209702765, "count": 1065 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.11256088341275851, "min": 0.005557317488516371, "max": 0.12470681170622508, "count": 1065 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.11256088341275851, "min": 0.005557317488516371, "max": 0.12470681170622508, "count": 1065 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.11302393625179927, "min": 0.005690486178112527, "max": 0.12509485532840092, "count": 1065 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.11302393625179927, "min": 0.005690486178112527, "max": 0.12509485532840092, "count": 1065 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 1.933272083181791e-07, "min": 1.933272083181791e-07, "max": 0.0002997203455477637, "count": 1065 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 1.933272083181791e-07, "min": 1.933272083181791e-07, "max": 0.0002997203455477637, "count": 1065 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.25, "min": 0.25, "max": 0.25, "count": 1065 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.25, "min": 0.25, "max": 0.25, "count": 1065 }, "SoccerTwos.Policy.Beta.mean": { "value": 1.6434468181818088e-05, "min": 1.6434468181818088e-05, "max": 0.009990687503636362, "count": 1065 }, "SoccerTwos.Policy.Beta.sum": { "value": 1.6434468181818088e-05, "min": 1.6434468181818088e-05, "max": 0.009990687503636362, "count": 1065 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1693348019", "python_version": "3.9.17 (main, Jul 5 2023, 20:41:20) \n[GCC 11.2.0]", "command_line_arguments": "/home/mgmeskill/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=Downstrike-20M --no-graphics --num-envs=32", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1693373657" }, "total": 25638.07527213078, "count": 1, "self": 0.836282589007169, "children": { "run_training.setup": { "total": 0.17577498173341155, "count": 1, "self": 0.17577498173341155 }, "TrainerController.start_learning": { "total": 25637.06321456004, "count": 1, "self": 8.342477745376527, "children": { "TrainerController._reset_env": { "total": 271.783062253613, "count": 1088, "self": 271.783062253613 }, "TrainerController.advance": { "total": 25356.61511585163, "count": 108628, "self": 3.1089843809604645, "children": { "env_step": { "total": 15745.96533632977, "count": 108628, "self": 5440.94653446367, "children": { "SubprocessEnvManager._take_step": { "total": 10292.108620898332, "count": 3116235, "self": 255.61927175475284, "children": { "TorchPolicy.evaluate": { "total": 10036.48934914358, "count": 5628498, "self": 10036.48934914358 } } }, "workers": { "total": 12.910180967766792, "count": 108628, "self": 0.0, "children": { "worker_root": { "total": 818588.5154348165, "count": 3112826, "is_parallel": true, "self": 780482.6229405664, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.07693493086844683, "count": 64, "is_parallel": true, "self": 0.015927689615637064, "children": { "_process_rank_one_or_two_observation": { "total": 0.06100724125280976, "count": 256, "is_parallel": true, "self": 0.06100724125280976 } } }, "UnityEnvironment.step": { "total": 0.719481447711587, "count": 32, "is_parallel": true, "self": 0.020501975435763597, "children": { "UnityEnvironment._generate_step_input": { "total": 0.013642964884638786, "count": 32, "is_parallel": true, "self": 0.013642964884638786 }, "communicator.exchange": { "total": 0.627972015645355, "count": 32, "is_parallel": true, "self": 0.627972015645355 }, "steps_from_proto": { "total": 0.05736449174582958, "count": 64, "is_parallel": true, "self": 0.01029907027259469, "children": { "_process_rank_one_or_two_observation": { "total": 0.04706542147323489, "count": 256, "is_parallel": true, "self": 0.04706542147323489 } } } } } } }, "UnityEnvironment.step": { "total": 38019.55847894726, "count": 3112794, "is_parallel": true, "self": 2457.6824236582033, "children": { "UnityEnvironment._generate_step_input": { "total": 1512.2425317005254, "count": 3112794, "is_parallel": true, "self": 1512.2425317005254 }, "communicator.exchange": { "total": 27368.108181226067, "count": 3112794, "is_parallel": true, "self": 27368.108181226067 }, "steps_from_proto": { "total": 6681.525342362467, "count": 6225588, "is_parallel": true, "self": 1143.5824937582947, "children": { "_process_rank_one_or_two_observation": { "total": 5537.9428486041725, "count": 24902352, "is_parallel": true, "self": 5537.9428486041725 } } } } }, "steps_from_proto": { "total": 86.33401530282572, "count": 69568, "is_parallel": true, "self": 14.690878832247108, "children": { "_process_rank_one_or_two_observation": { "total": 71.64313647057861, "count": 278272, "is_parallel": true, "self": 71.64313647057861 } } } } } } } } }, "trainer_advance": { "total": 9607.5407951409, "count": 108628, "self": 132.7211998142302, "children": { "process_trajectory": { "total": 4697.321105179377, "count": 108628, "self": 4693.751423222944, "children": { "RLTrainer._checkpoint": { "total": 3.5696819564327598, "count": 11, "self": 3.5696819564327598 } } }, "_update_policy": { "total": 4777.498490147293, "count": 1065, "self": 2678.744994345121, "children": { "TorchPOCAOptimizer.update": { "total": 2098.7534958021715, "count": 31950, "self": 2098.7534958021715 } } } } } } }, "trainer_threads": { "total": 6.621703505516052e-07, "count": 1, "self": 6.621703505516052e-07 }, "TrainerController._save_models": { "total": 0.3225580472499132, "count": 1, "self": 0.0020071682520210743, "children": { "RLTrainer._checkpoint": { "total": 0.32055087899789214, "count": 1, "self": 0.32055087899789214 } } } } } } }