{
    "name": "root",
    "gauges": {
        "SoccerTwos.Policy.Entropy.mean": {
            "value": 1.5312188863754272,
            "min": 1.340819239616394,
            "max": 3.2957217693328857,
            "count": 5000
        },
        "SoccerTwos.Policy.Entropy.sum": {
            "value": 27733.4375,
            "min": 4395.8408203125,
            "max": 135703.703125,
            "count": 5000
        },
        "SoccerTwos.Environment.EpisodeLength.mean": {
            "value": 82.38983050847457,
            "min": 39.13709677419355,
            "max": 999.0,
            "count": 5000
        },
        "SoccerTwos.Environment.EpisodeLength.sum": {
            "value": 19444.0,
            "min": 164.0,
            "max": 31968.0,
            "count": 5000
        },
        "SoccerTwos.Self-play.ELO.mean": {
            "value": 1630.5894777256385,
            "min": 1181.5905922473478,
            "max": 1650.7439009494178,
            "count": 4985
        },
        "SoccerTwos.Self-play.ELO.sum": {
            "value": 192409.55837162535,
            "min": 2364.785459149737,
            "max": 384814.0138152831,
            "count": 4985
        },
        "SoccerTwos.Step.mean": {
            "value": 49999939.0,
            "min": 9968.0,
            "max": 49999939.0,
            "count": 5000
        },
        "SoccerTwos.Step.sum": {
            "value": 49999939.0,
            "min": 9968.0,
            "max": 49999939.0,
            "count": 5000
        },
        "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
            "value": -0.017107047140598297,
            "min": -0.14119431376457214,
            "max": 0.21114686131477356,
            "count": 5000
        },
        "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
            "value": -2.0186314582824707,
            "min": -25.456342697143555,
            "max": 21.229524612426758,
            "count": 5000
        },
        "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
            "value": -0.01714133657515049,
            "min": -0.14103247225284576,
            "max": 0.2098654806613922,
            "count": 5000
        },
        "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
            "value": -2.0226776599884033,
            "min": -25.710233688354492,
            "max": 20.74159049987793,
            "count": 5000
        },
        "SoccerTwos.Environment.CumulativeReward.mean": {
            "value": 0.0,
            "min": 0.0,
            "max": 0.0,
            "count": 5000
        },
        "SoccerTwos.Environment.CumulativeReward.sum": {
            "value": 0.0,
            "min": 0.0,
            "max": 0.0,
            "count": 5000
        },
        "SoccerTwos.Policy.ExtrinsicReward.mean": {
            "value": -0.010835595555224661,
            "min": -0.7297473683169013,
            "max": 0.471263162791729,
            "count": 5000
        },
        "SoccerTwos.Policy.ExtrinsicReward.sum": {
            "value": -1.27860027551651,
            "min": -60.449599623680115,
            "max": 58.70319998264313,
            "count": 5000
        },
        "SoccerTwos.Environment.GroupCumulativeReward.mean": {
            "value": -0.010835595555224661,
            "min": -0.7297473683169013,
            "max": 0.471263162791729,
            "count": 5000
        },
        "SoccerTwos.Environment.GroupCumulativeReward.sum": {
            "value": -1.27860027551651,
            "min": -60.449599623680115,
            "max": 58.70319998264313,
            "count": 5000
        },
        "SoccerTwos.IsTraining.mean": {
            "value": 1.0,
            "min": 1.0,
            "max": 1.0,
            "count": 5000
        },
        "SoccerTwos.IsTraining.sum": {
            "value": 1.0,
            "min": 1.0,
            "max": 1.0,
            "count": 5000
        },
        "SoccerTwos.Losses.PolicyLoss.mean": {
            "value": 0.020745757979845316,
            "min": 0.00981990631359319,
            "max": 0.026678954934080443,
            "count": 2421
        },
        "SoccerTwos.Losses.PolicyLoss.sum": {
            "value": 0.020745757979845316,
            "min": 0.00981990631359319,
            "max": 0.026678954934080443,
            "count": 2421
        },
        "SoccerTwos.Losses.ValueLoss.mean": {
            "value": 0.07859083066383997,
            "min": 6.963343742730407e-05,
            "max": 0.13148470247785252,
            "count": 2421
        },
        "SoccerTwos.Losses.ValueLoss.sum": {
            "value": 0.07859083066383997,
            "min": 6.963343742730407e-05,
            "max": 0.13148470247785252,
            "count": 2421
        },
        "SoccerTwos.Losses.BaselineLoss.mean": {
            "value": 0.07936860620975494,
            "min": 7.014683821277382e-05,
            "max": 0.1338403267165025,
            "count": 2421
        },
        "SoccerTwos.Losses.BaselineLoss.sum": {
            "value": 0.07936860620975494,
            "min": 7.014683821277382e-05,
            "max": 0.1338403267165025,
            "count": 2421
        },
        "SoccerTwos.Policy.LearningRate.mean": {
            "value": 0.0003,
            "min": 0.0003,
            "max": 0.0003,
            "count": 2421
        },
        "SoccerTwos.Policy.LearningRate.sum": {
            "value": 0.0003,
            "min": 0.0003,
            "max": 0.0003,
            "count": 2421
        },
        "SoccerTwos.Policy.Epsilon.mean": {
            "value": 0.20000000000000007,
            "min": 0.19999999999999996,
            "max": 0.20000000000000007,
            "count": 2421
        },
        "SoccerTwos.Policy.Epsilon.sum": {
            "value": 0.20000000000000007,
            "min": 0.19999999999999996,
            "max": 0.20000000000000007,
            "count": 2421
        },
        "SoccerTwos.Policy.Beta.mean": {
            "value": 0.005000000000000001,
            "min": 0.005,
            "max": 0.005000000000000001,
            "count": 2421
        },
        "SoccerTwos.Policy.Beta.sum": {
            "value": 0.005000000000000001,
            "min": 0.005,
            "max": 0.005000000000000001,
            "count": 2421
        }
    },
    "metadata": {
        "timer_format_version": "0.1.0",
        "start_time_seconds": "1728814196",
        "python_version": "3.10.12 (main, Jul  5 2023, 18:54:27) [GCC 11.2.0]",
        "command_line_arguments": "/home/nagi/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
        "mlagents_version": "1.2.0.dev0",
        "mlagents_envs_version": "1.2.0.dev0",
        "communication_protocol_version": "1.5.0",
        "pytorch_version": "2.4.1+cu121",
        "numpy_version": "1.23.5",
        "end_time_seconds": "1728886394"
    },
    "total": 72197.922459742,
    "count": 1,
    "self": 1.0210029189911438,
    "children": {
        "run_training.setup": {
            "total": 0.012210681000169643,
            "count": 1,
            "self": 0.012210681000169643
        },
        "TrainerController.start_learning": {
            "total": 72196.889246142,
            "count": 1,
            "self": 51.1761235750746,
            "children": {
                "TrainerController._reset_env": {
                    "total": 4.610870969944699,
                    "count": 250,
                    "self": 4.610870969944699
                },
                "TrainerController.advance": {
                    "total": 72141.01020455398,
                    "count": 3429249,
                    "self": 52.07689644732454,
                    "children": {
                        "env_step": {
                            "total": 57992.53542821247,
                            "count": 3429249,
                            "self": 40204.73437785148,
                            "children": {
                                "SubprocessEnvManager._take_step": {
                                    "total": 17756.30232411364,
                                    "count": 3429249,
                                    "self": 296.7708337275253,
                                    "children": {
                                        "TorchPolicy.evaluate": {
                                            "total": 17459.531490386114,
                                            "count": 6286026,
                                            "self": 17459.531490386114
                                        }
                                    }
                                },
                                "workers": {
                                    "total": 31.49872624735235,
                                    "count": 3429249,
                                    "self": 0.0,
                                    "children": {
                                        "worker_root": {
                                            "total": 72101.60515642047,
                                            "count": 3429249,
                                            "is_parallel": true,
                                            "self": 36896.33861923412,
                                            "children": {
                                                "run_training.setup": {
                                                    "total": 0.0,
                                                    "count": 0,
                                                    "is_parallel": true,
                                                    "self": 0.0,
                                                    "children": {
                                                        "steps_from_proto": {
                                                            "total": 0.0021235510000678914,
                                                            "count": 2,
                                                            "is_parallel": true,
                                                            "self": 0.00090454100018178,
                                                            "children": {
                                                                "_process_rank_one_or_two_observation": {
                                                                    "total": 0.0012190099998861115,
                                                                    "count": 8,
                                                                    "is_parallel": true,
                                                                    "self": 0.0012190099998861115
                                                                }
                                                            }
                                                        },
                                                        "UnityEnvironment.step": {
                                                            "total": 0.01977080400001796,
                                                            "count": 1,
                                                            "is_parallel": true,
                                                            "self": 0.00034734999985630566,
                                                            "children": {
                                                                "UnityEnvironment._generate_step_input": {
                                                                    "total": 0.0002519260001463408,
                                                                    "count": 1,
                                                                    "is_parallel": true,
                                                                    "self": 0.0002519260001463408
                                                                },
                                                                "communicator.exchange": {
                                                                    "total": 0.01814612099997248,
                                                                    "count": 1,
                                                                    "is_parallel": true,
                                                                    "self": 0.01814612099997248
                                                                },
                                                                "steps_from_proto": {
                                                                    "total": 0.0010254070000428328,
                                                                    "count": 2,
                                                                    "is_parallel": true,
                                                                    "self": 0.00024765400007709104,
                                                                    "children": {
                                                                        "_process_rank_one_or_two_observation": {
                                                                            "total": 0.0007777529999657418,
                                                                            "count": 8,
                                                                            "is_parallel": true,
                                                                            "self": 0.0007777529999657418
                                                                        }
                                                                    }
                                                                }
                                                            }
                                                        }
                                                    }
                                                },
                                                "UnityEnvironment.step": {
                                                    "total": 35205.030267951384,
                                                    "count": 3429248,
                                                    "is_parallel": true,
                                                    "self": 1034.706717121553,
                                                    "children": {
                                                        "UnityEnvironment._generate_step_input": {
                                                            "total": 635.1617354733712,
                                                            "count": 3429248,
                                                            "is_parallel": true,
                                                            "self": 635.1617354733712
                                                        },
                                                        "communicator.exchange": {
                                                            "total": 30483.28878681977,
                                                            "count": 3429248,
                                                            "is_parallel": true,
                                                            "self": 30483.28878681977
                                                        },
                                                        "steps_from_proto": {
                                                            "total": 3051.8730285366937,
                                                            "count": 6858496,
                                                            "is_parallel": true,
                                                            "self": 688.1159350191438,
                                                            "children": {
                                                                "_process_rank_one_or_two_observation": {
                                                                    "total": 2363.75709351755,
                                                                    "count": 27433984,
                                                                    "is_parallel": true,
                                                                    "self": 2363.75709351755
                                                                }
                                                            }
                                                        }
                                                    }
                                                },
                                                "steps_from_proto": {
                                                    "total": 0.23626923496658492,
                                                    "count": 498,
                                                    "is_parallel": true,
                                                    "self": 0.054451374094924176,
                                                    "children": {
                                                        "_process_rank_one_or_two_observation": {
                                                            "total": 0.18181786087166074,
                                                            "count": 1992,
                                                            "is_parallel": true,
                                                            "self": 0.18181786087166074
                                                        }
                                                    }
                                                }
                                            }
                                        }
                                    }
                                }
                            }
                        },
                        "trainer_advance": {
                            "total": 14096.397879894184,
                            "count": 3429249,
                            "self": 352.32939927972257,
                            "children": {
                                "process_trajectory": {
                                    "total": 7242.712258473682,
                                    "count": 3429249,
                                    "self": 7233.037569496666,
                                    "children": {
                                        "RLTrainer._checkpoint": {
                                            "total": 9.674688977015194,
                                            "count": 100,
                                            "self": 9.674688977015194
                                        }
                                    }
                                },
                                "_update_policy": {
                                    "total": 6501.35622214078,
                                    "count": 2421,
                                    "self": 3916.9756206946913,
                                    "children": {
                                        "TorchPOCAOptimizer.update": {
                                            "total": 2584.380601446089,
                                            "count": 72642,
                                            "self": 2584.380601446089
                                        }
                                    }
                                }
                            }
                        }
                    }
                },
                "trainer_threads": {
                    "total": 4.869943950325251e-07,
                    "count": 1,
                    "self": 4.869943950325251e-07
                },
                "TrainerController._save_models": {
                    "total": 0.09204655600478873,
                    "count": 1,
                    "self": 0.0009647410042816773,
                    "children": {
                        "RLTrainer._checkpoint": {
                            "total": 0.09108181500050705,
                            "count": 1,
                            "self": 0.09108181500050705
                        }
                    }
                }
            }
        }
    }
}