yizhangliu's picture
First Push
fb248e6
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.542044997215271,
"min": 1.440100073814392,
"max": 1.6137632131576538,
"count": 300
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 32814.71875,
"min": 25896.232421875,
"max": 35227.22265625,
"count": 300
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 58.80952380952381,
"min": 44.72477064220183,
"max": 86.49122807017544,
"count": 300
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19760.0,
"min": 18724.0,
"max": 20772.0,
"count": 300
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1653.1870649019568,
"min": 1567.552494060283,
"max": 1655.0609915835641,
"count": 300
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 277735.42690352874,
"min": 185288.5933308388,
"max": 353285.91771309637,
"count": 300
},
"SoccerTwos.Step.mean": {
"value": 14999930.0,
"min": 12009982.0,
"max": 14999930.0,
"count": 300
},
"SoccerTwos.Step.sum": {
"value": 14999930.0,
"min": 12009982.0,
"max": 14999930.0,
"count": 300
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.04682938754558563,
"min": -0.11298096179962158,
"max": 0.093830406665802,
"count": 300
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -7.820508003234863,
"min": -17.991260528564453,
"max": 17.358625411987305,
"count": 300
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.04404613748192787,
"min": -0.10972505807876587,
"max": 0.09695275872945786,
"count": 300
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -7.3557047843933105,
"min": -17.871688842773438,
"max": 17.936260223388672,
"count": 300
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 300
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 300
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.12098922201259407,
"min": -0.2797437529079616,
"max": 0.27960924881731153,
"count": 300
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -20.20520007610321,
"min": -46.605599999427795,
"max": 48.3724000453949,
"count": 300
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.12098922201259407,
"min": -0.2797437529079616,
"max": 0.27960924881731153,
"count": 300
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -20.20520007610321,
"min": -46.605599999427795,
"max": 48.3724000453949,
"count": 300
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 300
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 300
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.016679967249122758,
"min": 0.013073392383133372,
"max": 0.024770521942991765,
"count": 145
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.016679967249122758,
"min": 0.013073392383133372,
"max": 0.024770521942991765,
"count": 145
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.10101278101404508,
"min": 0.08707024628917376,
"max": 0.11337359274427096,
"count": 145
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.10101278101404508,
"min": 0.08707024628917376,
"max": 0.11337359274427096,
"count": 145
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10257193421324094,
"min": 0.08828358178337416,
"max": 0.11552387624979019,
"count": 145
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10257193421324094,
"min": 0.08828358178337416,
"max": 0.11552387624979019,
"count": 145
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 145
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 145
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 145
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 145
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 145
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 145
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1675923540",
"python_version": "3.9.16 (main, Feb 6 2023, 20:06:40) \n[GCC 9.3.0]",
"command_line_arguments": "/usr/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1675935835"
},
"total": 12295.671090400021,
"count": 1,
"self": 0.32222739997087047,
"children": {
"run_training.setup": {
"total": 0.047608000051695853,
"count": 1,
"self": 0.047608000051695853
},
"TrainerController.start_learning": {
"total": 12295.301254999998,
"count": 1,
"self": 7.271457104652654,
"children": {
"TrainerController._reset_env": {
"total": 1.7654651998891495,
"count": 16,
"self": 1.7654651998891495
},
"TrainerController.advance": {
"total": 12285.502733295492,
"count": 207000,
"self": 7.892098882293794,
"children": {
"env_step": {
"total": 6744.709322719427,
"count": 207000,
"self": 5854.004936416459,
"children": {
"SubprocessEnvManager._take_step": {
"total": 886.3216951006325,
"count": 207000,
"self": 38.47987049946096,
"children": {
"TorchPolicy.evaluate": {
"total": 847.8418246011715,
"count": 376556,
"self": 847.8418246011715
}
}
},
"workers": {
"total": 4.382691202335991,
"count": 207000,
"self": 0.0,
"children": {
"worker_root": {
"total": 12277.59570988745,
"count": 207000,
"is_parallel": true,
"self": 7156.613118898065,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.004712300025857985,
"count": 2,
"is_parallel": true,
"self": 0.0014410000294446945,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0032712999964132905,
"count": 8,
"is_parallel": true,
"self": 0.0032712999964132905
}
}
},
"UnityEnvironment.step": {
"total": 0.059866299969144166,
"count": 1,
"is_parallel": true,
"self": 0.0009093000553548336,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0013091000146232545,
"count": 1,
"is_parallel": true,
"self": 0.0013091000146232545
},
"communicator.exchange": {
"total": 0.055025899957399815,
"count": 1,
"is_parallel": true,
"self": 0.055025899957399815
},
"steps_from_proto": {
"total": 0.002621999941766262,
"count": 2,
"is_parallel": true,
"self": 0.000580199935939163,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.002041800005827099,
"count": 8,
"is_parallel": true,
"self": 0.002041800005827099
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.034881899948231876,
"count": 30,
"is_parallel": true,
"self": 0.007476300408598036,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.02740559953963384,
"count": 120,
"is_parallel": true,
"self": 0.02740559953963384
}
}
},
"UnityEnvironment.step": {
"total": 5120.947709089436,
"count": 206999,
"is_parallel": true,
"self": 169.77864146704087,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 129.137426803587,
"count": 206999,
"is_parallel": true,
"self": 129.137426803587
},
"communicator.exchange": {
"total": 4308.419570893282,
"count": 206999,
"is_parallel": true,
"self": 4308.419570893282
},
"steps_from_proto": {
"total": 513.6120699255262,
"count": 413998,
"is_parallel": true,
"self": 112.80534110986628,
"children": {
"_process_rank_one_or_two_observation": {
"total": 400.8067288156599,
"count": 1655992,
"is_parallel": true,
"self": 400.8067288156599
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 5532.901311693771,
"count": 207000,
"self": 41.952493078657426,
"children": {
"process_trajectory": {
"total": 997.4942364149028,
"count": 207000,
"self": 996.1923424148699,
"children": {
"RLTrainer._checkpoint": {
"total": 1.3018940000329167,
"count": 6,
"self": 1.3018940000329167
}
}
},
"_update_policy": {
"total": 4493.454582200211,
"count": 145,
"self": 565.9212106984342,
"children": {
"TorchPOCAOptimizer.update": {
"total": 3927.533371501777,
"count": 4350,
"self": 3927.533371501777
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.9999570213258266e-06,
"count": 1,
"self": 1.9999570213258266e-06
},
"TrainerController._save_models": {
"total": 0.7615974000073038,
"count": 1,
"self": 0.0016035999869927764,
"children": {
"RLTrainer._checkpoint": {
"total": 0.759993800020311,
"count": 1,
"self": 0.759993800020311
}
}
}
}
}
}
}