poca-SoccerTwos / run_logs /timers.json
AlexChe's picture
Second Push
7fcd760
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.925425410270691,
"min": 1.915759801864624,
"max": 3.2958054542541504,
"count": 999
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 37584.3046875,
"min": 16128.560546875,
"max": 120293.8125,
"count": 999
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 52.34065934065934,
"min": 38.62698412698413,
"max": 999.0,
"count": 999
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19052.0,
"min": 8600.0,
"max": 31840.0,
"count": 999
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1529.3533261043233,
"min": 1183.3205100604046,
"max": 1580.9917070831711,
"count": 963
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 278342.30535098683,
"min": 2367.107393890611,
"max": 387650.7991294721,
"count": 963
},
"SoccerTwos.Step.mean": {
"value": 9999986.0,
"min": 9936.0,
"max": 9999986.0,
"count": 1000
},
"SoccerTwos.Step.sum": {
"value": 9999986.0,
"min": 9936.0,
"max": 9999986.0,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.00248384615406394,
"min": -0.08259005099534988,
"max": 0.16389651596546173,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 0.4520599842071533,
"min": -17.674270629882812,
"max": 21.08759307861328,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.0029731635004281998,
"min": -0.08249327540397644,
"max": 0.17476192116737366,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 0.5411157608032227,
"min": -17.653560638427734,
"max": 20.636287689208984,
"count": 1000
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 1000
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.06966813187022786,
"min": -0.7774249985814095,
"max": 0.592375762534864,
"count": 1000
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 12.67960000038147,
"min": -55.94960010051727,
"max": 51.77119994163513,
"count": 1000
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.06966813187022786,
"min": -0.7774249985814095,
"max": 0.592375762534864,
"count": 1000
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 12.67960000038147,
"min": -55.94960010051727,
"max": 51.77119994163513,
"count": 1000
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 1000
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 1000
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.017772479609023624,
"min": 0.013106207802290252,
"max": 0.02294513695621087,
"count": 241
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.017772479609023624,
"min": 0.013106207802290252,
"max": 0.02294513695621087,
"count": 241
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.10266318197051684,
"min": 0.00021628589521848577,
"max": 0.10266318197051684,
"count": 241
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.10266318197051684,
"min": 0.00021628589521848577,
"max": 0.10266318197051684,
"count": 241
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10306878151992957,
"min": 0.00021604419152936315,
"max": 0.10306878151992957,
"count": 241
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10306878151992957,
"min": 0.00021604419152936315,
"max": 0.10306878151992957,
"count": 241
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 1.039799480599895e-07,
"min": 1.039799480599895e-07,
"max": 0.00019908356045822005,
"count": 241
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 1.039799480599895e-07,
"min": 1.039799480599895e-07,
"max": 0.00019908356045822005,
"count": 241
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.10005193999999999,
"min": 0.10005193999999999,
"max": 0.19954178000000003,
"count": 241
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.10005193999999999,
"min": 0.10005193999999999,
"max": 0.19954178000000003,
"count": 241
},
"SoccerTwos.Policy.Beta.mean": {
"value": 1.2591805999999739e-05,
"min": 1.2591805999999739e-05,
"max": 0.004977134822000001,
"count": 241
},
"SoccerTwos.Policy.Beta.sum": {
"value": 1.2591805999999739e-05,
"min": 1.2591805999999739e-05,
"max": 0.004977134822000001,
"count": 241
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1675676285",
"python_version": "3.9.15 (main, Oct 12 2022, 19:14:24) \n[GCC 9.4.0]",
"command_line_arguments": "/home/alex_ch/Documents/soccer/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos11 --no-graphics --forc",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1675689426"
},
"total": 13141.40194816608,
"count": 1,
"self": 0.2199119576252997,
"children": {
"run_training.setup": {
"total": 0.017643160186707973,
"count": 1,
"self": 0.017643160186707973
},
"TrainerController.start_learning": {
"total": 13141.164393048268,
"count": 1,
"self": 11.515696075744927,
"children": {
"TrainerController._reset_env": {
"total": 3.5481117190793157,
"count": 40,
"self": 3.5481117190793157
},
"TrainerController.advance": {
"total": 13125.719392045401,
"count": 670314,
"self": 12.56607809336856,
"children": {
"env_step": {
"total": 10137.776378094219,
"count": 670314,
"self": 7932.83226008201,
"children": {
"SubprocessEnvManager._take_step": {
"total": 2197.358084292151,
"count": 670314,
"self": 64.50146153476089,
"children": {
"TorchPolicy.evaluate": {
"total": 2132.85662275739,
"count": 1268100,
"self": 2132.85662275739
}
}
},
"workers": {
"total": 7.586033720057458,
"count": 670314,
"self": 0.0,
"children": {
"worker_root": {
"total": 13123.940445470624,
"count": 670314,
"is_parallel": true,
"self": 6547.930196742527,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0017680441960692406,
"count": 2,
"is_parallel": true,
"self": 0.0004641655832529068,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013038786128163338,
"count": 8,
"is_parallel": true,
"self": 0.0013038786128163338
}
}
},
"UnityEnvironment.step": {
"total": 0.024935865309089422,
"count": 1,
"is_parallel": true,
"self": 0.0004292144440114498,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0003173109143972397,
"count": 1,
"is_parallel": true,
"self": 0.0003173109143972397
},
"communicator.exchange": {
"total": 0.022921456955373287,
"count": 1,
"is_parallel": true,
"self": 0.022921456955373287
},
"steps_from_proto": {
"total": 0.0012678829953074455,
"count": 2,
"is_parallel": true,
"self": 0.0002644117921590805,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001003471203148365,
"count": 8,
"is_parallel": true,
"self": 0.001003471203148365
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 6575.949935941491,
"count": 670313,
"is_parallel": true,
"self": 386.8673889040947,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 225.78400005586445,
"count": 670313,
"is_parallel": true,
"self": 225.78400005586445
},
"communicator.exchange": {
"total": 4956.217983013019,
"count": 670313,
"is_parallel": true,
"self": 4956.217983013019
},
"steps_from_proto": {
"total": 1007.0805639685132,
"count": 1340626,
"is_parallel": true,
"self": 190.8026582240127,
"children": {
"_process_rank_one_or_two_observation": {
"total": 816.2779057445005,
"count": 5362504,
"is_parallel": true,
"self": 816.2779057445005
}
}
}
}
},
"steps_from_proto": {
"total": 0.06031278660520911,
"count": 78,
"is_parallel": true,
"self": 0.011089394800364971,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.04922339180484414,
"count": 312,
"is_parallel": true,
"self": 0.04922339180484414
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2975.376935857814,
"count": 670314,
"self": 83.94245607219636,
"children": {
"process_trajectory": {
"total": 1001.9303183853626,
"count": 670314,
"self": 994.2248323266394,
"children": {
"RLTrainer._checkpoint": {
"total": 7.7054860587231815,
"count": 20,
"self": 7.7054860587231815
}
}
},
"_update_policy": {
"total": 1889.5041614002548,
"count": 241,
"self": 1125.2545917071402,
"children": {
"TorchPOCAOptimizer.update": {
"total": 764.2495696931146,
"count": 14466,
"self": 764.2495696931146
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.819624781608582e-07,
"count": 1,
"self": 8.819624781608582e-07
},
"TrainerController._save_models": {
"total": 0.38119232608005404,
"count": 1,
"self": 0.00203861016780138,
"children": {
"RLTrainer._checkpoint": {
"total": 0.37915371591225266,
"count": 1,
"self": 0.37915371591225266
}
}
}
}
}
}
}