poca-SoccerTwos / run_logs /timers.json
timjwhite's picture
First Push
aef946e
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.5824898481369019,
"min": 1.5824898481369019,
"max": 1.9090577363967896,
"count": 64
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 158299.625,
"min": 158299.625,
"max": 194502.90625,
"count": 64
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 51.225469728601254,
"min": 47.746588693957115,
"max": 71.39710144927537,
"count": 64
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 98148.0,
"min": 96632.0,
"max": 98816.0,
"count": 64
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1508.1363786078211,
"min": 1473.5221745025995,
"max": 1529.2443052678618,
"count": 64
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 1444794.6507062926,
"min": 1028764.0045122284,
"max": 1537430.1608911173,
"count": 64
},
"SoccerTwos.Step.mean": {
"value": 8899874.0,
"min": 5749974.0,
"max": 8899874.0,
"count": 64
},
"SoccerTwos.Step.sum": {
"value": 8899874.0,
"min": 5749974.0,
"max": 8899874.0,
"count": 64
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.0002751847496256232,
"min": -0.0704675242304802,
"max": 0.05401033163070679,
"count": 64
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.26335179805755615,
"min": -66.81063842773438,
"max": 42.560142517089844,
"count": 64
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.004515423439443111,
"min": -0.07144340127706528,
"max": 0.051143623888492584,
"count": 64
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -4.321260452270508,
"min": -64.05392456054688,
"max": 40.30117416381836,
"count": 64
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 64
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 64
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.02917032437389298,
"min": -0.10855413350570466,
"max": 0.09264945305671943,
"count": 64
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -27.916000425815582,
"min": -93.2480006814003,
"max": 84.68160009384155,
"count": 64
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.02917032437389298,
"min": -0.10855413350570466,
"max": 0.09264945305671943,
"count": 64
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -27.916000425815582,
"min": -93.2480006814003,
"max": 84.68160009384155,
"count": 64
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.018681833112835496,
"min": 0.014127501142401242,
"max": 0.020697781255391116,
"count": 64
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.05604549933850649,
"min": 0.028315532435226484,
"max": 0.057246277056401604,
"count": 64
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.12366595591108004,
"min": 0.08892387400070825,
"max": 0.12366595591108004,
"count": 64
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.3709978677332401,
"min": 0.1778477480014165,
"max": 0.3709978677332401,
"count": 64
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.12668096588717567,
"min": 0.09020149645706017,
"max": 0.12668096588717567,
"count": 64
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.380042897661527,
"min": 0.18040299291412035,
"max": 0.380042897661527,
"count": 64
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 64
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0009,
"min": 0.0006,
"max": 0.0009,
"count": 64
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 64
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.6000000000000002,
"min": 0.40000000000000013,
"max": 0.6000000000000002,
"count": 64
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 64
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.015000000000000003,
"min": 0.010000000000000002,
"max": 0.015000000000000003,
"count": 64
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 64
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 64
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1689545754",
"python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
"command_line_arguments": "/home/timjwhite/.local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --resume --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1689554406"
},
"total": 8652.359177459,
"count": 1,
"self": 0.24237303400150267,
"children": {
"run_training.setup": {
"total": 0.04718287900004725,
"count": 1,
"self": 0.04718287900004725
},
"TrainerController.start_learning": {
"total": 8652.069621546,
"count": 1,
"self": 4.708958225339302,
"children": {
"TrainerController._reset_env": {
"total": 9.899197846001243,
"count": 18,
"self": 9.899197846001243
},
"TrainerController.advance": {
"total": 8637.195361422659,
"count": 222816,
"self": 4.77625178893868,
"children": {
"env_step": {
"total": 6819.7162154938205,
"count": 222816,
"self": 5537.285447605323,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1279.8399814283537,
"count": 222816,
"self": 30.754265482031542,
"children": {
"TorchPolicy.evaluate": {
"total": 1249.0857159463221,
"count": 401938,
"self": 1249.0857159463221
}
}
},
"workers": {
"total": 2.5907864601442725,
"count": 222815,
"self": 0.0,
"children": {
"worker_root": {
"total": 8637.943608716465,
"count": 222815,
"is_parallel": true,
"self": 3749.0665332869085,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.011673448999999891,
"count": 2,
"is_parallel": true,
"self": 0.0070754110001871595,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.004598037999812732,
"count": 8,
"is_parallel": true,
"self": 0.004598037999812732
}
}
},
"UnityEnvironment.step": {
"total": 0.03501203599989822,
"count": 1,
"is_parallel": true,
"self": 0.0014596029998301674,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.001354877000039778,
"count": 1,
"is_parallel": true,
"self": 0.001354877000039778
},
"communicator.exchange": {
"total": 0.027357521000112683,
"count": 1,
"is_parallel": true,
"self": 0.027357521000112683
},
"steps_from_proto": {
"total": 0.004840034999915588,
"count": 2,
"is_parallel": true,
"self": 0.0011863969998557877,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0036536380000598,
"count": 8,
"is_parallel": true,
"self": 0.0036536380000598
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.07651414700058012,
"count": 34,
"is_parallel": true,
"self": 0.01597959500372781,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.060534551996852315,
"count": 136,
"is_parallel": true,
"self": 0.060534551996852315
}
}
},
"UnityEnvironment.step": {
"total": 4888.800561282556,
"count": 222814,
"is_parallel": true,
"self": 291.07946570729473,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 203.93879390035477,
"count": 222814,
"is_parallel": true,
"self": 203.93879390035477
},
"communicator.exchange": {
"total": 3481.787563310218,
"count": 222814,
"is_parallel": true,
"self": 3481.787563310218
},
"steps_from_proto": {
"total": 911.9947383646886,
"count": 445628,
"is_parallel": true,
"self": 190.49647091938618,
"children": {
"_process_rank_one_or_two_observation": {
"total": 721.4982674453024,
"count": 1782512,
"is_parallel": true,
"self": 721.4982674453024
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1812.7028941398985,
"count": 222815,
"self": 28.87042225176083,
"children": {
"process_trajectory": {
"total": 779.9697009141312,
"count": 222815,
"self": 778.292166592131,
"children": {
"RLTrainer._checkpoint": {
"total": 1.677534322000156,
"count": 6,
"self": 1.677534322000156
}
}
},
"_update_policy": {
"total": 1003.8627709740065,
"count": 155,
"self": 636.5023784550285,
"children": {
"TorchPOCAOptimizer.update": {
"total": 367.36039251897796,
"count": 4650,
"self": 367.36039251897796
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.1709998943842947e-06,
"count": 1,
"self": 1.1709998943842947e-06
},
"TrainerController._save_models": {
"total": 0.26610288099982427,
"count": 1,
"self": 0.001952478000021074,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2641504029998032,
"count": 1,
"self": 0.2641504029998032
}
}
}
}
}
}
}