|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 1.9089889526367188, |
|
"min": 1.8442237377166748, |
|
"max": 3.213865041732788, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 35919.53515625, |
|
"min": 29317.10546875, |
|
"max": 120344.625, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 62.17948717948718, |
|
"min": 42.51304347826087, |
|
"max": 999.0, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19400.0, |
|
"min": 11112.0, |
|
"max": 28436.0, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1556.9494059513054, |
|
"min": 1184.4253004330594, |
|
"max": 1576.660508881427, |
|
"count": 471 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 242884.10732840362, |
|
"min": 2370.6947943219175, |
|
"max": 334525.03998778446, |
|
"count": 471 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 5039949.0, |
|
"min": 329805.0, |
|
"max": 5039949.0, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 5039949.0, |
|
"min": 329805.0, |
|
"max": 5039949.0, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.010436630807816982, |
|
"min": -0.09697045385837555, |
|
"max": 0.1714733988046646, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -1.6385509967803955, |
|
"min": -16.600444793701172, |
|
"max": 23.41659164428711, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.01028787437826395, |
|
"min": -0.09972328692674637, |
|
"max": 0.17430460453033447, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -1.6151962280273438, |
|
"min": -17.1435546875, |
|
"max": 23.17365837097168, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.10489171933216654, |
|
"min": -0.5669750012457371, |
|
"max": 0.44391110796987276, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 16.467999935150146, |
|
"min": -50.66320013999939, |
|
"max": 46.512000262737274, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.10489171933216654, |
|
"min": -0.5669750012457371, |
|
"max": 0.44391110796987276, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 16.467999935150146, |
|
"min": -50.66320013999939, |
|
"max": 46.512000262737274, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 472 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.016275092681947476, |
|
"min": 0.010151559529488926, |
|
"max": 0.024196836646297015, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.016275092681947476, |
|
"min": 0.010151559529488926, |
|
"max": 0.024196836646297015, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.09684030537803968, |
|
"min": 0.0013416305688830714, |
|
"max": 0.11689281612634658, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.09684030537803968, |
|
"min": 0.0013416305688830714, |
|
"max": 0.11689281612634658, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.09833643784125647, |
|
"min": 0.0013579658038603763, |
|
"max": 0.11826808328429858, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.09833643784125647, |
|
"min": 0.0013579658038603763, |
|
"max": 0.11826808328429858, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 227 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 227 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1688468546", |
|
"python_version": "3.10.10 (main, Mar 21 2023, 18:45:11) [GCC 11.2.0]", |
|
"command_line_arguments": "/opt/conda/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1688485154" |
|
}, |
|
"total": 16607.525235416368, |
|
"count": 1, |
|
"self": 0.013366627972573042, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.015603977721184492, |
|
"count": 1, |
|
"self": 0.015603977721184492 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 16607.496264810674, |
|
"count": 1, |
|
"self": 8.919515123125166, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 1.5175714301876724, |
|
"count": 25, |
|
"self": 1.5175714301876724 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 16596.756896799896, |
|
"count": 322264, |
|
"self": 7.916705624666065, |
|
"children": { |
|
"env_step": { |
|
"total": 5911.727526604664, |
|
"count": 322264, |
|
"self": 4514.543463871349, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 1392.023328505922, |
|
"count": 322264, |
|
"self": 49.78212635125965, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 1342.2412021546625, |
|
"count": 595496, |
|
"self": 1342.2412021546625 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 5.1607342273928225, |
|
"count": 322264, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 16555.016848264262, |
|
"count": 322264, |
|
"is_parallel": true, |
|
"self": 12923.445410506334, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.00312175415456295, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0008582943119108677, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0022634598426520824, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0022634598426520824 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.026854357682168484, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006880271248519421, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0005317311733961105, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005317311733961105 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.023468355182558298, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.023468355182558298 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.002166244201362133, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.000483611598610878, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001682632602751255, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001682632602751255 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.053547489922493696, |
|
"count": 48, |
|
"is_parallel": true, |
|
"self": 0.010899828281253576, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.04264766164124012, |
|
"count": 192, |
|
"is_parallel": true, |
|
"self": 0.04264766164124012 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 3631.5178902680054, |
|
"count": 322263, |
|
"is_parallel": true, |
|
"self": 189.9846967374906, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 131.83427887735888, |
|
"count": 322263, |
|
"is_parallel": true, |
|
"self": 131.83427887735888 |
|
}, |
|
"communicator.exchange": { |
|
"total": 2676.0341983493418, |
|
"count": 322263, |
|
"is_parallel": true, |
|
"self": 2676.0341983493418 |
|
}, |
|
"steps_from_proto": { |
|
"total": 633.6647163038142, |
|
"count": 644526, |
|
"is_parallel": true, |
|
"self": 126.69072948535904, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 506.97398681845516, |
|
"count": 2578104, |
|
"is_parallel": true, |
|
"self": 506.97398681845516 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 10677.112664570566, |
|
"count": 322264, |
|
"self": 69.58496827818453, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 1633.3974608271383, |
|
"count": 322264, |
|
"self": 1630.1399948387407, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 3.2574659883975983, |
|
"count": 10, |
|
"self": 3.2574659883975983 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 8974.130235465243, |
|
"count": 228, |
|
"self": 946.202926828526, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 8027.9273086367175, |
|
"count": 6840, |
|
"self": 8027.9273086367175 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 2.514570951461792e-06, |
|
"count": 1, |
|
"self": 2.514570951461792e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.30227894289419055, |
|
"count": 1, |
|
"self": 0.005925939884036779, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.29635300301015377, |
|
"count": 1, |
|
"self": 0.29635300301015377 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |