|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 2.0103368759155273, |
|
"min": 1.9777865409851074, |
|
"max": 3.2957277297973633, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 38662.80078125, |
|
"min": 14614.603515625, |
|
"max": 120638.7265625, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 70.3768115942029, |
|
"min": 51.09375, |
|
"max": 999.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19424.0, |
|
"min": 15784.0, |
|
"max": 27088.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1564.4432060772401, |
|
"min": 1176.7258691064465, |
|
"max": 1580.0330219178438, |
|
"count": 492 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 215893.16243865914, |
|
"min": 2355.6993006599496, |
|
"max": 290868.49722051993, |
|
"count": 492 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 4999970.0, |
|
"min": 9560.0, |
|
"max": 4999970.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 4999970.0, |
|
"min": 9560.0, |
|
"max": 4999970.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.060075994580984116, |
|
"min": -0.10495267808437347, |
|
"max": 0.1653749793767929, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -8.290487289428711, |
|
"min": -16.626325607299805, |
|
"max": 27.782997131347656, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.06104997918009758, |
|
"min": -0.10382936894893646, |
|
"max": 0.1679215431213379, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -8.424897193908691, |
|
"min": -16.265779495239258, |
|
"max": 28.210819244384766, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.13375362278758615, |
|
"min": -0.8823529411764706, |
|
"max": 0.41410149211314184, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -18.45799994468689, |
|
"min": -41.70920014381409, |
|
"max": 50.97639989852905, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.13375362278758615, |
|
"min": -0.8823529411764706, |
|
"max": 0.41410149211314184, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -18.45799994468689, |
|
"min": -41.70920014381409, |
|
"max": 50.97639989852905, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.015407767969494064, |
|
"min": 0.011601856948497394, |
|
"max": 0.024236328400244627, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.015407767969494064, |
|
"min": 0.011601856948497394, |
|
"max": 0.024236328400244627, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.08410224045316378, |
|
"min": 0.0001900104902839909, |
|
"max": 0.10161295259992281, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.08410224045316378, |
|
"min": 0.0001900104902839909, |
|
"max": 0.10161295259992281, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.08507756615678469, |
|
"min": 0.00019070169025023158, |
|
"max": 0.10369378998875618, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.08507756615678469, |
|
"min": 0.00019070169025023158, |
|
"max": 0.10369378998875618, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 239 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 239 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1723712147", |
|
"python_version": "3.10.8 (main, Nov 24 2022, 14:13:03) [GCC 11.2.0]", |
|
"command_line_arguments": "/root/miniconda3/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.1.2+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1723724501" |
|
}, |
|
"total": 12354.318006377667, |
|
"count": 1, |
|
"self": 0.42288713436573744, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.034789071418344975, |
|
"count": 1, |
|
"self": 0.034789071418344975 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 12353.860330171883, |
|
"count": 1, |
|
"self": 5.262380417436361, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.691625320352614, |
|
"count": 21, |
|
"self": 2.691625320352614 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 12345.807688859291, |
|
"count": 333227, |
|
"self": 4.828748322091997, |
|
"children": { |
|
"env_step": { |
|
"total": 11043.155604165979, |
|
"count": 333227, |
|
"self": 10145.747690772638, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 893.9432374471799, |
|
"count": 333227, |
|
"self": 37.65499076526612, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 856.2882466819137, |
|
"count": 632172, |
|
"self": 856.2882466819137 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 3.464675946161151, |
|
"count": 333227, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 12330.256846216507, |
|
"count": 333227, |
|
"is_parallel": true, |
|
"self": 3141.1514767790213, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.007085210643708706, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0016971677541732788, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.005388042889535427, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.005388042889535427 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04877493344247341, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0017983177676796913, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.001361580565571785, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.001361580565571785 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04070513695478439, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04070513695478439 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.004909898154437542, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0010248394683003426, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0038850586861371994, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0038850586861371994 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 9189.011991587467, |
|
"count": 333226, |
|
"is_parallel": true, |
|
"self": 515.4125970257446, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 333.63409104477614, |
|
"count": 333226, |
|
"is_parallel": true, |
|
"self": 333.63409104477614 |
|
}, |
|
"communicator.exchange": { |
|
"total": 6891.873233468272, |
|
"count": 333226, |
|
"is_parallel": true, |
|
"self": 6891.873233468272 |
|
}, |
|
"steps_from_proto": { |
|
"total": 1448.092070048675, |
|
"count": 666452, |
|
"is_parallel": true, |
|
"self": 286.7437717281282, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 1161.3482983205467, |
|
"count": 2665808, |
|
"is_parallel": true, |
|
"self": 1161.3482983205467 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.09337785001844168, |
|
"count": 40, |
|
"is_parallel": true, |
|
"self": 0.01847281027585268, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.074905039742589, |
|
"count": 160, |
|
"is_parallel": true, |
|
"self": 0.074905039742589 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1297.8233363712206, |
|
"count": 333227, |
|
"self": 48.36833060905337, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 449.7733397288248, |
|
"count": 333227, |
|
"self": 448.74016169831157, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 1.033178030513227, |
|
"count": 10, |
|
"self": 1.033178030513227 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 799.6816660333425, |
|
"count": 239, |
|
"self": 540.5786511749029, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 259.10301485843956, |
|
"count": 7170, |
|
"self": 259.10301485843956 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 6.537884473800659e-07, |
|
"count": 1, |
|
"self": 6.537884473800659e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.09863492101430893, |
|
"count": 1, |
|
"self": 0.0014009485021233559, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.09723397251218557, |
|
"count": 1, |
|
"self": 0.09723397251218557 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |