|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 1.4048619270324707, |
|
"min": 1.3750499486923218, |
|
"max": 1.7051565647125244, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 28277.060546875, |
|
"min": 14701.9814453125, |
|
"max": 34322.671875, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 45.06422018348624, |
|
"min": 35.125, |
|
"max": 53.40425531914894, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19648.0, |
|
"min": 8072.0, |
|
"max": 20960.0, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1607.9046472284606, |
|
"min": 1555.6832652825399, |
|
"max": 1613.038356436412, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 350523.2130958044, |
|
"min": 163654.2453609866, |
|
"max": 434134.2547516843, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 9999982.0, |
|
"min": 6659988.0, |
|
"max": 9999982.0, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 9999982.0, |
|
"min": 6659988.0, |
|
"max": 9999982.0, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.03223046660423279, |
|
"min": -0.11106479167938232, |
|
"max": 0.10332842171192169, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 13.246722221374512, |
|
"min": -46.31401824951172, |
|
"max": 44.017906188964844, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.031953852623701096, |
|
"min": -0.11250180751085281, |
|
"max": 0.10477326810359955, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 13.133033752441406, |
|
"min": -46.91325378417969, |
|
"max": 44.6334114074707, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.09531192604554903, |
|
"min": -0.381275439994377, |
|
"max": 0.26663347656634745, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 20.777999877929688, |
|
"min": -86.93080031871796, |
|
"max": 62.125600039958954, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.09531192604554903, |
|
"min": -0.381275439994377, |
|
"max": 0.26663347656634745, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 20.777999877929688, |
|
"min": -86.93080031871796, |
|
"max": 62.125600039958954, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 335 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.01046212162455049, |
|
"min": 0.009879295097471185, |
|
"max": 0.014559235423075734, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.01046212162455049, |
|
"min": 0.009879295097471185, |
|
"max": 0.014559235423075734, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.05891079842112958, |
|
"min": 0.04971672408282757, |
|
"max": 0.05918900854885578, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.05891079842112958, |
|
"min": 0.04971672408282757, |
|
"max": 0.05918900854885578, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.05924153439700604, |
|
"min": 0.051102403877303006, |
|
"max": 0.05954511137679219, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.05924153439700604, |
|
"min": 0.051102403877303006, |
|
"max": 0.05954511137679219, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 6.4449295954992225e-09, |
|
"min": 6.4449295954992225e-09, |
|
"max": 0.00014248644558948728, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 6.4449295954992225e-09, |
|
"min": 6.4449295954992225e-09, |
|
"max": 0.00014248644558948728, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.10000085146159124, |
|
"min": 0.10000085146159124, |
|
"max": 0.11912103967704953, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.10000085146159124, |
|
"min": 0.10000085146159124, |
|
"max": 0.11912103967704953, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 1.0002659404254946e-05, |
|
"min": 1.0002659404254946e-05, |
|
"max": 6.972151274949521e-05, |
|
"count": 51 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 1.0002659404254946e-05, |
|
"min": 1.0002659404254946e-05, |
|
"max": 6.972151274949521e-05, |
|
"count": 51 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1710343829", |
|
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
|
"command_line_arguments": "/home/stephan/.conda/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos-read-deal --width=1280 --height=720 --resume", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.2.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1710353568" |
|
}, |
|
"total": 9739.254863360999, |
|
"count": 1, |
|
"self": 0.270132729987381, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.018506341002648696, |
|
"count": 1, |
|
"self": 0.018506341002648696 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 9738.966224290009, |
|
"count": 1, |
|
"self": 4.652608350283117, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 4.244304390012985, |
|
"count": 7, |
|
"self": 4.244304390012985 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 9729.947026144713, |
|
"count": 239073, |
|
"self": 4.148107524248189, |
|
"children": { |
|
"env_step": { |
|
"total": 4354.3673745146225, |
|
"count": 239073, |
|
"self": 3721.0493522615725, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 630.4299217515072, |
|
"count": 239073, |
|
"self": 19.02124206413282, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 611.4086796873744, |
|
"count": 418182, |
|
"self": 611.4086796873744 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 2.8881005015427945, |
|
"count": 239073, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 9731.739510110943, |
|
"count": 239073, |
|
"is_parallel": true, |
|
"self": 6533.360267171403, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.06389564499841072, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.000593470991589129, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.06330217400682159, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.06330217400682159 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.02612613000383135, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000600070008658804, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00040655999328009784, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00040655999328009784 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.02343449799809605, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.02343449799809605 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0016850020037963986, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0003057300054933876, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001379271998303011, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001379271998303011 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.012151043978519738, |
|
"count": 12, |
|
"is_parallel": true, |
|
"self": 0.002059131977148354, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.010091912001371384, |
|
"count": 48, |
|
"is_parallel": true, |
|
"self": 0.010091912001371384 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 3198.3670918955613, |
|
"count": 239072, |
|
"is_parallel": true, |
|
"self": 175.16570653802773, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 110.43290661888022, |
|
"count": 239072, |
|
"is_parallel": true, |
|
"self": 110.43290661888022 |
|
}, |
|
"communicator.exchange": { |
|
"total": 2470.8126502879313, |
|
"count": 239072, |
|
"is_parallel": true, |
|
"self": 2470.8126502879313 |
|
}, |
|
"steps_from_proto": { |
|
"total": 441.95582845072204, |
|
"count": 478144, |
|
"is_parallel": true, |
|
"self": 78.3687699053844, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 363.58705854533764, |
|
"count": 1912576, |
|
"is_parallel": true, |
|
"self": 363.58705854533764 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 5371.4315441058425, |
|
"count": 239073, |
|
"self": 26.83088273082103, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 1094.2377518599678, |
|
"count": 239073, |
|
"self": 1093.3974272879568, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.8403245720110135, |
|
"count": 7, |
|
"self": 0.8403245720110135 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 4250.362909515054, |
|
"count": 51, |
|
"self": 652.032682771809, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 3598.3302267432446, |
|
"count": 4080, |
|
"self": 3598.3302267432446 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.200011845678091e-07, |
|
"count": 1, |
|
"self": 9.200011845678091e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.12228448499809019, |
|
"count": 1, |
|
"self": 0.0026952329935738817, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.11958925200451631, |
|
"count": 1, |
|
"self": 0.11958925200451631 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |