Mattttthew's picture
First Push
136c481 verified
raw
history blame
15.6 kB
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 3.2957005500793457,
"min": 3.2957005500793457,
"max": 3.2957005500793457,
"count": 1
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 105462.4140625,
"min": 105462.4140625,
"max": 105462.4140625,
"count": 1
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 917.875,
"min": 917.875,
"max": 917.875,
"count": 1
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 29372.0,
"min": 29372.0,
"max": 29372.0,
"count": 1
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1199.2507195558546,
"min": 1199.2507195558546,
"max": 1199.2507195558546,
"count": 1
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 2398.5014391117093,
"min": 2398.5014391117093,
"max": 2398.5014391117093,
"count": 1
},
"SoccerTwos.Step.mean": {
"value": 9702.0,
"min": 9702.0,
"max": 9702.0,
"count": 1
},
"SoccerTwos.Step.sum": {
"value": 9702.0,
"min": 9702.0,
"max": 9702.0,
"count": 1
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.08133453130722046,
"min": -0.08133453130722046,
"max": -0.08133453130722046,
"count": 1
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.894679844379425,
"min": -0.894679844379425,
"max": -0.894679844379425,
"count": 1
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.0813639685511589,
"min": -0.0813639685511589,
"max": -0.0813639685511589,
"count": 1
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.895003616809845,
"min": -0.895003616809845,
"max": -0.895003616809845,
"count": 1
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 1
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 1
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.18181818181818182,
"min": -0.18181818181818182,
"max": -0.18181818181818182,
"count": 1
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -2.0,
"min": -2.0,
"max": -2.0,
"count": 1
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.18181818181818182,
"min": -0.18181818181818182,
"max": -0.18181818181818182,
"count": 1
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -2.0,
"min": -2.0,
"max": -2.0,
"count": 1
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 1
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 1
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1706818216",
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos-v1 --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.2.0+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1706818272"
},
"total": 56.39498970999966,
"count": 1,
"self": 0.29079812299960395,
"children": {
"run_training.setup": {
"total": 0.049794839000242064,
"count": 1,
"self": 0.049794839000242064
},
"TrainerController.start_learning": {
"total": 56.05439674799982,
"count": 1,
"self": 0.04185226799108932,
"children": {
"TrainerController._reset_env": {
"total": 3.0504669280003327,
"count": 1,
"self": 3.0504669280003327
},
"TrainerController.advance": {
"total": 52.60615961500844,
"count": 1869,
"self": 0.045332208999752766,
"children": {
"env_step": {
"total": 50.107337278998784,
"count": 1869,
"self": 38.11959407299173,
"children": {
"SubprocessEnvManager._take_step": {
"total": 11.963706537995677,
"count": 1869,
"self": 0.29824500799759335,
"children": {
"TorchPolicy.evaluate": {
"total": 11.665461529998083,
"count": 3730,
"self": 11.665461529998083
}
}
},
"workers": {
"total": 0.024036668011376605,
"count": 1868,
"self": 0.0,
"children": {
"worker_root": {
"total": 55.599608670982434,
"count": 1868,
"is_parallel": true,
"self": 23.68868511599112,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.007481627999823104,
"count": 2,
"is_parallel": true,
"self": 0.005101965999074309,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0023796620007487945,
"count": 8,
"is_parallel": true,
"self": 0.0023796620007487945
}
}
},
"UnityEnvironment.step": {
"total": 0.04210882200004562,
"count": 1,
"is_parallel": true,
"self": 0.0012597169998116442,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0010210039999947185,
"count": 1,
"is_parallel": true,
"self": 0.0010210039999947185
},
"communicator.exchange": {
"total": 0.03614771999991717,
"count": 1,
"is_parallel": true,
"self": 0.03614771999991717
},
"steps_from_proto": {
"total": 0.003680381000322086,
"count": 2,
"is_parallel": true,
"self": 0.0007167789999584784,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0029636020003636077,
"count": 8,
"is_parallel": true,
"self": 0.0029636020003636077
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 31.910923554991314,
"count": 1867,
"is_parallel": true,
"self": 2.1844497469851376,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 1.4690378020013668,
"count": 1867,
"is_parallel": true,
"self": 1.4690378020013668
},
"communicator.exchange": {
"total": 21.416320795012325,
"count": 1867,
"is_parallel": true,
"self": 21.416320795012325
},
"steps_from_proto": {
"total": 6.841115210992484,
"count": 3734,
"is_parallel": true,
"self": 1.1023852910288952,
"children": {
"_process_rank_one_or_two_observation": {
"total": 5.738729919963589,
"count": 14936,
"is_parallel": true,
"self": 5.738729919963589
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2.4534901270099,
"count": 1868,
"self": 0.19774868901231457,
"children": {
"process_trajectory": {
"total": 2.2557414379975853,
"count": 1868,
"self": 2.2557414379975853
}
}
}
}
},
"trainer_threads": {
"total": 1.4470001588051673e-06,
"count": 1,
"self": 1.4470001588051673e-06
},
"TrainerController._save_models": {
"total": 0.3559164899997995,
"count": 1,
"self": 0.006759116999546677,
"children": {
"RLTrainer._checkpoint": {
"total": 0.34915737300025285,
"count": 1,
"self": 0.34915737300025285
}
}
}
}
}
}
}