POCA-SoccerTwos-v1 / run_logs /timers.json

First Push

136c481 verified about 1 year ago

15.6 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.2957005500793457,
	"min": 3.2957005500793457,
	"max": 3.2957005500793457,
	"count": 1
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 105462.4140625,
	"min": 105462.4140625,
	"max": 105462.4140625,
	"count": 1
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 917.875,
	"min": 917.875,
	"max": 917.875,
	"count": 1
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 29372.0,
	"min": 29372.0,
	"max": 29372.0,
	"count": 1
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1199.2507195558546,
	"min": 1199.2507195558546,
	"max": 1199.2507195558546,
	"count": 1
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 2398.5014391117093,
	"min": 2398.5014391117093,
	"max": 2398.5014391117093,
	"count": 1
	},
	"SoccerTwos.Step.mean": {
	"value": 9702.0,
	"min": 9702.0,
	"max": 9702.0,
	"count": 1
	},
	"SoccerTwos.Step.sum": {
	"value": 9702.0,
	"min": 9702.0,
	"max": 9702.0,
	"count": 1
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.08133453130722046,
	"min": -0.08133453130722046,
	"max": -0.08133453130722046,
	"count": 1
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.894679844379425,
	"min": -0.894679844379425,
	"max": -0.894679844379425,
	"count": 1
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.0813639685511589,
	"min": -0.0813639685511589,
	"max": -0.0813639685511589,
	"count": 1
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.895003616809845,
	"min": -0.895003616809845,
	"max": -0.895003616809845,
	"count": 1
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 1
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 1
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.18181818181818182,
	"min": -0.18181818181818182,
	"max": -0.18181818181818182,
	"count": 1
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -2.0,
	"min": -2.0,
	"max": -2.0,
	"count": 1
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.18181818181818182,
	"min": -0.18181818181818182,
	"max": -0.18181818181818182,
	"count": 1
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -2.0,
	"min": -2.0,
	"max": -2.0,
	"count": 1
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 1
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 1
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1706818216",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos-v1 --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.0+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1706818272"
	},
	"total": 56.39498970999966,
	"count": 1,
	"self": 0.29079812299960395,
	"children": {
	"run_training.setup": {
	"total": 0.049794839000242064,
	"count": 1,
	"self": 0.049794839000242064
	},
	"TrainerController.start_learning": {
	"total": 56.05439674799982,
	"count": 1,
	"self": 0.04185226799108932,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.0504669280003327,
	"count": 1,
	"self": 3.0504669280003327
	},
	"TrainerController.advance": {
	"total": 52.60615961500844,
	"count": 1869,
	"self": 0.045332208999752766,
	"children": {
	"env_step": {
	"total": 50.107337278998784,
	"count": 1869,
	"self": 38.11959407299173,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 11.963706537995677,
	"count": 1869,
	"self": 0.29824500799759335,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 11.665461529998083,
	"count": 3730,
	"self": 11.665461529998083
	}
	}
	},
	"workers": {
	"total": 0.024036668011376605,
	"count": 1868,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 55.599608670982434,
	"count": 1868,
	"is_parallel": true,
	"self": 23.68868511599112,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.007481627999823104,
	"count": 2,
	"is_parallel": true,
	"self": 0.005101965999074309,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0023796620007487945,
	"count": 8,
	"is_parallel": true,
	"self": 0.0023796620007487945
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04210882200004562,
	"count": 1,
	"is_parallel": true,
	"self": 0.0012597169998116442,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0010210039999947185,
	"count": 1,
	"is_parallel": true,
	"self": 0.0010210039999947185
	},
	"communicator.exchange": {
	"total": 0.03614771999991717,
	"count": 1,
	"is_parallel": true,
	"self": 0.03614771999991717
	},
	"steps_from_proto": {
	"total": 0.003680381000322086,
	"count": 2,
	"is_parallel": true,
	"self": 0.0007167789999584784,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0029636020003636077,
	"count": 8,
	"is_parallel": true,
	"self": 0.0029636020003636077
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 31.910923554991314,
	"count": 1867,
	"is_parallel": true,
	"self": 2.1844497469851376,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 1.4690378020013668,
	"count": 1867,
	"is_parallel": true,
	"self": 1.4690378020013668
	},
	"communicator.exchange": {
	"total": 21.416320795012325,
	"count": 1867,
	"is_parallel": true,
	"self": 21.416320795012325
	},
	"steps_from_proto": {
	"total": 6.841115210992484,
	"count": 3734,
	"is_parallel": true,
	"self": 1.1023852910288952,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 5.738729919963589,
	"count": 14936,
	"is_parallel": true,
	"self": 5.738729919963589
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 2.4534901270099,
	"count": 1868,
	"self": 0.19774868901231457,
	"children": {
	"process_trajectory": {
	"total": 2.2557414379975853,
	"count": 1868,
	"self": 2.2557414379975853
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.4470001588051673e-06,
	"count": 1,
	"self": 1.4470001588051673e-06
	},
	"TrainerController._save_models": {
	"total": 0.3559164899997995,
	"count": 1,
	"self": 0.006759116999546677,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.34915737300025285,
	"count": 1,
	"self": 0.34915737300025285
	}
	}
	}
	}
	}
	}
	}