try again

9c344da about 1 year ago

15.7 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.0170891284942627,
	"min": 1.8789044618606567,
	"max": 3.295760154724121,
	"count": 496
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 44408.234375,
	"min": 21455.42578125,
	"max": 154475.640625,
	"count": 496
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 67.27777777777777,
	"min": 44.81651376146789,
	"max": 999.0,
	"count": 496
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19376.0,
	"min": 16228.0,
	"max": 23912.0,
	"count": 496
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1508.1163604947023,
	"min": 1182.8421708455958,
	"max": 1519.6095622292594,
	"count": 487
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 217168.75591123712,
	"min": 2369.2644624010436,
	"max": 323656.72171062784,
	"count": 487
	},
	"SoccerTwos.Step.mean": {
	"value": 4959977.0,
	"min": 9972.0,
	"max": 4959977.0,
	"count": 496
	},
	"SoccerTwos.Step.sum": {
	"value": 4959977.0,
	"min": 9972.0,
	"max": 4959977.0,
	"count": 496
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.015529231168329716,
	"min": -0.16310332715511322,
	"max": 0.27335065603256226,
	"count": 496
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 2.2517385482788086,
	"min": -25.770326614379883,
	"max": 31.36713409423828,
	"count": 496
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.010477464646100998,
	"min": -0.1623694747686386,
	"max": 0.2630256414413452,
	"count": 496
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 1.5192323923110962,
	"min": -25.654376983642578,
	"max": 31.72089385986328,
	"count": 496
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 496
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 496
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.1311737927897223,
	"min": -0.55129166568319,
	"max": 0.4727384608525496,
	"count": 496
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -19.020199954509735,
	"min": -48.20039987564087,
	"max": 62.700600147247314,
	"count": 496
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.1311737927897223,
	"min": -0.55129166568319,
	"max": 0.4727384608525496,
	"count": 496
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -19.020199954509735,
	"min": -48.20039987564087,
	"max": 62.700600147247314,
	"count": 496
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 496
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 496
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.02880678440108871,
	"min": 0.019772288502038767,
	"max": 0.031095777271548285,
	"count": 238
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.02880678440108871,
	"min": 0.019772288502038767,
	"max": 0.031095777271548285,
	"count": 238
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.07831853032112121,
	"min": 0.00012128652103874918,
	"max": 0.11398706659674644,
	"count": 238
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.07831853032112121,
	"min": 0.00012128652103874918,
	"max": 0.11398706659674644,
	"count": 238
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.0830160591751337,
	"min": 0.0001215280617182702,
	"max": 0.12332418784499169,
	"count": 238
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.0830160591751337,
	"min": 0.0001215280617182702,
	"max": 0.12332418784499169,
	"count": 238
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0006000000000000002,
	"min": 0.0006000000000000002,
	"max": 0.0006000000000000004,
	"count": 238
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0006000000000000002,
	"min": 0.0006000000000000002,
	"max": 0.0006000000000000004,
	"count": 238
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.19999999999999993,
	"min": 0.1999999999999999,
	"max": 0.19999999999999993,
	"count": 238
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.19999999999999993,
	"min": 0.1999999999999999,
	"max": 0.19999999999999993,
	"count": 238
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 238
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 238
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1696221287",
	"python_version": "3.9.13 (main, Aug 25 2022, 18:29:29) \n[Clang 12.0.0 ]",
	"command_line_arguments": "/Users/min/opt/anaconda3/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=impatientSoccerPlayer --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0",
	"numpy_version": "1.21.5",
	"end_time_seconds": "1696243759"
	},
	"total": 22472.209734666,
	"count": 1,
	"self": 0.8138606240027002,
	"children": {
	"run_training.setup": {
	"total": 0.05455804200000003,
	"count": 1,
	"self": 0.05455804200000003
	},
	"TrainerController.start_learning": {
	"total": 22471.341316,
	"count": 1,
	"self": 5.888035890762694,
	"children": {
	"TrainerController._reset_env": {
	"total": 12.478927579004504,
	"count": 245,
	"self": 12.478927579004504
	},
	"TrainerController.advance": {
	"total": 22452.74893290523,
	"count": 369444,
	"self": 5.0823435700185655,
	"children": {
	"env_step": {
	"total": 5304.438053194684,
	"count": 369444,
	"self": 4300.56540087665,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1000.1727141657639,
	"count": 369444,
	"self": 26.993620021142306,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 973.1790941446216,
	"count": 694912,
	"self": 973.1790941446216
	}
	}
	},
	"workers": {
	"total": 3.6999381522700503,
	"count": 369444,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 22397.987685314532,
	"count": 369444,
	"is_parallel": true,
	"self": 18728.82446173286,
	"children": {
	"steps_from_proto": {
	"total": 0.3672039240000524,
	"count": 490,
	"is_parallel": true,
	"self": 0.06699814807154514,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.3002057759285073,
	"count": 1960,
	"is_parallel": true,
	"self": 0.3002057759285073
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 3668.796019657671,
	"count": 369444,
	"is_parallel": true,
	"self": 287.1529651292035,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 120.71345707751362,
	"count": 369444,
	"is_parallel": true,
	"self": 120.71345707751362
	},
	"communicator.exchange": {
	"total": 2755.4013959973745,
	"count": 369444,
	"is_parallel": true,
	"self": 2755.4013959973745
	},
	"steps_from_proto": {
	"total": 505.52820145357924,
	"count": 738888,
	"is_parallel": true,
	"self": 86.93492432616353,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 418.5932771274157,
	"count": 2955552,
	"is_parallel": true,
	"self": 418.5932771274157
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 17143.228536140527,
	"count": 369444,
	"self": 44.14212389020031,
	"children": {
	"process_trajectory": {
	"total": 2110.2125743713127,
	"count": 369444,
	"self": 2108.1162062453136,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.0963681259991063,
	"count": 9,
	"self": 2.0963681259991063
	}
	}
	},
	"_update_policy": {
	"total": 14988.873837879013,
	"count": 239,
	"self": 655.389815831033,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 14333.48402204798,
	"count": 14402,
	"self": 14333.48402204798
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.2080017768312246e-06,
	"count": 1,
	"self": 1.2080017768312246e-06
	},
	"TrainerController._save_models": {
	"total": 0.22541841699785437,
	"count": 1,
	"self": 0.0033028759971784893,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.22211554100067588,
	"count": 1,
	"self": 0.22211554100067588
	}
	}
	}
	}
	}
	}
	}