poca-SoccerTwos-v5 / run_logs /timers.json

First Push

fb248e6 almost 2 years ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.542044997215271,
	"min": 1.440100073814392,
	"max": 1.6137632131576538,
	"count": 300
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 32814.71875,
	"min": 25896.232421875,
	"max": 35227.22265625,
	"count": 300
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 58.80952380952381,
	"min": 44.72477064220183,
	"max": 86.49122807017544,
	"count": 300
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19760.0,
	"min": 18724.0,
	"max": 20772.0,
	"count": 300
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1653.1870649019568,
	"min": 1567.552494060283,
	"max": 1655.0609915835641,
	"count": 300
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 277735.42690352874,
	"min": 185288.5933308388,
	"max": 353285.91771309637,
	"count": 300
	},
	"SoccerTwos.Step.mean": {
	"value": 14999930.0,
	"min": 12009982.0,
	"max": 14999930.0,
	"count": 300
	},
	"SoccerTwos.Step.sum": {
	"value": 14999930.0,
	"min": 12009982.0,
	"max": 14999930.0,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.04682938754558563,
	"min": -0.11298096179962158,
	"max": 0.093830406665802,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -7.820508003234863,
	"min": -17.991260528564453,
	"max": 17.358625411987305,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.04404613748192787,
	"min": -0.10972505807876587,
	"max": 0.09695275872945786,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -7.3557047843933105,
	"min": -17.871688842773438,
	"max": 17.936260223388672,
	"count": 300
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 300
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.12098922201259407,
	"min": -0.2797437529079616,
	"max": 0.27960924881731153,
	"count": 300
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -20.20520007610321,
	"min": -46.605599999427795,
	"max": 48.3724000453949,
	"count": 300
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.12098922201259407,
	"min": -0.2797437529079616,
	"max": 0.27960924881731153,
	"count": 300
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -20.20520007610321,
	"min": -46.605599999427795,
	"max": 48.3724000453949,
	"count": 300
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 300
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 300
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.016679967249122758,
	"min": 0.013073392383133372,
	"max": 0.024770521942991765,
	"count": 145
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.016679967249122758,
	"min": 0.013073392383133372,
	"max": 0.024770521942991765,
	"count": 145
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10101278101404508,
	"min": 0.08707024628917376,
	"max": 0.11337359274427096,
	"count": 145
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10101278101404508,
	"min": 0.08707024628917376,
	"max": 0.11337359274427096,
	"count": 145
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10257193421324094,
	"min": 0.08828358178337416,
	"max": 0.11552387624979019,
	"count": 145
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10257193421324094,
	"min": 0.08828358178337416,
	"max": 0.11552387624979019,
	"count": 145
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 145
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 145
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 145
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 145
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 145
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 145
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1675923540",
	"python_version": "3.9.16 (main, Feb 6 2023, 20:06:40) \n[GCC 9.3.0]",
	"command_line_arguments": "/usr/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1675935835"
	},
	"total": 12295.671090400021,
	"count": 1,
	"self": 0.32222739997087047,
	"children": {
	"run_training.setup": {
	"total": 0.047608000051695853,
	"count": 1,
	"self": 0.047608000051695853
	},
	"TrainerController.start_learning": {
	"total": 12295.301254999998,
	"count": 1,
	"self": 7.271457104652654,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.7654651998891495,
	"count": 16,
	"self": 1.7654651998891495
	},
	"TrainerController.advance": {
	"total": 12285.502733295492,
	"count": 207000,
	"self": 7.892098882293794,
	"children": {
	"env_step": {
	"total": 6744.709322719427,
	"count": 207000,
	"self": 5854.004936416459,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 886.3216951006325,
	"count": 207000,
	"self": 38.47987049946096,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 847.8418246011715,
	"count": 376556,
	"self": 847.8418246011715
	}
	}
	},
	"workers": {
	"total": 4.382691202335991,
	"count": 207000,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 12277.59570988745,
	"count": 207000,
	"is_parallel": true,
	"self": 7156.613118898065,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.004712300025857985,
	"count": 2,
	"is_parallel": true,
	"self": 0.0014410000294446945,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0032712999964132905,
	"count": 8,
	"is_parallel": true,
	"self": 0.0032712999964132905
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.059866299969144166,
	"count": 1,
	"is_parallel": true,
	"self": 0.0009093000553548336,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0013091000146232545,
	"count": 1,
	"is_parallel": true,
	"self": 0.0013091000146232545
	},
	"communicator.exchange": {
	"total": 0.055025899957399815,
	"count": 1,
	"is_parallel": true,
	"self": 0.055025899957399815
	},
	"steps_from_proto": {
	"total": 0.002621999941766262,
	"count": 2,
	"is_parallel": true,
	"self": 0.000580199935939163,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002041800005827099,
	"count": 8,
	"is_parallel": true,
	"self": 0.002041800005827099
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.034881899948231876,
	"count": 30,
	"is_parallel": true,
	"self": 0.007476300408598036,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.02740559953963384,
	"count": 120,
	"is_parallel": true,
	"self": 0.02740559953963384
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 5120.947709089436,
	"count": 206999,
	"is_parallel": true,
	"self": 169.77864146704087,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 129.137426803587,
	"count": 206999,
	"is_parallel": true,
	"self": 129.137426803587
	},
	"communicator.exchange": {
	"total": 4308.419570893282,
	"count": 206999,
	"is_parallel": true,
	"self": 4308.419570893282
	},
	"steps_from_proto": {
	"total": 513.6120699255262,
	"count": 413998,
	"is_parallel": true,
	"self": 112.80534110986628,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 400.8067288156599,
	"count": 1655992,
	"is_parallel": true,
	"self": 400.8067288156599
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 5532.901311693771,
	"count": 207000,
	"self": 41.952493078657426,
	"children": {
	"process_trajectory": {
	"total": 997.4942364149028,
	"count": 207000,
	"self": 996.1923424148699,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.3018940000329167,
	"count": 6,
	"self": 1.3018940000329167
	}
	}
	},
	"_update_policy": {
	"total": 4493.454582200211,
	"count": 145,
	"self": 565.9212106984342,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 3927.533371501777,
	"count": 4350,
	"self": 3927.533371501777
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.9999570213258266e-06,
	"count": 1,
	"self": 1.9999570213258266e-06
	},
	"TrainerController._save_models": {
	"total": 0.7615974000073038,
	"count": 1,
	"self": 0.0016035999869927764,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.759993800020311,
	"count": 1,
	"self": 0.759993800020311
	}
	}
	}
	}
	}
	}
	}