First Push

7c3af56 verified 7 months ago

15.6 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.23771071434021,
	"min": 3.23771071434021,
	"max": 3.295820713043213,
	"count": 26
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 28491.853515625,
	"min": 8391.232421875,
	"max": 52733.12890625,
	"count": 26
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 714.0,
	"min": 191.66666666666666,
	"max": 999.0,
	"count": 26
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 8568.0,
	"min": 2204.0,
	"max": 22100.0,
	"count": 26
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1001.8291290461129,
	"min": 1000.1956409054587,
	"max": 1005.3472247237237,
	"count": 23
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 4007.3165161844518,
	"min": 2000.3912818109175,
	"max": 10038.79575043783,
	"count": 23
	},
	"SoccerTwos.Step.mean": {
	"value": 129996.0,
	"min": 4656.0,
	"max": 129996.0,
	"count": 26
	},
	"SoccerTwos.Step.sum": {
	"value": 129996.0,
	"min": 4656.0,
	"max": 129996.0,
	"count": 26
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.04069586843252182,
	"min": -0.103403240442276,
	"max": -0.03872303664684296,
	"count": 26
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.48835042119026184,
	"min": -1.34423828125,
	"max": -0.4259534180164337,
	"count": 26
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.04016890004277229,
	"min": -0.10340321063995361,
	"max": -0.03828540816903114,
	"count": 26
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.4820268154144287,
	"min": -1.3442367315292358,
	"max": -0.4211394786834717,
	"count": 26
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 26
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 26
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.10442667206128438,
	"min": -0.800000011920929,
	"max": 0.6459733744462332,
	"count": 26
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -0.6265600323677063,
	"min": -3.686400055885315,
	"max": 3.8758402466773987,
	"count": 26
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.1305333375930786,
	"min": -1.0,
	"max": 0.8074666857719421,
	"count": 26
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -0.7832000255584717,
	"min": -4.608000040054321,
	"max": 4.844800114631653,
	"count": 26
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 26
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 26
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.014766910806065426,
	"min": 0.013285189863139143,
	"max": 0.02072374345593606,
	"count": 6
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.014766910806065426,
	"min": 0.013285189863139143,
	"max": 0.02072374345593606,
	"count": 6
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.0021963658082919816,
	"min": 0.0018074257849630985,
	"max": 0.005299923840599755,
	"count": 6
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.0021963658082919816,
	"min": 0.0018074257849630985,
	"max": 0.005299923840599755,
	"count": 6
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.0022314870613627134,
	"min": 0.0018156477934539769,
	"max": 0.00535708706981192,
	"count": 6
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.0022314870613627134,
	"min": 0.0018156477934539769,
	"max": 0.00535708706981192,
	"count": 6
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.00029610012129996,
	"min": 0.00029610012129996,
	"max": 0.0002993284802238399,
	"count": 6
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.00029610012129996,
	"min": 0.00029610012129996,
	"max": 0.0002993284802238399,
	"count": 6
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.19870004000000005,
	"min": 0.19870004000000005,
	"max": 0.19977615999999998,
	"count": 6
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.19870004000000005,
	"min": 0.19870004000000005,
	"max": 0.19977615999999998,
	"count": 6
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.004935131995999999,
	"min": 0.004935131995999999,
	"max": 0.004988830384,
	"count": 6
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.004935131995999999,
	"min": 0.004935131995999999,
	"max": 0.004988830384,
	"count": 6
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1717155959",
	"python_version": "3.10.12 \| packaged by Anaconda, Inc. \| (main, Jul 5 2023, 19:01:18) [MSC v.1916 64 bit (AMD64)]",
	"command_line_arguments": "\\\\?\\D:\\Programs\\Anaconda3\\envs\\rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.3.0+cpu",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1717156185"
	},
	"total": 225.87608079996426,
	"count": 1,
	"self": 0.07468920003157109,
	"children": {
	"run_training.setup": {
	"total": 0.05783429997973144,
	"count": 1,
	"self": 0.05783429997973144
	},
	"TrainerController.start_learning": {
	"total": 225.74355729995295,
	"count": 1,
	"self": 0.16198030044324696,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.075251600006595,
	"count": 2,
	"self": 4.075251600006595
	},
	"TrainerController.advance": {
	"total": 221.3517819995177,
	"count": 8620,
	"self": 0.16290820704307407,
	"children": {
	"env_step": {
	"total": 121.70785399532178,
	"count": 8620,
	"self": 93.73711119842483,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 27.8769966987893,
	"count": 8620,
	"self": 0.9701793987769634,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 26.906817300012335,
	"count": 17146,
	"self": 26.906817300012335
	}
	}
	},
	"workers": {
	"total": 0.09374609810765833,
	"count": 8620,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 216.00840789743233,
	"count": 8620,
	"is_parallel": true,
	"self": 142.3634933962021,
	"children": {
	"steps_from_proto": {
	"total": 0.0038374000578187406,
	"count": 4,
	"is_parallel": true,
	"self": 0.0009646000689826906,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.00287279998883605,
	"count": 16,
	"is_parallel": true,
	"self": 0.00287279998883605
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 73.64107710117241,
	"count": 8620,
	"is_parallel": true,
	"self": 3.624384798342362,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 3.1010047000600025,
	"count": 8620,
	"is_parallel": true,
	"self": 3.1010047000600025
	},
	"communicator.exchange": {
	"total": 55.706702996685635,
	"count": 8620,
	"is_parallel": true,
	"self": 55.706702996685635
	},
	"steps_from_proto": {
	"total": 11.208984606084414,
	"count": 17240,
	"is_parallel": true,
	"self": 2.290967408567667,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 8.918017197516747,
	"count": 68960,
	"is_parallel": true,
	"self": 8.918017197516747
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 99.48101979715284,
	"count": 8620,
	"self": 1.4096503957989626,
	"children": {
	"process_trajectory": {
	"total": 20.840155201149173,
	"count": 8620,
	"self": 20.840155201149173
	},
	"_update_policy": {
	"total": 77.2312142002047,
	"count": 6,
	"self": 18.673083499947097,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 58.55813070025761,
	"count": 183,
	"self": 58.55813070025761
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.999494068324566e-07,
	"count": 1,
	"self": 9.999494068324566e-07
	},
	"TrainerController._save_models": {
	"total": 0.15454240003600717,
	"count": 1,
	"self": 0.002673500042874366,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.1518688999931328,
	"count": 1,
	"self": 0.1518688999931328
	}
	}
	}
	}
	}
	}
	}