{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.5979747772216797,
"min": 1.511555552482605,
"max": 3.295804500579834,
"count": 2500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 31141.33203125,
"min": 3777.708740234375,
"max": 123682.1796875,
"count": 2500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 71.68115942028986,
"min": 42.14782608695652,
"max": 999.0,
"count": 2500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19784.0,
"min": 14492.0,
"max": 25680.0,
"count": 2500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1826.957066560597,
"min": 1197.322794256716,
"max": 1843.2668183370704,
"count": 2467
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 252120.0751853624,
"min": 2394.645588513432,
"max": 404495.6598818271,
"count": 2467
},
"SoccerTwos.Step.mean": {
"value": 24999998.0,
"min": 9856.0,
"max": 24999998.0,
"count": 2500
},
"SoccerTwos.Step.sum": {
"value": 24999998.0,
"min": 9856.0,
"max": 24999998.0,
"count": 2500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.011240914463996887,
"min": -0.14725421369075775,
"max": 0.33110320568084717,
"count": 2500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -1.5400053262710571,
"min": -23.897327423095703,
"max": 49.003273010253906,
"count": 2500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.011732472106814384,
"min": -0.14846444129943848,
"max": 0.33885422348976135,
"count": 2500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -1.6073486804962158,
"min": -23.647857666015625,
"max": 50.15042495727539,
"count": 2500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.12945985533025142,
"min": -0.49676666657129925,
"max": 0.7677444407233486,
"count": 2500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -17.736000180244446,
"min": -62.46600019931793,
"max": 99.18400037288666,
"count": 2500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.12945985533025142,
"min": -0.49676666657129925,
"max": 0.7677444407233486,
"count": 2500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -17.736000180244446,
"min": -62.46600019931793,
"max": 99.18400037288666,
"count": 2500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01654374592277842,
"min": 0.008984572056215256,
"max": 0.02581824016136428,
"count": 1210
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01654374592277842,
"min": 0.008984572056215256,
"max": 0.02581824016136428,
"count": 1210
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.08911005382736524,
"min": 3.785484807394823e-07,
"max": 0.14597028146187466,
"count": 1210
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.08911005382736524,
"min": 3.785484807394823e-07,
"max": 0.14597028146187466,
"count": 1210
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.09072775915265083,
"min": 3.7238030851464526e-07,
"max": 0.14897385289271672,
"count": 1210
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.09072775915265083,
"min": 3.7238030851464526e-07,
"max": 0.14897385289271672,
"count": 1210
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.00025000000000000006,
"min": 0.00025000000000000006,
"max": 0.00025000000000000006,
"count": 1210
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.00025000000000000006,
"min": 0.00025000000000000006,
"max": 0.00025000000000000006,
"count": 1210
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 1210
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 1210
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 1210
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 1210
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1714197161",
"python_version": "3.10.12 | packaged by Anaconda, Inc. | (main, Jul 5 2023, 19:01:18) [MSC v.1916 64 bit (AMD64)]",
"command_line_arguments": "\\\\?\\C:\\Users\\Rahil\\miniconda3\\envs\\huggingface_rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.3.0+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1714242608"
},
"total": 45445.911744100005,
"count": 1,
"self": 0.8529118000078597,
"children": {
"run_training.setup": {
"total": 0.09120809999876656,
"count": 1,
"self": 0.09120809999876656
},
"TrainerController.start_learning": {
"total": 45444.9676242,
"count": 1,
"self": 32.451057508427766,
"children": {
"TrainerController._reset_env": {
"total": 9.359218000085093,
"count": 125,
"self": 9.359218000085093
},
"TrainerController.advance": {
"total": 45402.9393858915,
"count": 1712458,
"self": 30.118018284418213,
"children": {
"env_step": {
"total": 32565.312563302898,
"count": 1712458,
"self": 19509.227607912057,
"children": {
"SubprocessEnvManager._take_step": {
"total": 13034.285687099866,
"count": 1712458,
"self": 201.94590439824242,
"children": {
"TorchPolicy.evaluate": {
"total": 12832.339782701623,
"count": 3143974,
"self": 12832.339782701623
}
}
},
"workers": {
"total": 21.799268290975306,
"count": 1712458,
"self": 0.0,
"children": {
"worker_root": {
"total": 45398.33970200704,
"count": 1712458,
"is_parallel": true,
"self": 29911.087757495094,
"children": {
"steps_from_proto": {
"total": 0.2044884001079481,
"count": 250,
"is_parallel": true,
"self": 0.03695939997851383,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.16752900012943428,
"count": 1000,
"is_parallel": true,
"self": 0.16752900012943428
}
}
},
"UnityEnvironment.step": {
"total": 15487.047456111839,
"count": 1712458,
"is_parallel": true,
"self": 792.354284125744,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 694.8910819937155,
"count": 1712458,
"is_parallel": true,
"self": 694.8910819937155
},
"communicator.exchange": {
"total": 11344.200517301026,
"count": 1712458,
"is_parallel": true,
"self": 11344.200517301026
},
"steps_from_proto": {
"total": 2655.601572691354,
"count": 3424916,
"is_parallel": true,
"self": 487.3085465980548,
"children": {
"_process_rank_one_or_two_observation": {
"total": 2168.293026093299,
"count": 13699664,
"is_parallel": true,
"self": 2168.293026093299
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 12807.508804304183,
"count": 1712458,
"self": 246.52064090550266,
"children": {
"process_trajectory": {
"total": 6219.173412498698,
"count": 1712458,
"self": 6209.509433798732,
"children": {
"RLTrainer._checkpoint": {
"total": 9.66397869996581,
"count": 50,
"self": 9.66397869996581
}
}
},
"_update_policy": {
"total": 6341.814750899983,
"count": 1210,
"self": 4088.667170400142,
"children": {
"TorchPOCAOptimizer.update": {
"total": 2253.147580499841,
"count": 36309,
"self": 2253.147580499841
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.999923011288047e-07,
"count": 1,
"self": 8.999923011288047e-07
},
"TrainerController._save_models": {
"total": 0.21796189999440685,
"count": 1,
"self": 0.04979129999992438,
"children": {
"RLTrainer._checkpoint": {
"total": 0.16817059999448247,
"count": 1,
"self": 0.16817059999448247
}
}
}
}
}
}
}