poca-SoccerTwos / run_logs / timers.json
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 2.2103099822998047,
"min": 2.201249837875366,
"max": 3.2957518100738525,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 44064.73828125,
"min": 9530.1552734375,
"max": 138095.359375,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 49.58163265306123,
"min": 40.56666666666667,
"max": 999.0,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19436.0,
"min": 6824.0,
"max": 27180.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1462.9620152467444,
"min": 1192.1950482485472,
"max": 1467.2865805169836,
"count": 415
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 286740.5549883619,
"min": 2384.3900964970944,
"max": 343788.7090882063,
"count": 415
},
"SoccerTwos.Step.mean": {
"value": 4999950.0,
"min": 9128.0,
"max": 4999950.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 4999950.0,
"min": 9128.0,
"max": 4999950.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.007671913132071495,
"min": -0.10139797627925873,
"max": 0.18653760850429535,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -1.511366844177246,
"min": -21.394973754882812,
"max": 24.597007751464844,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.005279144272208214,
"min": -0.10384976118803024,
"max": 0.18847353756427765,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -1.0399913787841797,
"min": -21.91230010986328,
"max": 24.49136734008789,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.09802131937239981,
"min": -0.6153846153846154,
"max": 0.5238666711030183,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -19.310199916362762,
"min": -46.71560001373291,
"max": 51.93000000715256,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.09802131937239981,
"min": -0.6153846153846154,
"max": 0.5238666711030183,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -19.310199916362762,
"min": -46.71560001373291,
"max": 51.93000000715256,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.018605794738202047,
"min": 0.010871664331837868,
"max": 0.022853191460793218,
"count": 236
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.018605794738202047,
"min": 0.010871664331837868,
"max": 0.022853191460793218,
"count": 236
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.10037734309832255,
"min": 3.683921837212741e-07,
"max": 0.10723397011558215,
"count": 236
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.10037734309832255,
"min": 3.683921837212741e-07,
"max": 0.10723397011558215,
"count": 236
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10276271899541219,
"min": 4.6114709941017886e-07,
"max": 0.10958955039580663,
"count": 236
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10276271899541219,
"min": 4.6114709941017886e-07,
"max": 0.10958955039580663,
"count": 236
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 236
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 236
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 236
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 236
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 236
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 236
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1733624626",
"python_version": "3.10.12 | packaged by Anaconda, Inc. | (main, Jul 5 2023, 19:01:18) [MSC v.1916 64 bit (AMD64)]",
"command_line_arguments": "\\\\?\\E:\\Anaconda\\envs\\drl7\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.5.1+cpu",
"numpy_version": "1.23.5",
"end_time_seconds": "1733689629"
},
"total": 65002.862883300055,
"count": 1,
"self": 0.4076301003806293,
"children": {
"run_training.setup": {
"total": 0.11048809997737408,
"count": 1,
"self": 0.11048809997737408
},
"TrainerController.start_learning": {
"total": 65002.3447650997,
"count": 1,
"self": 9.664195775054395,
"children": {
"TrainerController._reset_env": {
"total": 6.51482770126313,
"count": 25,
"self": 6.51482770126313
},
"TrainerController.advance": {
"total": 64986.00757572334,
"count": 331947,
"self": 9.779791821725667,
"children": {
"env_step": {
"total": 7535.487085077912,
"count": 331947,
"self": 5999.420773681719,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1530.1518038650975,
"count": 331947,
"self": 53.8769374191761,
"children": {
"TorchPolicy.evaluate": {
"total": 1476.2748664459214,
"count": 638022,
"self": 1476.2748664459214
}
}
},
"workers": {
"total": 5.914507531095296,
"count": 331947,
"self": 0.0,
"children": {
"worker_root": {
"total": 64985.299433196895,
"count": 331947,
"is_parallel": true,
"self": 60197.410073976964,
"children": {
"steps_from_proto": {
"total": 0.051801799796521664,
"count": 50,
"is_parallel": true,
"self": 0.010555502958595753,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.04124629683792591,
"count": 200,
"is_parallel": true,
"self": 0.04124629683792591
}
}
},
"UnityEnvironment.step": {
"total": 4787.8375574201345,
"count": 331947,
"is_parallel": true,
"self": 229.60771071817726,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 208.17352842446417,
"count": 331947,
"is_parallel": true,
"self": 208.17352842446417
},
"communicator.exchange": {
"total": 3581.358097888995,
"count": 331947,
"is_parallel": true,
"self": 3581.358097888995
},
"steps_from_proto": {
"total": 768.6982203884982,
"count": 663894,
"is_parallel": true,
"self": 152.91460758028552,
"children": {
"_process_rank_one_or_two_observation": {
"total": 615.7836128082126,
"count": 2655576,
"is_parallel": true,
"self": 615.7836128082126
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 57440.740698823705,
"count": 331947,
"self": 59.941079049836844,
"children": {
"process_trajectory": {
"total": 1198.5999041702598,
"count": 331947,
"self": 1196.859120070003,
"children": {
"RLTrainer._checkpoint": {
"total": 1.7407841002568603,
"count": 10,
"self": 1.7407841002568603
}
}
},
"_update_policy": {
"total": 56182.19971560361,
"count": 236,
"self": 801.2737847049721,
"children": {
"TorchPOCAOptimizer.update": {
"total": 55380.92593089864,
"count": 7092,
"self": 55380.92593089864
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.0012326836586e-07,
"count": 1,
"self": 9.0012326836586e-07
},
"TrainerController._save_models": {
"total": 0.15816499991342425,
"count": 1,
"self": 0.004409899935126305,
"children": {
"RLTrainer._checkpoint": {
"total": 0.15375509997829795,
"count": 1,
"self": 0.15375509997829795
}
}
}
}
}
}
}
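
The JSON above follows the ML-Agents timers.json layout: a "gauges" map of per-metric summaries (value/min/max/count), a "metadata" block describing the run, and a nested timer tree (total/count/self/children) recording where wall-clock time went. Below is a minimal sketch of how one might inspect it with Python; the file path is an assumption, and the helper name walk_timers is hypothetical, not part of ML-Agents.

import json

# Assumed location of this file relative to the working directory.
with open("run_logs/timers.json") as f:
    log = json.load(f)

# Summarize each gauge: final value plus observed range and sample count.
for name, gauge in log["gauges"].items():
    print(f"{name}: value={gauge['value']:.4g} "
          f"(min={gauge['min']:.4g}, max={gauge['max']:.4g}, count={gauge['count']})")

# Hypothetical helper: walk the nested timer tree and print total seconds per node.
def walk_timers(node, label="root", depth=0):
    print(f"{'  ' * depth}{label}: {node.get('total', 0.0):.1f}s")
    for child_label, child in node.get("children", {}).items():
        walk_timers(child, child_label, depth + 1)

walk_timers(log)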