{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 2.2883284091949463,
"min": 2.2578766345977783,
"max": 2.370623826980591,
"count": 48
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 46645.28515625,
"min": 4697.43896484375,
"max": 49031.5625,
"count": 48
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 45.21495327102804,
"min": 33.9,
"max": 56.47126436781609,
"count": 48
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19352.0,
"min": 1356.0,
"max": 20012.0,
"count": 48
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1443.1159542453488,
"min": 1433.9323103201318,
"max": 1485.340514475233,
"count": 48
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 308826.8142085046,
"min": 29073.577677292353,
"max": 360355.0107725008,
"count": 48
},
"SoccerTwos.Step.mean": {
"value": 2999965.0,
"min": 2529953.0,
"max": 2999965.0,
"count": 48
},
"SoccerTwos.Step.sum": {
"value": 2999965.0,
"min": 2529953.0,
"max": 2999965.0,
"count": 48
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.07176772505044937,
"min": -0.14496664702892303,
"max": 0.09119022637605667,
"count": 48
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -15.358293533325195,
"min": -28.516891479492188,
"max": 20.791372299194336,
"count": 48
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.07692451030015945,
"min": -0.14932173490524292,
"max": 0.10056917369365692,
"count": 48
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -16.46184539794922,
"min": -29.037235260009766,
"max": 22.929771423339844,
"count": 48
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 48
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 48
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.11535233788401167,
"min": -0.4820842115502608,
"max": 0.1686799997375125,
"count": 48
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -24.685400307178497,
"min": -43.16159999370575,
"max": 35.422799944877625,
"count": 48
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.11535233788401167,
"min": -0.4820842115502608,
"max": 0.1686799997375125,
"count": 48
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -24.685400307178497,
"min": -43.16159999370575,
"max": 35.422799944877625,
"count": 48
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 48
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 48
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01425742187226812,
"min": 0.012498459182097577,
"max": 0.022783190056604022,
"count": 22
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01425742187226812,
"min": 0.012498459182097577,
"max": 0.022783190056604022,
"count": 22
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.10696341718236606,
"min": 0.09243139326572418,
"max": 0.11185142124692599,
"count": 22
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.10696341718236606,
"min": 0.09243139326572418,
"max": 0.11185142124692599,
"count": 22
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10868611683448155,
"min": 0.09506866857409477,
"max": 0.11500879476467768,
"count": 22
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10868611683448155,
"min": 0.09506866857409477,
"max": 0.11500879476467768,
"count": 22
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 22
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 22
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 22
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 22
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 22
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 22
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1734126925",
"python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./train-soccer/SoccerTwos.yaml --env=train-soccer/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwosNew --no-graphics --resume",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.5.1+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1734129880"
},
"total": 2955.233237586999,
"count": 1,
"self": 0.009656171998358332,
"children": {
"run_training.setup": {
"total": 0.09122801299963612,
"count": 1,
"self": 0.09122801299963612
},
"TrainerController.start_learning": {
"total": 2955.132353402001,
"count": 1,
"self": 1.471143686088908,
"children": {
"TrainerController._reset_env": {
"total": 3.6418618119969324,
"count": 4,
"self": 3.6418618119969324
},
"TrainerController.advance": {
"total": 2949.8338889549123,
"count": 33661,
"self": 1.4734311612919555,
"children": {
"env_step": {
"total": 1088.3189411101412,
"count": 33661,
"self": 885.4894377948949,
"children": {
"SubprocessEnvManager._take_step": {
"total": 202.01222601794143,
"count": 33661,
"self": 7.401013266095106,
"children": {
"TorchPolicy.evaluate": {
"total": 194.61121275184632,
"count": 59406,
"self": 194.61121275184632
}
}
},
"workers": {
"total": 0.8172772973048268,
"count": 33661,
"self": 0.0,
"children": {
"worker_root": {
"total": 2946.748456279194,
"count": 33661,
"is_parallel": true,
"self": 2214.231777096149,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.005093496998597402,
"count": 2,
"is_parallel": true,
"self": 0.0014661750028608367,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0036273219957365654,
"count": 8,
"is_parallel": true,
"self": 0.0036273219957365654
}
}
},
"UnityEnvironment.step": {
"total": 0.05034801800138666,
"count": 1,
"is_parallel": true,
"self": 0.0018442389991832897,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0011039829987566918,
"count": 1,
"is_parallel": true,
"self": 0.0011039829987566918
},
"communicator.exchange": {
"total": 0.04308805600157939,
"count": 1,
"is_parallel": true,
"self": 0.04308805600157939
},
"steps_from_proto": {
"total": 0.0043117400018672924,
"count": 2,
"is_parallel": true,
"self": 0.0007883020043664146,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.003523437997500878,
"count": 8,
"is_parallel": true,
"self": 0.003523437997500878
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.008853515999362571,
"count": 6,
"is_parallel": true,
"self": 0.0017533529935462866,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.007100163005816285,
"count": 24,
"is_parallel": true,
"self": 0.007100163005816285
}
}
},
"UnityEnvironment.step": {
"total": 732.5078256670458,
"count": 33660,
"is_parallel": true,
"self": 45.575933057818474,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 29.554295166686643,
"count": 33660,
"is_parallel": true,
"self": 29.554295166686643
},
"communicator.exchange": {
"total": 516.8730777226519,
"count": 33660,
"is_parallel": true,
"self": 516.8730777226519
},
"steps_from_proto": {
"total": 140.50451971988878,
"count": 67320,
"is_parallel": true,
"self": 25.433041058575327,
"children": {
"_process_rank_one_or_two_observation": {
"total": 115.07147866131345,
"count": 269280,
"is_parallel": true,
"self": 115.07147866131345
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1860.0415166834791,
"count": 33661,
"self": 9.422440332229598,
"children": {
"process_trajectory": {
"total": 300.6208975172449,
"count": 33661,
"self": 300.20648151024216,
"children": {
"RLTrainer._checkpoint": {
"total": 0.4144160070027283,
"count": 1,
"self": 0.4144160070027283
}
}
},
"_update_policy": {
"total": 1549.9981788340046,
"count": 23,
"self": 93.86972147709457,
"children": {
"TorchPOCAOptimizer.update": {
"total": 1456.12845735691,
"count": 661,
"self": 1456.12845735691
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.4210017980076373e-06,
"count": 1,
"self": 1.4210017980076373e-06
},
"TrainerController._save_models": {
"total": 0.18545752800127957,
"count": 1,
"self": 0.0033703480003168806,
"children": {
"RLTrainer._checkpoint": {
"total": 0.1820871800009627,
"count": 1,
"self": 0.1820871800009627
}
}
}
}
}
}
}