First Push

aef946e over 1 year ago

20.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.5824898481369019,
	"min": 1.5824898481369019,
	"max": 1.9090577363967896,
	"count": 64
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 158299.625,
	"min": 158299.625,
	"max": 194502.90625,
	"count": 64
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 51.225469728601254,
	"min": 47.746588693957115,
	"max": 71.39710144927537,
	"count": 64
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 98148.0,
	"min": 96632.0,
	"max": 98816.0,
	"count": 64
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1508.1363786078211,
	"min": 1473.5221745025995,
	"max": 1529.2443052678618,
	"count": 64
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 1444794.6507062926,
	"min": 1028764.0045122284,
	"max": 1537430.1608911173,
	"count": 64
	},
	"SoccerTwos.Step.mean": {
	"value": 8899874.0,
	"min": 5749974.0,
	"max": 8899874.0,
	"count": 64
	},
	"SoccerTwos.Step.sum": {
	"value": 8899874.0,
	"min": 5749974.0,
	"max": 8899874.0,
	"count": 64
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.0002751847496256232,
	"min": -0.0704675242304802,
	"max": 0.05401033163070679,
	"count": 64
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.26335179805755615,
	"min": -66.81063842773438,
	"max": 42.560142517089844,
	"count": 64
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.004515423439443111,
	"min": -0.07144340127706528,
	"max": 0.051143623888492584,
	"count": 64
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -4.321260452270508,
	"min": -64.05392456054688,
	"max": 40.30117416381836,
	"count": 64
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 64
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 64
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.02917032437389298,
	"min": -0.10855413350570466,
	"max": 0.09264945305671943,
	"count": 64
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -27.916000425815582,
	"min": -93.2480006814003,
	"max": 84.68160009384155,
	"count": 64
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.02917032437389298,
	"min": -0.10855413350570466,
	"max": 0.09264945305671943,
	"count": 64
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -27.916000425815582,
	"min": -93.2480006814003,
	"max": 84.68160009384155,
	"count": 64
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.018681833112835496,
	"min": 0.014127501142401242,
	"max": 0.020697781255391116,
	"count": 64
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.05604549933850649,
	"min": 0.028315532435226484,
	"max": 0.057246277056401604,
	"count": 64
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.12366595591108004,
	"min": 0.08892387400070825,
	"max": 0.12366595591108004,
	"count": 64
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.3709978677332401,
	"min": 0.1778477480014165,
	"max": 0.3709978677332401,
	"count": 64
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.12668096588717567,
	"min": 0.09020149645706017,
	"max": 0.12668096588717567,
	"count": 64
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.380042897661527,
	"min": 0.18040299291412035,
	"max": 0.380042897661527,
	"count": 64
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 64
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0009,
	"min": 0.0006,
	"max": 0.0009,
	"count": 64
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 64
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.6000000000000002,
	"min": 0.40000000000000013,
	"max": 0.6000000000000002,
	"count": 64
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 64
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.015000000000000003,
	"min": 0.010000000000000002,
	"max": 0.015000000000000003,
	"count": 64
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 64
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 64
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1689545754",
	"python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
	"command_line_arguments": "/home/timjwhite/.local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --resume --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1689554406"
	},
	"total": 8652.359177459,
	"count": 1,
	"self": 0.24237303400150267,
	"children": {
	"run_training.setup": {
	"total": 0.04718287900004725,
	"count": 1,
	"self": 0.04718287900004725
	},
	"TrainerController.start_learning": {
	"total": 8652.069621546,
	"count": 1,
	"self": 4.708958225339302,
	"children": {
	"TrainerController._reset_env": {
	"total": 9.899197846001243,
	"count": 18,
	"self": 9.899197846001243
	},
	"TrainerController.advance": {
	"total": 8637.195361422659,
	"count": 222816,
	"self": 4.77625178893868,
	"children": {
	"env_step": {
	"total": 6819.7162154938205,
	"count": 222816,
	"self": 5537.285447605323,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1279.8399814283537,
	"count": 222816,
	"self": 30.754265482031542,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1249.0857159463221,
	"count": 401938,
	"self": 1249.0857159463221
	}
	}
	},
	"workers": {
	"total": 2.5907864601442725,
	"count": 222815,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 8637.943608716465,
	"count": 222815,
	"is_parallel": true,
	"self": 3749.0665332869085,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.011673448999999891,
	"count": 2,
	"is_parallel": true,
	"self": 0.0070754110001871595,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.004598037999812732,
	"count": 8,
	"is_parallel": true,
	"self": 0.004598037999812732
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.03501203599989822,
	"count": 1,
	"is_parallel": true,
	"self": 0.0014596029998301674,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.001354877000039778,
	"count": 1,
	"is_parallel": true,
	"self": 0.001354877000039778
	},
	"communicator.exchange": {
	"total": 0.027357521000112683,
	"count": 1,
	"is_parallel": true,
	"self": 0.027357521000112683
	},
	"steps_from_proto": {
	"total": 0.004840034999915588,
	"count": 2,
	"is_parallel": true,
	"self": 0.0011863969998557877,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0036536380000598,
	"count": 8,
	"is_parallel": true,
	"self": 0.0036536380000598
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.07651414700058012,
	"count": 34,
	"is_parallel": true,
	"self": 0.01597959500372781,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.060534551996852315,
	"count": 136,
	"is_parallel": true,
	"self": 0.060534551996852315
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 4888.800561282556,
	"count": 222814,
	"is_parallel": true,
	"self": 291.07946570729473,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 203.93879390035477,
	"count": 222814,
	"is_parallel": true,
	"self": 203.93879390035477
	},
	"communicator.exchange": {
	"total": 3481.787563310218,
	"count": 222814,
	"is_parallel": true,
	"self": 3481.787563310218
	},
	"steps_from_proto": {
	"total": 911.9947383646886,
	"count": 445628,
	"is_parallel": true,
	"self": 190.49647091938618,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 721.4982674453024,
	"count": 1782512,
	"is_parallel": true,
	"self": 721.4982674453024
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1812.7028941398985,
	"count": 222815,
	"self": 28.87042225176083,
	"children": {
	"process_trajectory": {
	"total": 779.9697009141312,
	"count": 222815,
	"self": 778.292166592131,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.677534322000156,
	"count": 6,
	"self": 1.677534322000156
	}
	}
	},
	"_update_policy": {
	"total": 1003.8627709740065,
	"count": 155,
	"self": 636.5023784550285,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 367.36039251897796,
	"count": 4650,
	"self": 367.36039251897796
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.1709998943842947e-06,
	"count": 1,
	"self": 1.1709998943842947e-06
	},
	"TrainerController._save_models": {
	"total": 0.26610288099982427,
	"count": 1,
	"self": 0.001952478000021074,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2641504029998032,
	"count": 1,
	"self": 0.2641504029998032
	}
	}
	}
	}
	}
	}
	}