First Push

57ab324 about 1 year ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.3297736644744873,
	"min": 2.3108389377593994,
	"max": 3.2958154678344727,
	"count": 500
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 46893.68359375,
	"min": 19817.169921875,
	"max": 160233.140625,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 56.91954022988506,
	"min": 43.35087719298246,
	"max": 999.0,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19808.0,
	"min": 14648.0,
	"max": 25348.0,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1534.3269811293542,
	"min": 1183.5485215813121,
	"max": 1551.405389093557,
	"count": 480
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 266972.89471650764,
	"min": 2367.0970431626242,
	"max": 341892.72860558936,
	"count": 480
	},
	"SoccerTwos.Step.mean": {
	"value": 4999939.0,
	"min": 9690.0,
	"max": 4999939.0,
	"count": 500
	},
	"SoccerTwos.Step.sum": {
	"value": 4999939.0,
	"min": 9690.0,
	"max": 4999939.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.00910065695643425,
	"min": -0.09789004176855087,
	"max": 0.23074674606323242,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 1.5835143327713013,
	"min": -14.487726211547852,
	"max": 35.30425262451172,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.008705869317054749,
	"min": -0.09969667345285416,
	"max": 0.23732972145080566,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 1.5148212909698486,
	"min": -14.755107879638672,
	"max": 36.31144714355469,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.03772988538632448,
	"min": -0.5714285714285714,
	"max": 0.3872978086889225,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 6.565000057220459,
	"min": -49.93519985675812,
	"max": 60.75959986448288,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.03772988538632448,
	"min": -0.5714285714285714,
	"max": 0.3872978086889225,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 6.565000057220459,
	"min": -49.93519985675812,
	"max": 60.75959986448288,
	"count": 500
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.016802129296896357,
	"min": 0.01020057471760083,
	"max": 0.022905385214835407,
	"count": 237
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.016802129296896357,
	"min": 0.01020057471760083,
	"max": 0.022905385214835407,
	"count": 237
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10920455977320671,
	"min": 1.278151113600264e-06,
	"max": 0.11705219199260077,
	"count": 237
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10920455977320671,
	"min": 1.278151113600264e-06,
	"max": 0.11705219199260077,
	"count": 237
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.11106214225292206,
	"min": 1.2946513142727176e-06,
	"max": 0.11790347720185916,
	"count": 237
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.11106214225292206,
	"min": 1.2946513142727176e-06,
	"max": 0.11790347720185916,
	"count": 237
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 4.999999999999999e-05,
	"min": 4.999999999999999e-05,
	"max": 5e-05,
	"count": 237
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 4.999999999999999e-05,
	"min": 4.999999999999999e-05,
	"max": 5e-05,
	"count": 237
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.2,
	"max": 0.20000000000000007,
	"count": 237
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.2,
	"max": 0.20000000000000007,
	"count": 237
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 237
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 237
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1703425867",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/linux/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.1.2+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1703431621"
	},
	"total": 5753.9713630119995,
	"count": 1,
	"self": 10.003901086998667,
	"children": {
	"run_training.setup": {
	"total": 0.03320010800052842,
	"count": 1,
	"self": 0.03320010800052842
	},
	"TrainerController.start_learning": {
	"total": 5743.934261817,
	"count": 1,
	"self": 4.598700764327077,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.461793570003465,
	"count": 25,
	"self": 2.461793570003465
	},
	"TrainerController.advance": {
	"total": 5736.68472627367,
	"count": 336279,
	"self": 4.452538133902635,
	"children": {
	"env_step": {
	"total": 3768.169735152508,
	"count": 336279,
	"self": 2540.511554829661,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1225.00736433792,
	"count": 336279,
	"self": 27.384061780176125,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1197.623302557744,
	"count": 636948,
	"self": 1197.623302557744
	}
	}
	},
	"workers": {
	"total": 2.650815984927249,
	"count": 336279,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 5738.468630533378,
	"count": 336279,
	"is_parallel": true,
	"self": 3703.546075526435,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0022654249996776343,
	"count": 2,
	"is_parallel": true,
	"self": 0.0011427790004745475,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0011226459992030868,
	"count": 8,
	"is_parallel": true,
	"self": 0.0011226459992030868
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.017416921999938495,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006658129987044958,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0006755950007573119,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006755950007573119
	},
	"communicator.exchange": {
	"total": 0.014058880999982648,
	"count": 1,
	"is_parallel": true,
	"self": 0.014058880999982648
	},
	"steps_from_proto": {
	"total": 0.002016633000494039,
	"count": 2,
	"is_parallel": true,
	"self": 0.00039346100038528675,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016231720001087524,
	"count": 8,
	"is_parallel": true,
	"self": 0.0016231720001087524
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2034.8957418499367,
	"count": 336278,
	"is_parallel": true,
	"self": 115.62528190730063,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 83.27074140703007,
	"count": 336278,
	"is_parallel": true,
	"self": 83.27074140703007
	},
	"communicator.exchange": {
	"total": 1483.7842008194802,
	"count": 336278,
	"is_parallel": true,
	"self": 1483.7842008194802
	},
	"steps_from_proto": {
	"total": 352.21551771612576,
	"count": 672556,
	"is_parallel": true,
	"self": 73.3906903016632,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 278.82482741446256,
	"count": 2690224,
	"is_parallel": true,
	"self": 278.82482741446256
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.026813157006472466,
	"count": 48,
	"is_parallel": true,
	"self": 0.005673642001966073,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.021139515004506393,
	"count": 192,
	"is_parallel": true,
	"self": 0.021139515004506393
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1964.0624529872593,
	"count": 336279,
	"self": 34.067328851527236,
	"children": {
	"process_trajectory": {
	"total": 543.9419646267424,
	"count": 336279,
	"self": 541.9494062307422,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.9925583960002768,
	"count": 10,
	"self": 1.9925583960002768
	}
	}
	},
	"_update_policy": {
	"total": 1386.0531595089897,
	"count": 237,
	"self": 423.7020367749792,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 962.3511227340105,
	"count": 7116,
	"self": 962.3511227340105
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 5.279998731566593e-07,
	"count": 1,
	"self": 5.279998731566593e-07
	},
	"TrainerController._save_models": {
	"total": 0.18904068099982396,
	"count": 1,
	"self": 0.0012437099994713208,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.18779697100035264,
	"count": 1,
	"self": 0.18779697100035264
	}
	}
	}
	}
	}
	}
	}