Second Push

8a152f0 about 1 year ago

20 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.1824750900268555,
	"min": 3.1547484397888184,
	"max": 3.2956900596618652,
	"count": 100
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 88701.9453125,
	"min": 23412.0703125,
	"max": 114764.3203125,
	"count": 100
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 860.5,
	"min": 489.9,
	"max": 999.0,
	"count": 100
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 20652.0,
	"min": 14644.0,
	"max": 27616.0,
	"count": 100
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1200.78991806887,
	"min": 1197.0440605645447,
	"max": 1207.1172065682176,
	"count": 90
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 4803.15967227548,
	"min": 2394.0881211290894,
	"max": 16784.708841766012,
	"count": 90
	},
	"SoccerTwos.Step.mean": {
	"value": 999684.0,
	"min": 9824.0,
	"max": 999684.0,
	"count": 100
	},
	"SoccerTwos.Step.sum": {
	"value": 999684.0,
	"min": 9824.0,
	"max": 999684.0,
	"count": 100
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.00797598622739315,
	"min": -0.036553021520376205,
	"max": 0.05947311595082283,
	"count": 100
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.0957118347287178,
	"min": -0.438421368598938,
	"max": 0.8325973749160767,
	"count": 100
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.006179752293974161,
	"min": -0.022581540048122406,
	"max": 0.05948488041758537,
	"count": 100
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.07415702939033508,
	"min": -0.27457916736602783,
	"max": 0.8327765464782715,
	"count": 100
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 100
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 100
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.16666666666666666,
	"min": -0.5860000000550196,
	"max": 0.38087058768552895,
	"count": 100
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -2.0,
	"min": -8.0,
	"max": 6.474799990653992,
	"count": 100
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.16666666666666666,
	"min": -0.5860000000550196,
	"max": 0.38087058768552895,
	"count": 100
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -2.0,
	"min": -8.0,
	"max": 6.474799990653992,
	"count": 100
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.012221555140179892,
	"min": 0.006795583742981156,
	"max": 0.016645218633736174,
	"count": 46
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.012221555140179892,
	"min": 0.006795583742981156,
	"max": 0.016645218633736174,
	"count": 46
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.003237667710830768,
	"min": 8.194062053613985e-05,
	"max": 0.01861500459102293,
	"count": 46
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.003237667710830768,
	"min": 8.194062053613985e-05,
	"max": 0.01861500459102293,
	"count": 46
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.00324154964958628,
	"min": 7.848465102142655e-05,
	"max": 0.009435744381820162,
	"count": 46
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.00324154964958628,
	"min": 7.848465102142655e-05,
	"max": 0.009435744381820162,
	"count": 46
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0006,
	"min": 0.0006,
	"max": 0.0006,
	"count": 46
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0006,
	"min": 0.0006,
	"max": 0.0006,
	"count": 46
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 46
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 46
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005,
	"min": 0.005,
	"max": 0.005,
	"count": 46
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005,
	"min": 0.005,
	"max": 0.005,
	"count": 46
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1697686348",
	"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.0.1+cu118",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1697688565"
	},
	"total": 2217.164994551,
	"count": 1,
	"self": 0.4259129499996561,
	"children": {
	"run_training.setup": {
	"total": 0.07464664500002982,
	"count": 1,
	"self": 0.07464664500002982
	},
	"TrainerController.start_learning": {
	"total": 2216.664434956,
	"count": 1,
	"self": 1.6753877999994984,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.416130657000224,
	"count": 5,
	"self": 4.416130657000224
	},
	"TrainerController.advance": {
	"total": 2210.3573846880004,
	"count": 65069,
	"self": 1.8022751490188966,
	"children": {
	"env_step": {
	"total": 1823.0047769609614,
	"count": 65069,
	"self": 1406.1171325439245,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 415.8875872410355,
	"count": 65069,
	"self": 11.887741108043144,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 403.99984613299233,
	"count": 129182,
	"self": 403.99984613299233
	}
	}
	},
	"workers": {
	"total": 1.0000571760013486,
	"count": 65069,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2212.1702933349934,
	"count": 65069,
	"is_parallel": true,
	"self": 1033.889048864969,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0044236590000537035,
	"count": 2,
	"is_parallel": true,
	"self": 0.0009960950001186575,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.003427563999935046,
	"count": 8,
	"is_parallel": true,
	"self": 0.003427563999935046
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.0418704440000397,
	"count": 1,
	"is_parallel": true,
	"self": 0.0012168680000286258,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0008716350000099737,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008716350000099737
	},
	"communicator.exchange": {
	"total": 0.035724202000039895,
	"count": 1,
	"is_parallel": true,
	"self": 0.035724202000039895
	},
	"steps_from_proto": {
	"total": 0.004057738999961202,
	"count": 2,
	"is_parallel": true,
	"self": 0.0006634809998899982,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.003394258000071204,
	"count": 8,
	"is_parallel": true,
	"self": 0.003394258000071204
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1178.2684012030245,
	"count": 65068,
	"is_parallel": true,
	"self": 75.30102161908849,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 49.89441047398384,
	"count": 65068,
	"is_parallel": true,
	"self": 49.89441047398384
	},
	"communicator.exchange": {
	"total": 818.6866904860156,
	"count": 65068,
	"is_parallel": true,
	"self": 818.6866904860156
	},
	"steps_from_proto": {
	"total": 234.38627862393668,
	"count": 130136,
	"is_parallel": true,
	"self": 37.99782386399312,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 196.38845475994356,
	"count": 520544,
	"is_parallel": true,
	"self": 196.38845475994356
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.012843266999880143,
	"count": 8,
	"is_parallel": true,
	"self": 0.002305757999351954,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.010537509000528189,
	"count": 32,
	"is_parallel": true,
	"self": 0.010537509000528189
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 385.55033257802,
	"count": 65069,
	"self": 14.281712731008213,
	"children": {
	"process_trajectory": {
	"total": 109.3654763670126,
	"count": 65069,
	"self": 108.84511364601275,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.5203627209998558,
	"count": 2,
	"self": 0.5203627209998558
	}
	}
	},
	"_update_policy": {
	"total": 261.9031434799992,
	"count": 46,
	"self": 161.58336632699843,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 100.31977715300076,
	"count": 690,
	"self": 100.31977715300076
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0740000107034575e-06,
	"count": 1,
	"self": 1.0740000107034575e-06
	},
	"TrainerController._save_models": {
	"total": 0.2155307369998809,
	"count": 1,
	"self": 0.001797785000235308,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2137329519996456,
	"count": 1,
	"self": 0.2137329519996456
	}
	}
	}
	}
	}
	}
	}