First Push

10a6649 over 1 year ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.0744967460632324,
	"min": 2.061256170272827,
	"max": 3.2956643104553223,
	"count": 472
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 43547.8359375,
	"min": 16979.185546875,
	"max": 161875.40625,
	"count": 472
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 65.53333333333333,
	"min": 44.477064220183486,
	"max": 999.0,
	"count": 472
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19660.0,
	"min": 16120.0,
	"max": 23756.0,
	"count": 472
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1528.1564812993056,
	"min": 1194.160898636277,
	"max": 1554.9791073077633,
	"count": 453
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 229223.47219489585,
	"min": 2388.321797272554,
	"max": 331253.87356936734,
	"count": 453
	},
	"SoccerTwos.Step.mean": {
	"value": 4719898.0,
	"min": 9942.0,
	"max": 4719898.0,
	"count": 472
	},
	"SoccerTwos.Step.sum": {
	"value": 4719898.0,
	"min": 9942.0,
	"max": 4719898.0,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.01887659728527069,
	"min": -0.10542313754558563,
	"max": 0.14932888746261597,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -2.8314895629882812,
	"min": -14.300395965576172,
	"max": 20.86272430419922,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.021288074553012848,
	"min": -0.10537904500961304,
	"max": 0.14755292236804962,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -3.193211078643799,
	"min": -13.963614463806152,
	"max": 20.708911895751953,
	"count": 472
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 472
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.13239599903424581,
	"min": -0.625,
	"max": 0.49411763952058907,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -19.85939985513687,
	"min": -41.071800231933594,
	"max": 51.71139979362488,
	"count": 472
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.13239599903424581,
	"min": -0.625,
	"max": 0.49411763952058907,
	"count": 472
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -19.85939985513687,
	"min": -41.071800231933594,
	"max": 51.71139979362488,
	"count": 472
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 472
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 472
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.016272481051661694,
	"min": 0.010424615769200804,
	"max": 0.023758423148440972,
	"count": 225
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.016272481051661694,
	"min": 0.010424615769200804,
	"max": 0.023758423148440972,
	"count": 225
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10069958294431368,
	"min": 3.700576038075572e-06,
	"max": 0.11594027852018675,
	"count": 225
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10069958294431368,
	"min": 3.700576038075572e-06,
	"max": 0.11594027852018675,
	"count": 225
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10207154403130213,
	"min": 3.6573177377855853e-06,
	"max": 0.11809751565257708,
	"count": 225
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10207154403130213,
	"min": 3.6573177377855853e-06,
	"max": 0.11809751565257708,
	"count": 225
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 225
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 225
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 225
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 225
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 225
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 225
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1687879263",
	"python_version": "3.9.16 (main, May 15 2023, 23:46:34) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/rcls/APPs/anaconda3/envs/rl/bin/mlagents-learn config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos2 --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1687895159"
	},
	"total": 15896.488707362005,
	"count": 1,
	"self": 0.5369108009908814,
	"children": {
	"run_training.setup": {
	"total": 0.00820854600169696,
	"count": 1,
	"self": 0.00820854600169696
	},
	"TrainerController.start_learning": {
	"total": 15895.943588015012,
	"count": 1,
	"self": 7.708126039680792,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.5737629419600125,
	"count": 24,
	"self": 1.5737629419600125
	},
	"TrainerController.advance": {
	"total": 15886.47150302236,
	"count": 317886,
	"self": 8.081340691103833,
	"children": {
	"env_step": {
	"total": 5974.421085315058,
	"count": 317886,
	"self": 4905.711345372896,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1063.8875759330112,
	"count": 317886,
	"self": 43.56820851439261,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1020.3193674186186,
	"count": 598670,
	"self": 1020.3193674186186
	}
	}
	},
	"workers": {
	"total": 4.822164009150583,
	"count": 317886,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 15881.829722142284,
	"count": 317886,
	"is_parallel": true,
	"self": 11838.092291657493,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0016371259989682585,
	"count": 2,
	"is_parallel": true,
	"self": 0.0003801429702434689,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012569830287247896,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012569830287247896
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.01787375900312327,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004416879964992404,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00041525199776515365,
	"count": 1,
	"is_parallel": true,
	"self": 0.00041525199776515365
	},
	"communicator.exchange": {
	"total": 0.01568464099545963,
	"count": 1,
	"is_parallel": true,
	"self": 0.01568464099545963
	},
	"steps_from_proto": {
	"total": 0.0013321780133992434,
	"count": 2,
	"is_parallel": true,
	"self": 0.0003262840327806771,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0010058939806185663,
	"count": 8,
	"is_parallel": true,
	"self": 0.0010058939806185663
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 4043.68896008085,
	"count": 317885,
	"is_parallel": true,
	"self": 240.81878162530484,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 168.6598716371518,
	"count": 317885,
	"is_parallel": true,
	"self": 168.6598716371518
	},
	"communicator.exchange": {
	"total": 2913.374164572335,
	"count": 317885,
	"is_parallel": true,
	"self": 2913.374164572335
	},
	"steps_from_proto": {
	"total": 720.8361422460584,
	"count": 635770,
	"is_parallel": true,
	"self": 140.4202986920136,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 580.4158435540448,
	"count": 2543080,
	"is_parallel": true,
	"self": 580.4158435540448
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.048470403940882534,
	"count": 46,
	"is_parallel": true,
	"self": 0.00948453787714243,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.038985866063740104,
	"count": 184,
	"is_parallel": true,
	"self": 0.038985866063740104
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 9903.969077016198,
	"count": 317885,
	"self": 53.17670554446522,
	"children": {
	"process_trajectory": {
	"total": 1060.648966794659,
	"count": 317885,
	"self": 1058.7333575366356,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.9156092580233235,
	"count": 9,
	"self": 1.9156092580233235
	}
	}
	},
	"_update_policy": {
	"total": 8790.143404677074,
	"count": 225,
	"self": 712.2272357027396,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 8077.916168974334,
	"count": 6750,
	"self": 8077.916168974334
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.7700076568871737e-06,
	"count": 1,
	"self": 1.7700076568871737e-06
	},
	"TrainerController._save_models": {
	"total": 0.19019424100406468,
	"count": 1,
	"self": 0.002219676011009142,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.18797456499305554,
	"count": 1,
	"self": 0.18797456499305554
	}
	}
	}
	}
	}
	}
	}