First Push

7fee360 over 1 year ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.216837540268898,
	"min": 0.216837540268898,
	"max": 1.1439133882522583,
	"count": 47
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 6591.861328125,
	"min": 1884.1458740234375,
	"max": 34317.40234375,
	"count": 47
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 47
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 47
	},
	"Pyramids.Step.mean": {
	"value": 1499974.0,
	"min": 149892.0,
	"max": 1499974.0,
	"count": 46
	},
	"Pyramids.Step.sum": {
	"value": 1499974.0,
	"min": 149892.0,
	"max": 1499974.0,
	"count": 46
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.5635429620742798,
	"min": -0.1073768362402916,
	"max": 0.623300313949585,
	"count": 46
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 160.6097412109375,
	"min": -25.98519515991211,
	"max": 177.64059448242188,
	"count": 46
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.0032277165446430445,
	"min": -0.05295085161924362,
	"max": 0.07620299607515335,
	"count": 46
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -0.9198992252349854,
	"min": -14.08492660522461,
	"max": 18.060110092163086,
	"count": 46
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06717732886456708,
	"min": 0.06439270613191184,
	"max": 0.0735065735864949,
	"count": 46
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.940482604103939,
	"min": 0.583830917285167,
	"max": 1.067276163356534,
	"count": 46
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01711601288081424,
	"min": 0.0011009482281105403,
	"max": 0.018873407717587217,
	"count": 46
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.23962418033139937,
	"min": 0.015413275193547564,
	"max": 0.28310111576380825,
	"count": 46
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 2.8645276166190494e-06,
	"min": 2.8645276166190494e-06,
	"max": 0.000272566884144375,
	"count": 46
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 4.010338663266669e-05,
	"min": 4.010338663266669e-05,
	"max": 0.003569852210049334,
	"count": 46
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10095480952380953,
	"min": 0.10095480952380953,
	"max": 0.19085562500000003,
	"count": 46
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4133673333333334,
	"min": 1.4133673333333334,
	"max": 2.5899506666666667,
	"count": 46
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00010538547142857148,
	"min": 0.00010538547142857148,
	"max": 0.009086476937499999,
	"count": 46
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0014753966000000008,
	"min": 0.0014753966000000008,
	"max": 0.1190160716,
	"count": 46
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.007281546946614981,
	"min": 0.006628350354731083,
	"max": 0.061615318059921265,
	"count": 46
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.10194166004657745,
	"min": 0.0965542420744896,
	"max": 0.6112106442451477,
	"count": 46
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 322.6326530612245,
	"min": 288.4271844660194,
	"max": 987.3333333333334,
	"count": 46
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 31618.0,
	"min": 16326.0,
	"max": 33523.0,
	"count": 46
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.5957163070537606,
	"min": -0.854693383226792,
	"max": 1.6708420864061306,
	"count": 46
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 156.38019809126854,
	"min": -27.840401589870453,
	"max": 170.28999785333872,
	"count": 46
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.5957163070537606,
	"min": -0.854693383226792,
	"max": 1.6708420864061306,
	"count": 46
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 156.38019809126854,
	"min": -27.840401589870453,
	"max": 170.28999785333872,
	"count": 46
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.023973165170158312,
	"min": 0.022124219301162828,
	"max": 0.6562520817798727,
	"count": 46
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.3493701866755146,
	"min": 1.954352687112987,
	"max": 18.973405182361603,
	"count": 46
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1687291235",
	"python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1687294292"
	},
	"total": 3056.8792389049995,
	"count": 1,
	"self": 0.7496070949996465,
	"children": {
	"run_training.setup": {
	"total": 0.03848574799985727,
	"count": 1,
	"self": 0.03848574799985727
	},
	"TrainerController.start_learning": {
	"total": 3056.091146062,
	"count": 1,
	"self": 1.6334947169725638,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.9540592440000637,
	"count": 1,
	"self": 3.9540592440000637
	},
	"TrainerController.advance": {
	"total": 3050.414175517027,
	"count": 88556,
	"self": 1.6999190719966464,
	"children": {
	"env_step": {
	"total": 2206.4400515949983,
	"count": 88556,
	"self": 2065.3934808430704,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 140.0602751009783,
	"count": 88556,
	"self": 6.13563863390732,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 133.92463646707097,
	"count": 86323,
	"self": 133.92463646707097
	}
	}
	},
	"workers": {
	"total": 0.9862956509496144,
	"count": 88556,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3049.710723735973,
	"count": 88556,
	"is_parallel": true,
	"self": 1130.1138591509684,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0027872109999407257,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008003440002539719,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001986866999686754,
	"count": 8,
	"is_parallel": true,
	"self": 0.001986866999686754
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04545206300008431,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005375059997732023,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.000490628000079596,
	"count": 1,
	"is_parallel": true,
	"self": 0.000490628000079596
	},
	"communicator.exchange": {
	"total": 0.04279957100015963,
	"count": 1,
	"is_parallel": true,
	"self": 0.04279957100015963
	},
	"steps_from_proto": {
	"total": 0.0016243580000718794,
	"count": 1,
	"is_parallel": true,
	"self": 0.000359045000095648,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012653129999762314,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012653129999762314
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1919.5968645850044,
	"count": 88555,
	"is_parallel": true,
	"self": 43.92660406803998,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 29.931304289943682,
	"count": 88555,
	"is_parallel": true,
	"self": 29.931304289943682
	},
	"communicator.exchange": {
	"total": 1712.2299676670234,
	"count": 88555,
	"is_parallel": true,
	"self": 1712.2299676670234
	},
	"steps_from_proto": {
	"total": 133.5089885599973,
	"count": 88555,
	"is_parallel": true,
	"self": 25.7646578750755,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 107.7443306849218,
	"count": 708440,
	"is_parallel": true,
	"self": 107.7443306849218
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 842.2742048500322,
	"count": 88556,
	"self": 3.339937450038633,
	"children": {
	"process_trajectory": {
	"total": 143.5362954599873,
	"count": 88556,
	"self": 143.24071930098762,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2955761589996655,
	"count": 3,
	"self": 0.2955761589996655
	}
	}
	},
	"_update_policy": {
	"total": 695.3979719400063,
	"count": 640,
	"self": 443.9013471990788,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 251.49662474092747,
	"count": 31458,
	"self": 251.49662474092747
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.145000169344712e-06,
	"count": 1,
	"self": 1.145000169344712e-06
	},
	"TrainerController._save_models": {
	"total": 0.08941543899982207,
	"count": 1,
	"self": 0.0016526210001757136,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08776281799964636,
	"count": 1,
	"self": 0.08776281799964636
	}
	}
	}
	}
	}
	}
	}