ppo-Pyramids / run_logs /timers.json
LOGQS's picture
First Push
7fee360
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.216837540268898,
"min": 0.216837540268898,
"max": 1.1439133882522583,
"count": 47
},
"Pyramids.Policy.Entropy.sum": {
"value": 6591.861328125,
"min": 1884.1458740234375,
"max": 34317.40234375,
"count": 47
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 47
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 47
},
"Pyramids.Step.mean": {
"value": 1499974.0,
"min": 149892.0,
"max": 1499974.0,
"count": 46
},
"Pyramids.Step.sum": {
"value": 1499974.0,
"min": 149892.0,
"max": 1499974.0,
"count": 46
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.5635429620742798,
"min": -0.1073768362402916,
"max": 0.623300313949585,
"count": 46
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 160.6097412109375,
"min": -25.98519515991211,
"max": 177.64059448242188,
"count": 46
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": -0.0032277165446430445,
"min": -0.05295085161924362,
"max": 0.07620299607515335,
"count": 46
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": -0.9198992252349854,
"min": -14.08492660522461,
"max": 18.060110092163086,
"count": 46
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06717732886456708,
"min": 0.06439270613191184,
"max": 0.0735065735864949,
"count": 46
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.940482604103939,
"min": 0.583830917285167,
"max": 1.067276163356534,
"count": 46
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.01711601288081424,
"min": 0.0011009482281105403,
"max": 0.018873407717587217,
"count": 46
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.23962418033139937,
"min": 0.015413275193547564,
"max": 0.28310111576380825,
"count": 46
},
"Pyramids.Policy.LearningRate.mean": {
"value": 2.8645276166190494e-06,
"min": 2.8645276166190494e-06,
"max": 0.000272566884144375,
"count": 46
},
"Pyramids.Policy.LearningRate.sum": {
"value": 4.010338663266669e-05,
"min": 4.010338663266669e-05,
"max": 0.003569852210049334,
"count": 46
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10095480952380953,
"min": 0.10095480952380953,
"max": 0.19085562500000003,
"count": 46
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4133673333333334,
"min": 1.4133673333333334,
"max": 2.5899506666666667,
"count": 46
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00010538547142857148,
"min": 0.00010538547142857148,
"max": 0.009086476937499999,
"count": 46
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0014753966000000008,
"min": 0.0014753966000000008,
"max": 0.1190160716,
"count": 46
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.007281546946614981,
"min": 0.006628350354731083,
"max": 0.061615318059921265,
"count": 46
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.10194166004657745,
"min": 0.0965542420744896,
"max": 0.6112106442451477,
"count": 46
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 322.6326530612245,
"min": 288.4271844660194,
"max": 987.3333333333334,
"count": 46
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 31618.0,
"min": 16326.0,
"max": 33523.0,
"count": 46
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.5957163070537606,
"min": -0.854693383226792,
"max": 1.6708420864061306,
"count": 46
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 156.38019809126854,
"min": -27.840401589870453,
"max": 170.28999785333872,
"count": 46
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.5957163070537606,
"min": -0.854693383226792,
"max": 1.6708420864061306,
"count": 46
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 156.38019809126854,
"min": -27.840401589870453,
"max": 170.28999785333872,
"count": 46
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.023973165170158312,
"min": 0.022124219301162828,
"max": 0.6562520817798727,
"count": 46
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.3493701866755146,
"min": 1.954352687112987,
"max": 18.973405182361603,
"count": 46
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1687291235",
"python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1687294292"
},
"total": 3056.8792389049995,
"count": 1,
"self": 0.7496070949996465,
"children": {
"run_training.setup": {
"total": 0.03848574799985727,
"count": 1,
"self": 0.03848574799985727
},
"TrainerController.start_learning": {
"total": 3056.091146062,
"count": 1,
"self": 1.6334947169725638,
"children": {
"TrainerController._reset_env": {
"total": 3.9540592440000637,
"count": 1,
"self": 3.9540592440000637
},
"TrainerController.advance": {
"total": 3050.414175517027,
"count": 88556,
"self": 1.6999190719966464,
"children": {
"env_step": {
"total": 2206.4400515949983,
"count": 88556,
"self": 2065.3934808430704,
"children": {
"SubprocessEnvManager._take_step": {
"total": 140.0602751009783,
"count": 88556,
"self": 6.13563863390732,
"children": {
"TorchPolicy.evaluate": {
"total": 133.92463646707097,
"count": 86323,
"self": 133.92463646707097
}
}
},
"workers": {
"total": 0.9862956509496144,
"count": 88556,
"self": 0.0,
"children": {
"worker_root": {
"total": 3049.710723735973,
"count": 88556,
"is_parallel": true,
"self": 1130.1138591509684,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0027872109999407257,
"count": 1,
"is_parallel": true,
"self": 0.0008003440002539719,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001986866999686754,
"count": 8,
"is_parallel": true,
"self": 0.001986866999686754
}
}
},
"UnityEnvironment.step": {
"total": 0.04545206300008431,
"count": 1,
"is_parallel": true,
"self": 0.0005375059997732023,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.000490628000079596,
"count": 1,
"is_parallel": true,
"self": 0.000490628000079596
},
"communicator.exchange": {
"total": 0.04279957100015963,
"count": 1,
"is_parallel": true,
"self": 0.04279957100015963
},
"steps_from_proto": {
"total": 0.0016243580000718794,
"count": 1,
"is_parallel": true,
"self": 0.000359045000095648,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012653129999762314,
"count": 8,
"is_parallel": true,
"self": 0.0012653129999762314
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1919.5968645850044,
"count": 88555,
"is_parallel": true,
"self": 43.92660406803998,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 29.931304289943682,
"count": 88555,
"is_parallel": true,
"self": 29.931304289943682
},
"communicator.exchange": {
"total": 1712.2299676670234,
"count": 88555,
"is_parallel": true,
"self": 1712.2299676670234
},
"steps_from_proto": {
"total": 133.5089885599973,
"count": 88555,
"is_parallel": true,
"self": 25.7646578750755,
"children": {
"_process_rank_one_or_two_observation": {
"total": 107.7443306849218,
"count": 708440,
"is_parallel": true,
"self": 107.7443306849218
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 842.2742048500322,
"count": 88556,
"self": 3.339937450038633,
"children": {
"process_trajectory": {
"total": 143.5362954599873,
"count": 88556,
"self": 143.24071930098762,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2955761589996655,
"count": 3,
"self": 0.2955761589996655
}
}
},
"_update_policy": {
"total": 695.3979719400063,
"count": 640,
"self": 443.9013471990788,
"children": {
"TorchPPOOptimizer.update": {
"total": 251.49662474092747,
"count": 31458,
"self": 251.49662474092747
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.145000169344712e-06,
"count": 1,
"self": 1.145000169344712e-06
},
"TrainerController._save_models": {
"total": 0.08941543899982207,
"count": 1,
"self": 0.0016526210001757136,
"children": {
"RLTrainer._checkpoint": {
"total": 0.08776281799964636,
"count": 1,
"self": 0.08776281799964636
}
}
}
}
}
}
}