ppo-Pyramids / run_logs /timers.json
KayabaEngine's picture
MLA
d593e30
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.11944945156574249,
"min": 0.11358385533094406,
"max": 1.3361033201217651,
"count": 100
},
"Pyramids.Policy.Entropy.sum": {
"value": 3602.595458984375,
"min": 3383.383544921875,
"max": 40532.03125,
"count": 100
},
"Pyramids.Step.mean": {
"value": 2999965.0,
"min": 29975.0,
"max": 2999965.0,
"count": 100
},
"Pyramids.Step.sum": {
"value": 2999965.0,
"min": 29975.0,
"max": 2999965.0,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.776624858379364,
"min": -0.10249456018209457,
"max": 0.8700633645057678,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 229.10433959960938,
"min": -24.393705368041992,
"max": 271.45977783203125,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.02705737203359604,
"min": -0.0199726652354002,
"max": 0.3841193914413452,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 7.981925010681152,
"min": -5.292756080627441,
"max": 92.95689392089844,
"count": 100
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.07030777303544573,
"min": 0.0628793473998039,
"max": 0.07355644507118583,
"count": 100
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 1.054616595531686,
"min": 0.5148951154983008,
"max": 1.0573544614211035,
"count": 100
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.01445784309986991,
"min": 0.001990515664903367,
"max": 0.017782053084119877,
"count": 100
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.21686764649804866,
"min": 0.02587670364374377,
"max": 0.2489487431776783,
"count": 100
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.4910995029999977e-06,
"min": 1.4910995029999977e-06,
"max": 0.00029838354339596195,
"count": 100
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.2366492544999967e-05,
"min": 2.2366492544999967e-05,
"max": 0.0040724449425184,
"count": 100
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10049700000000003,
"min": 0.10049700000000003,
"max": 0.19946118095238097,
"count": 100
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.5074550000000004,
"min": 1.3962282666666668,
"max": 2.8574816,
"count": 100
},
"Pyramids.Policy.Beta.mean": {
"value": 5.965029999999993e-05,
"min": 5.965029999999993e-05,
"max": 0.009946171977142856,
"count": 100
},
"Pyramids.Policy.Beta.sum": {
"value": 0.000894754499999999,
"min": 0.000894754499999999,
"max": 0.13576241184,
"count": 100
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.009918417781591415,
"min": 0.009446214884519577,
"max": 0.5738606452941895,
"count": 100
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.14877626299858093,
"min": 0.1353917419910431,
"max": 4.017024517059326,
"count": 100
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 215.36879432624113,
"min": 203.83448275862068,
"max": 986.7058823529412,
"count": 100
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30367.0,
"min": 16774.0,
"max": 32859.0,
"count": 100
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.742072325120581,
"min": -0.8700000485953163,
"max": 1.796165507209712,
"count": 100
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 245.63219784200191,
"min": -26.347601659595966,
"max": 260.44399854540825,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.742072325120581,
"min": -0.8700000485953163,
"max": 1.796165507209712,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 245.63219784200191,
"min": -26.347601659595966,
"max": 260.44399854540825,
"count": 100
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.022262255893762187,
"min": 0.021579025778016236,
"max": 10.155288637560957,
"count": 100
},
"Pyramids.Policy.RndReward.sum": {
"value": 3.1389780810204684,
"min": 2.9726999542617705,
"max": 172.63990683853626,
"count": 100
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1697697924",
"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.0.1+cu118",
"numpy_version": "1.23.5",
"end_time_seconds": "1697705450"
},
"total": 7526.182461605001,
"count": 1,
"self": 0.6326489260009112,
"children": {
"run_training.setup": {
"total": 0.048939825999923414,
"count": 1,
"self": 0.048939825999923414
},
"TrainerController.start_learning": {
"total": 7525.500872853,
"count": 1,
"self": 4.4395564680608,
"children": {
"TrainerController._reset_env": {
"total": 7.28454001700004,
"count": 1,
"self": 7.28454001700004
},
"TrainerController.advance": {
"total": 7513.646333574939,
"count": 195421,
"self": 4.384497697824372,
"children": {
"env_step": {
"total": 5583.476512425045,
"count": 195421,
"self": 5200.603654189745,
"children": {
"SubprocessEnvManager._take_step": {
"total": 380.30148921301134,
"count": 195421,
"self": 14.169571088080033,
"children": {
"TorchPolicy.evaluate": {
"total": 366.1319181249313,
"count": 187554,
"self": 366.1319181249313
}
}
},
"workers": {
"total": 2.5713690222887635,
"count": 195421,
"self": 0.0,
"children": {
"worker_root": {
"total": 7511.006855763873,
"count": 195421,
"is_parallel": true,
"self": 2676.7122494620207,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.004688579999992726,
"count": 1,
"is_parallel": true,
"self": 0.003345408000086536,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013431719999061897,
"count": 8,
"is_parallel": true,
"self": 0.0013431719999061897
}
}
},
"UnityEnvironment.step": {
"total": 0.07684060300005058,
"count": 1,
"is_parallel": true,
"self": 0.000678286000152184,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005436259999669346,
"count": 1,
"is_parallel": true,
"self": 0.0005436259999669346
},
"communicator.exchange": {
"total": 0.0735342949999449,
"count": 1,
"is_parallel": true,
"self": 0.0735342949999449
},
"steps_from_proto": {
"total": 0.0020843959999865547,
"count": 1,
"is_parallel": true,
"self": 0.00041991500006588467,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.00166448099992067,
"count": 8,
"is_parallel": true,
"self": 0.00166448099992067
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 4834.294606301853,
"count": 195420,
"is_parallel": true,
"self": 108.61068526875897,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 74.2005608505965,
"count": 195420,
"is_parallel": true,
"self": 74.2005608505965
},
"communicator.exchange": {
"total": 4343.343110791254,
"count": 195420,
"is_parallel": true,
"self": 4343.343110791254
},
"steps_from_proto": {
"total": 308.1402493912434,
"count": 195420,
"is_parallel": true,
"self": 62.05968054683774,
"children": {
"_process_rank_one_or_two_observation": {
"total": 246.08056884440566,
"count": 1563360,
"is_parallel": true,
"self": 246.08056884440566
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1925.7853234520694,
"count": 195421,
"self": 8.635148375960853,
"children": {
"process_trajectory": {
"total": 375.37493168711126,
"count": 195421,
"self": 374.69939377211176,
"children": {
"RLTrainer._checkpoint": {
"total": 0.6755379149994951,
"count": 6,
"self": 0.6755379149994951
}
}
},
"_update_policy": {
"total": 1541.7752433889973,
"count": 1408,
"self": 928.4843724531396,
"children": {
"TorchPPOOptimizer.update": {
"total": 613.2908709358577,
"count": 68340,
"self": 613.2908709358577
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.6520007193321362e-06,
"count": 1,
"self": 1.6520007193321362e-06
},
"TrainerController._save_models": {
"total": 0.1304411410001194,
"count": 1,
"self": 0.0020765829995070817,
"children": {
"RLTrainer._checkpoint": {
"total": 0.1283645580006123,
"count": 1,
"self": 0.1283645580006123
}
}
}
}
}
}
}