ppo-pyramids / run_logs /timers.json
mihirdeo16's picture
Uploaded the Pyramids agent via unit4
6771b91
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.1605914682149887,
"min": 0.15174803137779236,
"max": 1.3826720714569092,
"count": 100
},
"Pyramids.Policy.Entropy.sum": {
"value": 4810.03564453125,
"min": 4520.87744140625,
"max": 41944.73828125,
"count": 100
},
"Pyramids.Step.mean": {
"value": 2999935.0,
"min": 29984.0,
"max": 2999935.0,
"count": 100
},
"Pyramids.Step.sum": {
"value": 2999935.0,
"min": 29984.0,
"max": 2999935.0,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.7312646508216858,
"min": -0.08786865323781967,
"max": 0.864769458770752,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 212.06674194335938,
"min": -21.088476181030273,
"max": 264.61944580078125,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.031307727098464966,
"min": -0.023307139053940773,
"max": 0.28635692596435547,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 9.079240798950195,
"min": -6.316234588623047,
"max": 68.15294647216797,
"count": 100
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.069431693604981,
"min": 0.06259889548310472,
"max": 0.07356465743699421,
"count": 100
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9720437104697339,
"min": 0.5769289815857017,
"max": 1.1034698615549132,
"count": 100
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.014536273691365275,
"min": 0.0007999930532062535,
"max": 0.015559507014115109,
"count": 100
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.20350783167911385,
"min": 0.010399909691681294,
"max": 0.2178330981976115,
"count": 100
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.4781780787357106e-06,
"min": 1.4781780787357106e-06,
"max": 0.00029828360057213336,
"count": 100
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.0694493102299947e-05,
"min": 2.0694493102299947e-05,
"max": 0.004072884842371767,
"count": 100
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10049269285714287,
"min": 0.10049269285714287,
"max": 0.19942786666666668,
"count": 100
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4068977,
"min": 1.4068977,
"max": 2.8576282333333336,
"count": 100
},
"Pyramids.Policy.Beta.mean": {
"value": 5.922001642857131e-05,
"min": 5.922001642857131e-05,
"max": 0.00994284388,
"count": 100
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0008290802299999984,
"min": 0.0008290802299999984,
"max": 0.13577706051,
"count": 100
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.004602502100169659,
"min": 0.004342348780483007,
"max": 0.40666961669921875,
"count": 100
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.06443502753973007,
"min": 0.06079288199543953,
"max": 3.25335693359375,
"count": 100
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 261.6694915254237,
"min": 212.27007299270073,
"max": 995.2258064516129,
"count": 100
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30877.0,
"min": 16399.0,
"max": 33010.0,
"count": 100
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.738213657696023,
"min": -0.9315290823578835,
"max": 1.7781703653158965,
"count": 100
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 203.37099795043468,
"min": -28.877401553094387,
"max": 241.09919920563698,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.738213657696023,
"min": -0.9315290823578835,
"max": 1.7781703653158965,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 203.37099795043468,
"min": -28.877401553094387,
"max": 241.09919920563698,
"count": 100
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.01263972351655392,
"min": 0.009993327900862341,
"max": 8.080028551466325,
"count": 100
},
"Pyramids.Policy.RndReward.sum": {
"value": 1.4788476514368085,
"min": 1.3467253648414044,
"max": 137.36048537492752,
"count": 100
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1686415716",
"python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1686423339"
},
"total": 7622.912448516,
"count": 1,
"self": 0.5384192190012982,
"children": {
"run_training.setup": {
"total": 0.03806848399926821,
"count": 1,
"self": 0.03806848399926821
},
"TrainerController.start_learning": {
"total": 7622.3359608129995,
"count": 1,
"self": 5.0599678118469456,
"children": {
"TrainerController._reset_env": {
"total": 4.000870640999892,
"count": 1,
"self": 4.000870640999892
},
"TrainerController.advance": {
"total": 7613.119245360153,
"count": 194176,
"self": 5.130799042612125,
"children": {
"env_step": {
"total": 5552.522010477777,
"count": 194176,
"self": 5160.800616726953,
"children": {
"SubprocessEnvManager._take_step": {
"total": 388.7483901792739,
"count": 194176,
"self": 16.048350887313973,
"children": {
"TorchPolicy.evaluate": {
"total": 372.7000392919599,
"count": 187549,
"self": 372.7000392919599
}
}
},
"workers": {
"total": 2.97300357155018,
"count": 194176,
"self": 0.0,
"children": {
"worker_root": {
"total": 7603.66474228549,
"count": 194176,
"is_parallel": true,
"self": 2835.15157436121,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0019769840000662953,
"count": 1,
"is_parallel": true,
"self": 0.0006528850017275545,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013240989983387408,
"count": 8,
"is_parallel": true,
"self": 0.0013240989983387408
}
}
},
"UnityEnvironment.step": {
"total": 0.05422819199975493,
"count": 1,
"is_parallel": true,
"self": 0.0005977529999654507,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0006190009999045287,
"count": 1,
"is_parallel": true,
"self": 0.0006190009999045287
},
"communicator.exchange": {
"total": 0.05116591499972856,
"count": 1,
"is_parallel": true,
"self": 0.05116591499972856
},
"steps_from_proto": {
"total": 0.0018455230001563905,
"count": 1,
"is_parallel": true,
"self": 0.00037350999900809256,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001472013001148298,
"count": 8,
"is_parallel": true,
"self": 0.001472013001148298
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 4768.51316792428,
"count": 194175,
"is_parallel": true,
"self": 100.4952850657155,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 74.97257792979872,
"count": 194175,
"is_parallel": true,
"self": 74.97257792979872
},
"communicator.exchange": {
"total": 4266.509113628733,
"count": 194175,
"is_parallel": true,
"self": 4266.509113628733
},
"steps_from_proto": {
"total": 326.53619130003335,
"count": 194175,
"is_parallel": true,
"self": 68.81499423792684,
"children": {
"_process_rank_one_or_two_observation": {
"total": 257.7211970621065,
"count": 1553400,
"is_parallel": true,
"self": 257.7211970621065
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2055.466435839764,
"count": 194176,
"self": 9.878107901705334,
"children": {
"process_trajectory": {
"total": 373.4966683280627,
"count": 194176,
"self": 372.5729026220615,
"children": {
"RLTrainer._checkpoint": {
"total": 0.923765706001177,
"count": 6,
"self": 0.923765706001177
}
}
},
"_update_policy": {
"total": 1672.091659609996,
"count": 1405,
"self": 1045.91738557982,
"children": {
"TorchPPOOptimizer.update": {
"total": 626.1742740301761,
"count": 68322,
"self": 626.1742740301761
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.0879994079004973e-06,
"count": 1,
"self": 1.0879994079004973e-06
},
"TrainerController._save_models": {
"total": 0.15587591199982853,
"count": 1,
"self": 0.002404238999588415,
"children": {
"RLTrainer._checkpoint": {
"total": 0.15347167300024012,
"count": 1,
"self": 0.15347167300024012
}
}
}
}
}
}
}