|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.4808414876461029, |
|
"min": 0.45646536350250244, |
|
"max": 1.4761430025100708, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 14525.259765625, |
|
"min": 13642.8369140625, |
|
"max": 44780.2734375, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989982.0, |
|
"min": 29952.0, |
|
"max": 989982.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989982.0, |
|
"min": 29952.0, |
|
"max": 989982.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.41117236018180847, |
|
"min": -0.1260172724723816, |
|
"max": 0.4495900273323059, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 108.54949951171875, |
|
"min": -30.370162963867188, |
|
"max": 121.83889770507812, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.025955229997634888, |
|
"min": 0.001035523833706975, |
|
"max": 0.307271271944046, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 6.8521809577941895, |
|
"min": 0.2692362070083618, |
|
"max": 73.74510192871094, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06972378771923318, |
|
"min": 0.06514819621779247, |
|
"max": 0.07369894572346905, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9761330280692645, |
|
"min": 0.48059853971798655, |
|
"max": 1.0672664935021505, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.010373268114048345, |
|
"min": 0.0001120277094408344, |
|
"max": 0.013814569378143335, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.14522575359667683, |
|
"min": 0.001456360222730847, |
|
"max": 0.20619688992398247, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.424154668171426e-06, |
|
"min": 7.424154668171426e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010393816535439997, |
|
"min": 0.00010393816535439997, |
|
"max": 0.0031400270533243997, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10247468571428572, |
|
"min": 0.10247468571428572, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4346456, |
|
"min": 1.3691136000000002, |
|
"max": 2.3466756000000006, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0002572211028571428, |
|
"min": 0.0002572211028571428, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0036010954399999994, |
|
"min": 0.0036010954399999994, |
|
"max": 0.10469289243999999, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.009374582208693027, |
|
"min": 0.009374582208693027, |
|
"max": 0.4946654140949249, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.13124415278434753, |
|
"min": 0.13124415278434753, |
|
"max": 3.462657928466797, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 449.4153846153846, |
|
"min": 388.9078947368421, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29212.0, |
|
"min": 15984.0, |
|
"max": 33324.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.4274553592388446, |
|
"min": -1.0000000521540642, |
|
"max": 1.5058026062814813, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 92.7845983505249, |
|
"min": -32.000001668930054, |
|
"max": 114.44099807739258, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.4274553592388446, |
|
"min": -1.0000000521540642, |
|
"max": 1.5058026062814813, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 92.7845983505249, |
|
"min": -32.000001668930054, |
|
"max": 114.44099807739258, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.04350496525741899, |
|
"min": 0.040064290778613405, |
|
"max": 11.339918397367, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.827822741732234, |
|
"min": 2.827822741732234, |
|
"max": 181.438694357872, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1690548181", |
|
"python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1690550179" |
|
}, |
|
"total": 1997.1754200600003, |
|
"count": 1, |
|
"self": 0.376533362000373, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.03642111199997089, |
|
"count": 1, |
|
"self": 0.03642111199997089 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 1996.762465586, |
|
"count": 1, |
|
"self": 1.8417457710179406, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 4.610064933000103, |
|
"count": 1, |
|
"self": 4.610064933000103 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 1990.206255852982, |
|
"count": 63469, |
|
"self": 1.7728782128874627, |
|
"children": { |
|
"env_step": { |
|
"total": 1337.9766422440039, |
|
"count": 63469, |
|
"self": 1207.4637519479638, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 129.4123704990352, |
|
"count": 63469, |
|
"self": 5.3272204789532225, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 124.08515002008198, |
|
"count": 62559, |
|
"self": 124.08515002008198 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 1.1005197970048357, |
|
"count": 63469, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1993.7353670329908, |
|
"count": 63469, |
|
"is_parallel": true, |
|
"self": 904.2853400540353, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0021563249997598177, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006389270001818659, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0015173979995779519, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0015173979995779519 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.052196651000031125, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006926920000296377, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0005477709996739577, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005477709996739577 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04886110600000393, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04886110600000393 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0020950820003236004, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00041708700018716627, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001677995000136434, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001677995000136434 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1089.4500269789555, |
|
"count": 63468, |
|
"is_parallel": true, |
|
"self": 28.919261706989346, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 19.919393866924565, |
|
"count": 63468, |
|
"is_parallel": true, |
|
"self": 19.919393866924565 |
|
}, |
|
"communicator.exchange": { |
|
"total": 958.6525405869716, |
|
"count": 63468, |
|
"is_parallel": true, |
|
"self": 958.6525405869716 |
|
}, |
|
"steps_from_proto": { |
|
"total": 81.95883081807006, |
|
"count": 63468, |
|
"is_parallel": true, |
|
"self": 17.70434792986498, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 64.25448288820508, |
|
"count": 507744, |
|
"is_parallel": true, |
|
"self": 64.25448288820508 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 650.4567353960906, |
|
"count": 63469, |
|
"self": 3.028257084075449, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 108.0495058720162, |
|
"count": 63469, |
|
"self": 107.81499983501635, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.2345060369998464, |
|
"count": 2, |
|
"self": 0.2345060369998464 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 539.378972439999, |
|
"count": 435, |
|
"self": 340.66695357000526, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 198.7120188699937, |
|
"count": 22875, |
|
"self": 198.7120188699937 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.920004231389612e-07, |
|
"count": 1, |
|
"self": 9.920004231389612e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.10439803699955519, |
|
"count": 1, |
|
"self": 0.0014601409993701964, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.10293789600018499, |
|
"count": 1, |
|
"self": 0.10293789600018499 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |