|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.5544239282608032, |
|
"min": 0.5544239282608032, |
|
"max": 1.4804720878601074, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 16668.201171875, |
|
"min": 16668.201171875, |
|
"max": 44911.6015625, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989922.0, |
|
"min": 29952.0, |
|
"max": 989922.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989922.0, |
|
"min": 29952.0, |
|
"max": 989922.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.30720406770706177, |
|
"min": -0.09272222220897675, |
|
"max": 0.30720406770706177, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 79.25865173339844, |
|
"min": -22.438777923583984, |
|
"max": 80.10205078125, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.05198511853814125, |
|
"min": -0.05136161297559738, |
|
"max": 0.4627130329608917, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 13.412160873413086, |
|
"min": -13.456742286682129, |
|
"max": 109.6629867553711, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06746010744645185, |
|
"min": 0.06525129824395344, |
|
"max": 0.07371842501673935, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.944441504250326, |
|
"min": 0.5016560816024056, |
|
"max": 1.0327607453412686, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01590906463500914, |
|
"min": 0.000316650339836971, |
|
"max": 0.01590906463500914, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.22272690489012797, |
|
"min": 0.0037998040780436518, |
|
"max": 0.22272690489012797, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.367004687221428e-06, |
|
"min": 7.367004687221428e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010313806562109999, |
|
"min": 0.00010313806562109999, |
|
"max": 0.0035072417309194993, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10245563571428572, |
|
"min": 0.10245563571428572, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4343789, |
|
"min": 1.3691136000000002, |
|
"max": 2.5690804999999997, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0002553180078571428, |
|
"min": 0.0002553180078571428, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0035744521099999992, |
|
"min": 0.0035744521099999992, |
|
"max": 0.11693114195, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.009702242910861969, |
|
"min": 0.009391454048454762, |
|
"max": 0.3962453305721283, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.13583140075206757, |
|
"min": 0.13583140075206757, |
|
"max": 2.7737174034118652, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 511.1111111111111, |
|
"min": 503.0952380952381, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 27600.0, |
|
"min": 15984.0, |
|
"max": 32571.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.2594188312595744, |
|
"min": -1.0000000521540642, |
|
"max": 1.2594188312595744, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 66.74919805675745, |
|
"min": -32.000001668930054, |
|
"max": 74.29959836602211, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.2594188312595744, |
|
"min": -1.0000000521540642, |
|
"max": 1.2594188312595744, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 66.74919805675745, |
|
"min": -32.000001668930054, |
|
"max": 74.29959836602211, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.05318665779960388, |
|
"min": 0.0490993660845099, |
|
"max": 8.279884029179811, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.8188928633790056, |
|
"min": 2.8188928633790056, |
|
"max": 132.47814446687698, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1705549238", |
|
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.1.2+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1705551602" |
|
}, |
|
"total": 2364.5201285870003, |
|
"count": 1, |
|
"self": 0.5452934969998751, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.05425849399989602, |
|
"count": 1, |
|
"self": 0.05425849399989602 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2363.9205765960005, |
|
"count": 1, |
|
"self": 1.5448789630609099, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.883804895999674, |
|
"count": 1, |
|
"self": 2.883804895999674 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2359.40603280894, |
|
"count": 63364, |
|
"self": 1.6081694138529201, |
|
"children": { |
|
"env_step": { |
|
"total": 1698.5048213051073, |
|
"count": 63364, |
|
"self": 1554.6324893689957, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 142.90826377501526, |
|
"count": 63364, |
|
"self": 5.288055364071624, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 137.62020841094363, |
|
"count": 62570, |
|
"self": 137.62020841094363 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.9640681610962929, |
|
"count": 63364, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2358.1940710380572, |
|
"count": 63364, |
|
"is_parallel": true, |
|
"self": 939.2176638751071, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.002277224999943428, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006452990010075155, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0016319259989359125, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0016319259989359125 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.0990013870000439, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005712810002478363, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0005035859999225067, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005035859999225067 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.09610575799979415, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.09610575799979415 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0018207620000794122, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00040474099978382583, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0014160210002955864, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0014160210002955864 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1418.9764071629502, |
|
"count": 63363, |
|
"is_parallel": true, |
|
"self": 37.43008776197075, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 27.161011549959312, |
|
"count": 63363, |
|
"is_parallel": true, |
|
"self": 27.161011549959312 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1243.9815886220458, |
|
"count": 63363, |
|
"is_parallel": true, |
|
"self": 1243.9815886220458 |
|
}, |
|
"steps_from_proto": { |
|
"total": 110.4037192289743, |
|
"count": 63363, |
|
"is_parallel": true, |
|
"self": 23.076767019810177, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 87.32695220916412, |
|
"count": 506904, |
|
"is_parallel": true, |
|
"self": 87.32695220916412 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 659.2930420899797, |
|
"count": 63364, |
|
"self": 2.931171458021254, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 136.39527950697266, |
|
"count": 63364, |
|
"self": 136.15370416897258, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.24157533800007513, |
|
"count": 2, |
|
"self": 0.24157533800007513 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 519.9665911249858, |
|
"count": 444, |
|
"self": 310.525372385001, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 209.44121873998483, |
|
"count": 22869, |
|
"self": 209.44121873998483 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.530003808322363e-07, |
|
"count": 1, |
|
"self": 9.530003808322363e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.08585897499960993, |
|
"count": 1, |
|
"self": 0.0014467370001511881, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.08441223799945874, |
|
"count": 1, |
|
"self": 0.08441223799945874 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |