|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.5008999705314636, |
|
"min": 0.4773056209087372, |
|
"max": 1.4854872226715088, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 15123.171875, |
|
"min": 14242.7998046875, |
|
"max": 45063.7421875, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989944.0, |
|
"min": 29952.0, |
|
"max": 989944.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989944.0, |
|
"min": 29952.0, |
|
"max": 989944.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.24567793309688568, |
|
"min": -0.10527270287275314, |
|
"max": 0.2654494345188141, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 61.91083908081055, |
|
"min": -25.26544952392578, |
|
"max": 68.75140380859375, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.06088830158114433, |
|
"min": -0.019152160733938217, |
|
"max": 0.2694939970970154, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 15.343852043151855, |
|
"min": -4.768887996673584, |
|
"max": 63.87007522583008, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.07094593892026892, |
|
"min": 0.0651082992406091, |
|
"max": 0.07574394675795973, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 1.0641890838040338, |
|
"min": 0.5302076273057181, |
|
"max": 1.0641890838040338, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.009234968995188669, |
|
"min": 0.0005701018202355009, |
|
"max": 0.014187979038036782, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.13852453492783004, |
|
"min": 0.007981425483297012, |
|
"max": 0.19863170653251494, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.5044174985600025e-06, |
|
"min": 7.5044174985600025e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00011256626247840004, |
|
"min": 0.00011256626247840004, |
|
"max": 0.0036301444899518994, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10250144000000001, |
|
"min": 0.10250144000000001, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.5375216000000003, |
|
"min": 1.3886848, |
|
"max": 2.6100480999999998, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00025989385600000013, |
|
"min": 0.00025989385600000013, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.003898407840000002, |
|
"min": 0.003898407840000002, |
|
"max": 0.12102380519, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.008191419765353203, |
|
"min": 0.007582017220556736, |
|
"max": 0.34768661856651306, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.12287130206823349, |
|
"min": 0.10614824295043945, |
|
"max": 2.4338064193725586, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 584.0217391304348, |
|
"min": 579.433962264151, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 26865.0, |
|
"min": 15984.0, |
|
"max": 33031.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.0245390949041948, |
|
"min": -1.0000000521540642, |
|
"max": 1.0245390949041948, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 47.12879836559296, |
|
"min": -28.674001529812813, |
|
"max": 51.282198294997215, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.0245390949041948, |
|
"min": -1.0000000521540642, |
|
"max": 1.0245390949041948, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 47.12879836559296, |
|
"min": -28.674001529812813, |
|
"max": 51.282198294997215, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.052135885666559814, |
|
"min": 0.04904970410167992, |
|
"max": 7.379755293019116, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.3982507406617515, |
|
"min": 2.3982507406617515, |
|
"max": 118.07608468830585, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1697016972", |
|
"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training V2 --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.0.1+cu118", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1697019303" |
|
}, |
|
"total": 2331.076256431, |
|
"count": 1, |
|
"self": 0.48035659000015585, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.04397408300019379, |
|
"count": 1, |
|
"self": 0.04397408300019379 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2330.5519257579995, |
|
"count": 1, |
|
"self": 1.6238535508900895, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 3.7216097270002138, |
|
"count": 1, |
|
"self": 3.7216097270002138 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2325.1291281851095, |
|
"count": 63316, |
|
"self": 1.566923036195476, |
|
"children": { |
|
"env_step": { |
|
"total": 1622.062057330972, |
|
"count": 63316, |
|
"self": 1485.839115200004, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 135.26355448800177, |
|
"count": 63316, |
|
"self": 4.993670367158757, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 130.26988412084302, |
|
"count": 62560, |
|
"self": 130.26988412084302 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.9593876429662487, |
|
"count": 63316, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2325.495550961981, |
|
"count": 63316, |
|
"is_parallel": true, |
|
"self": 964.9432444899144, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0020056560001648904, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006361600012496638, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0013694959989152267, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0013694959989152267 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.08765681999966546, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005577549991357955, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0004937700000482437, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004937700000482437 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.08471973800033084, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.08471973800033084 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.001885557000150584, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00039294400085054804, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0014926129993000359, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0014926129993000359 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1360.5523064720664, |
|
"count": 63315, |
|
"is_parallel": true, |
|
"self": 35.12377299516129, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 24.168969467937586, |
|
"count": 63315, |
|
"is_parallel": true, |
|
"self": 24.168969467937586 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1191.4457042949516, |
|
"count": 63315, |
|
"is_parallel": true, |
|
"self": 1191.4457042949516 |
|
}, |
|
"steps_from_proto": { |
|
"total": 109.81385971401596, |
|
"count": 63315, |
|
"is_parallel": true, |
|
"self": 22.217671704017903, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 87.59618800999806, |
|
"count": 506520, |
|
"is_parallel": true, |
|
"self": 87.59618800999806 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 701.500147817942, |
|
"count": 63316, |
|
"self": 3.005095362015709, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 123.75213156392829, |
|
"count": 63316, |
|
"self": 123.57756627792878, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.17456528599950616, |
|
"count": 2, |
|
"self": 0.17456528599950616 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 574.742920891998, |
|
"count": 453, |
|
"self": 370.57453853799143, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 204.16838235400655, |
|
"count": 22755, |
|
"self": 204.16838235400655 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.3179997040424496e-06, |
|
"count": 1, |
|
"self": 1.3179997040424496e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.0773329769999691, |
|
"count": 1, |
|
"self": 0.001754999000695534, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.07557797799927357, |
|
"count": 1, |
|
"self": 0.07557797799927357 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |