|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.2930396795272827, |
|
"min": 0.2910306751728058, |
|
"max": 0.3772023618221283, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 8809.9453125, |
|
"min": 8684.35546875, |
|
"max": 11434.484375, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 248.008547008547, |
|
"min": 235.304, |
|
"max": 285.65346534653463, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29017.0, |
|
"min": 28296.0, |
|
"max": 31390.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 1979990.0, |
|
"min": 1529895.0, |
|
"max": 1979990.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 1979990.0, |
|
"min": 1529895.0, |
|
"max": 1979990.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.7462483048439026, |
|
"min": 0.6567258238792419, |
|
"max": 0.8047998547554016, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 219.39700317382812, |
|
"min": 187.82357788085938, |
|
"max": 243.049560546875, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.00307209393940866, |
|
"min": -0.03147309273481369, |
|
"max": 0.010138324461877346, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 0.9031956195831299, |
|
"min": -9.158669471740723, |
|
"max": 2.970529079437256, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.7343880247611265, |
|
"min": 1.6473124828189611, |
|
"max": 1.7646959874629975, |
|
"count": 16 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 202.9233988970518, |
|
"min": 173.14899863302708, |
|
"max": 220.58699843287468, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.7343880247611265, |
|
"min": 1.6473124828189611, |
|
"max": 1.7646959874629975, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 202.9233988970518, |
|
"min": 173.14899863302708, |
|
"max": 220.58699843287468, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.019553067057908904, |
|
"min": 0.01902993065235205, |
|
"max": 0.024178172263678528, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.2877088457753416, |
|
"min": 2.2583879788508057, |
|
"max": 2.7079552935319953, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.07168206840263437, |
|
"min": 0.06593017768768947, |
|
"max": 0.07168206840263437, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 1.0035489576368812, |
|
"min": 0.9230224876276526, |
|
"max": 1.0545541316775295, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01512822743656221, |
|
"min": 0.012747654476932171, |
|
"max": 0.016180382961811988, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.21179518411187093, |
|
"min": 0.1784671626770504, |
|
"max": 0.23259178962325677, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 5.252037535067855e-06, |
|
"min": 5.252037535067855e-06, |
|
"max": 7.26182043653857e-05, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 7.352852549094997e-05, |
|
"min": 7.352852549094997e-05, |
|
"max": 0.0010166548611153998, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10175064642857147, |
|
"min": 0.10175064642857147, |
|
"max": 0.12420604285714287, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4245090500000006, |
|
"min": 1.4245090500000006, |
|
"max": 1.7511241999999998, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00018488957821428565, |
|
"min": 0.00018488957821428565, |
|
"max": 0.0024281836814285715, |
|
"count": 16 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.002588454094999999, |
|
"min": 0.002588454094999999, |
|
"max": 0.033994571540000004, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.007591236382722855, |
|
"min": 0.007591236382722855, |
|
"max": 0.008284117095172405, |
|
"count": 16 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.10627730935811996, |
|
"min": 0.10627730935811996, |
|
"max": 0.12192925065755844, |
|
"count": 16 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 16 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 16 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1717187613", |
|
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.3.0+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1717188961" |
|
}, |
|
"total": 1347.8709488369996, |
|
"count": 1, |
|
"self": 0.71397220200015, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.07585502799975075, |
|
"count": 1, |
|
"self": 0.07585502799975075 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 1347.0811216069997, |
|
"count": 1, |
|
"self": 0.7859482171006675, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 3.318750089999412, |
|
"count": 1, |
|
"self": 3.318750089999412 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 1342.8850223249, |
|
"count": 32833, |
|
"self": 0.8270375527827127, |
|
"children": { |
|
"env_step": { |
|
"total": 1011.166429489117, |
|
"count": 32833, |
|
"self": 939.4118349392274, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 71.27514389595308, |
|
"count": 32833, |
|
"self": 2.551690115922611, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 68.72345378003047, |
|
"count": 31306, |
|
"self": 68.72345378003047 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.4794506539365102, |
|
"count": 32833, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1344.0018025109757, |
|
"count": 32833, |
|
"is_parallel": true, |
|
"self": 473.5056941710782, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.002649463999659929, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006987379993006471, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001950726000359282, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001950726000359282 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04991982699993969, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006471659999078838, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0005179090003366582, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005179090003366582 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04695517700019991, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04695517700019991 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0017995749994952348, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00038207599936868064, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0014174990001265542, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0014174990001265542 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 870.4961083398975, |
|
"count": 32832, |
|
"is_parallel": true, |
|
"self": 17.881733952148352, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 12.423186172025453, |
|
"count": 32832, |
|
"is_parallel": true, |
|
"self": 12.423186172025453 |
|
}, |
|
"communicator.exchange": { |
|
"total": 786.9438411908104, |
|
"count": 32832, |
|
"is_parallel": true, |
|
"self": 786.9438411908104 |
|
}, |
|
"steps_from_proto": { |
|
"total": 53.247347024913324, |
|
"count": 32832, |
|
"is_parallel": true, |
|
"self": 11.437223629844084, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 41.81012339506924, |
|
"count": 262656, |
|
"is_parallel": true, |
|
"self": 41.81012339506924 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 330.89155528300034, |
|
"count": 32833, |
|
"self": 1.5352185120564172, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 70.02132520893792, |
|
"count": 32833, |
|
"self": 69.90206173393835, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.11926347499957046, |
|
"count": 1, |
|
"self": 0.11926347499957046 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 259.335011562006, |
|
"count": 237, |
|
"self": 153.22781376003695, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 106.10719780196905, |
|
"count": 11400, |
|
"self": 106.10719780196905 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.87999555945862e-07, |
|
"count": 1, |
|
"self": 9.87999555945862e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.09139998699993157, |
|
"count": 1, |
|
"self": 0.0019656249996842234, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.08943436200024735, |
|
"count": 1, |
|
"self": 0.08943436200024735 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |