First model

9478b92 over 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.4808414876461029,
	"min": 0.45646536350250244,
	"max": 1.4761430025100708,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 14525.259765625,
	"min": 13642.8369140625,
	"max": 44780.2734375,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989982.0,
	"min": 29952.0,
	"max": 989982.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989982.0,
	"min": 29952.0,
	"max": 989982.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.41117236018180847,
	"min": -0.1260172724723816,
	"max": 0.4495900273323059,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 108.54949951171875,
	"min": -30.370162963867188,
	"max": 121.83889770507812,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.025955229997634888,
	"min": 0.001035523833706975,
	"max": 0.307271271944046,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 6.8521809577941895,
	"min": 0.2692362070083618,
	"max": 73.74510192871094,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06972378771923318,
	"min": 0.06514819621779247,
	"max": 0.07369894572346905,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9761330280692645,
	"min": 0.48059853971798655,
	"max": 1.0672664935021505,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.010373268114048345,
	"min": 0.0001120277094408344,
	"max": 0.013814569378143335,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.14522575359667683,
	"min": 0.001456360222730847,
	"max": 0.20619688992398247,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.424154668171426e-06,
	"min": 7.424154668171426e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010393816535439997,
	"min": 0.00010393816535439997,
	"max": 0.0031400270533243997,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10247468571428572,
	"min": 0.10247468571428572,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4346456,
	"min": 1.3691136000000002,
	"max": 2.3466756000000006,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002572211028571428,
	"min": 0.0002572211028571428,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0036010954399999994,
	"min": 0.0036010954399999994,
	"max": 0.10469289243999999,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.009374582208693027,
	"min": 0.009374582208693027,
	"max": 0.4946654140949249,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.13124415278434753,
	"min": 0.13124415278434753,
	"max": 3.462657928466797,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 449.4153846153846,
	"min": 388.9078947368421,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29212.0,
	"min": 15984.0,
	"max": 33324.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.4274553592388446,
	"min": -1.0000000521540642,
	"max": 1.5058026062814813,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 92.7845983505249,
	"min": -32.000001668930054,
	"max": 114.44099807739258,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.4274553592388446,
	"min": -1.0000000521540642,
	"max": 1.5058026062814813,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 92.7845983505249,
	"min": -32.000001668930054,
	"max": 114.44099807739258,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.04350496525741899,
	"min": 0.040064290778613405,
	"max": 11.339918397367,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.827822741732234,
	"min": 2.827822741732234,
	"max": 181.438694357872,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1690548181",
	"python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1690550179"
	},
	"total": 1997.1754200600003,
	"count": 1,
	"self": 0.376533362000373,
	"children": {
	"run_training.setup": {
	"total": 0.03642111199997089,
	"count": 1,
	"self": 0.03642111199997089
	},
	"TrainerController.start_learning": {
	"total": 1996.762465586,
	"count": 1,
	"self": 1.8417457710179406,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.610064933000103,
	"count": 1,
	"self": 4.610064933000103
	},
	"TrainerController.advance": {
	"total": 1990.206255852982,
	"count": 63469,
	"self": 1.7728782128874627,
	"children": {
	"env_step": {
	"total": 1337.9766422440039,
	"count": 63469,
	"self": 1207.4637519479638,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 129.4123704990352,
	"count": 63469,
	"self": 5.3272204789532225,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 124.08515002008198,
	"count": 62559,
	"self": 124.08515002008198
	}
	}
	},
	"workers": {
	"total": 1.1005197970048357,
	"count": 63469,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 1993.7353670329908,
	"count": 63469,
	"is_parallel": true,
	"self": 904.2853400540353,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0021563249997598177,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006389270001818659,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0015173979995779519,
	"count": 8,
	"is_parallel": true,
	"self": 0.0015173979995779519
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.052196651000031125,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006926920000296377,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005477709996739577,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005477709996739577
	},
	"communicator.exchange": {
	"total": 0.04886110600000393,
	"count": 1,
	"is_parallel": true,
	"self": 0.04886110600000393
	},
	"steps_from_proto": {
	"total": 0.0020950820003236004,
	"count": 1,
	"is_parallel": true,
	"self": 0.00041708700018716627,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001677995000136434,
	"count": 8,
	"is_parallel": true,
	"self": 0.001677995000136434
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1089.4500269789555,
	"count": 63468,
	"is_parallel": true,
	"self": 28.919261706989346,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 19.919393866924565,
	"count": 63468,
	"is_parallel": true,
	"self": 19.919393866924565
	},
	"communicator.exchange": {
	"total": 958.6525405869716,
	"count": 63468,
	"is_parallel": true,
	"self": 958.6525405869716
	},
	"steps_from_proto": {
	"total": 81.95883081807006,
	"count": 63468,
	"is_parallel": true,
	"self": 17.70434792986498,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 64.25448288820508,
	"count": 507744,
	"is_parallel": true,
	"self": 64.25448288820508
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 650.4567353960906,
	"count": 63469,
	"self": 3.028257084075449,
	"children": {
	"process_trajectory": {
	"total": 108.0495058720162,
	"count": 63469,
	"self": 107.81499983501635,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2345060369998464,
	"count": 2,
	"self": 0.2345060369998464
	}
	}
	},
	"_update_policy": {
	"total": 539.378972439999,
	"count": 435,
	"self": 340.66695357000526,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 198.7120188699937,
	"count": 22875,
	"self": 198.7120188699937
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.920004231389612e-07,
	"count": 1,
	"self": 9.920004231389612e-07
	},
	"TrainerController._save_models": {
	"total": 0.10439803699955519,
	"count": 1,
	"self": 0.0014601409993701964,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.10293789600018499,
	"count": 1,
	"self": 0.10293789600018499
	}
	}
	}
	}
	}
	}
	}