First Push

bf439b4 over 1 year ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.1332024335861206,
	"min": 0.1332024335861206,
	"max": 1.4856574535369873,
	"count": 100
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 3985.4169921875,
	"min": 3985.4169921875,
	"max": 45068.90625,
	"count": 100
	},
	"Pyramids.Step.mean": {
	"value": 2999981.0,
	"min": 29952.0,
	"max": 2999981.0,
	"count": 100
	},
	"Pyramids.Step.sum": {
	"value": 2999981.0,
	"min": 29952.0,
	"max": 2999981.0,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.7220757007598877,
	"min": -0.18479059636592865,
	"max": 0.9035793542861938,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 210.1240234375,
	"min": -43.795372009277344,
	"max": 285.53106689453125,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.005038607399910688,
	"min": -0.012448417954146862,
	"max": 0.3230520784854889,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 1.466234803199768,
	"min": -3.6100411415100098,
	"max": 76.56333923339844,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07077729515054691,
	"min": 0.06282116506757093,
	"max": 0.07498741661551488,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9908821321076569,
	"min": 0.4894676464984472,
	"max": 1.1248112492327231,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.014930455326384746,
	"min": 0.0009972557743577045,
	"max": 0.017073321399428614,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.20902637456938644,
	"min": 0.010591151483697167,
	"max": 0.23902649959200062,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.5648137641428542e-06,
	"min": 1.5648137641428542e-06,
	"max": 0.00029838354339596195,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 2.1907392697999958e-05,
	"min": 2.1907392697999958e-05,
	"max": 0.0038439619186794,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10052157142857143,
	"min": 0.10052157142857143,
	"max": 0.19946118095238097,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.407302,
	"min": 1.3897045333333333,
	"max": 2.7674998000000004,
	"count": 100
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 6.210498571428561e-05,
	"min": 6.210498571428561e-05,
	"max": 0.009946171977142856,
	"count": 100
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0008694697999999986,
	"min": 0.0008694697999999986,
	"max": 0.12814392794,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.007337778341025114,
	"min": 0.007315483875572681,
	"max": 0.38245826959609985,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.10272889584302902,
	"min": 0.10241677612066269,
	"max": 2.6772079467773438,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 259.08620689655174,
	"min": 194.99346405228758,
	"max": 999.0,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30054.0,
	"min": 15984.0,
	"max": 34058.0,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.637427573381313,
	"min": -1.0000000521540642,
	"max": 1.8042763058880442,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 189.9415985122323,
	"min": -32.000001668930054,
	"max": 274.2499984949827,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.637427573381313,
	"min": -1.0000000521540642,
	"max": 1.8042763058880442,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 189.9415985122323,
	"min": -32.000001668930054,
	"max": 274.2499984949827,
	"count": 100
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.0198721539443419,
	"min": 0.016495678749478875,
	"max": 6.906697786413133,
	"count": 100
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.3051698575436603,
	"min": 2.1919405297594494,
	"max": 110.50716458261013,
	"count": 100
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1690758194",
	"python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1690765988"
	},
	"total": 7794.230711343,
	"count": 1,
	"self": 0.4759737079994011,
	"children": {
	"run_training.setup": {
	"total": 0.031696439999905124,
	"count": 1,
	"self": 0.031696439999905124
	},
	"TrainerController.start_learning": {
	"total": 7793.723041195,
	"count": 1,
	"self": 4.897863862055601,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.0931296399999155,
	"count": 1,
	"self": 4.0931296399999155
	},
	"TrainerController.advance": {
	"total": 7784.6364301319445,
	"count": 195274,
	"self": 4.7098956002882915,
	"children": {
	"env_step": {
	"total": 5780.250303420536,
	"count": 195274,
	"self": 5419.6898817882,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 357.6788286472911,
	"count": 195274,
	"self": 15.610241151233367,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 342.0685874960577,
	"count": 187562,
	"self": 342.0685874960577
	}
	}
	},
	"workers": {
	"total": 2.8815929850443354,
	"count": 195274,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 7775.595906087045,
	"count": 195274,
	"is_parallel": true,
	"self": 2743.7423819867836,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002954610000415414,
	"count": 1,
	"is_parallel": true,
	"self": 0.0009622559996387281,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001992354000776686,
	"count": 8,
	"is_parallel": true,
	"self": 0.001992354000776686
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.07078826699989804,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005699690000255941,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00048718600010033697,
	"count": 1,
	"is_parallel": true,
	"self": 0.00048718600010033697
	},
	"communicator.exchange": {
	"total": 0.06776107899986528,
	"count": 1,
	"is_parallel": true,
	"self": 0.06776107899986528
	},
	"steps_from_proto": {
	"total": 0.0019700329999068344,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003818060004050494,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001588226999501785,
	"count": 8,
	"is_parallel": true,
	"self": 0.001588226999501785
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 5031.853524100261,
	"count": 195273,
	"is_parallel": true,
	"self": 108.80878000604389,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 74.82100095282249,
	"count": 195273,
	"is_parallel": true,
	"self": 74.82100095282249
	},
	"communicator.exchange": {
	"total": 4510.992968977015,
	"count": 195273,
	"is_parallel": true,
	"self": 4510.992968977015
	},
	"steps_from_proto": {
	"total": 337.2307741643799,
	"count": 195273,
	"is_parallel": true,
	"self": 70.52579006369524,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 266.70498410068467,
	"count": 1562184,
	"is_parallel": true,
	"self": 266.70498410068467
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1999.6762311111206,
	"count": 195274,
	"self": 8.923560649340743,
	"children": {
	"process_trajectory": {
	"total": 365.5521225788193,
	"count": 195274,
	"self": 364.8516358988195,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.7004866799998126,
	"count": 6,
	"self": 0.7004866799998126
	}
	}
	},
	"_update_policy": {
	"total": 1625.2005478829606,
	"count": 1395,
	"self": 1055.4422268171388,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 569.7583210658217,
	"count": 68433,
	"self": 569.7583210658217
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.990009519038722e-07,
	"count": 1,
	"self": 8.990009519038722e-07
	},
	"TrainerController._save_models": {
	"total": 0.09561666199988395,
	"count": 1,
	"self": 0.0014602150004066061,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09415644699947734,
	"count": 1,
	"self": 0.09415644699947734
	}
	}
	}
	}
	}
	}
	}