Uploaded the Pyramids agent via unit4

6771b91 over 1 year ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.1605914682149887,
	"min": 0.15174803137779236,
	"max": 1.3826720714569092,
	"count": 100
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 4810.03564453125,
	"min": 4520.87744140625,
	"max": 41944.73828125,
	"count": 100
	},
	"Pyramids.Step.mean": {
	"value": 2999935.0,
	"min": 29984.0,
	"max": 2999935.0,
	"count": 100
	},
	"Pyramids.Step.sum": {
	"value": 2999935.0,
	"min": 29984.0,
	"max": 2999935.0,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.7312646508216858,
	"min": -0.08786865323781967,
	"max": 0.864769458770752,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 212.06674194335938,
	"min": -21.088476181030273,
	"max": 264.61944580078125,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.031307727098464966,
	"min": -0.023307139053940773,
	"max": 0.28635692596435547,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 9.079240798950195,
	"min": -6.316234588623047,
	"max": 68.15294647216797,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.069431693604981,
	"min": 0.06259889548310472,
	"max": 0.07356465743699421,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9720437104697339,
	"min": 0.5769289815857017,
	"max": 1.1034698615549132,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.014536273691365275,
	"min": 0.0007999930532062535,
	"max": 0.015559507014115109,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.20350783167911385,
	"min": 0.010399909691681294,
	"max": 0.2178330981976115,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.4781780787357106e-06,
	"min": 1.4781780787357106e-06,
	"max": 0.00029828360057213336,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 2.0694493102299947e-05,
	"min": 2.0694493102299947e-05,
	"max": 0.004072884842371767,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10049269285714287,
	"min": 0.10049269285714287,
	"max": 0.19942786666666668,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4068977,
	"min": 1.4068977,
	"max": 2.8576282333333336,
	"count": 100
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 5.922001642857131e-05,
	"min": 5.922001642857131e-05,
	"max": 0.00994284388,
	"count": 100
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0008290802299999984,
	"min": 0.0008290802299999984,
	"max": 0.13577706051,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.004602502100169659,
	"min": 0.004342348780483007,
	"max": 0.40666961669921875,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.06443502753973007,
	"min": 0.06079288199543953,
	"max": 3.25335693359375,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 261.6694915254237,
	"min": 212.27007299270073,
	"max": 995.2258064516129,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30877.0,
	"min": 16399.0,
	"max": 33010.0,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.738213657696023,
	"min": -0.9315290823578835,
	"max": 1.7781703653158965,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 203.37099795043468,
	"min": -28.877401553094387,
	"max": 241.09919920563698,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.738213657696023,
	"min": -0.9315290823578835,
	"max": 1.7781703653158965,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 203.37099795043468,
	"min": -28.877401553094387,
	"max": 241.09919920563698,
	"count": 100
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.01263972351655392,
	"min": 0.009993327900862341,
	"max": 8.080028551466325,
	"count": 100
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 1.4788476514368085,
	"min": 1.3467253648414044,
	"max": 137.36048537492752,
	"count": 100
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1686415716",
	"python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1686423339"
	},
	"total": 7622.912448516,
	"count": 1,
	"self": 0.5384192190012982,
	"children": {
	"run_training.setup": {
	"total": 0.03806848399926821,
	"count": 1,
	"self": 0.03806848399926821
	},
	"TrainerController.start_learning": {
	"total": 7622.3359608129995,
	"count": 1,
	"self": 5.0599678118469456,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.000870640999892,
	"count": 1,
	"self": 4.000870640999892
	},
	"TrainerController.advance": {
	"total": 7613.119245360153,
	"count": 194176,
	"self": 5.130799042612125,
	"children": {
	"env_step": {
	"total": 5552.522010477777,
	"count": 194176,
	"self": 5160.800616726953,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 388.7483901792739,
	"count": 194176,
	"self": 16.048350887313973,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 372.7000392919599,
	"count": 187549,
	"self": 372.7000392919599
	}
	}
	},
	"workers": {
	"total": 2.97300357155018,
	"count": 194176,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 7603.66474228549,
	"count": 194176,
	"is_parallel": true,
	"self": 2835.15157436121,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0019769840000662953,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006528850017275545,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013240989983387408,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013240989983387408
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05422819199975493,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005977529999654507,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0006190009999045287,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006190009999045287
	},
	"communicator.exchange": {
	"total": 0.05116591499972856,
	"count": 1,
	"is_parallel": true,
	"self": 0.05116591499972856
	},
	"steps_from_proto": {
	"total": 0.0018455230001563905,
	"count": 1,
	"is_parallel": true,
	"self": 0.00037350999900809256,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001472013001148298,
	"count": 8,
	"is_parallel": true,
	"self": 0.001472013001148298
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 4768.51316792428,
	"count": 194175,
	"is_parallel": true,
	"self": 100.4952850657155,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 74.97257792979872,
	"count": 194175,
	"is_parallel": true,
	"self": 74.97257792979872
	},
	"communicator.exchange": {
	"total": 4266.509113628733,
	"count": 194175,
	"is_parallel": true,
	"self": 4266.509113628733
	},
	"steps_from_proto": {
	"total": 326.53619130003335,
	"count": 194175,
	"is_parallel": true,
	"self": 68.81499423792684,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 257.7211970621065,
	"count": 1553400,
	"is_parallel": true,
	"self": 257.7211970621065
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 2055.466435839764,
	"count": 194176,
	"self": 9.878107901705334,
	"children": {
	"process_trajectory": {
	"total": 373.4966683280627,
	"count": 194176,
	"self": 372.5729026220615,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.923765706001177,
	"count": 6,
	"self": 0.923765706001177
	}
	}
	},
	"_update_policy": {
	"total": 1672.091659609996,
	"count": 1405,
	"self": 1045.91738557982,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 626.1742740301761,
	"count": 68322,
	"self": 626.1742740301761
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0879994079004973e-06,
	"count": 1,
	"self": 1.0879994079004973e-06
	},
	"TrainerController._save_models": {
	"total": 0.15587591199982853,
	"count": 1,
	"self": 0.002404238999588415,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.15347167300024012,
	"count": 1,
	"self": 0.15347167300024012
	}
	}
	}
	}
	}
	}
	}