First Push

b5a5521 over 1 year ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.0681722164154053,
	"min": 3.0086112022399902,
	"max": 3.295736312866211,
	"count": 500
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 71083.4140625,
	"min": 13498.91015625,
	"max": 142699.484375,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 759.3333333333334,
	"min": 381.8333333333333,
	"max": 999.0,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 18224.0,
	"min": 11712.0,
	"max": 29128.0,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1230.7034147074687,
	"min": 1193.3253533041118,
	"max": 1232.0422570872072,
	"count": 366
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 9845.62731765975,
	"min": 2388.817898597924,
	"max": 16908.562139028272,
	"count": 366
	},
	"SoccerTwos.Step.mean": {
	"value": 4999774.0,
	"min": 9582.0,
	"max": 4999774.0,
	"count": 500
	},
	"SoccerTwos.Step.sum": {
	"value": 4999774.0,
	"min": 9582.0,
	"max": 4999774.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.005820202175527811,
	"min": -0.028853941708803177,
	"max": 0.01749301701784134,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.07566262781620026,
	"min": -0.48075154423713684,
	"max": 0.2367807775735855,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.00484585203230381,
	"min": -0.034612782299518585,
	"max": 0.018317358568310738,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.06299607455730438,
	"min": -0.5254640579223633,
	"max": 0.24662959575653076,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.0010307729244232178,
	"min": -0.5625,
	"max": 0.4507555663585663,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 0.013400048017501831,
	"min": -9.0,
	"max": 8.113600194454193,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.0010307729244232178,
	"min": -0.5625,
	"max": 0.4507555663585663,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 0.013400048017501831,
	"min": -9.0,
	"max": 8.113600194454193,
	"count": 500
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.022048475802876055,
	"min": 0.010168385475920635,
	"max": 0.024457173788687215,
	"count": 232
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.022048475802876055,
	"min": 0.010168385475920635,
	"max": 0.024457173788687215,
	"count": 232
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.001593428628014711,
	"min": 8.304267803775171e-08,
	"max": 0.006287430979621907,
	"count": 232
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.001593428628014711,
	"min": 8.304267803775171e-08,
	"max": 0.006287430979621907,
	"count": 232
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.0016020291184152787,
	"min": 1.1614907980591246e-07,
	"max": 0.006288486144815882,
	"count": 232
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.0016020291184152787,
	"min": 1.1614907980591246e-07,
	"max": 0.006288486144815882,
	"count": 232
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 232
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 232
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 232
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 232
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 232
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 232
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1692751022",
	"python_version": "3.9.17 (main, Jul 5 2023, 20:41:20) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/agustin/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1692755762"
	},
	"total": 4740.917500071999,
	"count": 1,
	"self": 0.16804642299939587,
	"children": {
	"run_training.setup": {
	"total": 0.007140761999835377,
	"count": 1,
	"self": 0.007140761999835377
	},
	"TrainerController.start_learning": {
	"total": 4740.742312887,
	"count": 1,
	"self": 4.629413993542585,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.6082590109936064,
	"count": 25,
	"self": 3.6082590109936064
	},
	"TrainerController.advance": {
	"total": 4732.361187622464,
	"count": 325378,
	"self": 4.668138948884916,
	"children": {
	"env_step": {
	"total": 3580.960536827044,
	"count": 325378,
	"self": 2540.381440856753,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1037.7594984670468,
	"count": 325378,
	"self": 26.679753365224315,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1011.0797451018225,
	"count": 646028,
	"self": 1011.0797451018225
	}
	}
	},
	"workers": {
	"total": 2.81959750324404,
	"count": 325378,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 4734.714342336447,
	"count": 325378,
	"is_parallel": true,
	"self": 2717.457386475794,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0015060519999678945,
	"count": 2,
	"is_parallel": true,
	"self": 0.0003789260017583729,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0011271259982095216,
	"count": 8,
	"is_parallel": true,
	"self": 0.0011271259982095216
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.015841564999391267,
	"count": 1,
	"is_parallel": true,
	"self": 0.00035892199866793817,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0002934660005848855,
	"count": 1,
	"is_parallel": true,
	"self": 0.0002934660005848855
	},
	"communicator.exchange": {
	"total": 0.014033939000000828,
	"count": 1,
	"is_parallel": true,
	"self": 0.014033939000000828
	},
	"steps_from_proto": {
	"total": 0.001155238000137615,
	"count": 2,
	"is_parallel": true,
	"self": 0.00025357500089739915,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0009016629992402159,
	"count": 8,
	"is_parallel": true,
	"self": 0.0009016629992402159
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2017.229015981664,
	"count": 325377,
	"is_parallel": true,
	"self": 116.31933354324883,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 83.54269948724595,
	"count": 325377,
	"is_parallel": true,
	"self": 83.54269948724595
	},
	"communicator.exchange": {
	"total": 1450.5245641430774,
	"count": 325377,
	"is_parallel": true,
	"self": 1450.5245641430774
	},
	"steps_from_proto": {
	"total": 366.8424188080917,
	"count": 650754,
	"is_parallel": true,
	"self": 76.60866541693667,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 290.233753391155,
	"count": 2603016,
	"is_parallel": true,
	"self": 290.233753391155
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.027939878988945566,
	"count": 48,
	"is_parallel": true,
	"self": 0.0059418999935587635,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.021997978995386802,
	"count": 192,
	"is_parallel": true,
	"self": 0.021997978995386802
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1146.732511846535,
	"count": 325378,
	"self": 35.44267001867229,
	"children": {
	"process_trajectory": {
	"total": 269.43742016885517,
	"count": 325378,
	"self": 267.9769432328576,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.4604769359975762,
	"count": 10,
	"self": 1.4604769359975762
	}
	}
	},
	"_update_policy": {
	"total": 841.8524216590076,
	"count": 232,
	"self": 517.9916511429892,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 323.8607705160184,
	"count": 6960,
	"self": 323.8607705160184
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 5.700003384845331e-07,
	"count": 1,
	"self": 5.700003384845331e-07
	},
	"TrainerController._save_models": {
	"total": 0.14345168999898306,
	"count": 1,
	"self": 0.0011678609989758115,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.14228382900000724,
	"count": 1,
	"self": 0.14228382900000724
	}
	}
	}
	}
	}
	}
	}