First Push

32cb631 almost 2 years ago

46 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.3951915502548218,
	"min": 1.2634586095809937,
	"max": 3.2956900596618652,
	"count": 5000
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 28037.76953125,
	"min": 10965.564453125,
	"max": 116469.8515625,
	"count": 5000
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 66.2,
	"min": 38.22047244094488,
	"max": 999.0,
	"count": 5000
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19860.0,
	"min": 13380.0,
	"max": 30384.0,
	"count": 5000
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1628.9801477178667,
	"min": 1186.4077939590866,
	"max": 1710.7855163348008,
	"count": 4967
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 244347.02215768,
	"min": 2372.841061815623,
	"max": 416996.4578146276,
	"count": 4967
	},
	"SoccerTwos.Step.mean": {
	"value": 49999944.0,
	"min": 9208.0,
	"max": 49999944.0,
	"count": 5000
	},
	"SoccerTwos.Step.sum": {
	"value": 49999944.0,
	"min": 9208.0,
	"max": 49999944.0,
	"count": 5000
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.006404003128409386,
	"min": -0.18173165619373322,
	"max": 0.2155984342098236,
	"count": 5000
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.9606004357337952,
	"min": -30.894380569458008,
	"max": 28.37074089050293,
	"count": 5000
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.006341299507766962,
	"min": -0.18270954489707947,
	"max": 0.22243863344192505,
	"count": 5000
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -0.9511949419975281,
	"min": -31.060623168945312,
	"max": 28.434301376342773,
	"count": 5000
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 5000
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 5000
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.07260000149408977,
	"min": -0.6428571428571429,
	"max": 0.5470181866125627,
	"count": 5000
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -10.890000224113464,
	"min": -67.69480049610138,
	"max": 64.33120006322861,
	"count": 5000
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.07260000149408977,
	"min": -0.6428571428571429,
	"max": 0.5470181866125627,
	"count": 5000
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -10.890000224113464,
	"min": -67.69480049610138,
	"max": 64.33120006322861,
	"count": 5000
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 5000
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 5000
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.017803297971840947,
	"min": 0.009804022525592397,
	"max": 0.0272589957244539,
	"count": 2424
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.017803297971840947,
	"min": 0.009804022525592397,
	"max": 0.0272589957244539,
	"count": 2424
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.09014217108488083,
	"min": 5.6436319482600085e-06,
	"max": 0.13003144264221192,
	"count": 2424
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.09014217108488083,
	"min": 5.6436319482600085e-06,
	"max": 0.13003144264221192,
	"count": 2424
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.09112853507200877,
	"min": 5.387907996616074e-06,
	"max": 0.13180518274505934,
	"count": 2424
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.09112853507200877,
	"min": 5.387907996616074e-06,
	"max": 0.13180518274505934,
	"count": 2424
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 2424
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 2424
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000004,
	"max": 0.20000000000000007,
	"count": 2424
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000004,
	"max": 0.20000000000000007,
	"count": 2424
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 2424
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 2424
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1679330450",
	"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/aarriandiaga/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1679463673"
	},
	"total": 133223.42977892235,
	"count": 1,
	"self": 0.32382238283753395,
	"children": {
	"run_training.setup": {
	"total": 0.019948072731494904,
	"count": 1,
	"self": 0.019948072731494904
	},
	"TrainerController.start_learning": {
	"total": 133223.08600846678,
	"count": 1,
	"self": 73.28118709102273,
	"children": {
	"TrainerController._reset_env": {
	"total": 15.53060756251216,
	"count": 250,
	"self": 15.53060756251216
	},
	"TrainerController.advance": {
	"total": 133134.05893164128,
	"count": 3468332,
	"self": 73.12826198711991,
	"children": {
	"env_step": {
	"total": 111102.08651187271,
	"count": 3468332,
	"self": 95785.77327330038,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 15273.147048886865,
	"count": 3468333,
	"self": 489.84687547013164,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 14783.300173416734,
	"count": 6279312,
	"self": 14783.300173416734
	}
	}
	},
	"workers": {
	"total": 43.166189685463905,
	"count": 3468332,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 135271.72111195326,
	"count": 3468332,
	"is_parallel": true,
	"self": 50016.85263640061,
	"children": {
	"run_training.setup": {
	"total": 0.019948072731494904,
	"count": 1,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.004793088883161545,
	"count": 2,
	"is_parallel": true,
	"self": 0.0010695457458496094,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0037235431373119354,
	"count": 8,
	"is_parallel": true,
	"self": 0.0037235431373119354
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04481106624007225,
	"count": 1,
	"is_parallel": true,
	"self": 0.0012932531535625458,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0008067935705184937,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008067935705184937
	},
	"communicator.exchange": {
	"total": 0.038746923208236694,
	"count": 1,
	"is_parallel": true,
	"self": 0.038746923208236694
	},
	"steps_from_proto": {
	"total": 0.003964096307754517,
	"count": 2,
	"is_parallel": true,
	"self": 0.0008054599165916443,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0031586363911628723,
	"count": 8,
	"is_parallel": true,
	"self": 0.0031586363911628723
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 85253.62044411898,
	"count": 3468330,
	"is_parallel": true,
	"self": 5210.795454546809,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 3113.3619608581066,
	"count": 3468330,
	"is_parallel": true,
	"self": 3113.3619608581066
	},
	"communicator.exchange": {
	"total": 61663.338499210775,
	"count": 3468330,
	"is_parallel": true,
	"self": 61663.338499210775
	},
	"steps_from_proto": {
	"total": 15266.124529503286,
	"count": 6936660,
	"is_parallel": true,
	"self": 2793.6784589216113,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 12472.446070581675,
	"count": 27746640,
	"is_parallel": true,
	"self": 12472.446070581675
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 1.228083360940218,
	"count": 498,
	"is_parallel": true,
	"self": 0.21993285417556763,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 1.0081505067646503,
	"count": 1992,
	"is_parallel": true,
	"self": 1.0081505067646503
	}
	}
	},
	"TrainerController.start_learning": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"TrainerController._reset_env": {
	"total": 7.5863275825977325,
	"count": 5,
	"is_parallel": true,
	"self": 7.5863275825977325
	},
	"TrainerController.advance": {
	"total": 2281.6253745779395,
	"count": 56449,
	"is_parallel": true,
	"self": 1.814806591719389,
	"children": {
	"env_step": {
	"total": 1909.242174692452,
	"count": 56449,
	"is_parallel": true,
	"self": 1554.839233968407,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 353.3750216551125,
	"count": 56450,
	"is_parallel": true,
	"self": 12.837710570544004,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 340.5373110845685,
	"count": 112116,
	"is_parallel": true,
	"self": 340.5373110845685
	}
	}
	},
	"workers": {
	"total": 0.9727655313909054,
	"count": 56449,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2285.767784692347,
	"count": 56449,
	"is_parallel": true,
	"self": 950.0625123977661,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.004793088883161545,
	"count": 2,
	"is_parallel": true,
	"self": 0.0010695457458496094,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0037235431373119354,
	"count": 8,
	"is_parallel": true,
	"self": 0.0037235431373119354
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04481106624007225,
	"count": 1,
	"is_parallel": true,
	"self": 0.0012932531535625458,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0008067935705184937,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008067935705184937
	},
	"communicator.exchange": {
	"total": 0.038746923208236694,
	"count": 1,
	"is_parallel": true,
	"self": 0.038746923208236694
	},
	"steps_from_proto": {
	"total": 0.003964096307754517,
	"count": 2,
	"is_parallel": true,
	"self": 0.0008054599165916443,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0031586363911628723,
	"count": 8,
	"is_parallel": true,
	"self": 0.0031586363911628723
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1335.6861735731363,
	"count": 56448,
	"is_parallel": true,
	"self": 79.67445775866508,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 49.1990244500339,
	"count": 56448,
	"is_parallel": true,
	"self": 49.1990244500339
	},
	"communicator.exchange": {
	"total": 968.2461996413767,
	"count": 56448,
	"is_parallel": true,
	"self": 968.2461996413767
	},
	"steps_from_proto": {
	"total": 238.5664917230606,
	"count": 112896,
	"is_parallel": true,
	"self": 43.785972483456135,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 194.78051923960447,
	"count": 451584,
	"is_parallel": true,
	"self": 194.78051923960447
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.01909872144460678,
	"count": 8,
	"is_parallel": true,
	"self": 0.0035157501697540283,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.015582971274852753,
	"count": 32,
	"is_parallel": true,
	"self": 0.015582971274852753
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.006959825754165649,
	"count": 2,
	"is_parallel": true,
	"self": 0.0014488548040390015,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.005510970950126648,
	"count": 8,
	"is_parallel": true,
	"self": 0.005510970950126648
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.048193711787462234,
	"count": 1,
	"is_parallel": true,
	"self": 0.002052847295999527,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0011657513678073883,
	"count": 1,
	"is_parallel": true,
	"self": 0.0011657513678073883
	},
	"communicator.exchange": {
	"total": 0.03903596103191376,
	"count": 1,
	"is_parallel": true,
	"self": 0.03903596103191376
	},
	"steps_from_proto": {
	"total": 0.005939152091741562,
	"count": 2,
	"is_parallel": true,
	"self": 0.000955536961555481,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.004983615130186081,
	"count": 8,
	"is_parallel": true,
	"self": 0.004983615130186081
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 370.56839329376817,
	"count": 56449,
	"is_parallel": true,
	"self": 13.884199187159538,
	"children": {
	"process_trajectory": {
	"total": 97.8659698329866,
	"count": 56449,
	"is_parallel": true,
	"self": 97.61118080094457,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2547890320420265,
	"count": 1,
	"is_parallel": true,
	"self": 0.2547890320420265
	}
	}
	},
	"_update_policy": {
	"total": 258.81822427362204,
	"count": 40,
	"is_parallel": true,
	"self": 177.95811439305544,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 80.8601098805666,
	"count": 1200,
	"is_parallel": true,
	"self": 80.8601098805666
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 21958.844157781452,
	"count": 3468332,
	"self": 564.9205625094473,
	"children": {
	"process_trajectory": {
	"total": 9854.32756850496,
	"count": 3468332,
	"self": 9830.445356227458,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 23.88221227750182,
	"count": 100,
	"self": 23.88221227750182
	}
	}
	},
	"_update_policy": {
	"total": 11539.596026767045,
	"count": 2424,
	"self": 7461.798624768853,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 4077.797401998192,
	"count": 72726,
	"self": 4077.797401998192
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.087784767150879e-06,
	"count": 1,
	"self": 1.087784767150879e-06
	},
	"TrainerController._save_models": {
	"total": 0.21528108417987823,
	"count": 1,
	"self": 0.002195604145526886,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.21308548003435135,
	"count": 1,
	"self": 0.21308548003435135
	}
	}
	}
	}
	}
	}
	}