|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 1.3951915502548218, |
|
"min": 1.2634586095809937, |
|
"max": 3.2956900596618652, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 28037.76953125, |
|
"min": 10965.564453125, |
|
"max": 116469.8515625, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 66.2, |
|
"min": 38.22047244094488, |
|
"max": 999.0, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19860.0, |
|
"min": 13380.0, |
|
"max": 30384.0, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1628.9801477178667, |
|
"min": 1186.4077939590866, |
|
"max": 1710.7855163348008, |
|
"count": 4967 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 244347.02215768, |
|
"min": 2372.841061815623, |
|
"max": 416996.4578146276, |
|
"count": 4967 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 49999944.0, |
|
"min": 9208.0, |
|
"max": 49999944.0, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 49999944.0, |
|
"min": 9208.0, |
|
"max": 49999944.0, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.006404003128409386, |
|
"min": -0.18173165619373322, |
|
"max": 0.2155984342098236, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -0.9606004357337952, |
|
"min": -30.894380569458008, |
|
"max": 28.37074089050293, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.006341299507766962, |
|
"min": -0.18270954489707947, |
|
"max": 0.22243863344192505, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -0.9511949419975281, |
|
"min": -31.060623168945312, |
|
"max": 28.434301376342773, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.07260000149408977, |
|
"min": -0.6428571428571429, |
|
"max": 0.5470181866125627, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -10.890000224113464, |
|
"min": -67.69480049610138, |
|
"max": 64.33120006322861, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.07260000149408977, |
|
"min": -0.6428571428571429, |
|
"max": 0.5470181866125627, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -10.890000224113464, |
|
"min": -67.69480049610138, |
|
"max": 64.33120006322861, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 5000 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.017803297971840947, |
|
"min": 0.009804022525592397, |
|
"max": 0.0272589957244539, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.017803297971840947, |
|
"min": 0.009804022525592397, |
|
"max": 0.0272589957244539, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.09014217108488083, |
|
"min": 5.6436319482600085e-06, |
|
"max": 0.13003144264221192, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.09014217108488083, |
|
"min": 5.6436319482600085e-06, |
|
"max": 0.13003144264221192, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.09112853507200877, |
|
"min": 5.387907996616074e-06, |
|
"max": 0.13180518274505934, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.09112853507200877, |
|
"min": 5.387907996616074e-06, |
|
"max": 0.13180518274505934, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000004, |
|
"max": 0.20000000000000007, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000004, |
|
"max": 0.20000000000000007, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 2424 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 2424 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1679330450", |
|
"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", |
|
"command_line_arguments": "/home/aarriandiaga/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1679463673" |
|
}, |
|
"total": 133223.42977892235, |
|
"count": 1, |
|
"self": 0.32382238283753395, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.019948072731494904, |
|
"count": 1, |
|
"self": 0.019948072731494904 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 133223.08600846678, |
|
"count": 1, |
|
"self": 73.28118709102273, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 15.53060756251216, |
|
"count": 250, |
|
"self": 15.53060756251216 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 133134.05893164128, |
|
"count": 3468332, |
|
"self": 73.12826198711991, |
|
"children": { |
|
"env_step": { |
|
"total": 111102.08651187271, |
|
"count": 3468332, |
|
"self": 95785.77327330038, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 15273.147048886865, |
|
"count": 3468333, |
|
"self": 489.84687547013164, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 14783.300173416734, |
|
"count": 6279312, |
|
"self": 14783.300173416734 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 43.166189685463905, |
|
"count": 3468332, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 135271.72111195326, |
|
"count": 3468332, |
|
"is_parallel": true, |
|
"self": 50016.85263640061, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.019948072731494904, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.004793088883161545, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0010695457458496094, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0037235431373119354, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0037235431373119354 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04481106624007225, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0012932531535625458, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0008067935705184937, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0008067935705184937 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.038746923208236694, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.038746923208236694 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.003964096307754517, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0008054599165916443, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0031586363911628723, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0031586363911628723 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 85253.62044411898, |
|
"count": 3468330, |
|
"is_parallel": true, |
|
"self": 5210.795454546809, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 3113.3619608581066, |
|
"count": 3468330, |
|
"is_parallel": true, |
|
"self": 3113.3619608581066 |
|
}, |
|
"communicator.exchange": { |
|
"total": 61663.338499210775, |
|
"count": 3468330, |
|
"is_parallel": true, |
|
"self": 61663.338499210775 |
|
}, |
|
"steps_from_proto": { |
|
"total": 15266.124529503286, |
|
"count": 6936660, |
|
"is_parallel": true, |
|
"self": 2793.6784589216113, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 12472.446070581675, |
|
"count": 27746640, |
|
"is_parallel": true, |
|
"self": 12472.446070581675 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 1.228083360940218, |
|
"count": 498, |
|
"is_parallel": true, |
|
"self": 0.21993285417556763, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 1.0081505067646503, |
|
"count": 1992, |
|
"is_parallel": true, |
|
"self": 1.0081505067646503 |
|
} |
|
} |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 7.5863275825977325, |
|
"count": 5, |
|
"is_parallel": true, |
|
"self": 7.5863275825977325 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2281.6253745779395, |
|
"count": 56449, |
|
"is_parallel": true, |
|
"self": 1.814806591719389, |
|
"children": { |
|
"env_step": { |
|
"total": 1909.242174692452, |
|
"count": 56449, |
|
"is_parallel": true, |
|
"self": 1554.839233968407, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 353.3750216551125, |
|
"count": 56450, |
|
"is_parallel": true, |
|
"self": 12.837710570544004, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 340.5373110845685, |
|
"count": 112116, |
|
"is_parallel": true, |
|
"self": 340.5373110845685 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.9727655313909054, |
|
"count": 56449, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2285.767784692347, |
|
"count": 56449, |
|
"is_parallel": true, |
|
"self": 950.0625123977661, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.004793088883161545, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0010695457458496094, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0037235431373119354, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0037235431373119354 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04481106624007225, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0012932531535625458, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0008067935705184937, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0008067935705184937 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.038746923208236694, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.038746923208236694 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.003964096307754517, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0008054599165916443, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0031586363911628723, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0031586363911628723 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1335.6861735731363, |
|
"count": 56448, |
|
"is_parallel": true, |
|
"self": 79.67445775866508, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 49.1990244500339, |
|
"count": 56448, |
|
"is_parallel": true, |
|
"self": 49.1990244500339 |
|
}, |
|
"communicator.exchange": { |
|
"total": 968.2461996413767, |
|
"count": 56448, |
|
"is_parallel": true, |
|
"self": 968.2461996413767 |
|
}, |
|
"steps_from_proto": { |
|
"total": 238.5664917230606, |
|
"count": 112896, |
|
"is_parallel": true, |
|
"self": 43.785972483456135, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 194.78051923960447, |
|
"count": 451584, |
|
"is_parallel": true, |
|
"self": 194.78051923960447 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.01909872144460678, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0035157501697540283, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.015582971274852753, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.015582971274852753 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.006959825754165649, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0014488548040390015, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.005510970950126648, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.005510970950126648 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.048193711787462234, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.002052847295999527, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0011657513678073883, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0011657513678073883 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.03903596103191376, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.03903596103191376 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.005939152091741562, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.000955536961555481, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.004983615130186081, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.004983615130186081 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 370.56839329376817, |
|
"count": 56449, |
|
"is_parallel": true, |
|
"self": 13.884199187159538, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 97.8659698329866, |
|
"count": 56449, |
|
"is_parallel": true, |
|
"self": 97.61118080094457, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.2547890320420265, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.2547890320420265 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 258.81822427362204, |
|
"count": 40, |
|
"is_parallel": true, |
|
"self": 177.95811439305544, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 80.8601098805666, |
|
"count": 1200, |
|
"is_parallel": true, |
|
"self": 80.8601098805666 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 21958.844157781452, |
|
"count": 3468332, |
|
"self": 564.9205625094473, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 9854.32756850496, |
|
"count": 3468332, |
|
"self": 9830.445356227458, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 23.88221227750182, |
|
"count": 100, |
|
"self": 23.88221227750182 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 11539.596026767045, |
|
"count": 2424, |
|
"self": 7461.798624768853, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 4077.797401998192, |
|
"count": 72726, |
|
"self": 4077.797401998192 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.087784767150879e-06, |
|
"count": 1, |
|
"self": 1.087784767150879e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.21528108417987823, |
|
"count": 1, |
|
"self": 0.002195604145526886, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.21308548003435135, |
|
"count": 1, |
|
"self": 0.21308548003435135 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |