|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 0.29271167516708374, |
|
"min": 0.27912601828575134, |
|
"max": 3.2958128452301025, |
|
"count": 15999 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 11614.798828125, |
|
"min": 4629.82958984375, |
|
"max": 591558.875, |
|
"count": 15999 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 36.792307692307695, |
|
"min": 29.23170731707317, |
|
"max": 551.0, |
|
"count": 15999 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19132.0, |
|
"min": 15260.0, |
|
"max": 41060.0, |
|
"count": 15999 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1639.9359347156194, |
|
"min": 1198.128538137423, |
|
"max": 1680.737096359153, |
|
"count": 15999 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 426383.343026061, |
|
"min": 2397.64453146509, |
|
"max": 500426.5231898225, |
|
"count": 15999 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 159999996.0, |
|
"min": 9568.0, |
|
"max": 159999996.0, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 159999996.0, |
|
"min": 9568.0, |
|
"max": 159999996.0, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.020044520497322083, |
|
"min": -0.12824246287345886, |
|
"max": 0.22821052372455597, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 5.211575508117676, |
|
"min": -30.2033634185791, |
|
"max": 49.52168273925781, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.02062523551285267, |
|
"min": -0.1285647302865982, |
|
"max": 0.22626857459545135, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 5.362561225891113, |
|
"min": -30.095096588134766, |
|
"max": 49.10028076171875, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.09029230796373808, |
|
"min": -0.46440799951553347, |
|
"max": 0.5237547838169595, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 23.4760000705719, |
|
"min": -82.58560001850128, |
|
"max": 93.47840017080307, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.09029230796373808, |
|
"min": -0.46440799951553347, |
|
"max": 0.5237547838169595, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 23.4760000705719, |
|
"min": -82.58560001850128, |
|
"max": 93.47840017080307, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 16000 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.012796422930356736, |
|
"min": 0.00885343154077418, |
|
"max": 0.028058637352660298, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.012796422930356736, |
|
"min": 0.00885343154077418, |
|
"max": 0.028058637352660298, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.07961924796303113, |
|
"min": 0.005778578342869878, |
|
"max": 0.0951485348244508, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.07961924796303113, |
|
"min": 0.005778578342869878, |
|
"max": 0.0951485348244508, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.0797942062218984, |
|
"min": 0.005859525905301173, |
|
"max": 0.09544695367415747, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.0797942062218984, |
|
"min": 0.005859525905301173, |
|
"max": 0.09544695367415747, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 5.747498117483374e-09, |
|
"min": 5.747498117483374e-09, |
|
"max": 0.000299961435012855, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 5.747498117483374e-09, |
|
"min": 5.747498117483374e-09, |
|
"max": 0.000299961435012855, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.25, |
|
"min": 0.25, |
|
"max": 0.25, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.25, |
|
"min": 0.25, |
|
"max": 0.25, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 1.0188061749999443e-05, |
|
"min": 1.0188061749999443e-05, |
|
"max": 0.009998715785499998, |
|
"count": 7774 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 1.0188061749999443e-05, |
|
"min": 1.0188061749999443e-05, |
|
"max": 0.009998715785499998, |
|
"count": 7774 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1693767407", |
|
"python_version": "3.9.17 (main, Jul 5 2023, 20:41:20) \n[GCC 11.2.0]", |
|
"command_line_arguments": "/home/mgmeskill/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=Downstrike-160M --no-graphics --num-envs=8", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1693901136" |
|
}, |
|
"total": 133728.72782940418, |
|
"count": 1, |
|
"self": 0.3201414127834141, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.027171769179403782, |
|
"count": 1, |
|
"self": 0.027171769179403782 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 133728.3805162222, |
|
"count": 1, |
|
"self": 102.86563353613019, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 696.0709477802739, |
|
"count": 7947, |
|
"self": 696.0709477802739 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 132929.13862727955, |
|
"count": 3507132, |
|
"self": 80.21517739770934, |
|
"children": { |
|
"env_step": { |
|
"total": 73052.17698274832, |
|
"count": 3507132, |
|
"self": 24081.407350266818, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 48880.748980567325, |
|
"count": 14812115, |
|
"self": 1211.079614217393, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 47669.66936634993, |
|
"count": 27112404, |
|
"self": 47669.66936634993 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 90.02065191417933, |
|
"count": 3507132, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1066995.6906433739, |
|
"count": 14784608, |
|
"is_parallel": true, |
|
"self": 875481.2676103334, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.01907126046717167, |
|
"count": 16, |
|
"is_parallel": true, |
|
"self": 0.004095900803804398, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.014975359663367271, |
|
"count": 64, |
|
"is_parallel": true, |
|
"self": 0.014975359663367271 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.17750767897814512, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.006570951547473669, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.004816613160073757, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.004816613160073757 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.14813531283289194, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.14813531283289194 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.017984801437705755, |
|
"count": 16, |
|
"is_parallel": true, |
|
"self": 0.0031336508691310883, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.014851150568574667, |
|
"count": 64, |
|
"is_parallel": true, |
|
"self": 0.014851150568574667 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 191352.52964038588, |
|
"count": 14784600, |
|
"is_parallel": true, |
|
"self": 12493.37244902039, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 8003.242103095632, |
|
"count": 14784600, |
|
"is_parallel": true, |
|
"self": 8003.242103095632 |
|
}, |
|
"communicator.exchange": { |
|
"total": 137369.81809696788, |
|
"count": 14784600, |
|
"is_parallel": true, |
|
"self": 137369.81809696788 |
|
}, |
|
"steps_from_proto": { |
|
"total": 33486.09699130198, |
|
"count": 29569200, |
|
"is_parallel": true, |
|
"self": 5620.8086648634635, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 27865.288326438516, |
|
"count": 118276800, |
|
"is_parallel": true, |
|
"self": 27865.288326438516 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 161.89339265460148, |
|
"count": 127136, |
|
"is_parallel": true, |
|
"self": 25.868383669760078, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 136.0250089848414, |
|
"count": 508544, |
|
"is_parallel": true, |
|
"self": 136.0250089848414 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 59796.74646713352, |
|
"count": 3507132, |
|
"self": 1285.6652827882208, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 24676.622614394873, |
|
"count": 3507132, |
|
"self": 24650.985279567074, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 25.63733482779935, |
|
"count": 80, |
|
"self": 25.63733482779935 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 33834.458569950424, |
|
"count": 7774, |
|
"self": 18988.026603292674, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 14846.43196665775, |
|
"count": 233220, |
|
"self": 14846.43196665775 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 5.522742867469788e-07, |
|
"count": 1, |
|
"self": 5.522742867469788e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.30530707398429513, |
|
"count": 1, |
|
"self": 0.0019307197071611881, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.30337635427713394, |
|
"count": 1, |
|
"self": 0.30337635427713394 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |